diff --git "a/wandb/run-20220302_000300-2ebwk6gp/files/wandb-summary.json" "b/wandb/run-20220302_000300-2ebwk6gp/files/wandb-summary.json" --- "a/wandb/run-20220302_000300-2ebwk6gp/files/wandb-summary.json" +++ "b/wandb/run-20220302_000300-2ebwk6gp/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 4.8067, "train/learning_rate": 9.92e-05, "train/epoch": 0.42, "train/global_step": 500, "_runtime": 2790, "_timestamp": 1646182171, "_step": 500, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 5.0, 9.0, 16.0, 20.0, 36.0, 74.0, 142.0, 342.0, 148.0, 80.0, 51.0, 38.0, 11.0, 7.0, 8.0, 6.0, 4.0, 5.0, 2.0, 1.0, 1.0], "bins": [-412.4659423828125, -404.3079528808594, -396.1499938964844, -387.99200439453125, -379.8340148925781, -371.676025390625, -363.51806640625, -355.3600769042969, -347.20208740234375, -339.0440979003906, -330.8861389160156, -322.7281494140625, -314.5701599121094, -306.41217041015625, -298.25421142578125, -290.0962219238281, -281.9382629394531, -273.7802734375, -265.622314453125, -257.4643249511719, -249.30633544921875, -241.1483612060547, -232.99038696289062, -224.8323974609375, -216.67442321777344, -208.51644897460938, -200.35845947265625, -192.2004852294922, -184.04251098632812, -175.884521484375, -167.72654724121094, -159.56857299804688, -151.41058349609375, -143.2526092529297, -135.09461975097656, -126.9366455078125, -118.7786636352539, -110.62068176269531, -102.46270751953125, -94.30472564697266, -86.14674377441406, -77.98876190185547, -69.83078002929688, -61.67280578613281, -53.51482391357422, -45.356842041015625, -37.1988639831543, -29.04088592529297, -20.882904052734375, -12.724924087524414, -4.566944122314453, 3.591035842895508, 11.749015808105469, 19.906997680664062, 28.06497573852539, 36.22295379638672, 44.38093566894531, 52.538917541503906, 60.696895599365234, 68.85487365722656, 77.01285552978516, 85.17083740234375, 93.32881164550781, 101.4867935180664, 109.644775390625]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 4.0, 2.0, 3.0, 5.0, 9.0, 6.0, 14.0, 8.0, 12.0, 11.0, 16.0, 13.0, 24.0, 17.0, 27.0, 29.0, 37.0, 44.0, 47.0, 61.0, 62.0, 56.0, 57.0, 48.0, 49.0, 56.0, 38.0, 47.0, 44.0, 25.0, 21.0, 16.0, 21.0, 10.0, 10.0, 6.0, 10.0, 5.0, 9.0, 10.0, 7.0, 3.0, 2.0, 4.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-280.0460205078125, -271.1632385253906, -262.28045654296875, -253.39767456054688, -244.514892578125, -235.63211059570312, -226.7493438720703, -217.86656188964844, -208.98377990722656, -200.1009979248047, -191.2182159423828, -182.33543395996094, -173.45266723632812, -164.56988525390625, -155.68710327148438, -146.8043212890625, -137.92153930664062, -129.03875732421875, -120.15597534179688, -111.27320098876953, -102.39041900634766, -93.50763702392578, -84.62486267089844, -75.74208068847656, -66.85929870605469, -57.97651672363281, -49.0937385559082, -40.210960388183594, -31.32817840576172, -22.445396423339844, -13.562618255615234, -4.679840087890625, 4.202972412109375, 13.085752487182617, 21.96853256225586, 30.8513126373291, 39.734092712402344, 48.61687469482422, 57.49965286254883, 66.38243103027344, 75.26521301269531, 84.14799499511719, 93.03077697753906, 101.9135513305664, 110.79633331298828, 119.67911529541016, 128.5618896484375, 137.44467163085938, 146.32745361328125, 155.21023559570312, 164.093017578125, 172.97579956054688, 181.85858154296875, 190.74136352539062, 199.62413024902344, 208.5069122314453, 217.3896942138672, 226.27247619628906, 235.15525817871094, 244.0380401611328, 252.92080688476562, 261.8035888671875, 270.6863708496094, 279.56915283203125, 288.4519348144531]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 4.0, 7.0, 4.0, 12.0, 12.0, 16.0, 10.0, 24.0, 22.0, 33.0, 31.0, 48.0, 48.0, 68.0, 75.0, 86.0, 73.0, 57.0, 73.0, 64.0, 55.0, 45.0, 23.0, 25.0, 16.0, 11.0, 13.0, 10.0, 17.0, 10.0, 6.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-23.21875, -22.638671875, -22.05859375, -21.478515625, -20.8984375, -20.318359375, -19.73828125, -19.158203125, -18.578125, -17.998046875, -17.41796875, -16.837890625, -16.2578125, -15.677734375, -15.09765625, -14.517578125, -13.9375, -13.357421875, -12.77734375, -12.197265625, -11.6171875, -11.037109375, -10.45703125, -9.876953125, -9.296875, -8.716796875, -8.13671875, -7.556640625, -6.9765625, -6.396484375, -5.81640625, -5.236328125, -4.65625, -4.076171875, -3.49609375, -2.916015625, -2.3359375, -1.755859375, -1.17578125, -0.595703125, -0.015625, 0.564453125, 1.14453125, 1.724609375, 2.3046875, 2.884765625, 3.46484375, 4.044921875, 4.625, 5.205078125, 5.78515625, 6.365234375, 6.9453125, 7.525390625, 8.10546875, 8.685546875, 9.265625, 9.845703125, 10.42578125, 11.005859375, 11.5859375, 12.166015625, 12.74609375, 13.326171875, 13.90625]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 6.0, 2.0, 6.0, 10.0, 9.0, 7.0, 13.0, 14.0, 32.0, 34.0, 52.0, 73.0, 87.0, 131.0, 212.0, 374.0, 611.0, 930.0, 1633.0, 2808.0, 5113.0, 9959.0, 22721.0, 68432.0, 2844560.0, 1138653.0, 58512.0, 20115.0, 8731.0, 4430.0, 2482.0, 1417.0, 831.0, 505.0, 287.0, 183.0, 115.0, 69.0, 52.0, 30.0, 12.0, 9.0, 13.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0], "bins": [-92.875, -90.54833984375, -88.2216796875, -85.89501953125, -83.568359375, -81.24169921875, -78.9150390625, -76.58837890625, -74.26171875, -71.93505859375, -69.6083984375, -67.28173828125, -64.955078125, -62.62841796875, -60.3017578125, -57.97509765625, -55.6484375, -53.32177734375, -50.9951171875, -48.66845703125, -46.341796875, -44.01513671875, -41.6884765625, -39.36181640625, -37.03515625, -34.70849609375, -32.3818359375, -30.05517578125, -27.728515625, -25.40185546875, -23.0751953125, -20.74853515625, -18.421875, -16.09521484375, -13.7685546875, -11.44189453125, -9.115234375, -6.78857421875, -4.4619140625, -2.13525390625, 0.19140625, 2.51806640625, 4.8447265625, 7.17138671875, 9.498046875, 11.82470703125, 14.1513671875, 16.47802734375, 18.8046875, 21.13134765625, 23.4580078125, 25.78466796875, 28.111328125, 30.43798828125, 32.7646484375, 35.09130859375, 37.41796875, 39.74462890625, 42.0712890625, 44.39794921875, 46.724609375, 49.05126953125, 51.3779296875, 53.70458984375, 56.03125]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 9.0, 3.0, 11.0, 12.0, 6.0, 8.0, 14.0, 11.0, 17.0, 32.0, 33.0, 46.0, 41.0, 60.0, 64.0, 85.0, 150.0, 328.0, 780.0, 1135.0, 500.0, 219.0, 106.0, 70.0, 61.0, 47.0, 39.0, 37.0, 20.0, 25.0, 23.0, 9.0, 10.0, 13.0, 10.0, 5.0, 6.0, 5.0, 3.0, 9.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-59.28125, -57.44580078125, -55.6103515625, -53.77490234375, -51.939453125, -50.10400390625, -48.2685546875, -46.43310546875, -44.59765625, -42.76220703125, -40.9267578125, -39.09130859375, -37.255859375, -35.42041015625, -33.5849609375, -31.74951171875, -29.9140625, -28.07861328125, -26.2431640625, -24.40771484375, -22.572265625, -20.73681640625, -18.9013671875, -17.06591796875, -15.23046875, -13.39501953125, -11.5595703125, -9.72412109375, -7.888671875, -6.05322265625, -4.2177734375, -2.38232421875, -0.546875, 1.28857421875, 3.1240234375, 4.95947265625, 6.794921875, 8.63037109375, 10.4658203125, 12.30126953125, 14.13671875, 15.97216796875, 17.8076171875, 19.64306640625, 21.478515625, 23.31396484375, 25.1494140625, 26.98486328125, 28.8203125, 30.65576171875, 32.4912109375, 34.32666015625, 36.162109375, 37.99755859375, 39.8330078125, 41.66845703125, 43.50390625, 45.33935546875, 47.1748046875, 49.01025390625, 50.845703125, 52.68115234375, 54.5166015625, 56.35205078125, 58.1875]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 2.0, 1.0, 4.0, 3.0, 4.0, 6.0, 8.0, 11.0, 9.0, 21.0, 11.0, 24.0, 30.0, 34.0, 26.0, 35.0, 54.0, 64.0, 93.0, 148.0, 241.0, 452.0, 1090.0, 2693.0, 8453.0, 29725.0, 155251.0, 3728229.0, 215283.0, 36396.0, 9951.0, 3345.0, 1228.0, 514.0, 240.0, 143.0, 101.0, 76.0, 50.0, 33.0, 43.0, 27.0, 18.0, 22.0, 21.0, 16.0, 23.0, 8.0, 9.0, 5.0, 4.0, 4.0, 4.0, 4.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-171.0, -165.583984375, -160.16796875, -154.751953125, -149.3359375, -143.919921875, -138.50390625, -133.087890625, -127.671875, -122.255859375, -116.83984375, -111.423828125, -106.0078125, -100.591796875, -95.17578125, -89.759765625, -84.34375, -78.927734375, -73.51171875, -68.095703125, -62.6796875, -57.263671875, -51.84765625, -46.431640625, -41.015625, -35.599609375, -30.18359375, -24.767578125, -19.3515625, -13.935546875, -8.51953125, -3.103515625, 2.3125, 7.728515625, 13.14453125, 18.560546875, 23.9765625, 29.392578125, 34.80859375, 40.224609375, 45.640625, 51.056640625, 56.47265625, 61.888671875, 67.3046875, 72.720703125, 78.13671875, 83.552734375, 88.96875, 94.384765625, 99.80078125, 105.216796875, 110.6328125, 116.048828125, 121.46484375, 126.880859375, 132.296875, 137.712890625, 143.12890625, 148.544921875, 153.9609375, 159.376953125, 164.79296875, 170.208984375, 175.625]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 9.0, 8.0, 13.0, 16.0, 20.0, 34.0, 50.0, 105.0, 191.0, 240.0, 119.0, 66.0, 59.0, 24.0, 12.0, 17.0, 9.0, 9.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-125.90673828125, -118.60746002197266, -111.30818176269531, -104.00889587402344, -96.7096176147461, -89.41033935546875, -82.1110610961914, -74.81178283691406, -67.51249694824219, -60.213218688964844, -52.913936614990234, -45.61465835571289, -38.31537628173828, -31.016098022460938, -23.716819763183594, -16.417537689208984, -9.118263244628906, -1.818983554840088, 5.4802961349487305, 12.77957534790039, 20.078855514526367, 27.378135681152344, 34.67741394042969, 41.9766960144043, 49.27597427368164, 56.575252532958984, 63.874534606933594, 71.17381286621094, 78.47309112548828, 85.77236938476562, 93.0716552734375, 100.37093353271484, 107.67021179199219, 114.96949005126953, 122.26876831054688, 129.56805419921875, 136.86732482910156, 144.16661071777344, 151.46588134765625, 158.76516723632812, 166.064453125, 173.36373901367188, 180.6630096435547, 187.96229553222656, 195.26156616210938, 202.56085205078125, 209.86013793945312, 217.15940856933594, 224.45867919921875, 231.75796508789062, 239.05723571777344, 246.3565216064453, 253.65579223632812, 260.955078125, 268.2543640136719, 275.55364990234375, 282.8529357910156, 290.1522216796875, 297.4515075683594, 304.7507629394531, 312.050048828125, 319.3493347167969, 326.64862060546875, 333.9479064941406, 341.2471618652344]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 6.0, 9.0, 8.0, 9.0, 9.0, 8.0, 11.0, 16.0, 29.0, 25.0, 24.0, 27.0, 23.0, 37.0, 26.0, 44.0, 44.0, 43.0, 43.0, 52.0, 46.0, 39.0, 47.0, 40.0, 26.0, 40.0, 35.0, 28.0, 37.0, 28.0, 34.0, 21.0, 11.0, 20.0, 11.0, 10.0, 10.0, 14.0, 6.0, 6.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-201.2471466064453, -194.98915100097656, -188.73114013671875, -182.47314453125, -176.21514892578125, -169.95713806152344, -163.6991424560547, -157.44113159179688, -151.18313598632812, -144.92514038085938, -138.66712951660156, -132.4091339111328, -126.15113067626953, -119.89312744140625, -113.6351318359375, -107.37712860107422, -101.11913299560547, -94.86112976074219, -88.60313415527344, -82.34513092041016, -76.08712768554688, -69.82913208007812, -63.571128845214844, -57.31312561035156, -51.05512619018555, -44.79712677001953, -38.53912353515625, -32.281124114990234, -26.023122787475586, -19.765121459960938, -13.507122039794922, -7.249118804931641, -0.991119384765625, 5.266881465911865, 11.524882316589355, 17.782882690429688, 24.040884017944336, 30.298885345458984, 36.556884765625, 42.81488800048828, 49.0728874206543, 55.33088684082031, 61.588890075683594, 67.84689331054688, 74.10488891601562, 80.3628921508789, 86.62089538574219, 92.87889099121094, 99.13689422607422, 105.3948974609375, 111.65289306640625, 117.91089630126953, 124.16889953613281, 130.42689514160156, 136.68490600585938, 142.94290161132812, 149.20089721679688, 155.45889282226562, 161.71690368652344, 167.9748992919922, 174.23289489746094, 180.49090576171875, 186.7489013671875, 193.00689697265625, 199.26490783691406]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 1.0, 2.0, 8.0, 6.0, 4.0, 6.0, 11.0, 17.0, 15.0, 26.0, 33.0, 31.0, 34.0, 35.0, 45.0, 59.0, 75.0, 70.0, 64.0, 81.0, 48.0, 50.0, 53.0, 46.0, 26.0, 26.0, 20.0, 28.0, 16.0, 16.0, 13.0, 13.0, 9.0, 9.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-23.203125, -22.6290283203125, -22.054931640625, -21.4808349609375, -20.90673828125, -20.3326416015625, -19.758544921875, -19.1844482421875, -18.6103515625, -18.0362548828125, -17.462158203125, -16.8880615234375, -16.31396484375, -15.7398681640625, -15.165771484375, -14.5916748046875, -14.017578125, -13.4434814453125, -12.869384765625, -12.2952880859375, -11.72119140625, -11.1470947265625, -10.572998046875, -9.9989013671875, -9.4248046875, -8.8507080078125, -8.276611328125, -7.7025146484375, -7.12841796875, -6.5543212890625, -5.980224609375, -5.4061279296875, -4.83203125, -4.2579345703125, -3.683837890625, -3.1097412109375, -2.53564453125, -1.9615478515625, -1.387451171875, -0.8133544921875, -0.2392578125, 0.3348388671875, 0.908935546875, 1.4830322265625, 2.05712890625, 2.6312255859375, 3.205322265625, 3.7794189453125, 4.353515625, 4.9276123046875, 5.501708984375, 6.0758056640625, 6.64990234375, 7.2239990234375, 7.798095703125, 8.3721923828125, 8.9462890625, 9.5203857421875, 10.094482421875, 10.6685791015625, 11.24267578125, 11.8167724609375, 12.390869140625, 12.9649658203125, 13.5390625]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 4.0, 4.0, 8.0, 10.0, 11.0, 15.0, 29.0, 32.0, 48.0, 77.0, 146.0, 278.0, 482.0, 986.0, 1836.0, 3659.0, 7567.0, 15823.0, 35311.0, 90968.0, 302783.0, 390622.0, 117781.0, 43274.0, 18753.0, 9055.0, 4372.0, 2231.0, 1115.0, 533.0, 320.0, 158.0, 99.0, 60.0, 36.0, 25.0, 15.0, 5.0, 10.0, 10.0, 6.0, 6.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9140625, -0.8776702880859375, -0.841278076171875, -0.8048858642578125, -0.76849365234375, -0.7321014404296875, -0.695709228515625, -0.6593170166015625, -0.6229248046875, -0.5865325927734375, -0.550140380859375, -0.5137481689453125, -0.47735595703125, -0.4409637451171875, -0.404571533203125, -0.3681793212890625, -0.331787109375, -0.2953948974609375, -0.259002685546875, -0.2226104736328125, -0.18621826171875, -0.1498260498046875, -0.113433837890625, -0.0770416259765625, -0.0406494140625, -0.0042572021484375, 0.032135009765625, 0.0685272216796875, 0.10491943359375, 0.1413116455078125, 0.177703857421875, 0.2140960693359375, 0.25048828125, 0.2868804931640625, 0.323272705078125, 0.3596649169921875, 0.39605712890625, 0.4324493408203125, 0.468841552734375, 0.5052337646484375, 0.5416259765625, 0.5780181884765625, 0.614410400390625, 0.6508026123046875, 0.68719482421875, 0.7235870361328125, 0.759979248046875, 0.7963714599609375, 0.832763671875, 0.8691558837890625, 0.905548095703125, 0.9419403076171875, 0.97833251953125, 1.0147247314453125, 1.051116943359375, 1.0875091552734375, 1.1239013671875, 1.1602935791015625, 1.196685791015625, 1.2330780029296875, 1.26947021484375, 1.3058624267578125, 1.342254638671875, 1.3786468505859375, 1.4150390625]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 3.0, 4.0, 7.0, 9.0, 7.0, 9.0, 15.0, 17.0, 7.0, 21.0, 26.0, 17.0, 27.0, 27.0, 36.0, 30.0, 38.0, 34.0, 43.0, 45.0, 47.0, 44.0, 1062.0, 36.0, 30.0, 32.0, 41.0, 24.0, 38.0, 31.0, 20.0, 31.0, 25.0, 21.0, 21.0, 26.0, 5.0, 12.0, 17.0, 10.0, 7.0, 5.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-8.609375, -8.340576171875, -8.07177734375, -7.802978515625, -7.5341796875, -7.265380859375, -6.99658203125, -6.727783203125, -6.458984375, -6.190185546875, -5.92138671875, -5.652587890625, -5.3837890625, -5.114990234375, -4.84619140625, -4.577392578125, -4.30859375, -4.039794921875, -3.77099609375, -3.502197265625, -3.2333984375, -2.964599609375, -2.69580078125, -2.427001953125, -2.158203125, -1.889404296875, -1.62060546875, -1.351806640625, -1.0830078125, -0.814208984375, -0.54541015625, -0.276611328125, -0.0078125, 0.260986328125, 0.52978515625, 0.798583984375, 1.0673828125, 1.336181640625, 1.60498046875, 1.873779296875, 2.142578125, 2.411376953125, 2.68017578125, 2.948974609375, 3.2177734375, 3.486572265625, 3.75537109375, 4.024169921875, 4.29296875, 4.561767578125, 4.83056640625, 5.099365234375, 5.3681640625, 5.636962890625, 5.90576171875, 6.174560546875, 6.443359375, 6.712158203125, 6.98095703125, 7.249755859375, 7.5185546875, 7.787353515625, 8.05615234375, 8.324951171875, 8.59375]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 9.0, 6.0, 8.0, 17.0, 15.0, 30.0, 55.0, 58.0, 93.0, 148.0, 193.0, 250.0, 351.0, 507.0, 724.0, 1014.0, 1416.0, 1956.0, 2931.0, 4078.0, 5789.0, 8300.0, 11923.0, 16859.0, 25351.0, 38396.0, 59914.0, 99510.0, 177281.0, 1271767.0, 137788.0, 79461.0, 48913.0, 31960.0, 21346.0, 14647.0, 10107.0, 7077.0, 4983.0, 3521.0, 2392.0, 1774.0, 1273.0, 867.0, 600.0, 407.0, 295.0, 230.0, 163.0, 125.0, 94.0, 56.0, 30.0, 27.0, 16.0, 15.0, 20.0, 5.0, 4.0, 0.0, 2.0], "bins": [-0.525390625, -0.5091171264648438, -0.4928436279296875, -0.47657012939453125, -0.460296630859375, -0.44402313232421875, -0.4277496337890625, -0.41147613525390625, -0.39520263671875, -0.37892913818359375, -0.3626556396484375, -0.34638214111328125, -0.330108642578125, -0.31383514404296875, -0.2975616455078125, -0.28128814697265625, -0.2650146484375, -0.24874114990234375, -0.2324676513671875, -0.21619415283203125, -0.199920654296875, -0.18364715576171875, -0.1673736572265625, -0.15110015869140625, -0.13482666015625, -0.11855316162109375, -0.1022796630859375, -0.08600616455078125, -0.069732666015625, -0.05345916748046875, -0.0371856689453125, -0.02091217041015625, -0.004638671875, 0.01163482666015625, 0.0279083251953125, 0.04418182373046875, 0.060455322265625, 0.07672882080078125, 0.0930023193359375, 0.10927581787109375, 0.12554931640625, 0.14182281494140625, 0.1580963134765625, 0.17436981201171875, 0.190643310546875, 0.20691680908203125, 0.2231903076171875, 0.23946380615234375, 0.2557373046875, 0.27201080322265625, 0.2882843017578125, 0.30455780029296875, 0.320831298828125, 0.33710479736328125, 0.3533782958984375, 0.36965179443359375, 0.38592529296875, 0.40219879150390625, 0.4184722900390625, 0.43474578857421875, 0.451019287109375, 0.46729278564453125, 0.4835662841796875, 0.49983978271484375, 0.51611328125]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 5.0, 0.0, 10.0, 10.0, 6.0, 4.0, 7.0, 10.0, 17.0, 23.0, 19.0, 24.0, 18.0, 24.0, 34.0, 41.0, 34.0, 41.0, 49.0, 51.0, 37.0, 37.0, 43.0, 49.0, 39.0, 49.0, 47.0, 35.0, 41.0, 26.0, 27.0, 16.0, 20.0, 18.0, 13.0, 10.0, 12.0, 8.0, 8.0, 5.0, 6.0, 7.0, 4.0, 8.0, 6.0, 0.0, 4.0, 0.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.0017871856689453125, -0.001730591058731079, -0.0016739964485168457, -0.0016174018383026123, -0.001560807228088379, -0.0015042126178741455, -0.0014476180076599121, -0.0013910233974456787, -0.0013344287872314453, -0.001277834177017212, -0.0012212395668029785, -0.0011646449565887451, -0.0011080503463745117, -0.0010514557361602783, -0.000994861125946045, -0.0009382665157318115, -0.0008816719055175781, -0.0008250772953033447, -0.0007684826850891113, -0.0007118880748748779, -0.0006552934646606445, -0.0005986988544464111, -0.0005421042442321777, -0.00048550963401794434, -0.00042891502380371094, -0.00037232041358947754, -0.00031572580337524414, -0.00025913119316101074, -0.00020253658294677734, -0.00014594197273254395, -8.934736251831055e-05, -3.275275230407715e-05, 2.384185791015625e-05, 8.043646812438965e-05, 0.00013703107833862305, 0.00019362568855285645, 0.00025022029876708984, 0.00030681490898132324, 0.00036340951919555664, 0.00042000412940979004, 0.00047659873962402344, 0.0005331933498382568, 0.0005897879600524902, 0.0006463825702667236, 0.000702977180480957, 0.0007595717906951904, 0.0008161664009094238, 0.0008727610111236572, 0.0009293556213378906, 0.000985950231552124, 0.0010425448417663574, 0.0010991394519805908, 0.0011557340621948242, 0.0012123286724090576, 0.001268923282623291, 0.0013255178928375244, 0.0013821125030517578, 0.0014387071132659912, 0.0014953017234802246, 0.001551896333694458, 0.0016084909439086914, 0.0016650855541229248, 0.0017216801643371582, 0.0017782747745513916, 0.001834869384765625]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 3.0, 5.0, 2.0, 1.0, 6.0, 9.0, 6.0, 6.0, 4.0, 12.0, 20.0, 17.0, 21.0, 14.0, 24.0, 33.0, 34.0, 38.0, 55.0, 77.0, 62.0, 69.0, 78.0, 92.0, 117.0, 140.0, 222.0, 341.0, 895.0, 11178.0, 898856.0, 131620.0, 2613.0, 560.0, 268.0, 157.0, 155.0, 114.0, 106.0, 76.0, 67.0, 52.0, 47.0, 35.0, 53.0, 19.0, 26.0, 20.0, 20.0, 25.0, 13.0, 17.0, 13.0, 16.0, 11.0, 4.0, 7.0, 8.0, 4.0, 1.0, 4.0, 3.0, 2.0], "bins": [-0.0301361083984375, -0.029187679290771484, -0.02823925018310547, -0.027290821075439453, -0.026342391967773438, -0.025393962860107422, -0.024445533752441406, -0.02349710464477539, -0.022548675537109375, -0.02160024642944336, -0.020651817321777344, -0.019703388214111328, -0.018754959106445312, -0.017806529998779297, -0.01685810089111328, -0.015909671783447266, -0.01496124267578125, -0.014012813568115234, -0.013064384460449219, -0.012115955352783203, -0.011167526245117188, -0.010219097137451172, -0.009270668029785156, -0.00832223892211914, -0.007373809814453125, -0.006425380706787109, -0.005476951599121094, -0.004528522491455078, -0.0035800933837890625, -0.002631664276123047, -0.0016832351684570312, -0.0007348060607910156, 0.000213623046875, 0.0011620521545410156, 0.0021104812622070312, 0.003058910369873047, 0.0040073394775390625, 0.004955768585205078, 0.005904197692871094, 0.006852626800537109, 0.007801055908203125, 0.00874948501586914, 0.009697914123535156, 0.010646343231201172, 0.011594772338867188, 0.012543201446533203, 0.013491630554199219, 0.014440059661865234, 0.01538848876953125, 0.016336917877197266, 0.01728534698486328, 0.018233776092529297, 0.019182205200195312, 0.020130634307861328, 0.021079063415527344, 0.02202749252319336, 0.022975921630859375, 0.02392435073852539, 0.024872779846191406, 0.025821208953857422, 0.026769638061523438, 0.027718067169189453, 0.02866649627685547, 0.029614925384521484, 0.0305633544921875]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 13.0, 102.0, 803.0, 88.0, 10.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.016998164355754852, -0.016654565930366516, -0.01631096936762333, -0.015967370942234993, -0.015623772516846657, -0.015280175022780895, -0.014936577528715134, -0.014592979103326797, -0.014249381609261036, -0.013905784115195274, -0.013562185689806938, -0.013218588195741177, -0.01287498977035284, -0.012531392276287079, -0.012187793850898743, -0.011844196356832981, -0.01150059886276722, -0.011157001368701458, -0.010813402943313122, -0.01046980544924736, -0.010126207023859024, -0.009782609529793262, -0.009439012035727501, -0.009095413610339165, -0.008751815184950829, -0.008408217690885067, -0.00806461926549673, -0.007721021771430969, -0.00737742381170392, -0.0070338258519768715, -0.006690227892249823, -0.006346629932522774, -0.006003032438457012, -0.005659434478729963, -0.005315836519002914, -0.004972239024937153, -0.004628641065210104, -0.004285043105483055, -0.003941445145756006, -0.003597847418859601, -0.003254249459132552, -0.0029106514994055033, -0.002567053772509098, -0.002223455812782049, -0.0018798579694703221, -0.001536260126158595, -0.0011926621664315462, -0.000849064439535141, -0.0005054664798080921, -0.00016186860739253461, 0.0001817292650230229, 0.0005253271665424109, 0.0008689250098541379, 0.001212522853165865, 0.0015561208128929138, 0.001899718539789319, 0.002243316499516368, 0.002586914459243417, 0.002930512186139822, 0.003274110145866871, 0.0036177081055939198, 0.003961306065320969, 0.00430490355938673, 0.004648501519113779, 0.004992099478840828]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 1.0, 3.0, 2.0, 2.0, 6.0, 7.0, 15.0, 10.0, 15.0, 17.0, 15.0, 16.0, 25.0, 25.0, 27.0, 29.0, 25.0, 31.0, 42.0, 35.0, 46.0, 37.0, 37.0, 33.0, 32.0, 42.0, 51.0, 37.0, 34.0, 46.0, 29.0, 26.0, 33.0, 24.0, 19.0, 17.0, 14.0, 14.0, 15.0, 11.0, 13.0, 15.0, 5.0, 8.0, 4.0, 6.0, 3.0, 5.0, 3.0, 2.0, 3.0, 0.0, 2.0], "bins": [-0.001232743263244629, -0.0011970698833465576, -0.0011613965034484863, -0.001125723123550415, -0.0010900497436523438, -0.0010543763637542725, -0.0010187029838562012, -0.0009830296039581299, -0.0009473562240600586, -0.0009116828441619873, -0.000876009464263916, -0.0008403360843658447, -0.0008046627044677734, -0.0007689893245697021, -0.0007333159446716309, -0.0006976425647735596, -0.0006619691848754883, -0.000626295804977417, -0.0005906224250793457, -0.0005549490451812744, -0.0005192756652832031, -0.00048360228538513184, -0.00044792890548706055, -0.00041225552558898926, -0.00037658214569091797, -0.0003409087657928467, -0.0003052353858947754, -0.0002695620059967041, -0.0002338886260986328, -0.00019821524620056152, -0.00016254186630249023, -0.00012686848640441895, -9.119510650634766e-05, -5.552172660827637e-05, -1.9848346710205078e-05, 1.582503318786621e-05, 5.14984130859375e-05, 8.717179298400879e-05, 0.00012284517288208008, 0.00015851855278015137, 0.00019419193267822266, 0.00022986531257629395, 0.00026553869247436523, 0.0003012120723724365, 0.0003368854522705078, 0.0003725588321685791, 0.0004082322120666504, 0.0004439055919647217, 0.00047957897186279297, 0.0005152523517608643, 0.0005509257316589355, 0.0005865991115570068, 0.0006222724914550781, 0.0006579458713531494, 0.0006936192512512207, 0.000729292631149292, 0.0007649660110473633, 0.0008006393909454346, 0.0008363127708435059, 0.0008719861507415771, 0.0009076595306396484, 0.0009433329105377197, 0.000979006290435791, 0.0010146796703338623, 0.0010503530502319336]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 1.0, 2.0, 8.0, 6.0, 4.0, 6.0, 11.0, 17.0, 15.0, 26.0, 33.0, 31.0, 34.0, 35.0, 45.0, 59.0, 75.0, 70.0, 64.0, 81.0, 48.0, 50.0, 53.0, 46.0, 26.0, 26.0, 20.0, 28.0, 16.0, 16.0, 13.0, 13.0, 9.0, 9.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-23.203125, -22.6290283203125, -22.054931640625, -21.4808349609375, -20.90673828125, -20.3326416015625, -19.758544921875, -19.1844482421875, -18.6103515625, -18.0362548828125, -17.462158203125, -16.8880615234375, -16.31396484375, -15.7398681640625, -15.165771484375, -14.5916748046875, -14.017578125, -13.4434814453125, -12.869384765625, -12.2952880859375, -11.72119140625, -11.1470947265625, -10.572998046875, -9.9989013671875, -9.4248046875, -8.8507080078125, -8.276611328125, -7.7025146484375, -7.12841796875, -6.5543212890625, -5.980224609375, -5.4061279296875, -4.83203125, -4.2579345703125, -3.683837890625, -3.1097412109375, -2.53564453125, -1.9615478515625, -1.387451171875, -0.8133544921875, -0.2392578125, 0.3348388671875, 0.908935546875, 1.4830322265625, 2.05712890625, 2.6312255859375, 3.205322265625, 3.7794189453125, 4.353515625, 4.9276123046875, 5.501708984375, 6.0758056640625, 6.64990234375, 7.2239990234375, 7.798095703125, 8.3721923828125, 8.9462890625, 9.5203857421875, 10.094482421875, 10.6685791015625, 11.24267578125, 11.8167724609375, 12.390869140625, 12.9649658203125, 13.5390625]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 5.0, 12.0, 18.0, 26.0, 48.0, 52.0, 120.0, 166.0, 250.0, 389.0, 705.0, 1297.0, 2091.0, 3753.0, 7717.0, 20928.0, 109099.0, 789731.0, 79444.0, 17472.0, 7041.0, 3454.0, 1843.0, 1088.0, 682.0, 416.0, 269.0, 166.0, 98.0, 66.0, 39.0, 21.0, 16.0, 9.0, 9.0, 3.0, 6.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-71.375, -69.3603515625, -67.345703125, -65.3310546875, -63.31640625, -61.3017578125, -59.287109375, -57.2724609375, -55.2578125, -53.2431640625, -51.228515625, -49.2138671875, -47.19921875, -45.1845703125, -43.169921875, -41.1552734375, -39.140625, -37.1259765625, -35.111328125, -33.0966796875, -31.08203125, -29.0673828125, -27.052734375, -25.0380859375, -23.0234375, -21.0087890625, -18.994140625, -16.9794921875, -14.96484375, -12.9501953125, -10.935546875, -8.9208984375, -6.90625, -4.8916015625, -2.876953125, -0.8623046875, 1.15234375, 3.1669921875, 5.181640625, 7.1962890625, 9.2109375, 11.2255859375, 13.240234375, 15.2548828125, 17.26953125, 19.2841796875, 21.298828125, 23.3134765625, 25.328125, 27.3427734375, 29.357421875, 31.3720703125, 33.38671875, 35.4013671875, 37.416015625, 39.4306640625, 41.4453125, 43.4599609375, 45.474609375, 47.4892578125, 49.50390625, 51.5185546875, 53.533203125, 55.5478515625, 57.5625]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 4.0, 6.0, 8.0, 7.0, 9.0, 11.0, 11.0, 16.0, 23.0, 23.0, 21.0, 25.0, 34.0, 38.0, 36.0, 43.0, 45.0, 43.0, 65.0, 88.0, 1866.0, 145.0, 72.0, 48.0, 53.0, 41.0, 38.0, 33.0, 29.0, 24.0, 23.0, 19.0, 14.0, 17.0, 9.0, 11.0, 15.0, 6.0, 7.0, 6.0, 1.0, 5.0, 6.0, 1.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-49.34375, -47.8779296875, -46.412109375, -44.9462890625, -43.48046875, -42.0146484375, -40.548828125, -39.0830078125, -37.6171875, -36.1513671875, -34.685546875, -33.2197265625, -31.75390625, -30.2880859375, -28.822265625, -27.3564453125, -25.890625, -24.4248046875, -22.958984375, -21.4931640625, -20.02734375, -18.5615234375, -17.095703125, -15.6298828125, -14.1640625, -12.6982421875, -11.232421875, -9.7666015625, -8.30078125, -6.8349609375, -5.369140625, -3.9033203125, -2.4375, -0.9716796875, 0.494140625, 1.9599609375, 3.42578125, 4.8916015625, 6.357421875, 7.8232421875, 9.2890625, 10.7548828125, 12.220703125, 13.6865234375, 15.15234375, 16.6181640625, 18.083984375, 19.5498046875, 21.015625, 22.4814453125, 23.947265625, 25.4130859375, 26.87890625, 28.3447265625, 29.810546875, 31.2763671875, 32.7421875, 34.2080078125, 35.673828125, 37.1396484375, 38.60546875, 40.0712890625, 41.537109375, 43.0029296875, 44.46875]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 3.0, 4.0, 6.0, 1.0, 4.0, 6.0, 6.0, 7.0, 16.0, 6.0, 10.0, 16.0, 16.0, 19.0, 23.0, 23.0, 40.0, 48.0, 59.0, 94.0, 206.0, 520.0, 3208.0, 3032694.0, 106368.0, 1388.0, 376.0, 157.0, 82.0, 57.0, 38.0, 34.0, 30.0, 25.0, 18.0, 19.0, 20.0, 8.0, 15.0, 7.0, 11.0, 8.0, 1.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-212.625, -205.728515625, -198.83203125, -191.935546875, -185.0390625, -178.142578125, -171.24609375, -164.349609375, -157.453125, -150.556640625, -143.66015625, -136.763671875, -129.8671875, -122.970703125, -116.07421875, -109.177734375, -102.28125, -95.384765625, -88.48828125, -81.591796875, -74.6953125, -67.798828125, -60.90234375, -54.005859375, -47.109375, -40.212890625, -33.31640625, -26.419921875, -19.5234375, -12.626953125, -5.73046875, 1.166015625, 8.0625, 14.958984375, 21.85546875, 28.751953125, 35.6484375, 42.544921875, 49.44140625, 56.337890625, 63.234375, 70.130859375, 77.02734375, 83.923828125, 90.8203125, 97.716796875, 104.61328125, 111.509765625, 118.40625, 125.302734375, 132.19921875, 139.095703125, 145.9921875, 152.888671875, 159.78515625, 166.681640625, 173.578125, 180.474609375, 187.37109375, 194.267578125, 201.1640625, 208.060546875, 214.95703125, 221.853515625, 228.75]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 67.0, 556.0, 364.0, 23.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-247.14572143554688, -237.601806640625, -228.05789184570312, -218.51397705078125, -208.97006225585938, -199.4261474609375, -189.88223266601562, -180.33831787109375, -170.79440307617188, -161.25048828125, -151.70657348632812, -142.16265869140625, -132.61874389648438, -123.0748291015625, -113.5309066772461, -103.98699188232422, -94.44306945800781, -84.89915466308594, -75.35523986816406, -65.81132507324219, -56.26740646362305, -46.72349166870117, -37.17957305908203, -27.635658264160156, -18.09174346923828, -8.54782772064209, 0.9960880279541016, 10.54000473022461, 20.083919525146484, 29.62783432006836, 39.1717529296875, 48.715667724609375, 58.25958251953125, 67.80349731445312, 77.347412109375, 86.89132690429688, 96.43524169921875, 105.97915649414062, 115.52307891845703, 125.0669937133789, 134.61090087890625, 144.15481567382812, 153.69873046875, 163.24264526367188, 172.78656005859375, 182.33047485351562, 191.8743896484375, 201.41830444335938, 210.9622344970703, 220.5061492919922, 230.05006408691406, 239.59397888183594, 249.1378936767578, 258.68182373046875, 268.2257385253906, 277.7696533203125, 287.3135681152344, 296.85748291015625, 306.4013977050781, 315.9453125, 325.4892272949219, 335.03314208984375, 344.5770568847656, 354.1209716796875, 363.6648864746094]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 5.0, 3.0, 5.0, 5.0, 6.0, 9.0, 8.0, 19.0, 13.0, 16.0, 21.0, 16.0, 18.0, 32.0, 36.0, 29.0, 32.0, 44.0, 46.0, 45.0, 34.0, 35.0, 33.0, 45.0, 51.0, 40.0, 36.0, 33.0, 42.0, 29.0, 33.0, 16.0, 24.0, 26.0, 21.0, 22.0, 19.0, 11.0, 8.0, 8.0, 7.0, 6.0, 5.0, 2.0, 5.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0], "bins": [-162.52908325195312, -157.9332733154297, -153.33746337890625, -148.74163818359375, -144.1458282470703, -139.55001831054688, -134.95420837402344, -130.3583984375, -125.7625732421875, -121.16676330566406, -116.5709457397461, -111.97513580322266, -107.37931823730469, -102.78350830078125, -98.18769836425781, -93.59188079833984, -88.9960708618164, -84.40026092529297, -79.804443359375, -75.20863342285156, -70.6128158569336, -66.01700592041016, -61.42119216918945, -56.82537841796875, -52.22956466674805, -47.633750915527344, -43.03793716430664, -38.44212341308594, -33.8463134765625, -29.250497817993164, -24.654685974121094, -20.05887222290039, -15.463058471679688, -10.867244720458984, -6.271431922912598, -1.675619125366211, 2.920194625854492, 7.516008377075195, 12.111820220947266, 16.70763397216797, 21.303447723388672, 25.899261474609375, 30.495075225830078, 35.09088897705078, 39.68669891357422, 44.28251647949219, 48.878326416015625, 53.47414016723633, 58.06995391845703, 62.665767669677734, 67.26158142089844, 71.85739135742188, 76.45320892333984, 81.04901885986328, 85.64483642578125, 90.24064636230469, 94.83645629882812, 99.43226623535156, 104.02808380126953, 108.62389373779297, 113.21971130371094, 117.81552124023438, 122.41133117675781, 127.00714874267578, 131.60296630859375]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 6.0, 4.0, 2.0, 6.0, 10.0, 10.0, 17.0, 23.0, 30.0, 34.0, 30.0, 33.0, 34.0, 54.0, 64.0, 68.0, 83.0, 67.0, 58.0, 66.0, 55.0, 35.0, 34.0, 33.0, 29.0, 17.0, 20.0, 21.0, 10.0, 19.0, 10.0, 4.0, 14.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-24.65625, -24.040283203125, -23.42431640625, -22.808349609375, -22.1923828125, -21.576416015625, -20.96044921875, -20.344482421875, -19.728515625, -19.112548828125, -18.49658203125, -17.880615234375, -17.2646484375, -16.648681640625, -16.03271484375, -15.416748046875, -14.80078125, -14.184814453125, -13.56884765625, -12.952880859375, -12.3369140625, -11.720947265625, -11.10498046875, -10.489013671875, -9.873046875, -9.257080078125, -8.64111328125, -8.025146484375, -7.4091796875, -6.793212890625, -6.17724609375, -5.561279296875, -4.9453125, -4.329345703125, -3.71337890625, -3.097412109375, -2.4814453125, -1.865478515625, -1.24951171875, -0.633544921875, -0.017578125, 0.598388671875, 1.21435546875, 1.830322265625, 2.4462890625, 3.062255859375, 3.67822265625, 4.294189453125, 4.91015625, 5.526123046875, 6.14208984375, 6.758056640625, 7.3740234375, 7.989990234375, 8.60595703125, 9.221923828125, 9.837890625, 10.453857421875, 11.06982421875, 11.685791015625, 12.3017578125, 12.917724609375, 13.53369140625, 14.149658203125, 14.765625]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 6.0, 1.0, 7.0, 4.0, 7.0, 6.0, 13.0, 24.0, 9.0, 29.0, 41.0, 57.0, 81.0, 104.0, 183.0, 246.0, 366.0, 570.0, 850.0, 1403.0, 2181.0, 3745.0, 6359.0, 11639.0, 22950.0, 53076.0, 655125.0, 3283281.0, 85628.0, 30613.0, 15263.0, 8198.0, 4792.0, 2820.0, 1695.0, 1097.0, 668.0, 430.0, 268.0, 185.0, 99.0, 67.0, 41.0, 25.0, 15.0, 4.0, 4.0, 5.0, 0.0, 3.0, 2.0], "bins": [-92.375, -90.076171875, -87.77734375, -85.478515625, -83.1796875, -80.880859375, -78.58203125, -76.283203125, -73.984375, -71.685546875, -69.38671875, -67.087890625, -64.7890625, -62.490234375, -60.19140625, -57.892578125, -55.59375, -53.294921875, -50.99609375, -48.697265625, -46.3984375, -44.099609375, -41.80078125, -39.501953125, -37.203125, -34.904296875, -32.60546875, -30.306640625, -28.0078125, -25.708984375, -23.41015625, -21.111328125, -18.8125, -16.513671875, -14.21484375, -11.916015625, -9.6171875, -7.318359375, -5.01953125, -2.720703125, -0.421875, 1.876953125, 4.17578125, 6.474609375, 8.7734375, 11.072265625, 13.37109375, 15.669921875, 17.96875, 20.267578125, 22.56640625, 24.865234375, 27.1640625, 29.462890625, 31.76171875, 34.060546875, 36.359375, 38.658203125, 40.95703125, 43.255859375, 45.5546875, 47.853515625, 50.15234375, 52.451171875, 54.75]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 1.0, 2.0, 4.0, 8.0, 11.0, 8.0, 18.0, 15.0, 10.0, 18.0, 14.0, 19.0, 22.0, 53.0, 44.0, 38.0, 59.0, 96.0, 224.0, 619.0, 1329.0, 747.0, 282.0, 107.0, 62.0, 44.0, 31.0, 25.0, 28.0, 24.0, 16.0, 16.0, 18.0, 22.0, 9.0, 4.0, 6.0, 2.0, 9.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-59.6875, -57.734375, -55.78125, -53.828125, -51.875, -49.921875, -47.96875, -46.015625, -44.0625, -42.109375, -40.15625, -38.203125, -36.25, -34.296875, -32.34375, -30.390625, -28.4375, -26.484375, -24.53125, -22.578125, -20.625, -18.671875, -16.71875, -14.765625, -12.8125, -10.859375, -8.90625, -6.953125, -5.0, -3.046875, -1.09375, 0.859375, 2.8125, 4.765625, 6.71875, 8.671875, 10.625, 12.578125, 14.53125, 16.484375, 18.4375, 20.390625, 22.34375, 24.296875, 26.25, 28.203125, 30.15625, 32.109375, 34.0625, 36.015625, 37.96875, 39.921875, 41.875, 43.828125, 45.78125, 47.734375, 49.6875, 51.640625, 53.59375, 55.546875, 57.5, 59.453125, 61.40625, 63.359375, 65.3125]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 4.0, 4.0, 3.0, 7.0, 13.0, 22.0, 33.0, 41.0, 61.0, 93.0, 140.0, 209.0, 242.0, 386.0, 585.0, 892.0, 1273.0, 1981.0, 2894.0, 4466.0, 6745.0, 10643.0, 16930.0, 29238.0, 52183.0, 120434.0, 1713136.0, 1976618.0, 124885.0, 52937.0, 29000.0, 17250.0, 10761.0, 6916.0, 4497.0, 2831.0, 1935.0, 1232.0, 832.0, 629.0, 412.0, 265.0, 190.0, 131.0, 93.0, 58.0, 54.0, 33.0, 26.0, 10.0, 10.0, 11.0, 6.0, 6.0, 2.0, 1.0, 1.0], "bins": [-85.0625, -82.5615234375, -80.060546875, -77.5595703125, -75.05859375, -72.5576171875, -70.056640625, -67.5556640625, -65.0546875, -62.5537109375, -60.052734375, -57.5517578125, -55.05078125, -52.5498046875, -50.048828125, -47.5478515625, -45.046875, -42.5458984375, -40.044921875, -37.5439453125, -35.04296875, -32.5419921875, -30.041015625, -27.5400390625, -25.0390625, -22.5380859375, -20.037109375, -17.5361328125, -15.03515625, -12.5341796875, -10.033203125, -7.5322265625, -5.03125, -2.5302734375, -0.029296875, 2.4716796875, 4.97265625, 7.4736328125, 9.974609375, 12.4755859375, 14.9765625, 17.4775390625, 19.978515625, 22.4794921875, 24.98046875, 27.4814453125, 29.982421875, 32.4833984375, 34.984375, 37.4853515625, 39.986328125, 42.4873046875, 44.98828125, 47.4892578125, 49.990234375, 52.4912109375, 54.9921875, 57.4931640625, 59.994140625, 62.4951171875, 64.99609375, 67.4970703125, 69.998046875, 72.4990234375, 75.0]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 7.0, 24.0, 60.0, 191.0, 534.0, 129.0, 46.0, 18.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1674.283935546875, -1642.9210205078125, -1611.55810546875, -1580.1951904296875, -1548.832275390625, -1517.469482421875, -1486.1065673828125, -1454.74365234375, -1423.3807373046875, -1392.017822265625, -1360.6549072265625, -1329.2919921875, -1297.92919921875, -1266.5662841796875, -1235.203369140625, -1203.8404541015625, -1172.4775390625, -1141.1146240234375, -1109.751708984375, -1078.3887939453125, -1047.02587890625, -1015.6630249023438, -984.3001708984375, -952.937255859375, -921.5743408203125, -890.21142578125, -858.8485107421875, -827.4856567382812, -796.1227416992188, -764.7598266601562, -733.39697265625, -702.0340576171875, -670.6712036132812, -639.3082885742188, -607.9454345703125, -576.58251953125, -545.2196044921875, -513.856689453125, -482.4938049316406, -451.13092041015625, -419.76800537109375, -388.40509033203125, -357.0422058105469, -325.6793212890625, -294.31640625, -262.9534912109375, -231.59060668945312, -200.2277069091797, -168.86480712890625, -137.5019073486328, -106.13900756835938, -74.77610778808594, -43.4132080078125, -12.050308227539062, 19.312591552734375, 50.67549133300781, 82.03839111328125, 113.40129089355469, 144.76419067382812, 176.12709045410156, 207.489990234375, 238.85289001464844, 270.2157897949219, 301.57867431640625, 332.94158935546875]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 3.0, 12.0, 5.0, 9.0, 10.0, 15.0, 9.0, 12.0, 19.0, 16.0, 26.0, 19.0, 30.0, 37.0, 31.0, 17.0, 27.0, 44.0, 30.0, 43.0, 34.0, 42.0, 39.0, 39.0, 35.0, 45.0, 35.0, 30.0, 41.0, 26.0, 22.0, 39.0, 31.0, 24.0, 16.0, 15.0, 17.0, 12.0, 10.0, 7.0, 6.0, 1.0, 5.0, 7.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-189.21368408203125, -183.88751220703125, -178.5613555908203, -173.2351837158203, -167.90902709960938, -162.58285522460938, -157.25669860839844, -151.93052673339844, -146.6043701171875, -141.2781982421875, -135.95204162597656, -130.62586975097656, -125.29971313476562, -119.97354125976562, -114.64737701416016, -109.32121276855469, -103.99504089355469, -98.66887664794922, -93.34271240234375, -88.01654815673828, -82.69038391113281, -77.36421203613281, -72.03804779052734, -66.71188354492188, -61.385719299316406, -56.05955505371094, -50.73339080810547, -45.407222747802734, -40.081058502197266, -34.7548942565918, -29.428728103637695, -24.102561950683594, -18.776397705078125, -13.45023250579834, -8.124067306518555, -2.7979021072387695, 2.5282630920410156, 7.854427337646484, 13.180593490600586, 18.506759643554688, 23.832923889160156, 29.159088134765625, 34.485252380371094, 39.81142044067383, 45.1375846862793, 50.463748931884766, 55.7899169921875, 61.11608123779297, 66.44224548339844, 71.7684097290039, 77.09457397460938, 82.42073822021484, 87.74690246582031, 93.07307434082031, 98.39923858642578, 103.72540283203125, 109.05156707763672, 114.37773132324219, 119.70389556884766, 125.03005981445312, 130.35623168945312, 135.68238830566406, 141.00856018066406, 146.334716796875, 151.660888671875]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 5.0, 5.0, 8.0, 7.0, 12.0, 10.0, 9.0, 21.0, 22.0, 29.0, 20.0, 32.0, 33.0, 38.0, 52.0, 47.0, 57.0, 51.0, 54.0, 47.0, 44.0, 57.0, 45.0, 38.0, 30.0, 34.0, 31.0, 26.0, 29.0, 17.0, 20.0, 12.0, 12.0, 15.0, 6.0, 6.0, 4.0, 7.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-20.234375, -19.6695556640625, -19.104736328125, -18.5399169921875, -17.97509765625, -17.4102783203125, -16.845458984375, -16.2806396484375, -15.7158203125, -15.1510009765625, -14.586181640625, -14.0213623046875, -13.45654296875, -12.8917236328125, -12.326904296875, -11.7620849609375, -11.197265625, -10.6324462890625, -10.067626953125, -9.5028076171875, -8.93798828125, -8.3731689453125, -7.808349609375, -7.2435302734375, -6.6787109375, -6.1138916015625, -5.549072265625, -4.9842529296875, -4.41943359375, -3.8546142578125, -3.289794921875, -2.7249755859375, -2.16015625, -1.5953369140625, -1.030517578125, -0.4656982421875, 0.09912109375, 0.6639404296875, 1.228759765625, 1.7935791015625, 2.3583984375, 2.9232177734375, 3.488037109375, 4.0528564453125, 4.61767578125, 5.1824951171875, 5.747314453125, 6.3121337890625, 6.876953125, 7.4417724609375, 8.006591796875, 8.5714111328125, 9.13623046875, 9.7010498046875, 10.265869140625, 10.8306884765625, 11.3955078125, 11.9603271484375, 12.525146484375, 13.0899658203125, 13.65478515625, 14.2196044921875, 14.784423828125, 15.3492431640625, 15.9140625]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 7.0, 13.0, 9.0, 16.0, 30.0, 40.0, 59.0, 77.0, 132.0, 178.0, 299.0, 452.0, 685.0, 1057.0, 1683.0, 2711.0, 4335.0, 7001.0, 11553.0, 19648.0, 34971.0, 67303.0, 151632.0, 331257.0, 215428.0, 92072.0, 44584.0, 24368.0, 14293.0, 8433.0, 5246.0, 3307.0, 2069.0, 1256.0, 798.0, 511.0, 322.0, 234.0, 161.0, 106.0, 57.0, 63.0, 29.0, 25.0, 13.0, 9.0, 8.0, 10.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.970703125, -0.9410171508789062, -0.9113311767578125, -0.8816452026367188, -0.851959228515625, -0.8222732543945312, -0.7925872802734375, -0.7629013061523438, -0.73321533203125, -0.7035293579101562, -0.6738433837890625, -0.6441574096679688, -0.614471435546875, -0.5847854614257812, -0.5550994873046875, -0.5254135131835938, -0.4957275390625, -0.46604156494140625, -0.4363555908203125, -0.40666961669921875, -0.376983642578125, -0.34729766845703125, -0.3176116943359375, -0.28792572021484375, -0.25823974609375, -0.22855377197265625, -0.1988677978515625, -0.16918182373046875, -0.139495849609375, -0.10980987548828125, -0.0801239013671875, -0.05043792724609375, -0.020751953125, 0.00893402099609375, 0.0386199951171875, 0.06830596923828125, 0.097991943359375, 0.12767791748046875, 0.1573638916015625, 0.18704986572265625, 0.21673583984375, 0.24642181396484375, 0.2761077880859375, 0.30579376220703125, 0.335479736328125, 0.36516571044921875, 0.3948516845703125, 0.42453765869140625, 0.4542236328125, 0.48390960693359375, 0.5135955810546875, 0.5432815551757812, 0.572967529296875, 0.6026535034179688, 0.6323394775390625, 0.6620254516601562, 0.69171142578125, 0.7213973999023438, 0.7510833740234375, 0.7807693481445312, 0.810455322265625, 0.8401412963867188, 0.8698272705078125, 0.8995132446289062, 0.92919921875]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 7.0, 9.0, 9.0, 16.0, 8.0, 22.0, 17.0, 26.0, 22.0, 26.0, 25.0, 39.0, 27.0, 47.0, 40.0, 57.0, 42.0, 47.0, 1073.0, 50.0, 44.0, 34.0, 31.0, 41.0, 38.0, 31.0, 38.0, 24.0, 23.0, 26.0, 14.0, 24.0, 13.0, 10.0, 10.0, 7.0, 7.0, 2.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.890625, -9.5299072265625, -9.169189453125, -8.8084716796875, -8.44775390625, -8.0870361328125, -7.726318359375, -7.3656005859375, -7.0048828125, -6.6441650390625, -6.283447265625, -5.9227294921875, -5.56201171875, -5.2012939453125, -4.840576171875, -4.4798583984375, -4.119140625, -3.7584228515625, -3.397705078125, -3.0369873046875, -2.67626953125, -2.3155517578125, -1.954833984375, -1.5941162109375, -1.2333984375, -0.8726806640625, -0.511962890625, -0.1512451171875, 0.20947265625, 0.5701904296875, 0.930908203125, 1.2916259765625, 1.65234375, 2.0130615234375, 2.373779296875, 2.7344970703125, 3.09521484375, 3.4559326171875, 3.816650390625, 4.1773681640625, 4.5380859375, 4.8988037109375, 5.259521484375, 5.6202392578125, 5.98095703125, 6.3416748046875, 6.702392578125, 7.0631103515625, 7.423828125, 7.7845458984375, 8.145263671875, 8.5059814453125, 8.86669921875, 9.2274169921875, 9.588134765625, 9.9488525390625, 10.3095703125, 10.6702880859375, 11.031005859375, 11.3917236328125, 11.75244140625, 12.1131591796875, 12.473876953125, 12.8345947265625, 13.1953125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 6.0, 7.0, 11.0, 6.0, 14.0, 23.0, 31.0, 58.0, 62.0, 102.0, 171.0, 275.0, 434.0, 703.0, 1053.0, 1740.0, 2788.0, 4264.0, 6452.0, 10065.0, 15544.0, 24556.0, 39759.0, 67017.0, 124043.0, 1283977.0, 240293.0, 111925.0, 61504.0, 36599.0, 22827.0, 14365.0, 9412.0, 6172.0, 3908.0, 2561.0, 1641.0, 1018.0, 636.0, 400.0, 250.0, 161.0, 103.0, 67.0, 38.0, 32.0, 14.0, 19.0, 9.0, 9.0, 6.0, 5.0, 2.0, 5.0, 0.0, 0.0, 1.0], "bins": [-0.75830078125, -0.7352676391601562, -0.7122344970703125, -0.6892013549804688, -0.666168212890625, -0.6431350708007812, -0.6201019287109375, -0.5970687866210938, -0.57403564453125, -0.5510025024414062, -0.5279693603515625, -0.5049362182617188, -0.481903076171875, -0.45886993408203125, -0.4358367919921875, -0.41280364990234375, -0.3897705078125, -0.36673736572265625, -0.3437042236328125, -0.32067108154296875, -0.297637939453125, -0.27460479736328125, -0.2515716552734375, -0.22853851318359375, -0.20550537109375, -0.18247222900390625, -0.1594390869140625, -0.13640594482421875, -0.113372802734375, -0.09033966064453125, -0.0673065185546875, -0.04427337646484375, -0.021240234375, 0.00179290771484375, 0.0248260498046875, 0.04785919189453125, 0.070892333984375, 0.09392547607421875, 0.1169586181640625, 0.13999176025390625, 0.16302490234375, 0.18605804443359375, 0.2090911865234375, 0.23212432861328125, 0.255157470703125, 0.27819061279296875, 0.3012237548828125, 0.32425689697265625, 0.3472900390625, 0.37032318115234375, 0.3933563232421875, 0.41638946533203125, 0.439422607421875, 0.46245574951171875, 0.4854888916015625, 0.5085220336914062, 0.53155517578125, 0.5545883178710938, 0.5776214599609375, 0.6006546020507812, 0.623687744140625, 0.6467208862304688, 0.6697540283203125, 0.6927871704101562, 0.7158203125]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 3.0, 1.0, 3.0, 4.0, 6.0, 9.0, 6.0, 6.0, 8.0, 18.0, 31.0, 22.0, 33.0, 30.0, 51.0, 49.0, 51.0, 38.0, 63.0, 60.0, 58.0, 49.0, 53.0, 38.0, 44.0, 53.0, 52.0, 27.0, 30.0, 29.0, 15.0, 10.0, 13.0, 12.0, 6.0, 9.0, 3.0, 4.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002773284912109375, -0.0026823580265045166, -0.002591431140899658, -0.0025005042552948, -0.0024095773696899414, -0.002318650484085083, -0.0022277235984802246, -0.002136796712875366, -0.002045869827270508, -0.0019549429416656494, -0.001864016056060791, -0.0017730891704559326, -0.0016821622848510742, -0.0015912353992462158, -0.0015003085136413574, -0.001409381628036499, -0.0013184547424316406, -0.0012275278568267822, -0.0011366009712219238, -0.0010456740856170654, -0.000954747200012207, -0.0008638203144073486, -0.0007728934288024902, -0.0006819665431976318, -0.0005910396575927734, -0.000500112771987915, -0.00040918588638305664, -0.00031825900077819824, -0.00022733211517333984, -0.00013640522956848145, -4.547834396362305e-05, 4.544854164123535e-05, 0.00013637542724609375, 0.00022730231285095215, 0.00031822919845581055, 0.00040915608406066895, 0.0005000829696655273, 0.0005910098552703857, 0.0006819367408752441, 0.0007728636264801025, 0.0008637905120849609, 0.0009547173976898193, 0.0010456442832946777, 0.0011365711688995361, 0.0012274980545043945, 0.001318424940109253, 0.0014093518257141113, 0.0015002787113189697, 0.0015912055969238281, 0.0016821324825286865, 0.001773059368133545, 0.0018639862537384033, 0.0019549131393432617, 0.00204584002494812, 0.0021367669105529785, 0.002227693796157837, 0.0023186206817626953, 0.0024095475673675537, 0.002500474452972412, 0.0025914013385772705, 0.002682328224182129, 0.0027732551097869873, 0.0028641819953918457, 0.002955108880996704, 0.0030460357666015625]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 1.0, 0.0, 3.0, 6.0, 4.0, 12.0, 20.0, 9.0, 30.0, 29.0, 26.0, 62.0, 85.0, 98.0, 158.0, 215.0, 330.0, 961.0, 23502.0, 1000249.0, 20712.0, 930.0, 355.0, 231.0, 145.0, 101.0, 76.0, 64.0, 27.0, 38.0, 34.0, 17.0, 8.0, 3.0, 6.0, 1.0, 13.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.0777587890625, -0.07573843002319336, -0.07371807098388672, -0.07169771194458008, -0.06967735290527344, -0.0676569938659668, -0.06563663482666016, -0.06361627578735352, -0.061595916748046875, -0.059575557708740234, -0.057555198669433594, -0.05553483963012695, -0.05351448059082031, -0.05149412155151367, -0.04947376251220703, -0.04745340347290039, -0.04543304443359375, -0.04341268539428711, -0.04139232635498047, -0.03937196731567383, -0.03735160827636719, -0.03533124923706055, -0.033310890197753906, -0.031290531158447266, -0.029270172119140625, -0.027249813079833984, -0.025229454040527344, -0.023209095001220703, -0.021188735961914062, -0.019168376922607422, -0.01714801788330078, -0.01512765884399414, -0.0131072998046875, -0.01108694076538086, -0.009066581726074219, -0.007046222686767578, -0.0050258636474609375, -0.003005504608154297, -0.0009851455688476562, 0.0010352134704589844, 0.003055572509765625, 0.005075931549072266, 0.007096290588378906, 0.009116649627685547, 0.011137008666992188, 0.013157367706298828, 0.015177726745605469, 0.01719808578491211, 0.01921844482421875, 0.02123880386352539, 0.02325916290283203, 0.025279521942138672, 0.027299880981445312, 0.029320240020751953, 0.031340599060058594, 0.033360958099365234, 0.035381317138671875, 0.037401676177978516, 0.039422035217285156, 0.0414423942565918, 0.04346275329589844, 0.04548311233520508, 0.04750347137451172, 0.04952383041381836, 0.051544189453125]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 8.0, 387.0, 592.0, 29.0, 1.0], "bins": [-0.04468172416090965, -0.04395001381635666, -0.043218307197093964, -0.04248659685254097, -0.041754886507987976, -0.04102317616343498, -0.04029146581888199, -0.03955975919961929, -0.0388280488550663, -0.038096338510513306, -0.03736463189125061, -0.03663292154669762, -0.03590121120214462, -0.03516950085759163, -0.034437790513038635, -0.03370608389377594, -0.032974373549222946, -0.03224266320466995, -0.03151095658540726, -0.030779246240854263, -0.03004753589630127, -0.029315825551748276, -0.02858411706984043, -0.027852408587932587, -0.027120698243379593, -0.0263889878988266, -0.025657279416918755, -0.02492557093501091, -0.024193860590457916, -0.023462150245904922, -0.022730441763997078, -0.021998733282089233, -0.02126702107489109, -0.020535312592983246, -0.019803602248430252, -0.01907189190387726, -0.018340183421969414, -0.01760847494006157, -0.016876764595508575, -0.01614505425095558, -0.015413345769047737, -0.014681636355817318, -0.013949926942586899, -0.01321821752935648, -0.01248650811612606, -0.011754798702895641, -0.011023089289665222, -0.010291379876434803, -0.009559670463204384, -0.008827961049973965, -0.008096251636743546, -0.007364542223513126, -0.006632832810282707, -0.005901123397052288, -0.005169413983821869, -0.00443770457059145, -0.0037059953901916742, -0.002974285976961255, -0.002242576563730836, -0.0015108671505004168, -0.0007791577372699976, -4.744832403957844e-05, 0.0006842610891908407, 0.0014159705024212599, 0.002147679915651679]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 9.0, 1.0, 4.0, 6.0, 10.0, 10.0, 18.0, 15.0, 16.0, 17.0, 23.0, 32.0, 37.0, 32.0, 34.0, 28.0, 34.0, 40.0, 53.0, 42.0, 28.0, 37.0, 48.0, 42.0, 30.0, 47.0, 44.0, 34.0, 36.0, 34.0, 20.0, 13.0, 18.0, 17.0, 12.0, 20.0, 14.0, 13.0, 13.0, 4.0, 4.0, 6.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0015085339546203613, -0.0014608250930905342, -0.001413116231560707, -0.00136540737003088, -0.0013176985085010529, -0.0012699896469712257, -0.0012222807854413986, -0.0011745719239115715, -0.0011268630623817444, -0.0010791542008519173, -0.0010314453393220901, -0.000983736477792263, -0.0009360276162624359, -0.0008883187547326088, -0.0008406098932027817, -0.0007929010316729546, -0.0007451921701431274, -0.0006974833086133003, -0.0006497744470834732, -0.0006020655855536461, -0.000554356724023819, -0.0005066478624939919, -0.00045893900096416473, -0.0004112301394343376, -0.0003635212779045105, -0.0003158124163746834, -0.00026810355484485626, -0.00022039469331502914, -0.00017268583178520203, -0.0001249769702553749, -7.726810872554779e-05, -2.9559247195720673e-05, 1.8149614334106445e-05, 6.585847586393356e-05, 0.00011356733739376068, 0.0001612761989235878, 0.00020898506045341492, 0.00025669392198324203, 0.00030440278351306915, 0.00035211164504289627, 0.0003998205065727234, 0.0004475293681025505, 0.0004952382296323776, 0.0005429470911622047, 0.0005906559526920319, 0.000638364814221859, 0.0006860736757516861, 0.0007337825372815132, 0.0007814913988113403, 0.0008292002603411674, 0.0008769091218709946, 0.0009246179834008217, 0.0009723268449306488, 0.001020035706460476, 0.001067744567990303, 0.0011154534295201302, 0.0011631622910499573, 0.0012108711525797844, 0.0012585800141096115, 0.0013062888756394386, 0.0013539977371692657, 0.0014017065986990929, 0.00144941546022892, 0.001497124321758747, 0.0015448331832885742]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 5.0, 5.0, 8.0, 7.0, 12.0, 10.0, 9.0, 21.0, 22.0, 29.0, 20.0, 32.0, 33.0, 38.0, 52.0, 47.0, 57.0, 51.0, 54.0, 47.0, 44.0, 57.0, 45.0, 38.0, 30.0, 34.0, 31.0, 26.0, 29.0, 17.0, 20.0, 12.0, 12.0, 15.0, 6.0, 6.0, 4.0, 7.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-20.234375, -19.6695556640625, -19.104736328125, -18.5399169921875, -17.97509765625, -17.4102783203125, -16.845458984375, -16.2806396484375, -15.7158203125, -15.1510009765625, -14.586181640625, -14.0213623046875, -13.45654296875, -12.8917236328125, -12.326904296875, -11.7620849609375, -11.197265625, -10.6324462890625, -10.067626953125, -9.5028076171875, -8.93798828125, -8.3731689453125, -7.808349609375, -7.2435302734375, -6.6787109375, -6.1138916015625, -5.549072265625, -4.9842529296875, -4.41943359375, -3.8546142578125, -3.289794921875, -2.7249755859375, -2.16015625, -1.5953369140625, -1.030517578125, -0.4656982421875, 0.09912109375, 0.6639404296875, 1.228759765625, 1.7935791015625, 2.3583984375, 2.9232177734375, 3.488037109375, 4.0528564453125, 4.61767578125, 5.1824951171875, 5.747314453125, 6.3121337890625, 6.876953125, 7.4417724609375, 8.006591796875, 8.5714111328125, 9.13623046875, 9.7010498046875, 10.265869140625, 10.8306884765625, 11.3955078125, 11.9603271484375, 12.525146484375, 13.0899658203125, 13.65478515625, 14.2196044921875, 14.784423828125, 15.3492431640625, 15.9140625]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 0.0, 3.0, 5.0, 6.0, 13.0, 11.0, 17.0, 24.0, 44.0, 47.0, 71.0, 119.0, 157.0, 228.0, 353.0, 523.0, 809.0, 1341.0, 2367.0, 4309.0, 9355.0, 25477.0, 101787.0, 661113.0, 178840.0, 36654.0, 12319.0, 5421.0, 2760.0, 1540.0, 978.0, 623.0, 411.0, 252.0, 193.0, 113.0, 79.0, 69.0, 39.0, 25.0, 18.0, 14.0, 9.0, 8.0, 8.0, 1.0, 3.0, 6.0, 2.0, 1.0, 0.0, 1.0], "bins": [-22.890625, -22.24853515625, -21.6064453125, -20.96435546875, -20.322265625, -19.68017578125, -19.0380859375, -18.39599609375, -17.75390625, -17.11181640625, -16.4697265625, -15.82763671875, -15.185546875, -14.54345703125, -13.9013671875, -13.25927734375, -12.6171875, -11.97509765625, -11.3330078125, -10.69091796875, -10.048828125, -9.40673828125, -8.7646484375, -8.12255859375, -7.48046875, -6.83837890625, -6.1962890625, -5.55419921875, -4.912109375, -4.27001953125, -3.6279296875, -2.98583984375, -2.34375, -1.70166015625, -1.0595703125, -0.41748046875, 0.224609375, 0.86669921875, 1.5087890625, 2.15087890625, 2.79296875, 3.43505859375, 4.0771484375, 4.71923828125, 5.361328125, 6.00341796875, 6.6455078125, 7.28759765625, 7.9296875, 8.57177734375, 9.2138671875, 9.85595703125, 10.498046875, 11.14013671875, 11.7822265625, 12.42431640625, 13.06640625, 13.70849609375, 14.3505859375, 14.99267578125, 15.634765625, 16.27685546875, 16.9189453125, 17.56103515625, 18.203125]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 3.0, 4.0, 2.0, 2.0, 3.0, 3.0, 13.0, 6.0, 6.0, 16.0, 10.0, 16.0, 19.0, 12.0, 15.0, 30.0, 43.0, 35.0, 28.0, 49.0, 48.0, 48.0, 37.0, 55.0, 1755.0, 254.0, 54.0, 51.0, 31.0, 47.0, 45.0, 34.0, 43.0, 37.0, 26.0, 26.0, 21.0, 22.0, 9.0, 17.0, 13.0, 17.0, 11.0, 12.0, 3.0, 4.0, 4.0, 6.0, 4.0, 4.0, 0.0, 1.0, 1.0, 2.0], "bins": [-61.1875, -59.43603515625, -57.6845703125, -55.93310546875, -54.181640625, -52.43017578125, -50.6787109375, -48.92724609375, -47.17578125, -45.42431640625, -43.6728515625, -41.92138671875, -40.169921875, -38.41845703125, -36.6669921875, -34.91552734375, -33.1640625, -31.41259765625, -29.6611328125, -27.90966796875, -26.158203125, -24.40673828125, -22.6552734375, -20.90380859375, -19.15234375, -17.40087890625, -15.6494140625, -13.89794921875, -12.146484375, -10.39501953125, -8.6435546875, -6.89208984375, -5.140625, -3.38916015625, -1.6376953125, 0.11376953125, 1.865234375, 3.61669921875, 5.3681640625, 7.11962890625, 8.87109375, 10.62255859375, 12.3740234375, 14.12548828125, 15.876953125, 17.62841796875, 19.3798828125, 21.13134765625, 22.8828125, 24.63427734375, 26.3857421875, 28.13720703125, 29.888671875, 31.64013671875, 33.3916015625, 35.14306640625, 36.89453125, 38.64599609375, 40.3974609375, 42.14892578125, 43.900390625, 45.65185546875, 47.4033203125, 49.15478515625, 50.90625]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 9.0, 6.0, 11.0, 15.0, 20.0, 30.0, 27.0, 38.0, 60.0, 91.0, 132.0, 199.0, 400.0, 945.0, 2811.0, 12094.0, 153460.0, 2949834.0, 18988.0, 4142.0, 1219.0, 475.0, 238.0, 149.0, 96.0, 53.0, 43.0, 29.0, 23.0, 20.0, 13.0, 12.0, 3.0, 2.0, 5.0, 5.0, 5.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-181.625, -176.3046875, -170.984375, -165.6640625, -160.34375, -155.0234375, -149.703125, -144.3828125, -139.0625, -133.7421875, -128.421875, -123.1015625, -117.78125, -112.4609375, -107.140625, -101.8203125, -96.5, -91.1796875, -85.859375, -80.5390625, -75.21875, -69.8984375, -64.578125, -59.2578125, -53.9375, -48.6171875, -43.296875, -37.9765625, -32.65625, -27.3359375, -22.015625, -16.6953125, -11.375, -6.0546875, -0.734375, 4.5859375, 9.90625, 15.2265625, 20.546875, 25.8671875, 31.1875, 36.5078125, 41.828125, 47.1484375, 52.46875, 57.7890625, 63.109375, 68.4296875, 73.75, 79.0703125, 84.390625, 89.7109375, 95.03125, 100.3515625, 105.671875, 110.9921875, 116.3125, 121.6328125, 126.953125, 132.2734375, 137.59375, 142.9140625, 148.234375, 153.5546875, 158.875]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [12.0, 187.0, 778.0, 40.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.22724151611328, -38.65522766113281, -8.083213806152344, 22.488800048828125, 53.060813903808594, 83.6328353881836, 114.20484161376953, 144.77685546875, 175.348876953125, 205.9208984375, 236.49290466308594, 267.0649108886719, 297.6369323730469, 328.2089538574219, 358.78094482421875, 389.35296630859375, 419.92498779296875, 450.49700927734375, 481.06903076171875, 511.6410217285156, 542.2130126953125, 572.7850341796875, 603.3570556640625, 633.9290771484375, 664.5010986328125, 695.0731201171875, 725.6451416015625, 756.2171630859375, 786.7891845703125, 817.3612060546875, 847.9331665039062, 878.5051879882812, 909.0771484375, 939.649169921875, 970.22119140625, 1000.793212890625, 1031.365234375, 1061.937255859375, 1092.50927734375, 1123.081298828125, 1153.6533203125, 1184.225341796875, 1214.79736328125, 1245.369384765625, 1275.94140625, 1306.513427734375, 1337.08544921875, 1367.657470703125, 1398.2293701171875, 1428.8013916015625, 1459.3734130859375, 1489.9454345703125, 1520.5174560546875, 1551.0894775390625, 1581.6614990234375, 1612.2333984375, 1642.805419921875, 1673.37744140625, 1703.949462890625, 1734.521484375, 1765.093505859375, 1795.66552734375, 1826.237548828125, 1856.8095703125, 1887.381591796875]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 6.0, 8.0, 10.0, 9.0, 11.0, 9.0, 18.0, 16.0, 20.0, 20.0, 25.0, 31.0, 26.0, 34.0, 32.0, 43.0, 24.0, 37.0, 33.0, 38.0, 29.0, 40.0, 35.0, 32.0, 29.0, 32.0, 37.0, 33.0, 32.0, 38.0, 34.0, 33.0, 24.0, 17.0, 16.0, 10.0, 16.0, 17.0, 4.0, 11.0, 10.0, 6.0, 4.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-176.732421875, -171.211669921875, -165.69091796875, -160.17015075683594, -154.64939880371094, -149.12864685058594, -143.60787963867188, -138.08712768554688, -132.56637573242188, -127.04562377929688, -121.52486419677734, -116.00410461425781, -110.48335266113281, -104.96260070800781, -99.44184112548828, -93.92108154296875, -88.40032958984375, -82.87957763671875, -77.35881805419922, -71.83805847167969, -66.31730651855469, -60.79655075073242, -55.275794982910156, -49.75503921508789, -44.234283447265625, -38.71352767944336, -33.192771911621094, -27.672016143798828, -22.151260375976562, -16.630504608154297, -11.109748840332031, -5.588993072509766, -0.0682373046875, 5.452518463134766, 10.973274230957031, 16.494029998779297, 22.014785766601562, 27.535541534423828, 33.056297302246094, 38.57705307006836, 44.097808837890625, 49.61856460571289, 55.139320373535156, 60.66007614135742, 66.18083190917969, 71.70158386230469, 77.22234344482422, 82.74310302734375, 88.26385498046875, 93.78460693359375, 99.30536651611328, 104.82612609863281, 110.34687805175781, 115.86763000488281, 121.38838958740234, 126.90914916992188, 132.42990112304688, 137.95065307617188, 143.47140502929688, 148.99217224121094, 154.51292419433594, 160.03367614746094, 165.554443359375, 171.0751953125, 176.595947265625]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 9.0, 6.0, 10.0, 8.0, 14.0, 13.0, 18.0, 18.0, 25.0, 31.0, 22.0, 38.0, 50.0, 46.0, 50.0, 57.0, 48.0, 52.0, 48.0, 60.0, 46.0, 46.0, 44.0, 34.0, 28.0, 23.0, 35.0, 30.0, 15.0, 17.0, 16.0, 7.0, 10.0, 5.0, 7.0, 5.0, 6.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.59375, -20.987548828125, -20.38134765625, -19.775146484375, -19.1689453125, -18.562744140625, -17.95654296875, -17.350341796875, -16.744140625, -16.137939453125, -15.53173828125, -14.925537109375, -14.3193359375, -13.713134765625, -13.10693359375, -12.500732421875, -11.89453125, -11.288330078125, -10.68212890625, -10.075927734375, -9.4697265625, -8.863525390625, -8.25732421875, -7.651123046875, -7.044921875, -6.438720703125, -5.83251953125, -5.226318359375, -4.6201171875, -4.013916015625, -3.40771484375, -2.801513671875, -2.1953125, -1.589111328125, -0.98291015625, -0.376708984375, 0.2294921875, 0.835693359375, 1.44189453125, 2.048095703125, 2.654296875, 3.260498046875, 3.86669921875, 4.472900390625, 5.0791015625, 5.685302734375, 6.29150390625, 6.897705078125, 7.50390625, 8.110107421875, 8.71630859375, 9.322509765625, 9.9287109375, 10.534912109375, 11.14111328125, 11.747314453125, 12.353515625, 12.959716796875, 13.56591796875, 14.172119140625, 14.7783203125, 15.384521484375, 15.99072265625, 16.596923828125, 17.203125]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 4.0, 10.0, 10.0, 9.0, 14.0, 21.0, 27.0, 41.0, 66.0, 97.0, 140.0, 234.0, 394.0, 754.0, 1295.0, 2561.0, 5169.0, 12360.0, 35462.0, 2517678.0, 1562068.0, 33889.0, 11639.0, 4972.0, 2476.0, 1187.0, 737.0, 362.0, 208.0, 148.0, 91.0, 47.0, 47.0, 24.0, 14.0, 8.0, 6.0, 3.0, 3.0, 8.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-118.0, -114.7197265625, -111.439453125, -108.1591796875, -104.87890625, -101.5986328125, -98.318359375, -95.0380859375, -91.7578125, -88.4775390625, -85.197265625, -81.9169921875, -78.63671875, -75.3564453125, -72.076171875, -68.7958984375, -65.515625, -62.2353515625, -58.955078125, -55.6748046875, -52.39453125, -49.1142578125, -45.833984375, -42.5537109375, -39.2734375, -35.9931640625, -32.712890625, -29.4326171875, -26.15234375, -22.8720703125, -19.591796875, -16.3115234375, -13.03125, -9.7509765625, -6.470703125, -3.1904296875, 0.08984375, 3.3701171875, 6.650390625, 9.9306640625, 13.2109375, 16.4912109375, 19.771484375, 23.0517578125, 26.33203125, 29.6123046875, 32.892578125, 36.1728515625, 39.453125, 42.7333984375, 46.013671875, 49.2939453125, 52.57421875, 55.8544921875, 59.134765625, 62.4150390625, 65.6953125, 68.9755859375, 72.255859375, 75.5361328125, 78.81640625, 82.0966796875, 85.376953125, 88.6572265625, 91.9375]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 5.0, 0.0, 4.0, 6.0, 9.0, 17.0, 10.0, 7.0, 13.0, 17.0, 21.0, 26.0, 26.0, 41.0, 67.0, 154.0, 417.0, 1333.0, 1170.0, 368.0, 108.0, 55.0, 38.0, 33.0, 28.0, 20.0, 16.0, 15.0, 10.0, 6.0, 7.0, 8.0, 6.0, 7.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-67.4375, -65.10546875, -62.7734375, -60.44140625, -58.109375, -55.77734375, -53.4453125, -51.11328125, -48.78125, -46.44921875, -44.1171875, -41.78515625, -39.453125, -37.12109375, -34.7890625, -32.45703125, -30.125, -27.79296875, -25.4609375, -23.12890625, -20.796875, -18.46484375, -16.1328125, -13.80078125, -11.46875, -9.13671875, -6.8046875, -4.47265625, -2.140625, 0.19140625, 2.5234375, 4.85546875, 7.1875, 9.51953125, 11.8515625, 14.18359375, 16.515625, 18.84765625, 21.1796875, 23.51171875, 25.84375, 28.17578125, 30.5078125, 32.83984375, 35.171875, 37.50390625, 39.8359375, 42.16796875, 44.5, 46.83203125, 49.1640625, 51.49609375, 53.828125, 56.16015625, 58.4921875, 60.82421875, 63.15625, 65.48828125, 67.8203125, 70.15234375, 72.484375, 74.81640625, 77.1484375, 79.48046875, 81.8125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 4.0, 3.0, 5.0, 8.0, 5.0, 13.0, 18.0, 29.0, 41.0, 60.0, 86.0, 112.0, 160.0, 238.0, 356.0, 435.0, 687.0, 1057.0, 1679.0, 2587.0, 3975.0, 6574.0, 11113.0, 19682.0, 39225.0, 108633.0, 2953856.0, 887357.0, 79907.0, 32965.0, 17355.0, 9819.0, 5957.0, 3603.0, 2207.0, 1480.0, 924.0, 622.0, 457.0, 294.0, 191.0, 136.0, 87.0, 79.0, 45.0, 42.0, 32.0, 27.0, 19.0, 11.0, 9.0, 9.0, 7.0, 3.0, 2.0, 4.0, 0.0, 2.0], "bins": [-95.1875, -92.29296875, -89.3984375, -86.50390625, -83.609375, -80.71484375, -77.8203125, -74.92578125, -72.03125, -69.13671875, -66.2421875, -63.34765625, -60.453125, -57.55859375, -54.6640625, -51.76953125, -48.875, -45.98046875, -43.0859375, -40.19140625, -37.296875, -34.40234375, -31.5078125, -28.61328125, -25.71875, -22.82421875, -19.9296875, -17.03515625, -14.140625, -11.24609375, -8.3515625, -5.45703125, -2.5625, 0.33203125, 3.2265625, 6.12109375, 9.015625, 11.91015625, 14.8046875, 17.69921875, 20.59375, 23.48828125, 26.3828125, 29.27734375, 32.171875, 35.06640625, 37.9609375, 40.85546875, 43.75, 46.64453125, 49.5390625, 52.43359375, 55.328125, 58.22265625, 61.1171875, 64.01171875, 66.90625, 69.80078125, 72.6953125, 75.58984375, 78.484375, 81.37890625, 84.2734375, 87.16796875, 90.0625]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 6.0, 10.0, 8.0, 20.0, 37.0, 71.0, 93.0, 244.0, 250.0, 106.0, 71.0, 36.0, 19.0, 9.0, 6.0, 8.0, 4.0, 3.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-276.7287902832031, -262.95281982421875, -249.17681884765625, -235.40084838867188, -221.62484741210938, -207.848876953125, -194.07289123535156, -180.29690551757812, -166.5209197998047, -152.74493408203125, -138.9689483642578, -125.1929702758789, -111.41698455810547, -97.64099884033203, -83.86502075195312, -70.08903503417969, -56.31304931640625, -42.53706359863281, -28.76108169555664, -14.985099792480469, -1.2091140747070312, 12.566871643066406, 26.342849731445312, 40.11883544921875, 53.89482116699219, 67.67080688476562, 81.44679260253906, 95.22277069091797, 108.9987564086914, 122.77474212646484, 136.55072021484375, 150.3267059326172, 164.10272216796875, 177.8787078857422, 191.65469360351562, 205.4306640625, 219.2066650390625, 232.98263549804688, 246.7586212158203, 260.53460693359375, 274.31060791015625, 288.0865783691406, 301.8625793457031, 315.6385498046875, 329.41455078125, 343.1905212402344, 356.96649169921875, 370.74249267578125, 384.5184631347656, 398.29443359375, 412.0704345703125, 425.8464050292969, 439.6224060058594, 453.39837646484375, 467.17437744140625, 480.9503479003906, 494.726318359375, 508.5022888183594, 522.2782592773438, 536.0542602539062, 549.8302612304688, 563.6062622070312, 577.3822021484375, 591.158203125, 604.9342041015625]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 2.0, 5.0, 4.0, 7.0, 10.0, 11.0, 9.0, 11.0, 13.0, 14.0, 21.0, 27.0, 40.0, 24.0, 28.0, 35.0, 33.0, 38.0, 38.0, 42.0, 42.0, 47.0, 46.0, 45.0, 46.0, 32.0, 43.0, 27.0, 34.0, 25.0, 24.0, 27.0, 26.0, 19.0, 24.0, 19.0, 11.0, 10.0, 19.0, 5.0, 3.0, 4.0, 9.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-181.99717712402344, -176.496826171875, -170.99647521972656, -165.49612426757812, -159.9957733154297, -154.49542236328125, -148.99505615234375, -143.49472045898438, -137.99435424804688, -132.49400329589844, -126.99365234375, -121.49330139160156, -115.99295043945312, -110.49259948730469, -104.99224090576172, -99.49188995361328, -93.99154663085938, -88.49119567871094, -82.9908447265625, -77.49049377441406, -71.99014282226562, -66.48979187011719, -60.98943328857422, -55.48908233642578, -49.988731384277344, -44.488380432128906, -38.98802947998047, -33.487674713134766, -27.987323760986328, -22.48697280883789, -16.986618041992188, -11.48626708984375, -5.985931396484375, -0.4855794906616211, 5.014772415161133, 10.515125274658203, 16.01547622680664, 21.515827178955078, 27.01618194580078, 32.51653289794922, 38.016883850097656, 43.517234802246094, 49.01758575439453, 54.517940521240234, 60.01829147338867, 65.51864624023438, 71.01899719238281, 76.51934814453125, 82.01969909667969, 87.52005004882812, 93.02040100097656, 98.520751953125, 104.02110290527344, 109.52145385742188, 115.02181243896484, 120.52216339111328, 126.02251434326172, 131.5228729248047, 137.02322387695312, 142.52357482910156, 148.02392578125, 153.52427673339844, 159.02462768554688, 164.5249786376953, 170.02532958984375]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 3.0, 5.0, 2.0, 11.0, 7.0, 12.0, 10.0, 16.0, 9.0, 18.0, 23.0, 31.0, 26.0, 39.0, 34.0, 38.0, 40.0, 50.0, 50.0, 41.0, 42.0, 54.0, 60.0, 47.0, 26.0, 43.0, 24.0, 35.0, 25.0, 25.0, 29.0, 24.0, 18.0, 12.0, 19.0, 8.0, 11.0, 8.0, 9.0, 1.0, 2.0, 4.0, 7.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-19.890625, -19.3154296875, -18.740234375, -18.1650390625, -17.58984375, -17.0146484375, -16.439453125, -15.8642578125, -15.2890625, -14.7138671875, -14.138671875, -13.5634765625, -12.98828125, -12.4130859375, -11.837890625, -11.2626953125, -10.6875, -10.1123046875, -9.537109375, -8.9619140625, -8.38671875, -7.8115234375, -7.236328125, -6.6611328125, -6.0859375, -5.5107421875, -4.935546875, -4.3603515625, -3.78515625, -3.2099609375, -2.634765625, -2.0595703125, -1.484375, -0.9091796875, -0.333984375, 0.2412109375, 0.81640625, 1.3916015625, 1.966796875, 2.5419921875, 3.1171875, 3.6923828125, 4.267578125, 4.8427734375, 5.41796875, 5.9931640625, 6.568359375, 7.1435546875, 7.71875, 8.2939453125, 8.869140625, 9.4443359375, 10.01953125, 10.5947265625, 11.169921875, 11.7451171875, 12.3203125, 12.8955078125, 13.470703125, 14.0458984375, 14.62109375, 15.1962890625, 15.771484375, 16.3466796875, 16.921875]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 3.0, 18.0, 22.0, 26.0, 54.0, 65.0, 91.0, 145.0, 232.0, 313.0, 495.0, 700.0, 1087.0, 1548.0, 2395.0, 3713.0, 5612.0, 9082.0, 14475.0, 23921.0, 41916.0, 77279.0, 161972.0, 301917.0, 193403.0, 89581.0, 47337.0, 26969.0, 16218.0, 9925.0, 6142.0, 3991.0, 2665.0, 1712.0, 1154.0, 787.0, 496.0, 344.0, 238.0, 150.0, 121.0, 80.0, 47.0, 42.0, 28.0, 11.0, 12.0, 9.0, 4.0, 3.0, 5.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.92919921875, -0.9007034301757812, -0.8722076416015625, -0.8437118530273438, -0.815216064453125, -0.7867202758789062, -0.7582244873046875, -0.7297286987304688, -0.70123291015625, -0.6727371215820312, -0.6442413330078125, -0.6157455444335938, -0.587249755859375, -0.5587539672851562, -0.5302581787109375, -0.5017623901367188, -0.4732666015625, -0.44477081298828125, -0.4162750244140625, -0.38777923583984375, -0.359283447265625, -0.33078765869140625, -0.3022918701171875, -0.27379608154296875, -0.24530029296875, -0.21680450439453125, -0.1883087158203125, -0.15981292724609375, -0.131317138671875, -0.10282135009765625, -0.0743255615234375, -0.04582977294921875, -0.017333984375, 0.01116180419921875, 0.0396575927734375, 0.06815338134765625, 0.096649169921875, 0.12514495849609375, 0.1536407470703125, 0.18213653564453125, 0.21063232421875, 0.23912811279296875, 0.2676239013671875, 0.29611968994140625, 0.324615478515625, 0.35311126708984375, 0.3816070556640625, 0.41010284423828125, 0.4385986328125, 0.46709442138671875, 0.4955902099609375, 0.5240859985351562, 0.552581787109375, 0.5810775756835938, 0.6095733642578125, 0.6380691528320312, 0.66656494140625, 0.6950607299804688, 0.7235565185546875, 0.7520523071289062, 0.780548095703125, 0.8090438842773438, 0.8375396728515625, 0.8660354614257812, 0.89453125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 2.0, 4.0, 7.0, 4.0, 7.0, 6.0, 11.0, 13.0, 18.0, 16.0, 26.0, 17.0, 23.0, 24.0, 50.0, 28.0, 31.0, 34.0, 35.0, 29.0, 33.0, 39.0, 1071.0, 36.0, 40.0, 41.0, 34.0, 33.0, 36.0, 32.0, 38.0, 27.0, 29.0, 23.0, 23.0, 21.0, 15.0, 14.0, 9.0, 4.0, 10.0, 12.0, 4.0, 7.0, 6.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-10.2578125, -9.933837890625, -9.60986328125, -9.285888671875, -8.9619140625, -8.637939453125, -8.31396484375, -7.989990234375, -7.666015625, -7.342041015625, -7.01806640625, -6.694091796875, -6.3701171875, -6.046142578125, -5.72216796875, -5.398193359375, -5.07421875, -4.750244140625, -4.42626953125, -4.102294921875, -3.7783203125, -3.454345703125, -3.13037109375, -2.806396484375, -2.482421875, -2.158447265625, -1.83447265625, -1.510498046875, -1.1865234375, -0.862548828125, -0.53857421875, -0.214599609375, 0.109375, 0.433349609375, 0.75732421875, 1.081298828125, 1.4052734375, 1.729248046875, 2.05322265625, 2.377197265625, 2.701171875, 3.025146484375, 3.34912109375, 3.673095703125, 3.9970703125, 4.321044921875, 4.64501953125, 4.968994140625, 5.29296875, 5.616943359375, 5.94091796875, 6.264892578125, 6.5888671875, 6.912841796875, 7.23681640625, 7.560791015625, 7.884765625, 8.208740234375, 8.53271484375, 8.856689453125, 9.1806640625, 9.504638671875, 9.82861328125, 10.152587890625, 10.4765625]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [5.0, 3.0, 6.0, 9.0, 15.0, 10.0, 24.0, 19.0, 44.0, 67.0, 104.0, 158.0, 171.0, 271.0, 342.0, 485.0, 726.0, 948.0, 1389.0, 1833.0, 2563.0, 3682.0, 5106.0, 6997.0, 10235.0, 14593.0, 21067.0, 31115.0, 46949.0, 72699.0, 119143.0, 1206601.0, 228935.0, 111091.0, 68378.0, 44141.0, 29724.0, 20043.0, 13853.0, 9694.0, 6826.0, 4797.0, 3459.0, 2500.0, 1776.0, 1278.0, 902.0, 730.0, 469.0, 353.0, 248.0, 160.0, 124.0, 81.0, 76.0, 40.0, 33.0, 25.0, 15.0, 9.0, 4.0, 6.0, 1.0, 2.0], "bins": [-0.5966796875, -0.5779953002929688, -0.5593109130859375, -0.5406265258789062, -0.521942138671875, -0.5032577514648438, -0.4845733642578125, -0.46588897705078125, -0.44720458984375, -0.42852020263671875, -0.4098358154296875, -0.39115142822265625, -0.372467041015625, -0.35378265380859375, -0.3350982666015625, -0.31641387939453125, -0.2977294921875, -0.27904510498046875, -0.2603607177734375, -0.24167633056640625, -0.222991943359375, -0.20430755615234375, -0.1856231689453125, -0.16693878173828125, -0.14825439453125, -0.12957000732421875, -0.1108856201171875, -0.09220123291015625, -0.073516845703125, -0.05483245849609375, -0.0361480712890625, -0.01746368408203125, 0.001220703125, 0.01990509033203125, 0.0385894775390625, 0.05727386474609375, 0.075958251953125, 0.09464263916015625, 0.1133270263671875, 0.13201141357421875, 0.15069580078125, 0.16938018798828125, 0.1880645751953125, 0.20674896240234375, 0.225433349609375, 0.24411773681640625, 0.2628021240234375, 0.28148651123046875, 0.3001708984375, 0.31885528564453125, 0.3375396728515625, 0.35622406005859375, 0.374908447265625, 0.39359283447265625, 0.4122772216796875, 0.43096160888671875, 0.44964599609375, 0.46833038330078125, 0.4870147705078125, 0.5056991577148438, 0.524383544921875, 0.5430679321289062, 0.5617523193359375, 0.5804367065429688, 0.59912109375]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 4.0, 4.0, 5.0, 8.0, 10.0, 7.0, 14.0, 19.0, 15.0, 17.0, 28.0, 25.0, 34.0, 37.0, 43.0, 52.0, 59.0, 51.0, 44.0, 62.0, 51.0, 58.0, 48.0, 44.0, 42.0, 44.0, 33.0, 23.0, 22.0, 20.0, 13.0, 13.0, 12.0, 6.0, 16.0, 5.0, 6.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0024890899658203125, -0.0024011433124542236, -0.0023131966590881348, -0.002225250005722046, -0.002137303352355957, -0.002049356698989868, -0.0019614100456237793, -0.0018734633922576904, -0.0017855167388916016, -0.0016975700855255127, -0.0016096234321594238, -0.001521676778793335, -0.001433730125427246, -0.0013457834720611572, -0.0012578368186950684, -0.0011698901653289795, -0.0010819435119628906, -0.0009939968585968018, -0.0009060502052307129, -0.000818103551864624, -0.0007301568984985352, -0.0006422102451324463, -0.0005542635917663574, -0.00046631693840026855, -0.0003783702850341797, -0.0002904236316680908, -0.00020247697830200195, -0.00011453032493591309, -2.658367156982422e-05, 6.136298179626465e-05, 0.00014930963516235352, 0.00023725628852844238, 0.00032520294189453125, 0.0004131495952606201, 0.000501096248626709, 0.0005890429019927979, 0.0006769895553588867, 0.0007649362087249756, 0.0008528828620910645, 0.0009408295154571533, 0.0010287761688232422, 0.001116722822189331, 0.00120466947555542, 0.0012926161289215088, 0.0013805627822875977, 0.0014685094356536865, 0.0015564560890197754, 0.0016444027423858643, 0.0017323493957519531, 0.001820296049118042, 0.0019082427024841309, 0.0019961893558502197, 0.0020841360092163086, 0.0021720826625823975, 0.0022600293159484863, 0.002347975969314575, 0.002435922622680664, 0.002523869276046753, 0.002611815929412842, 0.0026997625827789307, 0.0027877092361450195, 0.0028756558895111084, 0.0029636025428771973, 0.003051549196243286, 0.003139495849609375]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 3.0, 3.0, 4.0, 3.0, 10.0, 10.0, 21.0, 23.0, 18.0, 35.0, 40.0, 64.0, 86.0, 76.0, 117.0, 156.0, 218.0, 376.0, 1117.0, 12674.0, 534965.0, 484375.0, 11746.0, 1118.0, 353.0, 229.0, 182.0, 121.0, 96.0, 76.0, 42.0, 54.0, 31.0, 16.0, 16.0, 24.0, 18.0, 13.0, 11.0, 3.0, 4.0, 8.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.052032470703125, -0.050586700439453125, -0.04914093017578125, -0.047695159912109375, -0.0462493896484375, -0.044803619384765625, -0.04335784912109375, -0.041912078857421875, -0.04046630859375, -0.039020538330078125, -0.03757476806640625, -0.036128997802734375, -0.0346832275390625, -0.033237457275390625, -0.03179168701171875, -0.030345916748046875, -0.028900146484375, -0.027454376220703125, -0.02600860595703125, -0.024562835693359375, -0.0231170654296875, -0.021671295166015625, -0.02022552490234375, -0.018779754638671875, -0.017333984375, -0.015888214111328125, -0.01444244384765625, -0.012996673583984375, -0.0115509033203125, -0.010105133056640625, -0.00865936279296875, -0.007213592529296875, -0.005767822265625, -0.004322052001953125, -0.00287628173828125, -0.001430511474609375, 1.52587890625e-05, 0.001461029052734375, 0.00290679931640625, 0.004352569580078125, 0.00579833984375, 0.007244110107421875, 0.00868988037109375, 0.010135650634765625, 0.0115814208984375, 0.013027191162109375, 0.01447296142578125, 0.015918731689453125, 0.017364501953125, 0.018810272216796875, 0.02025604248046875, 0.021701812744140625, 0.0231475830078125, 0.024593353271484375, 0.02603912353515625, 0.027484893798828125, 0.0289306640625, 0.030376434326171875, 0.03182220458984375, 0.033267974853515625, 0.0347137451171875, 0.036159515380859375, 0.03760528564453125, 0.039051055908203125, 0.040496826171875]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 13.0, 41.0, 157.0, 527.0, 204.0, 54.0, 16.0, 4.0, 1.0], "bins": [-0.020976660773158073, -0.020618431270122528, -0.020260199904441833, -0.019901970401406288, -0.019543740898370743, -0.019185509532690048, -0.018827280029654503, -0.018469050526618958, -0.018110821023583412, -0.017752591520547867, -0.017394360154867172, -0.017036130651831627, -0.01667790114879608, -0.016319669783115387, -0.01596144028007984, -0.015603210777044296, -0.015244979411363602, -0.014886748977005482, -0.014528519473969936, -0.014170289039611816, -0.013812059536576271, -0.013453829102218151, -0.013095598667860031, -0.012737369164824486, -0.01237913966178894, -0.01202090922743082, -0.011662679724395275, -0.011304449290037155, -0.01094621978700161, -0.01058798935264349, -0.01022975891828537, -0.009871529415249825, -0.009513298980891705, -0.009155068546533585, -0.00879683904349804, -0.00843860860913992, -0.008080379106104374, -0.007722148671746254, -0.007363918703049421, -0.007005688734352589, -0.006647458299994469, -0.006289228331297636, -0.005930998362600803, -0.005572767928242683, -0.005214537959545851, -0.004856307990849018, -0.0044980780221521854, -0.004139848053455353, -0.003781617619097233, -0.0034233876504004, -0.003065157448872924, -0.002706927480176091, -0.002348697278648615, -0.0019904673099517822, -0.0016322373412549496, -0.0012740071397274733, -0.0009157772874459624, -0.0005575472023338079, -0.00019931717542931437, 0.0001589128514751792, 0.0005171429365873337, 0.0008753730216994882, 0.0012336029903963208, 0.0015918331919237971, 0.0019500631606206298]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 5.0, 1.0, 9.0, 8.0, 5.0, 4.0, 12.0, 8.0, 17.0, 23.0, 20.0, 19.0, 19.0, 27.0, 17.0, 28.0, 34.0, 36.0, 37.0, 30.0, 38.0, 36.0, 44.0, 38.0, 40.0, 45.0, 34.0, 32.0, 38.0, 33.0, 34.0, 22.0, 26.0, 23.0, 18.0, 18.0, 23.0, 21.0, 18.0, 13.0, 10.0, 7.0, 5.0, 9.0, 6.0, 9.0, 0.0, 3.0, 6.0, 4.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.0015026330947875977, -0.0014580637216567993, -0.001413494348526001, -0.0013689249753952026, -0.0013243556022644043, -0.001279786229133606, -0.0012352168560028076, -0.0011906474828720093, -0.001146078109741211, -0.0011015087366104126, -0.0010569393634796143, -0.001012369990348816, -0.0009678006172180176, -0.0009232312440872192, -0.0008786618709564209, -0.0008340924978256226, -0.0007895231246948242, -0.0007449537515640259, -0.0007003843784332275, -0.0006558150053024292, -0.0006112456321716309, -0.0005666762590408325, -0.0005221068859100342, -0.00047753751277923584, -0.0004329681396484375, -0.00038839876651763916, -0.0003438293933868408, -0.0002992600202560425, -0.00025469064712524414, -0.0002101212739944458, -0.00016555190086364746, -0.00012098252773284912, -7.641315460205078e-05, -3.184378147125244e-05, 1.2725591659545898e-05, 5.729496479034424e-05, 0.00010186433792114258, 0.00014643371105194092, 0.00019100308418273926, 0.0002355724573135376, 0.00028014183044433594, 0.0003247112035751343, 0.0003692805767059326, 0.00041384994983673096, 0.0004584193229675293, 0.0005029886960983276, 0.000547558069229126, 0.0005921274423599243, 0.0006366968154907227, 0.000681266188621521, 0.0007258355617523193, 0.0007704049348831177, 0.000814974308013916, 0.0008595436811447144, 0.0009041130542755127, 0.000948682427406311, 0.0009932518005371094, 0.0010378211736679077, 0.001082390546798706, 0.0011269599199295044, 0.0011715292930603027, 0.001216098666191101, 0.0012606680393218994, 0.0013052374124526978, 0.001349806785583496]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 3.0, 5.0, 2.0, 11.0, 7.0, 12.0, 10.0, 16.0, 9.0, 18.0, 23.0, 31.0, 26.0, 39.0, 34.0, 38.0, 40.0, 50.0, 50.0, 41.0, 42.0, 54.0, 60.0, 47.0, 26.0, 43.0, 24.0, 35.0, 25.0, 25.0, 29.0, 24.0, 18.0, 12.0, 19.0, 8.0, 11.0, 8.0, 9.0, 1.0, 2.0, 4.0, 7.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-19.890625, -19.3154296875, -18.740234375, -18.1650390625, -17.58984375, -17.0146484375, -16.439453125, -15.8642578125, -15.2890625, -14.7138671875, -14.138671875, -13.5634765625, -12.98828125, -12.4130859375, -11.837890625, -11.2626953125, -10.6875, -10.1123046875, -9.537109375, -8.9619140625, -8.38671875, -7.8115234375, -7.236328125, -6.6611328125, -6.0859375, -5.5107421875, -4.935546875, -4.3603515625, -3.78515625, -3.2099609375, -2.634765625, -2.0595703125, -1.484375, -0.9091796875, -0.333984375, 0.2412109375, 0.81640625, 1.3916015625, 1.966796875, 2.5419921875, 3.1171875, 3.6923828125, 4.267578125, 4.8427734375, 5.41796875, 5.9931640625, 6.568359375, 7.1435546875, 7.71875, 8.2939453125, 8.869140625, 9.4443359375, 10.01953125, 10.5947265625, 11.169921875, 11.7451171875, 12.3203125, 12.8955078125, 13.470703125, 14.0458984375, 14.62109375, 15.1962890625, 15.771484375, 16.3466796875, 16.921875]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 7.0, 6.0, 11.0, 16.0, 21.0, 27.0, 37.0, 48.0, 69.0, 101.0, 162.0, 183.0, 258.0, 399.0, 601.0, 922.0, 1533.0, 2549.0, 4570.0, 8604.0, 17594.0, 40294.0, 107310.0, 447846.0, 275244.0, 77736.0, 31252.0, 14269.0, 7135.0, 3743.0, 2134.0, 1311.0, 804.0, 530.0, 349.0, 235.0, 176.0, 133.0, 91.0, 66.0, 48.0, 31.0, 25.0, 32.0, 14.0, 9.0, 9.0, 3.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.9453125, -9.633056640625, -9.32080078125, -9.008544921875, -8.6962890625, -8.384033203125, -8.07177734375, -7.759521484375, -7.447265625, -7.135009765625, -6.82275390625, -6.510498046875, -6.1982421875, -5.885986328125, -5.57373046875, -5.261474609375, -4.94921875, -4.636962890625, -4.32470703125, -4.012451171875, -3.7001953125, -3.387939453125, -3.07568359375, -2.763427734375, -2.451171875, -2.138916015625, -1.82666015625, -1.514404296875, -1.2021484375, -0.889892578125, -0.57763671875, -0.265380859375, 0.046875, 0.359130859375, 0.67138671875, 0.983642578125, 1.2958984375, 1.608154296875, 1.92041015625, 2.232666015625, 2.544921875, 2.857177734375, 3.16943359375, 3.481689453125, 3.7939453125, 4.106201171875, 4.41845703125, 4.730712890625, 5.04296875, 5.355224609375, 5.66748046875, 5.979736328125, 6.2919921875, 6.604248046875, 6.91650390625, 7.228759765625, 7.541015625, 7.853271484375, 8.16552734375, 8.477783203125, 8.7900390625, 9.102294921875, 9.41455078125, 9.726806640625, 10.0390625]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 9.0, 3.0, 2.0, 4.0, 9.0, 5.0, 11.0, 15.0, 14.0, 14.0, 21.0, 25.0, 16.0, 25.0, 27.0, 38.0, 33.0, 46.0, 40.0, 53.0, 53.0, 61.0, 154.0, 1867.0, 64.0, 44.0, 45.0, 39.0, 37.0, 36.0, 37.0, 39.0, 28.0, 20.0, 23.0, 16.0, 14.0, 16.0, 8.0, 9.0, 4.0, 8.0, 5.0, 3.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-60.03125, -58.103515625, -56.17578125, -54.248046875, -52.3203125, -50.392578125, -48.46484375, -46.537109375, -44.609375, -42.681640625, -40.75390625, -38.826171875, -36.8984375, -34.970703125, -33.04296875, -31.115234375, -29.1875, -27.259765625, -25.33203125, -23.404296875, -21.4765625, -19.548828125, -17.62109375, -15.693359375, -13.765625, -11.837890625, -9.91015625, -7.982421875, -6.0546875, -4.126953125, -2.19921875, -0.271484375, 1.65625, 3.583984375, 5.51171875, 7.439453125, 9.3671875, 11.294921875, 13.22265625, 15.150390625, 17.078125, 19.005859375, 20.93359375, 22.861328125, 24.7890625, 26.716796875, 28.64453125, 30.572265625, 32.5, 34.427734375, 36.35546875, 38.283203125, 40.2109375, 42.138671875, 44.06640625, 45.994140625, 47.921875, 49.849609375, 51.77734375, 53.705078125, 55.6328125, 57.560546875, 59.48828125, 61.416015625, 63.34375]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 5.0, 9.0, 4.0, 15.0, 21.0, 29.0, 57.0, 92.0, 167.0, 409.0, 1114.0, 3520.0, 12675.0, 3043126.0, 73038.0, 7821.0, 2182.0, 784.0, 283.0, 125.0, 83.0, 32.0, 29.0, 21.0, 14.0, 9.0, 13.0, 11.0, 6.0, 4.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-167.375, -161.56640625, -155.7578125, -149.94921875, -144.140625, -138.33203125, -132.5234375, -126.71484375, -120.90625, -115.09765625, -109.2890625, -103.48046875, -97.671875, -91.86328125, -86.0546875, -80.24609375, -74.4375, -68.62890625, -62.8203125, -57.01171875, -51.203125, -45.39453125, -39.5859375, -33.77734375, -27.96875, -22.16015625, -16.3515625, -10.54296875, -4.734375, 1.07421875, 6.8828125, 12.69140625, 18.5, 24.30859375, 30.1171875, 35.92578125, 41.734375, 47.54296875, 53.3515625, 59.16015625, 64.96875, 70.77734375, 76.5859375, 82.39453125, 88.203125, 94.01171875, 99.8203125, 105.62890625, 111.4375, 117.24609375, 123.0546875, 128.86328125, 134.671875, 140.48046875, 146.2890625, 152.09765625, 157.90625, 163.71484375, 169.5234375, 175.33203125, 181.140625, 186.94921875, 192.7578125, 198.56640625, 204.375]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 16.0, 970.0, 34.0], "bins": [-3499.896240234375, -3443.91357421875, -3387.930908203125, -3331.9482421875, -3275.965576171875, -3219.98291015625, -3164.00048828125, -3108.017578125, -3052.03515625, -2996.052490234375, -2940.06982421875, -2884.087158203125, -2828.1044921875, -2772.121826171875, -2716.13916015625, -2660.15673828125, -2604.173828125, -2548.191162109375, -2492.20849609375, -2436.225830078125, -2380.2431640625, -2324.260498046875, -2268.27783203125, -2212.29541015625, -2156.312744140625, -2100.330078125, -2044.347412109375, -1988.36474609375, -1932.3822021484375, -1876.3995361328125, -1820.4168701171875, -1764.4342041015625, -1708.4515380859375, -1652.4688720703125, -1596.4862060546875, -1540.503662109375, -1484.52099609375, -1428.538330078125, -1372.5556640625, -1316.572998046875, -1260.59033203125, -1204.607666015625, -1148.625, -1092.642333984375, -1036.6597900390625, -980.6771240234375, -924.6944580078125, -868.7117919921875, -812.7291870117188, -756.7465209960938, -700.763916015625, -644.78125, -588.798583984375, -532.81591796875, -476.83331298828125, -420.85064697265625, -364.8680419921875, -308.8854064941406, -252.90274047851562, -196.92010498046875, -140.9374542236328, -84.95480346679688, -28.97216796875, 27.010498046875, 82.9931411743164]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 4.0, 6.0, 3.0, 9.0, 11.0, 11.0, 10.0, 19.0, 15.0, 15.0, 19.0, 20.0, 17.0, 26.0, 34.0, 32.0, 35.0, 45.0, 41.0, 42.0, 48.0, 41.0, 35.0, 40.0, 37.0, 44.0, 37.0, 28.0, 22.0, 32.0, 26.0, 34.0, 21.0, 31.0, 15.0, 27.0, 13.0, 14.0, 11.0, 4.0, 7.0, 4.0, 11.0, 2.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-220.40110778808594, -213.7253875732422, -207.04966735839844, -200.3739471435547, -193.69822692871094, -187.0225067138672, -180.34677124023438, -173.67105102539062, -166.99533081054688, -160.31961059570312, -153.64389038085938, -146.96817016601562, -140.29244995117188, -133.61672973632812, -126.94100189208984, -120.2652816772461, -113.58956909179688, -106.91384887695312, -100.23812866210938, -93.56240844726562, -86.88668823242188, -80.21096801757812, -73.53524017333984, -66.8595199584961, -60.183799743652344, -53.508079528808594, -46.832359313964844, -40.15663528442383, -33.48091506958008, -26.805194854736328, -20.129470825195312, -13.453750610351562, -6.778045654296875, -0.1023244857788086, 6.573396682739258, 13.24911880493164, 19.92483901977539, 26.60055923461914, 33.276283264160156, 39.952003479003906, 46.627723693847656, 53.303443908691406, 59.979164123535156, 66.65489196777344, 73.33061218261719, 80.00633239746094, 86.68205261230469, 93.35777282714844, 100.03349304199219, 106.70921325683594, 113.38493347167969, 120.06065368652344, 126.73637390136719, 133.41209411621094, 140.08782958984375, 146.7635498046875, 153.43927001953125, 160.114990234375, 166.79071044921875, 173.4664306640625, 180.14215087890625, 186.81787109375, 193.49359130859375, 200.1693115234375, 206.84503173828125]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 1.0, 2.0, 5.0, 3.0, 2.0, 7.0, 4.0, 8.0, 8.0, 11.0, 16.0, 13.0, 10.0, 16.0, 28.0, 29.0, 27.0, 40.0, 41.0, 39.0, 40.0, 38.0, 51.0, 52.0, 46.0, 53.0, 47.0, 42.0, 39.0, 37.0, 28.0, 33.0, 29.0, 16.0, 29.0, 32.0, 13.0, 10.0, 9.0, 12.0, 13.0, 6.0, 9.0, 5.0, 1.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0], "bins": [-21.3125, -20.725341796875, -20.13818359375, -19.551025390625, -18.9638671875, -18.376708984375, -17.78955078125, -17.202392578125, -16.615234375, -16.028076171875, -15.44091796875, -14.853759765625, -14.2666015625, -13.679443359375, -13.09228515625, -12.505126953125, -11.91796875, -11.330810546875, -10.74365234375, -10.156494140625, -9.5693359375, -8.982177734375, -8.39501953125, -7.807861328125, -7.220703125, -6.633544921875, -6.04638671875, -5.459228515625, -4.8720703125, -4.284912109375, -3.69775390625, -3.110595703125, -2.5234375, -1.936279296875, -1.34912109375, -0.761962890625, -0.1748046875, 0.412353515625, 0.99951171875, 1.586669921875, 2.173828125, 2.760986328125, 3.34814453125, 3.935302734375, 4.5224609375, 5.109619140625, 5.69677734375, 6.283935546875, 6.87109375, 7.458251953125, 8.04541015625, 8.632568359375, 9.2197265625, 9.806884765625, 10.39404296875, 10.981201171875, 11.568359375, 12.155517578125, 12.74267578125, 13.329833984375, 13.9169921875, 14.504150390625, 15.09130859375, 15.678466796875, 16.265625]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 4.0, 5.0, 11.0, 17.0, 12.0, 22.0, 19.0, 47.0, 55.0, 69.0, 103.0, 135.0, 174.0, 277.0, 375.0, 542.0, 779.0, 1071.0, 1654.0, 2557.0, 3871.0, 6406.0, 11118.0, 21404.0, 87938.0, 3270350.0, 705252.0, 39485.0, 16059.0, 8844.0, 5352.0, 3339.0, 2152.0, 1477.0, 964.0, 682.0, 521.0, 343.0, 231.0, 166.0, 113.0, 92.0, 66.0, 41.0, 24.0, 21.0, 19.0, 15.0, 6.0, 5.0, 3.0, 2.0, 4.0], "bins": [-71.8125, -69.861328125, -67.91015625, -65.958984375, -64.0078125, -62.056640625, -60.10546875, -58.154296875, -56.203125, -54.251953125, -52.30078125, -50.349609375, -48.3984375, -46.447265625, -44.49609375, -42.544921875, -40.59375, -38.642578125, -36.69140625, -34.740234375, -32.7890625, -30.837890625, -28.88671875, -26.935546875, -24.984375, -23.033203125, -21.08203125, -19.130859375, -17.1796875, -15.228515625, -13.27734375, -11.326171875, -9.375, -7.423828125, -5.47265625, -3.521484375, -1.5703125, 0.380859375, 2.33203125, 4.283203125, 6.234375, 8.185546875, 10.13671875, 12.087890625, 14.0390625, 15.990234375, 17.94140625, 19.892578125, 21.84375, 23.794921875, 25.74609375, 27.697265625, 29.6484375, 31.599609375, 33.55078125, 35.501953125, 37.453125, 39.404296875, 41.35546875, 43.306640625, 45.2578125, 47.208984375, 49.16015625, 51.111328125, 53.0625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 8.0, 6.0, 8.0, 10.0, 18.0, 18.0, 34.0, 26.0, 44.0, 62.0, 148.0, 546.0, 1935.0, 802.0, 162.0, 67.0, 50.0, 23.0, 21.0, 16.0, 12.0, 12.0, 16.0, 9.0, 10.0, 8.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.6875, -72.73046875, -69.7734375, -66.81640625, -63.859375, -60.90234375, -57.9453125, -54.98828125, -52.03125, -49.07421875, -46.1171875, -43.16015625, -40.203125, -37.24609375, -34.2890625, -31.33203125, -28.375, -25.41796875, -22.4609375, -19.50390625, -16.546875, -13.58984375, -10.6328125, -7.67578125, -4.71875, -1.76171875, 1.1953125, 4.15234375, 7.109375, 10.06640625, 13.0234375, 15.98046875, 18.9375, 21.89453125, 24.8515625, 27.80859375, 30.765625, 33.72265625, 36.6796875, 39.63671875, 42.59375, 45.55078125, 48.5078125, 51.46484375, 54.421875, 57.37890625, 60.3359375, 63.29296875, 66.25, 69.20703125, 72.1640625, 75.12109375, 78.078125, 81.03515625, 83.9921875, 86.94921875, 89.90625, 92.86328125, 95.8203125, 98.77734375, 101.734375, 104.69140625, 107.6484375, 110.60546875, 113.5625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 1.0, 0.0, 4.0, 4.0, 8.0, 10.0, 16.0, 32.0, 39.0, 55.0, 96.0, 171.0, 296.0, 697.0, 1630.0, 4104.0, 11374.0, 32198.0, 150688.0, 3838907.0, 110372.0, 27130.0, 9814.0, 3790.0, 1535.0, 613.0, 304.0, 144.0, 89.0, 44.0, 37.0, 29.0, 17.0, 17.0, 8.0, 10.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-208.0, -202.587890625, -197.17578125, -191.763671875, -186.3515625, -180.939453125, -175.52734375, -170.115234375, -164.703125, -159.291015625, -153.87890625, -148.466796875, -143.0546875, -137.642578125, -132.23046875, -126.818359375, -121.40625, -115.994140625, -110.58203125, -105.169921875, -99.7578125, -94.345703125, -88.93359375, -83.521484375, -78.109375, -72.697265625, -67.28515625, -61.873046875, -56.4609375, -51.048828125, -45.63671875, -40.224609375, -34.8125, -29.400390625, -23.98828125, -18.576171875, -13.1640625, -7.751953125, -2.33984375, 3.072265625, 8.484375, 13.896484375, 19.30859375, 24.720703125, 30.1328125, 35.544921875, 40.95703125, 46.369140625, 51.78125, 57.193359375, 62.60546875, 68.017578125, 73.4296875, 78.841796875, 84.25390625, 89.666015625, 95.078125, 100.490234375, 105.90234375, 111.314453125, 116.7265625, 122.138671875, 127.55078125, 132.962890625, 138.375]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 1.0, 12.0, 4.0, 12.0, 11.0, 21.0, 35.0, 54.0, 70.0, 151.0, 242.0, 150.0, 78.0, 42.0, 38.0, 22.0, 20.0, 12.0, 11.0, 5.0, 0.0, 6.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-408.8102722167969, -398.4637756347656, -388.1172790527344, -377.77081298828125, -367.42431640625, -357.07781982421875, -346.7313232421875, -336.38482666015625, -326.0383605957031, -315.6918640136719, -305.3453674316406, -294.9989013671875, -284.65240478515625, -274.305908203125, -263.95941162109375, -253.61293029785156, -243.2664337158203, -232.91993713378906, -222.57345581054688, -212.22695922851562, -201.88047790527344, -191.5339813232422, -181.1875, -170.84100341796875, -160.4945068359375, -150.14801025390625, -139.80152893066406, -129.4550323486328, -119.10855102539062, -108.76205444335938, -98.41556549072266, -88.06907653808594, -77.72257995605469, -67.37609100341797, -57.02960205078125, -46.683109283447266, -36.33662033081055, -25.990131378173828, -15.643638610839844, -5.297149658203125, 5.049339294433594, 15.395829200744629, 25.742319107055664, 36.088809967041016, 46.435298919677734, 56.78178787231445, 67.12828063964844, 77.47476959228516, 87.82125854492188, 98.1677474975586, 108.51423645019531, 118.86073303222656, 129.20721435546875, 139.5537109375, 149.90020751953125, 160.24668884277344, 170.59317016601562, 180.93966674804688, 191.28614807128906, 201.6326446533203, 211.9791259765625, 222.32562255859375, 232.672119140625, 243.0186004638672, 253.36509704589844]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 3.0, 7.0, 4.0, 4.0, 7.0, 9.0, 11.0, 10.0, 14.0, 11.0, 24.0, 11.0, 22.0, 23.0, 31.0, 33.0, 40.0, 36.0, 40.0, 52.0, 45.0, 31.0, 37.0, 43.0, 37.0, 44.0, 45.0, 42.0, 35.0, 38.0, 38.0, 24.0, 25.0, 19.0, 13.0, 17.0, 16.0, 11.0, 15.0, 9.0, 8.0, 7.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-174.0596923828125, -168.74830627441406, -163.43692016601562, -158.12551879882812, -152.8141326904297, -147.50274658203125, -142.1913604736328, -136.87997436523438, -131.56857299804688, -126.25718688964844, -120.94579315185547, -115.63440704345703, -110.32301330566406, -105.01162719726562, -99.70024108886719, -94.38885498046875, -89.07746887207031, -83.76608276367188, -78.4546890258789, -73.14330291748047, -67.8319091796875, -62.52052307128906, -57.209136962890625, -51.89774703979492, -46.58635711669922, -41.274967193603516, -35.96357727050781, -30.652191162109375, -25.340801239013672, -20.02941131591797, -14.718023300170898, -9.406635284423828, -4.095245361328125, 1.2161436080932617, 6.527532577514648, 11.838921546936035, 17.150310516357422, 22.461700439453125, 27.773088455200195, 33.084476470947266, 38.39586639404297, 43.70725631713867, 49.018646240234375, 54.33003234863281, 59.641422271728516, 64.95281219482422, 70.26419830322266, 75.57559204101562, 80.88697814941406, 86.1983642578125, 91.50975799560547, 96.8211441040039, 102.13253784179688, 107.44392395019531, 112.75531005859375, 118.06669616699219, 123.37808990478516, 128.68948364257812, 134.00086975097656, 139.312255859375, 144.62364196777344, 149.93502807617188, 155.24642944335938, 160.5578155517578, 165.86920166015625]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 5.0, 4.0, 6.0, 5.0, 4.0, 20.0, 11.0, 15.0, 13.0, 16.0, 28.0, 31.0, 28.0, 24.0, 42.0, 35.0, 50.0, 44.0, 48.0, 58.0, 53.0, 48.0, 37.0, 46.0, 45.0, 43.0, 40.0, 27.0, 35.0, 31.0, 18.0, 15.0, 17.0, 6.0, 9.0, 7.0, 12.0, 9.0, 7.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.75, -20.103271484375, -19.45654296875, -18.809814453125, -18.1630859375, -17.516357421875, -16.86962890625, -16.222900390625, -15.576171875, -14.929443359375, -14.28271484375, -13.635986328125, -12.9892578125, -12.342529296875, -11.69580078125, -11.049072265625, -10.40234375, -9.755615234375, -9.10888671875, -8.462158203125, -7.8154296875, -7.168701171875, -6.52197265625, -5.875244140625, -5.228515625, -4.581787109375, -3.93505859375, -3.288330078125, -2.6416015625, -1.994873046875, -1.34814453125, -0.701416015625, -0.0546875, 0.592041015625, 1.23876953125, 1.885498046875, 2.5322265625, 3.178955078125, 3.82568359375, 4.472412109375, 5.119140625, 5.765869140625, 6.41259765625, 7.059326171875, 7.7060546875, 8.352783203125, 8.99951171875, 9.646240234375, 10.29296875, 10.939697265625, 11.58642578125, 12.233154296875, 12.8798828125, 13.526611328125, 14.17333984375, 14.820068359375, 15.466796875, 16.113525390625, 16.76025390625, 17.406982421875, 18.0537109375, 18.700439453125, 19.34716796875, 19.993896484375, 20.640625]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 10.0, 5.0, 7.0, 11.0, 13.0, 22.0, 26.0, 39.0, 61.0, 99.0, 124.0, 186.0, 242.0, 345.0, 551.0, 745.0, 1152.0, 1713.0, 2464.0, 3959.0, 6021.0, 9312.0, 15027.0, 24916.0, 42390.0, 76121.0, 148355.0, 274903.0, 202377.0, 100710.0, 54149.0, 31111.0, 18653.0, 11557.0, 7334.0, 4617.0, 3011.0, 1968.0, 1375.0, 883.0, 590.0, 425.0, 305.0, 197.0, 152.0, 100.0, 76.0, 47.0, 30.0, 26.0, 17.0, 7.0, 13.0, 3.0, 8.0, 3.0, 3.0, 2.0, 2.0, 1.0], "bins": [-0.90234375, -0.8738937377929688, -0.8454437255859375, -0.8169937133789062, -0.788543701171875, -0.7600936889648438, -0.7316436767578125, -0.7031936645507812, -0.67474365234375, -0.6462936401367188, -0.6178436279296875, -0.5893936157226562, -0.560943603515625, -0.5324935913085938, -0.5040435791015625, -0.47559356689453125, -0.4471435546875, -0.41869354248046875, -0.3902435302734375, -0.36179351806640625, -0.333343505859375, -0.30489349365234375, -0.2764434814453125, -0.24799346923828125, -0.21954345703125, -0.19109344482421875, -0.1626434326171875, -0.13419342041015625, -0.105743408203125, -0.07729339599609375, -0.0488433837890625, -0.02039337158203125, 0.008056640625, 0.03650665283203125, 0.0649566650390625, 0.09340667724609375, 0.121856689453125, 0.15030670166015625, 0.1787567138671875, 0.20720672607421875, 0.23565673828125, 0.26410675048828125, 0.2925567626953125, 0.32100677490234375, 0.349456787109375, 0.37790679931640625, 0.4063568115234375, 0.43480682373046875, 0.4632568359375, 0.49170684814453125, 0.5201568603515625, 0.5486068725585938, 0.577056884765625, 0.6055068969726562, 0.6339569091796875, 0.6624069213867188, 0.69085693359375, 0.7193069458007812, 0.7477569580078125, 0.7762069702148438, 0.804656982421875, 0.8331069946289062, 0.8615570068359375, 0.8900070190429688, 0.91845703125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 0.0, 2.0, 9.0, 8.0, 8.0, 12.0, 9.0, 10.0, 15.0, 18.0, 22.0, 12.0, 31.0, 34.0, 25.0, 32.0, 43.0, 35.0, 35.0, 48.0, 41.0, 33.0, 1070.0, 45.0, 38.0, 51.0, 27.0, 31.0, 31.0, 33.0, 38.0, 27.0, 20.0, 18.0, 17.0, 17.0, 9.0, 6.0, 13.0, 16.0, 7.0, 8.0, 8.0, 2.0, 7.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.359375, -10.9884033203125, -10.617431640625, -10.2464599609375, -9.87548828125, -9.5045166015625, -9.133544921875, -8.7625732421875, -8.3916015625, -8.0206298828125, -7.649658203125, -7.2786865234375, -6.90771484375, -6.5367431640625, -6.165771484375, -5.7947998046875, -5.423828125, -5.0528564453125, -4.681884765625, -4.3109130859375, -3.93994140625, -3.5689697265625, -3.197998046875, -2.8270263671875, -2.4560546875, -2.0850830078125, -1.714111328125, -1.3431396484375, -0.97216796875, -0.6011962890625, -0.230224609375, 0.1407470703125, 0.51171875, 0.8826904296875, 1.253662109375, 1.6246337890625, 1.99560546875, 2.3665771484375, 2.737548828125, 3.1085205078125, 3.4794921875, 3.8504638671875, 4.221435546875, 4.5924072265625, 4.96337890625, 5.3343505859375, 5.705322265625, 6.0762939453125, 6.447265625, 6.8182373046875, 7.189208984375, 7.5601806640625, 7.93115234375, 8.3021240234375, 8.673095703125, 9.0440673828125, 9.4150390625, 9.7860107421875, 10.156982421875, 10.5279541015625, 10.89892578125, 11.2698974609375, 11.640869140625, 12.0118408203125, 12.3828125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 4.0, 14.0, 17.0, 34.0, 37.0, 68.0, 87.0, 139.0, 185.0, 275.0, 406.0, 565.0, 848.0, 1138.0, 1657.0, 2343.0, 3197.0, 4458.0, 6348.0, 8870.0, 13132.0, 19308.0, 28858.0, 44294.0, 70852.0, 124277.0, 1259095.0, 207284.0, 109669.0, 63999.0, 40627.0, 26593.0, 17697.0, 12115.0, 8347.0, 5917.0, 4148.0, 3016.0, 2084.0, 1572.0, 1100.0, 736.0, 548.0, 365.0, 274.0, 180.0, 122.0, 69.0, 68.0, 33.0, 22.0, 16.0, 7.0, 12.0, 3.0, 6.0, 1.0, 1.0], "bins": [-0.73486328125, -0.7125244140625, -0.690185546875, -0.6678466796875, -0.6455078125, -0.6231689453125, -0.600830078125, -0.5784912109375, -0.55615234375, -0.5338134765625, -0.511474609375, -0.4891357421875, -0.466796875, -0.4444580078125, -0.422119140625, -0.3997802734375, -0.37744140625, -0.3551025390625, -0.332763671875, -0.3104248046875, -0.2880859375, -0.2657470703125, -0.243408203125, -0.2210693359375, -0.19873046875, -0.1763916015625, -0.154052734375, -0.1317138671875, -0.109375, -0.0870361328125, -0.064697265625, -0.0423583984375, -0.02001953125, 0.0023193359375, 0.024658203125, 0.0469970703125, 0.0693359375, 0.0916748046875, 0.114013671875, 0.1363525390625, 0.15869140625, 0.1810302734375, 0.203369140625, 0.2257080078125, 0.248046875, 0.2703857421875, 0.292724609375, 0.3150634765625, 0.33740234375, 0.3597412109375, 0.382080078125, 0.4044189453125, 0.4267578125, 0.4490966796875, 0.471435546875, 0.4937744140625, 0.51611328125, 0.5384521484375, 0.560791015625, 0.5831298828125, 0.60546875, 0.6278076171875, 0.650146484375, 0.6724853515625, 0.69482421875]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 5.0, 4.0, 7.0, 7.0, 7.0, 8.0, 11.0, 19.0, 15.0, 21.0, 30.0, 32.0, 34.0, 34.0, 40.0, 56.0, 60.0, 52.0, 62.0, 55.0, 51.0, 53.0, 50.0, 47.0, 46.0, 40.0, 31.0, 25.0, 17.0, 21.0, 13.0, 12.0, 10.0, 4.0, 5.0, 6.0, 9.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003070831298828125, -0.0029622912406921387, -0.0028537511825561523, -0.002745211124420166, -0.0026366710662841797, -0.0025281310081481934, -0.002419590950012207, -0.0023110508918762207, -0.0022025108337402344, -0.002093970775604248, -0.0019854307174682617, -0.0018768906593322754, -0.001768350601196289, -0.0016598105430603027, -0.0015512704849243164, -0.00144273042678833, -0.0013341903686523438, -0.0012256503105163574, -0.001117110252380371, -0.0010085701942443848, -0.0009000301361083984, -0.0007914900779724121, -0.0006829500198364258, -0.0005744099617004395, -0.0004658699035644531, -0.0003573298454284668, -0.00024878978729248047, -0.00014024972915649414, -3.170967102050781e-05, 7.683038711547852e-05, 0.00018537044525146484, 0.00029391050338745117, 0.0004024505615234375, 0.0005109906196594238, 0.0006195306777954102, 0.0007280707359313965, 0.0008366107940673828, 0.0009451508522033691, 0.0010536909103393555, 0.0011622309684753418, 0.0012707710266113281, 0.0013793110847473145, 0.0014878511428833008, 0.0015963912010192871, 0.0017049312591552734, 0.0018134713172912598, 0.001922011375427246, 0.0020305514335632324, 0.0021390914916992188, 0.002247631549835205, 0.0023561716079711914, 0.0024647116661071777, 0.002573251724243164, 0.0026817917823791504, 0.0027903318405151367, 0.002898871898651123, 0.0030074119567871094, 0.0031159520149230957, 0.003224492073059082, 0.0033330321311950684, 0.0034415721893310547, 0.003550112247467041, 0.0036586523056030273, 0.0037671923637390137, 0.003875732421875]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 3.0, 3.0, 5.0, 13.0, 10.0, 16.0, 19.0, 14.0, 20.0, 35.0, 39.0, 53.0, 71.0, 86.0, 92.0, 150.0, 234.0, 380.0, 967.0, 9066.0, 298852.0, 716523.0, 19168.0, 1356.0, 395.0, 239.0, 177.0, 120.0, 88.0, 89.0, 63.0, 43.0, 40.0, 27.0, 21.0, 17.0, 10.0, 10.0, 11.0, 9.0, 7.0, 6.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.053741455078125, -0.05216646194458008, -0.050591468811035156, -0.049016475677490234, -0.04744148254394531, -0.04586648941040039, -0.04429149627685547, -0.04271650314331055, -0.041141510009765625, -0.0395665168762207, -0.03799152374267578, -0.03641653060913086, -0.03484153747558594, -0.033266544342041016, -0.031691551208496094, -0.030116558074951172, -0.02854156494140625, -0.026966571807861328, -0.025391578674316406, -0.023816585540771484, -0.022241592407226562, -0.02066659927368164, -0.01909160614013672, -0.017516613006591797, -0.015941619873046875, -0.014366626739501953, -0.012791633605957031, -0.01121664047241211, -0.009641647338867188, -0.008066654205322266, -0.006491661071777344, -0.004916667938232422, -0.0033416748046875, -0.0017666816711425781, -0.00019168853759765625, 0.0013833045959472656, 0.0029582977294921875, 0.004533290863037109, 0.006108283996582031, 0.007683277130126953, 0.009258270263671875, 0.010833263397216797, 0.012408256530761719, 0.01398324966430664, 0.015558242797851562, 0.017133235931396484, 0.018708229064941406, 0.020283222198486328, 0.02185821533203125, 0.023433208465576172, 0.025008201599121094, 0.026583194732666016, 0.028158187866210938, 0.02973318099975586, 0.03130817413330078, 0.0328831672668457, 0.034458160400390625, 0.03603315353393555, 0.03760814666748047, 0.03918313980102539, 0.04075813293457031, 0.042333126068115234, 0.043908119201660156, 0.04548311233520508, 0.04705810546875]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 7.0, 43.0, 445.0, 437.0, 70.0, 9.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.026122938841581345, -0.025485867634415627, -0.02484879456460476, -0.02421172335743904, -0.023574650287628174, -0.022937579080462456, -0.022300507873296738, -0.02166343480348587, -0.021026363596320152, -0.020389292389154434, -0.019752219319343567, -0.01911514811217785, -0.01847807504236698, -0.017841003835201263, -0.017203930765390396, -0.016566859558224678, -0.01592978835105896, -0.015292716212570667, -0.014655644074082375, -0.014018572866916656, -0.013381500728428364, -0.012744428589940071, -0.012107356451451778, -0.011470284312963486, -0.010833211243152618, -0.010196139104664326, -0.009559066966176033, -0.008921995759010315, -0.008284923620522022, -0.0076478514820337296, -0.007010779343545437, -0.0063737076707184315, -0.0057366350665688515, -0.005099562928080559, -0.004462491255253553, -0.0038254191167652607, -0.0031883472111076117, -0.0025512753054499626, -0.00191420316696167, -0.0012771314941346645, -0.0006400593556463718, -2.9873917810618877e-06, 0.0006340845720842481, 0.001271156594157219, 0.001908228499814868, 0.002545300405472517, 0.0031823725439608097, 0.003819444216787815, 0.004456516355276108, 0.0050935884937644005, 0.005730660166591406, 0.0063677323050796986, 0.007004803977906704, 0.007641876116394997, 0.00827894825488329, 0.008916020393371582, 0.0095530916005373, 0.010190163739025593, 0.010827235877513885, 0.011464307084679604, 0.012101379223167896, 0.012738451361656189, 0.013375523500144482, 0.014012595638632774, 0.014649667777121067]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 6.0, 5.0, 6.0, 3.0, 14.0, 11.0, 9.0, 13.0, 19.0, 22.0, 18.0, 18.0, 22.0, 21.0, 33.0, 30.0, 39.0, 47.0, 45.0, 43.0, 37.0, 42.0, 42.0, 33.0, 45.0, 50.0, 40.0, 43.0, 35.0, 37.0, 24.0, 26.0, 18.0, 24.0, 26.0, 15.0, 13.0, 10.0, 4.0, 7.0, 5.0, 7.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0024372339248657227, -0.002367524430155754, -0.0022978149354457855, -0.002228105440735817, -0.0021583959460258484, -0.00208868645131588, -0.0020189769566059113, -0.0019492674618959427, -0.0018795579671859741, -0.0018098484724760056, -0.001740138977766037, -0.0016704294830560684, -0.0016007199883460999, -0.0015310104936361313, -0.0014613009989261627, -0.0013915915042161942, -0.0013218820095062256, -0.001252172514796257, -0.0011824630200862885, -0.0011127535253763199, -0.0010430440306663513, -0.0009733345359563828, -0.0009036250412464142, -0.0008339155465364456, -0.000764206051826477, -0.0006944965571165085, -0.0006247870624065399, -0.0005550775676965714, -0.0004853680729866028, -0.0004156585782766342, -0.00034594908356666565, -0.0002762395888566971, -0.00020653009414672852, -0.00013682059943675995, -6.711110472679138e-05, 2.598389983177185e-06, 7.230788469314575e-05, 0.00014201737940311432, 0.00021172687411308289, 0.00028143636882305145, 0.00035114586353302, 0.0004208553582429886, 0.0004905648529529572, 0.0005602743476629257, 0.0006299838423728943, 0.0006996933370828629, 0.0007694028317928314, 0.0008391123265028, 0.0009088218212127686, 0.0009785313159227371, 0.0010482408106327057, 0.0011179503053426743, 0.0011876598000526428, 0.0012573692947626114, 0.00132707878947258, 0.0013967882841825485, 0.001466497778892517, 0.0015362072736024857, 0.0016059167683124542, 0.0016756262630224228, 0.0017453357577323914, 0.00181504525244236, 0.0018847547471523285, 0.001954464241862297, 0.0020241737365722656]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 5.0, 4.0, 6.0, 5.0, 4.0, 20.0, 11.0, 15.0, 13.0, 16.0, 28.0, 31.0, 28.0, 24.0, 42.0, 35.0, 50.0, 44.0, 48.0, 58.0, 53.0, 48.0, 37.0, 46.0, 45.0, 43.0, 40.0, 27.0, 35.0, 31.0, 18.0, 15.0, 17.0, 6.0, 9.0, 7.0, 12.0, 9.0, 7.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.75, -20.103271484375, -19.45654296875, -18.809814453125, -18.1630859375, -17.516357421875, -16.86962890625, -16.222900390625, -15.576171875, -14.929443359375, -14.28271484375, -13.635986328125, -12.9892578125, -12.342529296875, -11.69580078125, -11.049072265625, -10.40234375, -9.755615234375, -9.10888671875, -8.462158203125, -7.8154296875, -7.168701171875, -6.52197265625, -5.875244140625, -5.228515625, -4.581787109375, -3.93505859375, -3.288330078125, -2.6416015625, -1.994873046875, -1.34814453125, -0.701416015625, -0.0546875, 0.592041015625, 1.23876953125, 1.885498046875, 2.5322265625, 3.178955078125, 3.82568359375, 4.472412109375, 5.119140625, 5.765869140625, 6.41259765625, 7.059326171875, 7.7060546875, 8.352783203125, 8.99951171875, 9.646240234375, 10.29296875, 10.939697265625, 11.58642578125, 12.233154296875, 12.8798828125, 13.526611328125, 14.17333984375, 14.820068359375, 15.466796875, 16.113525390625, 16.76025390625, 17.406982421875, 18.0537109375, 18.700439453125, 19.34716796875, 19.993896484375, 20.640625]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 8.0, 7.0, 8.0, 13.0, 16.0, 17.0, 38.0, 55.0, 57.0, 85.0, 124.0, 186.0, 323.0, 436.0, 619.0, 792.0, 1302.0, 1990.0, 3341.0, 6201.0, 12680.0, 34174.0, 144960.0, 643027.0, 137692.0, 32546.0, 12140.0, 6144.0, 3411.0, 2093.0, 1315.0, 832.0, 598.0, 426.0, 306.0, 174.0, 121.0, 63.0, 75.0, 55.0, 35.0, 26.0, 18.0, 12.0, 8.0, 2.0, 5.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.640625, -14.18994140625, -13.7392578125, -13.28857421875, -12.837890625, -12.38720703125, -11.9365234375, -11.48583984375, -11.03515625, -10.58447265625, -10.1337890625, -9.68310546875, -9.232421875, -8.78173828125, -8.3310546875, -7.88037109375, -7.4296875, -6.97900390625, -6.5283203125, -6.07763671875, -5.626953125, -5.17626953125, -4.7255859375, -4.27490234375, -3.82421875, -3.37353515625, -2.9228515625, -2.47216796875, -2.021484375, -1.57080078125, -1.1201171875, -0.66943359375, -0.21875, 0.23193359375, 0.6826171875, 1.13330078125, 1.583984375, 2.03466796875, 2.4853515625, 2.93603515625, 3.38671875, 3.83740234375, 4.2880859375, 4.73876953125, 5.189453125, 5.64013671875, 6.0908203125, 6.54150390625, 6.9921875, 7.44287109375, 7.8935546875, 8.34423828125, 8.794921875, 9.24560546875, 9.6962890625, 10.14697265625, 10.59765625, 11.04833984375, 11.4990234375, 11.94970703125, 12.400390625, 12.85107421875, 13.3017578125, 13.75244140625, 14.203125]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 2.0, 7.0, 7.0, 8.0, 6.0, 10.0, 11.0, 18.0, 18.0, 12.0, 18.0, 16.0, 27.0, 27.0, 24.0, 35.0, 30.0, 25.0, 25.0, 45.0, 41.0, 35.0, 77.0, 1910.0, 123.0, 51.0, 31.0, 38.0, 38.0, 34.0, 41.0, 29.0, 26.0, 22.0, 30.0, 21.0, 18.0, 24.0, 11.0, 11.0, 16.0, 12.0, 5.0, 3.0, 5.0, 4.0, 5.0, 4.0, 5.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0], "bins": [-53.4375, -51.697265625, -49.95703125, -48.216796875, -46.4765625, -44.736328125, -42.99609375, -41.255859375, -39.515625, -37.775390625, -36.03515625, -34.294921875, -32.5546875, -30.814453125, -29.07421875, -27.333984375, -25.59375, -23.853515625, -22.11328125, -20.373046875, -18.6328125, -16.892578125, -15.15234375, -13.412109375, -11.671875, -9.931640625, -8.19140625, -6.451171875, -4.7109375, -2.970703125, -1.23046875, 0.509765625, 2.25, 3.990234375, 5.73046875, 7.470703125, 9.2109375, 10.951171875, 12.69140625, 14.431640625, 16.171875, 17.912109375, 19.65234375, 21.392578125, 23.1328125, 24.873046875, 26.61328125, 28.353515625, 30.09375, 31.833984375, 33.57421875, 35.314453125, 37.0546875, 38.794921875, 40.53515625, 42.275390625, 44.015625, 45.755859375, 47.49609375, 49.236328125, 50.9765625, 52.716796875, 54.45703125, 56.197265625, 57.9375]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 3.0, 5.0, 5.0, 7.0, 5.0, 8.0, 7.0, 19.0, 26.0, 23.0, 48.0, 54.0, 81.0, 137.0, 182.0, 396.0, 813.0, 2969.0, 23509.0, 3080609.0, 31451.0, 3413.0, 915.0, 400.0, 216.0, 124.0, 82.0, 53.0, 35.0, 28.0, 23.0, 25.0, 13.0, 14.0, 7.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-95.3125, -91.0849609375, -86.857421875, -82.6298828125, -78.40234375, -74.1748046875, -69.947265625, -65.7197265625, -61.4921875, -57.2646484375, -53.037109375, -48.8095703125, -44.58203125, -40.3544921875, -36.126953125, -31.8994140625, -27.671875, -23.4443359375, -19.216796875, -14.9892578125, -10.76171875, -6.5341796875, -2.306640625, 1.9208984375, 6.1484375, 10.3759765625, 14.603515625, 18.8310546875, 23.05859375, 27.2861328125, 31.513671875, 35.7412109375, 39.96875, 44.1962890625, 48.423828125, 52.6513671875, 56.87890625, 61.1064453125, 65.333984375, 69.5615234375, 73.7890625, 78.0166015625, 82.244140625, 86.4716796875, 90.69921875, 94.9267578125, 99.154296875, 103.3818359375, 107.609375, 111.8369140625, 116.064453125, 120.2919921875, 124.51953125, 128.7470703125, 132.974609375, 137.2021484375, 141.4296875, 145.6572265625, 149.884765625, 154.1123046875, 158.33984375, 162.5673828125, 166.794921875, 171.0224609375, 175.25]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 307.0, 694.0, 17.0], "bins": [-1668.79833984375, -1641.927490234375, -1615.056640625, -1588.185791015625, -1561.31494140625, -1534.444091796875, -1507.5732421875, -1480.7022705078125, -1453.8314208984375, -1426.9605712890625, -1400.0897216796875, -1373.2188720703125, -1346.3480224609375, -1319.47705078125, -1292.606201171875, -1265.7353515625, -1238.864501953125, -1211.99365234375, -1185.122802734375, -1158.251953125, -1131.381103515625, -1104.51025390625, -1077.639404296875, -1050.7684326171875, -1023.897705078125, -997.02685546875, -970.156005859375, -943.28515625, -916.4142456054688, -889.5433959960938, -862.6725463867188, -835.8016967773438, -808.9307861328125, -782.0599365234375, -755.1890869140625, -728.3182373046875, -701.4473266601562, -674.5764770507812, -647.7056274414062, -620.8347778320312, -593.9639282226562, -567.0930786132812, -540.2222290039062, -513.351318359375, -486.48046875, -459.609619140625, -432.73876953125, -405.867919921875, -378.9970397949219, -352.1261901855469, -325.25531005859375, -298.38446044921875, -271.51361083984375, -244.64273071289062, -217.77188110351562, -190.90101623535156, -164.0301513671875, -137.15928649902344, -110.2884292602539, -83.41757202148438, -56.54670715332031, -29.67584228515625, -2.80499267578125, 24.065872192382812, 50.93674087524414]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 7.0, 10.0, 8.0, 7.0, 6.0, 9.0, 19.0, 18.0, 22.0, 21.0, 27.0, 24.0, 35.0, 34.0, 34.0, 37.0, 51.0, 45.0, 42.0, 45.0, 50.0, 48.0, 60.0, 35.0, 36.0, 34.0, 29.0, 28.0, 29.0, 28.0, 21.0, 14.0, 20.0, 13.0, 7.0, 10.0, 10.0, 2.0, 6.0, 5.0, 6.0, 5.0, 2.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-194.66770935058594, -188.0906219482422, -181.51353454589844, -174.9364471435547, -168.35935974121094, -161.78228759765625, -155.2052001953125, -148.62811279296875, -142.051025390625, -135.47393798828125, -128.8968505859375, -122.31976318359375, -115.74268341064453, -109.16559600830078, -102.58850860595703, -96.01142883300781, -89.43433380126953, -82.85724639892578, -76.28015899658203, -69.70307922363281, -63.12599182128906, -56.54890441894531, -49.97181701660156, -43.39473342895508, -36.81764602661133, -30.24056053161621, -23.663475036621094, -17.086387634277344, -10.509302139282227, -3.9322166442871094, 2.6448707580566406, 9.221954345703125, 15.799041748046875, 22.376127243041992, 28.95321273803711, 35.53030014038086, 42.107383728027344, 48.684471130371094, 55.261558532714844, 61.83864212036133, 68.41572570800781, 74.99281311035156, 81.56990051269531, 88.14698791503906, 94.72406768798828, 101.30115509033203, 107.87824249267578, 114.455322265625, 121.03241729736328, 127.60950469970703, 134.18658447265625, 140.763671875, 147.34075927734375, 153.9178466796875, 160.49493408203125, 167.072021484375, 173.64910888671875, 180.2261962890625, 186.80328369140625, 193.38037109375, 199.95745849609375, 206.5345458984375, 213.11163330078125, 219.68870544433594, 226.2657928466797]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 7.0, 6.0, 3.0, 5.0, 10.0, 15.0, 11.0, 19.0, 14.0, 13.0, 22.0, 24.0, 40.0, 33.0, 36.0, 35.0, 44.0, 56.0, 61.0, 56.0, 45.0, 53.0, 44.0, 38.0, 40.0, 42.0, 38.0, 24.0, 39.0, 25.0, 21.0, 17.0, 9.0, 12.0, 12.0, 9.0, 6.0, 6.0, 8.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.9375, -21.270751953125, -20.60400390625, -19.937255859375, -19.2705078125, -18.603759765625, -17.93701171875, -17.270263671875, -16.603515625, -15.936767578125, -15.27001953125, -14.603271484375, -13.9365234375, -13.269775390625, -12.60302734375, -11.936279296875, -11.26953125, -10.602783203125, -9.93603515625, -9.269287109375, -8.6025390625, -7.935791015625, -7.26904296875, -6.602294921875, -5.935546875, -5.268798828125, -4.60205078125, -3.935302734375, -3.2685546875, -2.601806640625, -1.93505859375, -1.268310546875, -0.6015625, 0.065185546875, 0.73193359375, 1.398681640625, 2.0654296875, 2.732177734375, 3.39892578125, 4.065673828125, 4.732421875, 5.399169921875, 6.06591796875, 6.732666015625, 7.3994140625, 8.066162109375, 8.73291015625, 9.399658203125, 10.06640625, 10.733154296875, 11.39990234375, 12.066650390625, 12.7333984375, 13.400146484375, 14.06689453125, 14.733642578125, 15.400390625, 16.067138671875, 16.73388671875, 17.400634765625, 18.0673828125, 18.734130859375, 19.40087890625, 20.067626953125, 20.734375]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 6.0, 8.0, 13.0, 13.0, 18.0, 32.0, 49.0, 48.0, 81.0, 129.0, 157.0, 214.0, 351.0, 441.0, 674.0, 943.0, 1403.0, 2136.0, 3312.0, 5407.0, 8909.0, 16474.0, 41704.0, 917798.0, 3059854.0, 85520.0, 20752.0, 10674.0, 6078.0, 3735.0, 2460.0, 1499.0, 1034.0, 643.0, 486.0, 353.0, 251.0, 198.0, 130.0, 92.0, 73.0, 41.0, 26.0, 27.0, 15.0, 11.0, 4.0, 3.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.9375, -63.88671875, -61.8359375, -59.78515625, -57.734375, -55.68359375, -53.6328125, -51.58203125, -49.53125, -47.48046875, -45.4296875, -43.37890625, -41.328125, -39.27734375, -37.2265625, -35.17578125, -33.125, -31.07421875, -29.0234375, -26.97265625, -24.921875, -22.87109375, -20.8203125, -18.76953125, -16.71875, -14.66796875, -12.6171875, -10.56640625, -8.515625, -6.46484375, -4.4140625, -2.36328125, -0.3125, 1.73828125, 3.7890625, 5.83984375, 7.890625, 9.94140625, 11.9921875, 14.04296875, 16.09375, 18.14453125, 20.1953125, 22.24609375, 24.296875, 26.34765625, 28.3984375, 30.44921875, 32.5, 34.55078125, 36.6015625, 38.65234375, 40.703125, 42.75390625, 44.8046875, 46.85546875, 48.90625, 50.95703125, 53.0078125, 55.05859375, 57.109375, 59.16015625, 61.2109375, 63.26171875, 65.3125]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 3.0, 4.0, 5.0, 10.0, 4.0, 12.0, 11.0, 16.0, 21.0, 25.0, 32.0, 43.0, 93.0, 184.0, 498.0, 1606.0, 949.0, 252.0, 86.0, 46.0, 34.0, 31.0, 31.0, 19.0, 16.0, 9.0, 8.0, 7.0, 10.0, 2.0, 4.0, 1.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.0625, -70.4248046875, -67.787109375, -65.1494140625, -62.51171875, -59.8740234375, -57.236328125, -54.5986328125, -51.9609375, -49.3232421875, -46.685546875, -44.0478515625, -41.41015625, -38.7724609375, -36.134765625, -33.4970703125, -30.859375, -28.2216796875, -25.583984375, -22.9462890625, -20.30859375, -17.6708984375, -15.033203125, -12.3955078125, -9.7578125, -7.1201171875, -4.482421875, -1.8447265625, 0.79296875, 3.4306640625, 6.068359375, 8.7060546875, 11.34375, 13.9814453125, 16.619140625, 19.2568359375, 21.89453125, 24.5322265625, 27.169921875, 29.8076171875, 32.4453125, 35.0830078125, 37.720703125, 40.3583984375, 42.99609375, 45.6337890625, 48.271484375, 50.9091796875, 53.546875, 56.1845703125, 58.822265625, 61.4599609375, 64.09765625, 66.7353515625, 69.373046875, 72.0107421875, 74.6484375, 77.2861328125, 79.923828125, 82.5615234375, 85.19921875, 87.8369140625, 90.474609375, 93.1123046875, 95.75]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 10.0, 9.0, 21.0, 20.0, 41.0, 49.0, 66.0, 114.0, 202.0, 335.0, 559.0, 940.0, 1765.0, 3336.0, 6334.0, 12999.0, 30339.0, 93751.0, 3062780.0, 863104.0, 68902.0, 25475.0, 11163.0, 5473.0, 2830.0, 1549.0, 849.0, 512.0, 284.0, 147.0, 117.0, 64.0, 52.0, 32.0, 15.0, 14.0, 13.0, 8.0, 11.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-107.3125, -103.8388671875, -100.365234375, -96.8916015625, -93.41796875, -89.9443359375, -86.470703125, -82.9970703125, -79.5234375, -76.0498046875, -72.576171875, -69.1025390625, -65.62890625, -62.1552734375, -58.681640625, -55.2080078125, -51.734375, -48.2607421875, -44.787109375, -41.3134765625, -37.83984375, -34.3662109375, -30.892578125, -27.4189453125, -23.9453125, -20.4716796875, -16.998046875, -13.5244140625, -10.05078125, -6.5771484375, -3.103515625, 0.3701171875, 3.84375, 7.3173828125, 10.791015625, 14.2646484375, 17.73828125, 21.2119140625, 24.685546875, 28.1591796875, 31.6328125, 35.1064453125, 38.580078125, 42.0537109375, 45.52734375, 49.0009765625, 52.474609375, 55.9482421875, 59.421875, 62.8955078125, 66.369140625, 69.8427734375, 73.31640625, 76.7900390625, 80.263671875, 83.7373046875, 87.2109375, 90.6845703125, 94.158203125, 97.6318359375, 101.10546875, 104.5791015625, 108.052734375, 111.5263671875, 115.0]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 5.0, 8.0, 8.0, 6.0, 13.0, 22.0, 29.0, 40.0, 65.0, 97.0, 177.0, 211.0, 95.0, 67.0, 49.0, 30.0, 20.0, 17.0, 8.0, 11.0, 6.0, 6.0, 9.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-368.1773681640625, -359.00347900390625, -349.82958984375, -340.6557312011719, -331.4818420410156, -322.3079528808594, -313.1340637207031, -303.9601745605469, -294.78631591796875, -285.6124267578125, -276.43853759765625, -267.2646789550781, -258.0907897949219, -248.91690063476562, -239.74301147460938, -230.56912231445312, -221.39523315429688, -212.22134399414062, -203.04747009277344, -193.8735809326172, -184.69970703125, -175.52581787109375, -166.3519287109375, -157.17803955078125, -148.00416564941406, -138.8302764892578, -129.65640258789062, -120.48251342773438, -111.30863189697266, -102.13475036621094, -92.96086120605469, -83.78697967529297, -74.61306762695312, -65.4391860961914, -56.26530075073242, -47.09141540527344, -37.91753387451172, -28.74365234375, -19.569766998291016, -10.395881652832031, -1.2220001220703125, 7.951883316040039, 17.12576675415039, 26.299650192260742, 35.473533630371094, 44.64741516113281, 53.8213005065918, 62.99518585205078, 72.1690673828125, 81.34294891357422, 90.51683044433594, 99.69071960449219, 108.8646011352539, 118.03848266601562, 127.21237182617188, 136.38626098632812, 145.5601348876953, 154.73402404785156, 163.90789794921875, 173.081787109375, 182.25567626953125, 191.42955017089844, 200.6034393310547, 209.77731323242188, 218.95120239257812]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [5.0, 1.0, 1.0, 3.0, 3.0, 0.0, 3.0, 8.0, 7.0, 5.0, 10.0, 8.0, 9.0, 15.0, 13.0, 12.0, 12.0, 29.0, 29.0, 25.0, 26.0, 30.0, 27.0, 43.0, 38.0, 35.0, 45.0, 35.0, 51.0, 47.0, 48.0, 38.0, 36.0, 32.0, 26.0, 39.0, 25.0, 19.0, 23.0, 22.0, 25.0, 17.0, 11.0, 14.0, 14.0, 10.0, 14.0, 8.0, 7.0, 2.0, 2.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-144.2861785888672, -139.2480010986328, -134.20982360839844, -129.17164611816406, -124.13346862792969, -119.09529113769531, -114.05711364746094, -109.01893615722656, -103.98075866699219, -98.94258117675781, -93.90440368652344, -88.86622619628906, -83.82804870605469, -78.78987121582031, -73.75169372558594, -68.71351623535156, -63.675331115722656, -58.63715362548828, -53.598976135253906, -48.56079864501953, -43.522621154785156, -38.48444366455078, -33.44626235961914, -28.408084869384766, -23.36990737915039, -18.331729888916016, -13.293551445007324, -8.255373001098633, -3.217195510864258, 1.8209819793701172, 6.859161376953125, 11.8973388671875, 16.935516357421875, 21.97369384765625, 27.011871337890625, 32.050048828125, 37.088226318359375, 42.12640380859375, 47.16458511352539, 52.202762603759766, 57.24094009399414, 62.279117584228516, 67.31729888916016, 72.35547637939453, 77.3936538696289, 82.43183135986328, 87.47000885009766, 92.50818634033203, 97.5463638305664, 102.58454132080078, 107.62271881103516, 112.66089630126953, 117.6990737915039, 122.73725128173828, 127.77543640136719, 132.81361389160156, 137.85179138183594, 142.8899688720703, 147.9281463623047, 152.96632385253906, 158.00450134277344, 163.0426788330078, 168.0808563232422, 173.11903381347656, 178.15721130371094]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 3.0, 6.0, 8.0, 9.0, 10.0, 11.0, 16.0, 24.0, 17.0, 12.0, 21.0, 27.0, 33.0, 45.0, 38.0, 45.0, 55.0, 51.0, 49.0, 48.0, 48.0, 50.0, 49.0, 48.0, 30.0, 59.0, 32.0, 23.0, 19.0, 24.0, 26.0, 14.0, 9.0, 9.0, 6.0, 9.0, 6.0, 4.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-23.84375, -23.14794921875, -22.4521484375, -21.75634765625, -21.060546875, -20.36474609375, -19.6689453125, -18.97314453125, -18.27734375, -17.58154296875, -16.8857421875, -16.18994140625, -15.494140625, -14.79833984375, -14.1025390625, -13.40673828125, -12.7109375, -12.01513671875, -11.3193359375, -10.62353515625, -9.927734375, -9.23193359375, -8.5361328125, -7.84033203125, -7.14453125, -6.44873046875, -5.7529296875, -5.05712890625, -4.361328125, -3.66552734375, -2.9697265625, -2.27392578125, -1.578125, -0.88232421875, -0.1865234375, 0.50927734375, 1.205078125, 1.90087890625, 2.5966796875, 3.29248046875, 3.98828125, 4.68408203125, 5.3798828125, 6.07568359375, 6.771484375, 7.46728515625, 8.1630859375, 8.85888671875, 9.5546875, 10.25048828125, 10.9462890625, 11.64208984375, 12.337890625, 13.03369140625, 13.7294921875, 14.42529296875, 15.12109375, 15.81689453125, 16.5126953125, 17.20849609375, 17.904296875, 18.60009765625, 19.2958984375, 19.99169921875, 20.6875]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 4.0, 5.0, 5.0, 11.0, 14.0, 11.0, 20.0, 34.0, 56.0, 76.0, 114.0, 160.0, 221.0, 330.0, 493.0, 751.0, 1124.0, 1656.0, 2532.0, 3729.0, 5515.0, 8564.0, 13363.0, 21693.0, 37104.0, 66091.0, 127740.0, 247233.0, 235443.0, 119253.0, 62188.0, 34860.0, 20715.0, 12960.0, 8359.0, 5434.0, 3540.0, 2408.0, 1553.0, 1041.0, 640.0, 478.0, 353.0, 223.0, 146.0, 98.0, 79.0, 46.0, 36.0, 19.0, 18.0, 13.0, 8.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.94873046875, -0.919036865234375, -0.88934326171875, -0.859649658203125, -0.8299560546875, -0.800262451171875, -0.77056884765625, -0.740875244140625, -0.711181640625, -0.681488037109375, -0.65179443359375, -0.622100830078125, -0.5924072265625, -0.562713623046875, -0.53302001953125, -0.503326416015625, -0.4736328125, -0.443939208984375, -0.41424560546875, -0.384552001953125, -0.3548583984375, -0.325164794921875, -0.29547119140625, -0.265777587890625, -0.236083984375, -0.206390380859375, -0.17669677734375, -0.147003173828125, -0.1173095703125, -0.087615966796875, -0.05792236328125, -0.028228759765625, 0.00146484375, 0.031158447265625, 0.06085205078125, 0.090545654296875, 0.1202392578125, 0.149932861328125, 0.17962646484375, 0.209320068359375, 0.239013671875, 0.268707275390625, 0.29840087890625, 0.328094482421875, 0.3577880859375, 0.387481689453125, 0.41717529296875, 0.446868896484375, 0.4765625, 0.506256103515625, 0.53594970703125, 0.565643310546875, 0.5953369140625, 0.625030517578125, 0.65472412109375, 0.684417724609375, 0.714111328125, 0.743804931640625, 0.77349853515625, 0.803192138671875, 0.8328857421875, 0.862579345703125, 0.89227294921875, 0.921966552734375, 0.95166015625]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 4.0, 1.0, 2.0, 5.0, 5.0, 3.0, 8.0, 7.0, 13.0, 12.0, 10.0, 7.0, 18.0, 20.0, 23.0, 24.0, 23.0, 31.0, 30.0, 26.0, 36.0, 40.0, 37.0, 38.0, 36.0, 32.0, 1071.0, 45.0, 48.0, 30.0, 44.0, 21.0, 31.0, 42.0, 22.0, 26.0, 25.0, 21.0, 18.0, 18.0, 14.0, 16.0, 14.0, 9.0, 6.0, 7.0, 4.0, 2.0, 6.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.2109375, -9.8609619140625, -9.510986328125, -9.1610107421875, -8.81103515625, -8.4610595703125, -8.111083984375, -7.7611083984375, -7.4111328125, -7.0611572265625, -6.711181640625, -6.3612060546875, -6.01123046875, -5.6612548828125, -5.311279296875, -4.9613037109375, -4.611328125, -4.2613525390625, -3.911376953125, -3.5614013671875, -3.21142578125, -2.8614501953125, -2.511474609375, -2.1614990234375, -1.8115234375, -1.4615478515625, -1.111572265625, -0.7615966796875, -0.41162109375, -0.0616455078125, 0.288330078125, 0.6383056640625, 0.98828125, 1.3382568359375, 1.688232421875, 2.0382080078125, 2.38818359375, 2.7381591796875, 3.088134765625, 3.4381103515625, 3.7880859375, 4.1380615234375, 4.488037109375, 4.8380126953125, 5.18798828125, 5.5379638671875, 5.887939453125, 6.2379150390625, 6.587890625, 6.9378662109375, 7.287841796875, 7.6378173828125, 7.98779296875, 8.3377685546875, 8.687744140625, 9.0377197265625, 9.3876953125, 9.7376708984375, 10.087646484375, 10.4376220703125, 10.78759765625, 11.1375732421875, 11.487548828125, 11.8375244140625, 12.1875]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 8.0, 8.0, 25.0, 37.0, 52.0, 74.0, 106.0, 160.0, 245.0, 400.0, 526.0, 767.0, 1123.0, 1661.0, 2431.0, 3380.0, 5062.0, 7194.0, 10509.0, 15735.0, 23383.0, 36193.0, 57590.0, 97386.0, 176709.0, 1283480.0, 145924.0, 81806.0, 49417.0, 31117.0, 20712.0, 13921.0, 9371.0, 6431.0, 4409.0, 3039.0, 2126.0, 1422.0, 1058.0, 724.0, 454.0, 303.0, 234.0, 155.0, 97.0, 59.0, 40.0, 24.0, 14.0, 18.0, 7.0, 5.0, 4.0, 1.0, 2.0, 2.0], "bins": [-0.75927734375, -0.7365036010742188, -0.7137298583984375, -0.6909561157226562, -0.668182373046875, -0.6454086303710938, -0.6226348876953125, -0.5998611450195312, -0.57708740234375, -0.5543136596679688, -0.5315399169921875, -0.5087661743164062, -0.485992431640625, -0.46321868896484375, -0.4404449462890625, -0.41767120361328125, -0.3948974609375, -0.37212371826171875, -0.3493499755859375, -0.32657623291015625, -0.303802490234375, -0.28102874755859375, -0.2582550048828125, -0.23548126220703125, -0.21270751953125, -0.18993377685546875, -0.1671600341796875, -0.14438629150390625, -0.121612548828125, -0.09883880615234375, -0.0760650634765625, -0.05329132080078125, -0.030517578125, -0.00774383544921875, 0.0150299072265625, 0.03780364990234375, 0.060577392578125, 0.08335113525390625, 0.1061248779296875, 0.12889862060546875, 0.15167236328125, 0.17444610595703125, 0.1972198486328125, 0.21999359130859375, 0.242767333984375, 0.26554107666015625, 0.2883148193359375, 0.31108856201171875, 0.3338623046875, 0.35663604736328125, 0.3794097900390625, 0.40218353271484375, 0.424957275390625, 0.44773101806640625, 0.4705047607421875, 0.49327850341796875, 0.51605224609375, 0.5388259887695312, 0.5615997314453125, 0.5843734741210938, 0.607147216796875, 0.6299209594726562, 0.6526947021484375, 0.6754684448242188, 0.6982421875]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 1.0, 4.0, 6.0, 9.0, 11.0, 17.0, 16.0, 15.0, 24.0, 26.0, 39.0, 38.0, 47.0, 44.0, 55.0, 72.0, 69.0, 69.0, 73.0, 61.0, 49.0, 44.0, 47.0, 29.0, 42.0, 17.0, 19.0, 11.0, 11.0, 11.0, 6.0, 5.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0041656494140625, -0.004054933786392212, -0.003944218158721924, -0.0038335025310516357, -0.0037227869033813477, -0.0036120712757110596, -0.0035013556480407715, -0.0033906400203704834, -0.0032799243927001953, -0.0031692087650299072, -0.003058493137359619, -0.002947777509689331, -0.002837061882019043, -0.002726346254348755, -0.002615630626678467, -0.0025049149990081787, -0.0023941993713378906, -0.0022834837436676025, -0.0021727681159973145, -0.0020620524883270264, -0.0019513368606567383, -0.0018406212329864502, -0.0017299056053161621, -0.001619189977645874, -0.001508474349975586, -0.0013977587223052979, -0.0012870430946350098, -0.0011763274669647217, -0.0010656118392944336, -0.0009548962116241455, -0.0008441805839538574, -0.0007334649562835693, -0.0006227493286132812, -0.0005120337009429932, -0.0004013180732727051, -0.000290602445602417, -0.0001798868179321289, -6.917119026184082e-05, 4.1544437408447266e-05, 0.00015226006507873535, 0.00026297569274902344, 0.0003736913204193115, 0.0004844069480895996, 0.0005951225757598877, 0.0007058382034301758, 0.0008165538311004639, 0.000927269458770752, 0.00103798508644104, 0.0011487007141113281, 0.0012594163417816162, 0.0013701319694519043, 0.0014808475971221924, 0.0015915632247924805, 0.0017022788524627686, 0.0018129944801330566, 0.0019237101078033447, 0.002034425735473633, 0.002145141363143921, 0.002255856990814209, 0.002366572618484497, 0.002477288246154785, 0.0025880038738250732, 0.0026987195014953613, 0.0028094351291656494, 0.0029201507568359375]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 7.0, 13.0, 12.0, 12.0, 20.0, 35.0, 43.0, 54.0, 78.0, 112.0, 157.0, 214.0, 340.0, 673.0, 4853.0, 240217.0, 784873.0, 14566.0, 988.0, 399.0, 245.0, 183.0, 141.0, 81.0, 62.0, 52.0, 35.0, 24.0, 14.0, 8.0, 8.0, 5.0, 9.0, 3.0, 6.0, 5.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.055999755859375, -0.05425834655761719, -0.052516937255859375, -0.05077552795410156, -0.04903411865234375, -0.04729270935058594, -0.045551300048828125, -0.04380989074707031, -0.0420684814453125, -0.04032707214355469, -0.038585662841796875, -0.03684425354003906, -0.03510284423828125, -0.03336143493652344, -0.031620025634765625, -0.029878616333007812, -0.02813720703125, -0.026395797729492188, -0.024654388427734375, -0.022912979125976562, -0.02117156982421875, -0.019430160522460938, -0.017688751220703125, -0.015947341918945312, -0.0142059326171875, -0.012464523315429688, -0.010723114013671875, -0.008981704711914062, -0.00724029541015625, -0.0054988861083984375, -0.003757476806640625, -0.0020160675048828125, -0.000274658203125, 0.0014667510986328125, 0.003208160400390625, 0.0049495697021484375, 0.00669097900390625, 0.008432388305664062, 0.010173797607421875, 0.011915206909179688, 0.0136566162109375, 0.015398025512695312, 0.017139434814453125, 0.018880844116210938, 0.02062225341796875, 0.022363662719726562, 0.024105072021484375, 0.025846481323242188, 0.027587890625, 0.029329299926757812, 0.031070709228515625, 0.03281211853027344, 0.03455352783203125, 0.03629493713378906, 0.038036346435546875, 0.03977775573730469, 0.0415191650390625, 0.04326057434082031, 0.045001983642578125, 0.04674339294433594, 0.04848480224609375, 0.05022621154785156, 0.051967620849609375, 0.05370903015136719, 0.055450439453125]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 11.0, 43.0, 236.0, 524.0, 151.0, 29.0, 15.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.015575243160128593, -0.015108834952116013, -0.014642426744103432, -0.014176017604768276, -0.013709609396755695, -0.013243201188743114, -0.012776792049407959, -0.012310383841395378, -0.011843975633382797, -0.011377567425370216, -0.010911159217357635, -0.01044475007802248, -0.0099783418700099, -0.009511933661997318, -0.009045524522662163, -0.008579116314649582, -0.008112708106637001, -0.00764629989862442, -0.007179891224950552, -0.006713482551276684, -0.006247074343264103, -0.005780666135251522, -0.005314257461577654, -0.004847848787903786, -0.004381440579891205, -0.003915032371878624, -0.0034486236982047558, -0.0029822152573615313, -0.0025158068165183067, -0.002049398375675082, -0.0015829899348318577, -0.0011165814939886332, -0.0006501730531454086, -0.0001837646123021841, 0.0002826438285410404, 0.000749052269384265, 0.0012154607102274895, 0.001681869151070714, 0.0021482775919139385, 0.002614686032757163, 0.0030810944736003876, 0.003547502914443612, 0.004013911355286837, 0.004480320028960705, 0.004946728236973286, 0.0054131364449858665, 0.005879545118659735, 0.006345953792333603, 0.006812362000346184, 0.007278770208358765, 0.007745178882032633, 0.008211587555706501, 0.008677995763719082, 0.009144403971731663, 0.009610813111066818, 0.010077221319079399, 0.01054362952709198, 0.01101003773510456, 0.011476445943117142, 0.011942855082452297, 0.012409263290464878, 0.012875671498477459, 0.013342080637812614, 0.013808488845825195, 0.014274897053837776]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 1.0, 4.0, 9.0, 17.0, 10.0, 16.0, 25.0, 12.0, 24.0, 21.0, 31.0, 43.0, 29.0, 34.0, 31.0, 41.0, 50.0, 44.0, 35.0, 44.0, 32.0, 38.0, 51.0, 40.0, 45.0, 37.0, 32.0, 32.0, 28.0, 19.0, 17.0, 14.0, 16.0, 13.0, 8.0, 8.0, 8.0, 3.0, 9.0, 9.0, 7.0, 4.0, 1.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0021110177040100098, -0.0020444775000214577, -0.0019779372960329056, -0.0019113970920443535, -0.0018448568880558014, -0.0017783166840672493, -0.0017117764800786972, -0.0016452362760901451, -0.001578696072101593, -0.001512155868113041, -0.0014456156641244888, -0.0013790754601359367, -0.0013125352561473846, -0.0012459950521588326, -0.0011794548481702805, -0.0011129146441817284, -0.0010463744401931763, -0.0009798342362046242, -0.0009132940322160721, -0.00084675382822752, -0.0007802136242389679, -0.0007136734202504158, -0.0006471332162618637, -0.0005805930122733116, -0.0005140528082847595, -0.00044751260429620743, -0.00038097240030765533, -0.00031443219631910324, -0.00024789199233055115, -0.00018135178834199905, -0.00011481158435344696, -4.827138036489487e-05, 1.8268823623657227e-05, 8.480902761220932e-05, 0.00015134923160076141, 0.0002178894355893135, 0.0002844296395778656, 0.0003509698435664177, 0.0004175100475549698, 0.0004840502515435219, 0.000550590455532074, 0.0006171306595206261, 0.0006836708635091782, 0.0007502110674977303, 0.0008167512714862823, 0.0008832914754748344, 0.0009498316794633865, 0.0010163718834519386, 0.0010829120874404907, 0.0011494522914290428, 0.001215992495417595, 0.001282532699406147, 0.001349072903394699, 0.0014156131073832512, 0.0014821533113718033, 0.0015486935153603554, 0.0016152337193489075, 0.0016817739233374596, 0.0017483141273260117, 0.0018148543313145638, 0.0018813945353031158, 0.001947934739291668, 0.00201447494328022, 0.002081015147268772, 0.0021475553512573242]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 3.0, 6.0, 8.0, 9.0, 10.0, 11.0, 16.0, 24.0, 17.0, 12.0, 21.0, 27.0, 33.0, 45.0, 38.0, 45.0, 55.0, 51.0, 49.0, 48.0, 48.0, 50.0, 49.0, 48.0, 30.0, 59.0, 32.0, 23.0, 19.0, 24.0, 26.0, 14.0, 9.0, 9.0, 6.0, 9.0, 6.0, 4.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-23.84375, -23.14794921875, -22.4521484375, -21.75634765625, -21.060546875, -20.36474609375, -19.6689453125, -18.97314453125, -18.27734375, -17.58154296875, -16.8857421875, -16.18994140625, -15.494140625, -14.79833984375, -14.1025390625, -13.40673828125, -12.7109375, -12.01513671875, -11.3193359375, -10.62353515625, -9.927734375, -9.23193359375, -8.5361328125, -7.84033203125, -7.14453125, -6.44873046875, -5.7529296875, -5.05712890625, -4.361328125, -3.66552734375, -2.9697265625, -2.27392578125, -1.578125, -0.88232421875, -0.1865234375, 0.50927734375, 1.205078125, 1.90087890625, 2.5966796875, 3.29248046875, 3.98828125, 4.68408203125, 5.3798828125, 6.07568359375, 6.771484375, 7.46728515625, 8.1630859375, 8.85888671875, 9.5546875, 10.25048828125, 10.9462890625, 11.64208984375, 12.337890625, 13.03369140625, 13.7294921875, 14.42529296875, 15.12109375, 15.81689453125, 16.5126953125, 17.20849609375, 17.904296875, 18.60009765625, 19.2958984375, 19.99169921875, 20.6875]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 4.0, 7.0, 6.0, 13.0, 11.0, 20.0, 21.0, 46.0, 47.0, 64.0, 77.0, 123.0, 161.0, 224.0, 302.0, 435.0, 598.0, 858.0, 1292.0, 2105.0, 3706.0, 6972.0, 15230.0, 41269.0, 158384.0, 597550.0, 148758.0, 38766.0, 14850.0, 6774.0, 3550.0, 2093.0, 1274.0, 850.0, 598.0, 428.0, 296.0, 199.0, 162.0, 116.0, 90.0, 58.0, 39.0, 31.0, 35.0, 20.0, 12.0, 9.0, 4.0, 7.0, 6.0, 4.0, 3.0, 0.0, 3.0, 2.0], "bins": [-14.328125, -13.900146484375, -13.47216796875, -13.044189453125, -12.6162109375, -12.188232421875, -11.76025390625, -11.332275390625, -10.904296875, -10.476318359375, -10.04833984375, -9.620361328125, -9.1923828125, -8.764404296875, -8.33642578125, -7.908447265625, -7.48046875, -7.052490234375, -6.62451171875, -6.196533203125, -5.7685546875, -5.340576171875, -4.91259765625, -4.484619140625, -4.056640625, -3.628662109375, -3.20068359375, -2.772705078125, -2.3447265625, -1.916748046875, -1.48876953125, -1.060791015625, -0.6328125, -0.204833984375, 0.22314453125, 0.651123046875, 1.0791015625, 1.507080078125, 1.93505859375, 2.363037109375, 2.791015625, 3.218994140625, 3.64697265625, 4.074951171875, 4.5029296875, 4.930908203125, 5.35888671875, 5.786865234375, 6.21484375, 6.642822265625, 7.07080078125, 7.498779296875, 7.9267578125, 8.354736328125, 8.78271484375, 9.210693359375, 9.638671875, 10.066650390625, 10.49462890625, 10.922607421875, 11.3505859375, 11.778564453125, 12.20654296875, 12.634521484375, 13.0625]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 6.0, 6.0, 8.0, 6.0, 2.0, 10.0, 19.0, 17.0, 18.0, 13.0, 21.0, 35.0, 19.0, 32.0, 38.0, 42.0, 38.0, 54.0, 62.0, 150.0, 1869.0, 122.0, 75.0, 61.0, 36.0, 39.0, 35.0, 23.0, 23.0, 20.0, 22.0, 20.0, 20.0, 17.0, 23.0, 14.0, 12.0, 6.0, 9.0, 3.0, 3.0, 3.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.5625, -64.294921875, -62.02734375, -59.759765625, -57.4921875, -55.224609375, -52.95703125, -50.689453125, -48.421875, -46.154296875, -43.88671875, -41.619140625, -39.3515625, -37.083984375, -34.81640625, -32.548828125, -30.28125, -28.013671875, -25.74609375, -23.478515625, -21.2109375, -18.943359375, -16.67578125, -14.408203125, -12.140625, -9.873046875, -7.60546875, -5.337890625, -3.0703125, -0.802734375, 1.46484375, 3.732421875, 6.0, 8.267578125, 10.53515625, 12.802734375, 15.0703125, 17.337890625, 19.60546875, 21.873046875, 24.140625, 26.408203125, 28.67578125, 30.943359375, 33.2109375, 35.478515625, 37.74609375, 40.013671875, 42.28125, 44.548828125, 46.81640625, 49.083984375, 51.3515625, 53.619140625, 55.88671875, 58.154296875, 60.421875, 62.689453125, 64.95703125, 67.224609375, 69.4921875, 71.759765625, 74.02734375, 76.294921875, 78.5625]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 7.0, 4.0, 7.0, 14.0, 17.0, 22.0, 17.0, 23.0, 28.0, 24.0, 24.0, 39.0, 59.0, 101.0, 138.0, 240.0, 419.0, 1085.0, 13589.0, 3077902.0, 48799.0, 1818.0, 488.0, 277.0, 151.0, 105.0, 71.0, 45.0, 38.0, 34.0, 19.0, 14.0, 20.0, 11.0, 15.0, 8.0, 2.0, 7.0, 7.0, 6.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-125.3125, -121.6953125, -118.078125, -114.4609375, -110.84375, -107.2265625, -103.609375, -99.9921875, -96.375, -92.7578125, -89.140625, -85.5234375, -81.90625, -78.2890625, -74.671875, -71.0546875, -67.4375, -63.8203125, -60.203125, -56.5859375, -52.96875, -49.3515625, -45.734375, -42.1171875, -38.5, -34.8828125, -31.265625, -27.6484375, -24.03125, -20.4140625, -16.796875, -13.1796875, -9.5625, -5.9453125, -2.328125, 1.2890625, 4.90625, 8.5234375, 12.140625, 15.7578125, 19.375, 22.9921875, 26.609375, 30.2265625, 33.84375, 37.4609375, 41.078125, 44.6953125, 48.3125, 51.9296875, 55.546875, 59.1640625, 62.78125, 66.3984375, 70.015625, 73.6328125, 77.25, 80.8671875, 84.484375, 88.1015625, 91.71875, 95.3359375, 98.953125, 102.5703125, 106.1875]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 9.0, 92.0, 698.0, 201.0, 16.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-498.83734130859375, -487.66375732421875, -476.49017333984375, -465.3165588378906, -454.1429748535156, -442.9693908691406, -431.7957763671875, -420.6221923828125, -409.4486083984375, -398.2750244140625, -387.1014404296875, -375.9278259277344, -364.7542419433594, -353.5806579589844, -342.40704345703125, -331.23345947265625, -320.05987548828125, -308.88629150390625, -297.71270751953125, -286.5390930175781, -275.3655090332031, -264.1919250488281, -253.01832580566406, -241.8447265625, -230.671142578125, -219.49755859375, -208.32395935058594, -197.15036010742188, -185.97677612304688, -174.80319213867188, -163.6295928955078, -152.45599365234375, -141.28244018554688, -130.10885620117188, -118.93525695800781, -107.76166534423828, -96.58807373046875, -85.41448211669922, -74.24089050292969, -63.067298889160156, -51.893707275390625, -40.720115661621094, -29.546524047851562, -18.37293243408203, -7.1993408203125, 3.9742507934570312, 15.147842407226562, 26.321434020996094, 37.495025634765625, 48.668617248535156, 59.84220886230469, 71.01580047607422, 82.18939208984375, 93.36298370361328, 104.53657531738281, 115.71016693115234, 126.88375854492188, 138.05734252929688, 149.23094177246094, 160.404541015625, 171.578125, 182.751708984375, 193.92530822753906, 205.09890747070312, 216.27249145507812]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 7.0, 11.0, 8.0, 10.0, 13.0, 15.0, 17.0, 20.0, 25.0, 34.0, 26.0, 30.0, 41.0, 43.0, 44.0, 39.0, 49.0, 46.0, 35.0, 47.0, 42.0, 45.0, 32.0, 29.0, 30.0, 40.0, 33.0, 23.0, 29.0, 18.0, 14.0, 23.0, 18.0, 16.0, 14.0, 8.0, 7.0, 4.0, 4.0, 5.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-216.22706604003906, -209.43746948242188, -202.6478729248047, -195.8582763671875, -189.06869506835938, -182.2790985107422, -175.489501953125, -168.6999053955078, -161.91030883789062, -155.12071228027344, -148.33111572265625, -141.54153442382812, -134.75193786621094, -127.96234130859375, -121.17274475097656, -114.38314819335938, -107.59355926513672, -100.80396270751953, -94.01437377929688, -87.22477722167969, -80.4351806640625, -73.64558410644531, -66.85599517822266, -60.06639862060547, -53.27680587768555, -46.487213134765625, -39.69761657714844, -32.908023834228516, -26.11842918395996, -19.328834533691406, -12.539241790771484, -5.749645233154297, 1.039947509765625, 7.8295416831970215, 14.619135856628418, 21.408729553222656, 28.19832420349121, 34.987918853759766, 41.77751159667969, 48.567108154296875, 55.3567008972168, 62.14629364013672, 68.9358901977539, 75.72547912597656, 82.51507568359375, 89.30467224121094, 96.09426879882812, 102.88386535644531, 109.67345428466797, 116.46305084228516, 123.25263977050781, 130.042236328125, 136.8318328857422, 143.62142944335938, 150.4110107421875, 157.20062255859375, 163.99020385742188, 170.77980041503906, 177.56939697265625, 184.35897827148438, 191.14857482910156, 197.93817138671875, 204.72776794433594, 211.51736450195312, 218.3069610595703]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 5.0, 11.0, 6.0, 7.0, 9.0, 16.0, 18.0, 19.0, 16.0, 17.0, 21.0, 28.0, 38.0, 35.0, 37.0, 42.0, 60.0, 48.0, 43.0, 53.0, 45.0, 46.0, 56.0, 40.0, 35.0, 45.0, 33.0, 31.0, 16.0, 25.0, 22.0, 22.0, 6.0, 12.0, 7.0, 10.0, 5.0, 4.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-23.375, -22.692626953125, -22.01025390625, -21.327880859375, -20.6455078125, -19.963134765625, -19.28076171875, -18.598388671875, -17.916015625, -17.233642578125, -16.55126953125, -15.868896484375, -15.1865234375, -14.504150390625, -13.82177734375, -13.139404296875, -12.45703125, -11.774658203125, -11.09228515625, -10.409912109375, -9.7275390625, -9.045166015625, -8.36279296875, -7.680419921875, -6.998046875, -6.315673828125, -5.63330078125, -4.950927734375, -4.2685546875, -3.586181640625, -2.90380859375, -2.221435546875, -1.5390625, -0.856689453125, -0.17431640625, 0.508056640625, 1.1904296875, 1.872802734375, 2.55517578125, 3.237548828125, 3.919921875, 4.602294921875, 5.28466796875, 5.967041015625, 6.6494140625, 7.331787109375, 8.01416015625, 8.696533203125, 9.37890625, 10.061279296875, 10.74365234375, 11.426025390625, 12.1083984375, 12.790771484375, 13.47314453125, 14.155517578125, 14.837890625, 15.520263671875, 16.20263671875, 16.885009765625, 17.5673828125, 18.249755859375, 18.93212890625, 19.614501953125, 20.296875]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 8.0, 10.0, 11.0, 18.0, 25.0, 38.0, 58.0, 81.0, 88.0, 173.0, 262.0, 345.0, 573.0, 872.0, 1305.0, 2124.0, 3373.0, 5435.0, 9796.0, 17769.0, 44683.0, 631207.0, 3268150.0, 148280.0, 27810.0, 13367.0, 7246.0, 4211.0, 2545.0, 1568.0, 986.0, 613.0, 434.0, 256.0, 177.0, 125.0, 67.0, 63.0, 45.0, 24.0, 21.0, 14.0, 13.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-65.25, -63.28857421875, -61.3271484375, -59.36572265625, -57.404296875, -55.44287109375, -53.4814453125, -51.52001953125, -49.55859375, -47.59716796875, -45.6357421875, -43.67431640625, -41.712890625, -39.75146484375, -37.7900390625, -35.82861328125, -33.8671875, -31.90576171875, -29.9443359375, -27.98291015625, -26.021484375, -24.06005859375, -22.0986328125, -20.13720703125, -18.17578125, -16.21435546875, -14.2529296875, -12.29150390625, -10.330078125, -8.36865234375, -6.4072265625, -4.44580078125, -2.484375, -0.52294921875, 1.4384765625, 3.39990234375, 5.361328125, 7.32275390625, 9.2841796875, 11.24560546875, 13.20703125, 15.16845703125, 17.1298828125, 19.09130859375, 21.052734375, 23.01416015625, 24.9755859375, 26.93701171875, 28.8984375, 30.85986328125, 32.8212890625, 34.78271484375, 36.744140625, 38.70556640625, 40.6669921875, 42.62841796875, 44.58984375, 46.55126953125, 48.5126953125, 50.47412109375, 52.435546875, 54.39697265625, 56.3583984375, 58.31982421875, 60.28125]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 5.0, 5.0, 9.0, 8.0, 7.0, 10.0, 16.0, 17.0, 34.0, 52.0, 54.0, 79.0, 178.0, 738.0, 1675.0, 727.0, 203.0, 76.0, 59.0, 33.0, 22.0, 20.0, 19.0, 8.0, 5.0, 7.0, 3.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-79.125, -76.13671875, -73.1484375, -70.16015625, -67.171875, -64.18359375, -61.1953125, -58.20703125, -55.21875, -52.23046875, -49.2421875, -46.25390625, -43.265625, -40.27734375, -37.2890625, -34.30078125, -31.3125, -28.32421875, -25.3359375, -22.34765625, -19.359375, -16.37109375, -13.3828125, -10.39453125, -7.40625, -4.41796875, -1.4296875, 1.55859375, 4.546875, 7.53515625, 10.5234375, 13.51171875, 16.5, 19.48828125, 22.4765625, 25.46484375, 28.453125, 31.44140625, 34.4296875, 37.41796875, 40.40625, 43.39453125, 46.3828125, 49.37109375, 52.359375, 55.34765625, 58.3359375, 61.32421875, 64.3125, 67.30078125, 70.2890625, 73.27734375, 76.265625, 79.25390625, 82.2421875, 85.23046875, 88.21875, 91.20703125, 94.1953125, 97.18359375, 100.171875, 103.16015625, 106.1484375, 109.13671875, 112.125]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 7.0, 7.0, 10.0, 17.0, 24.0, 33.0, 66.0, 96.0, 148.0, 257.0, 503.0, 917.0, 1734.0, 3686.0, 8205.0, 21613.0, 76096.0, 3030056.0, 959128.0, 59923.0, 18013.0, 7128.0, 3226.0, 1504.0, 838.0, 432.0, 235.0, 146.0, 77.0, 50.0, 40.0, 21.0, 15.0, 10.0, 14.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-144.125, -139.8759765625, -135.626953125, -131.3779296875, -127.12890625, -122.8798828125, -118.630859375, -114.3818359375, -110.1328125, -105.8837890625, -101.634765625, -97.3857421875, -93.13671875, -88.8876953125, -84.638671875, -80.3896484375, -76.140625, -71.8916015625, -67.642578125, -63.3935546875, -59.14453125, -54.8955078125, -50.646484375, -46.3974609375, -42.1484375, -37.8994140625, -33.650390625, -29.4013671875, -25.15234375, -20.9033203125, -16.654296875, -12.4052734375, -8.15625, -3.9072265625, 0.341796875, 4.5908203125, 8.83984375, 13.0888671875, 17.337890625, 21.5869140625, 25.8359375, 30.0849609375, 34.333984375, 38.5830078125, 42.83203125, 47.0810546875, 51.330078125, 55.5791015625, 59.828125, 64.0771484375, 68.326171875, 72.5751953125, 76.82421875, 81.0732421875, 85.322265625, 89.5712890625, 93.8203125, 98.0693359375, 102.318359375, 106.5673828125, 110.81640625, 115.0654296875, 119.314453125, 123.5634765625, 127.8125]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 16.0, 12.0, 32.0, 64.0, 169.0, 423.0, 174.0, 57.0, 31.0, 11.0, 8.0, 5.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-641.5611572265625, -619.0591430664062, -596.5571899414062, -574.05517578125, -551.55322265625, -529.0512084960938, -506.5492248535156, -484.0472412109375, -461.5452575683594, -439.04327392578125, -416.5412902832031, -394.039306640625, -371.53729248046875, -349.03533935546875, -326.5333251953125, -304.0313415527344, -281.52935791015625, -259.0273742675781, -236.525390625, -214.0233917236328, -191.5214080810547, -169.01942443847656, -146.51742553710938, -124.01544189453125, -101.51345825195312, -79.011474609375, -56.509483337402344, -34.00749206542969, -11.505508422851562, 10.996475219726562, 33.49847412109375, 56.000457763671875, 78.50238037109375, 101.00436401367188, 123.50635528564453, 146.0083465576172, 168.5103302001953, 191.01231384277344, 213.51431274414062, 236.01629638671875, 258.5182800292969, 281.020263671875, 303.5222473144531, 326.02423095703125, 348.5262451171875, 371.0281982421875, 393.53021240234375, 416.0321960449219, 438.5341796875, 461.0361633300781, 483.53814697265625, 506.0401611328125, 528.5421142578125, 551.0441284179688, 573.546142578125, 596.048095703125, 618.550048828125, 641.0520629882812, 663.5540161132812, 686.0560302734375, 708.5579833984375, 731.0599975585938, 753.56201171875, 776.06396484375, 798.5659790039062]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 1.0, 6.0, 4.0, 9.0, 10.0, 11.0, 11.0, 15.0, 23.0, 31.0, 26.0, 27.0, 33.0, 33.0, 38.0, 53.0, 44.0, 51.0, 48.0, 32.0, 59.0, 48.0, 44.0, 36.0, 31.0, 41.0, 34.0, 22.0, 29.0, 25.0, 24.0, 17.0, 11.0, 15.0, 15.0, 12.0, 9.0, 8.0, 5.0, 3.0, 4.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-183.6816864013672, -177.49147033691406, -171.30123901367188, -165.11102294921875, -158.92079162597656, -152.73057556152344, -146.54034423828125, -140.35012817382812, -134.159912109375, -127.96968841552734, -121.77946472167969, -115.58924865722656, -109.39901733398438, -103.20880126953125, -97.0185775756836, -90.82835388183594, -84.63812255859375, -78.4478988647461, -72.25767517089844, -66.06745910644531, -59.87723159790039, -53.687007904052734, -47.496788024902344, -41.30656433105469, -35.11634063720703, -28.926116943359375, -22.73589515686035, -16.545673370361328, -10.355449676513672, -4.165225982666016, 2.024993896484375, 8.215217590332031, 14.40545654296875, 20.595680236816406, 26.78590202331543, 32.97612380981445, 39.16634750366211, 45.356571197509766, 51.546791076660156, 57.73701477050781, 63.92723846435547, 70.11746215820312, 76.30768585205078, 82.49790954589844, 88.68812561035156, 94.87835693359375, 101.06857299804688, 107.25879669189453, 113.44902038574219, 119.63924407958984, 125.8294677734375, 132.01968383789062, 138.2099151611328, 144.40013122558594, 150.59036254882812, 156.78057861328125, 162.97079467773438, 169.1610107421875, 175.3512420654297, 181.5414581298828, 187.731689453125, 193.92190551757812, 200.11212158203125, 206.30235290527344, 212.49258422851562]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 5.0, 3.0, 6.0, 7.0, 9.0, 10.0, 13.0, 14.0, 21.0, 21.0, 17.0, 26.0, 24.0, 31.0, 33.0, 25.0, 39.0, 43.0, 50.0, 54.0, 49.0, 46.0, 57.0, 40.0, 40.0, 35.0, 36.0, 28.0, 32.0, 37.0, 27.0, 19.0, 20.0, 22.0, 15.0, 10.0, 12.0, 7.0, 6.0, 5.0, 5.0, 0.0, 5.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.796875, -21.135498046875, -20.47412109375, -19.812744140625, -19.1513671875, -18.489990234375, -17.82861328125, -17.167236328125, -16.505859375, -15.844482421875, -15.18310546875, -14.521728515625, -13.8603515625, -13.198974609375, -12.53759765625, -11.876220703125, -11.21484375, -10.553466796875, -9.89208984375, -9.230712890625, -8.5693359375, -7.907958984375, -7.24658203125, -6.585205078125, -5.923828125, -5.262451171875, -4.60107421875, -3.939697265625, -3.2783203125, -2.616943359375, -1.95556640625, -1.294189453125, -0.6328125, 0.028564453125, 0.68994140625, 1.351318359375, 2.0126953125, 2.674072265625, 3.33544921875, 3.996826171875, 4.658203125, 5.319580078125, 5.98095703125, 6.642333984375, 7.3037109375, 7.965087890625, 8.62646484375, 9.287841796875, 9.94921875, 10.610595703125, 11.27197265625, 11.933349609375, 12.5947265625, 13.256103515625, 13.91748046875, 14.578857421875, 15.240234375, 15.901611328125, 16.56298828125, 17.224365234375, 17.8857421875, 18.547119140625, 19.20849609375, 19.869873046875, 20.53125]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 7.0, 7.0, 10.0, 26.0, 20.0, 49.0, 57.0, 91.0, 119.0, 181.0, 258.0, 480.0, 617.0, 962.0, 1647.0, 2613.0, 4071.0, 6841.0, 11517.0, 19838.0, 35394.0, 66014.0, 135851.0, 282736.0, 239671.0, 111181.0, 55066.0, 29999.0, 17178.0, 10171.0, 6061.0, 3686.0, 2187.0, 1416.0, 869.0, 559.0, 355.0, 250.0, 167.0, 108.0, 63.0, 53.0, 28.0, 27.0, 21.0, 14.0, 8.0, 5.0, 5.0, 5.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0498046875, -1.0157928466796875, -0.981781005859375, -0.9477691650390625, -0.91375732421875, -0.8797454833984375, -0.845733642578125, -0.8117218017578125, -0.7777099609375, -0.7436981201171875, -0.709686279296875, -0.6756744384765625, -0.64166259765625, -0.6076507568359375, -0.573638916015625, -0.5396270751953125, -0.505615234375, -0.4716033935546875, -0.437591552734375, -0.4035797119140625, -0.36956787109375, -0.3355560302734375, -0.301544189453125, -0.2675323486328125, -0.2335205078125, -0.1995086669921875, -0.165496826171875, -0.1314849853515625, -0.09747314453125, -0.0634613037109375, -0.029449462890625, 0.0045623779296875, 0.03857421875, 0.0725860595703125, 0.106597900390625, 0.1406097412109375, 0.17462158203125, 0.2086334228515625, 0.242645263671875, 0.2766571044921875, 0.3106689453125, 0.3446807861328125, 0.378692626953125, 0.4127044677734375, 0.44671630859375, 0.4807281494140625, 0.514739990234375, 0.5487518310546875, 0.582763671875, 0.6167755126953125, 0.650787353515625, 0.6847991943359375, 0.71881103515625, 0.7528228759765625, 0.786834716796875, 0.8208465576171875, 0.8548583984375, 0.8888702392578125, 0.922882080078125, 0.9568939208984375, 0.99090576171875, 1.0249176025390625, 1.058929443359375, 1.0929412841796875, 1.126953125]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 9.0, 8.0, 6.0, 7.0, 6.0, 12.0, 14.0, 16.0, 19.0, 17.0, 18.0, 21.0, 30.0, 26.0, 25.0, 20.0, 31.0, 37.0, 39.0, 31.0, 37.0, 30.0, 1064.0, 41.0, 50.0, 38.0, 30.0, 29.0, 35.0, 33.0, 32.0, 22.0, 26.0, 22.0, 14.0, 25.0, 16.0, 7.0, 10.0, 15.0, 15.0, 10.0, 11.0, 6.0, 3.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-11.7734375, -11.4246826171875, -11.075927734375, -10.7271728515625, -10.37841796875, -10.0296630859375, -9.680908203125, -9.3321533203125, -8.9833984375, -8.6346435546875, -8.285888671875, -7.9371337890625, -7.58837890625, -7.2396240234375, -6.890869140625, -6.5421142578125, -6.193359375, -5.8446044921875, -5.495849609375, -5.1470947265625, -4.79833984375, -4.4495849609375, -4.100830078125, -3.7520751953125, -3.4033203125, -3.0545654296875, -2.705810546875, -2.3570556640625, -2.00830078125, -1.6595458984375, -1.310791015625, -0.9620361328125, -0.61328125, -0.2645263671875, 0.084228515625, 0.4329833984375, 0.78173828125, 1.1304931640625, 1.479248046875, 1.8280029296875, 2.1767578125, 2.5255126953125, 2.874267578125, 3.2230224609375, 3.57177734375, 3.9205322265625, 4.269287109375, 4.6180419921875, 4.966796875, 5.3155517578125, 5.664306640625, 6.0130615234375, 6.36181640625, 6.7105712890625, 7.059326171875, 7.4080810546875, 7.7568359375, 8.1055908203125, 8.454345703125, 8.8031005859375, 9.15185546875, 9.5006103515625, 9.849365234375, 10.1981201171875, 10.546875]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 2.0, 11.0, 12.0, 18.0, 34.0, 46.0, 71.0, 96.0, 159.0, 237.0, 345.0, 458.0, 682.0, 935.0, 1321.0, 1913.0, 2570.0, 3538.0, 4901.0, 6741.0, 9337.0, 13102.0, 18382.0, 26788.0, 39120.0, 59116.0, 95894.0, 163946.0, 1255091.0, 139907.0, 82531.0, 52285.0, 34842.0, 23898.0, 16568.0, 11854.0, 8465.0, 6123.0, 4459.0, 3295.0, 2323.0, 1693.0, 1230.0, 859.0, 626.0, 424.0, 285.0, 207.0, 147.0, 90.0, 54.0, 45.0, 28.0, 12.0, 10.0, 7.0, 5.0, 3.0, 2.0, 2.0, 2.0], "bins": [-0.6611328125, -0.640045166015625, -0.61895751953125, -0.597869873046875, -0.5767822265625, -0.555694580078125, -0.53460693359375, -0.513519287109375, -0.492431640625, -0.471343994140625, -0.45025634765625, -0.429168701171875, -0.4080810546875, -0.386993408203125, -0.36590576171875, -0.344818115234375, -0.32373046875, -0.302642822265625, -0.28155517578125, -0.260467529296875, -0.2393798828125, -0.218292236328125, -0.19720458984375, -0.176116943359375, -0.155029296875, -0.133941650390625, -0.11285400390625, -0.091766357421875, -0.0706787109375, -0.049591064453125, -0.02850341796875, -0.007415771484375, 0.013671875, 0.034759521484375, 0.05584716796875, 0.076934814453125, 0.0980224609375, 0.119110107421875, 0.14019775390625, 0.161285400390625, 0.182373046875, 0.203460693359375, 0.22454833984375, 0.245635986328125, 0.2667236328125, 0.287811279296875, 0.30889892578125, 0.329986572265625, 0.35107421875, 0.372161865234375, 0.39324951171875, 0.414337158203125, 0.4354248046875, 0.456512451171875, 0.47760009765625, 0.498687744140625, 0.519775390625, 0.540863037109375, 0.56195068359375, 0.583038330078125, 0.6041259765625, 0.625213623046875, 0.64630126953125, 0.667388916015625, 0.6884765625]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 4.0, 3.0, 3.0, 2.0, 4.0, 7.0, 7.0, 11.0, 11.0, 11.0, 7.0, 19.0, 25.0, 25.0, 17.0, 33.0, 18.0, 30.0, 38.0, 38.0, 45.0, 34.0, 39.0, 54.0, 46.0, 53.0, 34.0, 37.0, 31.0, 49.0, 42.0, 25.0, 31.0, 24.0, 28.0, 20.0, 24.0, 13.0, 9.0, 7.0, 8.0, 8.0, 6.0, 3.0, 4.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.002750396728515625, -0.002663552761077881, -0.0025767087936401367, -0.0024898648262023926, -0.0024030208587646484, -0.0023161768913269043, -0.00222933292388916, -0.002142488956451416, -0.002055644989013672, -0.0019688010215759277, -0.0018819570541381836, -0.0017951130867004395, -0.0017082691192626953, -0.0016214251518249512, -0.001534581184387207, -0.0014477372169494629, -0.0013608932495117188, -0.0012740492820739746, -0.0011872053146362305, -0.0011003613471984863, -0.0010135173797607422, -0.000926673412322998, -0.0008398294448852539, -0.0007529854774475098, -0.0006661415100097656, -0.0005792975425720215, -0.0004924535751342773, -0.0004056096076965332, -0.00031876564025878906, -0.00023192167282104492, -0.00014507770538330078, -5.823373794555664e-05, 2.86102294921875e-05, 0.00011545419692993164, 0.00020229816436767578, 0.0002891421318054199, 0.00037598609924316406, 0.0004628300666809082, 0.0005496740341186523, 0.0006365180015563965, 0.0007233619689941406, 0.0008102059364318848, 0.0008970499038696289, 0.000983893871307373, 0.0010707378387451172, 0.0011575818061828613, 0.0012444257736206055, 0.0013312697410583496, 0.0014181137084960938, 0.0015049576759338379, 0.001591801643371582, 0.0016786456108093262, 0.0017654895782470703, 0.0018523335456848145, 0.0019391775131225586, 0.0020260214805603027, 0.002112865447998047, 0.002199709415435791, 0.002286553382873535, 0.0023733973503112793, 0.0024602413177490234, 0.0025470852851867676, 0.0026339292526245117, 0.002720773220062256, 0.0028076171875]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 5.0, 3.0, 6.0, 12.0, 9.0, 16.0, 17.0, 25.0, 23.0, 44.0, 54.0, 53.0, 62.0, 85.0, 124.0, 204.0, 310.0, 518.0, 2552.0, 27832.0, 666074.0, 331560.0, 15730.0, 1837.0, 481.0, 257.0, 169.0, 114.0, 75.0, 64.0, 49.0, 42.0, 35.0, 23.0, 18.0, 15.0, 16.0, 7.0, 10.0, 3.0, 4.0, 4.0, 4.0, 5.0, 2.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.051849365234375, -0.05027294158935547, -0.04869651794433594, -0.047120094299316406, -0.045543670654296875, -0.043967247009277344, -0.04239082336425781, -0.04081439971923828, -0.03923797607421875, -0.03766155242919922, -0.03608512878417969, -0.034508705139160156, -0.032932281494140625, -0.031355857849121094, -0.029779434204101562, -0.02820301055908203, -0.0266265869140625, -0.02505016326904297, -0.023473739624023438, -0.021897315979003906, -0.020320892333984375, -0.018744468688964844, -0.017168045043945312, -0.015591621398925781, -0.01401519775390625, -0.012438774108886719, -0.010862350463867188, -0.009285926818847656, -0.007709503173828125, -0.006133079528808594, -0.0045566558837890625, -0.0029802322387695312, -0.00140380859375, 0.00017261505126953125, 0.0017490386962890625, 0.0033254623413085938, 0.004901885986328125, 0.006478309631347656, 0.008054733276367188, 0.009631156921386719, 0.01120758056640625, 0.012784004211425781, 0.014360427856445312, 0.015936851501464844, 0.017513275146484375, 0.019089698791503906, 0.020666122436523438, 0.02224254608154297, 0.0238189697265625, 0.02539539337158203, 0.026971817016601562, 0.028548240661621094, 0.030124664306640625, 0.031701087951660156, 0.03327751159667969, 0.03485393524169922, 0.03643035888671875, 0.03800678253173828, 0.03958320617675781, 0.041159629821777344, 0.042736053466796875, 0.044312477111816406, 0.04588890075683594, 0.04746532440185547, 0.049041748046875]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 16.0, 30.0, 98.0, 250.0, 306.0, 156.0, 65.0, 35.0, 24.0, 13.0, 9.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.004133736249059439, -0.0037919438909739256, -0.003450151300057769, -0.0031083589419722557, -0.002766566351056099, -0.002424773992970586, -0.0020829816348850727, -0.001741189043968916, -0.0013993966858834028, -0.0010576042113825679, -0.0007158117950893939, -0.0003740193787962198, -3.2226904295384884e-05, 0.00030956557020545006, 0.0006513579282909632, 0.00099315051920712, 0.001334942877292633, 0.001676735351793468, 0.002018527826294303, 0.002360320184379816, 0.002702112775295973, 0.003043905133381486, 0.003385697491466999, 0.003727490082383156, 0.004069282673299313, 0.004411075264215469, 0.004752867389470339, 0.005094659980386496, 0.005436452571302652, 0.005778244696557522, 0.006120037287473679, 0.006461829878389835, 0.0068036215379834175, 0.007145414128899574, 0.007487206254154444, 0.007828999310731888, 0.00817079097032547, 0.008512583561241627, 0.008854376152157784, 0.00919616874307394, 0.009537961333990097, 0.009879753924906254, 0.01022154651582241, 0.010563338175415993, 0.01090513076633215, 0.011246923357248306, 0.011588715948164463, 0.01193050853908062, 0.012272300198674202, 0.012614092789590359, 0.012955885380506516, 0.013297677040100098, 0.013639469631016254, 0.013981262221932411, 0.014323054812848568, 0.014664847403764725, 0.015006639994680882, 0.015348432585597038, 0.01569022424519062, 0.016032017767429352, 0.016373809427022934, 0.016715602949261665, 0.017057394608855247, 0.01739918813109398, 0.01774097979068756]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 7.0, 2.0, 3.0, 4.0, 9.0, 9.0, 13.0, 12.0, 13.0, 11.0, 16.0, 26.0, 27.0, 22.0, 31.0, 27.0, 38.0, 46.0, 52.0, 43.0, 51.0, 41.0, 48.0, 41.0, 41.0, 46.0, 36.0, 34.0, 36.0, 33.0, 29.0, 23.0, 27.0, 18.0, 27.0, 14.0, 16.0, 7.0, 11.0, 8.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.002096116542816162, -0.0020323926582932472, -0.0019686687737703323, -0.0019049448892474174, -0.0018412210047245026, -0.0017774971202015877, -0.0017137732356786728, -0.001650049351155758, -0.001586325466632843, -0.0015226015821099281, -0.0014588776975870132, -0.0013951538130640984, -0.0013314299285411835, -0.0012677060440182686, -0.0012039821594953537, -0.0011402582749724388, -0.001076534390449524, -0.001012810505926609, -0.0009490866214036942, -0.0008853627368807793, -0.0008216388523578644, -0.0007579149678349495, -0.0006941910833120346, -0.0006304671987891197, -0.0005667433142662048, -0.00050301942974329, -0.00043929554522037506, -0.0003755716606974602, -0.0003118477761745453, -0.0002481238916516304, -0.00018440000712871552, -0.00012067612260580063, -5.695223808288574e-05, 6.771646440029144e-06, 7.049553096294403e-05, 0.00013421941548585892, 0.0001979433000087738, 0.0002616671845316887, 0.0003253910690546036, 0.00038911495357751846, 0.00045283883810043335, 0.0005165627226233482, 0.0005802866071462631, 0.000644010491669178, 0.0007077343761920929, 0.0007714582607150078, 0.0008351821452379227, 0.0008989060297608376, 0.0009626299142837524, 0.0010263537988066673, 0.0010900776833295822, 0.001153801567852497, 0.001217525452375412, 0.0012812493368983269, 0.0013449732214212418, 0.0014086971059441566, 0.0014724209904670715, 0.0015361448749899864, 0.0015998687595129013, 0.0016635926440358162, 0.001727316528558731, 0.001791040413081646, 0.0018547642976045609, 0.0019184881821274757, 0.0019822120666503906]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 5.0, 3.0, 6.0, 7.0, 9.0, 10.0, 13.0, 14.0, 21.0, 21.0, 17.0, 26.0, 24.0, 31.0, 33.0, 25.0, 39.0, 43.0, 50.0, 54.0, 49.0, 46.0, 57.0, 40.0, 40.0, 35.0, 36.0, 28.0, 32.0, 37.0, 27.0, 19.0, 20.0, 22.0, 15.0, 10.0, 12.0, 7.0, 6.0, 5.0, 5.0, 0.0, 5.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.796875, -21.135498046875, -20.47412109375, -19.812744140625, -19.1513671875, -18.489990234375, -17.82861328125, -17.167236328125, -16.505859375, -15.844482421875, -15.18310546875, -14.521728515625, -13.8603515625, -13.198974609375, -12.53759765625, -11.876220703125, -11.21484375, -10.553466796875, -9.89208984375, -9.230712890625, -8.5693359375, -7.907958984375, -7.24658203125, -6.585205078125, -5.923828125, -5.262451171875, -4.60107421875, -3.939697265625, -3.2783203125, -2.616943359375, -1.95556640625, -1.294189453125, -0.6328125, 0.028564453125, 0.68994140625, 1.351318359375, 2.0126953125, 2.674072265625, 3.33544921875, 3.996826171875, 4.658203125, 5.319580078125, 5.98095703125, 6.642333984375, 7.3037109375, 7.965087890625, 8.62646484375, 9.287841796875, 9.94921875, 10.610595703125, 11.27197265625, 11.933349609375, 12.5947265625, 13.256103515625, 13.91748046875, 14.578857421875, 15.240234375, 15.901611328125, 16.56298828125, 17.224365234375, 17.8857421875, 18.547119140625, 19.20849609375, 19.869873046875, 20.53125]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 4.0, 2.0, 4.0, 3.0, 7.0, 7.0, 16.0, 11.0, 25.0, 23.0, 31.0, 47.0, 82.0, 87.0, 142.0, 228.0, 335.0, 538.0, 849.0, 1608.0, 3469.0, 9822.0, 48825.0, 878050.0, 83218.0, 12436.0, 4148.0, 1870.0, 970.0, 594.0, 353.0, 231.0, 152.0, 104.0, 70.0, 54.0, 43.0, 29.0, 20.0, 14.0, 13.0, 11.0, 3.0, 5.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-46.5625, -45.0888671875, -43.615234375, -42.1416015625, -40.66796875, -39.1943359375, -37.720703125, -36.2470703125, -34.7734375, -33.2998046875, -31.826171875, -30.3525390625, -28.87890625, -27.4052734375, -25.931640625, -24.4580078125, -22.984375, -21.5107421875, -20.037109375, -18.5634765625, -17.08984375, -15.6162109375, -14.142578125, -12.6689453125, -11.1953125, -9.7216796875, -8.248046875, -6.7744140625, -5.30078125, -3.8271484375, -2.353515625, -0.8798828125, 0.59375, 2.0673828125, 3.541015625, 5.0146484375, 6.48828125, 7.9619140625, 9.435546875, 10.9091796875, 12.3828125, 13.8564453125, 15.330078125, 16.8037109375, 18.27734375, 19.7509765625, 21.224609375, 22.6982421875, 24.171875, 25.6455078125, 27.119140625, 28.5927734375, 30.06640625, 31.5400390625, 33.013671875, 34.4873046875, 35.9609375, 37.4345703125, 38.908203125, 40.3818359375, 41.85546875, 43.3291015625, 44.802734375, 46.2763671875, 47.75]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 6.0, 5.0, 7.0, 10.0, 9.0, 15.0, 17.0, 19.0, 15.0, 22.0, 26.0, 43.0, 19.0, 36.0, 37.0, 48.0, 56.0, 57.0, 76.0, 130.0, 1775.0, 119.0, 62.0, 56.0, 38.0, 53.0, 43.0, 35.0, 30.0, 29.0, 25.0, 16.0, 27.0, 14.0, 12.0, 11.0, 16.0, 8.0, 6.0, 4.0, 3.0, 4.0, 2.0, 2.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-62.3125, -60.2685546875, -58.224609375, -56.1806640625, -54.13671875, -52.0927734375, -50.048828125, -48.0048828125, -45.9609375, -43.9169921875, -41.873046875, -39.8291015625, -37.78515625, -35.7412109375, -33.697265625, -31.6533203125, -29.609375, -27.5654296875, -25.521484375, -23.4775390625, -21.43359375, -19.3896484375, -17.345703125, -15.3017578125, -13.2578125, -11.2138671875, -9.169921875, -7.1259765625, -5.08203125, -3.0380859375, -0.994140625, 1.0498046875, 3.09375, 5.1376953125, 7.181640625, 9.2255859375, 11.26953125, 13.3134765625, 15.357421875, 17.4013671875, 19.4453125, 21.4892578125, 23.533203125, 25.5771484375, 27.62109375, 29.6650390625, 31.708984375, 33.7529296875, 35.796875, 37.8408203125, 39.884765625, 41.9287109375, 43.97265625, 46.0166015625, 48.060546875, 50.1044921875, 52.1484375, 54.1923828125, 56.236328125, 58.2802734375, 60.32421875, 62.3681640625, 64.412109375, 66.4560546875, 68.5]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 5.0, 5.0, 10.0, 11.0, 27.0, 50.0, 77.0, 137.0, 222.0, 579.0, 2422.0, 56608.0, 3074877.0, 8880.0, 1025.0, 350.0, 173.0, 96.0, 53.0, 40.0, 18.0, 20.0, 7.0, 6.0, 5.0, 4.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-355.0, -346.79296875, -338.5859375, -330.37890625, -322.171875, -313.96484375, -305.7578125, -297.55078125, -289.34375, -281.13671875, -272.9296875, -264.72265625, -256.515625, -248.30859375, -240.1015625, -231.89453125, -223.6875, -215.48046875, -207.2734375, -199.06640625, -190.859375, -182.65234375, -174.4453125, -166.23828125, -158.03125, -149.82421875, -141.6171875, -133.41015625, -125.203125, -116.99609375, -108.7890625, -100.58203125, -92.375, -84.16796875, -75.9609375, -67.75390625, -59.546875, -51.33984375, -43.1328125, -34.92578125, -26.71875, -18.51171875, -10.3046875, -2.09765625, 6.109375, 14.31640625, 22.5234375, 30.73046875, 38.9375, 47.14453125, 55.3515625, 63.55859375, 71.765625, 79.97265625, 88.1796875, 96.38671875, 104.59375, 112.80078125, 121.0078125, 129.21484375, 137.421875, 145.62890625, 153.8359375, 162.04296875, 170.25]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 37.0, 503.0, 428.0, 44.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1105.7313232421875, -1086.3189697265625, -1066.90673828125, -1047.494384765625, -1028.08203125, -1008.6697387695312, -989.2574462890625, -969.8450927734375, -950.4328002929688, -931.0205078125, -911.608154296875, -892.1958618164062, -872.7835083007812, -853.3712158203125, -833.9588623046875, -814.5465698242188, -795.13427734375, -775.7219848632812, -756.3096313476562, -736.8973388671875, -717.4849853515625, -698.0726928710938, -678.660400390625, -659.248046875, -639.835693359375, -620.4234008789062, -601.0110473632812, -581.5987548828125, -562.1864013671875, -542.7741088867188, -523.36181640625, -503.949462890625, -484.5372314453125, -465.1249084472656, -445.71258544921875, -426.30029296875, -406.8879699707031, -387.47564697265625, -368.0633239746094, -348.6510009765625, -329.2386779785156, -309.82635498046875, -290.4140319824219, -271.001708984375, -251.58941650390625, -232.17709350585938, -212.7647705078125, -193.3524627685547, -173.9401397705078, -154.52781677246094, -135.11550903320312, -115.70318603515625, -96.2908706665039, -76.87855529785156, -57.46623229980469, -38.053924560546875, -18.6416015625, 0.7707157135009766, 20.183032989501953, 39.59535217285156, 59.007667541503906, 78.41998291015625, 97.83230590820312, 117.24461364746094, 136.6569366455078]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 8.0, 13.0, 5.0, 9.0, 15.0, 14.0, 26.0, 23.0, 25.0, 20.0, 38.0, 29.0, 29.0, 31.0, 30.0, 39.0, 48.0, 56.0, 50.0, 47.0, 43.0, 50.0, 44.0, 42.0, 44.0, 29.0, 41.0, 26.0, 23.0, 14.0, 22.0, 20.0, 13.0, 6.0, 9.0, 5.0, 3.0, 8.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-239.0789794921875, -232.3161163330078, -225.5532684326172, -218.7904052734375, -212.0275421142578, -205.26467895507812, -198.5018310546875, -191.7389678955078, -184.97610473632812, -178.21324157714844, -171.4503936767578, -164.68753051757812, -157.92466735839844, -151.16180419921875, -144.39895629882812, -137.63609313964844, -130.8732452392578, -124.11038970947266, -117.34752655029297, -110.58467102050781, -103.82180786132812, -97.05895233154297, -90.29609680175781, -83.53323364257812, -76.77037811279297, -70.00752258300781, -63.244659423828125, -56.48180389404297, -49.71894454956055, -42.956085205078125, -36.19322967529297, -29.430370330810547, -22.667510986328125, -15.90465259552002, -9.141794204711914, -2.378936767578125, 4.383922576904297, 11.146781921386719, 17.909637451171875, 24.672496795654297, 31.43535614013672, 38.19821548461914, 44.96107482910156, 51.72393035888672, 58.48678970336914, 65.24964904785156, 72.01250457763672, 78.77536010742188, 85.53822326660156, 92.30107879638672, 99.0639419555664, 105.82679748535156, 112.58966064453125, 119.3525161743164, 126.11537170410156, 132.87823486328125, 139.64108276367188, 146.40394592285156, 153.1667938232422, 159.92965698242188, 166.69252014160156, 173.45538330078125, 180.21823120117188, 186.98109436035156, 193.74395751953125]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 4.0, 11.0, 8.0, 11.0, 11.0, 14.0, 21.0, 21.0, 23.0, 19.0, 25.0, 21.0, 42.0, 33.0, 26.0, 38.0, 46.0, 49.0, 41.0, 59.0, 52.0, 48.0, 42.0, 40.0, 31.0, 37.0, 42.0, 27.0, 23.0, 21.0, 17.0, 16.0, 13.0, 18.0, 14.0, 11.0, 7.0, 2.0, 6.0, 6.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-21.703125, -21.0322265625, -20.361328125, -19.6904296875, -19.01953125, -18.3486328125, -17.677734375, -17.0068359375, -16.3359375, -15.6650390625, -14.994140625, -14.3232421875, -13.65234375, -12.9814453125, -12.310546875, -11.6396484375, -10.96875, -10.2978515625, -9.626953125, -8.9560546875, -8.28515625, -7.6142578125, -6.943359375, -6.2724609375, -5.6015625, -4.9306640625, -4.259765625, -3.5888671875, -2.91796875, -2.2470703125, -1.576171875, -0.9052734375, -0.234375, 0.4365234375, 1.107421875, 1.7783203125, 2.44921875, 3.1201171875, 3.791015625, 4.4619140625, 5.1328125, 5.8037109375, 6.474609375, 7.1455078125, 7.81640625, 8.4873046875, 9.158203125, 9.8291015625, 10.5, 11.1708984375, 11.841796875, 12.5126953125, 13.18359375, 13.8544921875, 14.525390625, 15.1962890625, 15.8671875, 16.5380859375, 17.208984375, 17.8798828125, 18.55078125, 19.2216796875, 19.892578125, 20.5634765625, 21.234375]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 3.0, 8.0, 6.0, 17.0, 15.0, 14.0, 44.0, 37.0, 59.0, 83.0, 147.0, 223.0, 388.0, 651.0, 1246.0, 2424.0, 4557.0, 9792.0, 24248.0, 247275.0, 3705066.0, 159029.0, 21310.0, 8898.0, 4033.0, 2098.0, 1114.0, 567.0, 304.0, 197.0, 124.0, 116.0, 55.0, 45.0, 27.0, 12.0, 12.0, 10.0, 6.0, 11.0, 10.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-78.0625, -75.498046875, -72.93359375, -70.369140625, -67.8046875, -65.240234375, -62.67578125, -60.111328125, -57.546875, -54.982421875, -52.41796875, -49.853515625, -47.2890625, -44.724609375, -42.16015625, -39.595703125, -37.03125, -34.466796875, -31.90234375, -29.337890625, -26.7734375, -24.208984375, -21.64453125, -19.080078125, -16.515625, -13.951171875, -11.38671875, -8.822265625, -6.2578125, -3.693359375, -1.12890625, 1.435546875, 4.0, 6.564453125, 9.12890625, 11.693359375, 14.2578125, 16.822265625, 19.38671875, 21.951171875, 24.515625, 27.080078125, 29.64453125, 32.208984375, 34.7734375, 37.337890625, 39.90234375, 42.466796875, 45.03125, 47.595703125, 50.16015625, 52.724609375, 55.2890625, 57.853515625, 60.41796875, 62.982421875, 65.546875, 68.111328125, 70.67578125, 73.240234375, 75.8046875, 78.369140625, 80.93359375, 83.498046875, 86.0625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 5.0, 9.0, 9.0, 9.0, 12.0, 19.0, 39.0, 21.0, 61.0, 102.0, 355.0, 1181.0, 1507.0, 410.0, 118.0, 63.0, 36.0, 34.0, 22.0, 19.0, 12.0, 5.0, 7.0, 5.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-109.1875, -106.076171875, -102.96484375, -99.853515625, -96.7421875, -93.630859375, -90.51953125, -87.408203125, -84.296875, -81.185546875, -78.07421875, -74.962890625, -71.8515625, -68.740234375, -65.62890625, -62.517578125, -59.40625, -56.294921875, -53.18359375, -50.072265625, -46.9609375, -43.849609375, -40.73828125, -37.626953125, -34.515625, -31.404296875, -28.29296875, -25.181640625, -22.0703125, -18.958984375, -15.84765625, -12.736328125, -9.625, -6.513671875, -3.40234375, -0.291015625, 2.8203125, 5.931640625, 9.04296875, 12.154296875, 15.265625, 18.376953125, 21.48828125, 24.599609375, 27.7109375, 30.822265625, 33.93359375, 37.044921875, 40.15625, 43.267578125, 46.37890625, 49.490234375, 52.6015625, 55.712890625, 58.82421875, 61.935546875, 65.046875, 68.158203125, 71.26953125, 74.380859375, 77.4921875, 80.603515625, 83.71484375, 86.826171875, 89.9375]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 12.0, 7.0, 9.0, 15.0, 24.0, 44.0, 47.0, 72.0, 115.0, 211.0, 272.0, 505.0, 849.0, 1572.0, 2987.0, 6223.0, 14412.0, 41137.0, 242944.0, 3706924.0, 123189.0, 30585.0, 11346.0, 5069.0, 2517.0, 1345.0, 723.0, 415.0, 268.0, 140.0, 103.0, 75.0, 38.0, 34.0, 25.0, 8.0, 11.0, 7.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-126.5625, -122.76953125, -118.9765625, -115.18359375, -111.390625, -107.59765625, -103.8046875, -100.01171875, -96.21875, -92.42578125, -88.6328125, -84.83984375, -81.046875, -77.25390625, -73.4609375, -69.66796875, -65.875, -62.08203125, -58.2890625, -54.49609375, -50.703125, -46.91015625, -43.1171875, -39.32421875, -35.53125, -31.73828125, -27.9453125, -24.15234375, -20.359375, -16.56640625, -12.7734375, -8.98046875, -5.1875, -1.39453125, 2.3984375, 6.19140625, 9.984375, 13.77734375, 17.5703125, 21.36328125, 25.15625, 28.94921875, 32.7421875, 36.53515625, 40.328125, 44.12109375, 47.9140625, 51.70703125, 55.5, 59.29296875, 63.0859375, 66.87890625, 70.671875, 74.46484375, 78.2578125, 82.05078125, 85.84375, 89.63671875, 93.4296875, 97.22265625, 101.015625, 104.80859375, 108.6015625, 112.39453125, 116.1875]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 2.0, 6.0, 4.0, 16.0, 27.0, 34.0, 37.0, 69.0, 143.0, 254.0, 160.0, 100.0, 53.0, 25.0, 27.0, 13.0, 11.0, 8.0, 5.0, 10.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-385.98712158203125, -374.1722717285156, -362.357421875, -350.5425720214844, -338.72772216796875, -326.9128723144531, -315.0980224609375, -303.28314208984375, -291.46832275390625, -279.6534729003906, -267.838623046875, -256.0237731933594, -244.20892333984375, -232.39407348632812, -220.57920837402344, -208.7643585205078, -196.94949340820312, -185.1346435546875, -173.31979370117188, -161.50494384765625, -149.69009399414062, -137.875244140625, -126.06037902832031, -114.24552917480469, -102.43067932128906, -90.61582946777344, -78.80097961425781, -66.98612213134766, -55.17127227783203, -43.356422424316406, -31.54156494140625, -19.726715087890625, -7.911834716796875, 3.903017044067383, 15.71786880493164, 27.53272247314453, 39.347572326660156, 51.16242218017578, 62.97727966308594, 74.79212951660156, 86.60697937011719, 98.42182922363281, 110.23667907714844, 122.0515365600586, 133.86639404296875, 145.68124389648438, 157.49609375, 169.31094360351562, 181.12579345703125, 192.94064331054688, 204.7554931640625, 216.57034301757812, 228.38519287109375, 240.20004272460938, 252.01490783691406, 263.82977294921875, 275.64459228515625, 287.4594421386719, 299.2742919921875, 311.0891418457031, 322.90399169921875, 334.7188415527344, 346.53369140625, 358.34857177734375, 370.1634216308594]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 3.0, 3.0, 6.0, 9.0, 3.0, 7.0, 8.0, 12.0, 9.0, 14.0, 16.0, 11.0, 21.0, 15.0, 21.0, 23.0, 28.0, 24.0, 44.0, 36.0, 31.0, 38.0, 37.0, 34.0, 51.0, 37.0, 42.0, 22.0, 44.0, 38.0, 32.0, 30.0, 31.0, 25.0, 26.0, 34.0, 19.0, 16.0, 19.0, 13.0, 16.0, 14.0, 9.0, 11.0, 9.0, 4.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-156.39993286132812, -151.50070190429688, -146.6014862060547, -141.70225524902344, -136.80303955078125, -131.90380859375, -127.00457763671875, -122.10535430908203, -117.20613098144531, -112.3069076538086, -107.40768432617188, -102.50845336914062, -97.6092300415039, -92.71000671386719, -87.81077575683594, -82.91155242919922, -78.0123291015625, -73.11310577392578, -68.21388244628906, -63.31465148925781, -58.415428161621094, -53.516204833984375, -48.61697769165039, -43.717750549316406, -38.81852722167969, -33.91930389404297, -29.020076751708984, -24.120851516723633, -19.22162628173828, -14.32240104675293, -9.423175811767578, -4.523948669433594, 0.3752593994140625, 5.274484634399414, 10.173709869384766, 15.072935104370117, 19.97216033935547, 24.87138557434082, 29.770610809326172, 34.669837951660156, 39.569061279296875, 44.468284606933594, 49.36751174926758, 54.26673889160156, 59.16596221923828, 64.065185546875, 68.96441650390625, 73.86363983154297, 78.76286315917969, 83.6620864868164, 88.56130981445312, 93.46054077148438, 98.3597640991211, 103.25898742675781, 108.15821838378906, 113.05744171142578, 117.9566650390625, 122.85588836669922, 127.75511169433594, 132.6543426513672, 137.55355834960938, 142.45278930664062, 147.35202026367188, 152.25125122070312, 157.1504669189453]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 6.0, 13.0, 9.0, 11.0, 8.0, 15.0, 16.0, 24.0, 21.0, 24.0, 27.0, 36.0, 29.0, 29.0, 36.0, 34.0, 44.0, 41.0, 52.0, 45.0, 48.0, 51.0, 38.0, 42.0, 39.0, 37.0, 33.0, 35.0, 32.0, 22.0, 16.0, 15.0, 11.0, 10.0, 14.0, 8.0, 10.0, 4.0, 3.0, 5.0, 4.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-22.640625, -21.959716796875, -21.27880859375, -20.597900390625, -19.9169921875, -19.236083984375, -18.55517578125, -17.874267578125, -17.193359375, -16.512451171875, -15.83154296875, -15.150634765625, -14.4697265625, -13.788818359375, -13.10791015625, -12.427001953125, -11.74609375, -11.065185546875, -10.38427734375, -9.703369140625, -9.0224609375, -8.341552734375, -7.66064453125, -6.979736328125, -6.298828125, -5.617919921875, -4.93701171875, -4.256103515625, -3.5751953125, -2.894287109375, -2.21337890625, -1.532470703125, -0.8515625, -0.170654296875, 0.51025390625, 1.191162109375, 1.8720703125, 2.552978515625, 3.23388671875, 3.914794921875, 4.595703125, 5.276611328125, 5.95751953125, 6.638427734375, 7.3193359375, 8.000244140625, 8.68115234375, 9.362060546875, 10.04296875, 10.723876953125, 11.40478515625, 12.085693359375, 12.7666015625, 13.447509765625, 14.12841796875, 14.809326171875, 15.490234375, 16.171142578125, 16.85205078125, 17.532958984375, 18.2138671875, 18.894775390625, 19.57568359375, 20.256591796875, 20.9375]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 3.0, 3.0, 5.0, 6.0, 9.0, 18.0, 20.0, 31.0, 44.0, 74.0, 78.0, 113.0, 188.0, 256.0, 364.0, 543.0, 803.0, 1104.0, 1591.0, 2370.0, 3310.0, 4767.0, 7199.0, 10689.0, 16557.0, 26224.0, 42710.0, 72432.0, 127791.0, 226672.0, 209347.0, 116501.0, 66716.0, 38902.0, 24262.0, 15303.0, 10148.0, 6627.0, 4606.0, 3093.0, 2154.0, 1485.0, 1071.0, 714.0, 507.0, 354.0, 227.0, 175.0, 129.0, 71.0, 57.0, 54.0, 35.0, 21.0, 11.0, 12.0, 5.0, 3.0, 2.0, 0.0, 3.0, 1.0], "bins": [-0.9423828125, -0.9128570556640625, -0.883331298828125, -0.8538055419921875, -0.82427978515625, -0.7947540283203125, -0.765228271484375, -0.7357025146484375, -0.7061767578125, -0.6766510009765625, -0.647125244140625, -0.6175994873046875, -0.58807373046875, -0.5585479736328125, -0.529022216796875, -0.4994964599609375, -0.469970703125, -0.4404449462890625, -0.410919189453125, -0.3813934326171875, -0.35186767578125, -0.3223419189453125, -0.292816162109375, -0.2632904052734375, -0.2337646484375, -0.2042388916015625, -0.174713134765625, -0.1451873779296875, -0.11566162109375, -0.0861358642578125, -0.056610107421875, -0.0270843505859375, 0.00244140625, 0.0319671630859375, 0.061492919921875, 0.0910186767578125, 0.12054443359375, 0.1500701904296875, 0.179595947265625, 0.2091217041015625, 0.2386474609375, 0.2681732177734375, 0.297698974609375, 0.3272247314453125, 0.35675048828125, 0.3862762451171875, 0.415802001953125, 0.4453277587890625, 0.474853515625, 0.5043792724609375, 0.533905029296875, 0.5634307861328125, 0.59295654296875, 0.6224822998046875, 0.652008056640625, 0.6815338134765625, 0.7110595703125, 0.7405853271484375, 0.770111083984375, 0.7996368408203125, 0.82916259765625, 0.8586883544921875, 0.888214111328125, 0.9177398681640625, 0.947265625]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 8.0, 7.0, 3.0, 6.0, 4.0, 11.0, 12.0, 12.0, 13.0, 15.0, 19.0, 31.0, 24.0, 29.0, 26.0, 34.0, 28.0, 33.0, 33.0, 40.0, 38.0, 41.0, 32.0, 1061.0, 34.0, 39.0, 40.0, 33.0, 34.0, 30.0, 31.0, 22.0, 29.0, 18.0, 24.0, 19.0, 20.0, 21.0, 17.0, 12.0, 7.0, 13.0, 9.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-11.046875, -10.6693115234375, -10.291748046875, -9.9141845703125, -9.53662109375, -9.1590576171875, -8.781494140625, -8.4039306640625, -8.0263671875, -7.6488037109375, -7.271240234375, -6.8936767578125, -6.51611328125, -6.1385498046875, -5.760986328125, -5.3834228515625, -5.005859375, -4.6282958984375, -4.250732421875, -3.8731689453125, -3.49560546875, -3.1180419921875, -2.740478515625, -2.3629150390625, -1.9853515625, -1.6077880859375, -1.230224609375, -0.8526611328125, -0.47509765625, -0.0975341796875, 0.280029296875, 0.6575927734375, 1.03515625, 1.4127197265625, 1.790283203125, 2.1678466796875, 2.54541015625, 2.9229736328125, 3.300537109375, 3.6781005859375, 4.0556640625, 4.4332275390625, 4.810791015625, 5.1883544921875, 5.56591796875, 5.9434814453125, 6.321044921875, 6.6986083984375, 7.076171875, 7.4537353515625, 7.831298828125, 8.2088623046875, 8.58642578125, 8.9639892578125, 9.341552734375, 9.7191162109375, 10.0966796875, 10.4742431640625, 10.851806640625, 11.2293701171875, 11.60693359375, 11.9844970703125, 12.362060546875, 12.7396240234375, 13.1171875]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 4.0, 4.0, 8.0, 4.0, 4.0, 14.0, 15.0, 23.0, 39.0, 47.0, 70.0, 98.0, 151.0, 226.0, 295.0, 396.0, 608.0, 770.0, 1125.0, 1582.0, 2273.0, 3174.0, 4578.0, 6586.0, 9200.0, 13276.0, 18864.0, 28304.0, 42104.0, 66645.0, 109073.0, 187192.0, 1249909.0, 126112.0, 75599.0, 47626.0, 31210.0, 21180.0, 14452.0, 10121.0, 7145.0, 5044.0, 3480.0, 2485.0, 1841.0, 1173.0, 887.0, 613.0, 429.0, 314.0, 224.0, 181.0, 120.0, 75.0, 49.0, 40.0, 30.0, 21.0, 15.0, 12.0, 7.0, 1.0, 2.0], "bins": [-0.771484375, -0.748199462890625, -0.72491455078125, -0.701629638671875, -0.6783447265625, -0.655059814453125, -0.63177490234375, -0.608489990234375, -0.585205078125, -0.561920166015625, -0.53863525390625, -0.515350341796875, -0.4920654296875, -0.468780517578125, -0.44549560546875, -0.422210693359375, -0.39892578125, -0.375640869140625, -0.35235595703125, -0.329071044921875, -0.3057861328125, -0.282501220703125, -0.25921630859375, -0.235931396484375, -0.212646484375, -0.189361572265625, -0.16607666015625, -0.142791748046875, -0.1195068359375, -0.096221923828125, -0.07293701171875, -0.049652099609375, -0.0263671875, -0.003082275390625, 0.02020263671875, 0.043487548828125, 0.0667724609375, 0.090057373046875, 0.11334228515625, 0.136627197265625, 0.159912109375, 0.183197021484375, 0.20648193359375, 0.229766845703125, 0.2530517578125, 0.276336669921875, 0.29962158203125, 0.322906494140625, 0.34619140625, 0.369476318359375, 0.39276123046875, 0.416046142578125, 0.4393310546875, 0.462615966796875, 0.48590087890625, 0.509185791015625, 0.532470703125, 0.555755615234375, 0.57904052734375, 0.602325439453125, 0.6256103515625, 0.648895263671875, 0.67218017578125, 0.695465087890625, 0.71875]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 0.0, 9.0, 5.0, 7.0, 10.0, 14.0, 18.0, 22.0, 26.0, 30.0, 33.0, 49.0, 39.0, 50.0, 63.0, 62.0, 66.0, 65.0, 59.0, 62.0, 60.0, 36.0, 48.0, 30.0, 29.0, 27.0, 22.0, 11.0, 8.0, 8.0, 12.0, 6.0, 4.0, 8.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004283905029296875, -0.00415194034576416, -0.004019975662231445, -0.0038880109786987305, -0.0037560462951660156, -0.0036240816116333008, -0.003492116928100586, -0.003360152244567871, -0.0032281875610351562, -0.0030962228775024414, -0.0029642581939697266, -0.0028322935104370117, -0.002700328826904297, -0.002568364143371582, -0.002436399459838867, -0.0023044347763061523, -0.0021724700927734375, -0.0020405054092407227, -0.0019085407257080078, -0.001776576042175293, -0.0016446113586425781, -0.0015126466751098633, -0.0013806819915771484, -0.0012487173080444336, -0.0011167526245117188, -0.000984787940979004, -0.0008528232574462891, -0.0007208585739135742, -0.0005888938903808594, -0.00045692920684814453, -0.0003249645233154297, -0.00019299983978271484, -6.103515625e-05, 7.092952728271484e-05, 0.0002028942108154297, 0.00033485889434814453, 0.0004668235778808594, 0.0005987882614135742, 0.0007307529449462891, 0.0008627176284790039, 0.0009946823120117188, 0.0011266469955444336, 0.0012586116790771484, 0.0013905763626098633, 0.0015225410461425781, 0.001654505729675293, 0.0017864704132080078, 0.0019184350967407227, 0.0020503997802734375, 0.0021823644638061523, 0.002314329147338867, 0.002446293830871582, 0.002578258514404297, 0.0027102231979370117, 0.0028421878814697266, 0.0029741525650024414, 0.0031061172485351562, 0.003238081932067871, 0.003370046615600586, 0.0035020112991333008, 0.0036339759826660156, 0.0037659406661987305, 0.0038979053497314453, 0.00402987003326416, 0.004161834716796875]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 7.0, 11.0, 12.0, 7.0, 20.0, 16.0, 25.0, 36.0, 26.0, 53.0, 76.0, 108.0, 201.0, 265.0, 473.0, 1718.0, 70479.0, 946752.0, 26016.0, 1082.0, 393.0, 252.0, 140.0, 122.0, 65.0, 64.0, 39.0, 27.0, 22.0, 16.0, 7.0, 6.0, 4.0, 8.0, 4.0, 5.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06793212890625, -0.06569671630859375, -0.0634613037109375, -0.06122589111328125, -0.058990478515625, -0.05675506591796875, -0.0545196533203125, -0.05228424072265625, -0.050048828125, -0.04781341552734375, -0.0455780029296875, -0.04334259033203125, -0.041107177734375, -0.03887176513671875, -0.0366363525390625, -0.03440093994140625, -0.03216552734375, -0.02993011474609375, -0.0276947021484375, -0.02545928955078125, -0.023223876953125, -0.02098846435546875, -0.0187530517578125, -0.01651763916015625, -0.0142822265625, -0.01204681396484375, -0.0098114013671875, -0.00757598876953125, -0.005340576171875, -0.00310516357421875, -0.0008697509765625, 0.00136566162109375, 0.00360107421875, 0.00583648681640625, 0.0080718994140625, 0.01030731201171875, 0.012542724609375, 0.01477813720703125, 0.0170135498046875, 0.01924896240234375, 0.021484375, 0.02371978759765625, 0.0259552001953125, 0.02819061279296875, 0.030426025390625, 0.03266143798828125, 0.0348968505859375, 0.03713226318359375, 0.03936767578125, 0.04160308837890625, 0.0438385009765625, 0.04607391357421875, 0.048309326171875, 0.05054473876953125, 0.0527801513671875, 0.05501556396484375, 0.0572509765625, 0.05948638916015625, 0.0617218017578125, 0.06395721435546875, 0.066192626953125, 0.06842803955078125, 0.0706634521484375, 0.07289886474609375, 0.07513427734375]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 184.0, 761.0, 64.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03840736299753189, -0.037218060344457626, -0.03602875769138336, -0.0348394550383091, -0.03365015238523483, -0.03246085345745087, -0.0312715508043766, -0.030082248151302338, -0.028892945498228073, -0.02770364284515381, -0.026514340192079544, -0.02532503940165043, -0.024135736748576164, -0.0229464340955019, -0.021757133305072784, -0.02056783065199852, -0.019378527998924255, -0.01818922534584999, -0.016999922692775726, -0.01581062190234661, -0.014621319249272346, -0.013432016596198082, -0.012242714874446392, -0.011053413152694702, -0.009864110499620438, -0.008674807846546173, -0.007485506124794483, -0.006296203937381506, -0.005106901749968529, -0.0039175995625555515, -0.0027282973751425743, -0.0015389956533908844, -0.0003496892750263214, 0.0008396129123866558, 0.002028915099799633, 0.0032182172872126102, 0.0044075194746255875, 0.005596821662038565, 0.006786123849451542, 0.007975425571203232, 0.009164728224277496, 0.01035403087735176, 0.01154333259910345, 0.01273263432085514, 0.013921936973929405, 0.01511123962700367, 0.016300540417432785, 0.01748984307050705, 0.018679145723581314, 0.01986844837665558, 0.021057751029729843, 0.02224705182015896, 0.023436354473233223, 0.024625657126307487, 0.025814957916736603, 0.027004260569810867, 0.028193563222885132, 0.029382865875959396, 0.03057216852903366, 0.031761471182107925, 0.03295077383518219, 0.034140072762966156, 0.03532937541604042, 0.036518678069114685, 0.03770798072218895]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 2.0, 3.0, 7.0, 12.0, 9.0, 10.0, 10.0, 16.0, 21.0, 35.0, 23.0, 22.0, 27.0, 26.0, 31.0, 32.0, 49.0, 28.0, 40.0, 52.0, 40.0, 50.0, 40.0, 58.0, 45.0, 37.0, 29.0, 37.0, 30.0, 36.0, 21.0, 25.0, 20.0, 21.0, 18.0, 15.0, 6.0, 4.0, 8.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0027756094932556152, -0.0026910006999969482, -0.0026063919067382812, -0.0025217831134796143, -0.0024371743202209473, -0.0023525655269622803, -0.0022679567337036133, -0.0021833479404449463, -0.0020987391471862793, -0.0020141303539276123, -0.0019295215606689453, -0.0018449127674102783, -0.0017603039741516113, -0.0016756951808929443, -0.0015910863876342773, -0.0015064775943756104, -0.0014218688011169434, -0.0013372600078582764, -0.0012526512145996094, -0.0011680424213409424, -0.0010834336280822754, -0.0009988248348236084, -0.0009142160415649414, -0.0008296072483062744, -0.0007449984550476074, -0.0006603896617889404, -0.0005757808685302734, -0.0004911720752716064, -0.00040656328201293945, -0.00032195448875427246, -0.00023734569549560547, -0.00015273690223693848, -6.812810897827148e-05, 1.6480684280395508e-05, 0.0001010894775390625, 0.0001856982707977295, 0.0002703070640563965, 0.0003549158573150635, 0.00043952465057373047, 0.0005241334438323975, 0.0006087422370910645, 0.0006933510303497314, 0.0007779598236083984, 0.0008625686168670654, 0.0009471774101257324, 0.0010317862033843994, 0.0011163949966430664, 0.0012010037899017334, 0.0012856125831604004, 0.0013702213764190674, 0.0014548301696777344, 0.0015394389629364014, 0.0016240477561950684, 0.0017086565494537354, 0.0017932653427124023, 0.0018778741359710693, 0.0019624829292297363, 0.0020470917224884033, 0.0021317005157470703, 0.0022163093090057373, 0.0023009181022644043, 0.0023855268955230713, 0.0024701356887817383, 0.0025547444820404053, 0.0026393532752990723]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 6.0, 13.0, 9.0, 11.0, 8.0, 15.0, 16.0, 24.0, 21.0, 24.0, 27.0, 36.0, 29.0, 29.0, 36.0, 34.0, 44.0, 41.0, 52.0, 45.0, 48.0, 51.0, 38.0, 42.0, 39.0, 37.0, 33.0, 35.0, 32.0, 22.0, 16.0, 15.0, 11.0, 10.0, 14.0, 8.0, 10.0, 4.0, 3.0, 5.0, 4.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-22.640625, -21.959716796875, -21.27880859375, -20.597900390625, -19.9169921875, -19.236083984375, -18.55517578125, -17.874267578125, -17.193359375, -16.512451171875, -15.83154296875, -15.150634765625, -14.4697265625, -13.788818359375, -13.10791015625, -12.427001953125, -11.74609375, -11.065185546875, -10.38427734375, -9.703369140625, -9.0224609375, -8.341552734375, -7.66064453125, -6.979736328125, -6.298828125, -5.617919921875, -4.93701171875, -4.256103515625, -3.5751953125, -2.894287109375, -2.21337890625, -1.532470703125, -0.8515625, -0.170654296875, 0.51025390625, 1.191162109375, 1.8720703125, 2.552978515625, 3.23388671875, 3.914794921875, 4.595703125, 5.276611328125, 5.95751953125, 6.638427734375, 7.3193359375, 8.000244140625, 8.68115234375, 9.362060546875, 10.04296875, 10.723876953125, 11.40478515625, 12.085693359375, 12.7666015625, 13.447509765625, 14.12841796875, 14.809326171875, 15.490234375, 16.171142578125, 16.85205078125, 17.532958984375, 18.2138671875, 18.894775390625, 19.57568359375, 20.256591796875, 20.9375]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 2.0, 3.0, 2.0, 5.0, 9.0, 11.0, 19.0, 29.0, 32.0, 39.0, 72.0, 86.0, 135.0, 165.0, 266.0, 426.0, 559.0, 790.0, 1273.0, 2045.0, 3235.0, 5761.0, 12266.0, 40816.0, 708726.0, 226213.0, 23639.0, 9415.0, 4750.0, 2646.0, 1645.0, 1065.0, 773.0, 493.0, 337.0, 280.0, 152.0, 113.0, 64.0, 58.0, 44.0, 32.0, 25.0, 16.0, 8.0, 7.0, 6.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0], "bins": [-38.59375, -37.41796875, -36.2421875, -35.06640625, -33.890625, -32.71484375, -31.5390625, -30.36328125, -29.1875, -28.01171875, -26.8359375, -25.66015625, -24.484375, -23.30859375, -22.1328125, -20.95703125, -19.78125, -18.60546875, -17.4296875, -16.25390625, -15.078125, -13.90234375, -12.7265625, -11.55078125, -10.375, -9.19921875, -8.0234375, -6.84765625, -5.671875, -4.49609375, -3.3203125, -2.14453125, -0.96875, 0.20703125, 1.3828125, 2.55859375, 3.734375, 4.91015625, 6.0859375, 7.26171875, 8.4375, 9.61328125, 10.7890625, 11.96484375, 13.140625, 14.31640625, 15.4921875, 16.66796875, 17.84375, 19.01953125, 20.1953125, 21.37109375, 22.546875, 23.72265625, 24.8984375, 26.07421875, 27.25, 28.42578125, 29.6015625, 30.77734375, 31.953125, 33.12890625, 34.3046875, 35.48046875, 36.65625]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 4.0, 7.0, 3.0, 7.0, 4.0, 2.0, 10.0, 11.0, 18.0, 20.0, 23.0, 31.0, 33.0, 35.0, 39.0, 50.0, 49.0, 54.0, 52.0, 88.0, 1738.0, 241.0, 85.0, 74.0, 51.0, 50.0, 43.0, 36.0, 39.0, 21.0, 31.0, 22.0, 18.0, 20.0, 9.0, 7.0, 8.0, 7.0, 3.0, 3.0, 2.0, 0.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.8125, -74.240234375, -71.66796875, -69.095703125, -66.5234375, -63.951171875, -61.37890625, -58.806640625, -56.234375, -53.662109375, -51.08984375, -48.517578125, -45.9453125, -43.373046875, -40.80078125, -38.228515625, -35.65625, -33.083984375, -30.51171875, -27.939453125, -25.3671875, -22.794921875, -20.22265625, -17.650390625, -15.078125, -12.505859375, -9.93359375, -7.361328125, -4.7890625, -2.216796875, 0.35546875, 2.927734375, 5.5, 8.072265625, 10.64453125, 13.216796875, 15.7890625, 18.361328125, 20.93359375, 23.505859375, 26.078125, 28.650390625, 31.22265625, 33.794921875, 36.3671875, 38.939453125, 41.51171875, 44.083984375, 46.65625, 49.228515625, 51.80078125, 54.373046875, 56.9453125, 59.517578125, 62.08984375, 64.662109375, 67.234375, 69.806640625, 72.37890625, 74.951171875, 77.5234375, 80.095703125, 82.66796875, 85.240234375, 87.8125]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 3.0, 5.0, 9.0, 13.0, 19.0, 15.0, 37.0, 54.0, 70.0, 90.0, 185.0, 485.0, 1861.0, 16555.0, 3076125.0, 45541.0, 3317.0, 679.0, 264.0, 113.0, 77.0, 52.0, 38.0, 24.0, 13.0, 12.0, 10.0, 11.0, 5.0, 8.0, 4.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-211.625, -203.685546875, -195.74609375, -187.806640625, -179.8671875, -171.927734375, -163.98828125, -156.048828125, -148.109375, -140.169921875, -132.23046875, -124.291015625, -116.3515625, -108.412109375, -100.47265625, -92.533203125, -84.59375, -76.654296875, -68.71484375, -60.775390625, -52.8359375, -44.896484375, -36.95703125, -29.017578125, -21.078125, -13.138671875, -5.19921875, 2.740234375, 10.6796875, 18.619140625, 26.55859375, 34.498046875, 42.4375, 50.376953125, 58.31640625, 66.255859375, 74.1953125, 82.134765625, 90.07421875, 98.013671875, 105.953125, 113.892578125, 121.83203125, 129.771484375, 137.7109375, 145.650390625, 153.58984375, 161.529296875, 169.46875, 177.408203125, 185.34765625, 193.287109375, 201.2265625, 209.166015625, 217.10546875, 225.044921875, 232.984375, 240.923828125, 248.86328125, 256.802734375, 264.7421875, 272.681640625, 280.62109375, 288.560546875, 296.5]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 29.0, 381.0, 542.0, 59.0, 7.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1419.4779052734375, -1394.1719970703125, -1368.8662109375, -1343.560302734375, -1318.2545166015625, -1292.9486083984375, -1267.642822265625, -1242.3369140625, -1217.031005859375, -1191.72509765625, -1166.4193115234375, -1141.1134033203125, -1115.8076171875, -1090.501708984375, -1065.19580078125, -1039.8900146484375, -1014.5841674804688, -989.2783203125, -963.9724731445312, -938.6666259765625, -913.3607177734375, -888.0548706054688, -862.7490234375, -837.4431762695312, -812.1373291015625, -786.8314819335938, -761.525634765625, -736.2197265625, -710.9138793945312, -685.6080322265625, -660.3021850585938, -634.996337890625, -609.6904296875, -584.3845825195312, -559.0787353515625, -533.7728271484375, -508.46697998046875, -483.1611328125, -457.85528564453125, -432.5494384765625, -407.24359130859375, -381.937744140625, -356.6318664550781, -331.3260192871094, -306.0201416015625, -280.71429443359375, -255.408447265625, -230.1025848388672, -204.7967071533203, -179.4908447265625, -154.18499755859375, -128.87913513183594, -103.57327270507812, -78.26741027832031, -52.96156311035156, -27.65570068359375, -2.3498382568359375, 22.95602035522461, 48.261878967285156, 73.56773376464844, 98.87359619140625, 124.17945861816406, 149.4853057861328, 174.79116821289062, 200.09703063964844]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 1.0, 3.0, 2.0, 5.0, 5.0, 8.0, 6.0, 9.0, 9.0, 11.0, 14.0, 18.0, 9.0, 21.0, 22.0, 20.0, 24.0, 37.0, 31.0, 38.0, 47.0, 33.0, 39.0, 46.0, 46.0, 39.0, 38.0, 47.0, 33.0, 33.0, 38.0, 35.0, 39.0, 27.0, 19.0, 16.0, 27.0, 20.0, 15.0, 17.0, 11.0, 12.0, 10.0, 8.0, 10.0, 2.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-165.22840881347656, -159.32656860351562, -153.42474365234375, -147.5229034423828, -141.62106323242188, -135.71922302246094, -129.8173828125, -123.91555786132812, -118.01371765136719, -112.11187744140625, -106.21004486083984, -100.30821228027344, -94.4063720703125, -88.50453186035156, -82.60269927978516, -76.70086669921875, -70.79902648925781, -64.89718627929688, -58.99535369873047, -53.0935173034668, -47.191680908203125, -41.28984451293945, -35.38800811767578, -29.48617172241211, -23.584335327148438, -17.682498931884766, -11.780662536621094, -5.878826141357422, 0.02301025390625, 5.924846649169922, 11.826683044433594, 17.728519439697266, 23.630340576171875, 29.532176971435547, 35.43401336669922, 41.33584976196289, 47.23768615722656, 53.139522552490234, 59.041358947753906, 64.94319152832031, 70.84503173828125, 76.74687194824219, 82.6487045288086, 88.550537109375, 94.45237731933594, 100.35421752929688, 106.25605010986328, 112.15788269042969, 118.05972290039062, 123.96156311035156, 129.8634033203125, 135.76522827148438, 141.6670684814453, 147.56890869140625, 153.47073364257812, 159.37257385253906, 165.2744140625, 171.17625427246094, 177.07809448242188, 182.97991943359375, 188.8817596435547, 194.78359985351562, 200.6854248046875, 206.58726501464844, 212.48910522460938]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 4.0, 5.0, 9.0, 3.0, 13.0, 9.0, 14.0, 14.0, 11.0, 27.0, 19.0, 30.0, 27.0, 29.0, 34.0, 33.0, 44.0, 26.0, 32.0, 33.0, 41.0, 36.0, 51.0, 42.0, 39.0, 43.0, 50.0, 37.0, 32.0, 30.0, 15.0, 24.0, 37.0, 12.0, 15.0, 11.0, 16.0, 7.0, 9.0, 16.0, 3.0, 3.0, 5.0, 7.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-22.71875, -22.04248046875, -21.3662109375, -20.68994140625, -20.013671875, -19.33740234375, -18.6611328125, -17.98486328125, -17.30859375, -16.63232421875, -15.9560546875, -15.27978515625, -14.603515625, -13.92724609375, -13.2509765625, -12.57470703125, -11.8984375, -11.22216796875, -10.5458984375, -9.86962890625, -9.193359375, -8.51708984375, -7.8408203125, -7.16455078125, -6.48828125, -5.81201171875, -5.1357421875, -4.45947265625, -3.783203125, -3.10693359375, -2.4306640625, -1.75439453125, -1.078125, -0.40185546875, 0.2744140625, 0.95068359375, 1.626953125, 2.30322265625, 2.9794921875, 3.65576171875, 4.33203125, 5.00830078125, 5.6845703125, 6.36083984375, 7.037109375, 7.71337890625, 8.3896484375, 9.06591796875, 9.7421875, 10.41845703125, 11.0947265625, 11.77099609375, 12.447265625, 13.12353515625, 13.7998046875, 14.47607421875, 15.15234375, 15.82861328125, 16.5048828125, 17.18115234375, 17.857421875, 18.53369140625, 19.2099609375, 19.88623046875, 20.5625]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 8.0, 8.0, 7.0, 11.0, 8.0, 17.0, 29.0, 43.0, 55.0, 65.0, 75.0, 123.0, 194.0, 245.0, 353.0, 549.0, 876.0, 1248.0, 2088.0, 3330.0, 6036.0, 10655.0, 22832.0, 288712.0, 3513319.0, 294603.0, 23791.0, 10349.0, 5652.0, 3275.0, 1994.0, 1170.0, 805.0, 529.0, 346.0, 236.0, 175.0, 130.0, 98.0, 67.0, 44.0, 32.0, 27.0, 24.0, 19.0, 8.0, 3.0, 6.0, 4.0, 4.0, 5.0, 4.0, 2.0, 2.0], "bins": [-75.5625, -73.3720703125, -71.181640625, -68.9912109375, -66.80078125, -64.6103515625, -62.419921875, -60.2294921875, -58.0390625, -55.8486328125, -53.658203125, -51.4677734375, -49.27734375, -47.0869140625, -44.896484375, -42.7060546875, -40.515625, -38.3251953125, -36.134765625, -33.9443359375, -31.75390625, -29.5634765625, -27.373046875, -25.1826171875, -22.9921875, -20.8017578125, -18.611328125, -16.4208984375, -14.23046875, -12.0400390625, -9.849609375, -7.6591796875, -5.46875, -3.2783203125, -1.087890625, 1.1025390625, 3.29296875, 5.4833984375, 7.673828125, 9.8642578125, 12.0546875, 14.2451171875, 16.435546875, 18.6259765625, 20.81640625, 23.0068359375, 25.197265625, 27.3876953125, 29.578125, 31.7685546875, 33.958984375, 36.1494140625, 38.33984375, 40.5302734375, 42.720703125, 44.9111328125, 47.1015625, 49.2919921875, 51.482421875, 53.6728515625, 55.86328125, 58.0537109375, 60.244140625, 62.4345703125, 64.625]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 4.0, 1.0, 6.0, 4.0, 10.0, 7.0, 12.0, 13.0, 25.0, 28.0, 29.0, 46.0, 76.0, 171.0, 543.0, 1441.0, 1048.0, 312.0, 106.0, 57.0, 27.0, 25.0, 14.0, 16.0, 10.0, 7.0, 11.0, 3.0, 3.0, 6.0, 8.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-92.9375, -90.185546875, -87.43359375, -84.681640625, -81.9296875, -79.177734375, -76.42578125, -73.673828125, -70.921875, -68.169921875, -65.41796875, -62.666015625, -59.9140625, -57.162109375, -54.41015625, -51.658203125, -48.90625, -46.154296875, -43.40234375, -40.650390625, -37.8984375, -35.146484375, -32.39453125, -29.642578125, -26.890625, -24.138671875, -21.38671875, -18.634765625, -15.8828125, -13.130859375, -10.37890625, -7.626953125, -4.875, -2.123046875, 0.62890625, 3.380859375, 6.1328125, 8.884765625, 11.63671875, 14.388671875, 17.140625, 19.892578125, 22.64453125, 25.396484375, 28.1484375, 30.900390625, 33.65234375, 36.404296875, 39.15625, 41.908203125, 44.66015625, 47.412109375, 50.1640625, 52.916015625, 55.66796875, 58.419921875, 61.171875, 63.923828125, 66.67578125, 69.427734375, 72.1796875, 74.931640625, 77.68359375, 80.435546875, 83.1875]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 9.0, 7.0, 7.0, 5.0, 20.0, 24.0, 35.0, 89.0, 175.0, 339.0, 797.0, 2397.0, 7768.0, 35755.0, 3476308.0, 635450.0, 25602.0, 6122.0, 2001.0, 720.0, 305.0, 158.0, 81.0, 41.0, 17.0, 14.0, 10.0, 7.0, 8.0, 3.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-209.125, -202.1328125, -195.140625, -188.1484375, -181.15625, -174.1640625, -167.171875, -160.1796875, -153.1875, -146.1953125, -139.203125, -132.2109375, -125.21875, -118.2265625, -111.234375, -104.2421875, -97.25, -90.2578125, -83.265625, -76.2734375, -69.28125, -62.2890625, -55.296875, -48.3046875, -41.3125, -34.3203125, -27.328125, -20.3359375, -13.34375, -6.3515625, 0.640625, 7.6328125, 14.625, 21.6171875, 28.609375, 35.6015625, 42.59375, 49.5859375, 56.578125, 63.5703125, 70.5625, 77.5546875, 84.546875, 91.5390625, 98.53125, 105.5234375, 112.515625, 119.5078125, 126.5, 133.4921875, 140.484375, 147.4765625, 154.46875, 161.4609375, 168.453125, 175.4453125, 182.4375, 189.4296875, 196.421875, 203.4140625, 210.40625, 217.3984375, 224.390625, 231.3828125, 238.375]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 4.0, 3.0, 7.0, 3.0, 8.0, 17.0, 12.0, 12.0, 35.0, 43.0, 59.0, 89.0, 108.0, 175.0, 147.0, 86.0, 49.0, 41.0, 29.0, 24.0, 13.0, 11.0, 6.0, 5.0, 7.0, 6.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-314.72857666015625, -305.9132080078125, -297.0978088378906, -288.2824401855469, -279.4670715332031, -270.65167236328125, -261.8363037109375, -253.02093505859375, -244.20555114746094, -235.39016723632812, -226.57479858398438, -217.75941467285156, -208.94403076171875, -200.128662109375, -191.3132781982422, -182.49789428710938, -173.68252563476562, -164.8671417236328, -156.05177307128906, -147.23638916015625, -138.4210205078125, -129.6056365966797, -120.79025268554688, -111.9748764038086, -103.15950012207031, -94.34412384033203, -85.52874755859375, -76.71336364746094, -67.89798736572266, -59.082611083984375, -50.26723098754883, -41.45185089111328, -32.636505126953125, -23.82112693786621, -15.005748748779297, -6.190370559692383, 2.6250076293945312, 11.440383911132812, 20.25576400756836, 29.071144104003906, 37.88652038574219, 46.70189666748047, 55.517276763916016, 64.33265686035156, 73.14803314208984, 81.96340942382812, 90.77879333496094, 99.59416961669922, 108.4095458984375, 117.22492218017578, 126.04029846191406, 134.85568237304688, 143.67105102539062, 152.48643493652344, 161.30181884765625, 170.1171875, 178.9325714111328, 187.74795532226562, 196.56332397460938, 205.3787078857422, 214.194091796875, 223.00946044921875, 231.82484436035156, 240.64022827148438, 249.45559692382812]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 9.0, 7.0, 8.0, 10.0, 11.0, 11.0, 15.0, 11.0, 23.0, 20.0, 21.0, 28.0, 26.0, 34.0, 25.0, 26.0, 38.0, 33.0, 36.0, 39.0, 46.0, 38.0, 32.0, 27.0, 32.0, 48.0, 39.0, 34.0, 25.0, 30.0, 27.0, 17.0, 33.0, 28.0, 17.0, 23.0, 11.0, 14.0, 10.0, 7.0, 13.0, 7.0, 5.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-165.3268280029297, -159.85072326660156, -154.37461853027344, -148.8985137939453, -143.4224090576172, -137.94630432128906, -132.47019958496094, -126.99409484863281, -121.51799011230469, -116.04188537597656, -110.56578063964844, -105.08967590332031, -99.61357116699219, -94.13746643066406, -88.66136169433594, -83.18525695800781, -77.70915222167969, -72.23304748535156, -66.75694274902344, -61.28083801269531, -55.80473327636719, -50.32862854003906, -44.85252380371094, -39.37641906738281, -33.90031433105469, -28.424209594726562, -22.948104858398438, -17.472000122070312, -11.995895385742188, -6.5197906494140625, -1.0436859130859375, 4.4324188232421875, 9.908523559570312, 15.384628295898438, 20.860733032226562, 26.336837768554688, 31.812942504882812, 37.28904724121094, 42.76515197753906, 48.24125671386719, 53.71736145019531, 59.19346618652344, 64.66957092285156, 70.14567565917969, 75.62178039550781, 81.09788513183594, 86.57398986816406, 92.05009460449219, 97.52619934082031, 103.00230407714844, 108.47840881347656, 113.95451354980469, 119.43061828613281, 124.90672302246094, 130.38282775878906, 135.8589324951172, 141.3350372314453, 146.81114196777344, 152.28724670410156, 157.7633514404297, 163.2394561767578, 168.71556091308594, 174.19166564941406, 179.6677703857422, 185.1438751220703]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 6.0, 2.0, 6.0, 3.0, 10.0, 13.0, 12.0, 18.0, 16.0, 20.0, 21.0, 16.0, 24.0, 24.0, 37.0, 27.0, 40.0, 30.0, 35.0, 45.0, 39.0, 45.0, 38.0, 51.0, 41.0, 46.0, 35.0, 26.0, 34.0, 36.0, 34.0, 23.0, 23.0, 22.0, 20.0, 15.0, 18.0, 8.0, 14.0, 6.0, 3.0, 8.0, 6.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0], "bins": [-24.5625, -23.861572265625, -23.16064453125, -22.459716796875, -21.7587890625, -21.057861328125, -20.35693359375, -19.656005859375, -18.955078125, -18.254150390625, -17.55322265625, -16.852294921875, -16.1513671875, -15.450439453125, -14.74951171875, -14.048583984375, -13.34765625, -12.646728515625, -11.94580078125, -11.244873046875, -10.5439453125, -9.843017578125, -9.14208984375, -8.441162109375, -7.740234375, -7.039306640625, -6.33837890625, -5.637451171875, -4.9365234375, -4.235595703125, -3.53466796875, -2.833740234375, -2.1328125, -1.431884765625, -0.73095703125, -0.030029296875, 0.6708984375, 1.371826171875, 2.07275390625, 2.773681640625, 3.474609375, 4.175537109375, 4.87646484375, 5.577392578125, 6.2783203125, 6.979248046875, 7.68017578125, 8.381103515625, 9.08203125, 9.782958984375, 10.48388671875, 11.184814453125, 11.8857421875, 12.586669921875, 13.28759765625, 13.988525390625, 14.689453125, 15.390380859375, 16.09130859375, 16.792236328125, 17.4931640625, 18.194091796875, 18.89501953125, 19.595947265625, 20.296875]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 2.0, 1.0, 7.0, 16.0, 15.0, 21.0, 35.0, 43.0, 59.0, 104.0, 148.0, 211.0, 280.0, 463.0, 669.0, 949.0, 1418.0, 2082.0, 3190.0, 4572.0, 7086.0, 10650.0, 16193.0, 25402.0, 40588.0, 67823.0, 119891.0, 216746.0, 220539.0, 123168.0, 69836.0, 41360.0, 25898.0, 16620.0, 10757.0, 7214.0, 4763.0, 3195.0, 2089.0, 1475.0, 969.0, 644.0, 405.0, 334.0, 205.0, 126.0, 98.0, 67.0, 49.0, 37.0, 19.0, 13.0, 10.0, 6.0, 2.0, 2.0, 0.0, 4.0], "bins": [-1.1591796875, -1.1251068115234375, -1.091033935546875, -1.0569610595703125, -1.02288818359375, -0.9888153076171875, -0.954742431640625, -0.9206695556640625, -0.8865966796875, -0.8525238037109375, -0.818450927734375, -0.7843780517578125, -0.75030517578125, -0.7162322998046875, -0.682159423828125, -0.6480865478515625, -0.614013671875, -0.5799407958984375, -0.545867919921875, -0.5117950439453125, -0.47772216796875, -0.4436492919921875, -0.409576416015625, -0.3755035400390625, -0.3414306640625, -0.3073577880859375, -0.273284912109375, -0.2392120361328125, -0.20513916015625, -0.1710662841796875, -0.136993408203125, -0.1029205322265625, -0.06884765625, -0.0347747802734375, -0.000701904296875, 0.0333709716796875, 0.06744384765625, 0.1015167236328125, 0.135589599609375, 0.1696624755859375, 0.2037353515625, 0.2378082275390625, 0.271881103515625, 0.3059539794921875, 0.34002685546875, 0.3740997314453125, 0.408172607421875, 0.4422454833984375, 0.476318359375, 0.5103912353515625, 0.544464111328125, 0.5785369873046875, 0.61260986328125, 0.6466827392578125, 0.680755615234375, 0.7148284912109375, 0.7489013671875, 0.7829742431640625, 0.817047119140625, 0.8511199951171875, 0.88519287109375, 0.9192657470703125, 0.953338623046875, 0.9874114990234375, 1.021484375]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 10.0, 9.0, 12.0, 13.0, 14.0, 14.0, 17.0, 23.0, 24.0, 17.0, 22.0, 25.0, 24.0, 33.0, 40.0, 34.0, 50.0, 44.0, 46.0, 1066.0, 49.0, 38.0, 42.0, 33.0, 36.0, 38.0, 34.0, 34.0, 22.0, 24.0, 20.0, 19.0, 24.0, 11.0, 13.0, 17.0, 11.0, 7.0, 5.0, 1.0, 6.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.21875, -13.7652587890625, -13.311767578125, -12.8582763671875, -12.40478515625, -11.9512939453125, -11.497802734375, -11.0443115234375, -10.5908203125, -10.1373291015625, -9.683837890625, -9.2303466796875, -8.77685546875, -8.3233642578125, -7.869873046875, -7.4163818359375, -6.962890625, -6.5093994140625, -6.055908203125, -5.6024169921875, -5.14892578125, -4.6954345703125, -4.241943359375, -3.7884521484375, -3.3349609375, -2.8814697265625, -2.427978515625, -1.9744873046875, -1.52099609375, -1.0675048828125, -0.614013671875, -0.1605224609375, 0.29296875, 0.7464599609375, 1.199951171875, 1.6534423828125, 2.10693359375, 2.5604248046875, 3.013916015625, 3.4674072265625, 3.9208984375, 4.3743896484375, 4.827880859375, 5.2813720703125, 5.73486328125, 6.1883544921875, 6.641845703125, 7.0953369140625, 7.548828125, 8.0023193359375, 8.455810546875, 8.9093017578125, 9.36279296875, 9.8162841796875, 10.269775390625, 10.7232666015625, 11.1767578125, 11.6302490234375, 12.083740234375, 12.5372314453125, 12.99072265625, 13.4442138671875, 13.897705078125, 14.3511962890625, 14.8046875]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 5.0, 9.0, 14.0, 12.0, 27.0, 33.0, 31.0, 66.0, 79.0, 119.0, 173.0, 241.0, 356.0, 614.0, 770.0, 1051.0, 1666.0, 2482.0, 3561.0, 4951.0, 7153.0, 10249.0, 14289.0, 21341.0, 31892.0, 49215.0, 80445.0, 141262.0, 1273089.0, 175777.0, 99584.0, 59217.0, 37338.0, 24903.0, 16711.0, 11425.0, 8245.0, 5690.0, 4057.0, 2864.0, 1934.0, 1326.0, 913.0, 594.0, 413.0, 273.0, 205.0, 144.0, 122.0, 73.0, 50.0, 29.0, 16.0, 13.0, 11.0, 8.0, 4.0, 7.0, 1.0, 4.0], "bins": [-0.87353515625, -0.8468170166015625, -0.820098876953125, -0.7933807373046875, -0.76666259765625, -0.7399444580078125, -0.713226318359375, -0.6865081787109375, -0.6597900390625, -0.6330718994140625, -0.606353759765625, -0.5796356201171875, -0.55291748046875, -0.5261993408203125, -0.499481201171875, -0.4727630615234375, -0.446044921875, -0.4193267822265625, -0.392608642578125, -0.3658905029296875, -0.33917236328125, -0.3124542236328125, -0.285736083984375, -0.2590179443359375, -0.2322998046875, -0.2055816650390625, -0.178863525390625, -0.1521453857421875, -0.12542724609375, -0.0987091064453125, -0.071990966796875, -0.0452728271484375, -0.0185546875, 0.0081634521484375, 0.034881591796875, 0.0615997314453125, 0.08831787109375, 0.1150360107421875, 0.141754150390625, 0.1684722900390625, 0.1951904296875, 0.2219085693359375, 0.248626708984375, 0.2753448486328125, 0.30206298828125, 0.3287811279296875, 0.355499267578125, 0.3822174072265625, 0.408935546875, 0.4356536865234375, 0.462371826171875, 0.4890899658203125, 0.51580810546875, 0.5425262451171875, 0.569244384765625, 0.5959625244140625, 0.6226806640625, 0.6493988037109375, 0.676116943359375, 0.7028350830078125, 0.72955322265625, 0.7562713623046875, 0.782989501953125, 0.8097076416015625, 0.83642578125]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 6.0, 3.0, 8.0, 9.0, 8.0, 15.0, 15.0, 27.0, 17.0, 38.0, 47.0, 46.0, 48.0, 47.0, 68.0, 62.0, 68.0, 69.0, 44.0, 64.0, 60.0, 45.0, 36.0, 25.0, 27.0, 20.0, 18.0, 12.0, 7.0, 7.0, 18.0, 4.0, 10.0, 2.0, 5.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003726959228515625, -0.003591299057006836, -0.003455638885498047, -0.003319978713989258, -0.0031843185424804688, -0.0030486583709716797, -0.0029129981994628906, -0.0027773380279541016, -0.0026416778564453125, -0.0025060176849365234, -0.0023703575134277344, -0.0022346973419189453, -0.0020990371704101562, -0.001963376998901367, -0.0018277168273925781, -0.001692056655883789, -0.001556396484375, -0.001420736312866211, -0.0012850761413574219, -0.0011494159698486328, -0.0010137557983398438, -0.0008780956268310547, -0.0007424354553222656, -0.0006067752838134766, -0.0004711151123046875, -0.00033545494079589844, -0.00019979476928710938, -6.413459777832031e-05, 7.152557373046875e-05, 0.0002071857452392578, 0.0003428459167480469, 0.00047850608825683594, 0.000614166259765625, 0.0007498264312744141, 0.0008854866027832031, 0.0010211467742919922, 0.0011568069458007812, 0.0012924671173095703, 0.0014281272888183594, 0.0015637874603271484, 0.0016994476318359375, 0.0018351078033447266, 0.0019707679748535156, 0.0021064281463623047, 0.0022420883178710938, 0.002377748489379883, 0.002513408660888672, 0.002649068832397461, 0.00278472900390625, 0.002920389175415039, 0.003056049346923828, 0.003191709518432617, 0.0033273696899414062, 0.0034630298614501953, 0.0035986900329589844, 0.0037343502044677734, 0.0038700103759765625, 0.0040056705474853516, 0.004141330718994141, 0.00427699089050293, 0.004412651062011719, 0.004548311233520508, 0.004683971405029297, 0.004819631576538086, 0.004955291748046875]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 6.0, 5.0, 6.0, 7.0, 10.0, 11.0, 12.0, 17.0, 18.0, 18.0, 30.0, 46.0, 51.0, 79.0, 121.0, 186.0, 394.0, 2132.0, 76691.0, 939136.0, 27411.0, 1244.0, 346.0, 190.0, 132.0, 73.0, 52.0, 40.0, 18.0, 28.0, 11.0, 11.0, 9.0, 9.0, 4.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0887451171875, -0.08630561828613281, -0.08386611938476562, -0.08142662048339844, -0.07898712158203125, -0.07654762268066406, -0.07410812377929688, -0.07166862487792969, -0.0692291259765625, -0.06678962707519531, -0.06435012817382812, -0.06191062927246094, -0.05947113037109375, -0.05703163146972656, -0.054592132568359375, -0.05215263366699219, -0.049713134765625, -0.04727363586425781, -0.044834136962890625, -0.04239463806152344, -0.03995513916015625, -0.03751564025878906, -0.035076141357421875, -0.03263664245605469, -0.0301971435546875, -0.027757644653320312, -0.025318145751953125, -0.022878646850585938, -0.02043914794921875, -0.017999649047851562, -0.015560150146484375, -0.013120651245117188, -0.01068115234375, -0.008241653442382812, -0.005802154541015625, -0.0033626556396484375, -0.00092315673828125, 0.0015163421630859375, 0.003955841064453125, 0.0063953399658203125, 0.0088348388671875, 0.011274337768554688, 0.013713836669921875, 0.016153335571289062, 0.01859283447265625, 0.021032333374023438, 0.023471832275390625, 0.025911331176757812, 0.028350830078125, 0.030790328979492188, 0.033229827880859375, 0.03566932678222656, 0.03810882568359375, 0.04054832458496094, 0.042987823486328125, 0.04542732238769531, 0.0478668212890625, 0.05030632019042969, 0.052745819091796875, 0.05518531799316406, 0.05762481689453125, 0.06006431579589844, 0.06250381469726562, 0.06494331359863281, 0.0673828125]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 4.0, 2.0, 7.0, 13.0, 17.0, 16.0, 18.0, 37.0, 50.0, 67.0, 82.0, 102.0, 118.0, 118.0, 91.0, 70.0, 48.0, 33.0, 27.0, 25.0, 12.0, 7.0, 9.0, 12.0, 4.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003312567714601755, -0.003192593576386571, -0.0030726194381713867, -0.002952645532786846, -0.002832671394571662, -0.0027126972563564777, -0.0025927231181412935, -0.0024727489799261093, -0.0023527750745415688, -0.0022328009363263845, -0.0021128267981112003, -0.0019928528927266598, -0.0018728787545114756, -0.0017529046162962914, -0.0016329304780811071, -0.001512956339865923, -0.0013929822016507387, -0.0012730080634355545, -0.0011530340416356921, -0.001033059903420508, -0.0009130858234129846, -0.0007931117434054613, -0.0006731376051902771, -0.0005531635251827538, -0.0004331894451752305, -0.0003132153651677072, -0.00019324125605635345, -7.32671469449997e-05, 4.6706933062523603e-05, 0.0001666810130700469, 0.0002866551512852311, 0.0004066292312927544, 0.0005266033113002777, 0.000646577391307801, 0.0007665514713153243, 0.0008865256095305085, 0.001006499631330371, 0.0011264737695455551, 0.0012464479077607393, 0.0013664220459759235, 0.001486396067775786, 0.0016063702059909701, 0.0017263442277908325, 0.0018463183660060167, 0.001966292504221201, 0.0020862664096057415, 0.0022062407806515694, 0.00232621468603611, 0.002446188824251294, 0.0025661629624664783, 0.0026861371006816626, 0.0028061112388968468, 0.0029260851442813873, 0.0030460592824965715, 0.0031660334207117558, 0.00328600755892694, 0.003405981697142124, 0.0035259558353573084, 0.0036459299735724926, 0.003765903878957033, 0.0038858780171722174, 0.004005852155387402, 0.004125826060771942, 0.00424580043181777, 0.0043657743372023106]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 3.0, 6.0, 9.0, 6.0, 16.0, 16.0, 11.0, 18.0, 30.0, 24.0, 26.0, 25.0, 32.0, 35.0, 34.0, 35.0, 32.0, 42.0, 39.0, 39.0, 38.0, 37.0, 43.0, 46.0, 45.0, 30.0, 35.0, 40.0, 27.0, 16.0, 25.0, 22.0, 26.0, 18.0, 18.0, 5.0, 10.0, 7.0, 7.0, 9.0, 7.0, 1.0, 6.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002184927463531494, -0.002119190990924835, -0.0020534545183181763, -0.0019877180457115173, -0.0019219815731048584, -0.0018562451004981995, -0.0017905086278915405, -0.0017247721552848816, -0.0016590356826782227, -0.0015932992100715637, -0.0015275627374649048, -0.0014618262648582458, -0.001396089792251587, -0.001330353319644928, -0.001264616847038269, -0.00119888037443161, -0.0011331439018249512, -0.0010674074292182922, -0.0010016709566116333, -0.0009359344840049744, -0.0008701980113983154, -0.0008044615387916565, -0.0007387250661849976, -0.0006729885935783386, -0.0006072521209716797, -0.0005415156483650208, -0.0004757791757583618, -0.0004100427031517029, -0.00034430623054504395, -0.000278569757938385, -0.00021283328533172607, -0.00014709681272506714, -8.13603401184082e-05, -1.5623867511749268e-05, 5.011260509490967e-05, 0.0001158490777015686, 0.00018158555030822754, 0.0002473220229148865, 0.0003130584955215454, 0.00037879496812820435, 0.0004445314407348633, 0.0005102679133415222, 0.0005760043859481812, 0.0006417408585548401, 0.000707477331161499, 0.000773213803768158, 0.0008389502763748169, 0.0009046867489814758, 0.0009704232215881348, 0.0010361596941947937, 0.0011018961668014526, 0.0011676326394081116, 0.0012333691120147705, 0.0012991055846214294, 0.0013648420572280884, 0.0014305785298347473, 0.0014963150024414062, 0.0015620514750480652, 0.0016277879476547241, 0.001693524420261383, 0.001759260892868042, 0.001824997365474701, 0.0018907338380813599, 0.001956470310688019, 0.0020222067832946777]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 6.0, 2.0, 6.0, 3.0, 10.0, 13.0, 12.0, 18.0, 16.0, 20.0, 21.0, 16.0, 24.0, 24.0, 37.0, 27.0, 40.0, 30.0, 35.0, 45.0, 39.0, 45.0, 38.0, 51.0, 41.0, 46.0, 35.0, 26.0, 34.0, 36.0, 34.0, 23.0, 23.0, 22.0, 20.0, 15.0, 18.0, 8.0, 14.0, 6.0, 3.0, 8.0, 6.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0], "bins": [-24.5625, -23.861572265625, -23.16064453125, -22.459716796875, -21.7587890625, -21.057861328125, -20.35693359375, -19.656005859375, -18.955078125, -18.254150390625, -17.55322265625, -16.852294921875, -16.1513671875, -15.450439453125, -14.74951171875, -14.048583984375, -13.34765625, -12.646728515625, -11.94580078125, -11.244873046875, -10.5439453125, -9.843017578125, -9.14208984375, -8.441162109375, -7.740234375, -7.039306640625, -6.33837890625, -5.637451171875, -4.9365234375, -4.235595703125, -3.53466796875, -2.833740234375, -2.1328125, -1.431884765625, -0.73095703125, -0.030029296875, 0.6708984375, 1.371826171875, 2.07275390625, 2.773681640625, 3.474609375, 4.175537109375, 4.87646484375, 5.577392578125, 6.2783203125, 6.979248046875, 7.68017578125, 8.381103515625, 9.08203125, 9.782958984375, 10.48388671875, 11.184814453125, 11.8857421875, 12.586669921875, 13.28759765625, 13.988525390625, 14.689453125, 15.390380859375, 16.09130859375, 16.792236328125, 17.4931640625, 18.194091796875, 18.89501953125, 19.595947265625, 20.296875]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 6.0, 11.0, 6.0, 14.0, 22.0, 22.0, 36.0, 50.0, 70.0, 104.0, 133.0, 211.0, 278.0, 385.0, 564.0, 784.0, 1095.0, 1584.0, 2614.0, 4522.0, 9308.0, 23532.0, 83585.0, 550163.0, 281691.0, 52681.0, 16858.0, 7378.0, 3793.0, 2210.0, 1478.0, 1027.0, 698.0, 479.0, 332.0, 242.0, 166.0, 115.0, 89.0, 55.0, 52.0, 31.0, 32.0, 13.0, 11.0, 11.0, 7.0, 4.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.8125, -16.315673828125, -15.81884765625, -15.322021484375, -14.8251953125, -14.328369140625, -13.83154296875, -13.334716796875, -12.837890625, -12.341064453125, -11.84423828125, -11.347412109375, -10.8505859375, -10.353759765625, -9.85693359375, -9.360107421875, -8.86328125, -8.366455078125, -7.86962890625, -7.372802734375, -6.8759765625, -6.379150390625, -5.88232421875, -5.385498046875, -4.888671875, -4.391845703125, -3.89501953125, -3.398193359375, -2.9013671875, -2.404541015625, -1.90771484375, -1.410888671875, -0.9140625, -0.417236328125, 0.07958984375, 0.576416015625, 1.0732421875, 1.570068359375, 2.06689453125, 2.563720703125, 3.060546875, 3.557373046875, 4.05419921875, 4.551025390625, 5.0478515625, 5.544677734375, 6.04150390625, 6.538330078125, 7.03515625, 7.531982421875, 8.02880859375, 8.525634765625, 9.0224609375, 9.519287109375, 10.01611328125, 10.512939453125, 11.009765625, 11.506591796875, 12.00341796875, 12.500244140625, 12.9970703125, 13.493896484375, 13.99072265625, 14.487548828125, 14.984375]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 1.0, 6.0, 6.0, 8.0, 10.0, 8.0, 23.0, 16.0, 13.0, 27.0, 18.0, 34.0, 32.0, 38.0, 37.0, 28.0, 47.0, 47.0, 74.0, 219.0, 1831.0, 102.0, 48.0, 57.0, 31.0, 36.0, 34.0, 38.0, 23.0, 35.0, 13.0, 16.0, 18.0, 19.0, 17.0, 16.0, 9.0, 6.0, 4.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-93.5, -90.84375, -88.1875, -85.53125, -82.875, -80.21875, -77.5625, -74.90625, -72.25, -69.59375, -66.9375, -64.28125, -61.625, -58.96875, -56.3125, -53.65625, -51.0, -48.34375, -45.6875, -43.03125, -40.375, -37.71875, -35.0625, -32.40625, -29.75, -27.09375, -24.4375, -21.78125, -19.125, -16.46875, -13.8125, -11.15625, -8.5, -5.84375, -3.1875, -0.53125, 2.125, 4.78125, 7.4375, 10.09375, 12.75, 15.40625, 18.0625, 20.71875, 23.375, 26.03125, 28.6875, 31.34375, 34.0, 36.65625, 39.3125, 41.96875, 44.625, 47.28125, 49.9375, 52.59375, 55.25, 57.90625, 60.5625, 63.21875, 65.875, 68.53125, 71.1875, 73.84375, 76.5]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 5.0, 5.0, 3.0, 6.0, 16.0, 19.0, 32.0, 26.0, 26.0, 43.0, 70.0, 117.0, 148.0, 231.0, 443.0, 1453.0, 61870.0, 3075614.0, 4102.0, 615.0, 268.0, 165.0, 129.0, 80.0, 61.0, 44.0, 23.0, 30.0, 18.0, 13.0, 10.0, 11.0, 3.0, 7.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-210.25, -204.27734375, -198.3046875, -192.33203125, -186.359375, -180.38671875, -174.4140625, -168.44140625, -162.46875, -156.49609375, -150.5234375, -144.55078125, -138.578125, -132.60546875, -126.6328125, -120.66015625, -114.6875, -108.71484375, -102.7421875, -96.76953125, -90.796875, -84.82421875, -78.8515625, -72.87890625, -66.90625, -60.93359375, -54.9609375, -48.98828125, -43.015625, -37.04296875, -31.0703125, -25.09765625, -19.125, -13.15234375, -7.1796875, -1.20703125, 4.765625, 10.73828125, 16.7109375, 22.68359375, 28.65625, 34.62890625, 40.6015625, 46.57421875, 52.546875, 58.51953125, 64.4921875, 70.46484375, 76.4375, 82.41015625, 88.3828125, 94.35546875, 100.328125, 106.30078125, 112.2734375, 118.24609375, 124.21875, 130.19140625, 136.1640625, 142.13671875, 148.109375, 154.08203125, 160.0546875, 166.02734375, 172.0]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 14.0, 30.0, 96.0, 257.0, 345.0, 178.0, 64.0, 22.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-206.8077850341797, -201.80271911621094, -196.79766845703125, -191.7926025390625, -186.78753662109375, -181.782470703125, -176.7774200439453, -171.77235412597656, -166.76730346679688, -161.76223754882812, -156.75718688964844, -151.7521209716797, -146.74705505371094, -141.74200439453125, -136.7369384765625, -131.73187255859375, -126.726806640625, -121.72174835205078, -116.71668243408203, -111.71162414550781, -106.70655822753906, -101.70149993896484, -96.69644165039062, -91.69137573242188, -86.68631744384766, -81.68125915527344, -76.67619323730469, -71.67113494873047, -66.66607666015625, -61.6610107421875, -56.65595245361328, -51.6508903503418, -46.64582061767578, -41.6407585144043, -36.63569641113281, -31.630638122558594, -26.62557601928711, -21.620513916015625, -16.615453720092773, -11.610393524169922, -6.6053314208984375, -1.6002702713012695, 3.4047908782958984, 8.409852027893066, 13.414913177490234, 18.41997528076172, 23.42503547668457, 28.430095672607422, 33.435157775878906, 38.44021987915039, 43.445281982421875, 48.450340270996094, 53.45540237426758, 58.46046447753906, 63.46552276611328, 68.4705810546875, 73.47564697265625, 78.48070526123047, 83.48577117919922, 88.49082946777344, 93.49589538574219, 98.5009536743164, 103.50601196289062, 108.51107788085938, 113.5161361694336]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 4.0, 4.0, 4.0, 11.0, 4.0, 14.0, 11.0, 7.0, 12.0, 11.0, 23.0, 23.0, 21.0, 29.0, 37.0, 32.0, 39.0, 35.0, 46.0, 27.0, 40.0, 48.0, 43.0, 44.0, 39.0, 45.0, 36.0, 45.0, 47.0, 30.0, 26.0, 26.0, 20.0, 25.0, 16.0, 20.0, 11.0, 7.0, 10.0, 8.0, 11.0, 6.0, 6.0, 1.0, 1.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-230.90023803710938, -223.32843017578125, -215.75662231445312, -208.184814453125, -200.61300659179688, -193.04119873046875, -185.46939086914062, -177.8975830078125, -170.32577514648438, -162.75396728515625, -155.18215942382812, -147.6103515625, -140.03854370117188, -132.46673583984375, -124.89492797851562, -117.3231201171875, -109.75131225585938, -102.17950439453125, -94.60769653320312, -87.035888671875, -79.46408081054688, -71.89227294921875, -64.32046508789062, -56.7486572265625, -49.176849365234375, -41.60504150390625, -34.033233642578125, -26.46142578125, -18.889617919921875, -11.31781005859375, -3.746002197265625, 3.8258056640625, 11.397628784179688, 18.969436645507812, 26.541244506835938, 34.11305236816406, 41.68486022949219, 49.25666809082031, 56.82847595214844, 64.40028381347656, 71.97209167480469, 79.54389953613281, 87.11570739746094, 94.68751525878906, 102.25932312011719, 109.83113098144531, 117.40293884277344, 124.97474670410156, 132.5465545654297, 140.1183624267578, 147.69017028808594, 155.26197814941406, 162.8337860107422, 170.4055938720703, 177.97740173339844, 185.54920959472656, 193.1210174560547, 200.6928253173828, 208.26463317871094, 215.83644104003906, 223.4082489013672, 230.9800567626953, 238.55186462402344, 246.12367248535156, 253.6954803466797]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 7.0, 1.0, 6.0, 15.0, 8.0, 14.0, 23.0, 19.0, 13.0, 19.0, 22.0, 22.0, 28.0, 39.0, 32.0, 32.0, 37.0, 32.0, 44.0, 46.0, 40.0, 34.0, 50.0, 44.0, 43.0, 47.0, 23.0, 32.0, 38.0, 19.0, 24.0, 23.0, 25.0, 17.0, 19.0, 11.0, 14.0, 4.0, 10.0, 3.0, 4.0, 6.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 5.0], "bins": [-25.703125, -24.981201171875, -24.25927734375, -23.537353515625, -22.8154296875, -22.093505859375, -21.37158203125, -20.649658203125, -19.927734375, -19.205810546875, -18.48388671875, -17.761962890625, -17.0400390625, -16.318115234375, -15.59619140625, -14.874267578125, -14.15234375, -13.430419921875, -12.70849609375, -11.986572265625, -11.2646484375, -10.542724609375, -9.82080078125, -9.098876953125, -8.376953125, -7.655029296875, -6.93310546875, -6.211181640625, -5.4892578125, -4.767333984375, -4.04541015625, -3.323486328125, -2.6015625, -1.879638671875, -1.15771484375, -0.435791015625, 0.2861328125, 1.008056640625, 1.72998046875, 2.451904296875, 3.173828125, 3.895751953125, 4.61767578125, 5.339599609375, 6.0615234375, 6.783447265625, 7.50537109375, 8.227294921875, 8.94921875, 9.671142578125, 10.39306640625, 11.114990234375, 11.8369140625, 12.558837890625, 13.28076171875, 14.002685546875, 14.724609375, 15.446533203125, 16.16845703125, 16.890380859375, 17.6123046875, 18.334228515625, 19.05615234375, 19.778076171875, 20.5]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 2.0, 7.0, 6.0, 8.0, 15.0, 19.0, 17.0, 28.0, 40.0, 44.0, 88.0, 101.0, 138.0, 199.0, 279.0, 394.0, 550.0, 732.0, 1080.0, 1582.0, 2584.0, 4430.0, 8155.0, 16076.0, 107642.0, 2871617.0, 1096990.0, 51566.0, 13100.0, 6531.0, 3663.0, 2142.0, 1360.0, 955.0, 610.0, 456.0, 283.0, 208.0, 154.0, 114.0, 85.0, 60.0, 45.0, 38.0, 24.0, 23.0, 14.0, 12.0, 6.0, 7.0, 2.0, 3.0, 4.0, 0.0, 2.0, 1.0], "bins": [-69.25, -67.2041015625, -65.158203125, -63.1123046875, -61.06640625, -59.0205078125, -56.974609375, -54.9287109375, -52.8828125, -50.8369140625, -48.791015625, -46.7451171875, -44.69921875, -42.6533203125, -40.607421875, -38.5615234375, -36.515625, -34.4697265625, -32.423828125, -30.3779296875, -28.33203125, -26.2861328125, -24.240234375, -22.1943359375, -20.1484375, -18.1025390625, -16.056640625, -14.0107421875, -11.96484375, -9.9189453125, -7.873046875, -5.8271484375, -3.78125, -1.7353515625, 0.310546875, 2.3564453125, 4.40234375, 6.4482421875, 8.494140625, 10.5400390625, 12.5859375, 14.6318359375, 16.677734375, 18.7236328125, 20.76953125, 22.8154296875, 24.861328125, 26.9072265625, 28.953125, 30.9990234375, 33.044921875, 35.0908203125, 37.13671875, 39.1826171875, 41.228515625, 43.2744140625, 45.3203125, 47.3662109375, 49.412109375, 51.4580078125, 53.50390625, 55.5498046875, 57.595703125, 59.6416015625, 61.6875]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 6.0, 2.0, 6.0, 10.0, 7.0, 8.0, 19.0, 19.0, 13.0, 26.0, 18.0, 39.0, 74.0, 134.0, 334.0, 771.0, 1172.0, 734.0, 298.0, 116.0, 73.0, 42.0, 40.0, 22.0, 11.0, 14.0, 9.0, 9.0, 15.0, 11.0, 8.0, 2.0, 6.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.0625, -73.00341796875, -70.9443359375, -68.88525390625, -66.826171875, -64.76708984375, -62.7080078125, -60.64892578125, -58.58984375, -56.53076171875, -54.4716796875, -52.41259765625, -50.353515625, -48.29443359375, -46.2353515625, -44.17626953125, -42.1171875, -40.05810546875, -37.9990234375, -35.93994140625, -33.880859375, -31.82177734375, -29.7626953125, -27.70361328125, -25.64453125, -23.58544921875, -21.5263671875, -19.46728515625, -17.408203125, -15.34912109375, -13.2900390625, -11.23095703125, -9.171875, -7.11279296875, -5.0537109375, -2.99462890625, -0.935546875, 1.12353515625, 3.1826171875, 5.24169921875, 7.30078125, 9.35986328125, 11.4189453125, 13.47802734375, 15.537109375, 17.59619140625, 19.6552734375, 21.71435546875, 23.7734375, 25.83251953125, 27.8916015625, 29.95068359375, 32.009765625, 34.06884765625, 36.1279296875, 38.18701171875, 40.24609375, 42.30517578125, 44.3642578125, 46.42333984375, 48.482421875, 50.54150390625, 52.6005859375, 54.65966796875, 56.71875]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 7.0, 6.0, 15.0, 11.0, 19.0, 47.0, 52.0, 75.0, 88.0, 199.0, 285.0, 545.0, 997.0, 2023.0, 4536.0, 10389.0, 28581.0, 132445.0, 3703272.0, 250016.0, 37333.0, 12967.0, 5289.0, 2486.0, 1176.0, 586.0, 332.0, 162.0, 141.0, 49.0, 46.0, 41.0, 19.0, 17.0, 10.0, 1.0, 7.0, 5.0, 2.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-93.8125, -90.4150390625, -87.017578125, -83.6201171875, -80.22265625, -76.8251953125, -73.427734375, -70.0302734375, -66.6328125, -63.2353515625, -59.837890625, -56.4404296875, -53.04296875, -49.6455078125, -46.248046875, -42.8505859375, -39.453125, -36.0556640625, -32.658203125, -29.2607421875, -25.86328125, -22.4658203125, -19.068359375, -15.6708984375, -12.2734375, -8.8759765625, -5.478515625, -2.0810546875, 1.31640625, 4.7138671875, 8.111328125, 11.5087890625, 14.90625, 18.3037109375, 21.701171875, 25.0986328125, 28.49609375, 31.8935546875, 35.291015625, 38.6884765625, 42.0859375, 45.4833984375, 48.880859375, 52.2783203125, 55.67578125, 59.0732421875, 62.470703125, 65.8681640625, 69.265625, 72.6630859375, 76.060546875, 79.4580078125, 82.85546875, 86.2529296875, 89.650390625, 93.0478515625, 96.4453125, 99.8427734375, 103.240234375, 106.6376953125, 110.03515625, 113.4326171875, 116.830078125, 120.2275390625, 123.625]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 8.0, 7.0, 7.0, 8.0, 15.0, 22.0, 37.0, 63.0, 96.0, 196.0, 225.0, 127.0, 93.0, 43.0, 23.0, 13.0, 5.0, 6.0, 10.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-241.8699493408203, -231.9002685546875, -221.93060302734375, -211.96092224121094, -201.99124145507812, -192.02157592773438, -182.05189514160156, -172.08221435546875, -162.112548828125, -152.1428680419922, -142.17320251464844, -132.20352172851562, -122.23384094238281, -112.26416778564453, -102.29449462890625, -92.32481384277344, -82.35513305664062, -72.38545989990234, -62.41577911376953, -52.44610595703125, -42.4764289855957, -32.506752014160156, -22.537078857421875, -12.567398071289062, -2.5977249145507812, 7.371951103210449, 17.34162712097168, 27.311302185058594, 37.28097915649414, 47.25065612792969, 57.22032928466797, 67.19001007080078, 77.15966796875, 87.12934112548828, 97.0990219116211, 107.06869506835938, 117.03837585449219, 127.00804901123047, 136.97772216796875, 146.94740295410156, 156.91708374023438, 166.8867645263672, 176.85643005371094, 186.82611083984375, 196.79579162597656, 206.76547241210938, 216.73513793945312, 226.70481872558594, 236.6744842529297, 246.6441650390625, 256.61383056640625, 266.58349609375, 276.5531921386719, 286.5228576660156, 296.4925537109375, 306.46221923828125, 316.431884765625, 326.40155029296875, 336.3712463378906, 346.3409118652344, 356.3105773925781, 366.2802734375, 376.24993896484375, 386.2196044921875, 396.1893005371094]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 4.0, 10.0, 5.0, 9.0, 3.0, 7.0, 16.0, 9.0, 21.0, 19.0, 19.0, 30.0, 20.0, 25.0, 30.0, 40.0, 38.0, 30.0, 35.0, 44.0, 46.0, 36.0, 46.0, 45.0, 35.0, 41.0, 45.0, 44.0, 44.0, 21.0, 23.0, 17.0, 22.0, 15.0, 20.0, 15.0, 13.0, 14.0, 7.0, 9.0, 12.0, 8.0, 5.0, 4.0, 0.0, 6.0, 0.0, 2.0, 1.0, 1.0], "bins": [-172.6673583984375, -167.89022827148438, -163.1131134033203, -158.3359832763672, -153.55885314941406, -148.78173828125, -144.00460815429688, -139.22747802734375, -134.45034790039062, -129.6732177734375, -124.8960952758789, -120.11897277832031, -115.34184265136719, -110.5647201538086, -105.78759765625, -101.01046752929688, -96.23335266113281, -91.45623016357422, -86.6791000366211, -81.9019775390625, -77.12484741210938, -72.34772491455078, -67.57060241699219, -62.79347610473633, -58.01634979248047, -53.23922348022461, -48.46209716796875, -43.684974670410156, -38.9078483581543, -34.13072204589844, -29.35359764099121, -24.576473236083984, -19.799346923828125, -15.022221565246582, -10.245096206665039, -5.467970848083496, -0.6908454895019531, 4.086280822753906, 8.863405227661133, 13.64052963256836, 18.41765594482422, 23.194782257080078, 27.971906661987305, 32.74903106689453, 37.52615737915039, 42.30328369140625, 47.080406188964844, 51.8575325012207, 56.63465881347656, 61.41178512573242, 66.18891143798828, 70.96603393554688, 75.7431640625, 80.5202865600586, 85.29740905761719, 90.07453918457031, 94.8516616821289, 99.6287841796875, 104.40591430664062, 109.18303680419922, 113.96015930175781, 118.73728942871094, 123.51441192626953, 128.29153442382812, 133.06866455078125]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 4.0, 6.0, 8.0, 9.0, 11.0, 7.0, 15.0, 11.0, 21.0, 16.0, 27.0, 22.0, 25.0, 24.0, 36.0, 27.0, 38.0, 46.0, 31.0, 38.0, 35.0, 38.0, 45.0, 42.0, 47.0, 46.0, 43.0, 31.0, 33.0, 30.0, 31.0, 22.0, 21.0, 20.0, 21.0, 14.0, 10.0, 14.0, 10.0, 4.0, 7.0, 5.0, 4.0, 2.0, 1.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-22.75, -22.0517578125, -21.353515625, -20.6552734375, -19.95703125, -19.2587890625, -18.560546875, -17.8623046875, -17.1640625, -16.4658203125, -15.767578125, -15.0693359375, -14.37109375, -13.6728515625, -12.974609375, -12.2763671875, -11.578125, -10.8798828125, -10.181640625, -9.4833984375, -8.78515625, -8.0869140625, -7.388671875, -6.6904296875, -5.9921875, -5.2939453125, -4.595703125, -3.8974609375, -3.19921875, -2.5009765625, -1.802734375, -1.1044921875, -0.40625, 0.2919921875, 0.990234375, 1.6884765625, 2.38671875, 3.0849609375, 3.783203125, 4.4814453125, 5.1796875, 5.8779296875, 6.576171875, 7.2744140625, 7.97265625, 8.6708984375, 9.369140625, 10.0673828125, 10.765625, 11.4638671875, 12.162109375, 12.8603515625, 13.55859375, 14.2568359375, 14.955078125, 15.6533203125, 16.3515625, 17.0498046875, 17.748046875, 18.4462890625, 19.14453125, 19.8427734375, 20.541015625, 21.2392578125, 21.9375]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 6.0, 9.0, 8.0, 18.0, 18.0, 40.0, 46.0, 68.0, 118.0, 144.0, 216.0, 337.0, 496.0, 703.0, 1073.0, 1590.0, 2401.0, 3744.0, 5741.0, 9121.0, 14297.0, 23457.0, 38361.0, 66288.0, 118587.0, 209825.0, 229935.0, 134067.0, 74685.0, 43008.0, 25807.0, 15791.0, 10097.0, 6352.0, 4092.0, 2633.0, 1727.0, 1237.0, 767.0, 510.0, 382.0, 244.0, 157.0, 117.0, 83.0, 45.0, 38.0, 29.0, 12.0, 15.0, 8.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0], "bins": [-1.1259765625, -1.0919647216796875, -1.057952880859375, -1.0239410400390625, -0.98992919921875, -0.9559173583984375, -0.921905517578125, -0.8878936767578125, -0.8538818359375, -0.8198699951171875, -0.785858154296875, -0.7518463134765625, -0.71783447265625, -0.6838226318359375, -0.649810791015625, -0.6157989501953125, -0.581787109375, -0.5477752685546875, -0.513763427734375, -0.4797515869140625, -0.44573974609375, -0.4117279052734375, -0.377716064453125, -0.3437042236328125, -0.3096923828125, -0.2756805419921875, -0.241668701171875, -0.2076568603515625, -0.17364501953125, -0.1396331787109375, -0.105621337890625, -0.0716094970703125, -0.03759765625, -0.0035858154296875, 0.030426025390625, 0.0644378662109375, 0.09844970703125, 0.1324615478515625, 0.166473388671875, 0.2004852294921875, 0.2344970703125, 0.2685089111328125, 0.302520751953125, 0.3365325927734375, 0.37054443359375, 0.4045562744140625, 0.438568115234375, 0.4725799560546875, 0.506591796875, 0.5406036376953125, 0.574615478515625, 0.6086273193359375, 0.64263916015625, 0.6766510009765625, 0.710662841796875, 0.7446746826171875, 0.7786865234375, 0.8126983642578125, 0.846710205078125, 0.8807220458984375, 0.91473388671875, 0.9487457275390625, 0.982757568359375, 1.0167694091796875, 1.05078125]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 2.0, 3.0, 2.0, 2.0, 7.0, 9.0, 11.0, 9.0, 12.0, 16.0, 20.0, 17.0, 25.0, 36.0, 27.0, 20.0, 25.0, 41.0, 29.0, 31.0, 42.0, 44.0, 47.0, 1076.0, 43.0, 41.0, 36.0, 38.0, 33.0, 42.0, 30.0, 24.0, 24.0, 24.0, 26.0, 16.0, 16.0, 19.0, 10.0, 13.0, 11.0, 13.0, 4.0, 6.0, 6.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.3671875, -13.9031982421875, -13.439208984375, -12.9752197265625, -12.51123046875, -12.0472412109375, -11.583251953125, -11.1192626953125, -10.6552734375, -10.1912841796875, -9.727294921875, -9.2633056640625, -8.79931640625, -8.3353271484375, -7.871337890625, -7.4073486328125, -6.943359375, -6.4793701171875, -6.015380859375, -5.5513916015625, -5.08740234375, -4.6234130859375, -4.159423828125, -3.6954345703125, -3.2314453125, -2.7674560546875, -2.303466796875, -1.8394775390625, -1.37548828125, -0.9114990234375, -0.447509765625, 0.0164794921875, 0.48046875, 0.9444580078125, 1.408447265625, 1.8724365234375, 2.33642578125, 2.8004150390625, 3.264404296875, 3.7283935546875, 4.1923828125, 4.6563720703125, 5.120361328125, 5.5843505859375, 6.04833984375, 6.5123291015625, 6.976318359375, 7.4403076171875, 7.904296875, 8.3682861328125, 8.832275390625, 9.2962646484375, 9.76025390625, 10.2242431640625, 10.688232421875, 11.1522216796875, 11.6162109375, 12.0802001953125, 12.544189453125, 13.0081787109375, 13.47216796875, 13.9361572265625, 14.400146484375, 14.8641357421875, 15.328125]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 10.0, 10.0, 19.0, 33.0, 45.0, 76.0, 105.0, 155.0, 243.0, 364.0, 505.0, 793.0, 1125.0, 1634.0, 2397.0, 3444.0, 4932.0, 7236.0, 10369.0, 15147.0, 21752.0, 33017.0, 51416.0, 84440.0, 150369.0, 1278106.0, 168074.0, 93569.0, 56396.0, 36015.0, 23567.0, 15893.0, 11053.0, 7682.0, 5328.0, 3746.0, 2544.0, 1822.0, 1212.0, 785.0, 563.0, 391.0, 253.0, 153.0, 121.0, 66.0, 51.0, 41.0, 28.0, 13.0, 14.0, 5.0, 3.0, 1.0, 2.0, 3.0, 2.0], "bins": [-0.9169921875, -0.88885498046875, -0.8607177734375, -0.83258056640625, -0.804443359375, -0.77630615234375, -0.7481689453125, -0.72003173828125, -0.69189453125, -0.66375732421875, -0.6356201171875, -0.60748291015625, -0.579345703125, -0.55120849609375, -0.5230712890625, -0.49493408203125, -0.466796875, -0.43865966796875, -0.4105224609375, -0.38238525390625, -0.354248046875, -0.32611083984375, -0.2979736328125, -0.26983642578125, -0.24169921875, -0.21356201171875, -0.1854248046875, -0.15728759765625, -0.129150390625, -0.10101318359375, -0.0728759765625, -0.04473876953125, -0.0166015625, 0.01153564453125, 0.0396728515625, 0.06781005859375, 0.095947265625, 0.12408447265625, 0.1522216796875, 0.18035888671875, 0.20849609375, 0.23663330078125, 0.2647705078125, 0.29290771484375, 0.321044921875, 0.34918212890625, 0.3773193359375, 0.40545654296875, 0.43359375, 0.46173095703125, 0.4898681640625, 0.51800537109375, 0.546142578125, 0.57427978515625, 0.6024169921875, 0.63055419921875, 0.65869140625, 0.68682861328125, 0.7149658203125, 0.74310302734375, 0.771240234375, 0.79937744140625, 0.8275146484375, 0.85565185546875, 0.8837890625]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 5.0, 4.0, 7.0, 12.0, 12.0, 14.0, 26.0, 31.0, 26.0, 48.0, 60.0, 61.0, 76.0, 78.0, 78.0, 53.0, 65.0, 67.0, 57.0, 46.0, 40.0, 37.0, 22.0, 10.0, 16.0, 18.0, 8.0, 9.0, 9.0, 7.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.005794525146484375, -0.005633056163787842, -0.005471587181091309, -0.005310118198394775, -0.005148649215698242, -0.004987180233001709, -0.004825711250305176, -0.004664242267608643, -0.004502773284912109, -0.004341304302215576, -0.004179835319519043, -0.00401836633682251, -0.0038568973541259766, -0.0036954283714294434, -0.00353395938873291, -0.003372490406036377, -0.0032110214233398438, -0.0030495524406433105, -0.0028880834579467773, -0.002726614475250244, -0.002565145492553711, -0.0024036765098571777, -0.0022422075271606445, -0.0020807385444641113, -0.0019192695617675781, -0.001757800579071045, -0.0015963315963745117, -0.0014348626136779785, -0.0012733936309814453, -0.0011119246482849121, -0.0009504556655883789, -0.0007889866828918457, -0.0006275177001953125, -0.0004660487174987793, -0.0003045797348022461, -0.0001431107521057129, 1.8358230590820312e-05, 0.00017982721328735352, 0.0003412961959838867, 0.0005027651786804199, 0.0006642341613769531, 0.0008257031440734863, 0.0009871721267700195, 0.0011486411094665527, 0.001310110092163086, 0.0014715790748596191, 0.0016330480575561523, 0.0017945170402526855, 0.0019559860229492188, 0.002117455005645752, 0.002278923988342285, 0.0024403929710388184, 0.0026018619537353516, 0.0027633309364318848, 0.002924799919128418, 0.003086268901824951, 0.0032477378845214844, 0.0034092068672180176, 0.0035706758499145508, 0.003732144832611084, 0.003893613815307617, 0.00405508279800415, 0.004216551780700684, 0.004378020763397217, 0.00453948974609375]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 2.0, 4.0, 7.0, 11.0, 19.0, 21.0, 19.0, 23.0, 35.0, 49.0, 72.0, 96.0, 160.0, 260.0, 773.0, 12765.0, 919352.0, 111488.0, 2319.0, 408.0, 233.0, 124.0, 78.0, 79.0, 43.0, 25.0, 24.0, 22.0, 9.0, 12.0, 7.0, 8.0, 2.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08160400390625, -0.078948974609375, -0.0762939453125, -0.073638916015625, -0.07098388671875, -0.068328857421875, -0.065673828125, -0.063018798828125, -0.06036376953125, -0.057708740234375, -0.0550537109375, -0.052398681640625, -0.04974365234375, -0.047088623046875, -0.04443359375, -0.041778564453125, -0.03912353515625, -0.036468505859375, -0.0338134765625, -0.031158447265625, -0.02850341796875, -0.025848388671875, -0.023193359375, -0.020538330078125, -0.01788330078125, -0.015228271484375, -0.0125732421875, -0.009918212890625, -0.00726318359375, -0.004608154296875, -0.001953125, 0.000701904296875, 0.00335693359375, 0.006011962890625, 0.0086669921875, 0.011322021484375, 0.01397705078125, 0.016632080078125, 0.019287109375, 0.021942138671875, 0.02459716796875, 0.027252197265625, 0.0299072265625, 0.032562255859375, 0.03521728515625, 0.037872314453125, 0.04052734375, 0.043182373046875, 0.04583740234375, 0.048492431640625, 0.0511474609375, 0.053802490234375, 0.05645751953125, 0.059112548828125, 0.061767578125, 0.064422607421875, 0.06707763671875, 0.069732666015625, 0.0723876953125, 0.075042724609375, 0.07769775390625, 0.080352783203125, 0.0830078125, 0.085662841796875, 0.08831787109375]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 12.0, 46.0, 175.0, 426.0, 249.0, 78.0, 14.0, 8.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.008297149091959, -0.007826501503586769, -0.007355854846537113, -0.00688520772382617, -0.006414560601115227, -0.005943913012742996, -0.00547326635569334, -0.00500261876732111, -0.004531972110271454, -0.004061324987560511, -0.0035906778648495674, -0.003120030742138624, -0.002649383619427681, -0.002178736263886094, -0.0017080891411751509, -0.0012374420184642076, -0.0007667946629226208, -0.0002961475111078471, 0.00017449964070692658, 0.0006451468216255307, 0.001115793944336474, 0.001586441183462739, 0.002057088306173682, 0.0025277354288846254, 0.0029983825515955687, 0.003469029674306512, 0.003939677029848099, 0.004410324152559042, 0.004880971275269985, 0.005351618397980928, 0.005822265520691872, 0.006292912643402815, 0.006763559766113758, 0.007234206888824701, 0.0077048540115356445, 0.008175501599907875, 0.008646148256957531, 0.009116795845329762, 0.009587442502379417, 0.010058090090751648, 0.010528736747801304, 0.010999384336173534, 0.01147003099322319, 0.01194067858159542, 0.012411325238645077, 0.012881972827017307, 0.013352619484066963, 0.013823267072439194, 0.014293914660811424, 0.014764562249183655, 0.01523520890623331, 0.015705855563282967, 0.016176503151655197, 0.016647150740027428, 0.017117798328399658, 0.01758844405412674, 0.01805909164249897, 0.0185297392308712, 0.01900038681924343, 0.019471032544970512, 0.019941680133342743, 0.020412327721714973, 0.020882975310087204, 0.021353621035814285, 0.021824268624186516]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 9.0, 0.0, 3.0, 3.0, 4.0, 6.0, 8.0, 7.0, 4.0, 9.0, 12.0, 14.0, 12.0, 20.0, 22.0, 19.0, 21.0, 23.0, 34.0, 31.0, 42.0, 39.0, 30.0, 47.0, 50.0, 34.0, 27.0, 34.0, 38.0, 41.0, 34.0, 27.0, 43.0, 33.0, 32.0, 30.0, 23.0, 22.0, 27.0, 16.0, 15.0, 8.0, 15.0, 7.0, 10.0, 11.0, 5.0, 1.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 4.0, 2.0], "bins": [-0.002365589141845703, -0.00229695625603199, -0.002228323370218277, -0.002159690484404564, -0.002091057598590851, -0.0020224247127771378, -0.0019537918269634247, -0.0018851589411497116, -0.0018165260553359985, -0.0017478931695222855, -0.0016792602837085724, -0.0016106273978948593, -0.0015419945120811462, -0.0014733616262674332, -0.00140472874045372, -0.001336095854640007, -0.001267462968826294, -0.0011988300830125809, -0.0011301971971988678, -0.0010615643113851547, -0.0009929314255714417, -0.0009242985397577286, -0.0008556656539440155, -0.0007870327681303024, -0.0007183998823165894, -0.0006497669965028763, -0.0005811341106891632, -0.0005125012248754501, -0.00044386833906173706, -0.000375235453248024, -0.0003066025674343109, -0.00023796968162059784, -0.00016933679580688477, -0.00010070390999317169, -3.207102417945862e-05, 3.6561861634254456e-05, 0.00010519474744796753, 0.0001738276332616806, 0.00024246051907539368, 0.00031109340488910675, 0.0003797262907028198, 0.0004483591765165329, 0.000516992062330246, 0.000585624948143959, 0.0006542578339576721, 0.0007228907197713852, 0.0007915236055850983, 0.0008601564913988113, 0.0009287893772125244, 0.0009974222630262375, 0.0010660551488399506, 0.0011346880346536636, 0.0012033209204673767, 0.0012719538062810898, 0.0013405866920948029, 0.001409219577908516, 0.001477852463722229, 0.001546485349535942, 0.0016151182353496552, 0.0016837511211633682, 0.0017523840069770813, 0.0018210168927907944, 0.0018896497786045074, 0.0019582826644182205, 0.0020269155502319336]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 4.0, 6.0, 8.0, 9.0, 11.0, 7.0, 15.0, 11.0, 21.0, 16.0, 27.0, 22.0, 25.0, 24.0, 36.0, 27.0, 38.0, 46.0, 31.0, 38.0, 35.0, 38.0, 45.0, 42.0, 47.0, 46.0, 43.0, 31.0, 33.0, 30.0, 31.0, 22.0, 21.0, 20.0, 21.0, 14.0, 10.0, 14.0, 10.0, 4.0, 7.0, 5.0, 4.0, 2.0, 1.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-22.75, -22.0517578125, -21.353515625, -20.6552734375, -19.95703125, -19.2587890625, -18.560546875, -17.8623046875, -17.1640625, -16.4658203125, -15.767578125, -15.0693359375, -14.37109375, -13.6728515625, -12.974609375, -12.2763671875, -11.578125, -10.8798828125, -10.181640625, -9.4833984375, -8.78515625, -8.0869140625, -7.388671875, -6.6904296875, -5.9921875, -5.2939453125, -4.595703125, -3.8974609375, -3.19921875, -2.5009765625, -1.802734375, -1.1044921875, -0.40625, 0.2919921875, 0.990234375, 1.6884765625, 2.38671875, 3.0849609375, 3.783203125, 4.4814453125, 5.1796875, 5.8779296875, 6.576171875, 7.2744140625, 7.97265625, 8.6708984375, 9.369140625, 10.0673828125, 10.765625, 11.4638671875, 12.162109375, 12.8603515625, 13.55859375, 14.2568359375, 14.955078125, 15.6533203125, 16.3515625, 17.0498046875, 17.748046875, 18.4462890625, 19.14453125, 19.8427734375, 20.541015625, 21.2392578125, 21.9375]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 1.0, 5.0, 4.0, 6.0, 10.0, 11.0, 13.0, 20.0, 21.0, 32.0, 43.0, 71.0, 97.0, 117.0, 213.0, 335.0, 534.0, 939.0, 1600.0, 3276.0, 7390.0, 22385.0, 135605.0, 749149.0, 95001.0, 18477.0, 6458.0, 2909.0, 1538.0, 877.0, 488.0, 303.0, 195.0, 141.0, 80.0, 44.0, 49.0, 34.0, 22.0, 14.0, 18.0, 8.0, 4.0, 5.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-38.90625, -37.7421875, -36.578125, -35.4140625, -34.25, -33.0859375, -31.921875, -30.7578125, -29.59375, -28.4296875, -27.265625, -26.1015625, -24.9375, -23.7734375, -22.609375, -21.4453125, -20.28125, -19.1171875, -17.953125, -16.7890625, -15.625, -14.4609375, -13.296875, -12.1328125, -10.96875, -9.8046875, -8.640625, -7.4765625, -6.3125, -5.1484375, -3.984375, -2.8203125, -1.65625, -0.4921875, 0.671875, 1.8359375, 3.0, 4.1640625, 5.328125, 6.4921875, 7.65625, 8.8203125, 9.984375, 11.1484375, 12.3125, 13.4765625, 14.640625, 15.8046875, 16.96875, 18.1328125, 19.296875, 20.4609375, 21.625, 22.7890625, 23.953125, 25.1171875, 26.28125, 27.4453125, 28.609375, 29.7734375, 30.9375, 32.1015625, 33.265625, 34.4296875, 35.59375]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 1.0, 2.0, 5.0, 8.0, 7.0, 15.0, 16.0, 8.0, 12.0, 13.0, 15.0, 22.0, 21.0, 46.0, 40.0, 39.0, 67.0, 60.0, 64.0, 102.0, 178.0, 1719.0, 129.0, 75.0, 54.0, 55.0, 37.0, 38.0, 38.0, 25.0, 23.0, 19.0, 21.0, 18.0, 13.0, 13.0, 12.0, 6.0, 4.0, 1.0, 2.0, 0.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-90.0, -87.1259765625, -84.251953125, -81.3779296875, -78.50390625, -75.6298828125, -72.755859375, -69.8818359375, -67.0078125, -64.1337890625, -61.259765625, -58.3857421875, -55.51171875, -52.6376953125, -49.763671875, -46.8896484375, -44.015625, -41.1416015625, -38.267578125, -35.3935546875, -32.51953125, -29.6455078125, -26.771484375, -23.8974609375, -21.0234375, -18.1494140625, -15.275390625, -12.4013671875, -9.52734375, -6.6533203125, -3.779296875, -0.9052734375, 1.96875, 4.8427734375, 7.716796875, 10.5908203125, 13.46484375, 16.3388671875, 19.212890625, 22.0869140625, 24.9609375, 27.8349609375, 30.708984375, 33.5830078125, 36.45703125, 39.3310546875, 42.205078125, 45.0791015625, 47.953125, 50.8271484375, 53.701171875, 56.5751953125, 59.44921875, 62.3232421875, 65.197265625, 68.0712890625, 70.9453125, 73.8193359375, 76.693359375, 79.5673828125, 82.44140625, 85.3154296875, 88.189453125, 91.0634765625, 93.9375]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 7.0, 6.0, 8.0, 12.0, 22.0, 29.0, 39.0, 66.0, 77.0, 126.0, 227.0, 439.0, 1515.0, 24387.0, 3108477.0, 8236.0, 1056.0, 398.0, 189.0, 138.0, 75.0, 46.0, 31.0, 26.0, 21.0, 15.0, 17.0, 5.0, 2.0, 6.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-248.875, -239.064453125, -229.25390625, -219.443359375, -209.6328125, -199.822265625, -190.01171875, -180.201171875, -170.390625, -160.580078125, -150.76953125, -140.958984375, -131.1484375, -121.337890625, -111.52734375, -101.716796875, -91.90625, -82.095703125, -72.28515625, -62.474609375, -52.6640625, -42.853515625, -33.04296875, -23.232421875, -13.421875, -3.611328125, 6.19921875, 16.009765625, 25.8203125, 35.630859375, 45.44140625, 55.251953125, 65.0625, 74.873046875, 84.68359375, 94.494140625, 104.3046875, 114.115234375, 123.92578125, 133.736328125, 143.546875, 153.357421875, 163.16796875, 172.978515625, 182.7890625, 192.599609375, 202.41015625, 212.220703125, 222.03125, 231.841796875, 241.65234375, 251.462890625, 261.2734375, 271.083984375, 280.89453125, 290.705078125, 300.515625, 310.326171875, 320.13671875, 329.947265625, 339.7578125, 349.568359375, 359.37890625, 369.189453125, 379.0]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 8.0, 8.0, 12.0, 39.0, 70.0, 157.0, 269.0, 219.0, 123.0, 59.0, 24.0, 12.0, 8.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-88.35208892822266, -83.11502075195312, -77.8779525756836, -72.64088439941406, -67.40380859375, -62.16674041748047, -56.92967224121094, -51.69260025024414, -46.45553207397461, -41.21846389770508, -35.98139190673828, -30.74432373046875, -25.507253646850586, -20.270183563232422, -15.03311538696289, -9.796043395996094, -4.5589752197265625, 0.6780943870544434, 5.915163993835449, 11.152233123779297, 16.38930320739746, 21.626373291015625, 26.863441467285156, 32.10051345825195, 37.337581634521484, 42.574649810791016, 47.81172180175781, 53.048789978027344, 58.285858154296875, 63.52293014526367, 68.75999450683594, 73.9970703125, 79.234130859375, 84.47119903564453, 89.70826721191406, 94.94534301757812, 100.18241119384766, 105.41947937011719, 110.65654754638672, 115.89361572265625, 121.13069152832031, 126.36775970458984, 131.60482788085938, 136.84190368652344, 142.07896423339844, 147.3160400390625, 152.5531005859375, 157.79017639160156, 163.02725219726562, 168.2643280029297, 173.5013885498047, 178.73846435546875, 183.97552490234375, 189.2126007080078, 194.44967651367188, 199.68673706054688, 204.92379760742188, 210.16087341308594, 215.39793395996094, 220.635009765625, 225.8720703125, 231.10914611816406, 236.34622192382812, 241.58328247070312, 246.8203582763672]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 8.0, 6.0, 9.0, 3.0, 11.0, 17.0, 10.0, 18.0, 16.0, 18.0, 21.0, 10.0, 25.0, 20.0, 31.0, 28.0, 35.0, 39.0, 39.0, 51.0, 36.0, 44.0, 36.0, 41.0, 43.0, 39.0, 45.0, 36.0, 36.0, 29.0, 33.0, 23.0, 16.0, 25.0, 19.0, 19.0, 18.0, 14.0, 13.0, 9.0, 5.0, 5.0, 3.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-184.27944946289062, -178.48728942871094, -172.6951446533203, -166.90298461914062, -161.11082458496094, -155.3186798095703, -149.52651977539062, -143.734375, -137.9422149658203, -132.15005493164062, -126.35790252685547, -120.56575012207031, -114.77359771728516, -108.9814453125, -103.18928527832031, -97.39713287353516, -91.60497283935547, -85.81282043457031, -80.02066040039062, -74.22850799560547, -68.43635559082031, -62.64419937133789, -56.85204315185547, -51.05989074707031, -45.26773452758789, -39.47557830810547, -33.68342590332031, -27.89126968383789, -22.0991153717041, -16.306961059570312, -10.51480484008789, -4.722652435302734, 1.0695037841796875, 6.861658573150635, 12.653813362121582, 18.445968627929688, 24.238122940063477, 30.030277252197266, 35.82243347167969, 41.614585876464844, 47.406742095947266, 53.19889831542969, 58.991050720214844, 64.783203125, 70.57536315917969, 76.36751556396484, 82.15966796875, 87.95182800292969, 93.74398040771484, 99.5361328125, 105.32829284667969, 111.12044525146484, 116.91259765625, 122.70475769042969, 128.49691772460938, 134.2890625, 140.0812225341797, 145.87338256835938, 151.66552734375, 157.4576873779297, 163.24984741210938, 169.0419921875, 174.8341522216797, 180.62631225585938, 186.41845703125]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 5.0, 5.0, 2.0, 9.0, 10.0, 17.0, 4.0, 13.0, 14.0, 14.0, 26.0, 15.0, 16.0, 33.0, 22.0, 30.0, 37.0, 38.0, 41.0, 31.0, 34.0, 36.0, 39.0, 49.0, 47.0, 44.0, 34.0, 37.0, 36.0, 34.0, 37.0, 23.0, 25.0, 19.0, 14.0, 21.0, 19.0, 16.0, 15.0, 11.0, 9.0, 3.0, 9.0, 6.0, 1.0, 0.0, 1.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-23.3125, -22.601806640625, -21.89111328125, -21.180419921875, -20.4697265625, -19.759033203125, -19.04833984375, -18.337646484375, -17.626953125, -16.916259765625, -16.20556640625, -15.494873046875, -14.7841796875, -14.073486328125, -13.36279296875, -12.652099609375, -11.94140625, -11.230712890625, -10.52001953125, -9.809326171875, -9.0986328125, -8.387939453125, -7.67724609375, -6.966552734375, -6.255859375, -5.545166015625, -4.83447265625, -4.123779296875, -3.4130859375, -2.702392578125, -1.99169921875, -1.281005859375, -0.5703125, 0.140380859375, 0.85107421875, 1.561767578125, 2.2724609375, 2.983154296875, 3.69384765625, 4.404541015625, 5.115234375, 5.825927734375, 6.53662109375, 7.247314453125, 7.9580078125, 8.668701171875, 9.37939453125, 10.090087890625, 10.80078125, 11.511474609375, 12.22216796875, 12.932861328125, 13.6435546875, 14.354248046875, 15.06494140625, 15.775634765625, 16.486328125, 17.197021484375, 17.90771484375, 18.618408203125, 19.3291015625, 20.039794921875, 20.75048828125, 21.461181640625, 22.171875]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 6.0, 8.0, 6.0, 9.0, 18.0, 23.0, 24.0, 33.0, 37.0, 37.0, 81.0, 113.0, 176.0, 274.0, 378.0, 519.0, 900.0, 1453.0, 2549.0, 4656.0, 9643.0, 25315.0, 558615.0, 3422234.0, 135125.0, 16635.0, 6917.0, 3468.0, 1935.0, 1095.0, 683.0, 424.0, 260.0, 187.0, 113.0, 84.0, 64.0, 43.0, 42.0, 25.0, 19.0, 14.0, 12.0, 10.0, 2.0, 1.0, 4.0, 7.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-79.6875, -77.220703125, -74.75390625, -72.287109375, -69.8203125, -67.353515625, -64.88671875, -62.419921875, -59.953125, -57.486328125, -55.01953125, -52.552734375, -50.0859375, -47.619140625, -45.15234375, -42.685546875, -40.21875, -37.751953125, -35.28515625, -32.818359375, -30.3515625, -27.884765625, -25.41796875, -22.951171875, -20.484375, -18.017578125, -15.55078125, -13.083984375, -10.6171875, -8.150390625, -5.68359375, -3.216796875, -0.75, 1.716796875, 4.18359375, 6.650390625, 9.1171875, 11.583984375, 14.05078125, 16.517578125, 18.984375, 21.451171875, 23.91796875, 26.384765625, 28.8515625, 31.318359375, 33.78515625, 36.251953125, 38.71875, 41.185546875, 43.65234375, 46.119140625, 48.5859375, 51.052734375, 53.51953125, 55.986328125, 58.453125, 60.919921875, 63.38671875, 65.853515625, 68.3203125, 70.787109375, 73.25390625, 75.720703125, 78.1875]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 5.0, 5.0, 5.0, 6.0, 13.0, 13.0, 14.0, 20.0, 17.0, 43.0, 36.0, 87.0, 179.0, 495.0, 1086.0, 1154.0, 437.0, 181.0, 88.0, 35.0, 30.0, 28.0, 25.0, 13.0, 17.0, 7.0, 6.0, 12.0, 3.0, 9.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-79.5625, -77.2236328125, -74.884765625, -72.5458984375, -70.20703125, -67.8681640625, -65.529296875, -63.1904296875, -60.8515625, -58.5126953125, -56.173828125, -53.8349609375, -51.49609375, -49.1572265625, -46.818359375, -44.4794921875, -42.140625, -39.8017578125, -37.462890625, -35.1240234375, -32.78515625, -30.4462890625, -28.107421875, -25.7685546875, -23.4296875, -21.0908203125, -18.751953125, -16.4130859375, -14.07421875, -11.7353515625, -9.396484375, -7.0576171875, -4.71875, -2.3798828125, -0.041015625, 2.2978515625, 4.63671875, 6.9755859375, 9.314453125, 11.6533203125, 13.9921875, 16.3310546875, 18.669921875, 21.0087890625, 23.34765625, 25.6865234375, 28.025390625, 30.3642578125, 32.703125, 35.0419921875, 37.380859375, 39.7197265625, 42.05859375, 44.3974609375, 46.736328125, 49.0751953125, 51.4140625, 53.7529296875, 56.091796875, 58.4306640625, 60.76953125, 63.1083984375, 65.447265625, 67.7861328125, 70.125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 3.0, 3.0, 10.0, 9.0, 12.0, 17.0, 26.0, 33.0, 69.0, 82.0, 161.0, 289.0, 580.0, 1509.0, 4069.0, 13027.0, 55027.0, 3359384.0, 706603.0, 37737.0, 9992.0, 3302.0, 1246.0, 508.0, 228.0, 135.0, 88.0, 42.0, 29.0, 28.0, 13.0, 7.0, 5.0, 7.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-137.75, -133.140625, -128.53125, -123.921875, -119.3125, -114.703125, -110.09375, -105.484375, -100.875, -96.265625, -91.65625, -87.046875, -82.4375, -77.828125, -73.21875, -68.609375, -64.0, -59.390625, -54.78125, -50.171875, -45.5625, -40.953125, -36.34375, -31.734375, -27.125, -22.515625, -17.90625, -13.296875, -8.6875, -4.078125, 0.53125, 5.140625, 9.75, 14.359375, 18.96875, 23.578125, 28.1875, 32.796875, 37.40625, 42.015625, 46.625, 51.234375, 55.84375, 60.453125, 65.0625, 69.671875, 74.28125, 78.890625, 83.5, 88.109375, 92.71875, 97.328125, 101.9375, 106.546875, 111.15625, 115.765625, 120.375, 124.984375, 129.59375, 134.203125, 138.8125, 143.421875, 148.03125, 152.640625, 157.25]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 1.0, 4.0, 3.0, 2.0, 6.0, 17.0, 9.0, 9.0, 28.0, 42.0, 62.0, 125.0, 182.0, 189.0, 113.0, 73.0, 53.0, 26.0, 18.0, 15.0, 11.0, 5.0, 10.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-148.41448974609375, -139.1709442138672, -129.92739868164062, -120.6838607788086, -111.44031524658203, -102.19676971435547, -92.95323181152344, -83.70968627929688, -74.46614074707031, -65.22259521484375, -55.97905349731445, -46.735511779785156, -37.491966247558594, -28.24842071533203, -19.004878997802734, -9.761337280273438, -0.517791748046875, 8.725751876831055, 17.969295501708984, 27.212839126586914, 36.456382751464844, 45.699928283691406, 54.9434700012207, 64.18701171875, 73.43055725097656, 82.67410278320312, 91.91764831542969, 101.16118621826172, 110.40473175048828, 119.64827728271484, 128.89181518554688, 138.13536071777344, 147.37893676757812, 156.6224822998047, 165.86602783203125, 175.1095733642578, 184.35311889648438, 193.59664916992188, 202.84019470214844, 212.083740234375, 221.32728576660156, 230.57083129882812, 239.8143768310547, 249.05792236328125, 258.30145263671875, 267.5450134277344, 276.7885437011719, 286.0321044921875, 295.275634765625, 304.5191650390625, 313.7627258300781, 323.0062561035156, 332.24981689453125, 341.49334716796875, 350.7369079589844, 359.9804382324219, 369.2239990234375, 378.467529296875, 387.7110900878906, 396.9546203613281, 406.19818115234375, 415.44171142578125, 424.6852722167969, 433.9288024902344, 443.1723327636719]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 0.0, 3.0, 4.0, 2.0, 10.0, 13.0, 6.0, 6.0, 13.0, 12.0, 18.0, 17.0, 32.0, 19.0, 31.0, 29.0, 29.0, 25.0, 40.0, 25.0, 36.0, 32.0, 45.0, 43.0, 28.0, 27.0, 34.0, 40.0, 33.0, 30.0, 37.0, 28.0, 34.0, 24.0, 24.0, 16.0, 18.0, 23.0, 23.0, 13.0, 13.0, 11.0, 10.0, 13.0, 8.0, 8.0, 8.0, 3.0, 4.0, 6.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-149.5488739013672, -145.10719299316406, -140.66549682617188, -136.22381591796875, -131.78211975097656, -127.34043884277344, -122.89875030517578, -118.45706176757812, -114.01537322998047, -109.57368469238281, -105.13199615478516, -100.6903076171875, -96.24862670898438, -91.80693054199219, -87.36524963378906, -82.9235610961914, -78.48187255859375, -74.0401840209961, -69.59849548339844, -65.15680694580078, -60.71512222290039, -56.273433685302734, -51.831748962402344, -47.39006042480469, -42.94837188720703, -38.506683349609375, -34.06499481201172, -29.623310089111328, -25.181621551513672, -20.739933013916016, -16.298246383666992, -11.856559753417969, -7.41485595703125, -2.97316837310791, 1.4685192108154297, 5.9102067947387695, 10.35189437866211, 14.793582916259766, 19.23526954650879, 23.676956176757812, 28.11864471435547, 32.560333251953125, 37.00202178955078, 41.44370651245117, 45.88539505004883, 50.327083587646484, 54.768768310546875, 59.21045684814453, 63.65214538574219, 68.09383392333984, 72.5355224609375, 76.97721099853516, 81.41889953613281, 85.86058044433594, 90.3022689819336, 94.74395751953125, 99.1856460571289, 103.62733459472656, 108.06902313232422, 112.51071166992188, 116.952392578125, 121.39408874511719, 125.83576965332031, 130.2774658203125, 134.71914672851562]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 8.0, 7.0, 9.0, 9.0, 17.0, 14.0, 20.0, 15.0, 22.0, 22.0, 25.0, 35.0, 30.0, 25.0, 38.0, 36.0, 47.0, 35.0, 32.0, 62.0, 43.0, 45.0, 46.0, 33.0, 49.0, 36.0, 34.0, 35.0, 26.0, 27.0, 21.0, 21.0, 16.0, 14.0, 13.0, 6.0, 6.0, 9.0, 4.0, 4.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-22.671875, -21.929443359375, -21.18701171875, -20.444580078125, -19.7021484375, -18.959716796875, -18.21728515625, -17.474853515625, -16.732421875, -15.989990234375, -15.24755859375, -14.505126953125, -13.7626953125, -13.020263671875, -12.27783203125, -11.535400390625, -10.79296875, -10.050537109375, -9.30810546875, -8.565673828125, -7.8232421875, -7.080810546875, -6.33837890625, -5.595947265625, -4.853515625, -4.111083984375, -3.36865234375, -2.626220703125, -1.8837890625, -1.141357421875, -0.39892578125, 0.343505859375, 1.0859375, 1.828369140625, 2.57080078125, 3.313232421875, 4.0556640625, 4.798095703125, 5.54052734375, 6.282958984375, 7.025390625, 7.767822265625, 8.51025390625, 9.252685546875, 9.9951171875, 10.737548828125, 11.47998046875, 12.222412109375, 12.96484375, 13.707275390625, 14.44970703125, 15.192138671875, 15.9345703125, 16.677001953125, 17.41943359375, 18.161865234375, 18.904296875, 19.646728515625, 20.38916015625, 21.131591796875, 21.8740234375, 22.616455078125, 23.35888671875, 24.101318359375, 24.84375]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 4.0, 7.0, 15.0, 10.0, 18.0, 40.0, 45.0, 67.0, 107.0, 133.0, 170.0, 272.0, 391.0, 609.0, 945.0, 1353.0, 2031.0, 3016.0, 4694.0, 7000.0, 10896.0, 17308.0, 27318.0, 45237.0, 75592.0, 133611.0, 222504.0, 201665.0, 117143.0, 67223.0, 39958.0, 24675.0, 15454.0, 9976.0, 6544.0, 4074.0, 2726.0, 1800.0, 1303.0, 823.0, 562.0, 388.0, 289.0, 151.0, 115.0, 83.0, 58.0, 45.0, 46.0, 20.0, 18.0, 10.0, 6.0, 5.0, 5.0, 3.0, 2.0], "bins": [-1.1494140625, -1.1154937744140625, -1.081573486328125, -1.0476531982421875, -1.01373291015625, -0.9798126220703125, -0.945892333984375, -0.9119720458984375, -0.8780517578125, -0.8441314697265625, -0.810211181640625, -0.7762908935546875, -0.74237060546875, -0.7084503173828125, -0.674530029296875, -0.6406097412109375, -0.606689453125, -0.5727691650390625, -0.538848876953125, -0.5049285888671875, -0.47100830078125, -0.4370880126953125, -0.403167724609375, -0.3692474365234375, -0.3353271484375, -0.3014068603515625, -0.267486572265625, -0.2335662841796875, -0.19964599609375, -0.1657257080078125, -0.131805419921875, -0.0978851318359375, -0.06396484375, -0.0300445556640625, 0.003875732421875, 0.0377960205078125, 0.07171630859375, 0.1056365966796875, 0.139556884765625, 0.1734771728515625, 0.2073974609375, 0.2413177490234375, 0.275238037109375, 0.3091583251953125, 0.34307861328125, 0.3769989013671875, 0.410919189453125, 0.4448394775390625, 0.478759765625, 0.5126800537109375, 0.546600341796875, 0.5805206298828125, 0.61444091796875, 0.6483612060546875, 0.682281494140625, 0.7162017822265625, 0.7501220703125, 0.7840423583984375, 0.817962646484375, 0.8518829345703125, 0.88580322265625, 0.9197235107421875, 0.953643798828125, 0.9875640869140625, 1.021484375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 6.0, 5.0, 8.0, 8.0, 8.0, 15.0, 15.0, 16.0, 19.0, 22.0, 27.0, 32.0, 32.0, 31.0, 55.0, 51.0, 51.0, 52.0, 35.0, 1073.0, 55.0, 43.0, 47.0, 28.0, 36.0, 31.0, 37.0, 25.0, 31.0, 19.0, 19.0, 14.0, 21.0, 16.0, 11.0, 7.0, 6.0, 4.0, 7.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0], "bins": [-18.796875, -18.2950439453125, -17.793212890625, -17.2913818359375, -16.78955078125, -16.2877197265625, -15.785888671875, -15.2840576171875, -14.7822265625, -14.2803955078125, -13.778564453125, -13.2767333984375, -12.77490234375, -12.2730712890625, -11.771240234375, -11.2694091796875, -10.767578125, -10.2657470703125, -9.763916015625, -9.2620849609375, -8.76025390625, -8.2584228515625, -7.756591796875, -7.2547607421875, -6.7529296875, -6.2510986328125, -5.749267578125, -5.2474365234375, -4.74560546875, -4.2437744140625, -3.741943359375, -3.2401123046875, -2.73828125, -2.2364501953125, -1.734619140625, -1.2327880859375, -0.73095703125, -0.2291259765625, 0.272705078125, 0.7745361328125, 1.2763671875, 1.7781982421875, 2.280029296875, 2.7818603515625, 3.28369140625, 3.7855224609375, 4.287353515625, 4.7891845703125, 5.291015625, 5.7928466796875, 6.294677734375, 6.7965087890625, 7.29833984375, 7.8001708984375, 8.302001953125, 8.8038330078125, 9.3056640625, 9.8074951171875, 10.309326171875, 10.8111572265625, 11.31298828125, 11.8148193359375, 12.316650390625, 12.8184814453125, 13.3203125]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 3.0, 11.0, 11.0, 20.0, 35.0, 37.0, 67.0, 82.0, 149.0, 204.0, 320.0, 493.0, 734.0, 1118.0, 1643.0, 2530.0, 3899.0, 5814.0, 8718.0, 13920.0, 21844.0, 36409.0, 62708.0, 117720.0, 253413.0, 1267008.0, 127291.0, 67418.0, 38545.0, 23094.0, 14563.0, 9414.0, 6091.0, 3921.0, 2687.0, 1710.0, 1174.0, 832.0, 474.0, 331.0, 243.0, 165.0, 88.0, 61.0, 40.0, 27.0, 20.0, 12.0, 8.0, 4.0, 6.0, 5.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-1.0283203125, -0.995208740234375, -0.96209716796875, -0.928985595703125, -0.8958740234375, -0.862762451171875, -0.82965087890625, -0.796539306640625, -0.763427734375, -0.730316162109375, -0.69720458984375, -0.664093017578125, -0.6309814453125, -0.597869873046875, -0.56475830078125, -0.531646728515625, -0.49853515625, -0.465423583984375, -0.43231201171875, -0.399200439453125, -0.3660888671875, -0.332977294921875, -0.29986572265625, -0.266754150390625, -0.233642578125, -0.200531005859375, -0.16741943359375, -0.134307861328125, -0.1011962890625, -0.068084716796875, -0.03497314453125, -0.001861572265625, 0.03125, 0.064361572265625, 0.09747314453125, 0.130584716796875, 0.1636962890625, 0.196807861328125, 0.22991943359375, 0.263031005859375, 0.296142578125, 0.329254150390625, 0.36236572265625, 0.395477294921875, 0.4285888671875, 0.461700439453125, 0.49481201171875, 0.527923583984375, 0.56103515625, 0.594146728515625, 0.62725830078125, 0.660369873046875, 0.6934814453125, 0.726593017578125, 0.75970458984375, 0.792816162109375, 0.825927734375, 0.859039306640625, 0.89215087890625, 0.925262451171875, 0.9583740234375, 0.991485595703125, 1.02459716796875, 1.057708740234375, 1.0908203125]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 4.0, 5.0, 6.0, 6.0, 6.0, 11.0, 14.0, 17.0, 25.0, 28.0, 39.0, 39.0, 43.0, 49.0, 49.0, 42.0, 60.0, 50.0, 42.0, 61.0, 48.0, 55.0, 50.0, 46.0, 41.0, 35.0, 17.0, 19.0, 14.0, 20.0, 13.0, 17.0, 9.0, 4.0, 6.0, 8.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.004486083984375, -0.004356026649475098, -0.004225969314575195, -0.004095911979675293, -0.003965854644775391, -0.0038357973098754883, -0.003705739974975586, -0.0035756826400756836, -0.0034456253051757812, -0.003315567970275879, -0.0031855106353759766, -0.0030554533004760742, -0.002925395965576172, -0.0027953386306762695, -0.002665281295776367, -0.002535223960876465, -0.0024051666259765625, -0.00227510929107666, -0.002145051956176758, -0.0020149946212768555, -0.0018849372863769531, -0.0017548799514770508, -0.0016248226165771484, -0.001494765281677246, -0.0013647079467773438, -0.0012346506118774414, -0.001104593276977539, -0.0009745359420776367, -0.0008444786071777344, -0.000714421272277832, -0.0005843639373779297, -0.00045430660247802734, -0.000324249267578125, -0.00019419193267822266, -6.413459777832031e-05, 6.592273712158203e-05, 0.00019598007202148438, 0.0003260374069213867, 0.00045609474182128906, 0.0005861520767211914, 0.0007162094116210938, 0.0008462667465209961, 0.0009763240814208984, 0.0011063814163208008, 0.0012364387512207031, 0.0013664960861206055, 0.0014965534210205078, 0.0016266107559204102, 0.0017566680908203125, 0.0018867254257202148, 0.002016782760620117, 0.0021468400955200195, 0.002276897430419922, 0.0024069547653198242, 0.0025370121002197266, 0.002667069435119629, 0.0027971267700195312, 0.0029271841049194336, 0.003057241439819336, 0.0031872987747192383, 0.0033173561096191406, 0.003447413444519043, 0.0035774707794189453, 0.0037075281143188477, 0.00383758544921875]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 5.0, 1.0, 3.0, 6.0, 13.0, 16.0, 19.0, 12.0, 26.0, 30.0, 43.0, 47.0, 93.0, 108.0, 165.0, 309.0, 1347.0, 39224.0, 972675.0, 32292.0, 1165.0, 322.0, 192.0, 112.0, 78.0, 59.0, 53.0, 37.0, 24.0, 17.0, 18.0, 12.0, 9.0, 9.0, 2.0, 7.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.081298828125, -0.07871627807617188, -0.07613372802734375, -0.07355117797851562, -0.0709686279296875, -0.06838607788085938, -0.06580352783203125, -0.06322097778320312, -0.060638427734375, -0.058055877685546875, -0.05547332763671875, -0.052890777587890625, -0.0503082275390625, -0.047725677490234375, -0.04514312744140625, -0.042560577392578125, -0.03997802734375, -0.037395477294921875, -0.03481292724609375, -0.032230377197265625, -0.0296478271484375, -0.027065277099609375, -0.02448272705078125, -0.021900177001953125, -0.019317626953125, -0.016735076904296875, -0.01415252685546875, -0.011569976806640625, -0.0089874267578125, -0.006404876708984375, -0.00382232666015625, -0.001239776611328125, 0.0013427734375, 0.003925323486328125, 0.00650787353515625, 0.009090423583984375, 0.0116729736328125, 0.014255523681640625, 0.01683807373046875, 0.019420623779296875, 0.022003173828125, 0.024585723876953125, 0.02716827392578125, 0.029750823974609375, 0.0323333740234375, 0.034915924072265625, 0.03749847412109375, 0.040081024169921875, 0.04266357421875, 0.045246124267578125, 0.04782867431640625, 0.050411224365234375, 0.0529937744140625, 0.055576324462890625, 0.05815887451171875, 0.060741424560546875, 0.063323974609375, 0.06590652465820312, 0.06848907470703125, 0.07107162475585938, 0.0736541748046875, 0.07623672485351562, 0.07881927490234375, 0.08140182495117188, 0.083984375]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 10.0, 72.0, 440.0, 382.0, 87.0, 15.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.014348218217492104, -0.013694781810045242, -0.013041345402598381, -0.01238790899515152, -0.011734472587704659, -0.011081036180257797, -0.010427598841488361, -0.0097741624340415, -0.009120726026594639, -0.008467289619147778, -0.007813853211700916, -0.007160416338592768, -0.0065069799311459064, -0.005853543523699045, -0.005200106650590897, -0.004546670243144035, -0.003893233835697174, -0.003239797428250313, -0.002586360787972808, -0.001932924147695303, -0.0012794877402484417, -0.0006260513328015804, 2.7385540306568146e-05, 0.0006808219477534294, 0.0013342583552002907, 0.001987694762647152, 0.002641131402924657, 0.003294568043202162, 0.003948004450649023, 0.004601440858095884, 0.005254877731204033, 0.005908314138650894, 0.006561752408742905, 0.007215188816189766, 0.007868625223636627, 0.008522061631083488, 0.00917549803853035, 0.009828934445977211, 0.010482371784746647, 0.011135808192193508, 0.01178924459964037, 0.01244268100708723, 0.013096117414534092, 0.013749554753303528, 0.014402991160750389, 0.01505642756819725, 0.01570986397564411, 0.016363300383090973, 0.017016736790537834, 0.017670173197984695, 0.018323609605431557, 0.018977046012878418, 0.01963048242032528, 0.02028391882777214, 0.02093735709786415, 0.021590791642665863, 0.022244229912757874, 0.022897666320204735, 0.023551102727651596, 0.024204539135098457, 0.02485797554254532, 0.02551141194999218, 0.02616484835743904, 0.02681828662753105, 0.027471721172332764]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 8.0, 5.0, 10.0, 9.0, 15.0, 9.0, 23.0, 15.0, 16.0, 26.0, 33.0, 23.0, 28.0, 29.0, 26.0, 40.0, 42.0, 38.0, 46.0, 31.0, 43.0, 32.0, 47.0, 37.0, 38.0, 30.0, 42.0, 27.0, 29.0, 31.0, 24.0, 24.0, 24.0, 22.0, 17.0, 13.0, 12.0, 11.0, 14.0, 5.0, 1.0, 6.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.002149343490600586, -0.0020791543647646904, -0.002008965238928795, -0.0019387761130928993, -0.0018685869872570038, -0.0017983978614211082, -0.0017282087355852127, -0.0016580196097493172, -0.0015878304839134216, -0.001517641358077526, -0.0014474522322416306, -0.001377263106405735, -0.0013070739805698395, -0.001236884854733944, -0.0011666957288980484, -0.0010965066030621529, -0.0010263174772262573, -0.0009561283513903618, -0.0008859392255544662, -0.0008157500997185707, -0.0007455609738826752, -0.0006753718480467796, -0.0006051827222108841, -0.0005349935963749886, -0.000464804470539093, -0.0003946153447031975, -0.00032442621886730194, -0.0002542370930314064, -0.00018404796719551086, -0.00011385884135961533, -4.366971552371979e-05, 2.651941031217575e-05, 9.670853614807129e-05, 0.00016689766198396683, 0.00023708678781986237, 0.0003072759136557579, 0.00037746503949165344, 0.000447654165327549, 0.0005178432911634445, 0.0005880324169993401, 0.0006582215428352356, 0.0007284106686711311, 0.0007985997945070267, 0.0008687889203429222, 0.0009389780461788177, 0.0010091671720147133, 0.0010793562978506088, 0.0011495454236865044, 0.0012197345495224, 0.0012899236753582954, 0.001360112801194191, 0.0014303019270300865, 0.001500491052865982, 0.0015706801787018776, 0.0016408693045377731, 0.0017110584303736687, 0.0017812475562095642, 0.0018514366820454597, 0.0019216258078813553, 0.001991814933717251, 0.0020620040595531464, 0.002132193185389042, 0.0022023823112249374, 0.002272571437060833, 0.0023427605628967285]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 8.0, 7.0, 9.0, 9.0, 17.0, 14.0, 20.0, 15.0, 22.0, 22.0, 25.0, 35.0, 30.0, 25.0, 38.0, 36.0, 47.0, 35.0, 32.0, 62.0, 43.0, 45.0, 46.0, 33.0, 49.0, 36.0, 34.0, 35.0, 26.0, 27.0, 21.0, 21.0, 16.0, 14.0, 13.0, 6.0, 6.0, 9.0, 4.0, 4.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-22.671875, -21.929443359375, -21.18701171875, -20.444580078125, -19.7021484375, -18.959716796875, -18.21728515625, -17.474853515625, -16.732421875, -15.989990234375, -15.24755859375, -14.505126953125, -13.7626953125, -13.020263671875, -12.27783203125, -11.535400390625, -10.79296875, -10.050537109375, -9.30810546875, -8.565673828125, -7.8232421875, -7.080810546875, -6.33837890625, -5.595947265625, -4.853515625, -4.111083984375, -3.36865234375, -2.626220703125, -1.8837890625, -1.141357421875, -0.39892578125, 0.343505859375, 1.0859375, 1.828369140625, 2.57080078125, 3.313232421875, 4.0556640625, 4.798095703125, 5.54052734375, 6.282958984375, 7.025390625, 7.767822265625, 8.51025390625, 9.252685546875, 9.9951171875, 10.737548828125, 11.47998046875, 12.222412109375, 12.96484375, 13.707275390625, 14.44970703125, 15.192138671875, 15.9345703125, 16.677001953125, 17.41943359375, 18.161865234375, 18.904296875, 19.646728515625, 20.38916015625, 21.131591796875, 21.8740234375, 22.616455078125, 23.35888671875, 24.101318359375, 24.84375]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 12.0, 9.0, 12.0, 6.0, 24.0, 28.0, 45.0, 56.0, 88.0, 120.0, 187.0, 289.0, 416.0, 599.0, 1005.0, 1588.0, 2712.0, 4909.0, 9430.0, 23553.0, 103341.0, 679998.0, 164657.0, 30620.0, 11143.0, 5457.0, 3186.0, 1837.0, 1120.0, 690.0, 433.0, 315.0, 222.0, 114.0, 91.0, 63.0, 57.0, 34.0, 28.0, 12.0, 15.0, 10.0, 6.0, 9.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0], "bins": [-32.09375, -31.138916015625, -30.18408203125, -29.229248046875, -28.2744140625, -27.319580078125, -26.36474609375, -25.409912109375, -24.455078125, -23.500244140625, -22.54541015625, -21.590576171875, -20.6357421875, -19.680908203125, -18.72607421875, -17.771240234375, -16.81640625, -15.861572265625, -14.90673828125, -13.951904296875, -12.9970703125, -12.042236328125, -11.08740234375, -10.132568359375, -9.177734375, -8.222900390625, -7.26806640625, -6.313232421875, -5.3583984375, -4.403564453125, -3.44873046875, -2.493896484375, -1.5390625, -0.584228515625, 0.37060546875, 1.325439453125, 2.2802734375, 3.235107421875, 4.18994140625, 5.144775390625, 6.099609375, 7.054443359375, 8.00927734375, 8.964111328125, 9.9189453125, 10.873779296875, 11.82861328125, 12.783447265625, 13.73828125, 14.693115234375, 15.64794921875, 16.602783203125, 17.5576171875, 18.512451171875, 19.46728515625, 20.422119140625, 21.376953125, 22.331787109375, 23.28662109375, 24.241455078125, 25.1962890625, 26.151123046875, 27.10595703125, 28.060791015625, 29.015625]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 3.0, 5.0, 7.0, 9.0, 10.0, 23.0, 11.0, 13.0, 20.0, 30.0, 36.0, 47.0, 35.0, 45.0, 63.0, 56.0, 77.0, 279.0, 1726.0, 94.0, 74.0, 52.0, 48.0, 37.0, 39.0, 33.0, 32.0, 28.0, 22.0, 19.0, 14.0, 15.0, 9.0, 8.0, 5.0, 3.0, 8.0, 1.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 3.0], "bins": [-87.25, -84.6953125, -82.140625, -79.5859375, -77.03125, -74.4765625, -71.921875, -69.3671875, -66.8125, -64.2578125, -61.703125, -59.1484375, -56.59375, -54.0390625, -51.484375, -48.9296875, -46.375, -43.8203125, -41.265625, -38.7109375, -36.15625, -33.6015625, -31.046875, -28.4921875, -25.9375, -23.3828125, -20.828125, -18.2734375, -15.71875, -13.1640625, -10.609375, -8.0546875, -5.5, -2.9453125, -0.390625, 2.1640625, 4.71875, 7.2734375, 9.828125, 12.3828125, 14.9375, 17.4921875, 20.046875, 22.6015625, 25.15625, 27.7109375, 30.265625, 32.8203125, 35.375, 37.9296875, 40.484375, 43.0390625, 45.59375, 48.1484375, 50.703125, 53.2578125, 55.8125, 58.3671875, 60.921875, 63.4765625, 66.03125, 68.5859375, 71.140625, 73.6953125, 76.25]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 6.0, 8.0, 6.0, 15.0, 17.0, 27.0, 43.0, 65.0, 102.0, 137.0, 295.0, 980.0, 22992.0, 3114994.0, 4917.0, 585.0, 196.0, 116.0, 72.0, 45.0, 32.0, 17.0, 12.0, 10.0, 5.0, 2.0, 2.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-308.5, -297.98046875, -287.4609375, -276.94140625, -266.421875, -255.90234375, -245.3828125, -234.86328125, -224.34375, -213.82421875, -203.3046875, -192.78515625, -182.265625, -171.74609375, -161.2265625, -150.70703125, -140.1875, -129.66796875, -119.1484375, -108.62890625, -98.109375, -87.58984375, -77.0703125, -66.55078125, -56.03125, -45.51171875, -34.9921875, -24.47265625, -13.953125, -3.43359375, 7.0859375, 17.60546875, 28.125, 38.64453125, 49.1640625, 59.68359375, 70.203125, 80.72265625, 91.2421875, 101.76171875, 112.28125, 122.80078125, 133.3203125, 143.83984375, 154.359375, 164.87890625, 175.3984375, 185.91796875, 196.4375, 206.95703125, 217.4765625, 227.99609375, 238.515625, 249.03515625, 259.5546875, 270.07421875, 280.59375, 291.11328125, 301.6328125, 312.15234375, 322.671875, 333.19140625, 343.7109375, 354.23046875, 364.75]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 5.0, 8.0, 6.0, 10.0, 31.0, 50.0, 92.0, 138.0, 248.0, 216.0, 103.0, 56.0, 19.0, 15.0, 11.0, 4.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.34490203857422, -58.84526062011719, -53.345619201660156, -47.84598159790039, -42.34634017944336, -36.84669876098633, -31.347061157226562, -25.84741973876953, -20.3477783203125, -14.848137855529785, -9.34849739074707, -3.848857879638672, 1.6507835388183594, 7.150424957275391, 12.650062561035156, 18.149703979492188, 23.64934539794922, 29.14898681640625, 34.64862823486328, 40.14826583862305, 45.64790725708008, 51.14754867553711, 56.647186279296875, 62.146827697753906, 67.64646911621094, 73.14611053466797, 78.645751953125, 84.1453857421875, 89.64503479003906, 95.14466857910156, 100.6443099975586, 106.14395141601562, 111.64358520507812, 117.14322662353516, 122.64286804199219, 128.1425018310547, 133.64215087890625, 139.14178466796875, 144.64141845703125, 150.1410675048828, 155.64071655273438, 161.14035034179688, 166.63999938964844, 172.13963317871094, 177.6392822265625, 183.138916015625, 188.6385498046875, 194.13819885253906, 199.63783264160156, 205.13746643066406, 210.63711547851562, 216.13674926757812, 221.6363983154297, 227.1360321044922, 232.63568115234375, 238.13531494140625, 243.63494873046875, 249.13458251953125, 254.6342315673828, 260.1338806152344, 265.6335144042969, 271.1331481933594, 276.6327819824219, 282.1324462890625, 287.632080078125]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 7.0, 6.0, 8.0, 9.0, 8.0, 9.0, 12.0, 7.0, 11.0, 18.0, 18.0, 22.0, 25.0, 24.0, 20.0, 14.0, 25.0, 29.0, 32.0, 36.0, 33.0, 33.0, 33.0, 48.0, 48.0, 41.0, 29.0, 44.0, 40.0, 27.0, 41.0, 40.0, 33.0, 33.0, 27.0, 14.0, 25.0, 16.0, 12.0, 6.0, 8.0, 9.0, 5.0, 10.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 2.0, 2.0], "bins": [-224.2779998779297, -218.01217651367188, -211.746337890625, -205.4805145263672, -199.21469116210938, -192.9488525390625, -186.6830291748047, -180.41720581054688, -174.1513671875, -167.8855438232422, -161.6197052001953, -155.3538818359375, -149.0880584716797, -142.8222198486328, -136.556396484375, -130.29055786132812, -124.02474212646484, -117.7589111328125, -111.49308776855469, -105.22725677490234, -98.96142578125, -92.69560241699219, -86.42977142333984, -80.1639404296875, -73.89811706542969, -67.63228607177734, -61.366458892822266, -55.10063171386719, -48.834800720214844, -42.568973541259766, -36.30314636230469, -30.037315368652344, -23.771484375, -17.50565528869629, -11.239827156066895, -4.9739990234375, 1.291830062866211, 7.557659149169922, 13.823486328125, 20.089317321777344, 26.355144500732422, 32.6209716796875, 38.886802673339844, 45.15262985229492, 51.41845703125, 57.684288024902344, 63.95011520385742, 70.2159423828125, 76.48177337646484, 82.74760437011719, 89.013427734375, 95.27925872802734, 101.54508972167969, 107.8109130859375, 114.07674407958984, 120.34257507324219, 126.6083984375, 132.8742218017578, 139.1400604248047, 145.4058837890625, 151.6717071533203, 157.9375457763672, 164.203369140625, 170.46920776367188, 176.7350311279297]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 3.0, 9.0, 12.0, 11.0, 7.0, 19.0, 16.0, 20.0, 17.0, 15.0, 27.0, 33.0, 24.0, 36.0, 38.0, 48.0, 34.0, 42.0, 37.0, 43.0, 55.0, 40.0, 38.0, 45.0, 38.0, 46.0, 32.0, 28.0, 35.0, 25.0, 22.0, 26.0, 9.0, 18.0, 16.0, 5.0, 9.0, 5.0, 3.0, 2.0, 6.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-25.46875, -24.66552734375, -23.8623046875, -23.05908203125, -22.255859375, -21.45263671875, -20.6494140625, -19.84619140625, -19.04296875, -18.23974609375, -17.4365234375, -16.63330078125, -15.830078125, -15.02685546875, -14.2236328125, -13.42041015625, -12.6171875, -11.81396484375, -11.0107421875, -10.20751953125, -9.404296875, -8.60107421875, -7.7978515625, -6.99462890625, -6.19140625, -5.38818359375, -4.5849609375, -3.78173828125, -2.978515625, -2.17529296875, -1.3720703125, -0.56884765625, 0.234375, 1.03759765625, 1.8408203125, 2.64404296875, 3.447265625, 4.25048828125, 5.0537109375, 5.85693359375, 6.66015625, 7.46337890625, 8.2666015625, 9.06982421875, 9.873046875, 10.67626953125, 11.4794921875, 12.28271484375, 13.0859375, 13.88916015625, 14.6923828125, 15.49560546875, 16.298828125, 17.10205078125, 17.9052734375, 18.70849609375, 19.51171875, 20.31494140625, 21.1181640625, 21.92138671875, 22.724609375, 23.52783203125, 24.3310546875, 25.13427734375, 25.9375]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 6.0, 5.0, 16.0, 20.0, 19.0, 14.0, 35.0, 33.0, 55.0, 66.0, 88.0, 139.0, 227.0, 325.0, 530.0, 1042.0, 2168.0, 4836.0, 11022.0, 53803.0, 2614181.0, 1452386.0, 35847.0, 9371.0, 3878.0, 1826.0, 913.0, 494.0, 282.0, 198.0, 129.0, 90.0, 57.0, 47.0, 32.0, 28.0, 17.0, 15.0, 17.0, 7.0, 4.0, 9.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-82.1875, -79.529296875, -76.87109375, -74.212890625, -71.5546875, -68.896484375, -66.23828125, -63.580078125, -60.921875, -58.263671875, -55.60546875, -52.947265625, -50.2890625, -47.630859375, -44.97265625, -42.314453125, -39.65625, -36.998046875, -34.33984375, -31.681640625, -29.0234375, -26.365234375, -23.70703125, -21.048828125, -18.390625, -15.732421875, -13.07421875, -10.416015625, -7.7578125, -5.099609375, -2.44140625, 0.216796875, 2.875, 5.533203125, 8.19140625, 10.849609375, 13.5078125, 16.166015625, 18.82421875, 21.482421875, 24.140625, 26.798828125, 29.45703125, 32.115234375, 34.7734375, 37.431640625, 40.08984375, 42.748046875, 45.40625, 48.064453125, 50.72265625, 53.380859375, 56.0390625, 58.697265625, 61.35546875, 64.013671875, 66.671875, 69.330078125, 71.98828125, 74.646484375, 77.3046875, 79.962890625, 82.62109375, 85.279296875, 87.9375]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 0.0, 3.0, 4.0, 0.0, 3.0, 1.0, 0.0, 5.0, 6.0, 5.0, 6.0, 12.0, 10.0, 10.0, 25.0, 16.0, 25.0, 30.0, 37.0, 61.0, 94.0, 172.0, 334.0, 605.0, 986.0, 725.0, 380.0, 174.0, 85.0, 66.0, 38.0, 35.0, 28.0, 20.0, 16.0, 14.0, 8.0, 12.0, 7.0, 4.0, 7.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-50.0, -48.25048828125, -46.5009765625, -44.75146484375, -43.001953125, -41.25244140625, -39.5029296875, -37.75341796875, -36.00390625, -34.25439453125, -32.5048828125, -30.75537109375, -29.005859375, -27.25634765625, -25.5068359375, -23.75732421875, -22.0078125, -20.25830078125, -18.5087890625, -16.75927734375, -15.009765625, -13.26025390625, -11.5107421875, -9.76123046875, -8.01171875, -6.26220703125, -4.5126953125, -2.76318359375, -1.013671875, 0.73583984375, 2.4853515625, 4.23486328125, 5.984375, 7.73388671875, 9.4833984375, 11.23291015625, 12.982421875, 14.73193359375, 16.4814453125, 18.23095703125, 19.98046875, 21.72998046875, 23.4794921875, 25.22900390625, 26.978515625, 28.72802734375, 30.4775390625, 32.22705078125, 33.9765625, 35.72607421875, 37.4755859375, 39.22509765625, 40.974609375, 42.72412109375, 44.4736328125, 46.22314453125, 47.97265625, 49.72216796875, 51.4716796875, 53.22119140625, 54.970703125, 56.72021484375, 58.4697265625, 60.21923828125, 61.96875]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 4.0, 6.0, 11.0, 8.0, 13.0, 16.0, 23.0, 32.0, 52.0, 96.0, 201.0, 474.0, 1481.0, 5490.0, 28805.0, 1324035.0, 2791166.0, 33466.0, 6173.0, 1651.0, 562.0, 229.0, 91.0, 51.0, 33.0, 31.0, 13.0, 14.0, 11.0, 9.0, 7.0, 8.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-205.25, -199.5546875, -193.859375, -188.1640625, -182.46875, -176.7734375, -171.078125, -165.3828125, -159.6875, -153.9921875, -148.296875, -142.6015625, -136.90625, -131.2109375, -125.515625, -119.8203125, -114.125, -108.4296875, -102.734375, -97.0390625, -91.34375, -85.6484375, -79.953125, -74.2578125, -68.5625, -62.8671875, -57.171875, -51.4765625, -45.78125, -40.0859375, -34.390625, -28.6953125, -23.0, -17.3046875, -11.609375, -5.9140625, -0.21875, 5.4765625, 11.171875, 16.8671875, 22.5625, 28.2578125, 33.953125, 39.6484375, 45.34375, 51.0390625, 56.734375, 62.4296875, 68.125, 73.8203125, 79.515625, 85.2109375, 90.90625, 96.6015625, 102.296875, 107.9921875, 113.6875, 119.3828125, 125.078125, 130.7734375, 136.46875, 142.1640625, 147.859375, 153.5546875, 159.25]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 8.0, 19.0, 36.0, 125.0, 357.0, 326.0, 92.0, 27.0, 11.0, 8.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-317.2574462890625, -295.9310607910156, -274.60467529296875, -253.2782745361328, -231.95188903808594, -210.62550354003906, -189.29910278320312, -167.97271728515625, -146.64633178710938, -125.3199462890625, -103.9935531616211, -82.66716003417969, -61.34077453613281, -40.01438903808594, -18.68799591064453, 2.638397216796875, 23.96478271484375, 45.29117202758789, 66.61756134033203, 87.94395446777344, 109.27033996582031, 130.5967254638672, 151.92312622070312, 173.24951171875, 194.57589721679688, 215.90228271484375, 237.22866821289062, 258.5550537109375, 279.8814697265625, 301.20782470703125, 322.53424072265625, 343.8606262207031, 365.18701171875, 386.5133972167969, 407.83978271484375, 429.1661682128906, 450.4925537109375, 471.8189697265625, 493.1453552246094, 514.4717407226562, 535.798095703125, 557.12451171875, 578.4508666992188, 599.7772827148438, 621.1036376953125, 642.4300537109375, 663.7564086914062, 685.0828247070312, 706.4092407226562, 727.7356567382812, 749.06201171875, 770.388427734375, 791.7147827148438, 813.0411987304688, 834.3675537109375, 855.6939697265625, 877.0203857421875, 898.3468017578125, 919.6731567382812, 940.9995727539062, 962.325927734375, 983.65234375, 1004.9786987304688, 1026.30517578125, 1047.6314697265625]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 9.0, 7.0, 4.0, 8.0, 5.0, 7.0, 10.0, 13.0, 12.0, 21.0, 19.0, 17.0, 27.0, 23.0, 24.0, 23.0, 33.0, 26.0, 31.0, 25.0, 32.0, 25.0, 39.0, 43.0, 40.0, 40.0, 47.0, 41.0, 40.0, 25.0, 27.0, 29.0, 26.0, 25.0, 26.0, 23.0, 23.0, 13.0, 12.0, 13.0, 8.0, 17.0, 9.0, 8.0, 2.0, 6.0, 9.0, 6.0, 5.0, 2.0, 0.0, 2.0, 2.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-119.8083724975586, -115.5762939453125, -111.3442153930664, -107.11213684082031, -102.88005828857422, -98.64797973632812, -94.41590881347656, -90.18382263183594, -85.95175170898438, -81.71967315673828, -77.48759460449219, -73.2555160522461, -69.0234375, -64.7913589477539, -60.55928421020508, -56.327205657958984, -52.095123291015625, -47.86304473876953, -43.63096618652344, -39.398887634277344, -35.16680908203125, -30.93473243713379, -26.702655792236328, -22.470577239990234, -18.23849868774414, -14.006420135498047, -9.77434253692627, -5.542264938354492, -1.3101863861083984, 2.9218921661376953, 7.153968811035156, 11.38604736328125, 15.618133544921875, 19.85021209716797, 24.082290649414062, 28.314367294311523, 32.54644775390625, 36.778526306152344, 41.01060104370117, 45.242679595947266, 49.47475814819336, 53.70683670043945, 57.93891525268555, 62.170989990234375, 66.40306854248047, 70.63514709472656, 74.86722564697266, 79.09930419921875, 83.33138275146484, 87.56346130371094, 91.79553985595703, 96.02761840820312, 100.25969696044922, 104.49177551269531, 108.72384643554688, 112.9559326171875, 117.18800354003906, 121.42008209228516, 125.65216064453125, 129.8842315673828, 134.11631774902344, 138.348388671875, 142.58047485351562, 146.8125457763672, 151.0446319580078]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 8.0, 10.0, 7.0, 7.0, 15.0, 14.0, 21.0, 22.0, 21.0, 20.0, 41.0, 29.0, 31.0, 33.0, 32.0, 52.0, 50.0, 43.0, 65.0, 55.0, 46.0, 41.0, 44.0, 40.0, 35.0, 41.0, 36.0, 18.0, 32.0, 19.0, 19.0, 13.0, 8.0, 8.0, 6.0, 6.0, 5.0, 3.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.234375, -23.384033203125, -22.53369140625, -21.683349609375, -20.8330078125, -19.982666015625, -19.13232421875, -18.281982421875, -17.431640625, -16.581298828125, -15.73095703125, -14.880615234375, -14.0302734375, -13.179931640625, -12.32958984375, -11.479248046875, -10.62890625, -9.778564453125, -8.92822265625, -8.077880859375, -7.2275390625, -6.377197265625, -5.52685546875, -4.676513671875, -3.826171875, -2.975830078125, -2.12548828125, -1.275146484375, -0.4248046875, 0.425537109375, 1.27587890625, 2.126220703125, 2.9765625, 3.826904296875, 4.67724609375, 5.527587890625, 6.3779296875, 7.228271484375, 8.07861328125, 8.928955078125, 9.779296875, 10.629638671875, 11.47998046875, 12.330322265625, 13.1806640625, 14.031005859375, 14.88134765625, 15.731689453125, 16.58203125, 17.432373046875, 18.28271484375, 19.133056640625, 19.9833984375, 20.833740234375, 21.68408203125, 22.534423828125, 23.384765625, 24.235107421875, 25.08544921875, 25.935791015625, 26.7861328125, 27.636474609375, 28.48681640625, 29.337158203125, 30.1875]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 6.0, 18.0, 18.0, 20.0, 28.0, 55.0, 96.0, 108.0, 222.0, 316.0, 498.0, 822.0, 1324.0, 2176.0, 3583.0, 6306.0, 10997.0, 20429.0, 39454.0, 80230.0, 173485.0, 320301.0, 200144.0, 90844.0, 44695.0, 22978.0, 12338.0, 6972.0, 4016.0, 2320.0, 1412.0, 870.0, 515.0, 326.0, 242.0, 123.0, 89.0, 62.0, 35.0, 32.0, 24.0, 8.0, 4.0, 4.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.54296875, -1.4956207275390625, -1.448272705078125, -1.4009246826171875, -1.35357666015625, -1.3062286376953125, -1.258880615234375, -1.2115325927734375, -1.1641845703125, -1.1168365478515625, -1.069488525390625, -1.0221405029296875, -0.97479248046875, -0.9274444580078125, -0.880096435546875, -0.8327484130859375, -0.785400390625, -0.7380523681640625, -0.690704345703125, -0.6433563232421875, -0.59600830078125, -0.5486602783203125, -0.501312255859375, -0.4539642333984375, -0.4066162109375, -0.3592681884765625, -0.311920166015625, -0.2645721435546875, -0.21722412109375, -0.1698760986328125, -0.122528076171875, -0.0751800537109375, -0.02783203125, 0.0195159912109375, 0.066864013671875, 0.1142120361328125, 0.16156005859375, 0.2089080810546875, 0.256256103515625, 0.3036041259765625, 0.3509521484375, 0.3983001708984375, 0.445648193359375, 0.4929962158203125, 0.54034423828125, 0.5876922607421875, 0.635040283203125, 0.6823883056640625, 0.729736328125, 0.7770843505859375, 0.824432373046875, 0.8717803955078125, 0.91912841796875, 0.9664764404296875, 1.013824462890625, 1.0611724853515625, 1.1085205078125, 1.1558685302734375, 1.203216552734375, 1.2505645751953125, 1.29791259765625, 1.3452606201171875, 1.392608642578125, 1.4399566650390625, 1.4873046875]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 2.0, 4.0, 3.0, 7.0, 4.0, 8.0, 10.0, 13.0, 5.0, 11.0, 19.0, 27.0, 31.0, 27.0, 37.0, 25.0, 46.0, 45.0, 40.0, 41.0, 50.0, 35.0, 1070.0, 48.0, 41.0, 43.0, 36.0, 43.0, 31.0, 38.0, 26.0, 30.0, 29.0, 21.0, 12.0, 16.0, 10.0, 14.0, 7.0, 9.0, 2.0, 3.0, 3.0, 4.0, 1.0, 0.0, 4.0, 2.0, 0.0, 2.0], "bins": [-19.375, -18.843017578125, -18.31103515625, -17.779052734375, -17.2470703125, -16.715087890625, -16.18310546875, -15.651123046875, -15.119140625, -14.587158203125, -14.05517578125, -13.523193359375, -12.9912109375, -12.459228515625, -11.92724609375, -11.395263671875, -10.86328125, -10.331298828125, -9.79931640625, -9.267333984375, -8.7353515625, -8.203369140625, -7.67138671875, -7.139404296875, -6.607421875, -6.075439453125, -5.54345703125, -5.011474609375, -4.4794921875, -3.947509765625, -3.41552734375, -2.883544921875, -2.3515625, -1.819580078125, -1.28759765625, -0.755615234375, -0.2236328125, 0.308349609375, 0.84033203125, 1.372314453125, 1.904296875, 2.436279296875, 2.96826171875, 3.500244140625, 4.0322265625, 4.564208984375, 5.09619140625, 5.628173828125, 6.16015625, 6.692138671875, 7.22412109375, 7.756103515625, 8.2880859375, 8.820068359375, 9.35205078125, 9.884033203125, 10.416015625, 10.947998046875, 11.47998046875, 12.011962890625, 12.5439453125, 13.075927734375, 13.60791015625, 14.139892578125, 14.671875]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 5.0, 14.0, 16.0, 22.0, 33.0, 40.0, 68.0, 98.0, 153.0, 246.0, 383.0, 497.0, 715.0, 1075.0, 1577.0, 2392.0, 3434.0, 5229.0, 8080.0, 12744.0, 20119.0, 32511.0, 54576.0, 95883.0, 177710.0, 1297028.0, 162030.0, 86696.0, 50471.0, 30145.0, 18678.0, 11796.0, 7645.0, 4923.0, 3244.0, 2219.0, 1417.0, 1016.0, 701.0, 515.0, 334.0, 210.0, 151.0, 101.0, 70.0, 44.0, 25.0, 22.0, 16.0, 8.0, 5.0, 2.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0], "bins": [-1.083984375, -1.0494842529296875, -1.014984130859375, -0.9804840087890625, -0.94598388671875, -0.9114837646484375, -0.876983642578125, -0.8424835205078125, -0.8079833984375, -0.7734832763671875, -0.738983154296875, -0.7044830322265625, -0.66998291015625, -0.6354827880859375, -0.600982666015625, -0.5664825439453125, -0.531982421875, -0.4974822998046875, -0.462982177734375, -0.4284820556640625, -0.39398193359375, -0.3594818115234375, -0.324981689453125, -0.2904815673828125, -0.2559814453125, -0.2214813232421875, -0.186981201171875, -0.1524810791015625, -0.11798095703125, -0.0834808349609375, -0.048980712890625, -0.0144805908203125, 0.02001953125, 0.0545196533203125, 0.089019775390625, 0.1235198974609375, 0.15802001953125, 0.1925201416015625, 0.227020263671875, 0.2615203857421875, 0.2960205078125, 0.3305206298828125, 0.365020751953125, 0.3995208740234375, 0.43402099609375, 0.4685211181640625, 0.503021240234375, 0.5375213623046875, 0.572021484375, 0.6065216064453125, 0.641021728515625, 0.6755218505859375, 0.71002197265625, 0.7445220947265625, 0.779022216796875, 0.8135223388671875, 0.8480224609375, 0.8825225830078125, 0.917022705078125, 0.9515228271484375, 0.98602294921875, 1.0205230712890625, 1.055023193359375, 1.0895233154296875, 1.1240234375]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 5.0, 3.0, 2.0, 7.0, 5.0, 8.0, 8.0, 9.0, 19.0, 24.0, 25.0, 29.0, 37.0, 46.0, 44.0, 52.0, 61.0, 48.0, 56.0, 63.0, 49.0, 73.0, 57.0, 49.0, 48.0, 27.0, 24.0, 19.0, 18.0, 20.0, 15.0, 7.0, 14.0, 7.0, 3.0, 8.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00559234619140625, -0.00543135404586792, -0.00527036190032959, -0.00510936975479126, -0.00494837760925293, -0.0047873854637146, -0.0046263933181762695, -0.0044654011726379395, -0.004304409027099609, -0.004143416881561279, -0.003982424736022949, -0.003821432590484619, -0.003660440444946289, -0.003499448299407959, -0.003338456153869629, -0.003177464008331299, -0.0030164718627929688, -0.0028554797172546387, -0.0026944875717163086, -0.0025334954261779785, -0.0023725032806396484, -0.0022115111351013184, -0.0020505189895629883, -0.0018895268440246582, -0.0017285346984863281, -0.001567542552947998, -0.001406550407409668, -0.0012455582618713379, -0.0010845661163330078, -0.0009235739707946777, -0.0007625818252563477, -0.0006015896797180176, -0.0004405975341796875, -0.0002796053886413574, -0.00011861324310302734, 4.2378902435302734e-05, 0.0002033710479736328, 0.0003643631935119629, 0.000525355339050293, 0.000686347484588623, 0.0008473396301269531, 0.0010083317756652832, 0.0011693239212036133, 0.0013303160667419434, 0.0014913082122802734, 0.0016523003578186035, 0.0018132925033569336, 0.0019742846488952637, 0.0021352767944335938, 0.002296268939971924, 0.002457261085510254, 0.002618253231048584, 0.002779245376586914, 0.002940237522125244, 0.0031012296676635742, 0.0032622218132019043, 0.0034232139587402344, 0.0035842061042785645, 0.0037451982498168945, 0.0039061903953552246, 0.004067182540893555, 0.004228174686431885, 0.004389166831970215, 0.004550158977508545, 0.004711151123046875]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 5.0, 6.0, 14.0, 8.0, 15.0, 18.0, 13.0, 25.0, 32.0, 47.0, 67.0, 92.0, 144.0, 253.0, 565.0, 15519.0, 1010788.0, 19626.0, 588.0, 252.0, 150.0, 76.0, 68.0, 41.0, 25.0, 36.0, 18.0, 10.0, 13.0, 9.0, 2.0, 5.0, 5.0, 7.0, 3.0, 3.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1038818359375, -0.10036277770996094, -0.09684371948242188, -0.09332466125488281, -0.08980560302734375, -0.08628654479980469, -0.08276748657226562, -0.07924842834472656, -0.0757293701171875, -0.07221031188964844, -0.06869125366210938, -0.06517219543457031, -0.06165313720703125, -0.05813407897949219, -0.054615020751953125, -0.05109596252441406, -0.047576904296875, -0.04405784606933594, -0.040538787841796875, -0.03701972961425781, -0.03350067138671875, -0.029981613159179688, -0.026462554931640625, -0.022943496704101562, -0.0194244384765625, -0.015905380249023438, -0.012386322021484375, -0.008867263793945312, -0.00534820556640625, -0.0018291473388671875, 0.001689910888671875, 0.0052089691162109375, 0.00872802734375, 0.012247085571289062, 0.015766143798828125, 0.019285202026367188, 0.02280426025390625, 0.026323318481445312, 0.029842376708984375, 0.03336143493652344, 0.0368804931640625, 0.04039955139160156, 0.043918609619140625, 0.04743766784667969, 0.05095672607421875, 0.05447578430175781, 0.057994842529296875, 0.06151390075683594, 0.065032958984375, 0.06855201721191406, 0.07207107543945312, 0.07559013366699219, 0.07910919189453125, 0.08262825012207031, 0.08614730834960938, 0.08966636657714844, 0.0931854248046875, 0.09670448303222656, 0.10022354125976562, 0.10374259948730469, 0.10726165771484375, 0.11078071594238281, 0.11429977416992188, 0.11781883239746094, 0.121337890625]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 15.0, 202.0, 601.0, 166.0, 24.0, 5.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00406833877786994, -0.0033215638250112534, -0.0025747891049832106, -0.0018280143849551678, -0.0010812394320964813, -0.0003344644792377949, 0.00041231000795960426, 0.0011590849608182907, 0.0019058599136769772, 0.0026526348665356636, 0.0033994095865637064, 0.004146184306591749, 0.004892959259450436, 0.005639734212309122, 0.006386508699506521, 0.007133283652365208, 0.007880058139562607, 0.008626832626760006, 0.00937360804527998, 0.010120382532477379, 0.010867157950997353, 0.011613932438194752, 0.012360706925392151, 0.013107482343912125, 0.013854257762432098, 0.014601032249629498, 0.015347807668149471, 0.01609458215534687, 0.016841357573866844, 0.01758813112974167, 0.018334906548261642, 0.019081681966781616, 0.01982845738530159, 0.020575232803821564, 0.021322006359696388, 0.022068781778216362, 0.022815557196736336, 0.02356233075261116, 0.024309106171131134, 0.025055881589651108, 0.02580265700817108, 0.026549432426691055, 0.02729620598256588, 0.028042981401085854, 0.028789756819605827, 0.029536530375480652, 0.030283305794000626, 0.0310300812125206, 0.031776852905750275, 0.03252362832427025, 0.03327040374279022, 0.0340171754360199, 0.03476395085453987, 0.035510726273059845, 0.03625750169157982, 0.03700427711009979, 0.037751052528619766, 0.03849782794713974, 0.039244603365659714, 0.03999137878417969, 0.04073815047740936, 0.04148492589592934, 0.04223170131444931, 0.042978476732969284, 0.04372525215148926]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 11.0, 6.0, 13.0, 9.0, 15.0, 17.0, 22.0, 24.0, 27.0, 21.0, 29.0, 35.0, 26.0, 25.0, 33.0, 31.0, 57.0, 44.0, 35.0, 44.0, 44.0, 43.0, 47.0, 42.0, 37.0, 27.0, 30.0, 19.0, 30.0, 17.0, 18.0, 17.0, 24.0, 11.0, 14.0, 11.0, 10.0, 3.0, 6.0, 7.0, 4.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.002600252628326416, -0.0025182142853736877, -0.0024361759424209595, -0.002354137599468231, -0.002272099256515503, -0.0021900609135627747, -0.0021080225706100464, -0.002025984227657318, -0.0019439458847045898, -0.0018619075417518616, -0.0017798691987991333, -0.001697830855846405, -0.0016157925128936768, -0.0015337541699409485, -0.0014517158269882202, -0.001369677484035492, -0.0012876391410827637, -0.0012056007981300354, -0.0011235624551773071, -0.0010415241122245789, -0.0009594857692718506, -0.0008774474263191223, -0.000795409083366394, -0.0007133707404136658, -0.0006313323974609375, -0.0005492940545082092, -0.00046725571155548096, -0.0003852173686027527, -0.0003031790256500244, -0.00022114068269729614, -0.00013910233974456787, -5.70639967918396e-05, 2.4974346160888672e-05, 0.00010701268911361694, 0.00018905103206634521, 0.0002710893750190735, 0.00035312771797180176, 0.00043516606092453003, 0.0005172044038772583, 0.0005992427468299866, 0.0006812810897827148, 0.0007633194327354431, 0.0008453577756881714, 0.0009273961186408997, 0.001009434461593628, 0.0010914728045463562, 0.0011735111474990845, 0.0012555494904518127, 0.001337587833404541, 0.0014196261763572693, 0.0015016645193099976, 0.0015837028622627258, 0.001665741205215454, 0.0017477795481681824, 0.0018298178911209106, 0.001911856234073639, 0.001993894577026367, 0.0020759329199790955, 0.0021579712629318237, 0.002240009605884552, 0.0023220479488372803, 0.0024040862917900085, 0.002486124634742737, 0.002568162977695465, 0.0026502013206481934]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 8.0, 10.0, 7.0, 7.0, 16.0, 14.0, 20.0, 23.0, 20.0, 21.0, 41.0, 29.0, 30.0, 33.0, 34.0, 52.0, 48.0, 43.0, 65.0, 56.0, 45.0, 41.0, 44.0, 40.0, 35.0, 42.0, 35.0, 18.0, 33.0, 18.0, 19.0, 13.0, 8.0, 8.0, 6.0, 6.0, 5.0, 3.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.21875, -23.36865234375, -22.5185546875, -21.66845703125, -20.818359375, -19.96826171875, -19.1181640625, -18.26806640625, -17.41796875, -16.56787109375, -15.7177734375, -14.86767578125, -14.017578125, -13.16748046875, -12.3173828125, -11.46728515625, -10.6171875, -9.76708984375, -8.9169921875, -8.06689453125, -7.216796875, -6.36669921875, -5.5166015625, -4.66650390625, -3.81640625, -2.96630859375, -2.1162109375, -1.26611328125, -0.416015625, 0.43408203125, 1.2841796875, 2.13427734375, 2.984375, 3.83447265625, 4.6845703125, 5.53466796875, 6.384765625, 7.23486328125, 8.0849609375, 8.93505859375, 9.78515625, 10.63525390625, 11.4853515625, 12.33544921875, 13.185546875, 14.03564453125, 14.8857421875, 15.73583984375, 16.5859375, 17.43603515625, 18.2861328125, 19.13623046875, 19.986328125, 20.83642578125, 21.6865234375, 22.53662109375, 23.38671875, 24.23681640625, 25.0869140625, 25.93701171875, 26.787109375, 27.63720703125, 28.4873046875, 29.33740234375, 30.1875]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 8.0, 5.0, 9.0, 10.0, 22.0, 39.0, 42.0, 67.0, 94.0, 129.0, 192.0, 318.0, 464.0, 748.0, 1124.0, 1955.0, 3517.0, 7279.0, 27914.0, 456038.0, 503001.0, 29210.0, 7501.0, 3491.0, 2034.0, 1174.0, 755.0, 454.0, 298.0, 242.0, 133.0, 86.0, 63.0, 36.0, 35.0, 20.0, 12.0, 13.0, 3.0, 6.0, 4.0, 4.0, 6.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.375, -38.14501953125, -36.9150390625, -35.68505859375, -34.455078125, -33.22509765625, -31.9951171875, -30.76513671875, -29.53515625, -28.30517578125, -27.0751953125, -25.84521484375, -24.615234375, -23.38525390625, -22.1552734375, -20.92529296875, -19.6953125, -18.46533203125, -17.2353515625, -16.00537109375, -14.775390625, -13.54541015625, -12.3154296875, -11.08544921875, -9.85546875, -8.62548828125, -7.3955078125, -6.16552734375, -4.935546875, -3.70556640625, -2.4755859375, -1.24560546875, -0.015625, 1.21435546875, 2.4443359375, 3.67431640625, 4.904296875, 6.13427734375, 7.3642578125, 8.59423828125, 9.82421875, 11.05419921875, 12.2841796875, 13.51416015625, 14.744140625, 15.97412109375, 17.2041015625, 18.43408203125, 19.6640625, 20.89404296875, 22.1240234375, 23.35400390625, 24.583984375, 25.81396484375, 27.0439453125, 28.27392578125, 29.50390625, 30.73388671875, 31.9638671875, 33.19384765625, 34.423828125, 35.65380859375, 36.8837890625, 38.11376953125, 39.34375]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 8.0, 6.0, 10.0, 6.0, 8.0, 13.0, 18.0, 20.0, 32.0, 36.0, 30.0, 30.0, 46.0, 51.0, 51.0, 77.0, 91.0, 1796.0, 215.0, 66.0, 72.0, 60.0, 33.0, 44.0, 40.0, 26.0, 28.0, 25.0, 20.0, 20.0, 9.0, 11.0, 16.0, 8.0, 7.0, 6.0, 6.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-89.125, -86.318359375, -83.51171875, -80.705078125, -77.8984375, -75.091796875, -72.28515625, -69.478515625, -66.671875, -63.865234375, -61.05859375, -58.251953125, -55.4453125, -52.638671875, -49.83203125, -47.025390625, -44.21875, -41.412109375, -38.60546875, -35.798828125, -32.9921875, -30.185546875, -27.37890625, -24.572265625, -21.765625, -18.958984375, -16.15234375, -13.345703125, -10.5390625, -7.732421875, -4.92578125, -2.119140625, 0.6875, 3.494140625, 6.30078125, 9.107421875, 11.9140625, 14.720703125, 17.52734375, 20.333984375, 23.140625, 25.947265625, 28.75390625, 31.560546875, 34.3671875, 37.173828125, 39.98046875, 42.787109375, 45.59375, 48.400390625, 51.20703125, 54.013671875, 56.8203125, 59.626953125, 62.43359375, 65.240234375, 68.046875, 70.853515625, 73.66015625, 76.466796875, 79.2734375, 82.080078125, 84.88671875, 87.693359375, 90.5]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 1.0, 2.0, 5.0, 9.0, 6.0, 8.0, 11.0, 13.0, 24.0, 36.0, 38.0, 43.0, 61.0, 88.0, 128.0, 167.0, 263.0, 454.0, 1994.0, 113710.0, 3022741.0, 4343.0, 582.0, 281.0, 179.0, 141.0, 101.0, 75.0, 56.0, 30.0, 28.0, 28.0, 10.0, 13.0, 7.0, 6.0, 6.0, 4.0, 5.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0], "bins": [-290.75, -283.322265625, -275.89453125, -268.466796875, -261.0390625, -253.611328125, -246.18359375, -238.755859375, -231.328125, -223.900390625, -216.47265625, -209.044921875, -201.6171875, -194.189453125, -186.76171875, -179.333984375, -171.90625, -164.478515625, -157.05078125, -149.623046875, -142.1953125, -134.767578125, -127.33984375, -119.912109375, -112.484375, -105.056640625, -97.62890625, -90.201171875, -82.7734375, -75.345703125, -67.91796875, -60.490234375, -53.0625, -45.634765625, -38.20703125, -30.779296875, -23.3515625, -15.923828125, -8.49609375, -1.068359375, 6.359375, 13.787109375, 21.21484375, 28.642578125, 36.0703125, 43.498046875, 50.92578125, 58.353515625, 65.78125, 73.208984375, 80.63671875, 88.064453125, 95.4921875, 102.919921875, 110.34765625, 117.775390625, 125.203125, 132.630859375, 140.05859375, 147.486328125, 154.9140625, 162.341796875, 169.76953125, 177.197265625, 184.625]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 10.0, 26.0, 47.0, 90.0, 194.0, 232.0, 208.0, 115.0, 59.0, 19.0, 7.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-191.43386840820312, -187.41830444335938, -183.40272521972656, -179.3871612548828, -175.37159729003906, -171.35601806640625, -167.3404541015625, -163.32489013671875, -159.309326171875, -155.29376220703125, -151.27818298339844, -147.2626190185547, -143.24705505371094, -139.23147583007812, -135.21591186523438, -131.20034790039062, -127.18476867675781, -123.16919708251953, -119.15363311767578, -115.1380615234375, -111.12249755859375, -107.10692596435547, -103.09135437011719, -99.07579040527344, -95.06021881103516, -91.04464721679688, -87.02908325195312, -83.01351165771484, -78.99794006347656, -74.98237609863281, -70.96680450439453, -66.95123291015625, -62.93565368652344, -58.92008590698242, -54.904518127441406, -50.888946533203125, -46.87337875366211, -42.857810974121094, -38.84223937988281, -34.8266716003418, -30.81110382080078, -26.795536041259766, -22.779966354370117, -18.76439666748047, -14.748828887939453, -10.733261108398438, -6.717691421508789, -2.7021217346191406, 1.313446044921875, 5.329014778137207, 9.344583511352539, 13.360152244567871, 17.375720977783203, 21.39128875732422, 25.406858444213867, 29.422428131103516, 33.43799591064453, 37.45356369018555, 41.46913146972656, 45.484703063964844, 49.50027084350586, 53.515838623046875, 57.531410217285156, 61.54697799682617, 65.56254577636719]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 5.0, 6.0, 3.0, 2.0, 4.0, 6.0, 9.0, 14.0, 5.0, 18.0, 13.0, 12.0, 12.0, 23.0, 17.0, 16.0, 16.0, 31.0, 31.0, 32.0, 34.0, 31.0, 40.0, 30.0, 37.0, 38.0, 34.0, 35.0, 39.0, 46.0, 35.0, 26.0, 38.0, 29.0, 29.0, 30.0, 31.0, 24.0, 23.0, 23.0, 12.0, 12.0, 12.0, 10.0, 6.0, 9.0, 5.0, 6.0, 3.0, 3.0, 5.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-173.79222106933594, -168.29708862304688, -162.80194091796875, -157.3068084716797, -151.81167602539062, -146.31654357910156, -140.8214111328125, -135.32626342773438, -129.8311309814453, -124.33599853515625, -118.84085845947266, -113.34571838378906, -107.8505859375, -102.35545349121094, -96.86031341552734, -91.36517333984375, -85.87004089355469, -80.37490844726562, -74.87976837158203, -69.38462829589844, -63.889495849609375, -58.39435958862305, -52.89922332763672, -47.40408706665039, -41.90895080566406, -36.413814544677734, -30.918678283691406, -25.423542022705078, -19.92840576171875, -14.433269500732422, -8.938133239746094, -3.4429969787597656, 2.0521240234375, 7.547260284423828, 13.042396545410156, 18.537532806396484, 24.032669067382812, 29.52780532836914, 35.02294158935547, 40.5180778503418, 46.013214111328125, 51.50835037231445, 57.00348663330078, 62.49862289428711, 67.99375915527344, 73.4888916015625, 78.9840316772461, 84.47917175292969, 89.97430419921875, 95.46943664550781, 100.9645767211914, 106.459716796875, 111.95484924316406, 117.44998168945312, 122.94512176513672, 128.4402618408203, 133.93539428710938, 139.43052673339844, 144.9256591796875, 150.42080688476562, 155.9159393310547, 161.41107177734375, 166.90621948242188, 172.40135192871094, 177.896484375]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 5.0, 6.0, 8.0, 13.0, 12.0, 18.0, 12.0, 22.0, 23.0, 19.0, 30.0, 33.0, 38.0, 43.0, 37.0, 40.0, 55.0, 54.0, 66.0, 55.0, 48.0, 44.0, 36.0, 49.0, 44.0, 33.0, 28.0, 31.0, 24.0, 15.0, 17.0, 13.0, 12.0, 5.0, 3.0, 3.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.46875, -25.53662109375, -24.6044921875, -23.67236328125, -22.740234375, -21.80810546875, -20.8759765625, -19.94384765625, -19.01171875, -18.07958984375, -17.1474609375, -16.21533203125, -15.283203125, -14.35107421875, -13.4189453125, -12.48681640625, -11.5546875, -10.62255859375, -9.6904296875, -8.75830078125, -7.826171875, -6.89404296875, -5.9619140625, -5.02978515625, -4.09765625, -3.16552734375, -2.2333984375, -1.30126953125, -0.369140625, 0.56298828125, 1.4951171875, 2.42724609375, 3.359375, 4.29150390625, 5.2236328125, 6.15576171875, 7.087890625, 8.02001953125, 8.9521484375, 9.88427734375, 10.81640625, 11.74853515625, 12.6806640625, 13.61279296875, 14.544921875, 15.47705078125, 16.4091796875, 17.34130859375, 18.2734375, 19.20556640625, 20.1376953125, 21.06982421875, 22.001953125, 22.93408203125, 23.8662109375, 24.79833984375, 25.73046875, 26.66259765625, 27.5947265625, 28.52685546875, 29.458984375, 30.39111328125, 31.3232421875, 32.25537109375, 33.1875]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 5.0, 3.0, 1.0, 3.0, 9.0, 11.0, 11.0, 12.0, 27.0, 25.0, 38.0, 32.0, 84.0, 121.0, 151.0, 180.0, 285.0, 540.0, 755.0, 1392.0, 2533.0, 5353.0, 12125.0, 44598.0, 959723.0, 2992231.0, 141810.0, 17173.0, 6999.0, 3420.0, 1791.0, 1017.0, 581.0, 397.0, 267.0, 164.0, 102.0, 78.0, 67.0, 37.0, 27.0, 26.0, 29.0, 14.0, 17.0, 8.0, 3.0, 6.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-59.71875, -57.60205078125, -55.4853515625, -53.36865234375, -51.251953125, -49.13525390625, -47.0185546875, -44.90185546875, -42.78515625, -40.66845703125, -38.5517578125, -36.43505859375, -34.318359375, -32.20166015625, -30.0849609375, -27.96826171875, -25.8515625, -23.73486328125, -21.6181640625, -19.50146484375, -17.384765625, -15.26806640625, -13.1513671875, -11.03466796875, -8.91796875, -6.80126953125, -4.6845703125, -2.56787109375, -0.451171875, 1.66552734375, 3.7822265625, 5.89892578125, 8.015625, 10.13232421875, 12.2490234375, 14.36572265625, 16.482421875, 18.59912109375, 20.7158203125, 22.83251953125, 24.94921875, 27.06591796875, 29.1826171875, 31.29931640625, 33.416015625, 35.53271484375, 37.6494140625, 39.76611328125, 41.8828125, 43.99951171875, 46.1162109375, 48.23291015625, 50.349609375, 52.46630859375, 54.5830078125, 56.69970703125, 58.81640625, 60.93310546875, 63.0498046875, 65.16650390625, 67.283203125, 69.39990234375, 71.5166015625, 73.63330078125, 75.75]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 6.0, 6.0, 9.0, 10.0, 8.0, 13.0, 19.0, 31.0, 48.0, 72.0, 127.0, 265.0, 587.0, 1120.0, 853.0, 434.0, 187.0, 78.0, 58.0, 43.0, 26.0, 21.0, 14.0, 8.0, 7.0, 7.0, 9.0, 3.0, 1.0, 6.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.59375, -53.51611328125, -51.4384765625, -49.36083984375, -47.283203125, -45.20556640625, -43.1279296875, -41.05029296875, -38.97265625, -36.89501953125, -34.8173828125, -32.73974609375, -30.662109375, -28.58447265625, -26.5068359375, -24.42919921875, -22.3515625, -20.27392578125, -18.1962890625, -16.11865234375, -14.041015625, -11.96337890625, -9.8857421875, -7.80810546875, -5.73046875, -3.65283203125, -1.5751953125, 0.50244140625, 2.580078125, 4.65771484375, 6.7353515625, 8.81298828125, 10.890625, 12.96826171875, 15.0458984375, 17.12353515625, 19.201171875, 21.27880859375, 23.3564453125, 25.43408203125, 27.51171875, 29.58935546875, 31.6669921875, 33.74462890625, 35.822265625, 37.89990234375, 39.9775390625, 42.05517578125, 44.1328125, 46.21044921875, 48.2880859375, 50.36572265625, 52.443359375, 54.52099609375, 56.5986328125, 58.67626953125, 60.75390625, 62.83154296875, 64.9091796875, 66.98681640625, 69.064453125, 71.14208984375, 73.2197265625, 75.29736328125, 77.375]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 7.0, 11.0, 10.0, 11.0, 17.0, 26.0, 43.0, 81.0, 132.0, 249.0, 738.0, 2732.0, 15443.0, 807929.0, 3340128.0, 21820.0, 3375.0, 867.0, 318.0, 136.0, 76.0, 50.0, 21.0, 13.0, 14.0, 11.0, 11.0, 6.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-236.5, -230.12109375, -223.7421875, -217.36328125, -210.984375, -204.60546875, -198.2265625, -191.84765625, -185.46875, -179.08984375, -172.7109375, -166.33203125, -159.953125, -153.57421875, -147.1953125, -140.81640625, -134.4375, -128.05859375, -121.6796875, -115.30078125, -108.921875, -102.54296875, -96.1640625, -89.78515625, -83.40625, -77.02734375, -70.6484375, -64.26953125, -57.890625, -51.51171875, -45.1328125, -38.75390625, -32.375, -25.99609375, -19.6171875, -13.23828125, -6.859375, -0.48046875, 5.8984375, 12.27734375, 18.65625, 25.03515625, 31.4140625, 37.79296875, 44.171875, 50.55078125, 56.9296875, 63.30859375, 69.6875, 76.06640625, 82.4453125, 88.82421875, 95.203125, 101.58203125, 107.9609375, 114.33984375, 120.71875, 127.09765625, 133.4765625, 139.85546875, 146.234375, 152.61328125, 158.9921875, 165.37109375, 171.75]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 3.0, 4.0, 10.0, 9.0, 5.0, 13.0, 9.0, 17.0, 19.0, 42.0, 34.0, 46.0, 87.0, 79.0, 106.0, 95.0, 86.0, 64.0, 59.0, 44.0, 38.0, 33.0, 16.0, 13.0, 17.0, 12.0, 8.0, 5.0, 8.0, 7.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-117.79104614257812, -113.89295959472656, -109.994873046875, -106.09678649902344, -102.19869995117188, -98.30061340332031, -94.40252685546875, -90.50444030761719, -86.60635375976562, -82.70826721191406, -78.8101806640625, -74.91209411621094, -71.01400756835938, -67.11592102050781, -63.21783447265625, -59.31974792480469, -55.42166519165039, -51.52357864379883, -47.625492095947266, -43.7274055480957, -39.82931900024414, -35.931236267089844, -32.03314971923828, -28.135061264038086, -24.236974716186523, -20.33888816833496, -16.4408016204834, -12.542716026306152, -8.64462947845459, -4.746543884277344, -0.8484573364257812, 3.0496292114257812, 6.947715759277344, 10.845802307128906, 14.743888854980469, 18.64197540283203, 22.540061950683594, 26.438146591186523, 30.336233139038086, 34.23432159423828, 38.132408142089844, 42.030494689941406, 45.92858123779297, 49.82666778564453, 53.724754333496094, 57.622840881347656, 61.52092742919922, 65.41901397705078, 69.31709289550781, 73.21517944335938, 77.11326599121094, 81.0113525390625, 84.90943908691406, 88.80752563476562, 92.70561218261719, 96.60369873046875, 100.50178527832031, 104.39987182617188, 108.29795837402344, 112.196044921875, 116.09413146972656, 119.99221801757812, 123.89030456542969, 127.78839111328125, 131.6864776611328]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 2.0, 7.0, 8.0, 4.0, 1.0, 8.0, 4.0, 12.0, 17.0, 12.0, 13.0, 21.0, 18.0, 19.0, 22.0, 21.0, 29.0, 26.0, 34.0, 37.0, 27.0, 36.0, 34.0, 31.0, 32.0, 40.0, 33.0, 26.0, 30.0, 31.0, 50.0, 31.0, 31.0, 26.0, 25.0, 18.0, 18.0, 19.0, 23.0, 28.0, 24.0, 18.0, 10.0, 6.0, 11.0, 9.0, 9.0, 7.0, 4.0, 3.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-109.8528823852539, -106.22437286376953, -102.59586334228516, -98.96735382080078, -95.3388442993164, -91.71033477783203, -88.08183288574219, -84.45332336425781, -80.82481384277344, -77.19630432128906, -73.56779479980469, -69.93928527832031, -66.31077575683594, -62.68226623535156, -59.05376052856445, -55.42525100708008, -51.79673767089844, -48.16822814941406, -44.53971862792969, -40.91120910644531, -37.28269958496094, -33.65419006347656, -30.025684356689453, -26.397174835205078, -22.768665313720703, -19.140155792236328, -15.51164722442627, -11.883138656616211, -8.254629135131836, -4.626119613647461, -0.9976119995117188, 2.6308975219726562, 6.2594146728515625, 9.887924194335938, 13.516432762145996, 17.144941329956055, 20.77345085144043, 24.401960372924805, 28.030467987060547, 31.658977508544922, 35.2874870300293, 38.91599655151367, 42.54450607299805, 46.173011779785156, 49.80152130126953, 53.430030822753906, 57.05854034423828, 60.687049865722656, 64.31555938720703, 67.9440689086914, 71.57257843017578, 75.20108795166016, 78.82959747314453, 82.4581069946289, 86.08660888671875, 89.71511840820312, 93.3436279296875, 96.97213745117188, 100.60064697265625, 104.22915649414062, 107.857666015625, 111.48617553710938, 115.11468505859375, 118.74319458007812, 122.3717041015625]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 4.0, 6.0, 4.0, 12.0, 9.0, 13.0, 11.0, 15.0, 20.0, 21.0, 21.0, 24.0, 28.0, 27.0, 30.0, 30.0, 37.0, 46.0, 42.0, 49.0, 44.0, 49.0, 53.0, 45.0, 48.0, 36.0, 43.0, 35.0, 22.0, 33.0, 29.0, 21.0, 22.0, 12.0, 11.0, 8.0, 12.0, 4.0, 7.0, 7.0, 4.0, 4.0, 6.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.40625, -21.6298828125, -20.853515625, -20.0771484375, -19.30078125, -18.5244140625, -17.748046875, -16.9716796875, -16.1953125, -15.4189453125, -14.642578125, -13.8662109375, -13.08984375, -12.3134765625, -11.537109375, -10.7607421875, -9.984375, -9.2080078125, -8.431640625, -7.6552734375, -6.87890625, -6.1025390625, -5.326171875, -4.5498046875, -3.7734375, -2.9970703125, -2.220703125, -1.4443359375, -0.66796875, 0.1083984375, 0.884765625, 1.6611328125, 2.4375, 3.2138671875, 3.990234375, 4.7666015625, 5.54296875, 6.3193359375, 7.095703125, 7.8720703125, 8.6484375, 9.4248046875, 10.201171875, 10.9775390625, 11.75390625, 12.5302734375, 13.306640625, 14.0830078125, 14.859375, 15.6357421875, 16.412109375, 17.1884765625, 17.96484375, 18.7412109375, 19.517578125, 20.2939453125, 21.0703125, 21.8466796875, 22.623046875, 23.3994140625, 24.17578125, 24.9521484375, 25.728515625, 26.5048828125, 27.28125]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 4.0, 7.0, 10.0, 21.0, 27.0, 36.0, 69.0, 93.0, 137.0, 216.0, 327.0, 423.0, 685.0, 1095.0, 1614.0, 2463.0, 3920.0, 6189.0, 9925.0, 16158.0, 27052.0, 46040.0, 82163.0, 154382.0, 254706.0, 195557.0, 103829.0, 57121.0, 32507.0, 19286.0, 11733.0, 7326.0, 4729.0, 2961.0, 1947.0, 1285.0, 877.0, 557.0, 361.0, 257.0, 150.0, 103.0, 79.0, 49.0, 23.0, 24.0, 14.0, 10.0, 4.0, 5.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1416015625, -1.104400634765625, -1.06719970703125, -1.029998779296875, -0.9927978515625, -0.955596923828125, -0.91839599609375, -0.881195068359375, -0.843994140625, -0.806793212890625, -0.76959228515625, -0.732391357421875, -0.6951904296875, -0.657989501953125, -0.62078857421875, -0.583587646484375, -0.54638671875, -0.509185791015625, -0.47198486328125, -0.434783935546875, -0.3975830078125, -0.360382080078125, -0.32318115234375, -0.285980224609375, -0.248779296875, -0.211578369140625, -0.17437744140625, -0.137176513671875, -0.0999755859375, -0.062774658203125, -0.02557373046875, 0.011627197265625, 0.048828125, 0.086029052734375, 0.12322998046875, 0.160430908203125, 0.1976318359375, 0.234832763671875, 0.27203369140625, 0.309234619140625, 0.346435546875, 0.383636474609375, 0.42083740234375, 0.458038330078125, 0.4952392578125, 0.532440185546875, 0.56964111328125, 0.606842041015625, 0.64404296875, 0.681243896484375, 0.71844482421875, 0.755645751953125, 0.7928466796875, 0.830047607421875, 0.86724853515625, 0.904449462890625, 0.941650390625, 0.978851318359375, 1.01605224609375, 1.053253173828125, 1.0904541015625, 1.127655029296875, 1.16485595703125, 1.202056884765625, 1.2392578125]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 6.0, 11.0, 8.0, 8.0, 13.0, 23.0, 18.0, 15.0, 23.0, 18.0, 28.0, 26.0, 33.0, 31.0, 36.0, 34.0, 42.0, 48.0, 46.0, 1064.0, 37.0, 37.0, 36.0, 38.0, 40.0, 38.0, 33.0, 33.0, 30.0, 25.0, 23.0, 16.0, 17.0, 17.0, 17.0, 11.0, 6.0, 8.0, 3.0, 3.0, 7.0, 6.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.78125, -14.322265625, -13.86328125, -13.404296875, -12.9453125, -12.486328125, -12.02734375, -11.568359375, -11.109375, -10.650390625, -10.19140625, -9.732421875, -9.2734375, -8.814453125, -8.35546875, -7.896484375, -7.4375, -6.978515625, -6.51953125, -6.060546875, -5.6015625, -5.142578125, -4.68359375, -4.224609375, -3.765625, -3.306640625, -2.84765625, -2.388671875, -1.9296875, -1.470703125, -1.01171875, -0.552734375, -0.09375, 0.365234375, 0.82421875, 1.283203125, 1.7421875, 2.201171875, 2.66015625, 3.119140625, 3.578125, 4.037109375, 4.49609375, 4.955078125, 5.4140625, 5.873046875, 6.33203125, 6.791015625, 7.25, 7.708984375, 8.16796875, 8.626953125, 9.0859375, 9.544921875, 10.00390625, 10.462890625, 10.921875, 11.380859375, 11.83984375, 12.298828125, 12.7578125, 13.216796875, 13.67578125, 14.134765625, 14.59375]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 6.0, 15.0, 10.0, 23.0, 28.0, 48.0, 91.0, 94.0, 116.0, 139.0, 244.0, 354.0, 486.0, 646.0, 912.0, 1205.0, 1756.0, 2516.0, 3603.0, 5046.0, 7123.0, 10030.0, 14713.0, 21393.0, 32197.0, 49692.0, 80094.0, 134422.0, 1254787.0, 177852.0, 105967.0, 64289.0, 40538.0, 26905.0, 17950.0, 12380.0, 8708.0, 5916.0, 4365.0, 2999.0, 2123.0, 1513.0, 1097.0, 763.0, 557.0, 430.0, 285.0, 187.0, 175.0, 116.0, 73.0, 49.0, 41.0, 22.0, 13.0, 11.0, 10.0, 5.0, 6.0, 9.0], "bins": [-0.89501953125, -0.8677139282226562, -0.8404083251953125, -0.8131027221679688, -0.785797119140625, -0.7584915161132812, -0.7311859130859375, -0.7038803100585938, -0.67657470703125, -0.6492691040039062, -0.6219635009765625, -0.5946578979492188, -0.567352294921875, -0.5400466918945312, -0.5127410888671875, -0.48543548583984375, -0.4581298828125, -0.43082427978515625, -0.4035186767578125, -0.37621307373046875, -0.348907470703125, -0.32160186767578125, -0.2942962646484375, -0.26699066162109375, -0.23968505859375, -0.21237945556640625, -0.1850738525390625, -0.15776824951171875, -0.130462646484375, -0.10315704345703125, -0.0758514404296875, -0.04854583740234375, -0.021240234375, 0.00606536865234375, 0.0333709716796875, 0.06067657470703125, 0.087982177734375, 0.11528778076171875, 0.1425933837890625, 0.16989898681640625, 0.19720458984375, 0.22451019287109375, 0.2518157958984375, 0.27912139892578125, 0.306427001953125, 0.33373260498046875, 0.3610382080078125, 0.38834381103515625, 0.4156494140625, 0.44295501708984375, 0.4702606201171875, 0.49756622314453125, 0.524871826171875, 0.5521774291992188, 0.5794830322265625, 0.6067886352539062, 0.63409423828125, 0.6613998413085938, 0.6887054443359375, 0.7160110473632812, 0.743316650390625, 0.7706222534179688, 0.7979278564453125, 0.8252334594726562, 0.8525390625]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 1.0, 4.0, 1.0, 4.0, 5.0, 7.0, 12.0, 12.0, 11.0, 24.0, 13.0, 21.0, 33.0, 23.0, 34.0, 34.0, 30.0, 42.0, 53.0, 48.0, 46.0, 63.0, 49.0, 57.0, 35.0, 44.0, 35.0, 35.0, 28.0, 36.0, 33.0, 34.0, 15.0, 14.0, 12.0, 8.0, 10.0, 10.0, 5.0, 5.0, 6.0, 1.0, 5.0, 4.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004241943359375, -0.004106760025024414, -0.003971576690673828, -0.003836393356323242, -0.0037012100219726562, -0.0035660266876220703, -0.0034308433532714844, -0.0032956600189208984, -0.0031604766845703125, -0.0030252933502197266, -0.0028901100158691406, -0.0027549266815185547, -0.0026197433471679688, -0.002484560012817383, -0.002349376678466797, -0.002214193344116211, -0.002079010009765625, -0.001943826675415039, -0.0018086433410644531, -0.0016734600067138672, -0.0015382766723632812, -0.0014030933380126953, -0.0012679100036621094, -0.0011327266693115234, -0.0009975433349609375, -0.0008623600006103516, -0.0007271766662597656, -0.0005919933319091797, -0.00045680999755859375, -0.0003216266632080078, -0.00018644332885742188, -5.125999450683594e-05, 8.392333984375e-05, 0.00021910667419433594, 0.0003542900085449219, 0.0004894733428955078, 0.0006246566772460938, 0.0007598400115966797, 0.0008950233459472656, 0.0010302066802978516, 0.0011653900146484375, 0.0013005733489990234, 0.0014357566833496094, 0.0015709400177001953, 0.0017061233520507812, 0.0018413066864013672, 0.001976490020751953, 0.002111673355102539, 0.002246856689453125, 0.002382040023803711, 0.002517223358154297, 0.002652406692504883, 0.0027875900268554688, 0.0029227733612060547, 0.0030579566955566406, 0.0031931400299072266, 0.0033283233642578125, 0.0034635066986083984, 0.0035986900329589844, 0.0037338733673095703, 0.0038690567016601562, 0.004004240036010742, 0.004139423370361328, 0.004274606704711914, 0.0044097900390625]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 4.0, 3.0, 5.0, 5.0, 3.0, 7.0, 14.0, 11.0, 11.0, 13.0, 17.0, 29.0, 39.0, 46.0, 43.0, 64.0, 90.0, 110.0, 164.0, 336.0, 1209.0, 57666.0, 967072.0, 19913.0, 817.0, 280.0, 141.0, 106.0, 75.0, 51.0, 47.0, 37.0, 29.0, 21.0, 19.0, 17.0, 10.0, 12.0, 8.0, 4.0, 2.0, 5.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08831787109375, -0.08550453186035156, -0.08269119262695312, -0.07987785339355469, -0.07706451416015625, -0.07425117492675781, -0.07143783569335938, -0.06862449645996094, -0.0658111572265625, -0.06299781799316406, -0.060184478759765625, -0.05737113952636719, -0.05455780029296875, -0.05174446105957031, -0.048931121826171875, -0.04611778259277344, -0.043304443359375, -0.04049110412597656, -0.037677764892578125, -0.03486442565917969, -0.03205108642578125, -0.029237747192382812, -0.026424407958984375, -0.023611068725585938, -0.0207977294921875, -0.017984390258789062, -0.015171051025390625, -0.012357711791992188, -0.00954437255859375, -0.0067310333251953125, -0.003917694091796875, -0.0011043548583984375, 0.001708984375, 0.0045223236083984375, 0.007335662841796875, 0.010149002075195312, 0.01296234130859375, 0.015775680541992188, 0.018589019775390625, 0.021402359008789062, 0.0242156982421875, 0.027029037475585938, 0.029842376708984375, 0.03265571594238281, 0.03546905517578125, 0.03828239440917969, 0.041095733642578125, 0.04390907287597656, 0.046722412109375, 0.04953575134277344, 0.052349090576171875, 0.05516242980957031, 0.05797576904296875, 0.06078910827636719, 0.06360244750976562, 0.06641578674316406, 0.0692291259765625, 0.07204246520996094, 0.07485580444335938, 0.07766914367675781, 0.08048248291015625, 0.08329582214355469, 0.08610916137695312, 0.08892250061035156, 0.09173583984375]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 4.0, 10.0, 12.0, 18.0, 41.0, 68.0, 60.0, 121.0, 142.0, 162.0, 124.0, 99.0, 59.0, 29.0, 22.0, 11.0, 12.0, 6.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0022897045128047466, -0.0021149171516299248, -0.0019401300232857466, -0.0017653426621109247, -0.0015905554173514247, -0.0014157681725919247, -0.0012409808114171028, -0.0010661935666576028, -0.0008914063218981028, -0.0007166190771386027, -0.0005418317741714418, -0.00036704447120428085, -0.00019225722644478083, -1.74699816852808e-05, 0.00015731737948954105, 0.0003321046242490411, 0.0005068918690085411, 0.0006816791137680411, 0.0008564664167352021, 0.001031253719702363, 0.001206040964461863, 0.001380828209221363, 0.001555615570396185, 0.001730402815155685, 0.001905190059915185, 0.002079977421090007, 0.002254764549434185, 0.002429551910609007, 0.0026043392717838287, 0.002779126400128007, 0.002953913761302829, 0.003128700889647007, 0.003303488716483116, 0.003478276077657938, 0.003653063206002116, 0.003827850567176938, 0.004002637695521116, 0.004177425056695938, 0.00435221241787076, 0.004526999779045582, 0.004701786674559116, 0.004876574035733938, 0.00505136139690876, 0.005226148292422295, 0.0054009356535971165, 0.005575723014771938, 0.00575051037594676, 0.005925297737121582, 0.006100085098296404, 0.006274872459471226, 0.006449659820646048, 0.0066244471818208694, 0.006799234077334404, 0.006974021438509226, 0.007148808799684048, 0.0073235961608588696, 0.007498383522033691, 0.007673170883208513, 0.007847958244383335, 0.00802274513989687, 0.008197532966732979, 0.008372319862246513, 0.008547106757760048, 0.008721894584596157, 0.008896681480109692]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 3.0, 4.0, 7.0, 2.0, 11.0, 8.0, 15.0, 10.0, 13.0, 14.0, 28.0, 15.0, 32.0, 30.0, 40.0, 32.0, 31.0, 26.0, 36.0, 38.0, 44.0, 38.0, 41.0, 42.0, 36.0, 40.0, 40.0, 37.0, 26.0, 34.0, 22.0, 27.0, 28.0, 28.0, 25.0, 24.0, 15.0, 12.0, 16.0, 8.0, 6.0, 5.0, 6.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0025544166564941406, -0.0024745389819145203, -0.0023946613073349, -0.0023147836327552795, -0.002234905958175659, -0.002155028283596039, -0.0020751506090164185, -0.001995272934436798, -0.0019153952598571777, -0.0018355175852775574, -0.001755639910697937, -0.0016757622361183167, -0.0015958845615386963, -0.001516006886959076, -0.0014361292123794556, -0.0013562515377998352, -0.0012763738632202148, -0.0011964961886405945, -0.0011166185140609741, -0.0010367408394813538, -0.0009568631649017334, -0.000876985490322113, -0.0007971078157424927, -0.0007172301411628723, -0.000637352466583252, -0.0005574747920036316, -0.00047759711742401123, -0.00039771944284439087, -0.0003178417682647705, -0.00023796409368515015, -0.00015808641910552979, -7.820874452590942e-05, 1.6689300537109375e-06, 8.15466046333313e-05, 0.00016142427921295166, 0.00024130195379257202, 0.0003211796283721924, 0.00040105730295181274, 0.0004809349775314331, 0.0005608126521110535, 0.0006406903266906738, 0.0007205680012702942, 0.0008004456758499146, 0.0008803233504295349, 0.0009602010250091553, 0.0010400786995887756, 0.001119956374168396, 0.0011998340487480164, 0.0012797117233276367, 0.001359589397907257, 0.0014394670724868774, 0.0015193447470664978, 0.0015992224216461182, 0.0016791000962257385, 0.0017589777708053589, 0.0018388554453849792, 0.0019187331199645996, 0.00199861079454422, 0.0020784884691238403, 0.0021583661437034607, 0.002238243818283081, 0.0023181214928627014, 0.0023979991674423218, 0.002477876842021942, 0.0025577545166015625]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 4.0, 6.0, 4.0, 12.0, 9.0, 13.0, 11.0, 15.0, 20.0, 21.0, 21.0, 24.0, 28.0, 27.0, 30.0, 30.0, 37.0, 46.0, 42.0, 49.0, 44.0, 49.0, 53.0, 45.0, 48.0, 36.0, 43.0, 35.0, 22.0, 33.0, 29.0, 21.0, 22.0, 12.0, 11.0, 8.0, 12.0, 4.0, 7.0, 7.0, 4.0, 4.0, 6.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.40625, -21.6298828125, -20.853515625, -20.0771484375, -19.30078125, -18.5244140625, -17.748046875, -16.9716796875, -16.1953125, -15.4189453125, -14.642578125, -13.8662109375, -13.08984375, -12.3134765625, -11.537109375, -10.7607421875, -9.984375, -9.2080078125, -8.431640625, -7.6552734375, -6.87890625, -6.1025390625, -5.326171875, -4.5498046875, -3.7734375, -2.9970703125, -2.220703125, -1.4443359375, -0.66796875, 0.1083984375, 0.884765625, 1.6611328125, 2.4375, 3.2138671875, 3.990234375, 4.7666015625, 5.54296875, 6.3193359375, 7.095703125, 7.8720703125, 8.6484375, 9.4248046875, 10.201171875, 10.9775390625, 11.75390625, 12.5302734375, 13.306640625, 14.0830078125, 14.859375, 15.6357421875, 16.412109375, 17.1884765625, 17.96484375, 18.7412109375, 19.517578125, 20.2939453125, 21.0703125, 21.8466796875, 22.623046875, 23.3994140625, 24.17578125, 24.9521484375, 25.728515625, 26.5048828125, 27.28125]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 7.0, 6.0, 11.0, 13.0, 25.0, 17.0, 36.0, 37.0, 62.0, 90.0, 108.0, 148.0, 168.0, 252.0, 342.0, 457.0, 571.0, 769.0, 1063.0, 1496.0, 2501.0, 4654.0, 10659.0, 38832.0, 337601.0, 567645.0, 53691.0, 13081.0, 5374.0, 2681.0, 1708.0, 1223.0, 784.0, 627.0, 483.0, 322.0, 278.0, 188.0, 141.0, 107.0, 75.0, 64.0, 58.0, 24.0, 25.0, 19.0, 13.0, 14.0, 2.0, 6.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-25.25, -24.43798828125, -23.6259765625, -22.81396484375, -22.001953125, -21.18994140625, -20.3779296875, -19.56591796875, -18.75390625, -17.94189453125, -17.1298828125, -16.31787109375, -15.505859375, -14.69384765625, -13.8818359375, -13.06982421875, -12.2578125, -11.44580078125, -10.6337890625, -9.82177734375, -9.009765625, -8.19775390625, -7.3857421875, -6.57373046875, -5.76171875, -4.94970703125, -4.1376953125, -3.32568359375, -2.513671875, -1.70166015625, -0.8896484375, -0.07763671875, 0.734375, 1.54638671875, 2.3583984375, 3.17041015625, 3.982421875, 4.79443359375, 5.6064453125, 6.41845703125, 7.23046875, 8.04248046875, 8.8544921875, 9.66650390625, 10.478515625, 11.29052734375, 12.1025390625, 12.91455078125, 13.7265625, 14.53857421875, 15.3505859375, 16.16259765625, 16.974609375, 17.78662109375, 18.5986328125, 19.41064453125, 20.22265625, 21.03466796875, 21.8466796875, 22.65869140625, 23.470703125, 24.28271484375, 25.0947265625, 25.90673828125, 26.71875]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 3.0, 9.0, 6.0, 6.0, 8.0, 6.0, 11.0, 14.0, 13.0, 27.0, 18.0, 31.0, 25.0, 21.0, 23.0, 38.0, 25.0, 36.0, 37.0, 44.0, 44.0, 152.0, 1814.0, 185.0, 39.0, 41.0, 44.0, 34.0, 29.0, 28.0, 35.0, 30.0, 23.0, 22.0, 23.0, 16.0, 12.0, 14.0, 10.0, 6.0, 11.0, 8.0, 5.0, 7.0, 2.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-63.53125, -61.52001953125, -59.5087890625, -57.49755859375, -55.486328125, -53.47509765625, -51.4638671875, -49.45263671875, -47.44140625, -45.43017578125, -43.4189453125, -41.40771484375, -39.396484375, -37.38525390625, -35.3740234375, -33.36279296875, -31.3515625, -29.34033203125, -27.3291015625, -25.31787109375, -23.306640625, -21.29541015625, -19.2841796875, -17.27294921875, -15.26171875, -13.25048828125, -11.2392578125, -9.22802734375, -7.216796875, -5.20556640625, -3.1943359375, -1.18310546875, 0.828125, 2.83935546875, 4.8505859375, 6.86181640625, 8.873046875, 10.88427734375, 12.8955078125, 14.90673828125, 16.91796875, 18.92919921875, 20.9404296875, 22.95166015625, 24.962890625, 26.97412109375, 28.9853515625, 30.99658203125, 33.0078125, 35.01904296875, 37.0302734375, 39.04150390625, 41.052734375, 43.06396484375, 45.0751953125, 47.08642578125, 49.09765625, 51.10888671875, 53.1201171875, 55.13134765625, 57.142578125, 59.15380859375, 61.1650390625, 63.17626953125, 65.1875]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 8.0, 3.0, 8.0, 9.0, 20.0, 23.0, 27.0, 38.0, 71.0, 107.0, 143.0, 232.0, 541.0, 3212.0, 3122161.0, 17284.0, 906.0, 322.0, 205.0, 104.0, 82.0, 62.0, 49.0, 25.0, 18.0, 11.0, 13.0, 3.0, 4.0, 5.0, 3.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-218.25, -210.375, -202.5, -194.625, -186.75, -178.875, -171.0, -163.125, -155.25, -147.375, -139.5, -131.625, -123.75, -115.875, -108.0, -100.125, -92.25, -84.375, -76.5, -68.625, -60.75, -52.875, -45.0, -37.125, -29.25, -21.375, -13.5, -5.625, 2.25, 10.125, 18.0, 25.875, 33.75, 41.625, 49.5, 57.375, 65.25, 73.125, 81.0, 88.875, 96.75, 104.625, 112.5, 120.375, 128.25, 136.125, 144.0, 151.875, 159.75, 167.625, 175.5, 183.375, 191.25, 199.125, 207.0, 214.875, 222.75, 230.625, 238.5, 246.375, 254.25, 262.125, 270.0, 277.875, 285.75]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 3.0, 10.0, 12.0, 34.0, 40.0, 82.0, 117.0, 175.0, 182.0, 156.0, 94.0, 53.0, 21.0, 10.0, 10.0, 3.0, 2.0, 7.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.06866455078125, -102.8968734741211, -100.72508239746094, -98.55329895019531, -96.38150787353516, -94.209716796875, -92.03792572021484, -89.86613464355469, -87.69435119628906, -85.5225601196289, -83.35076904296875, -81.17898559570312, -79.00719451904297, -76.83540344238281, -74.66361236572266, -72.4918212890625, -70.32003021240234, -68.14823913574219, -65.97644805908203, -63.80466079711914, -61.63287353515625, -59.461082458496094, -57.28929138183594, -55.11750030517578, -52.94571304321289, -50.773921966552734, -48.602134704589844, -46.43034362792969, -44.25855255126953, -42.08676528930664, -39.914974212646484, -37.743186950683594, -35.57139205932617, -33.399600982666016, -31.227813720703125, -29.05602264404297, -26.884233474731445, -24.712444305419922, -22.540653228759766, -20.368864059448242, -18.19707489013672, -16.025285720825195, -13.853495597839355, -11.681705474853516, -9.509916305541992, -7.338127136230469, -5.166337013244629, -2.994546890258789, -0.8227577209472656, 1.349031925201416, 3.5208215713500977, 5.692611217498779, 7.864400863647461, 10.036190032958984, 12.207980155944824, 14.379770278930664, 16.551559448242188, 18.72334861755371, 20.895137786865234, 23.06692886352539, 25.238718032836914, 27.410507202148438, 29.582298278808594, 31.754087448120117, 33.92587661743164]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 2.0, 2.0, 5.0, 5.0, 10.0, 6.0, 10.0, 10.0, 6.0, 10.0, 8.0, 14.0, 13.0, 18.0, 16.0, 20.0, 24.0, 24.0, 20.0, 36.0, 23.0, 44.0, 40.0, 37.0, 37.0, 26.0, 33.0, 38.0, 31.0, 36.0, 36.0, 40.0, 21.0, 27.0, 28.0, 21.0, 21.0, 36.0, 29.0, 23.0, 16.0, 18.0, 6.0, 15.0, 13.0, 9.0, 12.0, 5.0, 7.0, 3.0, 7.0, 4.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-143.6927490234375, -139.14691162109375, -134.60105895996094, -130.0552215576172, -125.50936889648438, -120.9635238647461, -116.41767883300781, -111.87184143066406, -107.32598876953125, -102.78014373779297, -98.23429870605469, -93.6884536743164, -89.14260864257812, -84.59676361083984, -80.05091857910156, -75.50508117675781, -70.95923614501953, -66.41339111328125, -61.86754608154297, -57.32170104980469, -52.775856018066406, -48.230010986328125, -43.68416976928711, -39.13832473754883, -34.59247970581055, -30.046634674072266, -25.500789642333984, -20.954946517944336, -16.409101486206055, -11.863256454467773, -7.317413330078125, -2.7715682983398438, 1.7742767333984375, 6.3201212882995605, 10.865965843200684, 15.411809921264648, 19.95765495300293, 24.50349998474121, 29.04934310913086, 33.59518814086914, 38.14103317260742, 42.6868782043457, 47.232723236083984, 51.778564453125, 56.32440948486328, 60.87025451660156, 65.41609954833984, 69.96194458007812, 74.5077896118164, 79.05363464355469, 83.59947967529297, 88.14532470703125, 92.69116973876953, 97.23701477050781, 101.78285217285156, 106.32870483398438, 110.87454223632812, 115.4203872680664, 119.96623229980469, 124.51207733154297, 129.05792236328125, 133.603759765625, 138.1496124267578, 142.69544982910156, 147.24130249023438]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 2.0, 4.0, 1.0, 8.0, 7.0, 9.0, 13.0, 15.0, 16.0, 14.0, 25.0, 21.0, 16.0, 29.0, 28.0, 31.0, 33.0, 38.0, 45.0, 44.0, 42.0, 53.0, 48.0, 46.0, 50.0, 48.0, 37.0, 43.0, 34.0, 27.0, 39.0, 27.0, 16.0, 20.0, 11.0, 14.0, 9.0, 9.0, 10.0, 9.0, 5.0, 4.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.546875, -23.729736328125, -22.91259765625, -22.095458984375, -21.2783203125, -20.461181640625, -19.64404296875, -18.826904296875, -18.009765625, -17.192626953125, -16.37548828125, -15.558349609375, -14.7412109375, -13.924072265625, -13.10693359375, -12.289794921875, -11.47265625, -10.655517578125, -9.83837890625, -9.021240234375, -8.2041015625, -7.386962890625, -6.56982421875, -5.752685546875, -4.935546875, -4.118408203125, -3.30126953125, -2.484130859375, -1.6669921875, -0.849853515625, -0.03271484375, 0.784423828125, 1.6015625, 2.418701171875, 3.23583984375, 4.052978515625, 4.8701171875, 5.687255859375, 6.50439453125, 7.321533203125, 8.138671875, 8.955810546875, 9.77294921875, 10.590087890625, 11.4072265625, 12.224365234375, 13.04150390625, 13.858642578125, 14.67578125, 15.492919921875, 16.31005859375, 17.127197265625, 17.9443359375, 18.761474609375, 19.57861328125, 20.395751953125, 21.212890625, 22.030029296875, 22.84716796875, 23.664306640625, 24.4814453125, 25.298583984375, 26.11572265625, 26.932861328125, 27.75]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 5.0, 6.0, 10.0, 12.0, 15.0, 33.0, 35.0, 39.0, 54.0, 84.0, 101.0, 128.0, 181.0, 226.0, 282.0, 410.0, 555.0, 789.0, 1315.0, 2345.0, 4846.0, 13457.0, 150392.0, 3064574.0, 901514.0, 36210.0, 7825.0, 3363.0, 1840.0, 1047.0, 699.0, 469.0, 365.0, 252.0, 189.0, 141.0, 103.0, 96.0, 71.0, 48.0, 37.0, 34.0, 26.0, 19.0, 9.0, 11.0, 10.0, 5.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-61.40625, -59.34326171875, -57.2802734375, -55.21728515625, -53.154296875, -51.09130859375, -49.0283203125, -46.96533203125, -44.90234375, -42.83935546875, -40.7763671875, -38.71337890625, -36.650390625, -34.58740234375, -32.5244140625, -30.46142578125, -28.3984375, -26.33544921875, -24.2724609375, -22.20947265625, -20.146484375, -18.08349609375, -16.0205078125, -13.95751953125, -11.89453125, -9.83154296875, -7.7685546875, -5.70556640625, -3.642578125, -1.57958984375, 0.4833984375, 2.54638671875, 4.609375, 6.67236328125, 8.7353515625, 10.79833984375, 12.861328125, 14.92431640625, 16.9873046875, 19.05029296875, 21.11328125, 23.17626953125, 25.2392578125, 27.30224609375, 29.365234375, 31.42822265625, 33.4912109375, 35.55419921875, 37.6171875, 39.68017578125, 41.7431640625, 43.80615234375, 45.869140625, 47.93212890625, 49.9951171875, 52.05810546875, 54.12109375, 56.18408203125, 58.2470703125, 60.31005859375, 62.373046875, 64.43603515625, 66.4990234375, 68.56201171875, 70.625]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 0.0, 3.0, 5.0, 5.0, 5.0, 13.0, 21.0, 16.0, 31.0, 28.0, 36.0, 59.0, 118.0, 209.0, 421.0, 820.0, 929.0, 622.0, 310.0, 111.0, 90.0, 63.0, 39.0, 30.0, 30.0, 14.0, 12.0, 10.0, 5.0, 5.0, 4.0, 1.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.125, -54.3828125, -52.640625, -50.8984375, -49.15625, -47.4140625, -45.671875, -43.9296875, -42.1875, -40.4453125, -38.703125, -36.9609375, -35.21875, -33.4765625, -31.734375, -29.9921875, -28.25, -26.5078125, -24.765625, -23.0234375, -21.28125, -19.5390625, -17.796875, -16.0546875, -14.3125, -12.5703125, -10.828125, -9.0859375, -7.34375, -5.6015625, -3.859375, -2.1171875, -0.375, 1.3671875, 3.109375, 4.8515625, 6.59375, 8.3359375, 10.078125, 11.8203125, 13.5625, 15.3046875, 17.046875, 18.7890625, 20.53125, 22.2734375, 24.015625, 25.7578125, 27.5, 29.2421875, 30.984375, 32.7265625, 34.46875, 36.2109375, 37.953125, 39.6953125, 41.4375, 43.1796875, 44.921875, 46.6640625, 48.40625, 50.1484375, 51.890625, 53.6328125, 55.375]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 1.0, 6.0, 6.0, 8.0, 14.0, 19.0, 38.0, 29.0, 61.0, 95.0, 217.0, 552.0, 2765.0, 35211.0, 4079623.0, 70456.0, 3937.0, 716.0, 239.0, 93.0, 47.0, 41.0, 28.0, 19.0, 16.0, 13.0, 9.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-241.5, -233.85546875, -226.2109375, -218.56640625, -210.921875, -203.27734375, -195.6328125, -187.98828125, -180.34375, -172.69921875, -165.0546875, -157.41015625, -149.765625, -142.12109375, -134.4765625, -126.83203125, -119.1875, -111.54296875, -103.8984375, -96.25390625, -88.609375, -80.96484375, -73.3203125, -65.67578125, -58.03125, -50.38671875, -42.7421875, -35.09765625, -27.453125, -19.80859375, -12.1640625, -4.51953125, 3.125, 10.76953125, 18.4140625, 26.05859375, 33.703125, 41.34765625, 48.9921875, 56.63671875, 64.28125, 71.92578125, 79.5703125, 87.21484375, 94.859375, 102.50390625, 110.1484375, 117.79296875, 125.4375, 133.08203125, 140.7265625, 148.37109375, 156.015625, 163.66015625, 171.3046875, 178.94921875, 186.59375, 194.23828125, 201.8828125, 209.52734375, 217.171875, 224.81640625, 232.4609375, 240.10546875, 247.75]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 7.0, 7.0, 9.0, 12.0, 34.0, 32.0, 69.0, 109.0, 150.0, 186.0, 153.0, 95.0, 58.0, 33.0, 24.0, 15.0, 10.0, 2.0, 2.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-317.0658264160156, -309.921630859375, -302.77740478515625, -295.6332092285156, -288.489013671875, -281.34478759765625, -274.2005920410156, -267.0563659667969, -259.91217041015625, -252.76795959472656, -245.62374877929688, -238.47955322265625, -231.33534240722656, -224.19113159179688, -217.04693603515625, -209.90272521972656, -202.75851440429688, -195.6143035888672, -188.4700927734375, -181.32589721679688, -174.1816864013672, -167.0374755859375, -159.89328002929688, -152.7490692138672, -145.6048583984375, -138.4606475830078, -131.31643676757812, -124.1722412109375, -117.02803039550781, -109.88381958007812, -102.73961639404297, -95.59541320800781, -88.45121765136719, -81.3070068359375, -74.16280364990234, -67.01860046386719, -59.8743896484375, -52.73018264770508, -45.585975646972656, -38.441768646240234, -31.297561645507812, -24.15335464477539, -17.00914764404297, -9.864940643310547, -2.720733642578125, 4.423473358154297, 11.567680358886719, 18.71188735961914, 25.856094360351562, 33.000301361083984, 40.144508361816406, 47.28871536254883, 54.43292236328125, 61.57712936401367, 68.7213363647461, 75.86553955078125, 83.00975036621094, 90.15396118164062, 97.29816436767578, 104.44236755371094, 111.58657836914062, 118.73078918457031, 125.87499237060547, 133.01919555664062, 140.1634063720703]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 5.0, 4.0, 4.0, 6.0, 6.0, 2.0, 7.0, 6.0, 11.0, 12.0, 17.0, 7.0, 8.0, 25.0, 19.0, 28.0, 32.0, 24.0, 30.0, 26.0, 30.0, 44.0, 27.0, 26.0, 32.0, 45.0, 29.0, 46.0, 35.0, 35.0, 40.0, 37.0, 38.0, 33.0, 35.0, 25.0, 24.0, 26.0, 17.0, 19.0, 11.0, 15.0, 9.0, 11.0, 9.0, 9.0, 5.0, 9.0, 3.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-113.650634765625, -109.86417388916016, -106.07772064208984, -102.291259765625, -98.50480651855469, -94.71834564208984, -90.931884765625, -87.14543151855469, -83.35897064208984, -79.572509765625, -75.78605651855469, -71.99959564208984, -68.213134765625, -64.42668151855469, -60.640220642089844, -56.853763580322266, -53.06730651855469, -49.28084945678711, -45.49439239501953, -41.70793151855469, -37.92147445678711, -34.13501739501953, -30.34855842590332, -26.56209945678711, -22.77564239501953, -18.989185333251953, -15.202726364135742, -11.416268348693848, -7.629810333251953, -3.843353271484375, -0.05689430236816406, 3.729564666748047, 7.516021728515625, 11.30247974395752, 15.088937759399414, 18.875396728515625, 22.661853790283203, 26.44831085205078, 30.234769821166992, 34.0212287902832, 37.80768585205078, 41.59414291381836, 45.38059997558594, 49.16706085205078, 52.95351791381836, 56.73997497558594, 60.52643585205078, 64.31289672851562, 68.09934997558594, 71.88581085205078, 75.6722640991211, 79.45872497558594, 83.24517822265625, 87.0316390991211, 90.81809997558594, 94.60455322265625, 98.3910140991211, 102.17747497558594, 105.96392822265625, 109.7503890991211, 113.53684997558594, 117.32330322265625, 121.1097640991211, 124.89622497558594, 128.68267822265625]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 7.0, 6.0, 8.0, 14.0, 12.0, 14.0, 17.0, 26.0, 21.0, 20.0, 29.0, 27.0, 38.0, 32.0, 31.0, 30.0, 31.0, 53.0, 59.0, 50.0, 37.0, 45.0, 41.0, 35.0, 42.0, 44.0, 22.0, 33.0, 23.0, 25.0, 22.0, 18.0, 15.0, 11.0, 8.0, 12.0, 9.0, 5.0, 5.0, 5.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.75, -21.00830078125, -20.2666015625, -19.52490234375, -18.783203125, -18.04150390625, -17.2998046875, -16.55810546875, -15.81640625, -15.07470703125, -14.3330078125, -13.59130859375, -12.849609375, -12.10791015625, -11.3662109375, -10.62451171875, -9.8828125, -9.14111328125, -8.3994140625, -7.65771484375, -6.916015625, -6.17431640625, -5.4326171875, -4.69091796875, -3.94921875, -3.20751953125, -2.4658203125, -1.72412109375, -0.982421875, -0.24072265625, 0.5009765625, 1.24267578125, 1.984375, 2.72607421875, 3.4677734375, 4.20947265625, 4.951171875, 5.69287109375, 6.4345703125, 7.17626953125, 7.91796875, 8.65966796875, 9.4013671875, 10.14306640625, 10.884765625, 11.62646484375, 12.3681640625, 13.10986328125, 13.8515625, 14.59326171875, 15.3349609375, 16.07666015625, 16.818359375, 17.56005859375, 18.3017578125, 19.04345703125, 19.78515625, 20.52685546875, 21.2685546875, 22.01025390625, 22.751953125, 23.49365234375, 24.2353515625, 24.97705078125, 25.71875]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 1.0, 6.0, 3.0, 9.0, 20.0, 13.0, 27.0, 34.0, 58.0, 79.0, 114.0, 146.0, 256.0, 345.0, 550.0, 802.0, 1147.0, 1896.0, 2939.0, 4677.0, 7565.0, 12388.0, 20919.0, 35277.0, 61128.0, 109030.0, 198492.0, 249281.0, 146322.0, 80429.0, 45990.0, 26679.0, 15928.0, 9538.0, 5898.0, 3687.0, 2410.0, 1512.0, 971.0, 664.0, 415.0, 284.0, 202.0, 120.0, 97.0, 62.0, 61.0, 30.0, 14.0, 17.0, 10.0, 9.0, 7.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.109375, -1.07269287109375, -1.0360107421875, -0.99932861328125, -0.962646484375, -0.92596435546875, -0.8892822265625, -0.85260009765625, -0.81591796875, -0.77923583984375, -0.7425537109375, -0.70587158203125, -0.669189453125, -0.63250732421875, -0.5958251953125, -0.55914306640625, -0.5224609375, -0.48577880859375, -0.4490966796875, -0.41241455078125, -0.375732421875, -0.33905029296875, -0.3023681640625, -0.26568603515625, -0.22900390625, -0.19232177734375, -0.1556396484375, -0.11895751953125, -0.082275390625, -0.04559326171875, -0.0089111328125, 0.02777099609375, 0.064453125, 0.10113525390625, 0.1378173828125, 0.17449951171875, 0.211181640625, 0.24786376953125, 0.2845458984375, 0.32122802734375, 0.35791015625, 0.39459228515625, 0.4312744140625, 0.46795654296875, 0.504638671875, 0.54132080078125, 0.5780029296875, 0.61468505859375, 0.6513671875, 0.68804931640625, 0.7247314453125, 0.76141357421875, 0.798095703125, 0.83477783203125, 0.8714599609375, 0.90814208984375, 0.94482421875, 0.98150634765625, 1.0181884765625, 1.05487060546875, 1.091552734375, 1.12823486328125, 1.1649169921875, 1.20159912109375, 1.23828125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 3.0, 6.0, 4.0, 10.0, 7.0, 6.0, 14.0, 9.0, 20.0, 14.0, 24.0, 24.0, 15.0, 24.0, 29.0, 36.0, 38.0, 43.0, 35.0, 36.0, 31.0, 43.0, 38.0, 1059.0, 36.0, 35.0, 35.0, 38.0, 26.0, 33.0, 32.0, 31.0, 25.0, 25.0, 14.0, 16.0, 17.0, 15.0, 19.0, 10.0, 11.0, 11.0, 5.0, 4.0, 7.0, 5.0, 3.0, 3.0, 2.0, 0.0, 2.0, 4.0, 1.0], "bins": [-14.7578125, -14.32470703125, -13.8916015625, -13.45849609375, -13.025390625, -12.59228515625, -12.1591796875, -11.72607421875, -11.29296875, -10.85986328125, -10.4267578125, -9.99365234375, -9.560546875, -9.12744140625, -8.6943359375, -8.26123046875, -7.828125, -7.39501953125, -6.9619140625, -6.52880859375, -6.095703125, -5.66259765625, -5.2294921875, -4.79638671875, -4.36328125, -3.93017578125, -3.4970703125, -3.06396484375, -2.630859375, -2.19775390625, -1.7646484375, -1.33154296875, -0.8984375, -0.46533203125, -0.0322265625, 0.40087890625, 0.833984375, 1.26708984375, 1.7001953125, 2.13330078125, 2.56640625, 2.99951171875, 3.4326171875, 3.86572265625, 4.298828125, 4.73193359375, 5.1650390625, 5.59814453125, 6.03125, 6.46435546875, 6.8974609375, 7.33056640625, 7.763671875, 8.19677734375, 8.6298828125, 9.06298828125, 9.49609375, 9.92919921875, 10.3623046875, 10.79541015625, 11.228515625, 11.66162109375, 12.0947265625, 12.52783203125, 12.9609375]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 4.0, 6.0, 15.0, 17.0, 26.0, 51.0, 56.0, 81.0, 143.0, 201.0, 290.0, 370.0, 574.0, 813.0, 1113.0, 1639.0, 2293.0, 3194.0, 4434.0, 6367.0, 8901.0, 12792.0, 18806.0, 27627.0, 41961.0, 65765.0, 107252.0, 175485.0, 1247418.0, 133429.0, 80263.0, 50375.0, 33118.0, 22013.0, 14866.0, 10412.0, 7311.0, 5141.0, 3623.0, 2605.0, 1880.0, 1322.0, 931.0, 661.0, 488.0, 301.0, 222.0, 180.0, 98.0, 85.0, 45.0, 32.0, 15.0, 17.0, 7.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.83740234375, -0.8105697631835938, -0.7837371826171875, -0.7569046020507812, -0.730072021484375, -0.7032394409179688, -0.6764068603515625, -0.6495742797851562, -0.62274169921875, -0.5959091186523438, -0.5690765380859375, -0.5422439575195312, -0.515411376953125, -0.48857879638671875, -0.4617462158203125, -0.43491363525390625, -0.4080810546875, -0.38124847412109375, -0.3544158935546875, -0.32758331298828125, -0.300750732421875, -0.27391815185546875, -0.2470855712890625, -0.22025299072265625, -0.19342041015625, -0.16658782958984375, -0.1397552490234375, -0.11292266845703125, -0.086090087890625, -0.05925750732421875, -0.0324249267578125, -0.00559234619140625, 0.021240234375, 0.04807281494140625, 0.0749053955078125, 0.10173797607421875, 0.128570556640625, 0.15540313720703125, 0.1822357177734375, 0.20906829833984375, 0.23590087890625, 0.26273345947265625, 0.2895660400390625, 0.31639862060546875, 0.343231201171875, 0.37006378173828125, 0.3968963623046875, 0.42372894287109375, 0.4505615234375, 0.47739410400390625, 0.5042266845703125, 0.5310592651367188, 0.557891845703125, 0.5847244262695312, 0.6115570068359375, 0.6383895874023438, 0.66522216796875, 0.6920547485351562, 0.7188873291015625, 0.7457199096679688, 0.772552490234375, 0.7993850708007812, 0.8262176513671875, 0.8530502319335938, 0.8798828125]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 6.0, 3.0, 3.0, 5.0, 10.0, 9.0, 15.0, 26.0, 27.0, 37.0, 32.0, 52.0, 51.0, 52.0, 72.0, 66.0, 63.0, 61.0, 64.0, 53.0, 47.0, 48.0, 39.0, 31.0, 26.0, 16.0, 22.0, 14.0, 10.0, 13.0, 8.0, 7.0, 6.0, 2.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00482940673828125, -0.00467228889465332, -0.004515171051025391, -0.004358053207397461, -0.004200935363769531, -0.0040438175201416016, -0.003886699676513672, -0.003729581832885742, -0.0035724639892578125, -0.003415346145629883, -0.003258228302001953, -0.0031011104583740234, -0.0029439926147460938, -0.002786874771118164, -0.0026297569274902344, -0.0024726390838623047, -0.002315521240234375, -0.0021584033966064453, -0.0020012855529785156, -0.001844167709350586, -0.0016870498657226562, -0.0015299320220947266, -0.0013728141784667969, -0.0012156963348388672, -0.0010585784912109375, -0.0009014606475830078, -0.0007443428039550781, -0.0005872249603271484, -0.00043010711669921875, -0.00027298927307128906, -0.00011587142944335938, 4.124641418457031e-05, 0.0001983642578125, 0.0003554821014404297, 0.0005125999450683594, 0.0006697177886962891, 0.0008268356323242188, 0.0009839534759521484, 0.0011410713195800781, 0.0012981891632080078, 0.0014553070068359375, 0.0016124248504638672, 0.0017695426940917969, 0.0019266605377197266, 0.0020837783813476562, 0.002240896224975586, 0.0023980140686035156, 0.0025551319122314453, 0.002712249755859375, 0.0028693675994873047, 0.0030264854431152344, 0.003183603286743164, 0.0033407211303710938, 0.0034978389739990234, 0.003654956817626953, 0.003812074661254883, 0.0039691925048828125, 0.004126310348510742, 0.004283428192138672, 0.0044405460357666016, 0.004597663879394531, 0.004754781723022461, 0.004911899566650391, 0.00506901741027832, 0.00522613525390625]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 8.0, 5.0, 6.0, 9.0, 14.0, 17.0, 15.0, 18.0, 38.0, 40.0, 58.0, 95.0, 138.0, 207.0, 558.0, 19565.0, 1017260.0, 9416.0, 451.0, 205.0, 133.0, 84.0, 71.0, 36.0, 35.0, 22.0, 21.0, 9.0, 11.0, 2.0, 2.0, 5.0, 1.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11767578125, -0.11404800415039062, -0.11042022705078125, -0.10679244995117188, -0.1031646728515625, -0.09953689575195312, -0.09590911865234375, -0.09228134155273438, -0.088653564453125, -0.08502578735351562, -0.08139801025390625, -0.07777023315429688, -0.0741424560546875, -0.07051467895507812, -0.06688690185546875, -0.06325912475585938, -0.05963134765625, -0.056003570556640625, -0.05237579345703125, -0.048748016357421875, -0.0451202392578125, -0.041492462158203125, -0.03786468505859375, -0.034236907958984375, -0.030609130859375, -0.026981353759765625, -0.02335357666015625, -0.019725799560546875, -0.0160980224609375, -0.012470245361328125, -0.00884246826171875, -0.005214691162109375, -0.0015869140625, 0.002040863037109375, 0.00566864013671875, 0.009296417236328125, 0.0129241943359375, 0.016551971435546875, 0.02017974853515625, 0.023807525634765625, 0.027435302734375, 0.031063079833984375, 0.03469085693359375, 0.038318634033203125, 0.0419464111328125, 0.045574188232421875, 0.04920196533203125, 0.052829742431640625, 0.05645751953125, 0.060085296630859375, 0.06371307373046875, 0.06734085083007812, 0.0709686279296875, 0.07459640502929688, 0.07822418212890625, 0.08185195922851562, 0.085479736328125, 0.08910751342773438, 0.09273529052734375, 0.09636306762695312, 0.0999908447265625, 0.10361862182617188, 0.10724639892578125, 0.11087417602539062, 0.114501953125]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 7.0, 41.0, 122.0, 374.0, 341.0, 89.0, 33.0, 8.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002465706318616867, -0.002048881258815527, -0.0016320561990141869, -0.0012152311392128468, -0.0007984060794115067, -0.00038158101961016655, 3.5244040191173553e-05, 0.00045206909999251366, 0.0008688941597938538, 0.0012857192195951939, 0.001702544279396534, 0.002119369339197874, 0.002536194398999214, 0.0029530194588005543, 0.0033698445186018944, 0.0037866695784032345, 0.004203494638204575, 0.004620319698005915, 0.005037144757807255, 0.005453969817608595, 0.005870794877409935, 0.006287619937211275, 0.006704444997012615, 0.007121270056813955, 0.007538095116615295, 0.007954919710755348, 0.008371745236217976, 0.008788570761680603, 0.009205395355820656, 0.009622219949960709, 0.010039045475423336, 0.010455871000885963, 0.010872695595026016, 0.011289520189166069, 0.011706345714628696, 0.012123171240091324, 0.012539995834231377, 0.01295682042837143, 0.013373645953834057, 0.013790471479296684, 0.014207296073436737, 0.01462412066757679, 0.015040946193039417, 0.015457771718502045, 0.015874596312642097, 0.01629142090678215, 0.016708247363567352, 0.017125071957707405, 0.017541896551847458, 0.01795872114598751, 0.018375545740127563, 0.018792372196912766, 0.01920919679105282, 0.01962602138519287, 0.020042847841978073, 0.020459672436118126, 0.02087649703025818, 0.02129332162439823, 0.021710146218538284, 0.022126972675323486, 0.02254379726946354, 0.022960621863603592, 0.023377448320388794, 0.023794272914528847, 0.0242110975086689]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 3.0, 5.0, 2.0, 2.0, 2.0, 14.0, 15.0, 12.0, 22.0, 16.0, 24.0, 22.0, 18.0, 21.0, 29.0, 32.0, 41.0, 35.0, 31.0, 47.0, 39.0, 32.0, 39.0, 37.0, 45.0, 38.0, 32.0, 43.0, 40.0, 31.0, 35.0, 24.0, 35.0, 31.0, 20.0, 15.0, 12.0, 13.0, 13.0, 13.0, 7.0, 8.0, 10.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020807981491088867, -0.002001827582716942, -0.001922857016324997, -0.001843886449933052, -0.0017649158835411072, -0.0016859453171491623, -0.0016069747507572174, -0.0015280041843652725, -0.0014490336179733276, -0.0013700630515813828, -0.0012910924851894379, -0.001212121918797493, -0.001133151352405548, -0.0010541807860136032, -0.0009752102196216583, -0.0008962396532297134, -0.0008172690868377686, -0.0007382985204458237, -0.0006593279540538788, -0.0005803573876619339, -0.000501386821269989, -0.00042241625487804413, -0.00034344568848609924, -0.00026447512209415436, -0.00018550455570220947, -0.00010653398931026459, -2.7563422918319702e-05, 5.140714347362518e-05, 0.00013037770986557007, 0.00020934827625751495, 0.00028831884264945984, 0.0003672894090414047, 0.0004462599754333496, 0.0005252305418252945, 0.0006042011082172394, 0.0006831716746091843, 0.0007621422410011292, 0.000841112807393074, 0.0009200833737850189, 0.0009990539401769638, 0.0010780245065689087, 0.0011569950729608536, 0.0012359656393527985, 0.0013149362057447433, 0.0013939067721366882, 0.0014728773385286331, 0.001551847904920578, 0.0016308184713125229, 0.0017097890377044678, 0.0017887596040964127, 0.0018677301704883575, 0.0019467007368803024, 0.0020256713032722473, 0.002104641869664192, 0.002183612436056137, 0.002262583002448082, 0.002341553568840027, 0.0024205241352319717, 0.0024994947016239166, 0.0025784652680158615, 0.0026574358344078064, 0.0027364064007997513, 0.002815376967191696, 0.002894347533583641, 0.002973318099975586]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 7.0, 6.0, 8.0, 14.0, 12.0, 14.0, 17.0, 26.0, 21.0, 20.0, 29.0, 27.0, 38.0, 32.0, 31.0, 30.0, 31.0, 53.0, 59.0, 50.0, 37.0, 45.0, 41.0, 35.0, 42.0, 44.0, 22.0, 33.0, 23.0, 25.0, 22.0, 18.0, 15.0, 11.0, 8.0, 12.0, 9.0, 5.0, 5.0, 5.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.75, -21.00830078125, -20.2666015625, -19.52490234375, -18.783203125, -18.04150390625, -17.2998046875, -16.55810546875, -15.81640625, -15.07470703125, -14.3330078125, -13.59130859375, -12.849609375, -12.10791015625, -11.3662109375, -10.62451171875, -9.8828125, -9.14111328125, -8.3994140625, -7.65771484375, -6.916015625, -6.17431640625, -5.4326171875, -4.69091796875, -3.94921875, -3.20751953125, -2.4658203125, -1.72412109375, -0.982421875, -0.24072265625, 0.5009765625, 1.24267578125, 1.984375, 2.72607421875, 3.4677734375, 4.20947265625, 4.951171875, 5.69287109375, 6.4345703125, 7.17626953125, 7.91796875, 8.65966796875, 9.4013671875, 10.14306640625, 10.884765625, 11.62646484375, 12.3681640625, 13.10986328125, 13.8515625, 14.59326171875, 15.3349609375, 16.07666015625, 16.818359375, 17.56005859375, 18.3017578125, 19.04345703125, 19.78515625, 20.52685546875, 21.2685546875, 22.01025390625, 22.751953125, 23.49365234375, 24.2353515625, 24.97705078125, 25.71875]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 7.0, 6.0, 5.0, 7.0, 9.0, 15.0, 24.0, 32.0, 39.0, 44.0, 64.0, 86.0, 163.0, 260.0, 395.0, 665.0, 1083.0, 1878.0, 3339.0, 6003.0, 11175.0, 22995.0, 51030.0, 135751.0, 441683.0, 228411.0, 77738.0, 32039.0, 15430.0, 7923.0, 4144.0, 2502.0, 1435.0, 789.0, 466.0, 307.0, 195.0, 137.0, 83.0, 57.0, 42.0, 32.0, 24.0, 20.0, 12.0, 5.0, 4.0, 3.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-15.0, -14.5416259765625, -14.083251953125, -13.6248779296875, -13.16650390625, -12.7081298828125, -12.249755859375, -11.7913818359375, -11.3330078125, -10.8746337890625, -10.416259765625, -9.9578857421875, -9.49951171875, -9.0411376953125, -8.582763671875, -8.1243896484375, -7.666015625, -7.2076416015625, -6.749267578125, -6.2908935546875, -5.83251953125, -5.3741455078125, -4.915771484375, -4.4573974609375, -3.9990234375, -3.5406494140625, -3.082275390625, -2.6239013671875, -2.16552734375, -1.7071533203125, -1.248779296875, -0.7904052734375, -0.33203125, 0.1263427734375, 0.584716796875, 1.0430908203125, 1.50146484375, 1.9598388671875, 2.418212890625, 2.8765869140625, 3.3349609375, 3.7933349609375, 4.251708984375, 4.7100830078125, 5.16845703125, 5.6268310546875, 6.085205078125, 6.5435791015625, 7.001953125, 7.4603271484375, 7.918701171875, 8.3770751953125, 8.83544921875, 9.2938232421875, 9.752197265625, 10.2105712890625, 10.6689453125, 11.1273193359375, 11.585693359375, 12.0440673828125, 12.50244140625, 12.9608154296875, 13.419189453125, 13.8775634765625, 14.3359375]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 3.0, 0.0, 3.0, 2.0, 4.0, 9.0, 2.0, 9.0, 13.0, 14.0, 16.0, 17.0, 24.0, 19.0, 23.0, 37.0, 38.0, 34.0, 44.0, 44.0, 53.0, 94.0, 267.0, 1676.0, 151.0, 72.0, 65.0, 47.0, 44.0, 32.0, 23.0, 32.0, 25.0, 24.0, 14.0, 19.0, 17.0, 8.0, 8.0, 6.0, 10.0, 10.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.4375, -69.962890625, -67.48828125, -65.013671875, -62.5390625, -60.064453125, -57.58984375, -55.115234375, -52.640625, -50.166015625, -47.69140625, -45.216796875, -42.7421875, -40.267578125, -37.79296875, -35.318359375, -32.84375, -30.369140625, -27.89453125, -25.419921875, -22.9453125, -20.470703125, -17.99609375, -15.521484375, -13.046875, -10.572265625, -8.09765625, -5.623046875, -3.1484375, -0.673828125, 1.80078125, 4.275390625, 6.75, 9.224609375, 11.69921875, 14.173828125, 16.6484375, 19.123046875, 21.59765625, 24.072265625, 26.546875, 29.021484375, 31.49609375, 33.970703125, 36.4453125, 38.919921875, 41.39453125, 43.869140625, 46.34375, 48.818359375, 51.29296875, 53.767578125, 56.2421875, 58.716796875, 61.19140625, 63.666015625, 66.140625, 68.615234375, 71.08984375, 73.564453125, 76.0390625, 78.513671875, 80.98828125, 83.462890625, 85.9375]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 7.0, 10.0, 8.0, 10.0, 15.0, 17.0, 22.0, 26.0, 38.0, 53.0, 69.0, 72.0, 97.0, 161.0, 215.0, 301.0, 721.0, 5537.0, 3091720.0, 44087.0, 1181.0, 400.0, 240.0, 177.0, 122.0, 107.0, 66.0, 46.0, 40.0, 29.0, 29.0, 22.0, 22.0, 10.0, 8.0, 3.0, 6.0, 5.0, 2.0, 3.0, 2.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-202.625, -196.78515625, -190.9453125, -185.10546875, -179.265625, -173.42578125, -167.5859375, -161.74609375, -155.90625, -150.06640625, -144.2265625, -138.38671875, -132.546875, -126.70703125, -120.8671875, -115.02734375, -109.1875, -103.34765625, -97.5078125, -91.66796875, -85.828125, -79.98828125, -74.1484375, -68.30859375, -62.46875, -56.62890625, -50.7890625, -44.94921875, -39.109375, -33.26953125, -27.4296875, -21.58984375, -15.75, -9.91015625, -4.0703125, 1.76953125, 7.609375, 13.44921875, 19.2890625, 25.12890625, 30.96875, 36.80859375, 42.6484375, 48.48828125, 54.328125, 60.16796875, 66.0078125, 71.84765625, 77.6875, 83.52734375, 89.3671875, 95.20703125, 101.046875, 106.88671875, 112.7265625, 118.56640625, 124.40625, 130.24609375, 136.0859375, 141.92578125, 147.765625, 153.60546875, 159.4453125, 165.28515625, 171.125]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 9.0, 39.0, 83.0, 226.0, 346.0, 197.0, 78.0, 26.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.1983871459961, -76.55054473876953, -71.9027099609375, -67.25486755371094, -62.607025146484375, -57.95918273925781, -53.311344146728516, -48.66350555419922, -44.015663146972656, -39.367820739746094, -34.7199821472168, -30.072141647338867, -25.424301147460938, -20.776460647583008, -16.128620147705078, -11.480781555175781, -6.832939147949219, -2.185098648071289, 2.4627418518066406, 7.11058235168457, 11.7584228515625, 16.40626335144043, 21.05410385131836, 25.701942443847656, 30.34978485107422, 34.99762725830078, 39.64546585083008, 44.293304443359375, 48.94114685058594, 53.5889892578125, 58.2368278503418, 62.884666442871094, 67.53250122070312, 72.18034362792969, 76.82818603515625, 81.47602081298828, 86.12386322021484, 90.7717056274414, 95.41954040527344, 100.0673828125, 104.71522521972656, 109.36306762695312, 114.01091003417969, 118.65874481201172, 123.30658721923828, 127.95442962646484, 132.60226440429688, 137.25010681152344, 141.89794921875, 146.54579162597656, 151.19363403320312, 155.8414764404297, 160.48931884765625, 165.13714599609375, 169.7849884033203, 174.43283081054688, 179.08067321777344, 183.728515625, 188.37635803222656, 193.02420043945312, 197.67202758789062, 202.3198699951172, 206.96771240234375, 211.6155548095703, 216.26339721679688]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 2.0, 5.0, 10.0, 4.0, 9.0, 12.0, 13.0, 15.0, 24.0, 30.0, 22.0, 28.0, 36.0, 33.0, 30.0, 26.0, 28.0, 46.0, 34.0, 28.0, 45.0, 39.0, 43.0, 33.0, 49.0, 34.0, 40.0, 33.0, 47.0, 27.0, 24.0, 21.0, 20.0, 22.0, 20.0, 13.0, 11.0, 9.0, 8.0, 7.0, 7.0, 5.0, 5.0, 2.0, 6.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-169.39132690429688, -163.98867797851562, -158.5860137939453, -153.18336486816406, -147.78070068359375, -142.3780517578125, -136.97540283203125, -131.57273864746094, -126.17008209228516, -120.76742553710938, -115.3647689819336, -109.96211242675781, -104.55946350097656, -99.15679931640625, -93.754150390625, -88.35149383544922, -82.94883728027344, -77.54618072509766, -72.14352416992188, -66.74087524414062, -61.33821487426758, -55.9355583190918, -50.53290557861328, -45.1302490234375, -39.72759246826172, -34.32493591308594, -28.92228126525879, -23.51962661743164, -18.11697006225586, -12.714313507080078, -7.3116607666015625, -1.9090042114257812, 3.49365234375, 8.896307945251465, 14.29896354675293, 19.701618194580078, 25.10427474975586, 30.50693130493164, 35.909584045410156, 41.31224060058594, 46.71489715576172, 52.1175537109375, 57.52021026611328, 62.9228630065918, 68.32551574707031, 73.72817993164062, 79.13082885742188, 84.53348541259766, 89.93614196777344, 95.33879852294922, 100.741455078125, 106.14410400390625, 111.54676818847656, 116.94941711425781, 122.3520736694336, 127.75473022460938, 133.15737915039062, 138.56002807617188, 143.9626922607422, 149.36534118652344, 154.76800537109375, 160.170654296875, 165.57330322265625, 170.97596740722656, 176.37863159179688]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 4.0, 2.0, 3.0, 8.0, 7.0, 9.0, 8.0, 14.0, 13.0, 19.0, 13.0, 28.0, 29.0, 23.0, 30.0, 28.0, 31.0, 31.0, 38.0, 49.0, 44.0, 43.0, 43.0, 51.0, 45.0, 40.0, 40.0, 49.0, 25.0, 36.0, 38.0, 32.0, 21.0, 18.0, 17.0, 16.0, 12.0, 5.0, 8.0, 7.0, 14.0, 5.0, 3.0, 3.0, 2.0, 0.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.125, -21.3486328125, -20.572265625, -19.7958984375, -19.01953125, -18.2431640625, -17.466796875, -16.6904296875, -15.9140625, -15.1376953125, -14.361328125, -13.5849609375, -12.80859375, -12.0322265625, -11.255859375, -10.4794921875, -9.703125, -8.9267578125, -8.150390625, -7.3740234375, -6.59765625, -5.8212890625, -5.044921875, -4.2685546875, -3.4921875, -2.7158203125, -1.939453125, -1.1630859375, -0.38671875, 0.3896484375, 1.166015625, 1.9423828125, 2.71875, 3.4951171875, 4.271484375, 5.0478515625, 5.82421875, 6.6005859375, 7.376953125, 8.1533203125, 8.9296875, 9.7060546875, 10.482421875, 11.2587890625, 12.03515625, 12.8115234375, 13.587890625, 14.3642578125, 15.140625, 15.9169921875, 16.693359375, 17.4697265625, 18.24609375, 19.0224609375, 19.798828125, 20.5751953125, 21.3515625, 22.1279296875, 22.904296875, 23.6806640625, 24.45703125, 25.2333984375, 26.009765625, 26.7861328125, 27.5625]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 3.0, 11.0, 10.0, 9.0, 32.0, 23.0, 31.0, 51.0, 61.0, 82.0, 161.0, 168.0, 266.0, 411.0, 667.0, 1240.0, 2538.0, 6582.0, 38016.0, 1952327.0, 2139182.0, 39595.0, 6799.0, 2649.0, 1284.0, 705.0, 420.0, 286.0, 208.0, 121.0, 87.0, 67.0, 53.0, 36.0, 30.0, 22.0, 14.0, 12.0, 8.0, 4.0, 3.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.9375, -66.4765625, -64.015625, -61.5546875, -59.09375, -56.6328125, -54.171875, -51.7109375, -49.25, -46.7890625, -44.328125, -41.8671875, -39.40625, -36.9453125, -34.484375, -32.0234375, -29.5625, -27.1015625, -24.640625, -22.1796875, -19.71875, -17.2578125, -14.796875, -12.3359375, -9.875, -7.4140625, -4.953125, -2.4921875, -0.03125, 2.4296875, 4.890625, 7.3515625, 9.8125, 12.2734375, 14.734375, 17.1953125, 19.65625, 22.1171875, 24.578125, 27.0390625, 29.5, 31.9609375, 34.421875, 36.8828125, 39.34375, 41.8046875, 44.265625, 46.7265625, 49.1875, 51.6484375, 54.109375, 56.5703125, 59.03125, 61.4921875, 63.953125, 66.4140625, 68.875, 71.3359375, 73.796875, 76.2578125, 78.71875, 81.1796875, 83.640625, 86.1015625, 88.5625]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 3.0, 1.0, 7.0, 11.0, 5.0, 5.0, 13.0, 12.0, 16.0, 28.0, 43.0, 43.0, 59.0, 106.0, 219.0, 398.0, 711.0, 908.0, 632.0, 333.0, 190.0, 102.0, 60.0, 38.0, 30.0, 28.0, 23.0, 17.0, 8.0, 7.0, 1.0, 2.0, 0.0, 6.0, 4.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.09375, -32.634765625, -31.17578125, -29.716796875, -28.2578125, -26.798828125, -25.33984375, -23.880859375, -22.421875, -20.962890625, -19.50390625, -18.044921875, -16.5859375, -15.126953125, -13.66796875, -12.208984375, -10.75, -9.291015625, -7.83203125, -6.373046875, -4.9140625, -3.455078125, -1.99609375, -0.537109375, 0.921875, 2.380859375, 3.83984375, 5.298828125, 6.7578125, 8.216796875, 9.67578125, 11.134765625, 12.59375, 14.052734375, 15.51171875, 16.970703125, 18.4296875, 19.888671875, 21.34765625, 22.806640625, 24.265625, 25.724609375, 27.18359375, 28.642578125, 30.1015625, 31.560546875, 33.01953125, 34.478515625, 35.9375, 37.396484375, 38.85546875, 40.314453125, 41.7734375, 43.232421875, 44.69140625, 46.150390625, 47.609375, 49.068359375, 50.52734375, 51.986328125, 53.4453125, 54.904296875, 56.36328125, 57.822265625, 59.28125]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 7.0, 2.0, 3.0, 1.0, 5.0, 7.0, 15.0, 23.0, 30.0, 44.0, 64.0, 80.0, 166.0, 425.0, 1153.0, 7433.0, 190521.0, 3967838.0, 22695.0, 2634.0, 564.0, 234.0, 105.0, 74.0, 48.0, 26.0, 22.0, 19.0, 9.0, 4.0, 10.0, 8.0, 4.0, 2.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-243.125, -236.765625, -230.40625, -224.046875, -217.6875, -211.328125, -204.96875, -198.609375, -192.25, -185.890625, -179.53125, -173.171875, -166.8125, -160.453125, -154.09375, -147.734375, -141.375, -135.015625, -128.65625, -122.296875, -115.9375, -109.578125, -103.21875, -96.859375, -90.5, -84.140625, -77.78125, -71.421875, -65.0625, -58.703125, -52.34375, -45.984375, -39.625, -33.265625, -26.90625, -20.546875, -14.1875, -7.828125, -1.46875, 4.890625, 11.25, 17.609375, 23.96875, 30.328125, 36.6875, 43.046875, 49.40625, 55.765625, 62.125, 68.484375, 74.84375, 81.203125, 87.5625, 93.921875, 100.28125, 106.640625, 113.0, 119.359375, 125.71875, 132.078125, 138.4375, 144.796875, 151.15625, 157.515625, 163.875]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 8.0, 11.0, 27.0, 57.0, 138.0, 237.0, 274.0, 142.0, 56.0, 31.0, 15.0, 8.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-447.4386901855469, -437.7483825683594, -428.0580749511719, -418.3677978515625, -408.677490234375, -398.9871826171875, -389.296875, -379.6065673828125, -369.916259765625, -360.2259521484375, -350.53564453125, -340.8453674316406, -331.1550598144531, -321.4647521972656, -311.7744445800781, -302.0841369628906, -292.39385986328125, -282.70355224609375, -273.01324462890625, -263.3229675292969, -253.63265991210938, -243.94235229492188, -234.25204467773438, -224.56173706054688, -214.87144470214844, -205.18113708496094, -195.4908447265625, -185.800537109375, -176.1102294921875, -166.41993713378906, -156.72962951660156, -147.03933715820312, -137.3489990234375, -127.65869903564453, -117.96839904785156, -108.27809143066406, -98.5877914428711, -88.89749145507812, -79.20718383789062, -69.51688385009766, -59.82658386230469, -50.13628387451172, -40.445980072021484, -30.755678176879883, -21.06537628173828, -11.375076293945312, -1.6847724914550781, 8.005531311035156, 17.695831298828125, 27.386133193969727, 37.07643508911133, 46.76673889160156, 56.45703887939453, 66.1473388671875, 75.837646484375, 85.52794647216797, 95.21824645996094, 104.9085464477539, 114.59884643554688, 124.28915405273438, 133.97946166992188, 143.6697540283203, 153.3600616455078, 163.05035400390625, 172.74066162109375]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 5.0, 4.0, 3.0, 7.0, 7.0, 12.0, 8.0, 16.0, 13.0, 17.0, 15.0, 30.0, 24.0, 32.0, 27.0, 40.0, 32.0, 28.0, 38.0, 38.0, 45.0, 52.0, 44.0, 38.0, 50.0, 26.0, 34.0, 39.0, 24.0, 36.0, 31.0, 34.0, 11.0, 35.0, 21.0, 12.0, 13.0, 12.0, 11.0, 8.0, 6.0, 9.0, 6.0, 4.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-109.64241790771484, -106.25418090820312, -102.8659439086914, -99.47770690917969, -96.0894775390625, -92.70124053955078, -89.31300354003906, -85.92476654052734, -82.53652954101562, -79.1482925415039, -75.76005554199219, -72.371826171875, -68.98358917236328, -65.59535217285156, -62.207115173339844, -58.818878173828125, -55.43064880371094, -52.04241180419922, -48.654178619384766, -45.26594161987305, -41.877708435058594, -38.489471435546875, -35.101234436035156, -31.71299934387207, -28.324764251708984, -24.9365291595459, -21.548294067382812, -18.160057067871094, -14.771821975708008, -11.383586883544922, -7.995349884033203, -4.607114791870117, -1.2188873291015625, 2.1693482398986816, 5.557583808898926, 8.945819854736328, 12.334054946899414, 15.7222900390625, 19.11052703857422, 22.498762130737305, 25.88699722290039, 29.275232315063477, 32.66346740722656, 36.05170440673828, 39.43994140625, 42.82817459106445, 46.21641159057617, 49.604644775390625, 52.992881774902344, 56.38111877441406, 59.769351959228516, 63.157588958740234, 66.54582214355469, 69.9340591430664, 73.32229614257812, 76.71053314208984, 80.09877014160156, 83.48700714111328, 86.875244140625, 90.26347351074219, 93.6517105102539, 97.03994750976562, 100.42818450927734, 103.81642150878906, 107.20465087890625]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 0.0, 3.0, 2.0, 4.0, 6.0, 4.0, 6.0, 6.0, 6.0, 13.0, 15.0, 11.0, 15.0, 19.0, 24.0, 19.0, 28.0, 28.0, 31.0, 39.0, 39.0, 38.0, 34.0, 36.0, 50.0, 42.0, 58.0, 43.0, 44.0, 37.0, 27.0, 24.0, 29.0, 38.0, 25.0, 25.0, 20.0, 28.0, 15.0, 18.0, 14.0, 9.0, 4.0, 7.0, 6.0, 6.0, 5.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.75, -20.02392578125, -19.2978515625, -18.57177734375, -17.845703125, -17.11962890625, -16.3935546875, -15.66748046875, -14.94140625, -14.21533203125, -13.4892578125, -12.76318359375, -12.037109375, -11.31103515625, -10.5849609375, -9.85888671875, -9.1328125, -8.40673828125, -7.6806640625, -6.95458984375, -6.228515625, -5.50244140625, -4.7763671875, -4.05029296875, -3.32421875, -2.59814453125, -1.8720703125, -1.14599609375, -0.419921875, 0.30615234375, 1.0322265625, 1.75830078125, 2.484375, 3.21044921875, 3.9365234375, 4.66259765625, 5.388671875, 6.11474609375, 6.8408203125, 7.56689453125, 8.29296875, 9.01904296875, 9.7451171875, 10.47119140625, 11.197265625, 11.92333984375, 12.6494140625, 13.37548828125, 14.1015625, 14.82763671875, 15.5537109375, 16.27978515625, 17.005859375, 17.73193359375, 18.4580078125, 19.18408203125, 19.91015625, 20.63623046875, 21.3623046875, 22.08837890625, 22.814453125, 23.54052734375, 24.2666015625, 24.99267578125, 25.71875]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 3.0, 2.0, 7.0, 9.0, 10.0, 16.0, 31.0, 37.0, 38.0, 77.0, 99.0, 145.0, 197.0, 327.0, 476.0, 696.0, 1076.0, 1524.0, 2487.0, 3885.0, 5886.0, 9667.0, 16078.0, 26742.0, 47253.0, 85168.0, 162242.0, 265408.0, 188772.0, 98732.0, 53480.0, 30237.0, 17993.0, 10832.0, 6728.0, 4145.0, 2788.0, 1730.0, 1182.0, 760.0, 513.0, 342.0, 244.0, 150.0, 98.0, 74.0, 59.0, 43.0, 25.0, 17.0, 12.0, 6.0, 10.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.1513671875, -1.11248779296875, -1.0736083984375, -1.03472900390625, -0.995849609375, -0.95697021484375, -0.9180908203125, -0.87921142578125, -0.84033203125, -0.80145263671875, -0.7625732421875, -0.72369384765625, -0.684814453125, -0.64593505859375, -0.6070556640625, -0.56817626953125, -0.529296875, -0.49041748046875, -0.4515380859375, -0.41265869140625, -0.373779296875, -0.33489990234375, -0.2960205078125, -0.25714111328125, -0.21826171875, -0.17938232421875, -0.1405029296875, -0.10162353515625, -0.062744140625, -0.02386474609375, 0.0150146484375, 0.05389404296875, 0.0927734375, 0.13165283203125, 0.1705322265625, 0.20941162109375, 0.248291015625, 0.28717041015625, 0.3260498046875, 0.36492919921875, 0.40380859375, 0.44268798828125, 0.4815673828125, 0.52044677734375, 0.559326171875, 0.59820556640625, 0.6370849609375, 0.67596435546875, 0.71484375, 0.75372314453125, 0.7926025390625, 0.83148193359375, 0.870361328125, 0.90924072265625, 0.9481201171875, 0.98699951171875, 1.02587890625, 1.06475830078125, 1.1036376953125, 1.14251708984375, 1.181396484375, 1.22027587890625, 1.2591552734375, 1.29803466796875, 1.3369140625]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 2.0, 3.0, 6.0, 3.0, 8.0, 10.0, 9.0, 12.0, 11.0, 24.0, 19.0, 19.0, 27.0, 14.0, 30.0, 26.0, 27.0, 32.0, 20.0, 40.0, 31.0, 33.0, 43.0, 29.0, 1059.0, 33.0, 29.0, 42.0, 31.0, 37.0, 27.0, 26.0, 26.0, 32.0, 15.0, 27.0, 24.0, 21.0, 18.0, 17.0, 10.0, 19.0, 11.0, 9.0, 9.0, 10.0, 4.0, 2.0, 9.0, 3.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0], "bins": [-13.515625, -13.1043701171875, -12.693115234375, -12.2818603515625, -11.87060546875, -11.4593505859375, -11.048095703125, -10.6368408203125, -10.2255859375, -9.8143310546875, -9.403076171875, -8.9918212890625, -8.58056640625, -8.1693115234375, -7.758056640625, -7.3468017578125, -6.935546875, -6.5242919921875, -6.113037109375, -5.7017822265625, -5.29052734375, -4.8792724609375, -4.468017578125, -4.0567626953125, -3.6455078125, -3.2342529296875, -2.822998046875, -2.4117431640625, -2.00048828125, -1.5892333984375, -1.177978515625, -0.7667236328125, -0.35546875, 0.0557861328125, 0.467041015625, 0.8782958984375, 1.28955078125, 1.7008056640625, 2.112060546875, 2.5233154296875, 2.9345703125, 3.3458251953125, 3.757080078125, 4.1683349609375, 4.57958984375, 4.9908447265625, 5.402099609375, 5.8133544921875, 6.224609375, 6.6358642578125, 7.047119140625, 7.4583740234375, 7.86962890625, 8.2808837890625, 8.692138671875, 9.1033935546875, 9.5146484375, 9.9259033203125, 10.337158203125, 10.7484130859375, 11.15966796875, 11.5709228515625, 11.982177734375, 12.3934326171875, 12.8046875]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 7.0, 14.0, 21.0, 28.0, 42.0, 58.0, 90.0, 124.0, 200.0, 280.0, 374.0, 548.0, 817.0, 1126.0, 1481.0, 2118.0, 2954.0, 4053.0, 5421.0, 7665.0, 10535.0, 14534.0, 20195.0, 28110.0, 40869.0, 60163.0, 92199.0, 143186.0, 1228637.0, 140974.0, 91064.0, 59136.0, 40444.0, 27835.0, 20117.0, 14371.0, 10152.0, 7431.0, 5600.0, 4056.0, 2834.0, 2087.0, 1498.0, 1108.0, 766.0, 574.0, 390.0, 283.0, 179.0, 129.0, 84.0, 62.0, 48.0, 28.0, 18.0, 11.0, 4.0, 6.0, 5.0, 1.0, 1.0], "bins": [-0.7568359375, -0.7327957153320312, -0.7087554931640625, -0.6847152709960938, -0.660675048828125, -0.6366348266601562, -0.6125946044921875, -0.5885543823242188, -0.56451416015625, -0.5404739379882812, -0.5164337158203125, -0.49239349365234375, -0.468353271484375, -0.44431304931640625, -0.4202728271484375, -0.39623260498046875, -0.3721923828125, -0.34815216064453125, -0.3241119384765625, -0.30007171630859375, -0.276031494140625, -0.25199127197265625, -0.2279510498046875, -0.20391082763671875, -0.17987060546875, -0.15583038330078125, -0.1317901611328125, -0.10774993896484375, -0.083709716796875, -0.05966949462890625, -0.0356292724609375, -0.01158905029296875, 0.012451171875, 0.03649139404296875, 0.0605316162109375, 0.08457183837890625, 0.108612060546875, 0.13265228271484375, 0.1566925048828125, 0.18073272705078125, 0.20477294921875, 0.22881317138671875, 0.2528533935546875, 0.27689361572265625, 0.300933837890625, 0.32497406005859375, 0.3490142822265625, 0.37305450439453125, 0.3970947265625, 0.42113494873046875, 0.4451751708984375, 0.46921539306640625, 0.493255615234375, 0.5172958374023438, 0.5413360595703125, 0.5653762817382812, 0.58941650390625, 0.6134567260742188, 0.6374969482421875, 0.6615371704101562, 0.685577392578125, 0.7096176147460938, 0.7336578369140625, 0.7576980590820312, 0.78173828125]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 7.0, 4.0, 5.0, 7.0, 13.0, 8.0, 7.0, 21.0, 15.0, 19.0, 31.0, 29.0, 35.0, 34.0, 37.0, 43.0, 46.0, 64.0, 54.0, 45.0, 65.0, 48.0, 46.0, 46.0, 35.0, 29.0, 34.0, 25.0, 30.0, 17.0, 13.0, 17.0, 11.0, 9.0, 10.0, 8.0, 8.0, 9.0, 4.0, 2.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.003765106201171875, -0.003645479679107666, -0.003525853157043457, -0.003406226634979248, -0.003286600112915039, -0.00316697359085083, -0.003047347068786621, -0.002927720546722412, -0.002808094024658203, -0.002688467502593994, -0.002568840980529785, -0.002449214458465576, -0.002329587936401367, -0.002209961414337158, -0.0020903348922729492, -0.0019707083702087402, -0.0018510818481445312, -0.0017314553260803223, -0.0016118288040161133, -0.0014922022819519043, -0.0013725757598876953, -0.0012529492378234863, -0.0011333227157592773, -0.0010136961936950684, -0.0008940696716308594, -0.0007744431495666504, -0.0006548166275024414, -0.0005351901054382324, -0.00041556358337402344, -0.00029593706130981445, -0.00017631053924560547, -5.6684017181396484e-05, 6.29425048828125e-05, 0.00018256902694702148, 0.00030219554901123047, 0.00042182207107543945, 0.0005414485931396484, 0.0006610751152038574, 0.0007807016372680664, 0.0009003281593322754, 0.0010199546813964844, 0.0011395812034606934, 0.0012592077255249023, 0.0013788342475891113, 0.0014984607696533203, 0.0016180872917175293, 0.0017377138137817383, 0.0018573403358459473, 0.0019769668579101562, 0.0020965933799743652, 0.0022162199020385742, 0.002335846424102783, 0.002455472946166992, 0.002575099468231201, 0.00269472599029541, 0.002814352512359619, 0.002933979034423828, 0.003053605556488037, 0.003173232078552246, 0.003292858600616455, 0.003412485122680664, 0.003532111644744873, 0.003651738166809082, 0.003771364688873291, 0.0038909912109375]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 4.0, 3.0, 10.0, 10.0, 7.0, 15.0, 7.0, 21.0, 16.0, 19.0, 25.0, 42.0, 58.0, 55.0, 59.0, 91.0, 149.0, 212.0, 520.0, 5961.0, 915115.0, 123807.0, 1313.0, 317.0, 171.0, 121.0, 97.0, 76.0, 51.0, 41.0, 36.0, 23.0, 21.0, 20.0, 9.0, 12.0, 6.0, 4.0, 11.0, 5.0, 8.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.08203125, -0.07952880859375, -0.0770263671875, -0.07452392578125, -0.072021484375, -0.06951904296875, -0.0670166015625, -0.06451416015625, -0.06201171875, -0.05950927734375, -0.0570068359375, -0.05450439453125, -0.052001953125, -0.04949951171875, -0.0469970703125, -0.04449462890625, -0.0419921875, -0.03948974609375, -0.0369873046875, -0.03448486328125, -0.031982421875, -0.02947998046875, -0.0269775390625, -0.02447509765625, -0.02197265625, -0.01947021484375, -0.0169677734375, -0.01446533203125, -0.011962890625, -0.00946044921875, -0.0069580078125, -0.00445556640625, -0.001953125, 0.00054931640625, 0.0030517578125, 0.00555419921875, 0.008056640625, 0.01055908203125, 0.0130615234375, 0.01556396484375, 0.01806640625, 0.02056884765625, 0.0230712890625, 0.02557373046875, 0.028076171875, 0.03057861328125, 0.0330810546875, 0.03558349609375, 0.0380859375, 0.04058837890625, 0.0430908203125, 0.04559326171875, 0.048095703125, 0.05059814453125, 0.0531005859375, 0.05560302734375, 0.05810546875, 0.06060791015625, 0.0631103515625, 0.06561279296875, 0.068115234375, 0.07061767578125, 0.0731201171875, 0.07562255859375, 0.078125]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 58.0, 716.0, 224.0, 17.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.043926455080509186, -0.04316602647304535, -0.042405594140291214, -0.04164516553282738, -0.04088473320007324, -0.040124304592609406, -0.03936387598514557, -0.038603443652391434, -0.0378430150449276, -0.03708258643746376, -0.036322154104709625, -0.03556172549724579, -0.03480129316449165, -0.03404086455702782, -0.03328043222427368, -0.032520003616809845, -0.03175957128405571, -0.030999140813946724, -0.030238710343837738, -0.0294782817363739, -0.028717851266264915, -0.02795742079615593, -0.027196990326046944, -0.026436559855937958, -0.02567613124847412, -0.024915700778365135, -0.02415527030825615, -0.023394841700792313, -0.022634411230683327, -0.02187398076057434, -0.021113550290465355, -0.02035311982035637, -0.019592689350247383, -0.018832258880138397, -0.01807182841002941, -0.017311397939920425, -0.01655096933245659, -0.015790538862347603, -0.015030108392238617, -0.014269677922129631, -0.013509247452020645, -0.01274881698191166, -0.011988387443125248, -0.011227956973016262, -0.010467526502907276, -0.009707096964120865, -0.008946666494011879, -0.008186236023902893, -0.0074258060194551945, -0.006665376015007496, -0.00590494554489851, -0.005144515540450811, -0.004384085536003113, -0.003623655065894127, -0.0028632250614464283, -0.0021027945913374424, -0.0013423645868897438, -0.0005819344078190625, 0.00017849577125161886, 0.0009389258921146393, 0.0016993561293929815, 0.0024597863666713238, 0.0032202163711190224, 0.003980646841228008, 0.004741076845675707]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 15.0, 10.0, 13.0, 14.0, 12.0, 12.0, 16.0, 23.0, 31.0, 35.0, 32.0, 37.0, 38.0, 32.0, 38.0, 35.0, 40.0, 35.0, 49.0, 60.0, 42.0, 36.0, 36.0, 35.0, 34.0, 33.0, 28.0, 25.0, 23.0, 15.0, 24.0, 12.0, 13.0, 14.0, 12.0, 8.0, 5.0, 9.0, 8.0, 2.0, 1.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.002417266368865967, -0.0023432783782482147, -0.0022692903876304626, -0.0021953023970127106, -0.0021213144063949585, -0.0020473264157772064, -0.0019733384251594543, -0.0018993504345417023, -0.0018253624439239502, -0.0017513744533061981, -0.001677386462688446, -0.001603398472070694, -0.001529410481452942, -0.0014554224908351898, -0.0013814345002174377, -0.0013074465095996857, -0.0012334585189819336, -0.0011594705283641815, -0.0010854825377464294, -0.0010114945471286774, -0.0009375065565109253, -0.0008635185658931732, -0.0007895305752754211, -0.0007155425846576691, -0.000641554594039917, -0.0005675666034221649, -0.0004935786128044128, -0.00041959062218666077, -0.0003456026315689087, -0.0002716146409511566, -0.00019762665033340454, -0.00012363865971565247, -4.965066909790039e-05, 2.4337321519851685e-05, 9.832531213760376e-05, 0.00017231330275535583, 0.0002463012933731079, 0.00032028928399086, 0.00039427727460861206, 0.00046826526522636414, 0.0005422532558441162, 0.0006162412464618683, 0.0006902292370796204, 0.0007642172276973724, 0.0008382052183151245, 0.0009121932089328766, 0.0009861811995506287, 0.0010601691901683807, 0.0011341571807861328, 0.0012081451714038849, 0.001282133162021637, 0.001356121152639389, 0.0014301091432571411, 0.0015040971338748932, 0.0015780851244926453, 0.0016520731151103973, 0.0017260611057281494, 0.0018000490963459015, 0.0018740370869636536, 0.0019480250775814056, 0.0020220130681991577, 0.00209600105881691, 0.002169989049434662, 0.002243977040052414, 0.002317965030670166]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 0.0, 3.0, 2.0, 4.0, 6.0, 4.0, 6.0, 6.0, 6.0, 13.0, 15.0, 11.0, 15.0, 19.0, 24.0, 19.0, 28.0, 28.0, 31.0, 39.0, 39.0, 38.0, 34.0, 36.0, 50.0, 42.0, 58.0, 43.0, 44.0, 37.0, 27.0, 24.0, 29.0, 38.0, 25.0, 25.0, 20.0, 28.0, 15.0, 18.0, 14.0, 9.0, 4.0, 7.0, 6.0, 6.0, 5.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.75, -20.02392578125, -19.2978515625, -18.57177734375, -17.845703125, -17.11962890625, -16.3935546875, -15.66748046875, -14.94140625, -14.21533203125, -13.4892578125, -12.76318359375, -12.037109375, -11.31103515625, -10.5849609375, -9.85888671875, -9.1328125, -8.40673828125, -7.6806640625, -6.95458984375, -6.228515625, -5.50244140625, -4.7763671875, -4.05029296875, -3.32421875, -2.59814453125, -1.8720703125, -1.14599609375, -0.419921875, 0.30615234375, 1.0322265625, 1.75830078125, 2.484375, 3.21044921875, 3.9365234375, 4.66259765625, 5.388671875, 6.11474609375, 6.8408203125, 7.56689453125, 8.29296875, 9.01904296875, 9.7451171875, 10.47119140625, 11.197265625, 11.92333984375, 12.6494140625, 13.37548828125, 14.1015625, 14.82763671875, 15.5537109375, 16.27978515625, 17.005859375, 17.73193359375, 18.4580078125, 19.18408203125, 19.91015625, 20.63623046875, 21.3623046875, 22.08837890625, 22.814453125, 23.54052734375, 24.2666015625, 24.99267578125, 25.71875]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 2.0, 8.0, 5.0, 5.0, 11.0, 11.0, 18.0, 15.0, 21.0, 28.0, 35.0, 46.0, 52.0, 76.0, 100.0, 134.0, 220.0, 387.0, 687.0, 1344.0, 3133.0, 8332.0, 25668.0, 98114.0, 589222.0, 246768.0, 49794.0, 14673.0, 5208.0, 1993.0, 958.0, 522.0, 274.0, 180.0, 133.0, 89.0, 67.0, 61.0, 35.0, 26.0, 22.0, 19.0, 19.0, 9.0, 13.0, 6.0, 4.0, 3.0, 4.0, 6.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.171875, -22.3662109375, -21.560546875, -20.7548828125, -19.94921875, -19.1435546875, -18.337890625, -17.5322265625, -16.7265625, -15.9208984375, -15.115234375, -14.3095703125, -13.50390625, -12.6982421875, -11.892578125, -11.0869140625, -10.28125, -9.4755859375, -8.669921875, -7.8642578125, -7.05859375, -6.2529296875, -5.447265625, -4.6416015625, -3.8359375, -3.0302734375, -2.224609375, -1.4189453125, -0.61328125, 0.1923828125, 0.998046875, 1.8037109375, 2.609375, 3.4150390625, 4.220703125, 5.0263671875, 5.83203125, 6.6376953125, 7.443359375, 8.2490234375, 9.0546875, 9.8603515625, 10.666015625, 11.4716796875, 12.27734375, 13.0830078125, 13.888671875, 14.6943359375, 15.5, 16.3056640625, 17.111328125, 17.9169921875, 18.72265625, 19.5283203125, 20.333984375, 21.1396484375, 21.9453125, 22.7509765625, 23.556640625, 24.3623046875, 25.16796875, 25.9736328125, 26.779296875, 27.5849609375, 28.390625]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 1.0, 3.0, 5.0, 5.0, 3.0, 3.0, 7.0, 7.0, 13.0, 10.0, 13.0, 16.0, 20.0, 22.0, 24.0, 28.0, 41.0, 36.0, 34.0, 27.0, 37.0, 39.0, 73.0, 123.0, 1737.0, 231.0, 86.0, 42.0, 50.0, 28.0, 34.0, 36.0, 23.0, 40.0, 20.0, 23.0, 20.0, 21.0, 15.0, 9.0, 10.0, 7.0, 7.0, 4.0, 5.0, 5.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-62.9375, -61.009765625, -59.08203125, -57.154296875, -55.2265625, -53.298828125, -51.37109375, -49.443359375, -47.515625, -45.587890625, -43.66015625, -41.732421875, -39.8046875, -37.876953125, -35.94921875, -34.021484375, -32.09375, -30.166015625, -28.23828125, -26.310546875, -24.3828125, -22.455078125, -20.52734375, -18.599609375, -16.671875, -14.744140625, -12.81640625, -10.888671875, -8.9609375, -7.033203125, -5.10546875, -3.177734375, -1.25, 0.677734375, 2.60546875, 4.533203125, 6.4609375, 8.388671875, 10.31640625, 12.244140625, 14.171875, 16.099609375, 18.02734375, 19.955078125, 21.8828125, 23.810546875, 25.73828125, 27.666015625, 29.59375, 31.521484375, 33.44921875, 35.376953125, 37.3046875, 39.232421875, 41.16015625, 43.087890625, 45.015625, 46.943359375, 48.87109375, 50.798828125, 52.7265625, 54.654296875, 56.58203125, 58.509765625, 60.4375]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 0.0, 4.0, 1.0, 5.0, 8.0, 7.0, 9.0, 10.0, 22.0, 14.0, 33.0, 41.0, 51.0, 66.0, 93.0, 98.0, 144.0, 217.0, 388.0, 1046.0, 26141.0, 3107368.0, 8081.0, 707.0, 317.0, 195.0, 164.0, 127.0, 66.0, 69.0, 62.0, 27.0, 33.0, 19.0, 21.0, 14.0, 9.0, 7.0, 13.0, 1.0, 2.0, 7.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-156.375, -151.392578125, -146.41015625, -141.427734375, -136.4453125, -131.462890625, -126.48046875, -121.498046875, -116.515625, -111.533203125, -106.55078125, -101.568359375, -96.5859375, -91.603515625, -86.62109375, -81.638671875, -76.65625, -71.673828125, -66.69140625, -61.708984375, -56.7265625, -51.744140625, -46.76171875, -41.779296875, -36.796875, -31.814453125, -26.83203125, -21.849609375, -16.8671875, -11.884765625, -6.90234375, -1.919921875, 3.0625, 8.044921875, 13.02734375, 18.009765625, 22.9921875, 27.974609375, 32.95703125, 37.939453125, 42.921875, 47.904296875, 52.88671875, 57.869140625, 62.8515625, 67.833984375, 72.81640625, 77.798828125, 82.78125, 87.763671875, 92.74609375, 97.728515625, 102.7109375, 107.693359375, 112.67578125, 117.658203125, 122.640625, 127.623046875, 132.60546875, 137.587890625, 142.5703125, 147.552734375, 152.53515625, 157.517578125, 162.5]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 9.0, 12.0, 22.0, 36.0, 66.0, 113.0, 183.0, 191.0, 167.0, 112.0, 56.0, 24.0, 14.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-101.19904327392578, -98.8675537109375, -96.53605651855469, -94.2045669555664, -91.8730697631836, -89.54158020019531, -87.2100830078125, -84.87859344482422, -82.54710388183594, -80.21561431884766, -77.88411712646484, -75.55262756347656, -73.22113037109375, -70.88964080810547, -68.55815124511719, -66.22665405273438, -63.89516067504883, -61.56366729736328, -59.232173919677734, -56.90068054199219, -54.569190979003906, -52.23769760131836, -49.90620422363281, -47.57471466064453, -45.24321746826172, -42.91172409057617, -40.580230712890625, -38.248741149902344, -35.9172477722168, -33.58575439453125, -31.254261016845703, -28.92276954650879, -26.59127426147461, -24.259780883789062, -21.92828941345215, -19.5967960357666, -17.265304565429688, -14.93381118774414, -12.602317810058594, -10.27082633972168, -7.939332962036133, -5.607840538024902, -3.2763476371765137, -0.944854736328125, 1.3866376876831055, 3.718130111694336, 6.049623489379883, 8.381114959716797, 10.712608337402344, 13.044100761413574, 15.375593185424805, 17.70708656311035, 20.038578033447266, 22.370071411132812, 24.70156478881836, 27.033056259155273, 29.36454963684082, 31.696043014526367, 34.02753448486328, 36.35902786254883, 38.690521240234375, 41.022010803222656, 43.35350799560547, 45.68499755859375, 48.0164909362793]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 5.0, 3.0, 8.0, 6.0, 4.0, 12.0, 15.0, 25.0, 16.0, 24.0, 25.0, 22.0, 29.0, 30.0, 29.0, 36.0, 41.0, 47.0, 53.0, 48.0, 40.0, 48.0, 35.0, 37.0, 34.0, 36.0, 21.0, 46.0, 41.0, 22.0, 22.0, 19.0, 19.0, 17.0, 18.0, 16.0, 13.0, 8.0, 14.0, 8.0, 2.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-175.55494689941406, -170.40106201171875, -165.24716186523438, -160.09326171875, -154.9393768310547, -149.78549194335938, -144.631591796875, -139.47769165039062, -134.3238067626953, -129.169921875, -124.01602172851562, -118.86212921142578, -113.70823669433594, -108.5543441772461, -103.40045166015625, -98.2465591430664, -93.09266662597656, -87.93877410888672, -82.78488159179688, -77.63098907470703, -72.47709655761719, -67.32320404052734, -62.1693115234375, -57.015419006347656, -51.86152648925781, -46.70763397216797, -41.553741455078125, -36.39984893798828, -31.245956420898438, -26.092063903808594, -20.93817138671875, -15.784278869628906, -10.630386352539062, -5.476493835449219, -0.322601318359375, 4.831291198730469, 9.985183715820312, 15.139076232910156, 20.29296875, 25.446861267089844, 30.600753784179688, 35.75464630126953, 40.908538818359375, 46.06243133544922, 51.21632385253906, 56.370216369628906, 61.52410888671875, 66.6780014038086, 71.83189392089844, 76.98578643798828, 82.13967895507812, 87.29357147216797, 92.44746398925781, 97.60135650634766, 102.7552490234375, 107.90914154052734, 113.06303405761719, 118.21692657470703, 123.37081909179688, 128.52471923828125, 133.67860412597656, 138.83248901367188, 143.98638916015625, 149.14028930664062, 154.29417419433594]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 4.0, 6.0, 5.0, 7.0, 2.0, 10.0, 7.0, 16.0, 13.0, 16.0, 16.0, 24.0, 14.0, 33.0, 19.0, 35.0, 41.0, 39.0, 35.0, 43.0, 51.0, 46.0, 45.0, 49.0, 35.0, 42.0, 33.0, 41.0, 40.0, 28.0, 29.0, 20.0, 34.0, 18.0, 16.0, 22.0, 14.0, 18.0, 8.0, 6.0, 5.0, 5.0, 4.0, 5.0, 3.0, 0.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.796875, -22.02685546875, -21.2568359375, -20.48681640625, -19.716796875, -18.94677734375, -18.1767578125, -17.40673828125, -16.63671875, -15.86669921875, -15.0966796875, -14.32666015625, -13.556640625, -12.78662109375, -12.0166015625, -11.24658203125, -10.4765625, -9.70654296875, -8.9365234375, -8.16650390625, -7.396484375, -6.62646484375, -5.8564453125, -5.08642578125, -4.31640625, -3.54638671875, -2.7763671875, -2.00634765625, -1.236328125, -0.46630859375, 0.3037109375, 1.07373046875, 1.84375, 2.61376953125, 3.3837890625, 4.15380859375, 4.923828125, 5.69384765625, 6.4638671875, 7.23388671875, 8.00390625, 8.77392578125, 9.5439453125, 10.31396484375, 11.083984375, 11.85400390625, 12.6240234375, 13.39404296875, 14.1640625, 14.93408203125, 15.7041015625, 16.47412109375, 17.244140625, 18.01416015625, 18.7841796875, 19.55419921875, 20.32421875, 21.09423828125, 21.8642578125, 22.63427734375, 23.404296875, 24.17431640625, 24.9443359375, 25.71435546875, 26.484375]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 7.0, 6.0, 5.0, 10.0, 7.0, 20.0, 20.0, 19.0, 34.0, 39.0, 52.0, 71.0, 85.0, 170.0, 274.0, 477.0, 1065.0, 2764.0, 10552.0, 304313.0, 3736005.0, 125767.0, 7934.0, 2334.0, 986.0, 467.0, 253.0, 161.0, 84.0, 67.0, 57.0, 44.0, 27.0, 30.0, 19.0, 13.0, 8.0, 8.0, 5.0, 7.0, 4.0, 5.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-79.625, -76.9169921875, -74.208984375, -71.5009765625, -68.79296875, -66.0849609375, -63.376953125, -60.6689453125, -57.9609375, -55.2529296875, -52.544921875, -49.8369140625, -47.12890625, -44.4208984375, -41.712890625, -39.0048828125, -36.296875, -33.5888671875, -30.880859375, -28.1728515625, -25.46484375, -22.7568359375, -20.048828125, -17.3408203125, -14.6328125, -11.9248046875, -9.216796875, -6.5087890625, -3.80078125, -1.0927734375, 1.615234375, 4.3232421875, 7.03125, 9.7392578125, 12.447265625, 15.1552734375, 17.86328125, 20.5712890625, 23.279296875, 25.9873046875, 28.6953125, 31.4033203125, 34.111328125, 36.8193359375, 39.52734375, 42.2353515625, 44.943359375, 47.6513671875, 50.359375, 53.0673828125, 55.775390625, 58.4833984375, 61.19140625, 63.8994140625, 66.607421875, 69.3154296875, 72.0234375, 74.7314453125, 77.439453125, 80.1474609375, 82.85546875, 85.5634765625, 88.271484375, 90.9794921875, 93.6875]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 3.0, 2.0, 11.0, 6.0, 6.0, 8.0, 9.0, 22.0, 28.0, 26.0, 57.0, 115.0, 211.0, 390.0, 847.0, 1030.0, 619.0, 310.0, 122.0, 92.0, 44.0, 26.0, 21.0, 23.0, 15.0, 8.0, 8.0, 3.0, 4.0, 5.0, 5.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-72.0, -70.255859375, -68.51171875, -66.767578125, -65.0234375, -63.279296875, -61.53515625, -59.791015625, -58.046875, -56.302734375, -54.55859375, -52.814453125, -51.0703125, -49.326171875, -47.58203125, -45.837890625, -44.09375, -42.349609375, -40.60546875, -38.861328125, -37.1171875, -35.373046875, -33.62890625, -31.884765625, -30.140625, -28.396484375, -26.65234375, -24.908203125, -23.1640625, -21.419921875, -19.67578125, -17.931640625, -16.1875, -14.443359375, -12.69921875, -10.955078125, -9.2109375, -7.466796875, -5.72265625, -3.978515625, -2.234375, -0.490234375, 1.25390625, 2.998046875, 4.7421875, 6.486328125, 8.23046875, 9.974609375, 11.71875, 13.462890625, 15.20703125, 16.951171875, 18.6953125, 20.439453125, 22.18359375, 23.927734375, 25.671875, 27.416015625, 29.16015625, 30.904296875, 32.6484375, 34.392578125, 36.13671875, 37.880859375, 39.625]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 6.0, 4.0, 6.0, 2.0, 8.0, 11.0, 13.0, 16.0, 28.0, 41.0, 80.0, 143.0, 252.0, 720.0, 4355.0, 157686.0, 4015854.0, 12919.0, 1335.0, 397.0, 189.0, 77.0, 46.0, 23.0, 25.0, 14.0, 6.0, 7.0, 7.0, 8.0, 1.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-196.25, -187.79296875, -179.3359375, -170.87890625, -162.421875, -153.96484375, -145.5078125, -137.05078125, -128.59375, -120.13671875, -111.6796875, -103.22265625, -94.765625, -86.30859375, -77.8515625, -69.39453125, -60.9375, -52.48046875, -44.0234375, -35.56640625, -27.109375, -18.65234375, -10.1953125, -1.73828125, 6.71875, 15.17578125, 23.6328125, 32.08984375, 40.546875, 49.00390625, 57.4609375, 65.91796875, 74.375, 82.83203125, 91.2890625, 99.74609375, 108.203125, 116.66015625, 125.1171875, 133.57421875, 142.03125, 150.48828125, 158.9453125, 167.40234375, 175.859375, 184.31640625, 192.7734375, 201.23046875, 209.6875, 218.14453125, 226.6015625, 235.05859375, 243.515625, 251.97265625, 260.4296875, 268.88671875, 277.34375, 285.80078125, 294.2578125, 302.71484375, 311.171875, 319.62890625, 328.0859375, 336.54296875, 345.0]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 9.0, 18.0, 47.0, 99.0, 272.0, 319.0, 149.0, 50.0, 28.0, 7.0, 11.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-116.67606353759766, -105.22722625732422, -93.77838897705078, -82.32955932617188, -70.88072204589844, -59.431880950927734, -47.98304748535156, -36.534210205078125, -25.085372924804688, -13.636536598205566, -2.1877002716064453, 9.26113510131836, 20.709972381591797, 32.158809661865234, 43.607643127441406, 55.056480407714844, 66.50531768798828, 77.95415496826172, 89.40299224853516, 100.85182189941406, 112.3006591796875, 123.74949645996094, 135.19833374023438, 146.6471710205078, 158.09600830078125, 169.5448455810547, 180.99368286132812, 192.44252014160156, 203.891357421875, 215.34019470214844, 226.78903198242188, 238.23785400390625, 249.68667602539062, 261.135498046875, 272.5843505859375, 284.0331726074219, 295.4820251464844, 306.93084716796875, 318.37969970703125, 329.8285217285156, 341.2773742675781, 352.7261962890625, 364.175048828125, 375.6238708496094, 387.0727233886719, 398.52154541015625, 409.97039794921875, 421.4192199707031, 432.8680419921875, 444.3168640136719, 455.7657165527344, 467.21453857421875, 478.66339111328125, 490.1122131347656, 501.5610656738281, 513.0098876953125, 524.458740234375, 535.9075927734375, 547.3563842773438, 558.8052368164062, 570.2540893554688, 581.7029418945312, 593.1517333984375, 604.6005859375, 616.0494384765625]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 6.0, 4.0, 7.0, 14.0, 7.0, 10.0, 17.0, 14.0, 13.0, 19.0, 16.0, 24.0, 29.0, 29.0, 33.0, 37.0, 35.0, 40.0, 36.0, 36.0, 30.0, 29.0, 36.0, 46.0, 37.0, 45.0, 39.0, 32.0, 32.0, 34.0, 24.0, 34.0, 25.0, 21.0, 17.0, 15.0, 11.0, 19.0, 12.0, 10.0, 7.0, 7.0, 6.0, 6.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-123.71678161621094, -120.2337417602539, -116.75070190429688, -113.26766204833984, -109.78462219238281, -106.30157470703125, -102.81854248046875, -99.33549499511719, -95.85245513916016, -92.36941528320312, -88.8863754272461, -85.40333557128906, -81.92029571533203, -78.437255859375, -74.95420837402344, -71.4711685180664, -67.98812866210938, -64.50508880615234, -61.02204895019531, -57.53900909423828, -54.055965423583984, -50.57292556762695, -47.08988571166992, -43.606842041015625, -40.123809814453125, -36.640769958496094, -33.15773010253906, -29.6746883392334, -26.191646575927734, -22.708606719970703, -19.225566864013672, -15.742525100708008, -12.259483337402344, -8.776442527770996, -5.293402194976807, -1.8103618621826172, 1.6726789474487305, 5.155719757080078, 8.63875961303711, 12.121801376342773, 15.604841232299805, 19.087881088256836, 22.5709228515625, 26.05396270751953, 29.537002563476562, 33.020042419433594, 36.503082275390625, 39.98612594604492, 43.46916580200195, 46.952205657958984, 50.435245513916016, 53.91828918457031, 57.401329040527344, 60.884368896484375, 64.3674087524414, 67.85044860839844, 71.33348846435547, 74.8165283203125, 78.29956817626953, 81.78260803222656, 85.2656478881836, 88.74868774414062, 92.23173522949219, 95.71477508544922, 99.19781494140625]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 11.0, 8.0, 7.0, 7.0, 14.0, 11.0, 19.0, 23.0, 10.0, 16.0, 28.0, 37.0, 29.0, 43.0, 38.0, 27.0, 36.0, 53.0, 46.0, 38.0, 39.0, 42.0, 42.0, 38.0, 44.0, 36.0, 31.0, 29.0, 27.0, 23.0, 25.0, 23.0, 25.0, 11.0, 17.0, 8.0, 12.0, 7.0, 3.0, 6.0, 2.0, 3.0, 2.0, 1.0, 4.0, 2.0, 4.0, 0.0, 0.0, 0.0, 3.0], "bins": [-25.234375, -24.470947265625, -23.70751953125, -22.944091796875, -22.1806640625, -21.417236328125, -20.65380859375, -19.890380859375, -19.126953125, -18.363525390625, -17.60009765625, -16.836669921875, -16.0732421875, -15.309814453125, -14.54638671875, -13.782958984375, -13.01953125, -12.256103515625, -11.49267578125, -10.729248046875, -9.9658203125, -9.202392578125, -8.43896484375, -7.675537109375, -6.912109375, -6.148681640625, -5.38525390625, -4.621826171875, -3.8583984375, -3.094970703125, -2.33154296875, -1.568115234375, -0.8046875, -0.041259765625, 0.72216796875, 1.485595703125, 2.2490234375, 3.012451171875, 3.77587890625, 4.539306640625, 5.302734375, 6.066162109375, 6.82958984375, 7.593017578125, 8.3564453125, 9.119873046875, 9.88330078125, 10.646728515625, 11.41015625, 12.173583984375, 12.93701171875, 13.700439453125, 14.4638671875, 15.227294921875, 15.99072265625, 16.754150390625, 17.517578125, 18.281005859375, 19.04443359375, 19.807861328125, 20.5712890625, 21.334716796875, 22.09814453125, 22.861572265625, 23.625]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 9.0, 12.0, 16.0, 28.0, 37.0, 59.0, 72.0, 112.0, 156.0, 228.0, 330.0, 469.0, 684.0, 1041.0, 1419.0, 2082.0, 3021.0, 4607.0, 6762.0, 10314.0, 15848.0, 24395.0, 38287.0, 61443.0, 100068.0, 168147.0, 215668.0, 149730.0, 89831.0, 54813.0, 34180.0, 21844.0, 14232.0, 9347.0, 6213.0, 4176.0, 2741.0, 1911.0, 1285.0, 879.0, 584.0, 432.0, 309.0, 211.0, 163.0, 118.0, 76.0, 52.0, 39.0, 27.0, 22.0, 8.0, 10.0, 5.0, 6.0, 4.0, 1.0, 2.0], "bins": [-1.1171875, -1.0826873779296875, -1.048187255859375, -1.0136871337890625, -0.97918701171875, -0.9446868896484375, -0.910186767578125, -0.8756866455078125, -0.8411865234375, -0.8066864013671875, -0.772186279296875, -0.7376861572265625, -0.70318603515625, -0.6686859130859375, -0.634185791015625, -0.5996856689453125, -0.565185546875, -0.5306854248046875, -0.496185302734375, -0.4616851806640625, -0.42718505859375, -0.3926849365234375, -0.358184814453125, -0.3236846923828125, -0.2891845703125, -0.2546844482421875, -0.220184326171875, -0.1856842041015625, -0.15118408203125, -0.1166839599609375, -0.082183837890625, -0.0476837158203125, -0.01318359375, 0.0213165283203125, 0.055816650390625, 0.0903167724609375, 0.12481689453125, 0.1593170166015625, 0.193817138671875, 0.2283172607421875, 0.2628173828125, 0.2973175048828125, 0.331817626953125, 0.3663177490234375, 0.40081787109375, 0.4353179931640625, 0.469818115234375, 0.5043182373046875, 0.538818359375, 0.5733184814453125, 0.607818603515625, 0.6423187255859375, 0.67681884765625, 0.7113189697265625, 0.745819091796875, 0.7803192138671875, 0.8148193359375, 0.8493194580078125, 0.883819580078125, 0.9183197021484375, 0.95281982421875, 0.9873199462890625, 1.021820068359375, 1.0563201904296875, 1.0908203125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 9.0, 6.0, 6.0, 5.0, 4.0, 11.0, 12.0, 13.0, 15.0, 16.0, 24.0, 18.0, 23.0, 23.0, 26.0, 30.0, 36.0, 38.0, 45.0, 44.0, 39.0, 51.0, 1066.0, 41.0, 38.0, 38.0, 27.0, 44.0, 35.0, 18.0, 20.0, 27.0, 32.0, 19.0, 14.0, 20.0, 19.0, 14.0, 10.0, 13.0, 4.0, 8.0, 6.0, 4.0, 8.0, 1.0, 7.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-15.03125, -14.556640625, -14.08203125, -13.607421875, -13.1328125, -12.658203125, -12.18359375, -11.708984375, -11.234375, -10.759765625, -10.28515625, -9.810546875, -9.3359375, -8.861328125, -8.38671875, -7.912109375, -7.4375, -6.962890625, -6.48828125, -6.013671875, -5.5390625, -5.064453125, -4.58984375, -4.115234375, -3.640625, -3.166015625, -2.69140625, -2.216796875, -1.7421875, -1.267578125, -0.79296875, -0.318359375, 0.15625, 0.630859375, 1.10546875, 1.580078125, 2.0546875, 2.529296875, 3.00390625, 3.478515625, 3.953125, 4.427734375, 4.90234375, 5.376953125, 5.8515625, 6.326171875, 6.80078125, 7.275390625, 7.75, 8.224609375, 8.69921875, 9.173828125, 9.6484375, 10.123046875, 10.59765625, 11.072265625, 11.546875, 12.021484375, 12.49609375, 12.970703125, 13.4453125, 13.919921875, 14.39453125, 14.869140625, 15.34375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 3.0, 6.0, 6.0, 13.0, 18.0, 20.0, 41.0, 83.0, 90.0, 128.0, 182.0, 272.0, 382.0, 529.0, 742.0, 1035.0, 1417.0, 1942.0, 2738.0, 3824.0, 5263.0, 7365.0, 10245.0, 14647.0, 21097.0, 31263.0, 47816.0, 76874.0, 126228.0, 1229350.0, 192514.0, 113530.0, 68809.0, 43502.0, 28498.0, 19228.0, 13644.0, 9632.0, 6676.0, 4949.0, 3502.0, 2593.0, 1750.0, 1383.0, 970.0, 699.0, 505.0, 351.0, 252.0, 188.0, 105.0, 73.0, 64.0, 41.0, 25.0, 18.0, 10.0, 5.0, 6.0, 2.0, 2.0], "bins": [-0.9111328125, -0.8834304809570312, -0.8557281494140625, -0.8280258178710938, -0.800323486328125, -0.7726211547851562, -0.7449188232421875, -0.7172164916992188, -0.68951416015625, -0.6618118286132812, -0.6341094970703125, -0.6064071655273438, -0.578704833984375, -0.5510025024414062, -0.5233001708984375, -0.49559783935546875, -0.4678955078125, -0.44019317626953125, -0.4124908447265625, -0.38478851318359375, -0.357086181640625, -0.32938385009765625, -0.3016815185546875, -0.27397918701171875, -0.24627685546875, -0.21857452392578125, -0.1908721923828125, -0.16316986083984375, -0.135467529296875, -0.10776519775390625, -0.0800628662109375, -0.05236053466796875, -0.024658203125, 0.00304412841796875, 0.0307464599609375, 0.05844879150390625, 0.086151123046875, 0.11385345458984375, 0.1415557861328125, 0.16925811767578125, 0.19696044921875, 0.22466278076171875, 0.2523651123046875, 0.28006744384765625, 0.307769775390625, 0.33547210693359375, 0.3631744384765625, 0.39087677001953125, 0.4185791015625, 0.44628143310546875, 0.4739837646484375, 0.5016860961914062, 0.529388427734375, 0.5570907592773438, 0.5847930908203125, 0.6124954223632812, 0.64019775390625, 0.6679000854492188, 0.6956024169921875, 0.7233047485351562, 0.751007080078125, 0.7787094116210938, 0.8064117431640625, 0.8341140747070312, 0.86181640625]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 4.0, 3.0, 2.0, 7.0, 7.0, 7.0, 13.0, 11.0, 22.0, 10.0, 14.0, 19.0, 25.0, 32.0, 42.0, 45.0, 71.0, 67.0, 66.0, 66.0, 54.0, 68.0, 61.0, 58.0, 48.0, 34.0, 25.0, 23.0, 21.0, 10.0, 21.0, 15.0, 6.0, 3.0, 9.0, 6.0, 0.0, 4.0, 2.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007076263427734375, -0.006861269474029541, -0.006646275520324707, -0.006431281566619873, -0.006216287612915039, -0.006001293659210205, -0.005786299705505371, -0.005571305751800537, -0.005356311798095703, -0.005141317844390869, -0.004926323890686035, -0.004711329936981201, -0.004496335983276367, -0.004281342029571533, -0.004066348075866699, -0.0038513541221618652, -0.0036363601684570312, -0.0034213662147521973, -0.0032063722610473633, -0.0029913783073425293, -0.0027763843536376953, -0.0025613903999328613, -0.0023463964462280273, -0.0021314024925231934, -0.0019164085388183594, -0.0017014145851135254, -0.0014864206314086914, -0.0012714266777038574, -0.0010564327239990234, -0.0008414387702941895, -0.0006264448165893555, -0.0004114508628845215, -0.0001964569091796875, 1.8537044525146484e-05, 0.00023353099822998047, 0.00044852495193481445, 0.0006635189056396484, 0.0008785128593444824, 0.0010935068130493164, 0.0013085007667541504, 0.0015234947204589844, 0.0017384886741638184, 0.0019534826278686523, 0.0021684765815734863, 0.0023834705352783203, 0.0025984644889831543, 0.0028134584426879883, 0.0030284523963928223, 0.0032434463500976562, 0.0034584403038024902, 0.0036734342575073242, 0.003888428211212158, 0.004103422164916992, 0.004318416118621826, 0.00453341007232666, 0.004748404026031494, 0.004963397979736328, 0.005178391933441162, 0.005393385887145996, 0.00560837984085083, 0.005823373794555664, 0.006038367748260498, 0.006253361701965332, 0.006468355655670166, 0.006683349609375]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 3.0, 8.0, 7.0, 3.0, 12.0, 13.0, 19.0, 27.0, 35.0, 40.0, 60.0, 79.0, 122.0, 234.0, 592.0, 21523.0, 1020840.0, 3827.0, 447.0, 219.0, 98.0, 73.0, 73.0, 45.0, 34.0, 19.0, 15.0, 18.0, 17.0, 10.0, 7.0, 10.0, 3.0, 4.0, 4.0, 1.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1536865234375, -0.1487865447998047, -0.14388656616210938, -0.13898658752441406, -0.13408660888671875, -0.12918663024902344, -0.12428665161132812, -0.11938667297363281, -0.1144866943359375, -0.10958671569824219, -0.10468673706054688, -0.09978675842285156, -0.09488677978515625, -0.08998680114746094, -0.08508682250976562, -0.08018684387207031, -0.075286865234375, -0.07038688659667969, -0.06548690795898438, -0.06058692932128906, -0.05568695068359375, -0.05078697204589844, -0.045886993408203125, -0.04098701477050781, -0.0360870361328125, -0.031187057495117188, -0.026287078857421875, -0.021387100219726562, -0.01648712158203125, -0.011587142944335938, -0.006687164306640625, -0.0017871856689453125, 0.00311279296875, 0.008012771606445312, 0.012912750244140625, 0.017812728881835938, 0.02271270751953125, 0.027612686157226562, 0.032512664794921875, 0.03741264343261719, 0.0423126220703125, 0.04721260070800781, 0.052112579345703125, 0.05701255798339844, 0.06191253662109375, 0.06681251525878906, 0.07171249389648438, 0.07661247253417969, 0.081512451171875, 0.08641242980957031, 0.09131240844726562, 0.09621238708496094, 0.10111236572265625, 0.10601234436035156, 0.11091232299804688, 0.11581230163574219, 0.1207122802734375, 0.1256122589111328, 0.13051223754882812, 0.13541221618652344, 0.14031219482421875, 0.14521217346191406, 0.15011215209960938, 0.1550121307373047, 0.159912109375]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 16.0, 987.0, 17.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1968686878681183, -0.19332051277160645, -0.1897723376750946, -0.18622416257858276, -0.18267600238323212, -0.17912782728672028, -0.17557965219020844, -0.1720314770936966, -0.16848330199718475, -0.1649351269006729, -0.16138695180416107, -0.15783877670764923, -0.15429061651229858, -0.15074244141578674, -0.1471942663192749, -0.14364609122276306, -0.14009791612625122, -0.13654974102973938, -0.13300156593322754, -0.1294533908367157, -0.12590523064136505, -0.12235705554485321, -0.11880888044834137, -0.11526070535182953, -0.11171253770589828, -0.10816436260938644, -0.1046161949634552, -0.10106801986694336, -0.09751984477043152, -0.09397166967391968, -0.09042350202798843, -0.08687532693147659, -0.08332715183496475, -0.07977897673845291, -0.07623080909252167, -0.07268263399600983, -0.06913445889949799, -0.06558628380298615, -0.0620381161570549, -0.05848994106054306, -0.05494176968932152, -0.051393598318099976, -0.047845423221588135, -0.04429725185036659, -0.04074907675385475, -0.03720090538263321, -0.03365273028612137, -0.030104558914899826, -0.026556385681033134, -0.023008212447166443, -0.01946003921329975, -0.01591186597943306, -0.012363693676888943, -0.008815521374344826, -0.005267348140478134, -0.0017191749066114426, 0.001828998327255249, 0.005377171561121941, 0.008925344794988632, 0.01247351709753275, 0.016021691262722015, 0.019569862633943558, 0.02311803586781025, 0.02666620910167694, 0.030214382335543633]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 4.0, 9.0, 8.0, 8.0, 14.0, 24.0, 17.0, 31.0, 33.0, 35.0, 48.0, 50.0, 41.0, 42.0, 51.0, 52.0, 52.0, 62.0, 57.0, 51.0, 56.0, 40.0, 31.0, 39.0, 36.0, 24.0, 25.0, 15.0, 12.0, 15.0, 8.0, 5.0, 4.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004563271999359131, -0.004379077814519405, -0.00419488362967968, -0.004010689444839954, -0.003826495260000229, -0.0036423010751605034, -0.003458106890320778, -0.0032739127054810524, -0.003089718520641327, -0.0029055243358016014, -0.002721330150961876, -0.0025371359661221504, -0.002352941781282425, -0.0021687475964426994, -0.001984553411602974, -0.0018003592267632484, -0.001616165041923523, -0.0014319708570837975, -0.001247776672244072, -0.0010635824874043465, -0.000879388302564621, -0.0006951941177248955, -0.00051099993288517, -0.0003268057480454445, -0.000142611563205719, 4.15826216340065e-05, 0.000225776806473732, 0.0004099709913134575, 0.000594165176153183, 0.0007783593609929085, 0.000962553545832634, 0.0011467477306723595, 0.001330941915512085, 0.0015151361003518105, 0.001699330285191536, 0.0018835244700312614, 0.002067718654870987, 0.0022519128397107124, 0.002436107024550438, 0.0026203012093901634, 0.002804495394229889, 0.0029886895790696144, 0.00317288376390934, 0.0033570779487490654, 0.003541272133588791, 0.0037254663184285164, 0.003909660503268242, 0.004093854688107967, 0.004278048872947693, 0.004462243057787418, 0.004646437242627144, 0.004830631427466869, 0.005014825612306595, 0.00519901979714632, 0.005383213981986046, 0.005567408166825771, 0.005751602351665497, 0.005935796536505222, 0.006119990721344948, 0.006304184906184673, 0.006488379091024399, 0.006672573275864124, 0.00685676746070385, 0.007040961645543575, 0.007225155830383301]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 11.0, 8.0, 7.0, 7.0, 14.0, 11.0, 19.0, 23.0, 10.0, 16.0, 28.0, 37.0, 29.0, 43.0, 38.0, 27.0, 36.0, 53.0, 46.0, 38.0, 39.0, 42.0, 42.0, 38.0, 44.0, 36.0, 31.0, 29.0, 27.0, 23.0, 25.0, 23.0, 25.0, 11.0, 17.0, 8.0, 12.0, 7.0, 3.0, 6.0, 2.0, 3.0, 2.0, 1.0, 4.0, 2.0, 4.0, 0.0, 0.0, 0.0, 3.0], "bins": [-25.234375, -24.470947265625, -23.70751953125, -22.944091796875, -22.1806640625, -21.417236328125, -20.65380859375, -19.890380859375, -19.126953125, -18.363525390625, -17.60009765625, -16.836669921875, -16.0732421875, -15.309814453125, -14.54638671875, -13.782958984375, -13.01953125, -12.256103515625, -11.49267578125, -10.729248046875, -9.9658203125, -9.202392578125, -8.43896484375, -7.675537109375, -6.912109375, -6.148681640625, -5.38525390625, -4.621826171875, -3.8583984375, -3.094970703125, -2.33154296875, -1.568115234375, -0.8046875, -0.041259765625, 0.72216796875, 1.485595703125, 2.2490234375, 3.012451171875, 3.77587890625, 4.539306640625, 5.302734375, 6.066162109375, 6.82958984375, 7.593017578125, 8.3564453125, 9.119873046875, 9.88330078125, 10.646728515625, 11.41015625, 12.173583984375, 12.93701171875, 13.700439453125, 14.4638671875, 15.227294921875, 15.99072265625, 16.754150390625, 17.517578125, 18.281005859375, 19.04443359375, 19.807861328125, 20.5712890625, 21.334716796875, 22.09814453125, 22.861572265625, 23.625]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 15.0, 11.0, 6.0, 14.0, 21.0, 18.0, 37.0, 46.0, 41.0, 71.0, 107.0, 160.0, 226.0, 431.0, 728.0, 1190.0, 2474.0, 6099.0, 25561.0, 401187.0, 567800.0, 29817.0, 6594.0, 2612.0, 1281.0, 744.0, 443.0, 245.0, 176.0, 107.0, 72.0, 55.0, 45.0, 23.0, 25.0, 12.0, 16.0, 12.0, 8.0, 7.0, 3.0, 5.0, 2.0, 2.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 3.0], "bins": [-45.21875, -43.85009765625, -42.4814453125, -41.11279296875, -39.744140625, -38.37548828125, -37.0068359375, -35.63818359375, -34.26953125, -32.90087890625, -31.5322265625, -30.16357421875, -28.794921875, -27.42626953125, -26.0576171875, -24.68896484375, -23.3203125, -21.95166015625, -20.5830078125, -19.21435546875, -17.845703125, -16.47705078125, -15.1083984375, -13.73974609375, -12.37109375, -11.00244140625, -9.6337890625, -8.26513671875, -6.896484375, -5.52783203125, -4.1591796875, -2.79052734375, -1.421875, -0.05322265625, 1.3154296875, 2.68408203125, 4.052734375, 5.42138671875, 6.7900390625, 8.15869140625, 9.52734375, 10.89599609375, 12.2646484375, 13.63330078125, 15.001953125, 16.37060546875, 17.7392578125, 19.10791015625, 20.4765625, 21.84521484375, 23.2138671875, 24.58251953125, 25.951171875, 27.31982421875, 28.6884765625, 30.05712890625, 31.42578125, 32.79443359375, 34.1630859375, 35.53173828125, 36.900390625, 38.26904296875, 39.6376953125, 41.00634765625, 42.375]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 3.0, 0.0, 2.0, 9.0, 8.0, 12.0, 9.0, 4.0, 17.0, 13.0, 20.0, 17.0, 19.0, 37.0, 43.0, 38.0, 48.0, 42.0, 55.0, 94.0, 158.0, 1822.0, 132.0, 57.0, 60.0, 51.0, 59.0, 34.0, 31.0, 28.0, 23.0, 16.0, 26.0, 17.0, 12.0, 8.0, 8.0, 7.0, 3.0, 6.0, 2.0, 3.0, 2.0, 0.0, 2.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.59375, -57.14306640625, -54.6923828125, -52.24169921875, -49.791015625, -47.34033203125, -44.8896484375, -42.43896484375, -39.98828125, -37.53759765625, -35.0869140625, -32.63623046875, -30.185546875, -27.73486328125, -25.2841796875, -22.83349609375, -20.3828125, -17.93212890625, -15.4814453125, -13.03076171875, -10.580078125, -8.12939453125, -5.6787109375, -3.22802734375, -0.77734375, 1.67333984375, 4.1240234375, 6.57470703125, 9.025390625, 11.47607421875, 13.9267578125, 16.37744140625, 18.828125, 21.27880859375, 23.7294921875, 26.18017578125, 28.630859375, 31.08154296875, 33.5322265625, 35.98291015625, 38.43359375, 40.88427734375, 43.3349609375, 45.78564453125, 48.236328125, 50.68701171875, 53.1376953125, 55.58837890625, 58.0390625, 60.48974609375, 62.9404296875, 65.39111328125, 67.841796875, 70.29248046875, 72.7431640625, 75.19384765625, 77.64453125, 80.09521484375, 82.5458984375, 84.99658203125, 87.447265625, 89.89794921875, 92.3486328125, 94.79931640625, 97.25]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 0.0, 3.0, 2.0, 3.0, 4.0, 3.0, 6.0, 8.0, 12.0, 9.0, 21.0, 30.0, 24.0, 27.0, 41.0, 41.0, 87.0, 134.0, 200.0, 426.0, 1347.0, 64992.0, 3074270.0, 2688.0, 573.0, 245.0, 147.0, 98.0, 61.0, 51.0, 16.0, 29.0, 22.0, 17.0, 17.0, 8.0, 5.0, 14.0, 6.0, 11.0, 4.0, 1.0, 5.0, 2.0, 1.0, 1.0, 2.0], "bins": [-290.5, -283.083984375, -275.66796875, -268.251953125, -260.8359375, -253.419921875, -246.00390625, -238.587890625, -231.171875, -223.755859375, -216.33984375, -208.923828125, -201.5078125, -194.091796875, -186.67578125, -179.259765625, -171.84375, -164.427734375, -157.01171875, -149.595703125, -142.1796875, -134.763671875, -127.34765625, -119.931640625, -112.515625, -105.099609375, -97.68359375, -90.267578125, -82.8515625, -75.435546875, -68.01953125, -60.603515625, -53.1875, -45.771484375, -38.35546875, -30.939453125, -23.5234375, -16.107421875, -8.69140625, -1.275390625, 6.140625, 13.556640625, 20.97265625, 28.388671875, 35.8046875, 43.220703125, 50.63671875, 58.052734375, 65.46875, 72.884765625, 80.30078125, 87.716796875, 95.1328125, 102.548828125, 109.96484375, 117.380859375, 124.796875, 132.212890625, 139.62890625, 147.044921875, 154.4609375, 161.876953125, 169.29296875, 176.708984375, 184.125]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 19.0, 66.0, 259.0, 366.0, 219.0, 54.0, 17.0, 7.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-262.3897705078125, -257.3829040527344, -252.3760528564453, -247.36920166015625, -242.3623504638672, -237.35549926757812, -232.3486328125, -227.34178161621094, -222.33493041992188, -217.3280792236328, -212.3212127685547, -207.31436157226562, -202.30751037597656, -197.3006591796875, -192.29379272460938, -187.2869415283203, -182.2800750732422, -177.27322387695312, -172.266357421875, -167.25950622558594, -162.25265502929688, -157.24578857421875, -152.2389373779297, -147.23208618164062, -142.2252197265625, -137.21836853027344, -132.2115020751953, -127.20465087890625, -122.19779968261719, -117.1909408569336, -112.18408203125, -107.17723083496094, -102.17037963867188, -97.16352081298828, -92.15666961669922, -87.14981079101562, -82.14295959472656, -77.13610076904297, -72.12924194335938, -67.12239074707031, -62.11552810668945, -57.108673095703125, -52.10181427001953, -47.0949592590332, -42.088104248046875, -37.08124923706055, -32.07439422607422, -27.067535400390625, -22.060680389404297, -17.05382537841797, -12.046968460083008, -7.040112495422363, -2.0332565307617188, 2.9735984802246094, 7.98045539855957, 12.987312316894531, 17.99416732788086, 23.001022338867188, 28.00787925720215, 33.01473617553711, 38.02159118652344, 43.028446197509766, 48.035301208496094, 53.04216003417969, 58.049015045166016]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [2.0, 4.0, 0.0, 1.0, 3.0, 2.0, 3.0, 5.0, 3.0, 6.0, 11.0, 8.0, 19.0, 20.0, 22.0, 20.0, 17.0, 17.0, 22.0, 38.0, 37.0, 33.0, 34.0, 33.0, 49.0, 43.0, 39.0, 34.0, 41.0, 47.0, 40.0, 36.0, 43.0, 36.0, 27.0, 33.0, 23.0, 26.0, 27.0, 17.0, 14.0, 15.0, 7.0, 13.0, 7.0, 6.0, 7.0, 6.0, 6.0, 5.0, 3.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-168.46751403808594, -162.49844360351562, -156.52935791015625, -150.56027221679688, -144.59120178222656, -138.62213134765625, -132.65304565429688, -126.68396759033203, -120.71488952636719, -114.74581146240234, -108.7767333984375, -102.80765533447266, -96.83857727050781, -90.86949920654297, -84.90042114257812, -78.93134307861328, -72.96226501464844, -66.9931869506836, -61.02410888671875, -55.055030822753906, -49.08595275878906, -43.11687469482422, -37.147796630859375, -31.17871856689453, -25.209640502929688, -19.240562438964844, -13.271484375, -7.302406311035156, -1.3333282470703125, 4.635749816894531, 10.604827880859375, 16.57390594482422, 22.542999267578125, 28.51207733154297, 34.48115539550781, 40.450233459472656, 46.4193115234375, 52.388389587402344, 58.35746765136719, 64.32654571533203, 70.29562377929688, 76.26470184326172, 82.23377990722656, 88.2028579711914, 94.17193603515625, 100.1410140991211, 106.11009216308594, 112.07917022705078, 118.04824829101562, 124.01732635498047, 129.9864044189453, 135.95547485351562, 141.924560546875, 147.89364624023438, 153.8627166748047, 159.831787109375, 165.80087280273438, 171.76995849609375, 177.73902893066406, 183.70809936523438, 189.67718505859375, 195.64627075195312, 201.61534118652344, 207.58441162109375, 213.55349731445312]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 8.0, 5.0, 9.0, 6.0, 8.0, 8.0, 16.0, 12.0, 20.0, 15.0, 17.0, 24.0, 24.0, 34.0, 39.0, 38.0, 32.0, 44.0, 39.0, 43.0, 42.0, 45.0, 38.0, 34.0, 36.0, 40.0, 53.0, 28.0, 39.0, 25.0, 26.0, 26.0, 18.0, 27.0, 14.0, 14.0, 12.0, 13.0, 8.0, 4.0, 5.0, 3.0, 4.0, 3.0, 5.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-25.453125, -24.671630859375, -23.89013671875, -23.108642578125, -22.3271484375, -21.545654296875, -20.76416015625, -19.982666015625, -19.201171875, -18.419677734375, -17.63818359375, -16.856689453125, -16.0751953125, -15.293701171875, -14.51220703125, -13.730712890625, -12.94921875, -12.167724609375, -11.38623046875, -10.604736328125, -9.8232421875, -9.041748046875, -8.26025390625, -7.478759765625, -6.697265625, -5.915771484375, -5.13427734375, -4.352783203125, -3.5712890625, -2.789794921875, -2.00830078125, -1.226806640625, -0.4453125, 0.336181640625, 1.11767578125, 1.899169921875, 2.6806640625, 3.462158203125, 4.24365234375, 5.025146484375, 5.806640625, 6.588134765625, 7.36962890625, 8.151123046875, 8.9326171875, 9.714111328125, 10.49560546875, 11.277099609375, 12.05859375, 12.840087890625, 13.62158203125, 14.403076171875, 15.1845703125, 15.966064453125, 16.74755859375, 17.529052734375, 18.310546875, 19.092041015625, 19.87353515625, 20.655029296875, 21.4365234375, 22.218017578125, 22.99951171875, 23.781005859375, 24.5625]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 2.0, 3.0, 5.0, 13.0, 12.0, 17.0, 15.0, 27.0, 29.0, 49.0, 74.0, 97.0, 125.0, 165.0, 234.0, 373.0, 520.0, 857.0, 1527.0, 3031.0, 7190.0, 48787.0, 746124.0, 2984310.0, 365694.0, 22955.0, 5584.0, 2599.0, 1326.0, 806.0, 512.0, 335.0, 248.0, 154.0, 120.0, 91.0, 88.0, 47.0, 35.0, 22.0, 19.0, 14.0, 12.0, 13.0, 11.0, 4.0, 3.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-54.71875, -53.0283203125, -51.337890625, -49.6474609375, -47.95703125, -46.2666015625, -44.576171875, -42.8857421875, -41.1953125, -39.5048828125, -37.814453125, -36.1240234375, -34.43359375, -32.7431640625, -31.052734375, -29.3623046875, -27.671875, -25.9814453125, -24.291015625, -22.6005859375, -20.91015625, -19.2197265625, -17.529296875, -15.8388671875, -14.1484375, -12.4580078125, -10.767578125, -9.0771484375, -7.38671875, -5.6962890625, -4.005859375, -2.3154296875, -0.625, 1.0654296875, 2.755859375, 4.4462890625, 6.13671875, 7.8271484375, 9.517578125, 11.2080078125, 12.8984375, 14.5888671875, 16.279296875, 17.9697265625, 19.66015625, 21.3505859375, 23.041015625, 24.7314453125, 26.421875, 28.1123046875, 29.802734375, 31.4931640625, 33.18359375, 34.8740234375, 36.564453125, 38.2548828125, 39.9453125, 41.6357421875, 43.326171875, 45.0166015625, 46.70703125, 48.3974609375, 50.087890625, 51.7783203125, 53.46875]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 2.0, 4.0, 10.0, 10.0, 15.0, 34.0, 40.0, 49.0, 66.0, 132.0, 258.0, 487.0, 807.0, 852.0, 518.0, 299.0, 173.0, 80.0, 56.0, 37.0, 35.0, 32.0, 10.0, 17.0, 11.0, 8.0, 6.0, 5.0, 5.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.21875, -47.63671875, -46.0546875, -44.47265625, -42.890625, -41.30859375, -39.7265625, -38.14453125, -36.5625, -34.98046875, -33.3984375, -31.81640625, -30.234375, -28.65234375, -27.0703125, -25.48828125, -23.90625, -22.32421875, -20.7421875, -19.16015625, -17.578125, -15.99609375, -14.4140625, -12.83203125, -11.25, -9.66796875, -8.0859375, -6.50390625, -4.921875, -3.33984375, -1.7578125, -0.17578125, 1.40625, 2.98828125, 4.5703125, 6.15234375, 7.734375, 9.31640625, 10.8984375, 12.48046875, 14.0625, 15.64453125, 17.2265625, 18.80859375, 20.390625, 21.97265625, 23.5546875, 25.13671875, 26.71875, 28.30078125, 29.8828125, 31.46484375, 33.046875, 34.62890625, 36.2109375, 37.79296875, 39.375, 40.95703125, 42.5390625, 44.12109375, 45.703125, 47.28515625, 48.8671875, 50.44921875, 52.03125]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 6.0, 5.0, 1.0, 9.0, 4.0, 17.0, 11.0, 13.0, 21.0, 35.0, 59.0, 91.0, 140.0, 317.0, 795.0, 2780.0, 21223.0, 3834255.0, 322411.0, 9322.0, 1698.0, 562.0, 190.0, 133.0, 59.0, 52.0, 26.0, 13.0, 15.0, 5.0, 6.0, 3.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-186.625, -180.939453125, -175.25390625, -169.568359375, -163.8828125, -158.197265625, -152.51171875, -146.826171875, -141.140625, -135.455078125, -129.76953125, -124.083984375, -118.3984375, -112.712890625, -107.02734375, -101.341796875, -95.65625, -89.970703125, -84.28515625, -78.599609375, -72.9140625, -67.228515625, -61.54296875, -55.857421875, -50.171875, -44.486328125, -38.80078125, -33.115234375, -27.4296875, -21.744140625, -16.05859375, -10.373046875, -4.6875, 0.998046875, 6.68359375, 12.369140625, 18.0546875, 23.740234375, 29.42578125, 35.111328125, 40.796875, 46.482421875, 52.16796875, 57.853515625, 63.5390625, 69.224609375, 74.91015625, 80.595703125, 86.28125, 91.966796875, 97.65234375, 103.337890625, 109.0234375, 114.708984375, 120.39453125, 126.080078125, 131.765625, 137.451171875, 143.13671875, 148.822265625, 154.5078125, 160.193359375, 165.87890625, 171.564453125, 177.25]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 7.0, 21.0, 123.0, 420.0, 335.0, 85.0, 17.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-671.45751953125, -655.0128173828125, -638.5680541992188, -622.1233520507812, -605.6786499023438, -589.2339477539062, -572.7891845703125, -556.344482421875, -539.8997802734375, -523.455078125, -507.0103454589844, -490.56561279296875, -474.12091064453125, -457.6761779785156, -441.2314453125, -424.7867431640625, -408.3420104980469, -391.89727783203125, -375.45257568359375, -359.0078430175781, -342.5631408691406, -326.118408203125, -309.6737060546875, -293.2289733886719, -276.78424072265625, -260.3395080566406, -243.89480590820312, -227.4500732421875, -211.00537109375, -194.56063842773438, -178.1159210205078, -161.67120361328125, -145.22647094726562, -128.78175354003906, -112.3370361328125, -95.8923110961914, -79.44759368896484, -63.00287628173828, -46.55815124511719, -30.113433837890625, -13.668716430664062, 2.776002883911133, 19.220722198486328, 35.665443420410156, 52.11016082763672, 68.55487823486328, 84.99960327148438, 101.44432067871094, 117.8890380859375, 134.33375549316406, 150.77847290039062, 167.22320556640625, 183.66790771484375, 200.11264038085938, 216.55735778808594, 233.0020751953125, 249.44679260253906, 265.8915100097656, 282.33624267578125, 298.78094482421875, 315.2256774902344, 331.6703796386719, 348.1151123046875, 364.559814453125, 381.0045471191406]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 8.0, 4.0, 12.0, 5.0, 11.0, 18.0, 17.0, 21.0, 18.0, 24.0, 24.0, 30.0, 30.0, 28.0, 37.0, 38.0, 44.0, 33.0, 30.0, 51.0, 38.0, 46.0, 40.0, 43.0, 39.0, 34.0, 30.0, 33.0, 28.0, 29.0, 27.0, 18.0, 19.0, 14.0, 17.0, 14.0, 13.0, 6.0, 5.0, 4.0, 9.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-127.73908996582031, -124.02251434326172, -120.30593872070312, -116.58936309814453, -112.87278747558594, -109.15620422363281, -105.43963623046875, -101.72305297851562, -98.00647735595703, -94.28990173339844, -90.57332611083984, -86.85675048828125, -83.14017486572266, -79.42359924316406, -75.70701599121094, -71.99044036865234, -68.27386474609375, -64.55728912353516, -60.84071350097656, -57.12413787841797, -53.40755844116211, -49.690982818603516, -45.97440719604492, -42.25782775878906, -38.541259765625, -34.824684143066406, -31.10810661315918, -27.391530990600586, -23.67495346069336, -19.958377838134766, -16.241802215576172, -12.525224685668945, -8.808647155761719, -5.092070579528809, -1.3754944801330566, 2.3410816192626953, 6.0576581954956055, 9.774234771728516, 13.49081039428711, 17.207387924194336, 20.92396354675293, 24.640539169311523, 28.35711669921875, 32.073692321777344, 35.79026794433594, 39.50684356689453, 43.223419189453125, 46.939998626708984, 50.65657424926758, 54.37314987182617, 58.089725494384766, 61.806304931640625, 65.52288055419922, 69.23945617675781, 72.9560317993164, 76.672607421875, 80.3891830444336, 84.10575866699219, 87.82233428955078, 91.53890991210938, 95.25548553466797, 98.97206115722656, 102.68864440917969, 106.40522003173828, 110.12179565429688]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 6.0, 1.0, 2.0, 8.0, 5.0, 14.0, 7.0, 16.0, 12.0, 12.0, 15.0, 21.0, 17.0, 26.0, 30.0, 37.0, 36.0, 36.0, 27.0, 46.0, 48.0, 35.0, 46.0, 35.0, 58.0, 39.0, 36.0, 38.0, 36.0, 28.0, 34.0, 27.0, 27.0, 28.0, 23.0, 12.0, 20.0, 9.0, 8.0, 11.0, 6.0, 8.0, 5.0, 4.0, 5.0, 0.0, 7.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-25.65625, -24.90234375, -24.1484375, -23.39453125, -22.640625, -21.88671875, -21.1328125, -20.37890625, -19.625, -18.87109375, -18.1171875, -17.36328125, -16.609375, -15.85546875, -15.1015625, -14.34765625, -13.59375, -12.83984375, -12.0859375, -11.33203125, -10.578125, -9.82421875, -9.0703125, -8.31640625, -7.5625, -6.80859375, -6.0546875, -5.30078125, -4.546875, -3.79296875, -3.0390625, -2.28515625, -1.53125, -0.77734375, -0.0234375, 0.73046875, 1.484375, 2.23828125, 2.9921875, 3.74609375, 4.5, 5.25390625, 6.0078125, 6.76171875, 7.515625, 8.26953125, 9.0234375, 9.77734375, 10.53125, 11.28515625, 12.0390625, 12.79296875, 13.546875, 14.30078125, 15.0546875, 15.80859375, 16.5625, 17.31640625, 18.0703125, 18.82421875, 19.578125, 20.33203125, 21.0859375, 21.83984375, 22.59375]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 7.0, 12.0, 11.0, 20.0, 45.0, 54.0, 101.0, 131.0, 236.0, 327.0, 515.0, 850.0, 1348.0, 2048.0, 3301.0, 5173.0, 8273.0, 13853.0, 22706.0, 38835.0, 68331.0, 128413.0, 236255.0, 232152.0, 123512.0, 66561.0, 37743.0, 22305.0, 13381.0, 8274.0, 5036.0, 3073.0, 2077.0, 1254.0, 836.0, 550.0, 354.0, 214.0, 144.0, 95.0, 54.0, 40.0, 20.0, 11.0, 11.0, 5.0, 2.0, 3.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.193359375, -1.1535491943359375, -1.113739013671875, -1.0739288330078125, -1.03411865234375, -0.9943084716796875, -0.954498291015625, -0.9146881103515625, -0.8748779296875, -0.8350677490234375, -0.795257568359375, -0.7554473876953125, -0.71563720703125, -0.6758270263671875, -0.636016845703125, -0.5962066650390625, -0.556396484375, -0.5165863037109375, -0.476776123046875, -0.4369659423828125, -0.39715576171875, -0.3573455810546875, -0.317535400390625, -0.2777252197265625, -0.2379150390625, -0.1981048583984375, -0.158294677734375, -0.1184844970703125, -0.07867431640625, -0.0388641357421875, 0.000946044921875, 0.0407562255859375, 0.08056640625, 0.1203765869140625, 0.160186767578125, 0.1999969482421875, 0.23980712890625, 0.2796173095703125, 0.319427490234375, 0.3592376708984375, 0.3990478515625, 0.4388580322265625, 0.478668212890625, 0.5184783935546875, 0.55828857421875, 0.5980987548828125, 0.637908935546875, 0.6777191162109375, 0.717529296875, 0.7573394775390625, 0.797149658203125, 0.8369598388671875, 0.87677001953125, 0.9165802001953125, 0.956390380859375, 0.9962005615234375, 1.0360107421875, 1.0758209228515625, 1.115631103515625, 1.1554412841796875, 1.19525146484375, 1.2350616455078125, 1.274871826171875, 1.3146820068359375, 1.3544921875]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 3.0, 4.0, 9.0, 5.0, 10.0, 4.0, 8.0, 10.0, 9.0, 14.0, 22.0, 17.0, 24.0, 17.0, 26.0, 32.0, 17.0, 28.0, 32.0, 35.0, 29.0, 45.0, 43.0, 46.0, 1061.0, 32.0, 32.0, 46.0, 36.0, 38.0, 32.0, 23.0, 28.0, 21.0, 36.0, 18.0, 28.0, 19.0, 21.0, 9.0, 8.0, 14.0, 9.0, 6.0, 6.0, 7.0, 3.0, 1.0, 3.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0], "bins": [-14.703125, -14.2491455078125, -13.795166015625, -13.3411865234375, -12.88720703125, -12.4332275390625, -11.979248046875, -11.5252685546875, -11.0712890625, -10.6173095703125, -10.163330078125, -9.7093505859375, -9.25537109375, -8.8013916015625, -8.347412109375, -7.8934326171875, -7.439453125, -6.9854736328125, -6.531494140625, -6.0775146484375, -5.62353515625, -5.1695556640625, -4.715576171875, -4.2615966796875, -3.8076171875, -3.3536376953125, -2.899658203125, -2.4456787109375, -1.99169921875, -1.5377197265625, -1.083740234375, -0.6297607421875, -0.17578125, 0.2781982421875, 0.732177734375, 1.1861572265625, 1.64013671875, 2.0941162109375, 2.548095703125, 3.0020751953125, 3.4560546875, 3.9100341796875, 4.364013671875, 4.8179931640625, 5.27197265625, 5.7259521484375, 6.179931640625, 6.6339111328125, 7.087890625, 7.5418701171875, 7.995849609375, 8.4498291015625, 8.90380859375, 9.3577880859375, 9.811767578125, 10.2657470703125, 10.7197265625, 11.1737060546875, 11.627685546875, 12.0816650390625, 12.53564453125, 12.9896240234375, 13.443603515625, 13.8975830078125, 14.3515625]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 6.0, 8.0, 13.0, 16.0, 24.0, 31.0, 63.0, 70.0, 97.0, 171.0, 246.0, 356.0, 483.0, 682.0, 946.0, 1299.0, 1828.0, 2514.0, 3494.0, 5041.0, 7046.0, 9973.0, 14172.0, 20359.0, 29997.0, 44877.0, 70762.0, 114099.0, 190704.0, 1222728.0, 124388.0, 76529.0, 48474.0, 32183.0, 21633.0, 15171.0, 10684.0, 7411.0, 5305.0, 3838.0, 2675.0, 1962.0, 1345.0, 1066.0, 724.0, 506.0, 333.0, 249.0, 187.0, 125.0, 85.0, 72.0, 38.0, 18.0, 16.0, 11.0, 5.0, 4.0, 3.0, 1.0, 2.0], "bins": [-0.87744140625, -0.85009765625, -0.82275390625, -0.79541015625, -0.76806640625, -0.74072265625, -0.71337890625, -0.68603515625, -0.65869140625, -0.63134765625, -0.60400390625, -0.57666015625, -0.54931640625, -0.52197265625, -0.49462890625, -0.46728515625, -0.43994140625, -0.41259765625, -0.38525390625, -0.35791015625, -0.33056640625, -0.30322265625, -0.27587890625, -0.24853515625, -0.22119140625, -0.19384765625, -0.16650390625, -0.13916015625, -0.11181640625, -0.08447265625, -0.05712890625, -0.02978515625, -0.00244140625, 0.02490234375, 0.05224609375, 0.07958984375, 0.10693359375, 0.13427734375, 0.16162109375, 0.18896484375, 0.21630859375, 0.24365234375, 0.27099609375, 0.29833984375, 0.32568359375, 0.35302734375, 0.38037109375, 0.40771484375, 0.43505859375, 0.46240234375, 0.48974609375, 0.51708984375, 0.54443359375, 0.57177734375, 0.59912109375, 0.62646484375, 0.65380859375, 0.68115234375, 0.70849609375, 0.73583984375, 0.76318359375, 0.79052734375, 0.81787109375, 0.84521484375, 0.87255859375]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 5.0, 8.0, 9.0, 15.0, 14.0, 14.0, 19.0, 22.0, 20.0, 30.0, 34.0, 51.0, 62.0, 59.0, 60.0, 67.0, 61.0, 54.0, 72.0, 44.0, 50.0, 46.0, 33.0, 32.0, 24.0, 19.0, 16.0, 13.0, 11.0, 9.0, 11.0, 8.0, 2.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.006046295166015625, -0.005880534648895264, -0.005714774131774902, -0.005549013614654541, -0.00538325309753418, -0.005217492580413818, -0.005051732063293457, -0.004885971546173096, -0.004720211029052734, -0.004554450511932373, -0.004388689994812012, -0.00422292947769165, -0.004057168960571289, -0.0038914084434509277, -0.0037256479263305664, -0.003559887409210205, -0.0033941268920898438, -0.0032283663749694824, -0.003062605857849121, -0.0028968453407287598, -0.0027310848236083984, -0.002565324306488037, -0.0023995637893676758, -0.0022338032722473145, -0.002068042755126953, -0.0019022822380065918, -0.0017365217208862305, -0.0015707612037658691, -0.0014050006866455078, -0.0012392401695251465, -0.0010734796524047852, -0.0009077191352844238, -0.0007419586181640625, -0.0005761981010437012, -0.00041043758392333984, -0.0002446770668029785, -7.891654968261719e-05, 8.684396743774414e-05, 0.00025260448455810547, 0.0004183650016784668, 0.0005841255187988281, 0.0007498860359191895, 0.0009156465530395508, 0.0010814070701599121, 0.0012471675872802734, 0.0014129281044006348, 0.001578688621520996, 0.0017444491386413574, 0.0019102096557617188, 0.00207597017288208, 0.0022417306900024414, 0.0024074912071228027, 0.002573251724243164, 0.0027390122413635254, 0.0029047727584838867, 0.003070533275604248, 0.0032362937927246094, 0.0034020543098449707, 0.003567814826965332, 0.0037335753440856934, 0.0038993358612060547, 0.004065096378326416, 0.004230856895446777, 0.004396617412567139, 0.0045623779296875]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 6.0, 3.0, 3.0, 3.0, 14.0, 12.0, 19.0, 14.0, 17.0, 34.0, 39.0, 47.0, 60.0, 78.0, 117.0, 198.0, 376.0, 2373.0, 807577.0, 235267.0, 1316.0, 325.0, 184.0, 110.0, 101.0, 59.0, 44.0, 44.0, 32.0, 13.0, 19.0, 10.0, 13.0, 11.0, 9.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09063720703125, -0.08713817596435547, -0.08363914489746094, -0.0801401138305664, -0.07664108276367188, -0.07314205169677734, -0.06964302062988281, -0.06614398956298828, -0.06264495849609375, -0.05914592742919922, -0.05564689636230469, -0.052147865295410156, -0.048648834228515625, -0.045149803161621094, -0.04165077209472656, -0.03815174102783203, -0.0346527099609375, -0.03115367889404297, -0.027654647827148438, -0.024155616760253906, -0.020656585693359375, -0.017157554626464844, -0.013658523559570312, -0.010159492492675781, -0.00666046142578125, -0.0031614303588867188, 0.0003376007080078125, 0.0038366317749023438, 0.007335662841796875, 0.010834693908691406, 0.014333724975585938, 0.01783275604248047, 0.021331787109375, 0.02483081817626953, 0.028329849243164062, 0.031828880310058594, 0.035327911376953125, 0.038826942443847656, 0.04232597351074219, 0.04582500457763672, 0.04932403564453125, 0.05282306671142578, 0.05632209777832031, 0.059821128845214844, 0.06332015991210938, 0.0668191909790039, 0.07031822204589844, 0.07381725311279297, 0.0773162841796875, 0.08081531524658203, 0.08431434631347656, 0.0878133773803711, 0.09131240844726562, 0.09481143951416016, 0.09831047058105469, 0.10180950164794922, 0.10530853271484375, 0.10880756378173828, 0.11230659484863281, 0.11580562591552734, 0.11930465698242188, 0.1228036880493164, 0.12630271911621094, 0.12980175018310547, 0.13330078125]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 32.0, 919.0, 64.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09649784862995148, -0.09479185193777084, -0.09308585524559021, -0.09137985855340958, -0.08967385441064835, -0.08796785771846771, -0.08626186102628708, -0.08455586433410645, -0.08284986764192581, -0.08114387094974518, -0.07943787425756454, -0.07773187756538391, -0.07602587342262268, -0.07431987673044205, -0.07261388003826141, -0.07090788334608078, -0.06920188665390015, -0.06749588996171951, -0.06578989326953888, -0.06408389657735825, -0.062377896159887314, -0.06067189574241638, -0.05896589905023575, -0.057259902358055115, -0.05555390194058418, -0.05384790524840355, -0.05214190483093262, -0.050435908138751984, -0.04872991144657135, -0.04702391475439072, -0.045317914336919785, -0.04361191764473915, -0.04190591722726822, -0.040199920535087585, -0.03849392011761665, -0.03678792342543602, -0.035081926733255386, -0.033375926315784454, -0.03166992962360382, -0.029963932931423187, -0.028257936239242554, -0.02655193768441677, -0.024845940992236137, -0.023139942437410355, -0.02143394574522972, -0.01972794719040394, -0.018021948635578156, -0.016315951943397522, -0.014609955251216888, -0.01290395762771368, -0.011197960004210472, -0.00949196144938469, -0.0077859642915427685, -0.006079966202378273, -0.004373968578875065, -0.0026679709553718567, -0.0009619733318686485, 0.0007440244080498815, 0.0024500221479684114, 0.004156020004302263, 0.005862017627805471, 0.007568015716969967, 0.009274013340473175, 0.010980010963976383, 0.012686008587479591]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 6.0, 12.0, 11.0, 12.0, 19.0, 15.0, 23.0, 23.0, 17.0, 32.0, 31.0, 44.0, 38.0, 45.0, 48.0, 41.0, 33.0, 42.0, 50.0, 45.0, 46.0, 41.0, 37.0, 28.0, 43.0, 28.0, 31.0, 32.0, 19.0, 27.0, 15.0, 12.0, 6.0, 9.0, 11.0, 9.0, 7.0, 5.0, 4.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.003112494945526123, -0.0030047884210944176, -0.002897081896662712, -0.0027893753722310066, -0.002681668847799301, -0.0025739623233675957, -0.00246625579893589, -0.0023585492745041847, -0.0022508427500724792, -0.0021431362256407738, -0.0020354297012090683, -0.0019277231767773628, -0.0018200166523456573, -0.0017123101279139519, -0.0016046036034822464, -0.001496897079050541, -0.0013891905546188354, -0.00128148403018713, -0.0011737775057554245, -0.001066070981323719, -0.0009583644568920135, -0.0008506579324603081, -0.0007429514080286026, -0.0006352448835968971, -0.0005275383591651917, -0.0004198318347334862, -0.0003121253103017807, -0.00020441878587007523, -9.671226143836975e-05, 1.0994262993335724e-05, 0.0001187007874250412, 0.00022640731185674667, 0.00033411383628845215, 0.0004418203607201576, 0.0005495268851518631, 0.0006572334095835686, 0.000764939934015274, 0.0008726464584469795, 0.000980352982878685, 0.0010880595073103905, 0.001195766031742096, 0.0013034725561738014, 0.001411179080605507, 0.0015188856050372124, 0.0016265921294689178, 0.0017342986539006233, 0.0018420051783323288, 0.0019497117027640343, 0.0020574182271957397, 0.0021651247516274452, 0.0022728312760591507, 0.002380537800490856, 0.0024882443249225616, 0.002595950849354267, 0.0027036573737859726, 0.002811363898217678, 0.0029190704226493835, 0.003026776947081089, 0.0031344834715127945, 0.0032421899959445, 0.0033498965203762054, 0.003457603044807911, 0.0035653095692396164, 0.003673016093671322, 0.0037807226181030273]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 6.0, 1.0, 2.0, 8.0, 5.0, 14.0, 7.0, 16.0, 12.0, 12.0, 15.0, 21.0, 17.0, 26.0, 30.0, 37.0, 36.0, 36.0, 27.0, 46.0, 48.0, 35.0, 46.0, 35.0, 58.0, 39.0, 36.0, 38.0, 36.0, 28.0, 34.0, 27.0, 27.0, 28.0, 23.0, 12.0, 20.0, 9.0, 8.0, 11.0, 6.0, 8.0, 5.0, 4.0, 5.0, 0.0, 7.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-25.65625, -24.90234375, -24.1484375, -23.39453125, -22.640625, -21.88671875, -21.1328125, -20.37890625, -19.625, -18.87109375, -18.1171875, -17.36328125, -16.609375, -15.85546875, -15.1015625, -14.34765625, -13.59375, -12.83984375, -12.0859375, -11.33203125, -10.578125, -9.82421875, -9.0703125, -8.31640625, -7.5625, -6.80859375, -6.0546875, -5.30078125, -4.546875, -3.79296875, -3.0390625, -2.28515625, -1.53125, -0.77734375, -0.0234375, 0.73046875, 1.484375, 2.23828125, 2.9921875, 3.74609375, 4.5, 5.25390625, 6.0078125, 6.76171875, 7.515625, 8.26953125, 9.0234375, 9.77734375, 10.53125, 11.28515625, 12.0390625, 12.79296875, 13.546875, 14.30078125, 15.0546875, 15.80859375, 16.5625, 17.31640625, 18.0703125, 18.82421875, 19.578125, 20.33203125, 21.0859375, 21.83984375, 22.59375]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 6.0, 3.0, 3.0, 7.0, 7.0, 16.0, 19.0, 30.0, 30.0, 50.0, 72.0, 132.0, 224.0, 361.0, 613.0, 1054.0, 1918.0, 3361.0, 6187.0, 13114.0, 31033.0, 95137.0, 427449.0, 337354.0, 78735.0, 27169.0, 11600.0, 5654.0, 3082.0, 1641.0, 1010.0, 573.0, 361.0, 218.0, 112.0, 74.0, 50.0, 32.0, 18.0, 10.0, 10.0, 5.0, 6.0, 9.0, 3.0, 2.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-30.296875, -29.40380859375, -28.5107421875, -27.61767578125, -26.724609375, -25.83154296875, -24.9384765625, -24.04541015625, -23.15234375, -22.25927734375, -21.3662109375, -20.47314453125, -19.580078125, -18.68701171875, -17.7939453125, -16.90087890625, -16.0078125, -15.11474609375, -14.2216796875, -13.32861328125, -12.435546875, -11.54248046875, -10.6494140625, -9.75634765625, -8.86328125, -7.97021484375, -7.0771484375, -6.18408203125, -5.291015625, -4.39794921875, -3.5048828125, -2.61181640625, -1.71875, -0.82568359375, 0.0673828125, 0.96044921875, 1.853515625, 2.74658203125, 3.6396484375, 4.53271484375, 5.42578125, 6.31884765625, 7.2119140625, 8.10498046875, 8.998046875, 9.89111328125, 10.7841796875, 11.67724609375, 12.5703125, 13.46337890625, 14.3564453125, 15.24951171875, 16.142578125, 17.03564453125, 17.9287109375, 18.82177734375, 19.71484375, 20.60791015625, 21.5009765625, 22.39404296875, 23.287109375, 24.18017578125, 25.0732421875, 25.96630859375, 26.859375]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 5.0, 8.0, 3.0, 5.0, 10.0, 11.0, 5.0, 11.0, 16.0, 7.0, 35.0, 23.0, 29.0, 25.0, 30.0, 45.0, 29.0, 38.0, 51.0, 72.0, 101.0, 234.0, 1485.0, 235.0, 104.0, 75.0, 59.0, 47.0, 35.0, 35.0, 34.0, 24.0, 21.0, 14.0, 17.0, 18.0, 10.0, 11.0, 5.0, 4.0, 11.0, 4.0, 6.0, 5.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-59.09375, -57.02783203125, -54.9619140625, -52.89599609375, -50.830078125, -48.76416015625, -46.6982421875, -44.63232421875, -42.56640625, -40.50048828125, -38.4345703125, -36.36865234375, -34.302734375, -32.23681640625, -30.1708984375, -28.10498046875, -26.0390625, -23.97314453125, -21.9072265625, -19.84130859375, -17.775390625, -15.70947265625, -13.6435546875, -11.57763671875, -9.51171875, -7.44580078125, -5.3798828125, -3.31396484375, -1.248046875, 0.81787109375, 2.8837890625, 4.94970703125, 7.015625, 9.08154296875, 11.1474609375, 13.21337890625, 15.279296875, 17.34521484375, 19.4111328125, 21.47705078125, 23.54296875, 25.60888671875, 27.6748046875, 29.74072265625, 31.806640625, 33.87255859375, 35.9384765625, 38.00439453125, 40.0703125, 42.13623046875, 44.2021484375, 46.26806640625, 48.333984375, 50.39990234375, 52.4658203125, 54.53173828125, 56.59765625, 58.66357421875, 60.7294921875, 62.79541015625, 64.861328125, 66.92724609375, 68.9931640625, 71.05908203125, 73.125]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 7.0, 6.0, 7.0, 5.0, 11.0, 7.0, 13.0, 30.0, 16.0, 23.0, 39.0, 50.0, 43.0, 76.0, 66.0, 133.0, 181.0, 255.0, 581.0, 1563.0, 13302.0, 1097754.0, 2011575.0, 16500.0, 1764.0, 590.0, 310.0, 170.0, 123.0, 107.0, 84.0, 57.0, 50.0, 52.0, 25.0, 28.0, 14.0, 14.0, 14.0, 10.0, 12.0, 8.0, 12.0, 7.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 3.0], "bins": [-115.8125, -112.5068359375, -109.201171875, -105.8955078125, -102.58984375, -99.2841796875, -95.978515625, -92.6728515625, -89.3671875, -86.0615234375, -82.755859375, -79.4501953125, -76.14453125, -72.8388671875, -69.533203125, -66.2275390625, -62.921875, -59.6162109375, -56.310546875, -53.0048828125, -49.69921875, -46.3935546875, -43.087890625, -39.7822265625, -36.4765625, -33.1708984375, -29.865234375, -26.5595703125, -23.25390625, -19.9482421875, -16.642578125, -13.3369140625, -10.03125, -6.7255859375, -3.419921875, -0.1142578125, 3.19140625, 6.4970703125, 9.802734375, 13.1083984375, 16.4140625, 19.7197265625, 23.025390625, 26.3310546875, 29.63671875, 32.9423828125, 36.248046875, 39.5537109375, 42.859375, 46.1650390625, 49.470703125, 52.7763671875, 56.08203125, 59.3876953125, 62.693359375, 65.9990234375, 69.3046875, 72.6103515625, 75.916015625, 79.2216796875, 82.52734375, 85.8330078125, 89.138671875, 92.4443359375, 95.75]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 38.0, 477.0, 460.0, 39.0, 3.0, 1.0, 0.0, 1.0], "bins": [-943.0515747070312, -926.796142578125, -910.5406494140625, -894.2852172851562, -878.02978515625, -861.7742919921875, -845.5188598632812, -829.263427734375, -813.0079345703125, -796.7525024414062, -780.4970092773438, -764.2415771484375, -747.9861450195312, -731.730712890625, -715.4752197265625, -699.2197875976562, -682.96435546875, -666.7089233398438, -650.4534301757812, -634.197998046875, -617.9425659179688, -601.6871337890625, -585.431640625, -569.1762084960938, -552.9207763671875, -536.6653442382812, -520.4098510742188, -504.1544189453125, -487.89898681640625, -471.6435241699219, -455.3880615234375, -439.13262939453125, -422.8771057128906, -406.62164306640625, -390.3662109375, -374.1107482910156, -357.85528564453125, -341.599853515625, -325.3443908691406, -309.08892822265625, -292.83349609375, -276.5780334472656, -260.3226013183594, -244.067138671875, -227.8116912841797, -211.55624389648438, -195.30078125, -179.0453338623047, -162.78988647460938, -146.53443908691406, -130.27899169921875, -114.02352905273438, -97.76808166503906, -81.51263427734375, -65.2571792602539, -49.00172424316406, -32.74628448486328, -16.490833282470703, -0.235382080078125, 16.020069122314453, 32.27552032470703, 48.530967712402344, 64.78642272949219, 81.04187774658203, 97.29732513427734]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 1.0, 3.0, 4.0, 9.0, 13.0, 13.0, 11.0, 24.0, 15.0, 23.0, 20.0, 31.0, 20.0, 27.0, 40.0, 31.0, 27.0, 50.0, 40.0, 57.0, 40.0, 38.0, 41.0, 34.0, 50.0, 38.0, 41.0, 30.0, 27.0, 20.0, 22.0, 26.0, 27.0, 16.0, 12.0, 14.0, 13.0, 5.0, 9.0, 11.0, 7.0, 8.0, 0.0, 2.0, 3.0, 1.0, 1.0, 5.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 3.0], "bins": [-159.0382080078125, -153.84970092773438, -148.6611785888672, -143.47267150878906, -138.28416442871094, -133.09564208984375, -127.90713500976562, -122.7186279296875, -117.53011322021484, -112.34159851074219, -107.15309143066406, -101.9645767211914, -96.77606201171875, -91.58755493164062, -86.39904022216797, -81.21052551269531, -76.02201843261719, -70.83350372314453, -65.6449966430664, -60.45648193359375, -55.26797103881836, -50.07946014404297, -44.89094543457031, -39.70243453979492, -34.51392364501953, -29.32541275024414, -24.136899948120117, -18.948387145996094, -13.759876251220703, -8.571365356445312, -3.382852554321289, 1.8056602478027344, 6.9941864013671875, 12.182698249816895, 17.3712100982666, 22.559722900390625, 27.748233795166016, 32.936744689941406, 38.12525939941406, 43.31377029418945, 48.502281188964844, 53.690792083740234, 58.879302978515625, 64.06781768798828, 69.25633239746094, 74.44483947753906, 79.63335418701172, 84.82186889648438, 90.0103759765625, 95.19889068603516, 100.38739776611328, 105.57591247558594, 110.76441955566406, 115.95293426513672, 121.14144897460938, 126.3299560546875, 131.51846313476562, 136.70697021484375, 141.89549255371094, 147.08399963378906, 152.2725067138672, 157.46102905273438, 162.6495361328125, 167.83804321289062, 173.0265655517578]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 3.0, 7.0, 8.0, 7.0, 9.0, 11.0, 10.0, 10.0, 23.0, 12.0, 24.0, 25.0, 24.0, 34.0, 27.0, 36.0, 36.0, 41.0, 39.0, 43.0, 40.0, 53.0, 36.0, 43.0, 41.0, 37.0, 28.0, 41.0, 27.0, 32.0, 25.0, 16.0, 23.0, 24.0, 13.0, 20.0, 14.0, 10.0, 4.0, 9.0, 8.0, 5.0, 4.0, 5.0, 7.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-23.96875, -23.233642578125, -22.49853515625, -21.763427734375, -21.0283203125, -20.293212890625, -19.55810546875, -18.822998046875, -18.087890625, -17.352783203125, -16.61767578125, -15.882568359375, -15.1474609375, -14.412353515625, -13.67724609375, -12.942138671875, -12.20703125, -11.471923828125, -10.73681640625, -10.001708984375, -9.2666015625, -8.531494140625, -7.79638671875, -7.061279296875, -6.326171875, -5.591064453125, -4.85595703125, -4.120849609375, -3.3857421875, -2.650634765625, -1.91552734375, -1.180419921875, -0.4453125, 0.289794921875, 1.02490234375, 1.760009765625, 2.4951171875, 3.230224609375, 3.96533203125, 4.700439453125, 5.435546875, 6.170654296875, 6.90576171875, 7.640869140625, 8.3759765625, 9.111083984375, 9.84619140625, 10.581298828125, 11.31640625, 12.051513671875, 12.78662109375, 13.521728515625, 14.2568359375, 14.991943359375, 15.72705078125, 16.462158203125, 17.197265625, 17.932373046875, 18.66748046875, 19.402587890625, 20.1376953125, 20.872802734375, 21.60791015625, 22.343017578125, 23.078125]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 5.0, 2.0, 5.0, 5.0, 8.0, 9.0, 5.0, 11.0, 17.0, 16.0, 15.0, 23.0, 32.0, 49.0, 91.0, 91.0, 197.0, 320.0, 720.0, 1438.0, 3694.0, 13791.0, 429486.0, 3587113.0, 142784.0, 8824.0, 2906.0, 1196.0, 570.0, 305.0, 201.0, 96.0, 61.0, 49.0, 36.0, 16.0, 20.0, 13.0, 13.0, 14.0, 6.0, 8.0, 6.0, 6.0, 5.0, 2.0, 3.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0], "bins": [-82.1875, -79.7958984375, -77.404296875, -75.0126953125, -72.62109375, -70.2294921875, -67.837890625, -65.4462890625, -63.0546875, -60.6630859375, -58.271484375, -55.8798828125, -53.48828125, -51.0966796875, -48.705078125, -46.3134765625, -43.921875, -41.5302734375, -39.138671875, -36.7470703125, -34.35546875, -31.9638671875, -29.572265625, -27.1806640625, -24.7890625, -22.3974609375, -20.005859375, -17.6142578125, -15.22265625, -12.8310546875, -10.439453125, -8.0478515625, -5.65625, -3.2646484375, -0.873046875, 1.5185546875, 3.91015625, 6.3017578125, 8.693359375, 11.0849609375, 13.4765625, 15.8681640625, 18.259765625, 20.6513671875, 23.04296875, 25.4345703125, 27.826171875, 30.2177734375, 32.609375, 35.0009765625, 37.392578125, 39.7841796875, 42.17578125, 44.5673828125, 46.958984375, 49.3505859375, 51.7421875, 54.1337890625, 56.525390625, 58.9169921875, 61.30859375, 63.7001953125, 66.091796875, 68.4833984375, 70.875]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 0.0, 2.0, 4.0, 6.0, 4.0, 11.0, 13.0, 27.0, 36.0, 47.0, 82.0, 137.0, 301.0, 641.0, 1006.0, 856.0, 402.0, 196.0, 137.0, 62.0, 28.0, 23.0, 23.0, 9.0, 6.0, 3.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-62.03125, -60.34423828125, -58.6572265625, -56.97021484375, -55.283203125, -53.59619140625, -51.9091796875, -50.22216796875, -48.53515625, -46.84814453125, -45.1611328125, -43.47412109375, -41.787109375, -40.10009765625, -38.4130859375, -36.72607421875, -35.0390625, -33.35205078125, -31.6650390625, -29.97802734375, -28.291015625, -26.60400390625, -24.9169921875, -23.22998046875, -21.54296875, -19.85595703125, -18.1689453125, -16.48193359375, -14.794921875, -13.10791015625, -11.4208984375, -9.73388671875, -8.046875, -6.35986328125, -4.6728515625, -2.98583984375, -1.298828125, 0.38818359375, 2.0751953125, 3.76220703125, 5.44921875, 7.13623046875, 8.8232421875, 10.51025390625, 12.197265625, 13.88427734375, 15.5712890625, 17.25830078125, 18.9453125, 20.63232421875, 22.3193359375, 24.00634765625, 25.693359375, 27.38037109375, 29.0673828125, 30.75439453125, 32.44140625, 34.12841796875, 35.8154296875, 37.50244140625, 39.189453125, 40.87646484375, 42.5634765625, 44.25048828125, 45.9375]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 0.0, 7.0, 4.0, 8.0, 15.0, 17.0, 24.0, 40.0, 63.0, 116.0, 214.0, 429.0, 1132.0, 5063.0, 90128.0, 4058382.0, 33605.0, 3415.0, 799.0, 336.0, 193.0, 114.0, 65.0, 45.0, 30.0, 10.0, 5.0, 8.0, 3.0, 2.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-156.25, -150.54296875, -144.8359375, -139.12890625, -133.421875, -127.71484375, -122.0078125, -116.30078125, -110.59375, -104.88671875, -99.1796875, -93.47265625, -87.765625, -82.05859375, -76.3515625, -70.64453125, -64.9375, -59.23046875, -53.5234375, -47.81640625, -42.109375, -36.40234375, -30.6953125, -24.98828125, -19.28125, -13.57421875, -7.8671875, -2.16015625, 3.546875, 9.25390625, 14.9609375, 20.66796875, 26.375, 32.08203125, 37.7890625, 43.49609375, 49.203125, 54.91015625, 60.6171875, 66.32421875, 72.03125, 77.73828125, 83.4453125, 89.15234375, 94.859375, 100.56640625, 106.2734375, 111.98046875, 117.6875, 123.39453125, 129.1015625, 134.80859375, 140.515625, 146.22265625, 151.9296875, 157.63671875, 163.34375, 169.05078125, 174.7578125, 180.46484375, 186.171875, 191.87890625, 197.5859375, 203.29296875, 209.0]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 31.0, 231.0, 589.0, 143.0, 15.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1170.8314208984375, -1150.0692138671875, -1129.3070068359375, -1108.5447998046875, -1087.78271484375, -1067.0205078125, -1046.25830078125, -1025.49609375, -1004.73388671875, -983.9716796875, -963.2095336914062, -942.4473266601562, -921.6851196289062, -900.9229125976562, -880.1607666015625, -859.3985595703125, -838.6363525390625, -817.8741455078125, -797.1119995117188, -776.3497924804688, -755.5875854492188, -734.8253784179688, -714.063232421875, -693.301025390625, -672.5388793945312, -651.7766723632812, -631.0145263671875, -610.2523193359375, -589.4901123046875, -568.7279052734375, -547.9657592773438, -527.2035522460938, -506.44134521484375, -485.6791687011719, -464.9169616699219, -444.15478515625, -423.392578125, -402.6304016113281, -381.86822509765625, -361.10601806640625, -340.34381103515625, -319.5816345214844, -298.8194274902344, -278.0572509765625, -257.2950439453125, -236.53286743164062, -215.7706756591797, -195.00848388671875, -174.2462921142578, -153.48410034179688, -132.72190856933594, -111.95972442626953, -91.1975326538086, -70.43534088134766, -49.67315673828125, -28.910964965820312, -8.148773193359375, 12.61341667175293, 33.375606536865234, 54.137794494628906, 74.89998626708984, 95.66217803955078, 116.42436218261719, 137.18655395507812, 157.94874572753906]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 5.0, 2.0, 5.0, 3.0, 5.0, 5.0, 0.0, 9.0, 7.0, 16.0, 11.0, 18.0, 20.0, 24.0, 20.0, 21.0, 27.0, 34.0, 39.0, 42.0, 32.0, 37.0, 53.0, 44.0, 54.0, 45.0, 34.0, 30.0, 37.0, 43.0, 31.0, 30.0, 33.0, 24.0, 18.0, 25.0, 18.0, 20.0, 12.0, 19.0, 13.0, 12.0, 10.0, 6.0, 4.0, 1.0, 4.0, 3.0, 5.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-105.19232177734375, -101.75593566894531, -98.3195571899414, -94.88317108154297, -91.44679260253906, -88.01040649414062, -84.57402038574219, -81.13763427734375, -77.70125579833984, -74.2648696899414, -70.8284912109375, -67.39210510253906, -63.95572280883789, -60.51934051513672, -57.08295440673828, -53.64657211303711, -50.21018981933594, -46.773807525634766, -43.337425231933594, -39.901039123535156, -36.464656829833984, -33.02827453613281, -29.591890335083008, -26.155506134033203, -22.71912384033203, -19.28274154663086, -15.846357345581055, -12.409974098205566, -8.973590850830078, -5.537208557128906, -2.1008243560791016, 1.3355598449707031, 4.771942138671875, 8.208325386047363, 11.644708633422852, 15.08109188079834, 18.517475128173828, 21.953857421875, 25.390241622924805, 28.82662582397461, 32.26300811767578, 35.69939041137695, 39.135772705078125, 42.57215881347656, 46.008541107177734, 49.444923400878906, 52.881309509277344, 56.317691802978516, 59.75407409667969, 63.19045639038086, 66.62683868408203, 70.06322479248047, 73.49960327148438, 76.93598937988281, 80.37237548828125, 83.80876159667969, 87.2451400756836, 90.68152618408203, 94.11790466308594, 97.55429077148438, 100.99067687988281, 104.42705535888672, 107.86344146728516, 111.29981994628906, 114.7362060546875]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 6.0, 11.0, 5.0, 10.0, 8.0, 9.0, 13.0, 18.0, 9.0, 24.0, 15.0, 17.0, 19.0, 21.0, 28.0, 33.0, 46.0, 45.0, 35.0, 45.0, 50.0, 40.0, 33.0, 47.0, 31.0, 41.0, 31.0, 27.0, 30.0, 33.0, 35.0, 25.0, 27.0, 21.0, 18.0, 14.0, 17.0, 8.0, 8.0, 13.0, 7.0, 8.0, 6.0, 3.0, 4.0, 2.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-23.3125, -22.607666015625, -21.90283203125, -21.197998046875, -20.4931640625, -19.788330078125, -19.08349609375, -18.378662109375, -17.673828125, -16.968994140625, -16.26416015625, -15.559326171875, -14.8544921875, -14.149658203125, -13.44482421875, -12.739990234375, -12.03515625, -11.330322265625, -10.62548828125, -9.920654296875, -9.2158203125, -8.510986328125, -7.80615234375, -7.101318359375, -6.396484375, -5.691650390625, -4.98681640625, -4.281982421875, -3.5771484375, -2.872314453125, -2.16748046875, -1.462646484375, -0.7578125, -0.052978515625, 0.65185546875, 1.356689453125, 2.0615234375, 2.766357421875, 3.47119140625, 4.176025390625, 4.880859375, 5.585693359375, 6.29052734375, 6.995361328125, 7.7001953125, 8.405029296875, 9.10986328125, 9.814697265625, 10.51953125, 11.224365234375, 11.92919921875, 12.634033203125, 13.3388671875, 14.043701171875, 14.74853515625, 15.453369140625, 16.158203125, 16.863037109375, 17.56787109375, 18.272705078125, 18.9775390625, 19.682373046875, 20.38720703125, 21.092041015625, 21.796875]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 11.0, 11.0, 17.0, 36.0, 46.0, 65.0, 108.0, 166.0, 211.0, 289.0, 483.0, 714.0, 1033.0, 1544.0, 2293.0, 3423.0, 5269.0, 7680.0, 11893.0, 18525.0, 28584.0, 46149.0, 76505.0, 129545.0, 207676.0, 197067.0, 118798.0, 70087.0, 42973.0, 27053.0, 17089.0, 11176.0, 7349.0, 4860.0, 3210.0, 2162.0, 1448.0, 1013.0, 610.0, 456.0, 320.0, 198.0, 128.0, 93.0, 65.0, 30.0, 26.0, 30.0, 13.0, 10.0, 2.0, 5.0, 4.0, 2.0, 2.0, 3.0], "bins": [-1.1328125, -1.0984039306640625, -1.063995361328125, -1.0295867919921875, -0.99517822265625, -0.9607696533203125, -0.926361083984375, -0.8919525146484375, -0.8575439453125, -0.8231353759765625, -0.788726806640625, -0.7543182373046875, -0.71990966796875, -0.6855010986328125, -0.651092529296875, -0.6166839599609375, -0.582275390625, -0.5478668212890625, -0.513458251953125, -0.4790496826171875, -0.44464111328125, -0.4102325439453125, -0.375823974609375, -0.3414154052734375, -0.3070068359375, -0.2725982666015625, -0.238189697265625, -0.2037811279296875, -0.16937255859375, -0.1349639892578125, -0.100555419921875, -0.0661468505859375, -0.03173828125, 0.0026702880859375, 0.037078857421875, 0.0714874267578125, 0.10589599609375, 0.1403045654296875, 0.174713134765625, 0.2091217041015625, 0.2435302734375, 0.2779388427734375, 0.312347412109375, 0.3467559814453125, 0.38116455078125, 0.4155731201171875, 0.449981689453125, 0.4843902587890625, 0.518798828125, 0.5532073974609375, 0.587615966796875, 0.6220245361328125, 0.65643310546875, 0.6908416748046875, 0.725250244140625, 0.7596588134765625, 0.7940673828125, 0.8284759521484375, 0.862884521484375, 0.8972930908203125, 0.93170166015625, 0.9661102294921875, 1.000518798828125, 1.0349273681640625, 1.0693359375]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 6.0, 9.0, 5.0, 9.0, 4.0, 8.0, 12.0, 10.0, 13.0, 15.0, 16.0, 15.0, 24.0, 23.0, 21.0, 32.0, 38.0, 38.0, 48.0, 33.0, 34.0, 39.0, 39.0, 1071.0, 32.0, 45.0, 48.0, 50.0, 28.0, 29.0, 29.0, 19.0, 25.0, 17.0, 26.0, 17.0, 17.0, 11.0, 8.0, 13.0, 13.0, 6.0, 9.0, 3.0, 5.0, 6.0, 2.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.4453125, -13.998046875, -13.55078125, -13.103515625, -12.65625, -12.208984375, -11.76171875, -11.314453125, -10.8671875, -10.419921875, -9.97265625, -9.525390625, -9.078125, -8.630859375, -8.18359375, -7.736328125, -7.2890625, -6.841796875, -6.39453125, -5.947265625, -5.5, -5.052734375, -4.60546875, -4.158203125, -3.7109375, -3.263671875, -2.81640625, -2.369140625, -1.921875, -1.474609375, -1.02734375, -0.580078125, -0.1328125, 0.314453125, 0.76171875, 1.208984375, 1.65625, 2.103515625, 2.55078125, 2.998046875, 3.4453125, 3.892578125, 4.33984375, 4.787109375, 5.234375, 5.681640625, 6.12890625, 6.576171875, 7.0234375, 7.470703125, 7.91796875, 8.365234375, 8.8125, 9.259765625, 9.70703125, 10.154296875, 10.6015625, 11.048828125, 11.49609375, 11.943359375, 12.390625, 12.837890625, 13.28515625, 13.732421875, 14.1796875]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 5.0, 3.0, 8.0, 8.0, 11.0, 32.0, 52.0, 60.0, 105.0, 135.0, 205.0, 287.0, 385.0, 549.0, 796.0, 1067.0, 1425.0, 1987.0, 2625.0, 3538.0, 4942.0, 6895.0, 9416.0, 13533.0, 19262.0, 28582.0, 43256.0, 67772.0, 108420.0, 165769.0, 1232967.0, 133878.0, 83466.0, 52885.0, 34360.0, 22976.0, 15645.0, 10919.0, 7823.0, 5733.0, 4194.0, 2963.0, 2265.0, 1606.0, 1241.0, 892.0, 658.0, 469.0, 331.0, 217.0, 181.0, 112.0, 79.0, 51.0, 38.0, 20.0, 21.0, 11.0, 5.0, 5.0, 2.0, 3.0, 2.0], "bins": [-0.81201171875, -0.7860031127929688, -0.7599945068359375, -0.7339859008789062, -0.707977294921875, -0.6819686889648438, -0.6559600830078125, -0.6299514770507812, -0.60394287109375, -0.5779342651367188, -0.5519256591796875, -0.5259170532226562, -0.499908447265625, -0.47389984130859375, -0.4478912353515625, -0.42188262939453125, -0.3958740234375, -0.36986541748046875, -0.3438568115234375, -0.31784820556640625, -0.291839599609375, -0.26583099365234375, -0.2398223876953125, -0.21381378173828125, -0.18780517578125, -0.16179656982421875, -0.1357879638671875, -0.10977935791015625, -0.083770751953125, -0.05776214599609375, -0.0317535400390625, -0.00574493408203125, 0.020263671875, 0.04627227783203125, 0.0722808837890625, 0.09828948974609375, 0.124298095703125, 0.15030670166015625, 0.1763153076171875, 0.20232391357421875, 0.22833251953125, 0.25434112548828125, 0.2803497314453125, 0.30635833740234375, 0.332366943359375, 0.35837554931640625, 0.3843841552734375, 0.41039276123046875, 0.4364013671875, 0.46240997314453125, 0.4884185791015625, 0.5144271850585938, 0.540435791015625, 0.5664443969726562, 0.5924530029296875, 0.6184616088867188, 0.64447021484375, 0.6704788208007812, 0.6964874267578125, 0.7224960327148438, 0.748504638671875, 0.7745132446289062, 0.8005218505859375, 0.8265304565429688, 0.8525390625]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 2.0, 4.0, 4.0, 12.0, 9.0, 10.0, 22.0, 19.0, 20.0, 33.0, 37.0, 48.0, 56.0, 59.0, 53.0, 52.0, 63.0, 64.0, 51.0, 50.0, 51.0, 46.0, 37.0, 29.0, 33.0, 22.0, 30.0, 15.0, 18.0, 12.0, 8.0, 11.0, 3.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.004974365234375, -0.004823505878448486, -0.004672646522521973, -0.004521787166595459, -0.004370927810668945, -0.004220068454742432, -0.004069209098815918, -0.003918349742889404, -0.0037674903869628906, -0.003616631031036377, -0.0034657716751098633, -0.0033149123191833496, -0.003164052963256836, -0.0030131936073303223, -0.0028623342514038086, -0.002711474895477295, -0.0025606155395507812, -0.0024097561836242676, -0.002258896827697754, -0.0021080374717712402, -0.0019571781158447266, -0.0018063187599182129, -0.0016554594039916992, -0.0015046000480651855, -0.0013537406921386719, -0.0012028813362121582, -0.0010520219802856445, -0.0009011626243591309, -0.0007503032684326172, -0.0005994439125061035, -0.00044858455657958984, -0.00029772520065307617, -0.0001468658447265625, 3.993511199951172e-06, 0.00015485286712646484, 0.0003057122230529785, 0.0004565715789794922, 0.0006074309349060059, 0.0007582902908325195, 0.0009091496467590332, 0.0010600090026855469, 0.0012108683586120605, 0.0013617277145385742, 0.0015125870704650879, 0.0016634464263916016, 0.0018143057823181152, 0.001965165138244629, 0.0021160244941711426, 0.0022668838500976562, 0.00241774320602417, 0.0025686025619506836, 0.0027194619178771973, 0.002870321273803711, 0.0030211806297302246, 0.0031720399856567383, 0.003322899341583252, 0.0034737586975097656, 0.0036246180534362793, 0.003775477409362793, 0.003926336765289307, 0.00407719612121582, 0.004228055477142334, 0.004378914833068848, 0.004529774188995361, 0.004680633544921875]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 1.0, 8.0, 8.0, 10.0, 8.0, 14.0, 25.0, 27.0, 34.0, 51.0, 57.0, 67.0, 90.0, 131.0, 227.0, 465.0, 2905.0, 938114.0, 104304.0, 1013.0, 322.0, 184.0, 123.0, 102.0, 78.0, 35.0, 28.0, 30.0, 28.0, 16.0, 13.0, 7.0, 7.0, 5.0, 3.0, 4.0, 3.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10040283203125, -0.09714317321777344, -0.09388351440429688, -0.09062385559082031, -0.08736419677734375, -0.08410453796386719, -0.08084487915039062, -0.07758522033691406, -0.0743255615234375, -0.07106590270996094, -0.06780624389648438, -0.06454658508300781, -0.06128692626953125, -0.05802726745605469, -0.054767608642578125, -0.05150794982910156, -0.048248291015625, -0.04498863220214844, -0.041728973388671875, -0.03846931457519531, -0.03520965576171875, -0.03194999694824219, -0.028690338134765625, -0.025430679321289062, -0.0221710205078125, -0.018911361694335938, -0.015651702880859375, -0.012392044067382812, -0.00913238525390625, -0.0058727264404296875, -0.002613067626953125, 0.0006465911865234375, 0.00390625, 0.0071659088134765625, 0.010425567626953125, 0.013685226440429688, 0.01694488525390625, 0.020204544067382812, 0.023464202880859375, 0.026723861694335938, 0.0299835205078125, 0.03324317932128906, 0.036502838134765625, 0.03976249694824219, 0.04302215576171875, 0.04628181457519531, 0.049541473388671875, 0.05280113220214844, 0.056060791015625, 0.05932044982910156, 0.06258010864257812, 0.06583976745605469, 0.06909942626953125, 0.07235908508300781, 0.07561874389648438, 0.07887840270996094, 0.0821380615234375, 0.08539772033691406, 0.08865737915039062, 0.09191703796386719, 0.09517669677734375, 0.09843635559082031, 0.10169601440429688, 0.10495567321777344, 0.10821533203125]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 177.0, 806.0, 29.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0139493802562356, -0.012712707743048668, -0.011476034298539162, -0.01023936178535223, -0.009002689272165298, -0.007766015827655792, -0.006529343314468861, -0.005292669869959354, -0.004055997356772423, -0.002819324377924204, -0.0015826516319066286, -0.00034597888588905334, 0.0008906940929591656, 0.0021273670718073845, 0.003364039584994316, 0.004600713029503822, 0.005837385542690754, 0.007074058521538973, 0.008310731500387192, 0.009547404013574123, 0.010784076526761055, 0.012020749971270561, 0.013257422484457493, 0.014494095928966999, 0.01573076844215393, 0.016967441886663437, 0.018204113468527794, 0.0194407869130373, 0.020677460357546806, 0.021914131939411163, 0.02315080538392067, 0.024387478828430176, 0.025624152272939682, 0.026860825717449188, 0.028097497299313545, 0.02933417074382305, 0.030570844188332558, 0.031807515770196915, 0.03304418921470642, 0.03428086265921593, 0.03551753610372543, 0.03675420954823494, 0.037990882992744446, 0.039227552711963654, 0.04046422615647316, 0.041700899600982666, 0.04293757304549217, 0.04417424649000168, 0.045410916209220886, 0.04664758965373039, 0.0478842630982399, 0.049120932817459106, 0.05035760626196861, 0.05159427970647812, 0.052830953150987625, 0.05406762659549713, 0.05530430004000664, 0.056540973484516144, 0.05777764692902565, 0.059014320373535156, 0.060250990092754364, 0.06148766353726387, 0.06272433698177338, 0.06396101415157318, 0.06519768387079239]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 6.0, 8.0, 9.0, 9.0, 9.0, 16.0, 17.0, 30.0, 29.0, 34.0, 37.0, 40.0, 41.0, 38.0, 53.0, 45.0, 44.0, 51.0, 56.0, 59.0, 55.0, 39.0, 42.0, 34.0, 32.0, 37.0, 23.0, 21.0, 10.0, 20.0, 11.0, 10.0, 12.0, 7.0, 5.0, 3.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0036129355430603027, -0.0035112472251057625, -0.0034095589071512222, -0.003307870589196682, -0.0032061822712421417, -0.0031044939532876015, -0.0030028056353330612, -0.002901117317378521, -0.0027994289994239807, -0.0026977406814694405, -0.0025960523635149, -0.00249436404556036, -0.0023926757276058197, -0.0022909874096512794, -0.002189299091696739, -0.002087610773742199, -0.0019859224557876587, -0.0018842341378331184, -0.0017825458198785782, -0.001680857501924038, -0.0015791691839694977, -0.0014774808660149574, -0.0013757925480604172, -0.001274104230105877, -0.0011724159121513367, -0.0010707275941967964, -0.0009690392762422562, -0.0008673509582877159, -0.0007656626403331757, -0.0006639743223786354, -0.0005622860044240952, -0.0004605976864695549, -0.00035890936851501465, -0.0002572210505604744, -0.00015553273260593414, -5.384441465139389e-05, 4.784390330314636e-05, 0.00014953222125768661, 0.00025122053921222687, 0.0003529088571667671, 0.0004545971751213074, 0.0005562854930758476, 0.0006579738110303879, 0.0007596621289849281, 0.0008613504469394684, 0.0009630387648940086, 0.0010647270828485489, 0.0011664154008030891, 0.0012681037187576294, 0.0013697920367121696, 0.00147148035466671, 0.0015731686726212502, 0.0016748569905757904, 0.0017765453085303307, 0.001878233626484871, 0.001979921944439411, 0.0020816102623939514, 0.0021832985803484917, 0.002284986898303032, 0.002386675216257572, 0.0024883635342121124, 0.0025900518521666527, 0.002691740170121193, 0.002793428488075733, 0.0028951168060302734]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 6.0, 11.0, 5.0, 10.0, 8.0, 9.0, 13.0, 18.0, 9.0, 24.0, 15.0, 17.0, 19.0, 21.0, 28.0, 33.0, 46.0, 45.0, 35.0, 45.0, 50.0, 40.0, 33.0, 47.0, 31.0, 41.0, 31.0, 27.0, 30.0, 33.0, 35.0, 25.0, 27.0, 21.0, 18.0, 14.0, 17.0, 8.0, 8.0, 13.0, 7.0, 8.0, 6.0, 3.0, 4.0, 2.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-23.3125, -22.607666015625, -21.90283203125, -21.197998046875, -20.4931640625, -19.788330078125, -19.08349609375, -18.378662109375, -17.673828125, -16.968994140625, -16.26416015625, -15.559326171875, -14.8544921875, -14.149658203125, -13.44482421875, -12.739990234375, -12.03515625, -11.330322265625, -10.62548828125, -9.920654296875, -9.2158203125, -8.510986328125, -7.80615234375, -7.101318359375, -6.396484375, -5.691650390625, -4.98681640625, -4.281982421875, -3.5771484375, -2.872314453125, -2.16748046875, -1.462646484375, -0.7578125, -0.052978515625, 0.65185546875, 1.356689453125, 2.0615234375, 2.766357421875, 3.47119140625, 4.176025390625, 4.880859375, 5.585693359375, 6.29052734375, 6.995361328125, 7.7001953125, 8.405029296875, 9.10986328125, 9.814697265625, 10.51953125, 11.224365234375, 11.92919921875, 12.634033203125, 13.3388671875, 14.043701171875, 14.74853515625, 15.453369140625, 16.158203125, 16.863037109375, 17.56787109375, 18.272705078125, 18.9775390625, 19.682373046875, 20.38720703125, 21.092041015625, 21.796875]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 6.0, 12.0, 6.0, 14.0, 8.0, 16.0, 19.0, 32.0, 30.0, 51.0, 51.0, 89.0, 148.0, 219.0, 327.0, 575.0, 954.0, 1692.0, 3396.0, 8121.0, 29487.0, 274898.0, 660760.0, 47407.0, 11071.0, 4142.0, 2105.0, 1098.0, 612.0, 374.0, 292.0, 148.0, 118.0, 63.0, 57.0, 31.0, 35.0, 17.0, 13.0, 17.0, 7.0, 10.0, 9.0, 5.0, 4.0, 2.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-46.3125, -44.9150390625, -43.517578125, -42.1201171875, -40.72265625, -39.3251953125, -37.927734375, -36.5302734375, -35.1328125, -33.7353515625, -32.337890625, -30.9404296875, -29.54296875, -28.1455078125, -26.748046875, -25.3505859375, -23.953125, -22.5556640625, -21.158203125, -19.7607421875, -18.36328125, -16.9658203125, -15.568359375, -14.1708984375, -12.7734375, -11.3759765625, -9.978515625, -8.5810546875, -7.18359375, -5.7861328125, -4.388671875, -2.9912109375, -1.59375, -0.1962890625, 1.201171875, 2.5986328125, 3.99609375, 5.3935546875, 6.791015625, 8.1884765625, 9.5859375, 10.9833984375, 12.380859375, 13.7783203125, 15.17578125, 16.5732421875, 17.970703125, 19.3681640625, 20.765625, 22.1630859375, 23.560546875, 24.9580078125, 26.35546875, 27.7529296875, 29.150390625, 30.5478515625, 31.9453125, 33.3427734375, 34.740234375, 36.1376953125, 37.53515625, 38.9326171875, 40.330078125, 41.7275390625, 43.125]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 1.0, 2.0, 5.0, 5.0, 4.0, 6.0, 6.0, 6.0, 14.0, 13.0, 15.0, 20.0, 13.0, 23.0, 29.0, 49.0, 37.0, 36.0, 40.0, 51.0, 62.0, 79.0, 188.0, 1693.0, 192.0, 76.0, 53.0, 34.0, 29.0, 34.0, 28.0, 34.0, 32.0, 27.0, 18.0, 14.0, 16.0, 10.0, 12.0, 15.0, 7.0, 3.0, 5.0, 6.0, 4.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-67.4375, -65.48291015625, -63.5283203125, -61.57373046875, -59.619140625, -57.66455078125, -55.7099609375, -53.75537109375, -51.80078125, -49.84619140625, -47.8916015625, -45.93701171875, -43.982421875, -42.02783203125, -40.0732421875, -38.11865234375, -36.1640625, -34.20947265625, -32.2548828125, -30.30029296875, -28.345703125, -26.39111328125, -24.4365234375, -22.48193359375, -20.52734375, -18.57275390625, -16.6181640625, -14.66357421875, -12.708984375, -10.75439453125, -8.7998046875, -6.84521484375, -4.890625, -2.93603515625, -0.9814453125, 0.97314453125, 2.927734375, 4.88232421875, 6.8369140625, 8.79150390625, 10.74609375, 12.70068359375, 14.6552734375, 16.60986328125, 18.564453125, 20.51904296875, 22.4736328125, 24.42822265625, 26.3828125, 28.33740234375, 30.2919921875, 32.24658203125, 34.201171875, 36.15576171875, 38.1103515625, 40.06494140625, 42.01953125, 43.97412109375, 45.9287109375, 47.88330078125, 49.837890625, 51.79248046875, 53.7470703125, 55.70166015625, 57.65625]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 6.0, 7.0, 5.0, 3.0, 12.0, 13.0, 13.0, 24.0, 21.0, 21.0, 32.0, 33.0, 56.0, 56.0, 60.0, 110.0, 164.0, 351.0, 1280.0, 13807.0, 3022527.0, 102120.0, 3541.0, 596.0, 238.0, 145.0, 100.0, 81.0, 52.0, 45.0, 33.0, 28.0, 30.0, 15.0, 14.0, 15.0, 8.0, 9.0, 5.0, 7.0, 7.0, 5.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-131.0, -126.595703125, -122.19140625, -117.787109375, -113.3828125, -108.978515625, -104.57421875, -100.169921875, -95.765625, -91.361328125, -86.95703125, -82.552734375, -78.1484375, -73.744140625, -69.33984375, -64.935546875, -60.53125, -56.126953125, -51.72265625, -47.318359375, -42.9140625, -38.509765625, -34.10546875, -29.701171875, -25.296875, -20.892578125, -16.48828125, -12.083984375, -7.6796875, -3.275390625, 1.12890625, 5.533203125, 9.9375, 14.341796875, 18.74609375, 23.150390625, 27.5546875, 31.958984375, 36.36328125, 40.767578125, 45.171875, 49.576171875, 53.98046875, 58.384765625, 62.7890625, 67.193359375, 71.59765625, 76.001953125, 80.40625, 84.810546875, 89.21484375, 93.619140625, 98.0234375, 102.427734375, 106.83203125, 111.236328125, 115.640625, 120.044921875, 124.44921875, 128.853515625, 133.2578125, 137.662109375, 142.06640625, 146.470703125, 150.875]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 123.0, 698.0, 176.0, 17.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-129.29273986816406, -118.11075592041016, -106.92877197265625, -95.74678039550781, -84.56480407714844, -73.3828125, -62.200828552246094, -51.01884460449219, -39.83686065673828, -28.654876708984375, -17.472890853881836, -6.290904998779297, 4.891078948974609, 16.073062896728516, 27.255050659179688, 38.437034606933594, 49.6190185546875, 60.801002502441406, 71.98298645019531, 83.16497802734375, 94.34695434570312, 105.52894592285156, 116.71092987060547, 127.89291381835938, 139.07489013671875, 150.2568817138672, 161.43885803222656, 172.620849609375, 183.80282592773438, 194.9848175048828, 206.16680908203125, 217.34878540039062, 228.53079223632812, 239.71278381347656, 250.89476013183594, 262.0767517089844, 273.25872802734375, 284.4407043457031, 295.6227111816406, 306.8046875, 317.9866638183594, 329.16864013671875, 340.35064697265625, 351.5326232910156, 362.714599609375, 373.8965759277344, 385.0785827636719, 396.26055908203125, 407.44256591796875, 418.6245422363281, 429.8065490722656, 440.988525390625, 452.1705017089844, 463.35247802734375, 474.53448486328125, 485.7164611816406, 496.8984375, 508.0804138183594, 519.2623901367188, 530.4443969726562, 541.6264038085938, 552.808349609375, 563.9903564453125, 575.17236328125, 586.3543090820312]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 7.0, 5.0, 7.0, 2.0, 2.0, 9.0, 4.0, 16.0, 14.0, 22.0, 11.0, 16.0, 10.0, 18.0, 20.0, 20.0, 25.0, 30.0, 32.0, 30.0, 34.0, 30.0, 37.0, 42.0, 37.0, 43.0, 39.0, 37.0, 37.0, 26.0, 31.0, 32.0, 51.0, 23.0, 23.0, 28.0, 22.0, 18.0, 19.0, 16.0, 16.0, 7.0, 7.0, 10.0, 7.0, 9.0, 4.0, 8.0, 3.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 4.0], "bins": [-142.92208862304688, -138.67311096191406, -134.42413330078125, -130.17515563964844, -125.9261703491211, -121.67719268798828, -117.42821502685547, -113.17923736572266, -108.93025207519531, -104.6812744140625, -100.43229675292969, -96.18331909179688, -91.93433380126953, -87.68535614013672, -83.4363784790039, -79.1874008178711, -74.93842315673828, -70.68944549560547, -66.44046783447266, -62.19148635864258, -57.9425048828125, -53.69352722167969, -49.444549560546875, -45.19557189941406, -40.946590423583984, -36.69761276245117, -32.448631286621094, -28.19965362548828, -23.950674057006836, -19.70169448852539, -15.452716827392578, -11.203737258911133, -6.9547576904296875, -2.7057785987854004, 1.5432004928588867, 5.792179107666016, 10.041158676147461, 14.290138244628906, 18.53911590576172, 22.788095474243164, 27.03707504272461, 31.286054611206055, 35.5350341796875, 39.78401184082031, 44.032989501953125, 48.2819709777832, 52.530948638916016, 56.779930114746094, 61.028907775878906, 65.27788543701172, 69.52686309814453, 73.77584838867188, 78.02482604980469, 82.2738037109375, 86.52278137207031, 90.77175903320312, 95.02073669433594, 99.26971435546875, 103.51869201660156, 107.76766967773438, 112.01665496826172, 116.26563262939453, 120.51461029052734, 124.76358795166016, 129.0125732421875]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 6.0, 6.0, 7.0, 5.0, 11.0, 7.0, 13.0, 13.0, 12.0, 13.0, 23.0, 19.0, 18.0, 16.0, 27.0, 29.0, 28.0, 30.0, 36.0, 43.0, 45.0, 58.0, 40.0, 39.0, 38.0, 40.0, 35.0, 22.0, 30.0, 28.0, 32.0, 33.0, 28.0, 24.0, 25.0, 19.0, 22.0, 13.0, 12.0, 5.0, 15.0, 7.0, 11.0, 8.0, 3.0, 3.0, 2.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-23.5625, -22.853759765625, -22.14501953125, -21.436279296875, -20.7275390625, -20.018798828125, -19.31005859375, -18.601318359375, -17.892578125, -17.183837890625, -16.47509765625, -15.766357421875, -15.0576171875, -14.348876953125, -13.64013671875, -12.931396484375, -12.22265625, -11.513916015625, -10.80517578125, -10.096435546875, -9.3876953125, -8.678955078125, -7.97021484375, -7.261474609375, -6.552734375, -5.843994140625, -5.13525390625, -4.426513671875, -3.7177734375, -3.009033203125, -2.30029296875, -1.591552734375, -0.8828125, -0.174072265625, 0.53466796875, 1.243408203125, 1.9521484375, 2.660888671875, 3.36962890625, 4.078369140625, 4.787109375, 5.495849609375, 6.20458984375, 6.913330078125, 7.6220703125, 8.330810546875, 9.03955078125, 9.748291015625, 10.45703125, 11.165771484375, 11.87451171875, 12.583251953125, 13.2919921875, 14.000732421875, 14.70947265625, 15.418212890625, 16.126953125, 16.835693359375, 17.54443359375, 18.253173828125, 18.9619140625, 19.670654296875, 20.37939453125, 21.088134765625, 21.796875]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 5.0, 14.0, 12.0, 13.0, 24.0, 11.0, 27.0, 28.0, 35.0, 51.0, 57.0, 78.0, 103.0, 150.0, 203.0, 309.0, 544.0, 904.0, 1802.0, 4432.0, 15817.0, 323350.0, 3450076.0, 369560.0, 17386.0, 4644.0, 1959.0, 946.0, 548.0, 319.0, 211.0, 170.0, 118.0, 86.0, 69.0, 41.0, 32.0, 30.0, 25.0, 17.0, 16.0, 12.0, 11.0, 15.0, 4.0, 6.0, 8.0, 0.0, 3.0, 2.0, 2.0, 2.0], "bins": [-71.9375, -69.853515625, -67.76953125, -65.685546875, -63.6015625, -61.517578125, -59.43359375, -57.349609375, -55.265625, -53.181640625, -51.09765625, -49.013671875, -46.9296875, -44.845703125, -42.76171875, -40.677734375, -38.59375, -36.509765625, -34.42578125, -32.341796875, -30.2578125, -28.173828125, -26.08984375, -24.005859375, -21.921875, -19.837890625, -17.75390625, -15.669921875, -13.5859375, -11.501953125, -9.41796875, -7.333984375, -5.25, -3.166015625, -1.08203125, 1.001953125, 3.0859375, 5.169921875, 7.25390625, 9.337890625, 11.421875, 13.505859375, 15.58984375, 17.673828125, 19.7578125, 21.841796875, 23.92578125, 26.009765625, 28.09375, 30.177734375, 32.26171875, 34.345703125, 36.4296875, 38.513671875, 40.59765625, 42.681640625, 44.765625, 46.849609375, 48.93359375, 51.017578125, 53.1015625, 55.185546875, 57.26953125, 59.353515625, 61.4375]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 6.0, 5.0, 11.0, 16.0, 13.0, 25.0, 50.0, 68.0, 92.0, 160.0, 251.0, 474.0, 754.0, 795.0, 568.0, 316.0, 169.0, 97.0, 64.0, 33.0, 28.0, 18.0, 18.0, 7.0, 7.0, 4.0, 5.0, 3.0, 6.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-45.78125, -44.439453125, -43.09765625, -41.755859375, -40.4140625, -39.072265625, -37.73046875, -36.388671875, -35.046875, -33.705078125, -32.36328125, -31.021484375, -29.6796875, -28.337890625, -26.99609375, -25.654296875, -24.3125, -22.970703125, -21.62890625, -20.287109375, -18.9453125, -17.603515625, -16.26171875, -14.919921875, -13.578125, -12.236328125, -10.89453125, -9.552734375, -8.2109375, -6.869140625, -5.52734375, -4.185546875, -2.84375, -1.501953125, -0.16015625, 1.181640625, 2.5234375, 3.865234375, 5.20703125, 6.548828125, 7.890625, 9.232421875, 10.57421875, 11.916015625, 13.2578125, 14.599609375, 15.94140625, 17.283203125, 18.625, 19.966796875, 21.30859375, 22.650390625, 23.9921875, 25.333984375, 26.67578125, 28.017578125, 29.359375, 30.701171875, 32.04296875, 33.384765625, 34.7265625, 36.068359375, 37.41015625, 38.751953125, 40.09375]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 4.0, 2.0, 4.0, 2.0, 6.0, 14.0, 20.0, 16.0, 26.0, 33.0, 56.0, 84.0, 125.0, 197.0, 331.0, 714.0, 1758.0, 5768.0, 30527.0, 1554792.0, 2553722.0, 36059.0, 6359.0, 1845.0, 791.0, 405.0, 220.0, 140.0, 77.0, 71.0, 31.0, 36.0, 15.0, 16.0, 13.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-99.5, -96.1875, -92.875, -89.5625, -86.25, -82.9375, -79.625, -76.3125, -73.0, -69.6875, -66.375, -63.0625, -59.75, -56.4375, -53.125, -49.8125, -46.5, -43.1875, -39.875, -36.5625, -33.25, -29.9375, -26.625, -23.3125, -20.0, -16.6875, -13.375, -10.0625, -6.75, -3.4375, -0.125, 3.1875, 6.5, 9.8125, 13.125, 16.4375, 19.75, 23.0625, 26.375, 29.6875, 33.0, 36.3125, 39.625, 42.9375, 46.25, 49.5625, 52.875, 56.1875, 59.5, 62.8125, 66.125, 69.4375, 72.75, 76.0625, 79.375, 82.6875, 86.0, 89.3125, 92.625, 95.9375, 99.25, 102.5625, 105.875, 109.1875, 112.5]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 5.0, 11.0, 34.0, 53.0, 87.0, 214.0, 259.0, 165.0, 97.0, 46.0, 25.0, 5.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-229.7823028564453, -223.08108520507812, -216.37986755371094, -209.67864990234375, -202.97743225097656, -196.27621459960938, -189.57498168945312, -182.87376403808594, -176.17254638671875, -169.47132873535156, -162.77011108398438, -156.0688934326172, -149.36767578125, -142.66644287109375, -135.96524047851562, -129.26400756835938, -122.56279754638672, -115.86157989501953, -109.16036224365234, -102.45913696289062, -95.75791931152344, -89.05670166015625, -82.35548400878906, -75.65426635742188, -68.95304870605469, -62.2518310546875, -55.55060958862305, -48.84939193725586, -42.148170471191406, -35.44695281982422, -28.74573516845703, -22.044513702392578, -15.343292236328125, -8.642072677612305, -1.9408540725708008, 4.760364532470703, 11.461584091186523, 18.162803649902344, 24.86402130126953, 31.565242767333984, 38.26646041870117, 44.96767807006836, 51.66889953613281, 58.3701171875, 65.07133483886719, 71.77255249023438, 78.47377014160156, 85.17499542236328, 91.87621307373047, 98.57743072509766, 105.27864837646484, 111.97987365722656, 118.68109130859375, 125.38230895996094, 132.08352661132812, 138.7847442626953, 145.4859619140625, 152.1871795654297, 158.88839721679688, 165.58961486816406, 172.29083251953125, 178.9920654296875, 185.69326782226562, 192.39450073242188, 199.09571838378906]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 5.0, 1.0, 4.0, 7.0, 4.0, 9.0, 5.0, 7.0, 8.0, 17.0, 10.0, 14.0, 23.0, 22.0, 18.0, 22.0, 34.0, 28.0, 35.0, 38.0, 33.0, 31.0, 40.0, 41.0, 49.0, 37.0, 35.0, 44.0, 54.0, 39.0, 34.0, 32.0, 32.0, 25.0, 30.0, 22.0, 18.0, 17.0, 16.0, 14.0, 10.0, 10.0, 5.0, 9.0, 7.0, 3.0, 6.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.41238403320312, -84.44105529785156, -81.46971893310547, -78.4983901977539, -75.52705383300781, -72.55572509765625, -69.58439636230469, -66.6130599975586, -63.64173126220703, -60.6703987121582, -57.699066162109375, -54.72773742675781, -51.756404876708984, -48.785072326660156, -45.81373977661133, -42.8424072265625, -39.87107467651367, -36.899742126464844, -33.928409576416016, -30.95707893371582, -27.985748291015625, -25.014415740966797, -22.04308319091797, -19.071752548217773, -16.100419998168945, -13.129088401794434, -10.157756805419922, -7.186424255371094, -4.215092658996582, -1.2437610626220703, 1.7275714874267578, 4.698902130126953, 7.670234680175781, 10.641566276550293, 13.612897872924805, 16.584230422973633, 19.555561065673828, 22.526893615722656, 25.498226165771484, 28.46955680847168, 31.440889358520508, 34.4122200012207, 37.38355255126953, 40.35488510131836, 43.32621765136719, 46.29754638671875, 49.268882751464844, 52.240211486816406, 55.211544036865234, 58.18287658691406, 61.15420913696289, 64.12554168701172, 67.09687042236328, 70.06820678710938, 73.03953552246094, 76.0108642578125, 78.9822006225586, 81.95352935791016, 84.92486572265625, 87.89619445800781, 90.8675308227539, 93.83885955810547, 96.81019592285156, 99.78152465820312, 102.75285339355469]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 7.0, 4.0, 4.0, 6.0, 10.0, 13.0, 8.0, 4.0, 14.0, 17.0, 14.0, 14.0, 28.0, 29.0, 22.0, 32.0, 25.0, 41.0, 33.0, 44.0, 53.0, 47.0, 52.0, 47.0, 32.0, 45.0, 42.0, 40.0, 41.0, 28.0, 29.0, 23.0, 20.0, 21.0, 18.0, 21.0, 14.0, 13.0, 14.0, 11.0, 9.0, 2.0, 5.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-26.40625, -25.624755859375, -24.84326171875, -24.061767578125, -23.2802734375, -22.498779296875, -21.71728515625, -20.935791015625, -20.154296875, -19.372802734375, -18.59130859375, -17.809814453125, -17.0283203125, -16.246826171875, -15.46533203125, -14.683837890625, -13.90234375, -13.120849609375, -12.33935546875, -11.557861328125, -10.7763671875, -9.994873046875, -9.21337890625, -8.431884765625, -7.650390625, -6.868896484375, -6.08740234375, -5.305908203125, -4.5244140625, -3.742919921875, -2.96142578125, -2.179931640625, -1.3984375, -0.616943359375, 0.16455078125, 0.946044921875, 1.7275390625, 2.509033203125, 3.29052734375, 4.072021484375, 4.853515625, 5.635009765625, 6.41650390625, 7.197998046875, 7.9794921875, 8.760986328125, 9.54248046875, 10.323974609375, 11.10546875, 11.886962890625, 12.66845703125, 13.449951171875, 14.2314453125, 15.012939453125, 15.79443359375, 16.575927734375, 17.357421875, 18.138916015625, 18.92041015625, 19.701904296875, 20.4833984375, 21.264892578125, 22.04638671875, 22.827880859375, 23.609375]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 2.0, 14.0, 16.0, 8.0, 20.0, 24.0, 48.0, 63.0, 79.0, 130.0, 196.0, 271.0, 373.0, 560.0, 869.0, 1244.0, 1898.0, 2803.0, 4457.0, 6804.0, 10575.0, 16710.0, 26885.0, 44932.0, 76935.0, 138036.0, 236145.0, 202655.0, 111899.0, 63115.0, 37284.0, 23032.0, 14124.0, 9105.0, 5965.0, 3788.0, 2441.0, 1667.0, 1072.0, 736.0, 458.0, 361.0, 227.0, 170.0, 120.0, 71.0, 52.0, 40.0, 27.0, 25.0, 6.0, 8.0, 2.0, 5.0, 3.0, 7.0, 1.0, 1.0], "bins": [-1.26171875, -1.2232818603515625, -1.184844970703125, -1.1464080810546875, -1.10797119140625, -1.0695343017578125, -1.031097412109375, -0.9926605224609375, -0.9542236328125, -0.9157867431640625, -0.877349853515625, -0.8389129638671875, -0.80047607421875, -0.7620391845703125, -0.723602294921875, -0.6851654052734375, -0.646728515625, -0.6082916259765625, -0.569854736328125, -0.5314178466796875, -0.49298095703125, -0.4545440673828125, -0.416107177734375, -0.3776702880859375, -0.3392333984375, -0.3007965087890625, -0.262359619140625, -0.2239227294921875, -0.18548583984375, -0.1470489501953125, -0.108612060546875, -0.0701751708984375, -0.03173828125, 0.0066986083984375, 0.045135498046875, 0.0835723876953125, 0.12200927734375, 0.1604461669921875, 0.198883056640625, 0.2373199462890625, 0.2757568359375, 0.3141937255859375, 0.352630615234375, 0.3910675048828125, 0.42950439453125, 0.4679412841796875, 0.506378173828125, 0.5448150634765625, 0.583251953125, 0.6216888427734375, 0.660125732421875, 0.6985626220703125, 0.73699951171875, 0.7754364013671875, 0.813873291015625, 0.8523101806640625, 0.8907470703125, 0.9291839599609375, 0.967620849609375, 1.0060577392578125, 1.04449462890625, 1.0829315185546875, 1.121368408203125, 1.1598052978515625, 1.1982421875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 7.0, 7.0, 4.0, 6.0, 7.0, 11.0, 6.0, 6.0, 15.0, 24.0, 20.0, 18.0, 36.0, 37.0, 36.0, 33.0, 49.0, 39.0, 41.0, 31.0, 49.0, 1069.0, 31.0, 47.0, 46.0, 36.0, 40.0, 40.0, 35.0, 32.0, 26.0, 24.0, 24.0, 23.0, 14.0, 12.0, 13.0, 10.0, 6.0, 6.0, 7.0, 4.0, 6.0, 3.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.78125, -15.24755859375, -14.7138671875, -14.18017578125, -13.646484375, -13.11279296875, -12.5791015625, -12.04541015625, -11.51171875, -10.97802734375, -10.4443359375, -9.91064453125, -9.376953125, -8.84326171875, -8.3095703125, -7.77587890625, -7.2421875, -6.70849609375, -6.1748046875, -5.64111328125, -5.107421875, -4.57373046875, -4.0400390625, -3.50634765625, -2.97265625, -2.43896484375, -1.9052734375, -1.37158203125, -0.837890625, -0.30419921875, 0.2294921875, 0.76318359375, 1.296875, 1.83056640625, 2.3642578125, 2.89794921875, 3.431640625, 3.96533203125, 4.4990234375, 5.03271484375, 5.56640625, 6.10009765625, 6.6337890625, 7.16748046875, 7.701171875, 8.23486328125, 8.7685546875, 9.30224609375, 9.8359375, 10.36962890625, 10.9033203125, 11.43701171875, 11.970703125, 12.50439453125, 13.0380859375, 13.57177734375, 14.10546875, 14.63916015625, 15.1728515625, 15.70654296875, 16.240234375, 16.77392578125, 17.3076171875, 17.84130859375, 18.375]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 7.0, 20.0, 14.0, 24.0, 49.0, 65.0, 72.0, 148.0, 225.0, 351.0, 464.0, 727.0, 1005.0, 1510.0, 2138.0, 3139.0, 4565.0, 6937.0, 10322.0, 15610.0, 24321.0, 38225.0, 61161.0, 100914.0, 170499.0, 1266645.0, 148471.0, 87944.0, 53659.0, 33552.0, 21504.0, 14097.0, 9351.0, 6187.0, 4102.0, 2868.0, 1990.0, 1358.0, 969.0, 664.0, 406.0, 291.0, 196.0, 132.0, 82.0, 58.0, 30.0, 22.0, 16.0, 14.0, 8.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0], "bins": [-1.03125, -0.9993896484375, -0.967529296875, -0.9356689453125, -0.90380859375, -0.8719482421875, -0.840087890625, -0.8082275390625, -0.7763671875, -0.7445068359375, -0.712646484375, -0.6807861328125, -0.64892578125, -0.6170654296875, -0.585205078125, -0.5533447265625, -0.521484375, -0.4896240234375, -0.457763671875, -0.4259033203125, -0.39404296875, -0.3621826171875, -0.330322265625, -0.2984619140625, -0.2666015625, -0.2347412109375, -0.202880859375, -0.1710205078125, -0.13916015625, -0.1072998046875, -0.075439453125, -0.0435791015625, -0.01171875, 0.0201416015625, 0.052001953125, 0.0838623046875, 0.11572265625, 0.1475830078125, 0.179443359375, 0.2113037109375, 0.2431640625, 0.2750244140625, 0.306884765625, 0.3387451171875, 0.37060546875, 0.4024658203125, 0.434326171875, 0.4661865234375, 0.498046875, 0.5299072265625, 0.561767578125, 0.5936279296875, 0.62548828125, 0.6573486328125, 0.689208984375, 0.7210693359375, 0.7529296875, 0.7847900390625, 0.816650390625, 0.8485107421875, 0.88037109375, 0.9122314453125, 0.944091796875, 0.9759521484375, 1.0078125]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 5.0, 3.0, 2.0, 0.0, 6.0, 5.0, 4.0, 4.0, 3.0, 9.0, 11.0, 13.0, 13.0, 17.0, 25.0, 29.0, 26.0, 32.0, 36.0, 48.0, 40.0, 42.0, 44.0, 49.0, 51.0, 69.0, 52.0, 48.0, 46.0, 41.0, 44.0, 34.0, 24.0, 30.0, 22.0, 9.0, 17.0, 9.0, 6.0, 2.0, 12.0, 4.0, 6.0, 2.0, 5.0, 1.0, 1.0, 4.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.004474639892578125, -0.004335999488830566, -0.004197359085083008, -0.004058718681335449, -0.003920078277587891, -0.003781437873840332, -0.0036427974700927734, -0.003504157066345215, -0.0033655166625976562, -0.0032268762588500977, -0.003088235855102539, -0.0029495954513549805, -0.002810955047607422, -0.0026723146438598633, -0.0025336742401123047, -0.002395033836364746, -0.0022563934326171875, -0.002117753028869629, -0.0019791126251220703, -0.0018404722213745117, -0.0017018318176269531, -0.0015631914138793945, -0.001424551010131836, -0.0012859106063842773, -0.0011472702026367188, -0.0010086297988891602, -0.0008699893951416016, -0.000731348991394043, -0.0005927085876464844, -0.0004540681838989258, -0.0003154277801513672, -0.0001767873764038086, -3.814697265625e-05, 0.0001004934310913086, 0.0002391338348388672, 0.0003777742385864258, 0.0005164146423339844, 0.000655055046081543, 0.0007936954498291016, 0.0009323358535766602, 0.0010709762573242188, 0.0012096166610717773, 0.001348257064819336, 0.0014868974685668945, 0.0016255378723144531, 0.0017641782760620117, 0.0019028186798095703, 0.002041459083557129, 0.0021800994873046875, 0.002318739891052246, 0.0024573802947998047, 0.0025960206985473633, 0.002734661102294922, 0.0028733015060424805, 0.003011941909790039, 0.0031505823135375977, 0.0032892227172851562, 0.003427863121032715, 0.0035665035247802734, 0.003705143928527832, 0.0038437843322753906, 0.003982424736022949, 0.004121065139770508, 0.004259705543518066, 0.004398345947265625]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 6.0, 4.0, 3.0, 1.0, 2.0, 2.0, 9.0, 9.0, 8.0, 6.0, 14.0, 14.0, 8.0, 19.0, 27.0, 21.0, 41.0, 41.0, 68.0, 94.0, 125.0, 165.0, 257.0, 524.0, 3718.0, 902116.0, 138796.0, 1296.0, 383.0, 201.0, 134.0, 97.0, 81.0, 67.0, 51.0, 29.0, 23.0, 26.0, 14.0, 14.0, 14.0, 6.0, 4.0, 5.0, 9.0, 7.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.093994140625, -0.09104061126708984, -0.08808708190917969, -0.08513355255126953, -0.08218002319335938, -0.07922649383544922, -0.07627296447753906, -0.0733194351196289, -0.07036590576171875, -0.0674123764038086, -0.06445884704589844, -0.06150531768798828, -0.058551788330078125, -0.05559825897216797, -0.05264472961425781, -0.049691200256347656, -0.0467376708984375, -0.043784141540527344, -0.04083061218261719, -0.03787708282470703, -0.034923553466796875, -0.03197002410888672, -0.029016494750976562, -0.026062965393066406, -0.02310943603515625, -0.020155906677246094, -0.017202377319335938, -0.014248847961425781, -0.011295318603515625, -0.008341789245605469, -0.0053882598876953125, -0.0024347305297851562, 0.000518798828125, 0.0034723281860351562, 0.0064258575439453125, 0.009379386901855469, 0.012332916259765625, 0.015286445617675781, 0.018239974975585938, 0.021193504333496094, 0.02414703369140625, 0.027100563049316406, 0.030054092407226562, 0.03300762176513672, 0.035961151123046875, 0.03891468048095703, 0.04186820983886719, 0.044821739196777344, 0.0477752685546875, 0.050728797912597656, 0.05368232727050781, 0.05663585662841797, 0.059589385986328125, 0.06254291534423828, 0.06549644470214844, 0.0684499740600586, 0.07140350341796875, 0.0743570327758789, 0.07731056213378906, 0.08026409149169922, 0.08321762084960938, 0.08617115020751953, 0.08912467956542969, 0.09207820892333984, 0.09503173828125]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 33.0, 751.0, 232.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0036853814963251352, -0.0026991544291377068, -0.001712927594780922, -0.0007267005275934935, 0.00025952630676329136, 0.0012457531411200762, 0.0022319804411381483, 0.003218207275494933, 0.004204434342682362, 0.005190661177039146, 0.006176888011395931, 0.007163115311414003, 0.008149342611432076, 0.009135568514466286, 0.010121796280145645, 0.01110802311450243, 0.012094249948859215, 0.013080476783216, 0.014066703617572784, 0.015052931383252144, 0.016039157286286354, 0.017025385051965714, 0.018011610954999924, 0.018997838720679283, 0.019984064623713493, 0.020970292389392853, 0.021956518292427063, 0.022942746058106422, 0.023928971961140633, 0.024915199726819992, 0.025901425629854202, 0.02688765339553356, 0.02787388116121292, 0.02886010892689228, 0.02984633482992649, 0.03083256259560585, 0.03181878849864006, 0.03280501440167427, 0.03379124402999878, 0.03477746993303299, 0.0357636958360672, 0.03674992173910141, 0.03773615136742592, 0.03872237727046013, 0.03970860317349434, 0.04069482907652855, 0.04168105870485306, 0.04266728460788727, 0.04365351051092148, 0.04463973641395569, 0.0456259660422802, 0.04661219194531441, 0.04759841784834862, 0.04858464375138283, 0.049570873379707336, 0.05055709928274155, 0.051543328911066055, 0.052529554814100266, 0.053515784442424774, 0.054502010345458984, 0.055488236248493195, 0.056474462151527405, 0.05746069177985191, 0.058446917682886124, 0.059433143585920334]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 6.0, 2.0, 6.0, 5.0, 6.0, 7.0, 12.0, 18.0, 7.0, 15.0, 19.0, 29.0, 28.0, 25.0, 39.0, 41.0, 45.0, 38.0, 41.0, 46.0, 52.0, 42.0, 45.0, 47.0, 41.0, 42.0, 43.0, 48.0, 36.0, 34.0, 22.0, 18.0, 12.0, 20.0, 20.0, 18.0, 7.0, 5.0, 8.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.0033148527145385742, -0.0032183146104216576, -0.003121776506304741, -0.0030252384021878242, -0.0029287002980709076, -0.002832162193953991, -0.0027356240898370743, -0.0026390859857201576, -0.002542547881603241, -0.0024460097774863243, -0.0023494716733694077, -0.002252933569252491, -0.0021563954651355743, -0.0020598573610186577, -0.001963319256901741, -0.0018667811527848244, -0.0017702430486679077, -0.001673704944550991, -0.0015771668404340744, -0.0014806287363171577, -0.001384090632200241, -0.0012875525280833244, -0.0011910144239664078, -0.0010944763198494911, -0.0009979382157325745, -0.0009014001116156578, -0.0008048620074987411, -0.0007083239033818245, -0.0006117857992649078, -0.0005152476951479912, -0.0004187095910310745, -0.00032217148691415787, -0.0002256333827972412, -0.00012909527868032455, -3.25571745634079e-05, 6.398092955350876e-05, 0.00016051903367042542, 0.00025705713778734207, 0.00035359524190425873, 0.0004501333460211754, 0.000546671450138092, 0.0006432095542550087, 0.0007397476583719254, 0.000836285762488842, 0.0009328238666057587, 0.0010293619707226753, 0.001125900074839592, 0.0012224381789565086, 0.0013189762830734253, 0.001415514387190342, 0.0015120524913072586, 0.0016085905954241753, 0.001705128699541092, 0.0018016668036580086, 0.0018982049077749252, 0.001994743011891842, 0.0020912811160087585, 0.002187819220125675, 0.002284357324242592, 0.0023808954283595085, 0.002477433532476425, 0.002573971636593342, 0.0026705097407102585, 0.002767047844827175, 0.002863585948944092]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 7.0, 4.0, 4.0, 6.0, 10.0, 13.0, 8.0, 4.0, 14.0, 17.0, 14.0, 14.0, 28.0, 29.0, 22.0, 32.0, 25.0, 41.0, 33.0, 44.0, 53.0, 47.0, 52.0, 47.0, 32.0, 45.0, 42.0, 40.0, 41.0, 28.0, 29.0, 23.0, 20.0, 21.0, 18.0, 21.0, 14.0, 13.0, 14.0, 11.0, 9.0, 2.0, 5.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-26.40625, -25.624755859375, -24.84326171875, -24.061767578125, -23.2802734375, -22.498779296875, -21.71728515625, -20.935791015625, -20.154296875, -19.372802734375, -18.59130859375, -17.809814453125, -17.0283203125, -16.246826171875, -15.46533203125, -14.683837890625, -13.90234375, -13.120849609375, -12.33935546875, -11.557861328125, -10.7763671875, -9.994873046875, -9.21337890625, -8.431884765625, -7.650390625, -6.868896484375, -6.08740234375, -5.305908203125, -4.5244140625, -3.742919921875, -2.96142578125, -2.179931640625, -1.3984375, -0.616943359375, 0.16455078125, 0.946044921875, 1.7275390625, 2.509033203125, 3.29052734375, 4.072021484375, 4.853515625, 5.635009765625, 6.41650390625, 7.197998046875, 7.9794921875, 8.760986328125, 9.54248046875, 10.323974609375, 11.10546875, 11.886962890625, 12.66845703125, 13.449951171875, 14.2314453125, 15.012939453125, 15.79443359375, 16.575927734375, 17.357421875, 18.138916015625, 18.92041015625, 19.701904296875, 20.4833984375, 21.264892578125, 22.04638671875, 22.827880859375, 23.609375]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 3.0, 4.0, 8.0, 9.0, 9.0, 16.0, 25.0, 25.0, 24.0, 28.0, 56.0, 63.0, 67.0, 99.0, 138.0, 183.0, 295.0, 374.0, 520.0, 889.0, 1581.0, 3785.0, 10974.0, 49929.0, 766488.0, 177895.0, 22641.0, 6385.0, 2490.0, 1207.0, 675.0, 443.0, 308.0, 228.0, 178.0, 119.0, 91.0, 70.0, 57.0, 42.0, 31.0, 30.0, 20.0, 17.0, 7.0, 14.0, 4.0, 5.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0], "bins": [-65.375, -63.43896484375, -61.5029296875, -59.56689453125, -57.630859375, -55.69482421875, -53.7587890625, -51.82275390625, -49.88671875, -47.95068359375, -46.0146484375, -44.07861328125, -42.142578125, -40.20654296875, -38.2705078125, -36.33447265625, -34.3984375, -32.46240234375, -30.5263671875, -28.59033203125, -26.654296875, -24.71826171875, -22.7822265625, -20.84619140625, -18.91015625, -16.97412109375, -15.0380859375, -13.10205078125, -11.166015625, -9.22998046875, -7.2939453125, -5.35791015625, -3.421875, -1.48583984375, 0.4501953125, 2.38623046875, 4.322265625, 6.25830078125, 8.1943359375, 10.13037109375, 12.06640625, 14.00244140625, 15.9384765625, 17.87451171875, 19.810546875, 21.74658203125, 23.6826171875, 25.61865234375, 27.5546875, 29.49072265625, 31.4267578125, 33.36279296875, 35.298828125, 37.23486328125, 39.1708984375, 41.10693359375, 43.04296875, 44.97900390625, 46.9150390625, 48.85107421875, 50.787109375, 52.72314453125, 54.6591796875, 56.59521484375, 58.53125]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 3.0, 6.0, 6.0, 4.0, 12.0, 6.0, 11.0, 10.0, 18.0, 16.0, 25.0, 18.0, 17.0, 28.0, 28.0, 29.0, 29.0, 45.0, 41.0, 47.0, 97.0, 142.0, 1524.0, 309.0, 114.0, 64.0, 39.0, 43.0, 36.0, 31.0, 38.0, 26.0, 21.0, 23.0, 19.0, 15.0, 18.0, 14.0, 11.0, 11.0, 10.0, 6.0, 6.0, 5.0, 6.0, 8.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-55.28125, -53.60009765625, -51.9189453125, -50.23779296875, -48.556640625, -46.87548828125, -45.1943359375, -43.51318359375, -41.83203125, -40.15087890625, -38.4697265625, -36.78857421875, -35.107421875, -33.42626953125, -31.7451171875, -30.06396484375, -28.3828125, -26.70166015625, -25.0205078125, -23.33935546875, -21.658203125, -19.97705078125, -18.2958984375, -16.61474609375, -14.93359375, -13.25244140625, -11.5712890625, -9.89013671875, -8.208984375, -6.52783203125, -4.8466796875, -3.16552734375, -1.484375, 0.19677734375, 1.8779296875, 3.55908203125, 5.240234375, 6.92138671875, 8.6025390625, 10.28369140625, 11.96484375, 13.64599609375, 15.3271484375, 17.00830078125, 18.689453125, 20.37060546875, 22.0517578125, 23.73291015625, 25.4140625, 27.09521484375, 28.7763671875, 30.45751953125, 32.138671875, 33.81982421875, 35.5009765625, 37.18212890625, 38.86328125, 40.54443359375, 42.2255859375, 43.90673828125, 45.587890625, 47.26904296875, 48.9501953125, 50.63134765625, 52.3125]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 7.0, 6.0, 7.0, 8.0, 3.0, 10.0, 13.0, 8.0, 17.0, 27.0, 16.0, 18.0, 28.0, 33.0, 31.0, 53.0, 60.0, 82.0, 93.0, 164.0, 391.0, 1195.0, 14427.0, 3024840.0, 100213.0, 2627.0, 505.0, 244.0, 142.0, 84.0, 64.0, 52.0, 38.0, 31.0, 26.0, 19.0, 18.0, 16.0, 23.0, 9.0, 8.0, 13.0, 9.0, 5.0, 6.0, 6.0, 3.0, 7.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0], "bins": [-138.5, -133.990234375, -129.48046875, -124.970703125, -120.4609375, -115.951171875, -111.44140625, -106.931640625, -102.421875, -97.912109375, -93.40234375, -88.892578125, -84.3828125, -79.873046875, -75.36328125, -70.853515625, -66.34375, -61.833984375, -57.32421875, -52.814453125, -48.3046875, -43.794921875, -39.28515625, -34.775390625, -30.265625, -25.755859375, -21.24609375, -16.736328125, -12.2265625, -7.716796875, -3.20703125, 1.302734375, 5.8125, 10.322265625, 14.83203125, 19.341796875, 23.8515625, 28.361328125, 32.87109375, 37.380859375, 41.890625, 46.400390625, 50.91015625, 55.419921875, 59.9296875, 64.439453125, 68.94921875, 73.458984375, 77.96875, 82.478515625, 86.98828125, 91.498046875, 96.0078125, 100.517578125, 105.02734375, 109.537109375, 114.046875, 118.556640625, 123.06640625, 127.576171875, 132.0859375, 136.595703125, 141.10546875, 145.615234375, 150.125]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 7.0, 14.0, 25.0, 29.0, 52.0, 61.0, 112.0, 129.0, 136.0, 133.0, 97.0, 82.0, 48.0, 34.0, 21.0, 7.0, 12.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-48.696502685546875, -46.86695861816406, -45.03741455078125, -43.20787048339844, -41.378326416015625, -39.54878234863281, -37.71923828125, -35.88969421386719, -34.060150146484375, -32.23060607910156, -30.40106201171875, -28.571517944335938, -26.741973876953125, -24.912429809570312, -23.0828857421875, -21.253341674804688, -19.423795700073242, -17.59425163269043, -15.764707565307617, -13.935163497924805, -12.105619430541992, -10.276074409484863, -8.44653034210205, -6.616986274719238, -4.787442207336426, -2.9578981399536133, -1.1283538341522217, 0.7011904716491699, 2.5307345390319824, 4.360279083251953, 6.189823150634766, 8.019367218017578, 9.84891128540039, 11.678455352783203, 13.507999420166016, 15.337543487548828, 17.16708755493164, 18.996631622314453, 20.826175689697266, 22.655719757080078, 24.48526382446289, 26.314807891845703, 28.144351959228516, 29.973896026611328, 31.80344009399414, 33.63298416137695, 35.462528228759766, 37.29207229614258, 39.121620178222656, 40.95116424560547, 42.78070831298828, 44.610252380371094, 46.439796447753906, 48.26934051513672, 50.09888458251953, 51.928428649902344, 53.757972717285156, 55.58751678466797, 57.41706085205078, 59.246604919433594, 61.076148986816406, 62.90569305419922, 64.73523712158203, 66.56478118896484, 68.39432525634766]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 7.0, 2.0, 7.0, 14.0, 8.0, 9.0, 9.0, 19.0, 20.0, 16.0, 26.0, 21.0, 22.0, 27.0, 29.0, 27.0, 57.0, 42.0, 22.0, 34.0, 46.0, 45.0, 37.0, 34.0, 35.0, 44.0, 41.0, 39.0, 26.0, 27.0, 21.0, 31.0, 24.0, 23.0, 14.0, 16.0, 14.0, 13.0, 8.0, 8.0, 10.0, 7.0, 6.0, 5.0, 2.0, 3.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-151.99923706054688, -147.45291137695312, -142.9065704345703, -138.3602294921875, -133.81390380859375, -129.267578125, -124.72123718261719, -120.1749038696289, -115.62857055664062, -111.08223724365234, -106.53590393066406, -101.98957061767578, -97.4432373046875, -92.89690399169922, -88.35057067871094, -83.80423736572266, -79.25790405273438, -74.7115707397461, -70.16523742675781, -65.61890411376953, -61.07257080078125, -56.52623748779297, -51.97990417480469, -47.433570861816406, -42.887237548828125, -38.340904235839844, -33.79457092285156, -29.24823760986328, -24.701904296875, -20.15557098388672, -15.609237670898438, -11.062904357910156, -6.5165863037109375, -1.9702529907226562, 2.576080322265625, 7.122413635253906, 11.668746948242188, 16.21508026123047, 20.76141357421875, 25.30774688720703, 29.854080200195312, 34.400413513183594, 38.946746826171875, 43.493080139160156, 48.03941345214844, 52.58574676513672, 57.132080078125, 61.67841339111328, 66.22474670410156, 70.77108001708984, 75.31741333007812, 79.8637466430664, 84.41007995605469, 88.95641326904297, 93.50274658203125, 98.04907989501953, 102.59541320800781, 107.1417465209961, 111.68807983398438, 116.23441314697266, 120.78074645996094, 125.32707977294922, 129.8734130859375, 134.41973876953125, 138.96607971191406]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 6.0, 4.0, 8.0, 7.0, 4.0, 15.0, 10.0, 15.0, 12.0, 16.0, 21.0, 22.0, 23.0, 29.0, 43.0, 35.0, 43.0, 38.0, 44.0, 42.0, 59.0, 47.0, 31.0, 56.0, 37.0, 40.0, 34.0, 34.0, 26.0, 38.0, 27.0, 18.0, 18.0, 18.0, 13.0, 19.0, 12.0, 3.0, 10.0, 11.0, 5.0, 2.0, 6.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-28.125, -27.3046875, -26.484375, -25.6640625, -24.84375, -24.0234375, -23.203125, -22.3828125, -21.5625, -20.7421875, -19.921875, -19.1015625, -18.28125, -17.4609375, -16.640625, -15.8203125, -15.0, -14.1796875, -13.359375, -12.5390625, -11.71875, -10.8984375, -10.078125, -9.2578125, -8.4375, -7.6171875, -6.796875, -5.9765625, -5.15625, -4.3359375, -3.515625, -2.6953125, -1.875, -1.0546875, -0.234375, 0.5859375, 1.40625, 2.2265625, 3.046875, 3.8671875, 4.6875, 5.5078125, 6.328125, 7.1484375, 7.96875, 8.7890625, 9.609375, 10.4296875, 11.25, 12.0703125, 12.890625, 13.7109375, 14.53125, 15.3515625, 16.171875, 16.9921875, 17.8125, 18.6328125, 19.453125, 20.2734375, 21.09375, 21.9140625, 22.734375, 23.5546875, 24.375]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 9.0, 4.0, 13.0, 10.0, 26.0, 21.0, 24.0, 52.0, 73.0, 106.0, 136.0, 225.0, 366.0, 614.0, 1061.0, 2114.0, 4809.0, 17277.0, 274006.0, 3303889.0, 551665.0, 25892.0, 6052.0, 2547.0, 1288.0, 720.0, 433.0, 274.0, 177.0, 122.0, 74.0, 62.0, 40.0, 29.0, 24.0, 14.0, 13.0, 8.0, 4.0, 6.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.1875, -64.21826171875, -62.2490234375, -60.27978515625, -58.310546875, -56.34130859375, -54.3720703125, -52.40283203125, -50.43359375, -48.46435546875, -46.4951171875, -44.52587890625, -42.556640625, -40.58740234375, -38.6181640625, -36.64892578125, -34.6796875, -32.71044921875, -30.7412109375, -28.77197265625, -26.802734375, -24.83349609375, -22.8642578125, -20.89501953125, -18.92578125, -16.95654296875, -14.9873046875, -13.01806640625, -11.048828125, -9.07958984375, -7.1103515625, -5.14111328125, -3.171875, -1.20263671875, 0.7666015625, 2.73583984375, 4.705078125, 6.67431640625, 8.6435546875, 10.61279296875, 12.58203125, 14.55126953125, 16.5205078125, 18.48974609375, 20.458984375, 22.42822265625, 24.3974609375, 26.36669921875, 28.3359375, 30.30517578125, 32.2744140625, 34.24365234375, 36.212890625, 38.18212890625, 40.1513671875, 42.12060546875, 44.08984375, 46.05908203125, 48.0283203125, 49.99755859375, 51.966796875, 53.93603515625, 55.9052734375, 57.87451171875, 59.84375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 8.0, 10.0, 24.0, 34.0, 49.0, 120.0, 392.0, 1322.0, 1356.0, 456.0, 165.0, 68.0, 32.0, 18.0, 9.0, 7.0, 1.0, 3.0, 4.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.125, -48.29296875, -45.4609375, -42.62890625, -39.796875, -36.96484375, -34.1328125, -31.30078125, -28.46875, -25.63671875, -22.8046875, -19.97265625, -17.140625, -14.30859375, -11.4765625, -8.64453125, -5.8125, -2.98046875, -0.1484375, 2.68359375, 5.515625, 8.34765625, 11.1796875, 14.01171875, 16.84375, 19.67578125, 22.5078125, 25.33984375, 28.171875, 31.00390625, 33.8359375, 36.66796875, 39.5, 42.33203125, 45.1640625, 47.99609375, 50.828125, 53.66015625, 56.4921875, 59.32421875, 62.15625, 64.98828125, 67.8203125, 70.65234375, 73.484375, 76.31640625, 79.1484375, 81.98046875, 84.8125, 87.64453125, 90.4765625, 93.30859375, 96.140625, 98.97265625, 101.8046875, 104.63671875, 107.46875, 110.30078125, 113.1328125, 115.96484375, 118.796875, 121.62890625, 124.4609375, 127.29296875, 130.125]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 9.0, 11.0, 16.0, 25.0, 31.0, 54.0, 86.0, 146.0, 394.0, 1368.0, 9486.0, 3415018.0, 758824.0, 7136.0, 998.0, 331.0, 137.0, 90.0, 61.0, 26.0, 21.0, 9.0, 7.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-315.25, -307.548828125, -299.84765625, -292.146484375, -284.4453125, -276.744140625, -269.04296875, -261.341796875, -253.640625, -245.939453125, -238.23828125, -230.537109375, -222.8359375, -215.134765625, -207.43359375, -199.732421875, -192.03125, -184.330078125, -176.62890625, -168.927734375, -161.2265625, -153.525390625, -145.82421875, -138.123046875, -130.421875, -122.720703125, -115.01953125, -107.318359375, -99.6171875, -91.916015625, -84.21484375, -76.513671875, -68.8125, -61.111328125, -53.41015625, -45.708984375, -38.0078125, -30.306640625, -22.60546875, -14.904296875, -7.203125, 0.498046875, 8.19921875, 15.900390625, 23.6015625, 31.302734375, 39.00390625, 46.705078125, 54.40625, 62.107421875, 69.80859375, 77.509765625, 85.2109375, 92.912109375, 100.61328125, 108.314453125, 116.015625, 123.716796875, 131.41796875, 139.119140625, 146.8203125, 154.521484375, 162.22265625, 169.923828125, 177.625]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 18.0, 48.0, 177.0, 446.0, 232.0, 61.0, 22.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-663.81103515625, -648.5704956054688, -633.3299560546875, -618.08935546875, -602.8488159179688, -587.6082763671875, -572.3677368164062, -557.127197265625, -541.8865966796875, -526.6460571289062, -511.4054870605469, -496.1649475097656, -480.92437744140625, -465.683837890625, -450.44329833984375, -435.2027587890625, -419.96221923828125, -404.7216796875, -389.4811096191406, -374.2405700683594, -359.0, -343.75946044921875, -328.5189208984375, -313.27838134765625, -298.0378112792969, -282.7972717285156, -267.55670166015625, -252.316162109375, -237.0756072998047, -221.83505249023438, -206.59451293945312, -191.3539581298828, -176.1134033203125, -160.8728485107422, -145.63229370117188, -130.39175415039062, -115.15119934082031, -99.91064453125, -84.67009735107422, -69.42955017089844, -54.188995361328125, -38.94844436645508, -23.70789337158203, -8.467342376708984, 6.7732086181640625, 22.013763427734375, 37.254310607910156, 52.49485778808594, 67.73541259765625, 82.97596740722656, 98.21651458740234, 113.45706176757812, 128.69761657714844, 143.93817138671875, 159.1787109375, 174.4192657470703, 189.65982055664062, 204.90037536621094, 220.14093017578125, 235.3814697265625, 250.6220245361328, 265.8625793457031, 281.1031188964844, 296.34368896484375, 311.584228515625]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 0.0, 5.0, 5.0, 2.0, 8.0, 6.0, 10.0, 14.0, 11.0, 13.0, 24.0, 22.0, 27.0, 23.0, 23.0, 41.0, 25.0, 39.0, 45.0, 44.0, 34.0, 33.0, 33.0, 31.0, 48.0, 45.0, 39.0, 36.0, 45.0, 37.0, 30.0, 32.0, 21.0, 20.0, 16.0, 21.0, 19.0, 13.0, 13.0, 8.0, 5.0, 8.0, 6.0, 8.0, 5.0, 3.0, 7.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-109.99964141845703, -106.5563735961914, -103.11309814453125, -99.66983032226562, -96.2265625, -92.78329467773438, -89.34002685546875, -85.8967514038086, -82.45348358154297, -79.01021575927734, -75.56694030761719, -72.12367248535156, -68.68040466308594, -65.23713684082031, -61.79386520385742, -58.35059356689453, -54.907325744628906, -51.46405792236328, -48.02078628540039, -44.5775146484375, -41.134246826171875, -37.69097900390625, -34.24770736694336, -30.8044376373291, -27.361167907714844, -23.917898178100586, -20.474628448486328, -17.03135871887207, -13.588088989257812, -10.144819259643555, -6.701549530029297, -3.258279800415039, 0.1849822998046875, 3.6282520294189453, 7.071521759033203, 10.514791488647461, 13.958061218261719, 17.401330947875977, 20.844600677490234, 24.287870407104492, 27.73114013671875, 31.174409866333008, 34.617679595947266, 38.060951232910156, 41.50421905517578, 44.947486877441406, 48.3907585144043, 51.83403015136719, 55.27729797363281, 58.72056579589844, 62.16383743286133, 65.60710906982422, 69.05037689208984, 72.49364471435547, 75.93692016601562, 79.38018798828125, 82.82345581054688, 86.2667236328125, 89.70999145507812, 93.15326690673828, 96.5965347290039, 100.03980255126953, 103.48307800292969, 106.92634582519531, 110.36961364746094]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 9.0, 7.0, 8.0, 3.0, 8.0, 8.0, 6.0, 14.0, 14.0, 19.0, 16.0, 30.0, 25.0, 38.0, 29.0, 29.0, 30.0, 33.0, 36.0, 38.0, 29.0, 50.0, 43.0, 46.0, 44.0, 45.0, 28.0, 29.0, 38.0, 27.0, 34.0, 29.0, 19.0, 21.0, 17.0, 10.0, 21.0, 14.0, 13.0, 12.0, 7.0, 4.0, 7.0, 9.0, 6.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0], "bins": [-26.296875, -25.53466796875, -24.7724609375, -24.01025390625, -23.248046875, -22.48583984375, -21.7236328125, -20.96142578125, -20.19921875, -19.43701171875, -18.6748046875, -17.91259765625, -17.150390625, -16.38818359375, -15.6259765625, -14.86376953125, -14.1015625, -13.33935546875, -12.5771484375, -11.81494140625, -11.052734375, -10.29052734375, -9.5283203125, -8.76611328125, -8.00390625, -7.24169921875, -6.4794921875, -5.71728515625, -4.955078125, -4.19287109375, -3.4306640625, -2.66845703125, -1.90625, -1.14404296875, -0.3818359375, 0.38037109375, 1.142578125, 1.90478515625, 2.6669921875, 3.42919921875, 4.19140625, 4.95361328125, 5.7158203125, 6.47802734375, 7.240234375, 8.00244140625, 8.7646484375, 9.52685546875, 10.2890625, 11.05126953125, 11.8134765625, 12.57568359375, 13.337890625, 14.10009765625, 14.8623046875, 15.62451171875, 16.38671875, 17.14892578125, 17.9111328125, 18.67333984375, 19.435546875, 20.19775390625, 20.9599609375, 21.72216796875, 22.484375]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 5.0, 5.0, 8.0, 8.0, 10.0, 8.0, 15.0, 32.0, 47.0, 64.0, 99.0, 155.0, 193.0, 287.0, 389.0, 524.0, 809.0, 1179.0, 1673.0, 2454.0, 3625.0, 5218.0, 7694.0, 11569.0, 17553.0, 26742.0, 41398.0, 66022.0, 107842.0, 175530.0, 206529.0, 137841.0, 83379.0, 51943.0, 32733.0, 21423.0, 13993.0, 9331.0, 6322.0, 4330.0, 2973.0, 1994.0, 1408.0, 1025.0, 685.0, 470.0, 298.0, 232.0, 170.0, 116.0, 63.0, 38.0, 42.0, 25.0, 15.0, 17.0, 8.0, 2.0, 4.0, 2.0, 3.0, 2.0, 1.0], "bins": [-1.0654296875, -1.0313262939453125, -0.997222900390625, -0.9631195068359375, -0.92901611328125, -0.8949127197265625, -0.860809326171875, -0.8267059326171875, -0.7926025390625, -0.7584991455078125, -0.724395751953125, -0.6902923583984375, -0.65618896484375, -0.6220855712890625, -0.587982177734375, -0.5538787841796875, -0.519775390625, -0.4856719970703125, -0.451568603515625, -0.4174652099609375, -0.38336181640625, -0.3492584228515625, -0.315155029296875, -0.2810516357421875, -0.2469482421875, -0.2128448486328125, -0.178741455078125, -0.1446380615234375, -0.11053466796875, -0.0764312744140625, -0.042327880859375, -0.0082244873046875, 0.02587890625, 0.0599822998046875, 0.094085693359375, 0.1281890869140625, 0.16229248046875, 0.1963958740234375, 0.230499267578125, 0.2646026611328125, 0.2987060546875, 0.3328094482421875, 0.366912841796875, 0.4010162353515625, 0.43511962890625, 0.4692230224609375, 0.503326416015625, 0.5374298095703125, 0.571533203125, 0.6056365966796875, 0.639739990234375, 0.6738433837890625, 0.70794677734375, 0.7420501708984375, 0.776153564453125, 0.8102569580078125, 0.8443603515625, 0.8784637451171875, 0.912567138671875, 0.9466705322265625, 0.98077392578125, 1.0148773193359375, 1.048980712890625, 1.0830841064453125, 1.1171875]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 7.0, 4.0, 5.0, 9.0, 17.0, 13.0, 13.0, 15.0, 21.0, 21.0, 24.0, 38.0, 23.0, 27.0, 35.0, 28.0, 28.0, 34.0, 47.0, 36.0, 35.0, 24.0, 1065.0, 33.0, 41.0, 37.0, 25.0, 33.0, 28.0, 36.0, 22.0, 24.0, 17.0, 25.0, 16.0, 21.0, 23.0, 9.0, 23.0, 14.0, 6.0, 7.0, 6.0, 5.0, 2.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.4296875, -13.96826171875, -13.5068359375, -13.04541015625, -12.583984375, -12.12255859375, -11.6611328125, -11.19970703125, -10.73828125, -10.27685546875, -9.8154296875, -9.35400390625, -8.892578125, -8.43115234375, -7.9697265625, -7.50830078125, -7.046875, -6.58544921875, -6.1240234375, -5.66259765625, -5.201171875, -4.73974609375, -4.2783203125, -3.81689453125, -3.35546875, -2.89404296875, -2.4326171875, -1.97119140625, -1.509765625, -1.04833984375, -0.5869140625, -0.12548828125, 0.3359375, 0.79736328125, 1.2587890625, 1.72021484375, 2.181640625, 2.64306640625, 3.1044921875, 3.56591796875, 4.02734375, 4.48876953125, 4.9501953125, 5.41162109375, 5.873046875, 6.33447265625, 6.7958984375, 7.25732421875, 7.71875, 8.18017578125, 8.6416015625, 9.10302734375, 9.564453125, 10.02587890625, 10.4873046875, 10.94873046875, 11.41015625, 11.87158203125, 12.3330078125, 12.79443359375, 13.255859375, 13.71728515625, 14.1787109375, 14.64013671875, 15.1015625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 3.0, 4.0, 11.0, 15.0, 17.0, 30.0, 52.0, 71.0, 107.0, 154.0, 222.0, 286.0, 481.0, 603.0, 1013.0, 1412.0, 1997.0, 2802.0, 4050.0, 5631.0, 8093.0, 11356.0, 16298.0, 23479.0, 34122.0, 50029.0, 76379.0, 119817.0, 1174816.0, 219788.0, 114296.0, 73265.0, 48264.0, 32747.0, 22638.0, 15485.0, 11089.0, 7803.0, 5449.0, 3949.0, 2775.0, 1974.0, 1305.0, 944.0, 597.0, 441.0, 286.0, 241.0, 173.0, 91.0, 61.0, 42.0, 30.0, 26.0, 16.0, 6.0, 8.0, 2.0, 4.0, 1.0], "bins": [-0.908203125, -0.8806381225585938, -0.8530731201171875, -0.8255081176757812, -0.797943115234375, -0.7703781127929688, -0.7428131103515625, -0.7152481079101562, -0.68768310546875, -0.6601181030273438, -0.6325531005859375, -0.6049880981445312, -0.577423095703125, -0.5498580932617188, -0.5222930908203125, -0.49472808837890625, -0.4671630859375, -0.43959808349609375, -0.4120330810546875, -0.38446807861328125, -0.356903076171875, -0.32933807373046875, -0.3017730712890625, -0.27420806884765625, -0.24664306640625, -0.21907806396484375, -0.1915130615234375, -0.16394805908203125, -0.136383056640625, -0.10881805419921875, -0.0812530517578125, -0.05368804931640625, -0.026123046875, 0.00144195556640625, 0.0290069580078125, 0.05657196044921875, 0.084136962890625, 0.11170196533203125, 0.1392669677734375, 0.16683197021484375, 0.19439697265625, 0.22196197509765625, 0.2495269775390625, 0.27709197998046875, 0.304656982421875, 0.33222198486328125, 0.3597869873046875, 0.38735198974609375, 0.4149169921875, 0.44248199462890625, 0.4700469970703125, 0.49761199951171875, 0.525177001953125, 0.5527420043945312, 0.5803070068359375, 0.6078720092773438, 0.63543701171875, 0.6630020141601562, 0.6905670166015625, 0.7181320190429688, 0.745697021484375, 0.7732620239257812, 0.8008270263671875, 0.8283920288085938, 0.85595703125]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 2.0, 6.0, 4.0, 10.0, 16.0, 11.0, 17.0, 21.0, 17.0, 39.0, 43.0, 42.0, 47.0, 50.0, 50.0, 54.0, 70.0, 77.0, 62.0, 63.0, 56.0, 43.0, 39.0, 39.0, 29.0, 30.0, 19.0, 11.0, 11.0, 6.0, 7.0, 7.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004863739013671875, -0.004697918891906738, -0.0045320987701416016, -0.004366278648376465, -0.004200458526611328, -0.004034638404846191, -0.0038688182830810547, -0.003702998161315918, -0.0035371780395507812, -0.0033713579177856445, -0.003205537796020508, -0.003039717674255371, -0.0028738975524902344, -0.0027080774307250977, -0.002542257308959961, -0.0023764371871948242, -0.0022106170654296875, -0.0020447969436645508, -0.001878976821899414, -0.0017131567001342773, -0.0015473365783691406, -0.001381516456604004, -0.0012156963348388672, -0.0010498762130737305, -0.0008840560913085938, -0.000718235969543457, -0.0005524158477783203, -0.0003865957260131836, -0.00022077560424804688, -5.4955482482910156e-05, 0.00011086463928222656, 0.0002766847610473633, 0.0004425048828125, 0.0006083250045776367, 0.0007741451263427734, 0.0009399652481079102, 0.0011057853698730469, 0.0012716054916381836, 0.0014374256134033203, 0.001603245735168457, 0.0017690658569335938, 0.0019348859786987305, 0.002100706100463867, 0.002266526222229004, 0.0024323463439941406, 0.0025981664657592773, 0.002763986587524414, 0.0029298067092895508, 0.0030956268310546875, 0.0032614469528198242, 0.003427267074584961, 0.0035930871963500977, 0.0037589073181152344, 0.003924727439880371, 0.004090547561645508, 0.0042563676834106445, 0.004422187805175781, 0.004588007926940918, 0.004753828048706055, 0.004919648170471191, 0.005085468292236328, 0.005251288414001465, 0.0054171085357666016, 0.005582928657531738, 0.005748748779296875]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 12.0, 11.0, 14.0, 16.0, 19.0, 25.0, 47.0, 58.0, 80.0, 96.0, 95.0, 155.0, 300.0, 551.0, 3460.0, 976814.0, 64918.0, 862.0, 326.0, 190.0, 127.0, 104.0, 69.0, 43.0, 41.0, 29.0, 28.0, 16.0, 16.0, 13.0, 7.0, 5.0, 9.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.11383056640625, -0.11064529418945312, -0.10746002197265625, -0.10427474975585938, -0.1010894775390625, -0.09790420532226562, -0.09471893310546875, -0.09153366088867188, -0.088348388671875, -0.08516311645507812, -0.08197784423828125, -0.07879257202148438, -0.0756072998046875, -0.07242202758789062, -0.06923675537109375, -0.06605148315429688, -0.0628662109375, -0.059680938720703125, -0.05649566650390625, -0.053310394287109375, -0.0501251220703125, -0.046939849853515625, -0.04375457763671875, -0.040569305419921875, -0.037384033203125, -0.034198760986328125, -0.03101348876953125, -0.027828216552734375, -0.0246429443359375, -0.021457672119140625, -0.01827239990234375, -0.015087127685546875, -0.01190185546875, -0.008716583251953125, -0.00553131103515625, -0.002346038818359375, 0.0008392333984375, 0.004024505615234375, 0.00720977783203125, 0.010395050048828125, 0.013580322265625, 0.016765594482421875, 0.01995086669921875, 0.023136138916015625, 0.0263214111328125, 0.029506683349609375, 0.03269195556640625, 0.035877227783203125, 0.0390625, 0.042247772216796875, 0.04543304443359375, 0.048618316650390625, 0.0518035888671875, 0.054988861083984375, 0.05817413330078125, 0.061359405517578125, 0.064544677734375, 0.06772994995117188, 0.07091522216796875, 0.07410049438476562, 0.0772857666015625, 0.08047103881835938, 0.08365631103515625, 0.08684158325195312, 0.09002685546875]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 344.0, 653.0, 13.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01742071658372879, -0.0162674468010664, -0.015114178881049156, -0.013960909098386765, -0.012807640247046947, -0.01165437139570713, -0.010501101613044739, -0.009347832761704922, -0.008194563910365105, -0.007041295059025288, -0.005888025742024183, -0.004734756425023079, -0.003581487573683262, -0.002428218722343445, -0.0012749494053423405, -0.00012168008834123611, 0.001031588762998581, 0.0021848578471690416, 0.0033381269313395023, 0.004491396248340607, 0.005644665099680424, 0.006797933951020241, 0.007951203733682632, 0.00910447258502245, 0.010257741436362267, 0.011411010287702084, 0.0125642791390419, 0.013717548921704292, 0.01487081777304411, 0.016024086624383926, 0.017177356407046318, 0.01833062618970871, 0.01948389783501625, 0.020637167617678642, 0.021790435537695885, 0.022943705320358276, 0.02409697324037552, 0.02525024302303791, 0.026403512805700302, 0.027556780725717545, 0.028710050508379936, 0.029863320291042328, 0.03101658821105957, 0.03216985613107681, 0.033323127776384354, 0.034476395696401596, 0.03562966361641884, 0.03678293526172638, 0.03793620318174362, 0.039089471101760864, 0.040242742747068405, 0.04139601066708565, 0.04254927858710289, 0.04370255023241043, 0.04485581815242767, 0.046009086072444916, 0.04716235399246216, 0.0483156219124794, 0.04946889355778694, 0.050622161477804184, 0.051775429397821426, 0.05292870104312897, 0.05408196896314621, 0.05523523688316345, 0.05638850852847099]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 5.0, 6.0, 7.0, 0.0, 8.0, 15.0, 11.0, 17.0, 15.0, 25.0, 13.0, 30.0, 26.0, 38.0, 47.0, 45.0, 40.0, 45.0, 53.0, 62.0, 47.0, 49.0, 50.0, 42.0, 44.0, 36.0, 36.0, 44.0, 34.0, 31.0, 17.0, 22.0, 16.0, 14.0, 3.0, 5.0, 4.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0034325718879699707, -0.0033309776335954666, -0.0032293833792209625, -0.0031277891248464584, -0.0030261948704719543, -0.0029246006160974503, -0.002823006361722946, -0.002721412107348442, -0.002619817852973938, -0.002518223598599434, -0.00241662934422493, -0.0023150350898504257, -0.0022134408354759216, -0.0021118465811014175, -0.0020102523267269135, -0.0019086580723524094, -0.0018070638179779053, -0.0017054695636034012, -0.001603875309228897, -0.001502281054854393, -0.001400686800479889, -0.0012990925461053848, -0.0011974982917308807, -0.0010959040373563766, -0.0009943097829818726, -0.0008927155286073685, -0.0007911212742328644, -0.0006895270198583603, -0.0005879327654838562, -0.0004863385111093521, -0.000384744256734848, -0.00028315000236034393, -0.00018155574798583984, -7.996149361133575e-05, 2.1632760763168335e-05, 0.00012322701513767242, 0.00022482126951217651, 0.0003264155238866806, 0.0004280097782611847, 0.0005296040326356888, 0.0006311982870101929, 0.000732792541384697, 0.000834386795759201, 0.0009359810501337051, 0.0010375753045082092, 0.0011391695588827133, 0.0012407638132572174, 0.0013423580676317215, 0.0014439523220062256, 0.0015455465763807297, 0.0016471408307552338, 0.0017487350851297379, 0.001850329339504242, 0.001951923593878746, 0.00205351784825325, 0.002155112102627754, 0.0022567063570022583, 0.0023583006113767624, 0.0024598948657512665, 0.0025614891201257706, 0.0026630833745002747, 0.0027646776288747787, 0.002866271883249283, 0.002967866137623787, 0.003069460391998291]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 9.0, 7.0, 8.0, 3.0, 8.0, 8.0, 6.0, 14.0, 14.0, 19.0, 16.0, 30.0, 25.0, 38.0, 29.0, 29.0, 30.0, 33.0, 36.0, 38.0, 29.0, 49.0, 44.0, 46.0, 44.0, 45.0, 28.0, 29.0, 37.0, 28.0, 34.0, 29.0, 19.0, 21.0, 17.0, 10.0, 21.0, 14.0, 13.0, 12.0, 7.0, 4.0, 7.0, 9.0, 6.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0], "bins": [-26.296875, -25.53466796875, -24.7724609375, -24.01025390625, -23.248046875, -22.48583984375, -21.7236328125, -20.96142578125, -20.19921875, -19.43701171875, -18.6748046875, -17.91259765625, -17.150390625, -16.38818359375, -15.6259765625, -14.86376953125, -14.1015625, -13.33935546875, -12.5771484375, -11.81494140625, -11.052734375, -10.29052734375, -9.5283203125, -8.76611328125, -8.00390625, -7.24169921875, -6.4794921875, -5.71728515625, -4.955078125, -4.19287109375, -3.4306640625, -2.66845703125, -1.90625, -1.14404296875, -0.3818359375, 0.38037109375, 1.142578125, 1.90478515625, 2.6669921875, 3.42919921875, 4.19140625, 4.95361328125, 5.7158203125, 6.47802734375, 7.240234375, 8.00244140625, 8.7646484375, 9.52685546875, 10.2890625, 11.05126953125, 11.8134765625, 12.57568359375, 13.337890625, 14.10009765625, 14.8623046875, 15.62451171875, 16.38671875, 17.14892578125, 17.9111328125, 18.67333984375, 19.435546875, 20.19775390625, 20.9599609375, 21.72216796875, 22.484375]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 7.0, 11.0, 10.0, 10.0, 14.0, 18.0, 15.0, 47.0, 48.0, 83.0, 110.0, 151.0, 202.0, 294.0, 441.0, 699.0, 1156.0, 1860.0, 3294.0, 5955.0, 11660.0, 25895.0, 66849.0, 224737.0, 478954.0, 139365.0, 46700.0, 19194.0, 9094.0, 4734.0, 2596.0, 1559.0, 914.0, 567.0, 398.0, 277.0, 182.0, 130.0, 89.0, 67.0, 47.0, 39.0, 20.0, 22.0, 16.0, 16.0, 6.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0], "bins": [-33.0625, -32.09912109375, -31.1357421875, -30.17236328125, -29.208984375, -28.24560546875, -27.2822265625, -26.31884765625, -25.35546875, -24.39208984375, -23.4287109375, -22.46533203125, -21.501953125, -20.53857421875, -19.5751953125, -18.61181640625, -17.6484375, -16.68505859375, -15.7216796875, -14.75830078125, -13.794921875, -12.83154296875, -11.8681640625, -10.90478515625, -9.94140625, -8.97802734375, -8.0146484375, -7.05126953125, -6.087890625, -5.12451171875, -4.1611328125, -3.19775390625, -2.234375, -1.27099609375, -0.3076171875, 0.65576171875, 1.619140625, 2.58251953125, 3.5458984375, 4.50927734375, 5.47265625, 6.43603515625, 7.3994140625, 8.36279296875, 9.326171875, 10.28955078125, 11.2529296875, 12.21630859375, 13.1796875, 14.14306640625, 15.1064453125, 16.06982421875, 17.033203125, 17.99658203125, 18.9599609375, 19.92333984375, 20.88671875, 21.85009765625, 22.8134765625, 23.77685546875, 24.740234375, 25.70361328125, 26.6669921875, 27.63037109375, 28.59375]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 3.0, 2.0, 8.0, 8.0, 8.0, 13.0, 19.0, 11.0, 11.0, 14.0, 17.0, 27.0, 35.0, 24.0, 31.0, 44.0, 45.0, 58.0, 72.0, 77.0, 159.0, 1531.0, 264.0, 111.0, 68.0, 65.0, 45.0, 40.0, 35.0, 28.0, 28.0, 25.0, 17.0, 17.0, 20.0, 17.0, 10.0, 13.0, 7.0, 5.0, 4.0, 8.0, 0.0, 4.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-60.0, -58.17041015625, -56.3408203125, -54.51123046875, -52.681640625, -50.85205078125, -49.0224609375, -47.19287109375, -45.36328125, -43.53369140625, -41.7041015625, -39.87451171875, -38.044921875, -36.21533203125, -34.3857421875, -32.55615234375, -30.7265625, -28.89697265625, -27.0673828125, -25.23779296875, -23.408203125, -21.57861328125, -19.7490234375, -17.91943359375, -16.08984375, -14.26025390625, -12.4306640625, -10.60107421875, -8.771484375, -6.94189453125, -5.1123046875, -3.28271484375, -1.453125, 0.37646484375, 2.2060546875, 4.03564453125, 5.865234375, 7.69482421875, 9.5244140625, 11.35400390625, 13.18359375, 15.01318359375, 16.8427734375, 18.67236328125, 20.501953125, 22.33154296875, 24.1611328125, 25.99072265625, 27.8203125, 29.64990234375, 31.4794921875, 33.30908203125, 35.138671875, 36.96826171875, 38.7978515625, 40.62744140625, 42.45703125, 44.28662109375, 46.1162109375, 47.94580078125, 49.775390625, 51.60498046875, 53.4345703125, 55.26416015625, 57.09375]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 6.0, 4.0, 4.0, 6.0, 10.0, 16.0, 17.0, 21.0, 20.0, 36.0, 50.0, 69.0, 92.0, 124.0, 160.0, 291.0, 521.0, 1986.0, 16347.0, 443448.0, 2631978.0, 44794.0, 3727.0, 788.0, 382.0, 228.0, 138.0, 99.0, 67.0, 65.0, 51.0, 41.0, 25.0, 10.0, 21.0, 19.0, 10.0, 12.0, 4.0, 5.0, 3.0, 2.0, 5.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-88.4375, -85.7724609375, -83.107421875, -80.4423828125, -77.77734375, -75.1123046875, -72.447265625, -69.7822265625, -67.1171875, -64.4521484375, -61.787109375, -59.1220703125, -56.45703125, -53.7919921875, -51.126953125, -48.4619140625, -45.796875, -43.1318359375, -40.466796875, -37.8017578125, -35.13671875, -32.4716796875, -29.806640625, -27.1416015625, -24.4765625, -21.8115234375, -19.146484375, -16.4814453125, -13.81640625, -11.1513671875, -8.486328125, -5.8212890625, -3.15625, -0.4912109375, 2.173828125, 4.8388671875, 7.50390625, 10.1689453125, 12.833984375, 15.4990234375, 18.1640625, 20.8291015625, 23.494140625, 26.1591796875, 28.82421875, 31.4892578125, 34.154296875, 36.8193359375, 39.484375, 42.1494140625, 44.814453125, 47.4794921875, 50.14453125, 52.8095703125, 55.474609375, 58.1396484375, 60.8046875, 63.4697265625, 66.134765625, 68.7998046875, 71.46484375, 74.1298828125, 76.794921875, 79.4599609375, 82.125]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 16.0, 76.0, 250.0, 371.0, 213.0, 64.0, 14.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-154.11949157714844, -147.5257110595703, -140.93194580078125, -134.33816528320312, -127.74440002441406, -121.15061950683594, -114.55684661865234, -107.96307373046875, -101.36930084228516, -94.77552795410156, -88.18175506591797, -81.58798217773438, -74.99420166015625, -68.40043640136719, -61.80665588378906, -55.21288299560547, -48.619110107421875, -42.02533721923828, -35.43156433105469, -28.837787628173828, -22.244014739990234, -15.65024185180664, -9.056465148925781, -2.4626922607421875, 4.131080627441406, 10.724854469299316, 17.318628311157227, 23.912403106689453, 30.506175994873047, 37.09994888305664, 43.6937255859375, 50.287498474121094, 56.881256103515625, 63.47502899169922, 70.06880187988281, 76.66258239746094, 83.25634765625, 89.85012817382812, 96.44390106201172, 103.03767395019531, 109.6314468383789, 116.2252197265625, 122.8189926147461, 129.4127655029297, 136.0065460205078, 142.60031127929688, 149.194091796875, 155.78787231445312, 162.3816375732422, 168.9754180908203, 175.56918334960938, 182.1629638671875, 188.75672912597656, 195.3505096435547, 201.94427490234375, 208.53805541992188, 215.1318359375, 221.72561645507812, 228.3193817138672, 234.9131622314453, 241.50692749023438, 248.1007080078125, 254.69448852539062, 261.28826904296875, 267.88201904296875]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 2.0, 5.0, 12.0, 5.0, 8.0, 9.0, 11.0, 18.0, 23.0, 28.0, 28.0, 31.0, 23.0, 39.0, 33.0, 33.0, 38.0, 43.0, 45.0, 50.0, 44.0, 50.0, 49.0, 35.0, 43.0, 41.0, 34.0, 27.0, 30.0, 28.0, 27.0, 20.0, 17.0, 16.0, 20.0, 8.0, 8.0, 7.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-125.93840026855469, -121.39701080322266, -116.85562133789062, -112.3142318725586, -107.77284240722656, -103.2314453125, -98.69005584716797, -94.14866638183594, -89.6072769165039, -85.06588745117188, -80.52449798583984, -75.98310852050781, -71.44171142578125, -66.90032958984375, -62.35893249511719, -57.817543029785156, -53.276153564453125, -48.734764099121094, -44.19337463378906, -39.651981353759766, -35.110591888427734, -30.569202423095703, -26.02781105041504, -21.486419677734375, -16.945030212402344, -12.403639793395996, -7.862249374389648, -3.320858955383301, 1.2205314636230469, 5.761920928955078, 10.303312301635742, 14.844703674316406, 19.3861083984375, 23.92749786376953, 28.468889236450195, 33.01028060913086, 37.55167007446289, 42.09305953979492, 46.63445281982422, 51.17584228515625, 55.71723175048828, 60.25862121582031, 64.80001068115234, 69.34140014648438, 73.88279724121094, 78.42417907714844, 82.965576171875, 87.50696563720703, 92.04835510253906, 96.5897445678711, 101.13113403320312, 105.67252349853516, 110.21391296386719, 114.75531005859375, 119.29669952392578, 123.83808898925781, 128.37948608398438, 132.92088317871094, 137.46226501464844, 142.003662109375, 146.5450439453125, 151.08644104003906, 155.62782287597656, 160.16921997070312, 164.71060180664062]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 1.0, 6.0, 2.0, 7.0, 10.0, 7.0, 6.0, 10.0, 10.0, 14.0, 18.0, 24.0, 24.0, 25.0, 36.0, 28.0, 30.0, 32.0, 31.0, 42.0, 41.0, 39.0, 42.0, 41.0, 45.0, 43.0, 43.0, 33.0, 36.0, 27.0, 30.0, 37.0, 31.0, 19.0, 10.0, 18.0, 25.0, 14.0, 17.0, 8.0, 10.0, 5.0, 8.0, 9.0, 5.0, 1.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-25.328125, -24.544677734375, -23.76123046875, -22.977783203125, -22.1943359375, -21.410888671875, -20.62744140625, -19.843994140625, -19.060546875, -18.277099609375, -17.49365234375, -16.710205078125, -15.9267578125, -15.143310546875, -14.35986328125, -13.576416015625, -12.79296875, -12.009521484375, -11.22607421875, -10.442626953125, -9.6591796875, -8.875732421875, -8.09228515625, -7.308837890625, -6.525390625, -5.741943359375, -4.95849609375, -4.175048828125, -3.3916015625, -2.608154296875, -1.82470703125, -1.041259765625, -0.2578125, 0.525634765625, 1.30908203125, 2.092529296875, 2.8759765625, 3.659423828125, 4.44287109375, 5.226318359375, 6.009765625, 6.793212890625, 7.57666015625, 8.360107421875, 9.1435546875, 9.927001953125, 10.71044921875, 11.493896484375, 12.27734375, 13.060791015625, 13.84423828125, 14.627685546875, 15.4111328125, 16.194580078125, 16.97802734375, 17.761474609375, 18.544921875, 19.328369140625, 20.11181640625, 20.895263671875, 21.6787109375, 22.462158203125, 23.24560546875, 24.029052734375, 24.8125]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 6.0, 11.0, 14.0, 13.0, 14.0, 23.0, 38.0, 63.0, 81.0, 102.0, 174.0, 219.0, 309.0, 458.0, 733.0, 1191.0, 2026.0, 3690.0, 8809.0, 40256.0, 330715.0, 2468060.0, 1172721.0, 133341.0, 18255.0, 5613.0, 2801.0, 1596.0, 956.0, 642.0, 389.0, 292.0, 197.0, 126.0, 94.0, 68.0, 65.0, 37.0, 29.0, 20.0, 12.0, 9.0, 6.0, 10.0, 6.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.21875, -40.890625, -39.5625, -38.234375, -36.90625, -35.578125, -34.25, -32.921875, -31.59375, -30.265625, -28.9375, -27.609375, -26.28125, -24.953125, -23.625, -22.296875, -20.96875, -19.640625, -18.3125, -16.984375, -15.65625, -14.328125, -13.0, -11.671875, -10.34375, -9.015625, -7.6875, -6.359375, -5.03125, -3.703125, -2.375, -1.046875, 0.28125, 1.609375, 2.9375, 4.265625, 5.59375, 6.921875, 8.25, 9.578125, 10.90625, 12.234375, 13.5625, 14.890625, 16.21875, 17.546875, 18.875, 20.203125, 21.53125, 22.859375, 24.1875, 25.515625, 26.84375, 28.171875, 29.5, 30.828125, 32.15625, 33.484375, 34.8125, 36.140625, 37.46875, 38.796875, 40.125, 41.453125, 42.78125]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 4.0, 7.0, 8.0, 3.0, 7.0, 18.0, 13.0, 15.0, 19.0, 37.0, 69.0, 92.0, 200.0, 364.0, 714.0, 996.0, 747.0, 337.0, 169.0, 109.0, 54.0, 22.0, 17.0, 14.0, 10.0, 11.0, 5.0, 4.0, 5.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.375, -37.943359375, -36.51171875, -35.080078125, -33.6484375, -32.216796875, -30.78515625, -29.353515625, -27.921875, -26.490234375, -25.05859375, -23.626953125, -22.1953125, -20.763671875, -19.33203125, -17.900390625, -16.46875, -15.037109375, -13.60546875, -12.173828125, -10.7421875, -9.310546875, -7.87890625, -6.447265625, -5.015625, -3.583984375, -2.15234375, -0.720703125, 0.7109375, 2.142578125, 3.57421875, 5.005859375, 6.4375, 7.869140625, 9.30078125, 10.732421875, 12.1640625, 13.595703125, 15.02734375, 16.458984375, 17.890625, 19.322265625, 20.75390625, 22.185546875, 23.6171875, 25.048828125, 26.48046875, 27.912109375, 29.34375, 30.775390625, 32.20703125, 33.638671875, 35.0703125, 36.501953125, 37.93359375, 39.365234375, 40.796875, 42.228515625, 43.66015625, 45.091796875, 46.5234375, 47.955078125, 49.38671875, 50.818359375, 52.25]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 5.0, 4.0, 8.0, 17.0, 16.0, 19.0, 35.0, 43.0, 68.0, 102.0, 155.0, 227.0, 358.0, 639.0, 1160.0, 2210.0, 4755.0, 11106.0, 33150.0, 217034.0, 3412037.0, 440618.0, 45552.0, 13648.0, 5544.0, 2612.0, 1291.0, 724.0, 395.0, 250.0, 167.0, 97.0, 66.0, 63.0, 29.0, 24.0, 18.0, 11.0, 7.0, 5.0, 5.0, 7.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-60.9375, -59.01025390625, -57.0830078125, -55.15576171875, -53.228515625, -51.30126953125, -49.3740234375, -47.44677734375, -45.51953125, -43.59228515625, -41.6650390625, -39.73779296875, -37.810546875, -35.88330078125, -33.9560546875, -32.02880859375, -30.1015625, -28.17431640625, -26.2470703125, -24.31982421875, -22.392578125, -20.46533203125, -18.5380859375, -16.61083984375, -14.68359375, -12.75634765625, -10.8291015625, -8.90185546875, -6.974609375, -5.04736328125, -3.1201171875, -1.19287109375, 0.734375, 2.66162109375, 4.5888671875, 6.51611328125, 8.443359375, 10.37060546875, 12.2978515625, 14.22509765625, 16.15234375, 18.07958984375, 20.0068359375, 21.93408203125, 23.861328125, 25.78857421875, 27.7158203125, 29.64306640625, 31.5703125, 33.49755859375, 35.4248046875, 37.35205078125, 39.279296875, 41.20654296875, 43.1337890625, 45.06103515625, 46.98828125, 48.91552734375, 50.8427734375, 52.77001953125, 54.697265625, 56.62451171875, 58.5517578125, 60.47900390625, 62.40625]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [2.0, 5.0, 9.0, 10.0, 40.0, 112.0, 246.0, 326.0, 159.0, 68.0, 23.0, 6.0, 5.0, 7.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.48783111572266, -62.63218688964844, -52.77653884887695, -42.92089080810547, -33.06524658203125, -23.20960235595703, -13.353954315185547, -3.4983062744140625, 6.357337951660156, 16.212984085083008, 26.06863021850586, 35.924278259277344, 45.77992248535156, 55.63556671142578, 65.4912109375, 75.34686279296875, 85.20250701904297, 95.05815124511719, 104.91380310058594, 114.76944732666016, 124.62509155273438, 134.48074340820312, 144.3363800048828, 154.19203186035156, 164.04766845703125, 173.9033203125, 183.7589569091797, 193.61460876464844, 203.47024536132812, 213.32589721679688, 223.18154907226562, 233.03720092773438, 242.892822265625, 252.74847412109375, 262.6041259765625, 272.4597473144531, 282.3153991699219, 292.1710510253906, 302.0267028808594, 311.8823547363281, 321.73797607421875, 331.5936279296875, 341.44927978515625, 351.3049011230469, 361.1605529785156, 371.0162048339844, 380.8718566894531, 390.7275085449219, 400.5831604003906, 410.4388122558594, 420.2944641113281, 430.15008544921875, 440.0057373046875, 449.86138916015625, 459.717041015625, 469.57269287109375, 479.4283447265625, 489.28399658203125, 499.1396484375, 508.9952697753906, 518.8509521484375, 528.70654296875, 538.5621948242188, 548.4178466796875, 558.2734985351562]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 5.0, 0.0, 2.0, 5.0, 3.0, 3.0, 6.0, 11.0, 7.0, 14.0, 13.0, 16.0, 17.0, 21.0, 29.0, 27.0, 29.0, 42.0, 37.0, 32.0, 41.0, 39.0, 68.0, 43.0, 46.0, 34.0, 37.0, 47.0, 38.0, 30.0, 32.0, 29.0, 27.0, 27.0, 33.0, 22.0, 26.0, 18.0, 15.0, 6.0, 12.0, 3.0, 6.0, 3.0, 4.0, 2.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-110.87333679199219, -107.46166229248047, -104.04999542236328, -100.63832092285156, -97.22664642333984, -93.81497192382812, -90.40330505371094, -86.99163055419922, -83.5799560546875, -80.16828155517578, -76.7566146850586, -73.34494018554688, -69.93326568603516, -66.52159118652344, -63.10992431640625, -59.69824981689453, -56.28657913208008, -52.874908447265625, -49.463233947753906, -46.05156326293945, -42.639888763427734, -39.22821807861328, -35.81654357910156, -32.40487289428711, -28.993200302124023, -25.581527709960938, -22.16985511779785, -18.758182525634766, -15.346510887145996, -11.934839248657227, -8.52316665649414, -5.111494064331055, -1.6998214721679688, 1.711850881576538, 5.123523235321045, 8.535195350646973, 11.946867942810059, 15.358539581298828, 18.770212173461914, 22.181884765625, 25.593557357788086, 29.005229949951172, 32.416900634765625, 35.828575134277344, 39.2402458190918, 42.65191650390625, 46.06359100341797, 49.47526550292969, 52.88693618774414, 56.298606872558594, 59.71028137207031, 63.121952056884766, 66.53362274169922, 69.94529724121094, 73.35697174072266, 76.76864624023438, 80.18031311035156, 83.59198760986328, 87.00365447998047, 90.41532897949219, 93.8270034790039, 97.23867797851562, 100.65034484863281, 104.06201934814453, 107.47369384765625]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 4.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 6.0, 10.0, 12.0, 8.0, 14.0, 18.0, 21.0, 17.0, 25.0, 28.0, 21.0, 31.0, 38.0, 35.0, 35.0, 35.0, 45.0, 29.0, 45.0, 46.0, 49.0, 38.0, 49.0, 38.0, 34.0, 36.0, 27.0, 21.0, 18.0, 22.0, 21.0, 20.0, 26.0, 12.0, 12.0, 13.0, 7.0, 7.0, 8.0, 5.0, 2.0, 3.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.765625, -22.97900390625, -22.1923828125, -21.40576171875, -20.619140625, -19.83251953125, -19.0458984375, -18.25927734375, -17.47265625, -16.68603515625, -15.8994140625, -15.11279296875, -14.326171875, -13.53955078125, -12.7529296875, -11.96630859375, -11.1796875, -10.39306640625, -9.6064453125, -8.81982421875, -8.033203125, -7.24658203125, -6.4599609375, -5.67333984375, -4.88671875, -4.10009765625, -3.3134765625, -2.52685546875, -1.740234375, -0.95361328125, -0.1669921875, 0.61962890625, 1.40625, 2.19287109375, 2.9794921875, 3.76611328125, 4.552734375, 5.33935546875, 6.1259765625, 6.91259765625, 7.69921875, 8.48583984375, 9.2724609375, 10.05908203125, 10.845703125, 11.63232421875, 12.4189453125, 13.20556640625, 13.9921875, 14.77880859375, 15.5654296875, 16.35205078125, 17.138671875, 17.92529296875, 18.7119140625, 19.49853515625, 20.28515625, 21.07177734375, 21.8583984375, 22.64501953125, 23.431640625, 24.21826171875, 25.0048828125, 25.79150390625, 26.578125]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 5.0, 4.0, 7.0, 8.0, 24.0, 30.0, 62.0, 66.0, 115.0, 173.0, 248.0, 333.0, 512.0, 783.0, 1174.0, 1783.0, 2701.0, 4285.0, 6383.0, 9662.0, 14868.0, 24270.0, 39123.0, 66084.0, 111906.0, 182399.0, 212053.0, 146562.0, 86279.0, 51380.0, 30918.0, 19105.0, 12272.0, 7793.0, 5143.0, 3451.0, 2193.0, 1440.0, 971.0, 635.0, 442.0, 303.0, 219.0, 131.0, 88.0, 63.0, 49.0, 30.0, 15.0, 6.0, 7.0, 8.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.115234375, -1.077117919921875, -1.03900146484375, -1.000885009765625, -0.9627685546875, -0.924652099609375, -0.88653564453125, -0.848419189453125, -0.810302734375, -0.772186279296875, -0.73406982421875, -0.695953369140625, -0.6578369140625, -0.619720458984375, -0.58160400390625, -0.543487548828125, -0.50537109375, -0.467254638671875, -0.42913818359375, -0.391021728515625, -0.3529052734375, -0.314788818359375, -0.27667236328125, -0.238555908203125, -0.200439453125, -0.162322998046875, -0.12420654296875, -0.086090087890625, -0.0479736328125, -0.009857177734375, 0.02825927734375, 0.066375732421875, 0.1044921875, 0.142608642578125, 0.18072509765625, 0.218841552734375, 0.2569580078125, 0.295074462890625, 0.33319091796875, 0.371307373046875, 0.409423828125, 0.447540283203125, 0.48565673828125, 0.523773193359375, 0.5618896484375, 0.600006103515625, 0.63812255859375, 0.676239013671875, 0.71435546875, 0.752471923828125, 0.79058837890625, 0.828704833984375, 0.8668212890625, 0.904937744140625, 0.94305419921875, 0.981170654296875, 1.019287109375, 1.057403564453125, 1.09552001953125, 1.133636474609375, 1.1717529296875, 1.209869384765625, 1.24798583984375, 1.286102294921875, 1.32421875]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 4.0, 5.0, 4.0, 20.0, 9.0, 16.0, 14.0, 19.0, 29.0, 21.0, 28.0, 28.0, 31.0, 41.0, 68.0, 41.0, 46.0, 47.0, 45.0, 1059.0, 45.0, 44.0, 35.0, 45.0, 29.0, 37.0, 36.0, 28.0, 30.0, 17.0, 21.0, 21.0, 16.0, 13.0, 6.0, 9.0, 2.0, 6.0, 8.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.6875, -18.1044921875, -17.521484375, -16.9384765625, -16.35546875, -15.7724609375, -15.189453125, -14.6064453125, -14.0234375, -13.4404296875, -12.857421875, -12.2744140625, -11.69140625, -11.1083984375, -10.525390625, -9.9423828125, -9.359375, -8.7763671875, -8.193359375, -7.6103515625, -7.02734375, -6.4443359375, -5.861328125, -5.2783203125, -4.6953125, -4.1123046875, -3.529296875, -2.9462890625, -2.36328125, -1.7802734375, -1.197265625, -0.6142578125, -0.03125, 0.5517578125, 1.134765625, 1.7177734375, 2.30078125, 2.8837890625, 3.466796875, 4.0498046875, 4.6328125, 5.2158203125, 5.798828125, 6.3818359375, 6.96484375, 7.5478515625, 8.130859375, 8.7138671875, 9.296875, 9.8798828125, 10.462890625, 11.0458984375, 11.62890625, 12.2119140625, 12.794921875, 13.3779296875, 13.9609375, 14.5439453125, 15.126953125, 15.7099609375, 16.29296875, 16.8759765625, 17.458984375, 18.0419921875, 18.625]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 0.0, 3.0, 5.0, 5.0, 22.0, 22.0, 25.0, 37.0, 49.0, 75.0, 106.0, 188.0, 254.0, 387.0, 594.0, 804.0, 1219.0, 1914.0, 2700.0, 4093.0, 6031.0, 8825.0, 13160.0, 19922.0, 30725.0, 49623.0, 81392.0, 134853.0, 1244948.0, 184683.0, 116521.0, 70193.0, 42887.0, 27120.0, 17818.0, 11620.0, 7883.0, 5301.0, 3608.0, 2413.0, 1689.0, 1130.0, 766.0, 505.0, 331.0, 208.0, 154.0, 109.0, 66.0, 38.0, 38.0, 34.0, 15.0, 11.0, 3.0, 4.0, 7.0, 4.0, 2.0, 1.0, 1.0], "bins": [-1.0546875, -1.021575927734375, -0.98846435546875, -0.955352783203125, -0.9222412109375, -0.889129638671875, -0.85601806640625, -0.822906494140625, -0.789794921875, -0.756683349609375, -0.72357177734375, -0.690460205078125, -0.6573486328125, -0.624237060546875, -0.59112548828125, -0.558013916015625, -0.52490234375, -0.491790771484375, -0.45867919921875, -0.425567626953125, -0.3924560546875, -0.359344482421875, -0.32623291015625, -0.293121337890625, -0.260009765625, -0.226898193359375, -0.19378662109375, -0.160675048828125, -0.1275634765625, -0.094451904296875, -0.06134033203125, -0.028228759765625, 0.0048828125, 0.037994384765625, 0.07110595703125, 0.104217529296875, 0.1373291015625, 0.170440673828125, 0.20355224609375, 0.236663818359375, 0.269775390625, 0.302886962890625, 0.33599853515625, 0.369110107421875, 0.4022216796875, 0.435333251953125, 0.46844482421875, 0.501556396484375, 0.53466796875, 0.567779541015625, 0.60089111328125, 0.634002685546875, 0.6671142578125, 0.700225830078125, 0.73333740234375, 0.766448974609375, 0.799560546875, 0.832672119140625, 0.86578369140625, 0.898895263671875, 0.9320068359375, 0.965118408203125, 0.99822998046875, 1.031341552734375, 1.064453125]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 1.0, 6.0, 2.0, 4.0, 7.0, 4.0, 9.0, 10.0, 11.0, 16.0, 22.0, 17.0, 30.0, 35.0, 31.0, 43.0, 58.0, 62.0, 57.0, 55.0, 73.0, 40.0, 65.0, 56.0, 55.0, 45.0, 36.0, 33.0, 17.0, 16.0, 24.0, 11.0, 14.0, 10.0, 8.0, 6.0, 3.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006656646728515625, -0.006450355052947998, -0.006244063377380371, -0.006037771701812744, -0.005831480026245117, -0.00562518835067749, -0.005418896675109863, -0.005212604999542236, -0.005006313323974609, -0.004800021648406982, -0.0045937299728393555, -0.0043874382972717285, -0.0041811466217041016, -0.003974854946136475, -0.0037685632705688477, -0.0035622715950012207, -0.0033559799194335938, -0.003149688243865967, -0.00294339656829834, -0.002737104892730713, -0.002530813217163086, -0.002324521541595459, -0.002118229866027832, -0.001911938190460205, -0.0017056465148925781, -0.0014993548393249512, -0.0012930631637573242, -0.0010867714881896973, -0.0008804798126220703, -0.0006741881370544434, -0.0004678964614868164, -0.00026160478591918945, -5.53131103515625e-05, 0.00015097856521606445, 0.0003572702407836914, 0.0005635619163513184, 0.0007698535919189453, 0.0009761452674865723, 0.0011824369430541992, 0.0013887286186218262, 0.0015950202941894531, 0.00180131196975708, 0.002007603645324707, 0.002213895320892334, 0.002420186996459961, 0.002626478672027588, 0.002832770347595215, 0.003039062023162842, 0.0032453536987304688, 0.0034516453742980957, 0.0036579370498657227, 0.0038642287254333496, 0.0040705204010009766, 0.0042768120765686035, 0.0044831037521362305, 0.004689395427703857, 0.004895687103271484, 0.005101978778839111, 0.005308270454406738, 0.005514562129974365, 0.005720853805541992, 0.005927145481109619, 0.006133437156677246, 0.006339728832244873, 0.0065460205078125]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 1.0, 4.0, 4.0, 6.0, 14.0, 8.0, 14.0, 23.0, 25.0, 31.0, 40.0, 54.0, 70.0, 86.0, 117.0, 233.0, 298.0, 639.0, 8086.0, 1012030.0, 24808.0, 848.0, 371.0, 189.0, 148.0, 94.0, 72.0, 52.0, 41.0, 35.0, 24.0, 20.0, 14.0, 16.0, 6.0, 11.0, 7.0, 4.0, 8.0, 3.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.1326904296875, -0.12862014770507812, -0.12454986572265625, -0.12047958374023438, -0.1164093017578125, -0.11233901977539062, -0.10826873779296875, -0.10419845581054688, -0.100128173828125, -0.09605789184570312, -0.09198760986328125, -0.08791732788085938, -0.0838470458984375, -0.07977676391601562, -0.07570648193359375, -0.07163619995117188, -0.06756591796875, -0.06349563598632812, -0.05942535400390625, -0.055355072021484375, -0.0512847900390625, -0.047214508056640625, -0.04314422607421875, -0.039073944091796875, -0.035003662109375, -0.030933380126953125, -0.02686309814453125, -0.022792816162109375, -0.0187225341796875, -0.014652252197265625, -0.01058197021484375, -0.006511688232421875, -0.00244140625, 0.001628875732421875, 0.00569915771484375, 0.009769439697265625, 0.0138397216796875, 0.017910003662109375, 0.02198028564453125, 0.026050567626953125, 0.030120849609375, 0.034191131591796875, 0.03826141357421875, 0.042331695556640625, 0.0464019775390625, 0.050472259521484375, 0.05454254150390625, 0.058612823486328125, 0.06268310546875, 0.06675338745117188, 0.07082366943359375, 0.07489395141601562, 0.0789642333984375, 0.08303451538085938, 0.08710479736328125, 0.09117507934570312, 0.095245361328125, 0.09931564331054688, 0.10338592529296875, 0.10745620727539062, 0.1115264892578125, 0.11559677124023438, 0.11966705322265625, 0.12373733520507812, 0.1278076171875]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [3.0, 37.0, 732.0, 230.0, 13.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0033708857372403145, -0.0021054628305137157, -0.000840039923787117, 0.00042538298293948174, 0.0016908058896660805, 0.002956228796392679, 0.004221651703119278, 0.005487074144184589, 0.006752497516572475, 0.008017919957637787, 0.009283343330025673, 0.010548766702413559, 0.01181418914347887, 0.013079611584544182, 0.014345034956932068, 0.01561045739799738, 0.01687588170170784, 0.018141305074095726, 0.019406728446483612, 0.02067214995622635, 0.021937573328614235, 0.02320299670100212, 0.024468418210744858, 0.025733841583132744, 0.02699926495552063, 0.028264688327908516, 0.029530111700296402, 0.03079553321003914, 0.032060958445072174, 0.03332637995481491, 0.03459180146455765, 0.035857222974300385, 0.03712264448404312, 0.03838806599378586, 0.03965349122881889, 0.04091891273856163, 0.042184337973594666, 0.0434497594833374, 0.04471518099308014, 0.045980602502822876, 0.04724602773785591, 0.04851144924759865, 0.04977687448263168, 0.05104229599237442, 0.05230771750211716, 0.05357314273715019, 0.05483856424689293, 0.056103989481925964, 0.0573694109916687, 0.05863483250141144, 0.05990025773644447, 0.06116567924618721, 0.062431104481220245, 0.06369652599096298, 0.06496194750070572, 0.06622736901044846, 0.06749279797077179, 0.06875821948051453, 0.07002364099025726, 0.0712890699505806, 0.07255449146032333, 0.07381991297006607, 0.07508533447980881, 0.07635075598955154, 0.07761617749929428]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 11.0, 8.0, 13.0, 14.0, 22.0, 25.0, 36.0, 34.0, 45.0, 50.0, 49.0, 45.0, 49.0, 51.0, 59.0, 60.0, 52.0, 45.0, 52.0, 43.0, 42.0, 31.0, 24.0, 29.0, 25.0, 18.0, 16.0, 15.0, 13.0, 11.0, 8.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005161285400390625, -0.005012081936001778, -0.00486287847161293, -0.004713675007224083, -0.004564471542835236, -0.004415268078446388, -0.004266064614057541, -0.0041168611496686935, -0.003967657685279846, -0.003818454220890999, -0.0036692507565021515, -0.003520047292113304, -0.003370843827724457, -0.0032216403633356094, -0.003072436898946762, -0.0029232334345579147, -0.0027740299701690674, -0.00262482650578022, -0.0024756230413913727, -0.0023264195770025253, -0.002177216112613678, -0.0020280126482248306, -0.0018788091838359833, -0.001729605719447136, -0.0015804022550582886, -0.0014311987906694412, -0.0012819953262805939, -0.0011327918618917465, -0.0009835883975028992, -0.0008343849331140518, -0.0006851814687252045, -0.0005359780043363571, -0.00038677453994750977, -0.00023757107555866241, -8.836761116981506e-05, 6.083585321903229e-05, 0.00021003931760787964, 0.000359242781996727, 0.0005084462463855743, 0.0006576497107744217, 0.000806853175163269, 0.0009560566395521164, 0.0011052601039409637, 0.001254463568329811, 0.0014036670327186584, 0.0015528704971075058, 0.0017020739614963531, 0.0018512774258852005, 0.002000480890274048, 0.002149684354662895, 0.0022988878190517426, 0.00244809128344059, 0.0025972947478294373, 0.0027464982122182846, 0.002895701676607132, 0.0030449051409959793, 0.0031941086053848267, 0.003343312069773674, 0.0034925155341625214, 0.0036417189985513687, 0.003790922462940216, 0.003940125927329063, 0.004089329391717911, 0.004238532856106758, 0.0043877363204956055]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 4.0, 0.0, 1.0, 1.0, 3.0, 6.0, 2.0, 6.0, 10.0, 12.0, 8.0, 14.0, 18.0, 21.0, 17.0, 25.0, 28.0, 21.0, 31.0, 38.0, 35.0, 35.0, 35.0, 45.0, 29.0, 45.0, 46.0, 49.0, 38.0, 49.0, 38.0, 34.0, 36.0, 27.0, 21.0, 18.0, 22.0, 21.0, 20.0, 27.0, 11.0, 12.0, 13.0, 7.0, 7.0, 8.0, 5.0, 2.0, 3.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.765625, -22.97900390625, -22.1923828125, -21.40576171875, -20.619140625, -19.83251953125, -19.0458984375, -18.25927734375, -17.47265625, -16.68603515625, -15.8994140625, -15.11279296875, -14.326171875, -13.53955078125, -12.7529296875, -11.96630859375, -11.1796875, -10.39306640625, -9.6064453125, -8.81982421875, -8.033203125, -7.24658203125, -6.4599609375, -5.67333984375, -4.88671875, -4.10009765625, -3.3134765625, -2.52685546875, -1.740234375, -0.95361328125, -0.1669921875, 0.61962890625, 1.40625, 2.19287109375, 2.9794921875, 3.76611328125, 4.552734375, 5.33935546875, 6.1259765625, 6.91259765625, 7.69921875, 8.48583984375, 9.2724609375, 10.05908203125, 10.845703125, 11.63232421875, 12.4189453125, 13.20556640625, 13.9921875, 14.77880859375, 15.5654296875, 16.35205078125, 17.138671875, 17.92529296875, 18.7119140625, 19.49853515625, 20.28515625, 21.07177734375, 21.8583984375, 22.64501953125, 23.431640625, 24.21826171875, 25.0048828125, 25.79150390625, 26.578125]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 7.0, 19.0, 18.0, 20.0, 38.0, 37.0, 48.0, 108.0, 146.0, 201.0, 324.0, 455.0, 711.0, 1243.0, 2158.0, 4244.0, 9515.0, 24158.0, 77463.0, 325647.0, 443171.0, 104764.0, 31123.0, 11462.0, 5074.0, 2575.0, 1411.0, 865.0, 519.0, 347.0, 211.0, 145.0, 96.0, 63.0, 41.0, 40.0, 27.0, 19.0, 11.0, 8.0, 6.0, 4.0, 2.0, 1.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-42.5625, -41.31494140625, -40.0673828125, -38.81982421875, -37.572265625, -36.32470703125, -35.0771484375, -33.82958984375, -32.58203125, -31.33447265625, -30.0869140625, -28.83935546875, -27.591796875, -26.34423828125, -25.0966796875, -23.84912109375, -22.6015625, -21.35400390625, -20.1064453125, -18.85888671875, -17.611328125, -16.36376953125, -15.1162109375, -13.86865234375, -12.62109375, -11.37353515625, -10.1259765625, -8.87841796875, -7.630859375, -6.38330078125, -5.1357421875, -3.88818359375, -2.640625, -1.39306640625, -0.1455078125, 1.10205078125, 2.349609375, 3.59716796875, 4.8447265625, 6.09228515625, 7.33984375, 8.58740234375, 9.8349609375, 11.08251953125, 12.330078125, 13.57763671875, 14.8251953125, 16.07275390625, 17.3203125, 18.56787109375, 19.8154296875, 21.06298828125, 22.310546875, 23.55810546875, 24.8056640625, 26.05322265625, 27.30078125, 28.54833984375, 29.7958984375, 31.04345703125, 32.291015625, 33.53857421875, 34.7861328125, 36.03369140625, 37.28125]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 7.0, 4.0, 9.0, 8.0, 12.0, 15.0, 14.0, 22.0, 34.0, 28.0, 68.0, 45.0, 48.0, 59.0, 78.0, 143.0, 269.0, 1467.0, 197.0, 115.0, 76.0, 38.0, 61.0, 38.0, 35.0, 36.0, 24.0, 19.0, 18.0, 16.0, 6.0, 10.0, 10.0, 4.0, 6.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-62.625, -60.560546875, -58.49609375, -56.431640625, -54.3671875, -52.302734375, -50.23828125, -48.173828125, -46.109375, -44.044921875, -41.98046875, -39.916015625, -37.8515625, -35.787109375, -33.72265625, -31.658203125, -29.59375, -27.529296875, -25.46484375, -23.400390625, -21.3359375, -19.271484375, -17.20703125, -15.142578125, -13.078125, -11.013671875, -8.94921875, -6.884765625, -4.8203125, -2.755859375, -0.69140625, 1.373046875, 3.4375, 5.501953125, 7.56640625, 9.630859375, 11.6953125, 13.759765625, 15.82421875, 17.888671875, 19.953125, 22.017578125, 24.08203125, 26.146484375, 28.2109375, 30.275390625, 32.33984375, 34.404296875, 36.46875, 38.533203125, 40.59765625, 42.662109375, 44.7265625, 46.791015625, 48.85546875, 50.919921875, 52.984375, 55.048828125, 57.11328125, 59.177734375, 61.2421875, 63.306640625, 65.37109375, 67.435546875, 69.5]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 7.0, 4.0, 3.0, 7.0, 10.0, 18.0, 23.0, 27.0, 29.0, 63.0, 99.0, 139.0, 261.0, 542.0, 2568.0, 195079.0, 2932869.0, 12103.0, 949.0, 361.0, 208.0, 104.0, 84.0, 41.0, 31.0, 29.0, 19.0, 10.0, 9.0, 5.0, 5.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-171.125, -165.974609375, -160.82421875, -155.673828125, -150.5234375, -145.373046875, -140.22265625, -135.072265625, -129.921875, -124.771484375, -119.62109375, -114.470703125, -109.3203125, -104.169921875, -99.01953125, -93.869140625, -88.71875, -83.568359375, -78.41796875, -73.267578125, -68.1171875, -62.966796875, -57.81640625, -52.666015625, -47.515625, -42.365234375, -37.21484375, -32.064453125, -26.9140625, -21.763671875, -16.61328125, -11.462890625, -6.3125, -1.162109375, 3.98828125, 9.138671875, 14.2890625, 19.439453125, 24.58984375, 29.740234375, 34.890625, 40.041015625, 45.19140625, 50.341796875, 55.4921875, 60.642578125, 65.79296875, 70.943359375, 76.09375, 81.244140625, 86.39453125, 91.544921875, 96.6953125, 101.845703125, 106.99609375, 112.146484375, 117.296875, 122.447265625, 127.59765625, 132.748046875, 137.8984375, 143.048828125, 148.19921875, 153.349609375, 158.5]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 21.0, 565.0, 419.0, 11.0, 3.0], "bins": [-1529.5020751953125, -1504.400390625, -1479.298828125, -1454.197265625, -1429.0955810546875, -1403.993896484375, -1378.892333984375, -1353.790771484375, -1328.6890869140625, -1303.58740234375, -1278.48583984375, -1253.38427734375, -1228.2825927734375, -1203.180908203125, -1178.079345703125, -1152.977783203125, -1127.8760986328125, -1102.7744140625, -1077.6728515625, -1052.5712890625, -1027.4696044921875, -1002.3679809570312, -977.266357421875, -952.1647338867188, -927.0631103515625, -901.9614868164062, -876.85986328125, -851.7582397460938, -826.6566162109375, -801.5549926757812, -776.453369140625, -751.3517456054688, -726.2500610351562, -701.1484375, -676.0468139648438, -650.9451904296875, -625.8435668945312, -600.741943359375, -575.6403198242188, -550.5386962890625, -525.4370727539062, -500.33544921875, -475.23382568359375, -450.1322021484375, -425.03057861328125, -399.928955078125, -374.82733154296875, -349.7257080078125, -324.62408447265625, -299.5224609375, -274.42083740234375, -249.3192138671875, -224.21759033203125, -199.115966796875, -174.01434326171875, -148.9127197265625, -123.81111145019531, -98.70948791503906, -73.60786437988281, -48.50624084472656, -23.404617309570312, 1.6970062255859375, 26.798629760742188, 51.90025329589844, 77.00187683105469]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 5.0, 4.0, 6.0, 5.0, 8.0, 8.0, 8.0, 11.0, 14.0, 23.0, 20.0, 23.0, 36.0, 39.0, 21.0, 34.0, 41.0, 34.0, 47.0, 44.0, 50.0, 58.0, 39.0, 39.0, 40.0, 33.0, 35.0, 42.0, 35.0, 32.0, 24.0, 16.0, 23.0, 22.0, 21.0, 24.0, 9.0, 14.0, 8.0, 6.0, 2.0, 2.0, 0.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-156.12045288085938, -151.65086364746094, -147.18125915527344, -142.711669921875, -138.24208068847656, -133.77249145507812, -129.30288696289062, -124.83329772949219, -120.36370086669922, -115.89410400390625, -111.42451477050781, -106.95491790771484, -102.48532104492188, -98.01573181152344, -93.54613494873047, -89.0765380859375, -84.60694885253906, -80.1373519897461, -75.66776275634766, -71.19816589355469, -66.72857666015625, -62.25897979736328, -57.78938293457031, -53.31978988647461, -48.850196838378906, -44.3806037902832, -39.9110107421875, -35.44141387939453, -30.971820831298828, -26.502227783203125, -22.03263282775879, -17.563037872314453, -13.09344482421875, -8.62385082244873, -4.154256820678711, 0.3153371810913086, 4.784931182861328, 9.254524230957031, 13.724119186401367, 18.193714141845703, 22.663307189941406, 27.13290023803711, 31.602495193481445, 36.07209014892578, 40.541683197021484, 45.01127624511719, 49.480873107910156, 53.95046615600586, 58.42005920410156, 62.889652252197266, 67.35924530029297, 71.82884216308594, 76.29843139648438, 80.76802825927734, 85.23762512207031, 89.70721435546875, 94.17681121826172, 98.64640808105469, 103.11599731445312, 107.5855941772461, 112.05519104003906, 116.5247802734375, 120.99437713623047, 125.46397399902344, 129.93356323242188]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 3.0, 4.0, 7.0, 12.0, 11.0, 12.0, 17.0, 21.0, 26.0, 21.0, 25.0, 30.0, 31.0, 46.0, 33.0, 36.0, 36.0, 43.0, 39.0, 39.0, 36.0, 52.0, 45.0, 51.0, 35.0, 28.0, 44.0, 26.0, 26.0, 26.0, 21.0, 16.0, 12.0, 12.0, 22.0, 14.0, 6.0, 9.0, 13.0, 0.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.734375, -25.895263671875, -25.05615234375, -24.217041015625, -23.3779296875, -22.538818359375, -21.69970703125, -20.860595703125, -20.021484375, -19.182373046875, -18.34326171875, -17.504150390625, -16.6650390625, -15.825927734375, -14.98681640625, -14.147705078125, -13.30859375, -12.469482421875, -11.63037109375, -10.791259765625, -9.9521484375, -9.113037109375, -8.27392578125, -7.434814453125, -6.595703125, -5.756591796875, -4.91748046875, -4.078369140625, -3.2392578125, -2.400146484375, -1.56103515625, -0.721923828125, 0.1171875, 0.956298828125, 1.79541015625, 2.634521484375, 3.4736328125, 4.312744140625, 5.15185546875, 5.990966796875, 6.830078125, 7.669189453125, 8.50830078125, 9.347412109375, 10.1865234375, 11.025634765625, 11.86474609375, 12.703857421875, 13.54296875, 14.382080078125, 15.22119140625, 16.060302734375, 16.8994140625, 17.738525390625, 18.57763671875, 19.416748046875, 20.255859375, 21.094970703125, 21.93408203125, 22.773193359375, 23.6123046875, 24.451416015625, 25.29052734375, 26.129638671875, 26.96875]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 7.0, 2.0, 1.0, 1.0, 4.0, 9.0, 14.0, 16.0, 20.0, 19.0, 18.0, 24.0, 35.0, 52.0, 65.0, 72.0, 111.0, 193.0, 246.0, 455.0, 1012.0, 3947.0, 212753.0, 3964342.0, 7711.0, 1568.0, 579.0, 274.0, 182.0, 149.0, 90.0, 71.0, 45.0, 44.0, 34.0, 27.0, 18.0, 11.0, 15.0, 18.0, 7.0, 7.0, 6.0, 8.0, 5.0, 2.0, 1.0, 1.0, 4.0, 3.0], "bins": [-341.0, -331.826171875, -322.65234375, -313.478515625, -304.3046875, -295.130859375, -285.95703125, -276.783203125, -267.609375, -258.435546875, -249.26171875, -240.087890625, -230.9140625, -221.740234375, -212.56640625, -203.392578125, -194.21875, -185.044921875, -175.87109375, -166.697265625, -157.5234375, -148.349609375, -139.17578125, -130.001953125, -120.828125, -111.654296875, -102.48046875, -93.306640625, -84.1328125, -74.958984375, -65.78515625, -56.611328125, -47.4375, -38.263671875, -29.08984375, -19.916015625, -10.7421875, -1.568359375, 7.60546875, 16.779296875, 25.953125, 35.126953125, 44.30078125, 53.474609375, 62.6484375, 71.822265625, 80.99609375, 90.169921875, 99.34375, 108.517578125, 117.69140625, 126.865234375, 136.0390625, 145.212890625, 154.38671875, 163.560546875, 172.734375, 181.908203125, 191.08203125, 200.255859375, 209.4296875, 218.603515625, 227.77734375, 236.951171875, 246.125]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 4.0, 6.0, 10.0, 9.0, 19.0, 15.0, 29.0, 43.0, 89.0, 166.0, 458.0, 947.0, 1216.0, 563.0, 228.0, 104.0, 70.0, 31.0, 14.0, 19.0, 11.0, 8.0, 6.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.625, -61.447265625, -59.26953125, -57.091796875, -54.9140625, -52.736328125, -50.55859375, -48.380859375, -46.203125, -44.025390625, -41.84765625, -39.669921875, -37.4921875, -35.314453125, -33.13671875, -30.958984375, -28.78125, -26.603515625, -24.42578125, -22.248046875, -20.0703125, -17.892578125, -15.71484375, -13.537109375, -11.359375, -9.181640625, -7.00390625, -4.826171875, -2.6484375, -0.470703125, 1.70703125, 3.884765625, 6.0625, 8.240234375, 10.41796875, 12.595703125, 14.7734375, 16.951171875, 19.12890625, 21.306640625, 23.484375, 25.662109375, 27.83984375, 30.017578125, 32.1953125, 34.373046875, 36.55078125, 38.728515625, 40.90625, 43.083984375, 45.26171875, 47.439453125, 49.6171875, 51.794921875, 53.97265625, 56.150390625, 58.328125, 60.505859375, 62.68359375, 64.861328125, 67.0390625, 69.216796875, 71.39453125, 73.572265625, 75.75]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 5.0, 5.0, 11.0, 15.0, 28.0, 33.0, 34.0, 76.0, 121.0, 269.0, 737.0, 2439.0, 18396.0, 3824163.0, 336921.0, 8531.0, 1530.0, 506.0, 208.0, 95.0, 57.0, 26.0, 25.0, 22.0, 10.0, 14.0, 4.0, 4.0, 1.0, 3.0, 2.0, 0.0, 2.0], "bins": [-314.75, -307.73046875, -300.7109375, -293.69140625, -286.671875, -279.65234375, -272.6328125, -265.61328125, -258.59375, -251.57421875, -244.5546875, -237.53515625, -230.515625, -223.49609375, -216.4765625, -209.45703125, -202.4375, -195.41796875, -188.3984375, -181.37890625, -174.359375, -167.33984375, -160.3203125, -153.30078125, -146.28125, -139.26171875, -132.2421875, -125.22265625, -118.203125, -111.18359375, -104.1640625, -97.14453125, -90.125, -83.10546875, -76.0859375, -69.06640625, -62.046875, -55.02734375, -48.0078125, -40.98828125, -33.96875, -26.94921875, -19.9296875, -12.91015625, -5.890625, 1.12890625, 8.1484375, 15.16796875, 22.1875, 29.20703125, 36.2265625, 43.24609375, 50.265625, 57.28515625, 64.3046875, 71.32421875, 78.34375, 85.36328125, 92.3828125, 99.40234375, 106.421875, 113.44140625, 120.4609375, 127.48046875, 134.5]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 9.0, 12.0, 38.0, 102.0, 346.0, 300.0, 132.0, 43.0, 19.0, 9.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-449.460205078125, -435.8744812011719, -422.2887268066406, -408.7030029296875, -395.11724853515625, -381.5315246582031, -367.94580078125, -354.36004638671875, -340.7743225097656, -327.1885986328125, -313.60284423828125, -300.0171203613281, -286.431396484375, -272.84564208984375, -259.2599182128906, -245.67417907714844, -232.08843994140625, -218.50270080566406, -204.91696166992188, -191.33123779296875, -177.74549865722656, -164.15975952148438, -150.57403564453125, -136.98829650878906, -123.40255737304688, -109.81681823730469, -96.23108673095703, -82.64535522460938, -69.05961608886719, -55.473876953125, -41.888145446777344, -28.302413940429688, -14.7166748046875, -1.1309394836425781, 12.454795837402344, 26.040531158447266, 39.62626647949219, 53.212005615234375, 66.79773712158203, 80.38346862792969, 93.96920776367188, 107.55494689941406, 121.14067840576172, 134.72640991210938, 148.31214904785156, 161.89788818359375, 175.48361206054688, 189.06935119628906, 202.65509033203125, 216.24082946777344, 229.82656860351562, 243.41229248046875, 256.998046875, 270.5837707519531, 284.16949462890625, 297.7552490234375, 311.3409729003906, 324.92669677734375, 338.512451171875, 352.0981750488281, 365.68389892578125, 379.2696533203125, 392.8553771972656, 406.44110107421875, 420.02685546875]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 8.0, 4.0, 5.0, 5.0, 11.0, 18.0, 15.0, 14.0, 22.0, 26.0, 25.0, 23.0, 25.0, 32.0, 33.0, 45.0, 48.0, 38.0, 40.0, 32.0, 43.0, 46.0, 43.0, 45.0, 44.0, 37.0, 33.0, 36.0, 32.0, 22.0, 28.0, 20.0, 21.0, 21.0, 17.0, 12.0, 7.0, 7.0, 7.0, 6.0, 7.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-125.51754760742188, -121.16007995605469, -116.80260467529297, -112.44512939453125, -108.08766174316406, -103.73019409179688, -99.37271881103516, -95.01524353027344, -90.65777587890625, -86.30030822753906, -81.94283294677734, -77.58535766601562, -73.22789001464844, -68.87042236328125, -64.51294708251953, -60.15547561645508, -55.798004150390625, -51.44053268432617, -47.08306121826172, -42.725589752197266, -38.36811828613281, -34.01064682006836, -29.653175354003906, -25.295703887939453, -20.938232421875, -16.580760955810547, -12.223289489746094, -7.865818023681641, -3.5083465576171875, 0.8491249084472656, 5.206596374511719, 9.564067840576172, 13.921524047851562, 18.278995513916016, 22.63646697998047, 26.993938446044922, 31.351409912109375, 35.70888137817383, 40.06635284423828, 44.423824310302734, 48.78129577636719, 53.13876724243164, 57.496238708496094, 61.85371017456055, 66.211181640625, 70.56864929199219, 74.9261245727539, 79.28359985351562, 83.64106750488281, 87.99853515625, 92.35601043701172, 96.71348571777344, 101.07095336914062, 105.42842102050781, 109.78589630126953, 114.14337158203125, 118.50083923339844, 122.85830688476562, 127.21578216552734, 131.57325744628906, 135.93072509765625, 140.28819274902344, 144.64566040039062, 149.00314331054688, 153.36061096191406]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 2.0, 5.0, 7.0, 15.0, 9.0, 5.0, 16.0, 10.0, 12.0, 20.0, 19.0, 22.0, 28.0, 27.0, 36.0, 32.0, 44.0, 27.0, 42.0, 38.0, 52.0, 33.0, 46.0, 56.0, 39.0, 46.0, 35.0, 40.0, 33.0, 26.0, 21.0, 23.0, 22.0, 27.0, 14.0, 16.0, 13.0, 2.0, 11.0, 4.0, 1.0, 9.0, 7.0, 5.0, 2.0, 1.0, 1.0, 3.0, 1.0, 4.0, 1.0], "bins": [-31.25, -30.3486328125, -29.447265625, -28.5458984375, -27.64453125, -26.7431640625, -25.841796875, -24.9404296875, -24.0390625, -23.1376953125, -22.236328125, -21.3349609375, -20.43359375, -19.5322265625, -18.630859375, -17.7294921875, -16.828125, -15.9267578125, -15.025390625, -14.1240234375, -13.22265625, -12.3212890625, -11.419921875, -10.5185546875, -9.6171875, -8.7158203125, -7.814453125, -6.9130859375, -6.01171875, -5.1103515625, -4.208984375, -3.3076171875, -2.40625, -1.5048828125, -0.603515625, 0.2978515625, 1.19921875, 2.1005859375, 3.001953125, 3.9033203125, 4.8046875, 5.7060546875, 6.607421875, 7.5087890625, 8.41015625, 9.3115234375, 10.212890625, 11.1142578125, 12.015625, 12.9169921875, 13.818359375, 14.7197265625, 15.62109375, 16.5224609375, 17.423828125, 18.3251953125, 19.2265625, 20.1279296875, 21.029296875, 21.9306640625, 22.83203125, 23.7333984375, 24.634765625, 25.5361328125, 26.4375]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 4.0, 3.0, 10.0, 14.0, 26.0, 38.0, 69.0, 98.0, 142.0, 201.0, 275.0, 513.0, 812.0, 1210.0, 1842.0, 2952.0, 4487.0, 6983.0, 11129.0, 17401.0, 28522.0, 46428.0, 78351.0, 134109.0, 212223.0, 198481.0, 120418.0, 70158.0, 41792.0, 25401.0, 16372.0, 10073.0, 6454.0, 4086.0, 2667.0, 1684.0, 1090.0, 731.0, 491.0, 323.0, 162.0, 108.0, 79.0, 43.0, 40.0, 27.0, 11.0, 11.0, 9.0, 7.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.314453125, -1.27191162109375, -1.2293701171875, -1.18682861328125, -1.144287109375, -1.10174560546875, -1.0592041015625, -1.01666259765625, -0.97412109375, -0.93157958984375, -0.8890380859375, -0.84649658203125, -0.803955078125, -0.76141357421875, -0.7188720703125, -0.67633056640625, -0.6337890625, -0.59124755859375, -0.5487060546875, -0.50616455078125, -0.463623046875, -0.42108154296875, -0.3785400390625, -0.33599853515625, -0.29345703125, -0.25091552734375, -0.2083740234375, -0.16583251953125, -0.123291015625, -0.08074951171875, -0.0382080078125, 0.00433349609375, 0.046875, 0.08941650390625, 0.1319580078125, 0.17449951171875, 0.217041015625, 0.25958251953125, 0.3021240234375, 0.34466552734375, 0.38720703125, 0.42974853515625, 0.4722900390625, 0.51483154296875, 0.557373046875, 0.59991455078125, 0.6424560546875, 0.68499755859375, 0.7275390625, 0.77008056640625, 0.8126220703125, 0.85516357421875, 0.897705078125, 0.94024658203125, 0.9827880859375, 1.02532958984375, 1.06787109375, 1.11041259765625, 1.1529541015625, 1.19549560546875, 1.238037109375, 1.28057861328125, 1.3231201171875, 1.36566162109375, 1.408203125]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 4.0, 4.0, 6.0, 10.0, 4.0, 9.0, 12.0, 14.0, 17.0, 19.0, 14.0, 18.0, 25.0, 30.0, 20.0, 23.0, 32.0, 36.0, 38.0, 38.0, 38.0, 35.0, 43.0, 1072.0, 41.0, 43.0, 29.0, 27.0, 46.0, 32.0, 28.0, 24.0, 30.0, 27.0, 19.0, 18.0, 16.0, 24.0, 11.0, 10.0, 6.0, 8.0, 5.0, 5.0, 9.0, 4.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-18.34375, -17.8087158203125, -17.273681640625, -16.7386474609375, -16.20361328125, -15.6685791015625, -15.133544921875, -14.5985107421875, -14.0634765625, -13.5284423828125, -12.993408203125, -12.4583740234375, -11.92333984375, -11.3883056640625, -10.853271484375, -10.3182373046875, -9.783203125, -9.2481689453125, -8.713134765625, -8.1781005859375, -7.64306640625, -7.1080322265625, -6.572998046875, -6.0379638671875, -5.5029296875, -4.9678955078125, -4.432861328125, -3.8978271484375, -3.36279296875, -2.8277587890625, -2.292724609375, -1.7576904296875, -1.22265625, -0.6876220703125, -0.152587890625, 0.3824462890625, 0.91748046875, 1.4525146484375, 1.987548828125, 2.5225830078125, 3.0576171875, 3.5926513671875, 4.127685546875, 4.6627197265625, 5.19775390625, 5.7327880859375, 6.267822265625, 6.8028564453125, 7.337890625, 7.8729248046875, 8.407958984375, 8.9429931640625, 9.47802734375, 10.0130615234375, 10.548095703125, 11.0831298828125, 11.6181640625, 12.1531982421875, 12.688232421875, 13.2232666015625, 13.75830078125, 14.2933349609375, 14.828369140625, 15.3634033203125, 15.8984375]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 7.0, 8.0, 11.0, 19.0, 25.0, 39.0, 66.0, 68.0, 117.0, 188.0, 253.0, 339.0, 577.0, 852.0, 1171.0, 1614.0, 2349.0, 3345.0, 4940.0, 6773.0, 9922.0, 14463.0, 21005.0, 32112.0, 49355.0, 77061.0, 125224.0, 1233334.0, 190142.0, 113644.0, 70928.0, 44977.0, 28991.0, 19656.0, 13267.0, 9193.0, 6381.0, 4451.0, 3127.0, 2156.0, 1579.0, 1048.0, 757.0, 508.0, 359.0, 230.0, 152.0, 138.0, 80.0, 57.0, 31.0, 20.0, 11.0, 8.0, 8.0, 2.0, 3.0, 3.0, 1.0, 2.0], "bins": [-1.0615234375, -1.0282440185546875, -0.994964599609375, -0.9616851806640625, -0.92840576171875, -0.8951263427734375, -0.861846923828125, -0.8285675048828125, -0.7952880859375, -0.7620086669921875, -0.728729248046875, -0.6954498291015625, -0.66217041015625, -0.6288909912109375, -0.595611572265625, -0.5623321533203125, -0.529052734375, -0.4957733154296875, -0.462493896484375, -0.4292144775390625, -0.39593505859375, -0.3626556396484375, -0.329376220703125, -0.2960968017578125, -0.2628173828125, -0.2295379638671875, -0.196258544921875, -0.1629791259765625, -0.12969970703125, -0.0964202880859375, -0.063140869140625, -0.0298614501953125, 0.00341796875, 0.0366973876953125, 0.069976806640625, 0.1032562255859375, 0.13653564453125, 0.1698150634765625, 0.203094482421875, 0.2363739013671875, 0.2696533203125, 0.3029327392578125, 0.336212158203125, 0.3694915771484375, 0.40277099609375, 0.4360504150390625, 0.469329833984375, 0.5026092529296875, 0.535888671875, 0.5691680908203125, 0.602447509765625, 0.6357269287109375, 0.66900634765625, 0.7022857666015625, 0.735565185546875, 0.7688446044921875, 0.8021240234375, 0.8354034423828125, 0.868682861328125, 0.9019622802734375, 0.93524169921875, 0.9685211181640625, 1.001800537109375, 1.0350799560546875, 1.068359375]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 4.0, 5.0, 6.0, 5.0, 2.0, 5.0, 12.0, 13.0, 13.0, 17.0, 31.0, 27.0, 27.0, 40.0, 52.0, 54.0, 46.0, 66.0, 64.0, 62.0, 54.0, 55.0, 64.0, 48.0, 39.0, 36.0, 31.0, 27.0, 19.0, 14.0, 7.0, 6.0, 14.0, 10.0, 4.0, 5.0, 7.0, 1.0, 6.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.007022857666015625, -0.006814539432525635, -0.0066062211990356445, -0.006397902965545654, -0.006189584732055664, -0.005981266498565674, -0.005772948265075684, -0.005564630031585693, -0.005356311798095703, -0.005147993564605713, -0.004939675331115723, -0.004731357097625732, -0.004523038864135742, -0.004314720630645752, -0.004106402397155762, -0.0038980841636657715, -0.0036897659301757812, -0.003481447696685791, -0.0032731294631958008, -0.0030648112297058105, -0.0028564929962158203, -0.00264817476272583, -0.00243985652923584, -0.0022315382957458496, -0.0020232200622558594, -0.0018149018287658691, -0.001606583595275879, -0.0013982653617858887, -0.0011899471282958984, -0.0009816288948059082, -0.000773310661315918, -0.0005649924278259277, -0.0003566741943359375, -0.00014835596084594727, 5.996227264404297e-05, 0.0002682805061340332, 0.00047659873962402344, 0.0006849169731140137, 0.0008932352066040039, 0.0011015534400939941, 0.0013098716735839844, 0.0015181899070739746, 0.0017265081405639648, 0.001934826374053955, 0.0021431446075439453, 0.0023514628410339355, 0.0025597810745239258, 0.002768099308013916, 0.0029764175415039062, 0.0031847357749938965, 0.0033930540084838867, 0.003601372241973877, 0.003809690475463867, 0.004018008708953857, 0.004226326942443848, 0.004434645175933838, 0.004642963409423828, 0.004851281642913818, 0.005059599876403809, 0.005267918109893799, 0.005476236343383789, 0.005684554576873779, 0.0058928728103637695, 0.00610119104385376, 0.00630950927734375]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 4.0, 4.0, 9.0, 12.0, 10.0, 15.0, 14.0, 19.0, 30.0, 29.0, 36.0, 55.0, 92.0, 123.0, 150.0, 274.0, 551.0, 1291.0, 129268.0, 912181.0, 2828.0, 632.0, 290.0, 170.0, 125.0, 91.0, 67.0, 39.0, 31.0, 23.0, 17.0, 11.0, 17.0, 10.0, 6.0, 8.0, 4.0, 5.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1236572265625, -0.11941719055175781, -0.11517715454101562, -0.11093711853027344, -0.10669708251953125, -0.10245704650878906, -0.09821701049804688, -0.09397697448730469, -0.0897369384765625, -0.08549690246582031, -0.08125686645507812, -0.07701683044433594, -0.07277679443359375, -0.06853675842285156, -0.06429672241210938, -0.06005668640136719, -0.055816650390625, -0.05157661437988281, -0.047336578369140625, -0.04309654235839844, -0.03885650634765625, -0.03461647033691406, -0.030376434326171875, -0.026136398315429688, -0.0218963623046875, -0.017656326293945312, -0.013416290283203125, -0.009176254272460938, -0.00493621826171875, -0.0006961822509765625, 0.003543853759765625, 0.0077838897705078125, 0.01202392578125, 0.016263961791992188, 0.020503997802734375, 0.024744033813476562, 0.02898406982421875, 0.03322410583496094, 0.037464141845703125, 0.04170417785644531, 0.0459442138671875, 0.05018424987792969, 0.054424285888671875, 0.05866432189941406, 0.06290435791015625, 0.06714439392089844, 0.07138442993164062, 0.07562446594238281, 0.079864501953125, 0.08410453796386719, 0.08834457397460938, 0.09258460998535156, 0.09682464599609375, 0.10106468200683594, 0.10530471801757812, 0.10954475402832031, 0.1137847900390625, 0.11802482604980469, 0.12226486206054688, 0.12650489807128906, 0.13074493408203125, 0.13498497009277344, 0.13922500610351562, 0.1434650421142578, 0.147705078125]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 32.0, 765.0, 209.0, 5.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00774567062035203, -0.0063897971995174885, -0.0050339242443442345, -0.003678050823509693, -0.002322177402675152, -0.0009663039818406105, 0.0003895689733326435, 0.0017454423941671848, 0.003101315815001726, 0.0044571892358362675, 0.0058130621910095215, 0.007168935611844063, 0.008524809032678604, 0.009880682453513145, 0.011236555874347687, 0.012592429295182228, 0.01394830271601677, 0.01530417613685131, 0.016660049557685852, 0.018015922978520393, 0.019371796399354935, 0.020727669820189476, 0.022083543241024017, 0.02343941479921341, 0.02479528822004795, 0.026151161640882492, 0.027507035061717033, 0.028862908482551575, 0.030218781903386116, 0.03157465532422066, 0.03293052688241005, 0.03428640216588974, 0.03564227744936943, 0.03699814900755882, 0.03835402429103851, 0.039709895849227905, 0.041065771132707596, 0.04242164269089699, 0.04377751797437668, 0.04513338953256607, 0.04648926481604576, 0.04784513637423515, 0.049201011657714844, 0.050556883215904236, 0.051912758499383926, 0.05326863005757332, 0.05462450534105301, 0.0559803768992424, 0.05733624845743179, 0.058692120015621185, 0.060047995299100876, 0.06140386685729027, 0.06275974214076996, 0.06411561369895935, 0.06547148525714874, 0.06682736426591873, 0.06818323582410812, 0.06953910738229752, 0.07089497894048691, 0.0722508579492569, 0.07360672950744629, 0.07496260106563568, 0.07631847262382507, 0.07767435163259506, 0.07903022319078445]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 5.0, 5.0, 10.0, 9.0, 10.0, 14.0, 15.0, 19.0, 19.0, 24.0, 24.0, 26.0, 30.0, 31.0, 43.0, 51.0, 44.0, 48.0, 39.0, 43.0, 44.0, 40.0, 43.0, 42.0, 32.0, 33.0, 27.0, 27.0, 45.0, 23.0, 28.0, 14.0, 12.0, 16.0, 11.0, 19.0, 9.0, 8.0, 2.0, 3.0, 7.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.004876494407653809, -0.0047376034781336784, -0.004598712548613548, -0.004459821619093418, -0.004320930689573288, -0.004182039760053158, -0.004043148830533028, -0.0039042579010128975, -0.0037653669714927673, -0.003626476041972637, -0.003487585112452507, -0.003348694182932377, -0.0032098032534122467, -0.0030709123238921165, -0.0029320213943719864, -0.0027931304648518562, -0.002654239535331726, -0.002515348605811596, -0.0023764576762914658, -0.0022375667467713356, -0.0020986758172512054, -0.0019597848877310753, -0.0018208939582109451, -0.001682003028690815, -0.0015431120991706848, -0.0014042211696505547, -0.0012653302401304245, -0.0011264393106102943, -0.0009875483810901642, -0.000848657451570034, -0.0007097665220499039, -0.0005708755925297737, -0.00043198466300964355, -0.0002930937334895134, -0.00015420280396938324, -1.5311874449253082e-05, 0.00012357905507087708, 0.00026246998459100723, 0.0004013609141111374, 0.0005402518436312675, 0.0006791427731513977, 0.0008180337026715279, 0.000956924632191658, 0.0010958155617117882, 0.0012347064912319183, 0.0013735974207520485, 0.0015124883502721786, 0.0016513792797923088, 0.001790270209312439, 0.0019291611388325691, 0.0020680520683526993, 0.0022069429978728294, 0.0023458339273929596, 0.0024847248569130898, 0.00262361578643322, 0.00276250671595335, 0.0029013976454734802, 0.0030402885749936104, 0.0031791795045137405, 0.0033180704340338707, 0.003456961363554001, 0.003595852293074131, 0.003734743222594261, 0.0038736341521143913, 0.0040125250816345215]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 2.0, 5.0, 7.0, 15.0, 9.0, 5.0, 16.0, 10.0, 12.0, 20.0, 19.0, 22.0, 28.0, 27.0, 36.0, 32.0, 44.0, 27.0, 42.0, 38.0, 52.0, 33.0, 46.0, 56.0, 39.0, 46.0, 35.0, 40.0, 33.0, 26.0, 21.0, 23.0, 22.0, 27.0, 14.0, 16.0, 13.0, 2.0, 11.0, 4.0, 1.0, 9.0, 7.0, 5.0, 2.0, 1.0, 1.0, 3.0, 1.0, 4.0, 1.0], "bins": [-31.25, -30.3486328125, -29.447265625, -28.5458984375, -27.64453125, -26.7431640625, -25.841796875, -24.9404296875, -24.0390625, -23.1376953125, -22.236328125, -21.3349609375, -20.43359375, -19.5322265625, -18.630859375, -17.7294921875, -16.828125, -15.9267578125, -15.025390625, -14.1240234375, -13.22265625, -12.3212890625, -11.419921875, -10.5185546875, -9.6171875, -8.7158203125, -7.814453125, -6.9130859375, -6.01171875, -5.1103515625, -4.208984375, -3.3076171875, -2.40625, -1.5048828125, -0.603515625, 0.2978515625, 1.19921875, 2.1005859375, 3.001953125, 3.9033203125, 4.8046875, 5.7060546875, 6.607421875, 7.5087890625, 8.41015625, 9.3115234375, 10.212890625, 11.1142578125, 12.015625, 12.9169921875, 13.818359375, 14.7197265625, 15.62109375, 16.5224609375, 17.423828125, 18.3251953125, 19.2265625, 20.1279296875, 21.029296875, 21.9306640625, 22.83203125, 23.7333984375, 24.634765625, 25.5361328125, 26.4375]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 2.0, 7.0, 13.0, 17.0, 21.0, 21.0, 31.0, 49.0, 70.0, 96.0, 110.0, 185.0, 227.0, 289.0, 410.0, 558.0, 798.0, 1207.0, 1964.0, 4516.0, 15048.0, 78815.0, 596899.0, 290521.0, 39248.0, 9049.0, 3232.0, 1570.0, 1001.0, 703.0, 496.0, 376.0, 285.0, 187.0, 164.0, 121.0, 59.0, 49.0, 33.0, 37.0, 22.0, 9.0, 9.0, 11.0, 6.0, 7.0, 3.0, 5.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-57.1875, -55.3896484375, -53.591796875, -51.7939453125, -49.99609375, -48.1982421875, -46.400390625, -44.6025390625, -42.8046875, -41.0068359375, -39.208984375, -37.4111328125, -35.61328125, -33.8154296875, -32.017578125, -30.2197265625, -28.421875, -26.6240234375, -24.826171875, -23.0283203125, -21.23046875, -19.4326171875, -17.634765625, -15.8369140625, -14.0390625, -12.2412109375, -10.443359375, -8.6455078125, -6.84765625, -5.0498046875, -3.251953125, -1.4541015625, 0.34375, 2.1416015625, 3.939453125, 5.7373046875, 7.53515625, 9.3330078125, 11.130859375, 12.9287109375, 14.7265625, 16.5244140625, 18.322265625, 20.1201171875, 21.91796875, 23.7158203125, 25.513671875, 27.3115234375, 29.109375, 30.9072265625, 32.705078125, 34.5029296875, 36.30078125, 38.0986328125, 39.896484375, 41.6943359375, 43.4921875, 45.2900390625, 47.087890625, 48.8857421875, 50.68359375, 52.4814453125, 54.279296875, 56.0771484375, 57.875]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 8.0, 8.0, 14.0, 17.0, 20.0, 27.0, 30.0, 29.0, 48.0, 41.0, 65.0, 69.0, 81.0, 134.0, 1473.0, 360.0, 134.0, 104.0, 62.0, 57.0, 55.0, 45.0, 31.0, 25.0, 20.0, 12.0, 17.0, 15.0, 12.0, 8.0, 4.0, 6.0, 1.0, 2.0, 2.0, 1.0, 6.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-72.6875, -70.33984375, -67.9921875, -65.64453125, -63.296875, -60.94921875, -58.6015625, -56.25390625, -53.90625, -51.55859375, -49.2109375, -46.86328125, -44.515625, -42.16796875, -39.8203125, -37.47265625, -35.125, -32.77734375, -30.4296875, -28.08203125, -25.734375, -23.38671875, -21.0390625, -18.69140625, -16.34375, -13.99609375, -11.6484375, -9.30078125, -6.953125, -4.60546875, -2.2578125, 0.08984375, 2.4375, 4.78515625, 7.1328125, 9.48046875, 11.828125, 14.17578125, 16.5234375, 18.87109375, 21.21875, 23.56640625, 25.9140625, 28.26171875, 30.609375, 32.95703125, 35.3046875, 37.65234375, 40.0, 42.34765625, 44.6953125, 47.04296875, 49.390625, 51.73828125, 54.0859375, 56.43359375, 58.78125, 61.12890625, 63.4765625, 65.82421875, 68.171875, 70.51953125, 72.8671875, 75.21484375, 77.5625]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 4.0, 7.0, 5.0, 9.0, 11.0, 12.0, 15.0, 16.0, 15.0, 18.0, 34.0, 32.0, 48.0, 76.0, 117.0, 175.0, 299.0, 593.0, 1520.0, 65022.0, 3073078.0, 2726.0, 793.0, 385.0, 238.0, 140.0, 71.0, 50.0, 36.0, 43.0, 29.0, 13.0, 11.0, 17.0, 11.0, 11.0, 9.0, 9.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-287.75, -279.3359375, -270.921875, -262.5078125, -254.09375, -245.6796875, -237.265625, -228.8515625, -220.4375, -212.0234375, -203.609375, -195.1953125, -186.78125, -178.3671875, -169.953125, -161.5390625, -153.125, -144.7109375, -136.296875, -127.8828125, -119.46875, -111.0546875, -102.640625, -94.2265625, -85.8125, -77.3984375, -68.984375, -60.5703125, -52.15625, -43.7421875, -35.328125, -26.9140625, -18.5, -10.0859375, -1.671875, 6.7421875, 15.15625, 23.5703125, 31.984375, 40.3984375, 48.8125, 57.2265625, 65.640625, 74.0546875, 82.46875, 90.8828125, 99.296875, 107.7109375, 116.125, 124.5390625, 132.953125, 141.3671875, 149.78125, 158.1953125, 166.609375, 175.0234375, 183.4375, 191.8515625, 200.265625, 208.6796875, 217.09375, 225.5078125, 233.921875, 242.3359375, 250.75]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 14.0, 63.0, 449.0, 424.0, 53.0, 13.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-856.8184814453125, -840.9448852539062, -825.0713500976562, -809.19775390625, -793.32421875, -777.4506225585938, -761.5770874023438, -745.7034912109375, -729.8299560546875, -713.9563598632812, -698.0828247070312, -682.209228515625, -666.335693359375, -650.4620971679688, -634.5885620117188, -618.7149658203125, -602.8414306640625, -586.9678344726562, -571.0942993164062, -555.220703125, -539.34716796875, -523.4735717773438, -507.60003662109375, -491.7264709472656, -475.8528747558594, -459.97930908203125, -444.1057434082031, -428.232177734375, -412.3586120605469, -396.48504638671875, -380.6114807128906, -364.7379150390625, -348.8643798828125, -332.9908142089844, -317.11724853515625, -301.2436828613281, -285.3701171875, -269.4965515136719, -253.62298583984375, -237.74942016601562, -221.87582397460938, -206.00225830078125, -190.12869262695312, -174.255126953125, -158.38156127929688, -142.50799560546875, -126.6344223022461, -110.76085662841797, -94.88729858398438, -79.01373291015625, -63.140167236328125, -47.266597747802734, -31.39303207397461, -15.519462585449219, 0.35410308837890625, 16.22766876220703, 32.101234436035156, 47.97480010986328, 63.848365783691406, 79.72193908691406, 95.59550476074219, 111.46907043457031, 127.34263610839844, 143.21620178222656, 159.0897674560547]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 3.0, 9.0, 7.0, 12.0, 4.0, 13.0, 12.0, 17.0, 30.0, 15.0, 18.0, 25.0, 18.0, 29.0, 29.0, 39.0, 45.0, 35.0, 41.0, 42.0, 50.0, 47.0, 41.0, 55.0, 54.0, 35.0, 41.0, 34.0, 40.0, 27.0, 28.0, 20.0, 18.0, 8.0, 12.0, 13.0, 9.0, 10.0, 7.0, 7.0, 4.0, 2.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-208.3531494140625, -202.52880859375, -196.7044677734375, -190.88014221191406, -185.05580139160156, -179.23146057128906, -173.40711975097656, -167.58279418945312, -161.75845336914062, -155.93411254882812, -150.10977172851562, -144.2854461669922, -138.4611053466797, -132.6367645263672, -126.81242370605469, -120.98809051513672, -115.16374969482422, -109.33940887451172, -103.51507568359375, -97.69073486328125, -91.86640167236328, -86.04206085205078, -80.21772766113281, -74.39338684082031, -68.56904602050781, -62.74470901489258, -56.920372009277344, -51.096031188964844, -45.271697998046875, -39.447357177734375, -33.62302017211914, -27.798683166503906, -21.974349975585938, -16.150012969970703, -10.325675010681152, -4.501337051391602, 1.3229999542236328, 7.147336959838867, 12.971675872802734, 18.79601287841797, 24.620349884033203, 30.444686889648438, 36.26902389526367, 42.093360900878906, 47.917701721191406, 53.742034912109375, 59.566375732421875, 65.39071655273438, 71.21504974365234, 77.03939056396484, 82.86372375488281, 88.68806457519531, 94.51239776611328, 100.33673858642578, 106.16107177734375, 111.98541259765625, 117.80975341796875, 123.63409423828125, 129.45843505859375, 135.2827606201172, 141.1071014404297, 146.9314422607422, 152.7557830810547, 158.58010864257812, 164.40444946289062]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 8.0, 10.0, 8.0, 9.0, 8.0, 10.0, 16.0, 14.0, 23.0, 22.0, 40.0, 31.0, 29.0, 35.0, 43.0, 44.0, 44.0, 45.0, 45.0, 61.0, 39.0, 54.0, 47.0, 27.0, 33.0, 37.0, 23.0, 29.0, 26.0, 34.0, 26.0, 16.0, 7.0, 7.0, 14.0, 10.0, 8.0, 6.0, 4.0, 3.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0], "bins": [-37.78125, -36.7666015625, -35.751953125, -34.7373046875, -33.72265625, -32.7080078125, -31.693359375, -30.6787109375, -29.6640625, -28.6494140625, -27.634765625, -26.6201171875, -25.60546875, -24.5908203125, -23.576171875, -22.5615234375, -21.546875, -20.5322265625, -19.517578125, -18.5029296875, -17.48828125, -16.4736328125, -15.458984375, -14.4443359375, -13.4296875, -12.4150390625, -11.400390625, -10.3857421875, -9.37109375, -8.3564453125, -7.341796875, -6.3271484375, -5.3125, -4.2978515625, -3.283203125, -2.2685546875, -1.25390625, -0.2392578125, 0.775390625, 1.7900390625, 2.8046875, 3.8193359375, 4.833984375, 5.8486328125, 6.86328125, 7.8779296875, 8.892578125, 9.9072265625, 10.921875, 11.9365234375, 12.951171875, 13.9658203125, 14.98046875, 15.9951171875, 17.009765625, 18.0244140625, 19.0390625, 20.0537109375, 21.068359375, 22.0830078125, 23.09765625, 24.1123046875, 25.126953125, 26.1416015625, 27.15625]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 8.0, 7.0, 7.0, 9.0, 8.0, 6.0, 13.0, 16.0, 14.0, 13.0, 21.0, 44.0, 48.0, 57.0, 92.0, 162.0, 279.0, 493.0, 829.0, 1651.0, 3781.0, 15815.0, 1571764.0, 2570504.0, 20434.0, 4201.0, 1797.0, 892.0, 506.0, 267.0, 177.0, 97.0, 64.0, 51.0, 27.0, 30.0, 21.0, 11.0, 17.0, 9.0, 17.0, 5.0, 8.0, 6.0, 6.0, 0.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-116.875, -112.708984375, -108.54296875, -104.376953125, -100.2109375, -96.044921875, -91.87890625, -87.712890625, -83.546875, -79.380859375, -75.21484375, -71.048828125, -66.8828125, -62.716796875, -58.55078125, -54.384765625, -50.21875, -46.052734375, -41.88671875, -37.720703125, -33.5546875, -29.388671875, -25.22265625, -21.056640625, -16.890625, -12.724609375, -8.55859375, -4.392578125, -0.2265625, 3.939453125, 8.10546875, 12.271484375, 16.4375, 20.603515625, 24.76953125, 28.935546875, 33.1015625, 37.267578125, 41.43359375, 45.599609375, 49.765625, 53.931640625, 58.09765625, 62.263671875, 66.4296875, 70.595703125, 74.76171875, 78.927734375, 83.09375, 87.259765625, 91.42578125, 95.591796875, 99.7578125, 103.923828125, 108.08984375, 112.255859375, 116.421875, 120.587890625, 124.75390625, 128.919921875, 133.0859375, 137.251953125, 141.41796875, 145.583984375, 149.75]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 3.0, 4.0, 9.0, 18.0, 22.0, 13.0, 29.0, 39.0, 72.0, 109.0, 197.0, 376.0, 620.0, 891.0, 634.0, 397.0, 217.0, 130.0, 91.0, 44.0, 41.0, 29.0, 26.0, 11.0, 8.0, 7.0, 7.0, 7.0, 3.0, 2.0, 4.0, 0.0, 4.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-63.96875, -62.064453125, -60.16015625, -58.255859375, -56.3515625, -54.447265625, -52.54296875, -50.638671875, -48.734375, -46.830078125, -44.92578125, -43.021484375, -41.1171875, -39.212890625, -37.30859375, -35.404296875, -33.5, -31.595703125, -29.69140625, -27.787109375, -25.8828125, -23.978515625, -22.07421875, -20.169921875, -18.265625, -16.361328125, -14.45703125, -12.552734375, -10.6484375, -8.744140625, -6.83984375, -4.935546875, -3.03125, -1.126953125, 0.77734375, 2.681640625, 4.5859375, 6.490234375, 8.39453125, 10.298828125, 12.203125, 14.107421875, 16.01171875, 17.916015625, 19.8203125, 21.724609375, 23.62890625, 25.533203125, 27.4375, 29.341796875, 31.24609375, 33.150390625, 35.0546875, 36.958984375, 38.86328125, 40.767578125, 42.671875, 44.576171875, 46.48046875, 48.384765625, 50.2890625, 52.193359375, 54.09765625, 56.001953125, 57.90625]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 0.0, 4.0, 1.0, 2.0, 2.0, 5.0, 6.0, 8.0, 6.0, 11.0, 17.0, 17.0, 25.0, 37.0, 80.0, 142.0, 222.0, 452.0, 966.0, 2099.0, 5005.0, 16531.0, 101886.0, 3599947.0, 420221.0, 32713.0, 8103.0, 3008.0, 1348.0, 683.0, 316.0, 154.0, 101.0, 59.0, 36.0, 15.0, 12.0, 12.0, 13.0, 1.0, 6.0, 5.0, 4.0, 2.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-102.75, -99.4052734375, -96.060546875, -92.7158203125, -89.37109375, -86.0263671875, -82.681640625, -79.3369140625, -75.9921875, -72.6474609375, -69.302734375, -65.9580078125, -62.61328125, -59.2685546875, -55.923828125, -52.5791015625, -49.234375, -45.8896484375, -42.544921875, -39.2001953125, -35.85546875, -32.5107421875, -29.166015625, -25.8212890625, -22.4765625, -19.1318359375, -15.787109375, -12.4423828125, -9.09765625, -5.7529296875, -2.408203125, 0.9365234375, 4.28125, 7.6259765625, 10.970703125, 14.3154296875, 17.66015625, 21.0048828125, 24.349609375, 27.6943359375, 31.0390625, 34.3837890625, 37.728515625, 41.0732421875, 44.41796875, 47.7626953125, 51.107421875, 54.4521484375, 57.796875, 61.1416015625, 64.486328125, 67.8310546875, 71.17578125, 74.5205078125, 77.865234375, 81.2099609375, 84.5546875, 87.8994140625, 91.244140625, 94.5888671875, 97.93359375, 101.2783203125, 104.623046875, 107.9677734375, 111.3125]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 47.0, 733.0, 223.0, 7.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1271.74951171875, -1222.289794921875, -1172.830078125, -1123.370361328125, -1073.91064453125, -1024.450927734375, -974.9911499023438, -925.5313720703125, -876.0716552734375, -826.6119384765625, -777.1522216796875, -727.6925048828125, -678.2327270507812, -628.7730102539062, -579.3132934570312, -529.853515625, -480.39385986328125, -430.93414306640625, -381.4743957519531, -332.0146789550781, -282.554931640625, -233.09521484375, -183.635498046875, -134.17575073242188, -84.71603393554688, -35.25630569458008, 14.203422546386719, 63.66314697265625, 113.12287902832031, 162.58261108398438, 212.04232788085938, 261.5020751953125, 310.9617919921875, 360.4215087890625, 409.8812561035156, 459.3409729003906, 508.80072021484375, 558.2604370117188, 607.7201538085938, 657.179931640625, 706.6396484375, 756.099365234375, 805.55908203125, 855.018798828125, 904.4785766601562, 953.9382934570312, 1003.3980102539062, 1052.8577880859375, 1102.3173828125, 1151.777099609375, 1201.23681640625, 1250.696533203125, 1300.15625, 1349.615966796875, 1399.07568359375, 1448.5355224609375, 1497.9952392578125, 1547.4549560546875, 1596.9146728515625, 1646.3743896484375, 1695.8341064453125, 1745.2939453125, 1794.753662109375, 1844.21337890625, 1893.673095703125]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 7.0, 7.0, 8.0, 4.0, 9.0, 6.0, 10.0, 24.0, 14.0, 9.0, 30.0, 14.0, 35.0, 26.0, 31.0, 25.0, 30.0, 33.0, 36.0, 29.0, 40.0, 50.0, 34.0, 31.0, 32.0, 45.0, 43.0, 43.0, 28.0, 38.0, 29.0, 21.0, 20.0, 25.0, 17.0, 18.0, 17.0, 16.0, 17.0, 11.0, 9.0, 7.0, 8.0, 10.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-154.60592651367188, -149.64340209960938, -144.68089294433594, -139.71836853027344, -134.75584411621094, -129.79331970214844, -124.830810546875, -119.8682861328125, -114.90576171875, -109.94324493408203, -104.98072052001953, -100.01820373535156, -95.05567932128906, -90.0931625366211, -85.13064575195312, -80.16812133789062, -75.20560455322266, -70.24308776855469, -65.28056335449219, -60.31804656982422, -55.35552215576172, -50.39300537109375, -45.430484771728516, -40.46796417236328, -35.50544357299805, -30.542922973632812, -25.580402374267578, -20.617883682250977, -15.655363082885742, -10.692842483520508, -5.730323791503906, -0.7678031921386719, 4.1947174072265625, 9.157238006591797, 14.119757652282715, 19.082277297973633, 24.044797897338867, 29.0073184967041, 33.9698371887207, 38.93235778808594, 43.89487838745117, 48.857398986816406, 53.81991958618164, 58.782440185546875, 63.744956970214844, 68.70748138427734, 73.66999816894531, 78.63252258300781, 83.59503936767578, 88.55755615234375, 93.52008056640625, 98.48259735107422, 103.44512176513672, 108.40763854980469, 113.37016296386719, 118.33267974853516, 123.29519653320312, 128.25772094726562, 133.22023010253906, 138.18275451660156, 143.14527893066406, 148.10780334472656, 153.0703125, 158.0328369140625, 162.995361328125]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 4.0, 5.0, 5.0, 12.0, 9.0, 11.0, 13.0, 18.0, 20.0, 19.0, 26.0, 24.0, 33.0, 23.0, 30.0, 39.0, 33.0, 48.0, 41.0, 49.0, 40.0, 44.0, 37.0, 41.0, 42.0, 50.0, 29.0, 25.0, 37.0, 29.0, 33.0, 24.0, 15.0, 17.0, 15.0, 11.0, 10.0, 10.0, 6.0, 2.0, 2.0, 8.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.65625, -24.794921875, -23.93359375, -23.072265625, -22.2109375, -21.349609375, -20.48828125, -19.626953125, -18.765625, -17.904296875, -17.04296875, -16.181640625, -15.3203125, -14.458984375, -13.59765625, -12.736328125, -11.875, -11.013671875, -10.15234375, -9.291015625, -8.4296875, -7.568359375, -6.70703125, -5.845703125, -4.984375, -4.123046875, -3.26171875, -2.400390625, -1.5390625, -0.677734375, 0.18359375, 1.044921875, 1.90625, 2.767578125, 3.62890625, 4.490234375, 5.3515625, 6.212890625, 7.07421875, 7.935546875, 8.796875, 9.658203125, 10.51953125, 11.380859375, 12.2421875, 13.103515625, 13.96484375, 14.826171875, 15.6875, 16.548828125, 17.41015625, 18.271484375, 19.1328125, 19.994140625, 20.85546875, 21.716796875, 22.578125, 23.439453125, 24.30078125, 25.162109375, 26.0234375, 26.884765625, 27.74609375, 28.607421875, 29.46875]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 4.0, 7.0, 9.0, 9.0, 13.0, 17.0, 22.0, 43.0, 45.0, 81.0, 101.0, 164.0, 196.0, 335.0, 459.0, 618.0, 896.0, 1315.0, 1869.0, 2655.0, 3983.0, 5968.0, 9263.0, 14581.0, 23389.0, 37562.0, 61402.0, 103722.0, 171016.0, 221214.0, 150704.0, 90606.0, 54100.0, 32879.0, 20685.0, 13229.0, 8529.0, 5458.0, 3673.0, 2402.0, 1601.0, 1098.0, 770.0, 508.0, 382.0, 275.0, 216.0, 150.0, 93.0, 71.0, 45.0, 46.0, 23.0, 18.0, 17.0, 12.0, 4.0, 3.0, 5.0, 4.0, 2.0, 5.0, 2.0], "bins": [-1.2021484375, -1.162567138671875, -1.12298583984375, -1.083404541015625, -1.0438232421875, -1.004241943359375, -0.96466064453125, -0.925079345703125, -0.885498046875, -0.845916748046875, -0.80633544921875, -0.766754150390625, -0.7271728515625, -0.687591552734375, -0.64801025390625, -0.608428955078125, -0.56884765625, -0.529266357421875, -0.48968505859375, -0.450103759765625, -0.4105224609375, -0.370941162109375, -0.33135986328125, -0.291778564453125, -0.252197265625, -0.212615966796875, -0.17303466796875, -0.133453369140625, -0.0938720703125, -0.054290771484375, -0.01470947265625, 0.024871826171875, 0.064453125, 0.104034423828125, 0.14361572265625, 0.183197021484375, 0.2227783203125, 0.262359619140625, 0.30194091796875, 0.341522216796875, 0.381103515625, 0.420684814453125, 0.46026611328125, 0.499847412109375, 0.5394287109375, 0.579010009765625, 0.61859130859375, 0.658172607421875, 0.69775390625, 0.737335205078125, 0.77691650390625, 0.816497802734375, 0.8560791015625, 0.895660400390625, 0.93524169921875, 0.974822998046875, 1.014404296875, 1.053985595703125, 1.09356689453125, 1.133148193359375, 1.1727294921875, 1.212310791015625, 1.25189208984375, 1.291473388671875, 1.3310546875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 1.0, 3.0, 6.0, 9.0, 5.0, 16.0, 15.0, 19.0, 19.0, 34.0, 18.0, 18.0, 35.0, 27.0, 35.0, 47.0, 44.0, 43.0, 48.0, 51.0, 1070.0, 49.0, 42.0, 37.0, 43.0, 38.0, 18.0, 35.0, 25.0, 19.0, 29.0, 21.0, 19.0, 23.0, 13.0, 15.0, 6.0, 8.0, 9.0, 7.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 3.0], "bins": [-21.234375, -20.6632080078125, -20.092041015625, -19.5208740234375, -18.94970703125, -18.3785400390625, -17.807373046875, -17.2362060546875, -16.6650390625, -16.0938720703125, -15.522705078125, -14.9515380859375, -14.38037109375, -13.8092041015625, -13.238037109375, -12.6668701171875, -12.095703125, -11.5245361328125, -10.953369140625, -10.3822021484375, -9.81103515625, -9.2398681640625, -8.668701171875, -8.0975341796875, -7.5263671875, -6.9552001953125, -6.384033203125, -5.8128662109375, -5.24169921875, -4.6705322265625, -4.099365234375, -3.5281982421875, -2.95703125, -2.3858642578125, -1.814697265625, -1.2435302734375, -0.67236328125, -0.1011962890625, 0.469970703125, 1.0411376953125, 1.6123046875, 2.1834716796875, 2.754638671875, 3.3258056640625, 3.89697265625, 4.4681396484375, 5.039306640625, 5.6104736328125, 6.181640625, 6.7528076171875, 7.323974609375, 7.8951416015625, 8.46630859375, 9.0374755859375, 9.608642578125, 10.1798095703125, 10.7509765625, 11.3221435546875, 11.893310546875, 12.4644775390625, 13.03564453125, 13.6068115234375, 14.177978515625, 14.7491455078125, 15.3203125]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 5.0, 6.0, 14.0, 14.0, 21.0, 35.0, 50.0, 81.0, 156.0, 215.0, 343.0, 481.0, 829.0, 1340.0, 1992.0, 3049.0, 4852.0, 7420.0, 11453.0, 17847.0, 28486.0, 47282.0, 82383.0, 146918.0, 1281365.0, 192071.0, 108891.0, 61149.0, 36168.0, 22373.0, 14119.0, 9188.0, 5691.0, 3954.0, 2486.0, 1573.0, 1011.0, 667.0, 418.0, 274.0, 173.0, 113.0, 70.0, 35.0, 24.0, 17.0, 18.0, 8.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.2080078125, -1.169952392578125, -1.13189697265625, -1.093841552734375, -1.0557861328125, -1.017730712890625, -0.97967529296875, -0.941619873046875, -0.903564453125, -0.865509033203125, -0.82745361328125, -0.789398193359375, -0.7513427734375, -0.713287353515625, -0.67523193359375, -0.637176513671875, -0.59912109375, -0.561065673828125, -0.52301025390625, -0.484954833984375, -0.4468994140625, -0.408843994140625, -0.37078857421875, -0.332733154296875, -0.294677734375, -0.256622314453125, -0.21856689453125, -0.180511474609375, -0.1424560546875, -0.104400634765625, -0.06634521484375, -0.028289794921875, 0.009765625, 0.047821044921875, 0.08587646484375, 0.123931884765625, 0.1619873046875, 0.200042724609375, 0.23809814453125, 0.276153564453125, 0.314208984375, 0.352264404296875, 0.39031982421875, 0.428375244140625, 0.4664306640625, 0.504486083984375, 0.54254150390625, 0.580596923828125, 0.61865234375, 0.656707763671875, 0.69476318359375, 0.732818603515625, 0.7708740234375, 0.808929443359375, 0.84698486328125, 0.885040283203125, 0.923095703125, 0.961151123046875, 0.99920654296875, 1.037261962890625, 1.0753173828125, 1.113372802734375, 1.15142822265625, 1.189483642578125, 1.2275390625]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 0.0, 5.0, 2.0, 3.0, 6.0, 5.0, 10.0, 9.0, 12.0, 23.0, 14.0, 27.0, 43.0, 61.0, 86.0, 100.0, 95.0, 102.0, 103.0, 83.0, 56.0, 44.0, 29.0, 21.0, 17.0, 8.0, 7.0, 7.0, 8.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0111236572265625, -0.01075279712677002, -0.010381937026977539, -0.010011076927185059, -0.009640216827392578, -0.009269356727600098, -0.008898496627807617, -0.008527636528015137, -0.008156776428222656, -0.007785916328430176, -0.007415056228637695, -0.007044196128845215, -0.006673336029052734, -0.006302475929260254, -0.0059316158294677734, -0.005560755729675293, -0.0051898956298828125, -0.004819035530090332, -0.0044481754302978516, -0.004077315330505371, -0.0037064552307128906, -0.00333559513092041, -0.0029647350311279297, -0.0025938749313354492, -0.0022230148315429688, -0.0018521547317504883, -0.0014812946319580078, -0.0011104345321655273, -0.0007395744323730469, -0.0003687143325805664, 2.1457672119140625e-06, 0.00037300586700439453, 0.000743865966796875, 0.0011147260665893555, 0.001485586166381836, 0.0018564462661743164, 0.002227306365966797, 0.0025981664657592773, 0.002969026565551758, 0.0033398866653442383, 0.0037107467651367188, 0.004081606864929199, 0.00445246696472168, 0.00482332706451416, 0.005194187164306641, 0.005565047264099121, 0.0059359073638916016, 0.006306767463684082, 0.0066776275634765625, 0.007048487663269043, 0.0074193477630615234, 0.007790207862854004, 0.008161067962646484, 0.008531928062438965, 0.008902788162231445, 0.009273648262023926, 0.009644508361816406, 0.010015368461608887, 0.010386228561401367, 0.010757088661193848, 0.011127948760986328, 0.011498808860778809, 0.011869668960571289, 0.01224052906036377, 0.01261138916015625]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 6.0, 8.0, 12.0, 10.0, 11.0, 11.0, 18.0, 31.0, 53.0, 59.0, 116.0, 175.0, 404.0, 1188.0, 914050.0, 130599.0, 917.0, 339.0, 191.0, 106.0, 59.0, 38.0, 39.0, 25.0, 20.0, 12.0, 10.0, 11.0, 4.0, 8.0, 4.0, 2.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25830078125, -0.2506828308105469, -0.24306488037109375, -0.23544692993164062, -0.2278289794921875, -0.22021102905273438, -0.21259307861328125, -0.20497512817382812, -0.197357177734375, -0.18973922729492188, -0.18212127685546875, -0.17450332641601562, -0.1668853759765625, -0.15926742553710938, -0.15164947509765625, -0.14403152465820312, -0.13641357421875, -0.12879562377929688, -0.12117767333984375, -0.11355972290039062, -0.1059417724609375, -0.09832382202148438, -0.09070587158203125, -0.08308792114257812, -0.075469970703125, -0.06785202026367188, -0.06023406982421875, -0.052616119384765625, -0.0449981689453125, -0.037380218505859375, -0.02976226806640625, -0.022144317626953125, -0.0145263671875, -0.006908416748046875, 0.00070953369140625, 0.008327484130859375, 0.0159454345703125, 0.023563385009765625, 0.03118133544921875, 0.038799285888671875, 0.046417236328125, 0.054035186767578125, 0.06165313720703125, 0.06927108764648438, 0.0768890380859375, 0.08450698852539062, 0.09212493896484375, 0.09974288940429688, 0.10736083984375, 0.11497879028320312, 0.12259674072265625, 0.13021469116210938, 0.1378326416015625, 0.14545059204101562, 0.15306854248046875, 0.16068649291992188, 0.168304443359375, 0.17592239379882812, 0.18354034423828125, 0.19115829467773438, 0.1987762451171875, 0.20639419555664062, 0.21401214599609375, 0.22163009643554688, 0.229248046875]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 43.0, 958.0, 12.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.010794905945658684, -0.007518281228840351, -0.004241656046360731, -0.0009650308638811111, 0.0023115938529372215, 0.005588218569755554, 0.008864844217896461, 0.01214146800339222, 0.015418093651533127, 0.018694719299674034, 0.021971343085169792, 0.0252479687333107, 0.028524592518806458, 0.031801216304302216, 0.03507784381508827, 0.03835446760058403, 0.04163109511137009, 0.044907718896865845, 0.0481843464076519, 0.05146097019314766, 0.05473759397864342, 0.058014221489429474, 0.06129084527492523, 0.06456746906042099, 0.06784409284591675, 0.0711207166314125, 0.07439734041690826, 0.07767397165298462, 0.08095059543848038, 0.08422721922397614, 0.0875038430094719, 0.09078046679496765, 0.09405709058046341, 0.09733371436595917, 0.10061033815145493, 0.10388696193695068, 0.10716359317302704, 0.1104402169585228, 0.11371684074401855, 0.11699346452951431, 0.12027008831501007, 0.12354671210050583, 0.1268233358860016, 0.13009996712207794, 0.1333765834569931, 0.13665321469306946, 0.13992983102798462, 0.14320646226406097, 0.14648309350013733, 0.14975972473621368, 0.15303634107112885, 0.1563129723072052, 0.15958958864212036, 0.16286621987819672, 0.16614285111427307, 0.16941946744918823, 0.1726960837841034, 0.17597271502017975, 0.1792493313550949, 0.18252596259117126, 0.18580257892608643, 0.18907921016216278, 0.19235584139823914, 0.1956324577331543, 0.19890908896923065]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 7.0, 9.0, 13.0, 12.0, 12.0, 29.0, 22.0, 45.0, 48.0, 60.0, 58.0, 72.0, 66.0, 75.0, 60.0, 64.0, 74.0, 54.0, 41.0, 38.0, 32.0, 29.0, 26.0, 26.0, 17.0, 7.0, 4.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.01441192626953125, -0.014080301858484745, -0.01374867744743824, -0.013417053036391735, -0.01308542862534523, -0.012753804214298725, -0.01242217980325222, -0.012090555392205715, -0.01175893098115921, -0.011427306570112705, -0.0110956821590662, -0.010764057748019695, -0.01043243333697319, -0.010100808925926685, -0.00976918451488018, -0.009437560103833675, -0.00910593569278717, -0.008774311281740665, -0.00844268687069416, -0.008111062459647655, -0.0077794380486011505, -0.0074478136375546455, -0.0071161892265081406, -0.006784564815461636, -0.006452940404415131, -0.006121315993368626, -0.005789691582322121, -0.005458067171275616, -0.005126442760229111, -0.004794818349182606, -0.004463193938136101, -0.004131569527089596, -0.003799945116043091, -0.003468320704996586, -0.003136696293950081, -0.002805071882903576, -0.002473447471857071, -0.002141823060810566, -0.001810198649764061, -0.001478574238717556, -0.001146949827671051, -0.000815325416624546, -0.0004837010055780411, -0.0001520765945315361, 0.00017954781651496887, 0.0005111722275614738, 0.0008427966386079788, 0.0011744210496544838, 0.0015060454607009888, 0.0018376698717474937, 0.0021692942827939987, 0.0025009186938405037, 0.0028325431048870087, 0.0031641675159335136, 0.0034957919269800186, 0.0038274163380265236, 0.0041590407490730286, 0.0044906651601195335, 0.0048222895711660385, 0.0051539139822125435, 0.0054855383932590485, 0.0058171628043055534, 0.006148787215352058, 0.006480411626398563, 0.006812036037445068]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 4.0, 5.0, 5.0, 12.0, 9.0, 11.0, 13.0, 18.0, 20.0, 19.0, 26.0, 24.0, 33.0, 23.0, 30.0, 39.0, 33.0, 48.0, 41.0, 49.0, 41.0, 43.0, 37.0, 41.0, 42.0, 50.0, 29.0, 25.0, 37.0, 29.0, 33.0, 24.0, 15.0, 17.0, 15.0, 11.0, 10.0, 10.0, 6.0, 2.0, 2.0, 8.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.65625, -24.794921875, -23.93359375, -23.072265625, -22.2109375, -21.349609375, -20.48828125, -19.626953125, -18.765625, -17.904296875, -17.04296875, -16.181640625, -15.3203125, -14.458984375, -13.59765625, -12.736328125, -11.875, -11.013671875, -10.15234375, -9.291015625, -8.4296875, -7.568359375, -6.70703125, -5.845703125, -4.984375, -4.123046875, -3.26171875, -2.400390625, -1.5390625, -0.677734375, 0.18359375, 1.044921875, 1.90625, 2.767578125, 3.62890625, 4.490234375, 5.3515625, 6.212890625, 7.07421875, 7.935546875, 8.796875, 9.658203125, 10.51953125, 11.380859375, 12.2421875, 13.103515625, 13.96484375, 14.826171875, 15.6875, 16.548828125, 17.41015625, 18.271484375, 19.1328125, 19.994140625, 20.85546875, 21.716796875, 22.578125, 23.439453125, 24.30078125, 25.162109375, 26.0234375, 26.884765625, 27.74609375, 28.607421875, 29.46875]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 4.0, 7.0, 7.0, 11.0, 17.0, 25.0, 26.0, 33.0, 46.0, 74.0, 101.0, 143.0, 191.0, 227.0, 360.0, 520.0, 714.0, 968.0, 1470.0, 2222.0, 3798.0, 9768.0, 50690.0, 716051.0, 224503.0, 21530.0, 6132.0, 2972.0, 1720.0, 1246.0, 823.0, 624.0, 399.0, 291.0, 219.0, 160.0, 133.0, 86.0, 59.0, 55.0, 32.0, 30.0, 21.0, 13.0, 10.0, 6.0, 6.0, 4.0, 2.0, 4.0, 3.0, 1.0, 2.0], "bins": [-81.375, -79.03515625, -76.6953125, -74.35546875, -72.015625, -69.67578125, -67.3359375, -64.99609375, -62.65625, -60.31640625, -57.9765625, -55.63671875, -53.296875, -50.95703125, -48.6171875, -46.27734375, -43.9375, -41.59765625, -39.2578125, -36.91796875, -34.578125, -32.23828125, -29.8984375, -27.55859375, -25.21875, -22.87890625, -20.5390625, -18.19921875, -15.859375, -13.51953125, -11.1796875, -8.83984375, -6.5, -4.16015625, -1.8203125, 0.51953125, 2.859375, 5.19921875, 7.5390625, 9.87890625, 12.21875, 14.55859375, 16.8984375, 19.23828125, 21.578125, 23.91796875, 26.2578125, 28.59765625, 30.9375, 33.27734375, 35.6171875, 37.95703125, 40.296875, 42.63671875, 44.9765625, 47.31640625, 49.65625, 51.99609375, 54.3359375, 56.67578125, 59.015625, 61.35546875, 63.6953125, 66.03515625, 68.375]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 4.0, 8.0, 11.0, 16.0, 14.0, 16.0, 23.0, 22.0, 22.0, 35.0, 40.0, 38.0, 47.0, 55.0, 74.0, 111.0, 368.0, 1545.0, 141.0, 80.0, 64.0, 54.0, 42.0, 32.0, 25.0, 22.0, 21.0, 14.0, 18.0, 8.0, 17.0, 11.0, 7.0, 9.0, 7.0, 4.0, 6.0, 7.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.0625, -49.1787109375, -47.294921875, -45.4111328125, -43.52734375, -41.6435546875, -39.759765625, -37.8759765625, -35.9921875, -34.1083984375, -32.224609375, -30.3408203125, -28.45703125, -26.5732421875, -24.689453125, -22.8056640625, -20.921875, -19.0380859375, -17.154296875, -15.2705078125, -13.38671875, -11.5029296875, -9.619140625, -7.7353515625, -5.8515625, -3.9677734375, -2.083984375, -0.2001953125, 1.68359375, 3.5673828125, 5.451171875, 7.3349609375, 9.21875, 11.1025390625, 12.986328125, 14.8701171875, 16.75390625, 18.6376953125, 20.521484375, 22.4052734375, 24.2890625, 26.1728515625, 28.056640625, 29.9404296875, 31.82421875, 33.7080078125, 35.591796875, 37.4755859375, 39.359375, 41.2431640625, 43.126953125, 45.0107421875, 46.89453125, 48.7783203125, 50.662109375, 52.5458984375, 54.4296875, 56.3134765625, 58.197265625, 60.0810546875, 61.96484375, 63.8486328125, 65.732421875, 67.6162109375, 69.5]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 6.0, 6.0, 9.0, 3.0, 11.0, 6.0, 12.0, 17.0, 14.0, 22.0, 38.0, 55.0, 95.0, 126.0, 190.0, 423.0, 1049.0, 5915.0, 3132303.0, 3591.0, 869.0, 374.0, 204.0, 115.0, 71.0, 38.0, 32.0, 29.0, 23.0, 21.0, 11.0, 13.0, 4.0, 2.0, 4.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-341.25, -332.80859375, -324.3671875, -315.92578125, -307.484375, -299.04296875, -290.6015625, -282.16015625, -273.71875, -265.27734375, -256.8359375, -248.39453125, -239.953125, -231.51171875, -223.0703125, -214.62890625, -206.1875, -197.74609375, -189.3046875, -180.86328125, -172.421875, -163.98046875, -155.5390625, -147.09765625, -138.65625, -130.21484375, -121.7734375, -113.33203125, -104.890625, -96.44921875, -88.0078125, -79.56640625, -71.125, -62.68359375, -54.2421875, -45.80078125, -37.359375, -28.91796875, -20.4765625, -12.03515625, -3.59375, 4.84765625, 13.2890625, 21.73046875, 30.171875, 38.61328125, 47.0546875, 55.49609375, 63.9375, 72.37890625, 80.8203125, 89.26171875, 97.703125, 106.14453125, 114.5859375, 123.02734375, 131.46875, 139.91015625, 148.3515625, 156.79296875, 165.234375, 173.67578125, 182.1171875, 190.55859375, 199.0]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 16.0, 135.0, 497.0, 296.0, 55.0, 12.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-255.23687744140625, -242.28587341308594, -229.33486938476562, -216.38388061523438, -203.43287658691406, -190.48187255859375, -177.5308837890625, -164.5798797607422, -151.62887573242188, -138.67787170410156, -125.72687530517578, -112.77587890625, -99.82487487792969, -86.87387084960938, -73.9228744506836, -60.97187805175781, -48.0208740234375, -35.06987380981445, -22.118873596191406, -9.16787338256836, 3.7831268310546875, 16.734130859375, 29.68512725830078, 42.63612365722656, 55.587127685546875, 68.53813171386719, 81.48912811279297, 94.44012451171875, 107.39112854003906, 120.34213256835938, 133.29312133789062, 146.24412536621094, 159.19512939453125, 172.14613342285156, 185.09713745117188, 198.04812622070312, 210.99913024902344, 223.95013427734375, 236.901123046875, 249.8521270751953, 262.8031311035156, 275.7541198730469, 288.70513916015625, 301.6561279296875, 314.60711669921875, 327.5581359863281, 340.5091247558594, 353.46014404296875, 366.4111328125, 379.36212158203125, 392.3131408691406, 405.2641296386719, 418.21514892578125, 431.1661376953125, 444.11712646484375, 457.068115234375, 470.0191345214844, 482.9701232910156, 495.921142578125, 508.87213134765625, 521.8231201171875, 534.774169921875, 547.7251586914062, 560.6761474609375, 573.6271362304688]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 1.0, 6.0, 4.0, 6.0, 5.0, 11.0, 6.0, 12.0, 11.0, 10.0, 17.0, 20.0, 20.0, 20.0, 21.0, 28.0, 36.0, 34.0, 37.0, 21.0, 39.0, 34.0, 31.0, 37.0, 28.0, 48.0, 38.0, 36.0, 36.0, 37.0, 43.0, 34.0, 28.0, 28.0, 32.0, 17.0, 9.0, 14.0, 17.0, 14.0, 13.0, 10.0, 10.0, 10.0, 8.0, 10.0, 3.0, 5.0, 3.0, 7.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-136.9477081298828, -132.6690216064453, -128.39035034179688, -124.11166381835938, -119.83297729492188, -115.55429077148438, -111.2756118774414, -106.99693298339844, -102.71824645996094, -98.43955993652344, -94.16088104248047, -89.8822021484375, -85.603515625, -81.3248291015625, -77.04615020751953, -72.76747131347656, -68.48878479003906, -64.21009826660156, -59.931419372558594, -55.65273666381836, -51.374053955078125, -47.09537124633789, -42.816688537597656, -38.53800582885742, -34.25932312011719, -29.980640411376953, -25.70195770263672, -21.423274993896484, -17.14459228515625, -12.865909576416016, -8.587226867675781, -4.308544158935547, -0.029876708984375, 4.248805999755859, 8.527488708496094, 12.806171417236328, 17.084854125976562, 21.363536834716797, 25.64221954345703, 29.920902252197266, 34.1995849609375, 38.478267669677734, 42.75695037841797, 47.0356330871582, 51.31431579589844, 55.59299850463867, 59.871681213378906, 64.15036010742188, 68.42904663085938, 72.70773315429688, 76.98641204833984, 81.26509094238281, 85.54377746582031, 89.82246398925781, 94.10114288330078, 98.37982177734375, 102.65850830078125, 106.93719482421875, 111.21587371826172, 115.49455261230469, 119.77323913574219, 124.05192565917969, 128.33059692382812, 132.60928344726562, 136.88796997070312]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 5.0, 4.0, 3.0, 4.0, 14.0, 10.0, 14.0, 15.0, 17.0, 25.0, 19.0, 14.0, 21.0, 31.0, 24.0, 41.0, 33.0, 50.0, 36.0, 53.0, 43.0, 44.0, 48.0, 30.0, 41.0, 40.0, 41.0, 46.0, 32.0, 30.0, 28.0, 22.0, 21.0, 17.0, 20.0, 11.0, 16.0, 8.0, 5.0, 6.0, 5.0, 4.0, 4.0, 5.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-25.125, -24.2158203125, -23.306640625, -22.3974609375, -21.48828125, -20.5791015625, -19.669921875, -18.7607421875, -17.8515625, -16.9423828125, -16.033203125, -15.1240234375, -14.21484375, -13.3056640625, -12.396484375, -11.4873046875, -10.578125, -9.6689453125, -8.759765625, -7.8505859375, -6.94140625, -6.0322265625, -5.123046875, -4.2138671875, -3.3046875, -2.3955078125, -1.486328125, -0.5771484375, 0.33203125, 1.2412109375, 2.150390625, 3.0595703125, 3.96875, 4.8779296875, 5.787109375, 6.6962890625, 7.60546875, 8.5146484375, 9.423828125, 10.3330078125, 11.2421875, 12.1513671875, 13.060546875, 13.9697265625, 14.87890625, 15.7880859375, 16.697265625, 17.6064453125, 18.515625, 19.4248046875, 20.333984375, 21.2431640625, 22.15234375, 23.0615234375, 23.970703125, 24.8798828125, 25.7890625, 26.6982421875, 27.607421875, 28.5166015625, 29.42578125, 30.3349609375, 31.244140625, 32.1533203125, 33.0625]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 4.0, 4.0, 10.0, 13.0, 7.0, 18.0, 13.0, 17.0, 35.0, 39.0, 35.0, 38.0, 40.0, 63.0, 69.0, 99.0, 127.0, 267.0, 437.0, 927.0, 2236.0, 5782.0, 22908.0, 259916.0, 3150781.0, 698091.0, 39263.0, 7654.0, 2717.0, 1126.0, 546.0, 301.0, 174.0, 115.0, 95.0, 64.0, 35.0, 47.0, 28.0, 32.0, 25.0, 21.0, 13.0, 9.0, 11.0, 8.0, 7.0, 4.0, 0.0, 2.0, 5.0, 1.0, 5.0, 2.0, 2.0, 1.0, 2.0], "bins": [-69.125, -66.94140625, -64.7578125, -62.57421875, -60.390625, -58.20703125, -56.0234375, -53.83984375, -51.65625, -49.47265625, -47.2890625, -45.10546875, -42.921875, -40.73828125, -38.5546875, -36.37109375, -34.1875, -32.00390625, -29.8203125, -27.63671875, -25.453125, -23.26953125, -21.0859375, -18.90234375, -16.71875, -14.53515625, -12.3515625, -10.16796875, -7.984375, -5.80078125, -3.6171875, -1.43359375, 0.75, 2.93359375, 5.1171875, 7.30078125, 9.484375, 11.66796875, 13.8515625, 16.03515625, 18.21875, 20.40234375, 22.5859375, 24.76953125, 26.953125, 29.13671875, 31.3203125, 33.50390625, 35.6875, 37.87109375, 40.0546875, 42.23828125, 44.421875, 46.60546875, 48.7890625, 50.97265625, 53.15625, 55.33984375, 57.5234375, 59.70703125, 61.890625, 64.07421875, 66.2578125, 68.44140625, 70.625]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 2.0, 14.0, 17.0, 21.0, 45.0, 52.0, 74.0, 122.0, 188.0, 328.0, 566.0, 877.0, 724.0, 391.0, 232.0, 158.0, 88.0, 66.0, 42.0, 15.0, 16.0, 9.0, 11.0, 4.0, 5.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.875, -66.947265625, -65.01953125, -63.091796875, -61.1640625, -59.236328125, -57.30859375, -55.380859375, -53.453125, -51.525390625, -49.59765625, -47.669921875, -45.7421875, -43.814453125, -41.88671875, -39.958984375, -38.03125, -36.103515625, -34.17578125, -32.248046875, -30.3203125, -28.392578125, -26.46484375, -24.537109375, -22.609375, -20.681640625, -18.75390625, -16.826171875, -14.8984375, -12.970703125, -11.04296875, -9.115234375, -7.1875, -5.259765625, -3.33203125, -1.404296875, 0.5234375, 2.451171875, 4.37890625, 6.306640625, 8.234375, 10.162109375, 12.08984375, 14.017578125, 15.9453125, 17.873046875, 19.80078125, 21.728515625, 23.65625, 25.583984375, 27.51171875, 29.439453125, 31.3671875, 33.294921875, 35.22265625, 37.150390625, 39.078125, 41.005859375, 42.93359375, 44.861328125, 46.7890625, 48.716796875, 50.64453125, 52.572265625, 54.5]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 8.0, 7.0, 15.0, 24.0, 18.0, 48.0, 98.0, 169.0, 335.0, 943.0, 3747.0, 29088.0, 3639892.0, 502791.0, 13521.0, 2249.0, 711.0, 271.0, 158.0, 69.0, 44.0, 34.0, 19.0, 4.0, 8.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-136.75, -132.16796875, -127.5859375, -123.00390625, -118.421875, -113.83984375, -109.2578125, -104.67578125, -100.09375, -95.51171875, -90.9296875, -86.34765625, -81.765625, -77.18359375, -72.6015625, -68.01953125, -63.4375, -58.85546875, -54.2734375, -49.69140625, -45.109375, -40.52734375, -35.9453125, -31.36328125, -26.78125, -22.19921875, -17.6171875, -13.03515625, -8.453125, -3.87109375, 0.7109375, 5.29296875, 9.875, 14.45703125, 19.0390625, 23.62109375, 28.203125, 32.78515625, 37.3671875, 41.94921875, 46.53125, 51.11328125, 55.6953125, 60.27734375, 64.859375, 69.44140625, 74.0234375, 78.60546875, 83.1875, 87.76953125, 92.3515625, 96.93359375, 101.515625, 106.09765625, 110.6796875, 115.26171875, 119.84375, 124.42578125, 129.0078125, 133.58984375, 138.171875, 142.75390625, 147.3359375, 151.91796875, 156.5]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 7.0, 26.0, 173.0, 696.0, 101.0, 13.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-271.91302490234375, -239.56765747070312, -207.2222900390625, -174.87693786621094, -142.5315704345703, -110.18620300292969, -77.84085083007812, -45.4954833984375, -13.150115966796875, 19.195247650146484, 51.540611267089844, 83.88597106933594, 116.23133850097656, 148.5767059326172, 180.92205810546875, 213.26742553710938, 245.61279296875, 277.9581604003906, 310.30352783203125, 342.64886474609375, 374.9942626953125, 407.339599609375, 439.6849670410156, 472.03033447265625, 504.3757019042969, 536.7210693359375, 569.06640625, 601.4118041992188, 633.7571411132812, 666.1025390625, 698.4478759765625, 730.793212890625, 763.1385498046875, 795.48388671875, 827.8292846679688, 860.1746215820312, 892.52001953125, 924.8653564453125, 957.210693359375, 989.5560913085938, 1021.9014892578125, 1054.246826171875, 1086.5921630859375, 1118.9376220703125, 1151.282958984375, 1183.6282958984375, 1215.9736328125, 1248.319091796875, 1280.664306640625, 1313.0096435546875, 1345.35498046875, 1377.700439453125, 1410.0457763671875, 1442.39111328125, 1474.7364501953125, 1507.081787109375, 1539.42724609375, 1571.7725830078125, 1604.117919921875, 1636.46337890625, 1668.8087158203125, 1701.154052734375, 1733.4993896484375, 1765.8447265625, 1798.190185546875]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 2.0, 7.0, 8.0, 5.0, 10.0, 15.0, 10.0, 12.0, 9.0, 17.0, 20.0, 26.0, 36.0, 29.0, 29.0, 35.0, 38.0, 40.0, 39.0, 38.0, 42.0, 42.0, 50.0, 28.0, 40.0, 36.0, 44.0, 37.0, 36.0, 22.0, 25.0, 24.0, 27.0, 24.0, 24.0, 13.0, 18.0, 12.0, 5.0, 6.0, 6.0, 5.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-160.9530029296875, -156.26988220214844, -151.58677673339844, -146.90365600585938, -142.22055053710938, -137.5374298095703, -132.8543243408203, -128.17120361328125, -123.48809051513672, -118.80497741699219, -114.12186431884766, -109.43875122070312, -104.75563049316406, -100.07252502441406, -95.389404296875, -90.70629119873047, -86.02317810058594, -81.3400650024414, -76.65695190429688, -71.97383880615234, -67.29072570800781, -62.607608795166016, -57.92449188232422, -53.24137878417969, -48.558265686035156, -43.875152587890625, -39.192039489746094, -34.5089225769043, -29.825809478759766, -25.142696380615234, -20.45958137512207, -15.776466369628906, -11.093368530273438, -6.41025447845459, -1.7271404266357422, 2.9559736251831055, 7.639087677001953, 12.322200775146484, 17.00531578063965, 21.688430786132812, 26.371543884277344, 31.054656982421875, 35.737770080566406, 40.4208869934082, 45.104000091552734, 49.787113189697266, 54.47023010253906, 59.153343200683594, 63.836456298828125, 68.51956939697266, 73.20268249511719, 77.88579559326172, 82.56890869140625, 87.25202941894531, 91.93514251708984, 96.61825561523438, 101.3013687133789, 105.98448181152344, 110.66759490966797, 115.3507080078125, 120.03382873535156, 124.71693420410156, 129.40005493164062, 134.08316040039062, 138.7662811279297]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 7.0, 14.0, 5.0, 10.0, 12.0, 14.0, 20.0, 21.0, 26.0, 24.0, 27.0, 26.0, 40.0, 33.0, 41.0, 42.0, 46.0, 38.0, 31.0, 49.0, 42.0, 52.0, 45.0, 39.0, 40.0, 38.0, 33.0, 31.0, 27.0, 23.0, 14.0, 22.0, 16.0, 10.0, 5.0, 13.0, 6.0, 9.0, 3.0, 3.0, 6.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.890625, -23.07861328125, -22.2666015625, -21.45458984375, -20.642578125, -19.83056640625, -19.0185546875, -18.20654296875, -17.39453125, -16.58251953125, -15.7705078125, -14.95849609375, -14.146484375, -13.33447265625, -12.5224609375, -11.71044921875, -10.8984375, -10.08642578125, -9.2744140625, -8.46240234375, -7.650390625, -6.83837890625, -6.0263671875, -5.21435546875, -4.40234375, -3.59033203125, -2.7783203125, -1.96630859375, -1.154296875, -0.34228515625, 0.4697265625, 1.28173828125, 2.09375, 2.90576171875, 3.7177734375, 4.52978515625, 5.341796875, 6.15380859375, 6.9658203125, 7.77783203125, 8.58984375, 9.40185546875, 10.2138671875, 11.02587890625, 11.837890625, 12.64990234375, 13.4619140625, 14.27392578125, 15.0859375, 15.89794921875, 16.7099609375, 17.52197265625, 18.333984375, 19.14599609375, 19.9580078125, 20.77001953125, 21.58203125, 22.39404296875, 23.2060546875, 24.01806640625, 24.830078125, 25.64208984375, 26.4541015625, 27.26611328125, 28.078125]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 7.0, 11.0, 5.0, 13.0, 22.0, 29.0, 41.0, 64.0, 63.0, 128.0, 208.0, 259.0, 424.0, 627.0, 809.0, 1393.0, 2103.0, 3187.0, 4923.0, 7621.0, 11903.0, 18868.0, 30126.0, 50344.0, 87735.0, 160336.0, 247026.0, 177929.0, 97002.0, 55335.0, 33062.0, 20215.0, 12896.0, 8143.0, 5321.0, 3565.0, 2318.0, 1559.0, 1002.0, 659.0, 444.0, 284.0, 185.0, 135.0, 73.0, 62.0, 34.0, 26.0, 15.0, 9.0, 6.0, 3.0, 7.0, 3.0, 0.0, 0.0, 2.0], "bins": [-1.259765625, -1.222259521484375, -1.18475341796875, -1.147247314453125, -1.1097412109375, -1.072235107421875, -1.03472900390625, -0.997222900390625, -0.959716796875, -0.922210693359375, -0.88470458984375, -0.847198486328125, -0.8096923828125, -0.772186279296875, -0.73468017578125, -0.697174072265625, -0.65966796875, -0.622161865234375, -0.58465576171875, -0.547149658203125, -0.5096435546875, -0.472137451171875, -0.43463134765625, -0.397125244140625, -0.359619140625, -0.322113037109375, -0.28460693359375, -0.247100830078125, -0.2095947265625, -0.172088623046875, -0.13458251953125, -0.097076416015625, -0.0595703125, -0.022064208984375, 0.01544189453125, 0.052947998046875, 0.0904541015625, 0.127960205078125, 0.16546630859375, 0.202972412109375, 0.240478515625, 0.277984619140625, 0.31549072265625, 0.352996826171875, 0.3905029296875, 0.428009033203125, 0.46551513671875, 0.503021240234375, 0.54052734375, 0.578033447265625, 0.61553955078125, 0.653045654296875, 0.6905517578125, 0.728057861328125, 0.76556396484375, 0.803070068359375, 0.840576171875, 0.878082275390625, 0.91558837890625, 0.953094482421875, 0.9906005859375, 1.028106689453125, 1.06561279296875, 1.103118896484375, 1.140625]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 7.0, 15.0, 14.0, 8.0, 16.0, 16.0, 19.0, 24.0, 20.0, 27.0, 32.0, 26.0, 34.0, 35.0, 27.0, 42.0, 35.0, 36.0, 47.0, 1061.0, 43.0, 33.0, 38.0, 28.0, 37.0, 30.0, 32.0, 20.0, 34.0, 31.0, 28.0, 16.0, 20.0, 14.0, 17.0, 12.0, 9.0, 12.0, 3.0, 8.0, 5.0, 4.0, 6.0, 3.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.734375, -13.26416015625, -12.7939453125, -12.32373046875, -11.853515625, -11.38330078125, -10.9130859375, -10.44287109375, -9.97265625, -9.50244140625, -9.0322265625, -8.56201171875, -8.091796875, -7.62158203125, -7.1513671875, -6.68115234375, -6.2109375, -5.74072265625, -5.2705078125, -4.80029296875, -4.330078125, -3.85986328125, -3.3896484375, -2.91943359375, -2.44921875, -1.97900390625, -1.5087890625, -1.03857421875, -0.568359375, -0.09814453125, 0.3720703125, 0.84228515625, 1.3125, 1.78271484375, 2.2529296875, 2.72314453125, 3.193359375, 3.66357421875, 4.1337890625, 4.60400390625, 5.07421875, 5.54443359375, 6.0146484375, 6.48486328125, 6.955078125, 7.42529296875, 7.8955078125, 8.36572265625, 8.8359375, 9.30615234375, 9.7763671875, 10.24658203125, 10.716796875, 11.18701171875, 11.6572265625, 12.12744140625, 12.59765625, 13.06787109375, 13.5380859375, 14.00830078125, 14.478515625, 14.94873046875, 15.4189453125, 15.88916015625, 16.359375]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 11.0, 13.0, 15.0, 27.0, 36.0, 58.0, 107.0, 151.0, 189.0, 238.0, 440.0, 604.0, 907.0, 1286.0, 1831.0, 2721.0, 3841.0, 5520.0, 7711.0, 11143.0, 16315.0, 24166.0, 35887.0, 55583.0, 87280.0, 143705.0, 1253959.0, 161161.0, 97957.0, 60653.0, 39631.0, 26305.0, 17600.0, 12198.0, 8513.0, 5906.0, 4125.0, 2920.0, 2012.0, 1444.0, 922.0, 607.0, 484.0, 340.0, 207.0, 135.0, 98.0, 69.0, 30.0, 30.0, 16.0, 11.0, 7.0, 5.0, 6.0, 2.0, 0.0, 1.0], "bins": [-0.93115234375, -0.9026031494140625, -0.874053955078125, -0.8455047607421875, -0.81695556640625, -0.7884063720703125, -0.759857177734375, -0.7313079833984375, -0.7027587890625, -0.6742095947265625, -0.645660400390625, -0.6171112060546875, -0.58856201171875, -0.5600128173828125, -0.531463623046875, -0.5029144287109375, -0.474365234375, -0.4458160400390625, -0.417266845703125, -0.3887176513671875, -0.36016845703125, -0.3316192626953125, -0.303070068359375, -0.2745208740234375, -0.2459716796875, -0.2174224853515625, -0.188873291015625, -0.1603240966796875, -0.13177490234375, -0.1032257080078125, -0.074676513671875, -0.0461273193359375, -0.017578125, 0.0109710693359375, 0.039520263671875, 0.0680694580078125, 0.09661865234375, 0.1251678466796875, 0.153717041015625, 0.1822662353515625, 0.2108154296875, 0.2393646240234375, 0.267913818359375, 0.2964630126953125, 0.32501220703125, 0.3535614013671875, 0.382110595703125, 0.4106597900390625, 0.439208984375, 0.4677581787109375, 0.496307373046875, 0.5248565673828125, 0.55340576171875, 0.5819549560546875, 0.610504150390625, 0.6390533447265625, 0.6676025390625, 0.6961517333984375, 0.724700927734375, 0.7532501220703125, 0.78179931640625, 0.8103485107421875, 0.838897705078125, 0.8674468994140625, 0.89599609375]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 11.0, 3.0, 9.0, 11.0, 14.0, 15.0, 11.0, 18.0, 25.0, 30.0, 33.0, 38.0, 39.0, 40.0, 69.0, 64.0, 69.0, 66.0, 67.0, 50.0, 51.0, 52.0, 36.0, 35.0, 35.0, 23.0, 20.0, 22.0, 14.0, 8.0, 11.0, 2.0, 4.0, 2.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.005615234375, -0.0054631829261779785, -0.005311131477355957, -0.0051590800285339355, -0.005007028579711914, -0.004854977130889893, -0.004702925682067871, -0.00455087423324585, -0.004398822784423828, -0.004246771335601807, -0.004094719886779785, -0.003942668437957764, -0.003790616989135742, -0.0036385655403137207, -0.0034865140914916992, -0.0033344626426696777, -0.0031824111938476562, -0.0030303597450256348, -0.0028783082962036133, -0.002726256847381592, -0.0025742053985595703, -0.002422153949737549, -0.0022701025009155273, -0.002118051052093506, -0.0019659996032714844, -0.0018139481544494629, -0.0016618967056274414, -0.00150984525680542, -0.0013577938079833984, -0.001205742359161377, -0.0010536909103393555, -0.000901639461517334, -0.0007495880126953125, -0.000597536563873291, -0.00044548511505126953, -0.00029343366622924805, -0.00014138221740722656, 1.0669231414794922e-05, 0.0001627206802368164, 0.0003147721290588379, 0.0004668235778808594, 0.0006188750267028809, 0.0007709264755249023, 0.0009229779243469238, 0.0010750293731689453, 0.0012270808219909668, 0.0013791322708129883, 0.0015311837196350098, 0.0016832351684570312, 0.0018352866172790527, 0.0019873380661010742, 0.0021393895149230957, 0.002291440963745117, 0.0024434924125671387, 0.00259554386138916, 0.0027475953102111816, 0.002899646759033203, 0.0030516982078552246, 0.003203749656677246, 0.0033558011054992676, 0.003507852554321289, 0.0036599040031433105, 0.003811955451965332, 0.0039640069007873535, 0.004116058349609375]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 5.0, 1.0, 1.0, 5.0, 3.0, 4.0, 6.0, 10.0, 12.0, 14.0, 13.0, 28.0, 31.0, 45.0, 64.0, 63.0, 98.0, 119.0, 188.0, 247.0, 491.0, 1248.0, 78809.0, 961902.0, 3344.0, 700.0, 323.0, 207.0, 146.0, 91.0, 86.0, 50.0, 49.0, 33.0, 32.0, 21.0, 21.0, 18.0, 10.0, 9.0, 5.0, 5.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07342529296875, -0.07062530517578125, -0.0678253173828125, -0.06502532958984375, -0.062225341796875, -0.05942535400390625, -0.0566253662109375, -0.05382537841796875, -0.051025390625, -0.04822540283203125, -0.0454254150390625, -0.04262542724609375, -0.039825439453125, -0.03702545166015625, -0.0342254638671875, -0.03142547607421875, -0.02862548828125, -0.02582550048828125, -0.0230255126953125, -0.02022552490234375, -0.017425537109375, -0.01462554931640625, -0.0118255615234375, -0.00902557373046875, -0.0062255859375, -0.00342559814453125, -0.0006256103515625, 0.00217437744140625, 0.004974365234375, 0.00777435302734375, 0.0105743408203125, 0.01337432861328125, 0.01617431640625, 0.01897430419921875, 0.0217742919921875, 0.02457427978515625, 0.027374267578125, 0.03017425537109375, 0.0329742431640625, 0.03577423095703125, 0.03857421875, 0.04137420654296875, 0.0441741943359375, 0.04697418212890625, 0.049774169921875, 0.05257415771484375, 0.0553741455078125, 0.05817413330078125, 0.06097412109375, 0.06377410888671875, 0.0665740966796875, 0.06937408447265625, 0.072174072265625, 0.07497406005859375, 0.0777740478515625, 0.08057403564453125, 0.0833740234375, 0.08617401123046875, 0.0889739990234375, 0.09177398681640625, 0.094573974609375, 0.09737396240234375, 0.1001739501953125, 0.10297393798828125, 0.10577392578125]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 18.0, 90.0, 461.0, 360.0, 66.0, 13.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.007264423184096813, -0.0068797217682003975, -0.006495020352303982, -0.006110318936407566, -0.00572561752051115, -0.005340916104614735, -0.004956214688718319, -0.004571513272821903, -0.0041868118569254875, -0.003802110441029072, -0.003417409025132656, -0.0030327076092362404, -0.0026480061933398247, -0.002263304777443409, -0.0018786033615469933, -0.0014939019456505775, -0.0011092005297541618, -0.0007244991138577461, -0.0003397976979613304, 4.49037179350853e-05, 0.000429605133831501, 0.0008143065497279167, 0.0011990079656243324, 0.0015837093815207481, 0.001968410797417164, 0.0023531122133135796, 0.0027378136292099953, 0.003122515045106411, 0.0035072164610028267, 0.0038919178768992424, 0.004276619292795658, 0.004661320708692074, 0.005046021193265915, 0.005430722609162331, 0.005815424025058746, 0.006200125440955162, 0.006584826856851578, 0.0069695282727479935, 0.007354229688644409, 0.007738931104540825, 0.00812363252043724, 0.008508333936333656, 0.008893035352230072, 0.009277736768126488, 0.009662438184022903, 0.01004713959991932, 0.010431841015815735, 0.01081654243171215, 0.011201243847608566, 0.011585945263504982, 0.011970646679401398, 0.012355348095297813, 0.012740049511194229, 0.013124750927090645, 0.01350945234298706, 0.013894153758883476, 0.014278855174779892, 0.014663556590676308, 0.015048258006572723, 0.015432959422469139, 0.015817660838365555, 0.01620236225426197, 0.016587063670158386, 0.016971765086054802, 0.017356466501951218]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 11.0, 5.0, 3.0, 10.0, 13.0, 13.0, 15.0, 13.0, 20.0, 16.0, 14.0, 22.0, 24.0, 35.0, 34.0, 44.0, 37.0, 35.0, 27.0, 36.0, 32.0, 29.0, 39.0, 35.0, 34.0, 41.0, 39.0, 32.0, 32.0, 32.0, 36.0, 26.0, 29.0, 23.0, 13.0, 21.0, 12.0, 14.0, 14.0, 8.0, 7.0, 1.0, 5.0, 7.0, 6.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.002219557762145996, -0.002150637097656727, -0.0020817164331674576, -0.0020127957686781883, -0.001943875104188919, -0.0018749544396996498, -0.0018060337752103806, -0.0017371131107211113, -0.001668192446231842, -0.0015992717817425728, -0.0015303511172533035, -0.0014614304527640343, -0.001392509788274765, -0.0013235891237854958, -0.0012546684592962265, -0.0011857477948069572, -0.001116827130317688, -0.0010479064658284187, -0.0009789858013391495, -0.0009100651368498802, -0.000841144472360611, -0.0007722238078713417, -0.0007033031433820724, -0.0006343824788928032, -0.0005654618144035339, -0.0004965411499142647, -0.0004276204854249954, -0.00035869982093572617, -0.0002897791564464569, -0.00022085849195718765, -0.0001519378274679184, -8.301716297864914e-05, -1.4096498489379883e-05, 5.4824165999889374e-05, 0.00012374483048915863, 0.0001926654949784279, 0.00026158615946769714, 0.0003305068239569664, 0.00039942748844623566, 0.0004683481529355049, 0.0005372688174247742, 0.0006061894819140434, 0.0006751101464033127, 0.0007440308108925819, 0.0008129514753818512, 0.0008818721398711205, 0.0009507928043603897, 0.001019713468849659, 0.0010886341333389282, 0.0011575547978281975, 0.0012264754623174667, 0.001295396126806736, 0.0013643167912960052, 0.0014332374557852745, 0.0015021581202745438, 0.001571078784763813, 0.0016399994492530823, 0.0017089201137423515, 0.0017778407782316208, 0.00184676144272089, 0.0019156821072101593, 0.0019846027716994286, 0.002053523436188698, 0.002122444100677967, 0.0021913647651672363]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 7.0, 14.0, 5.0, 10.0, 12.0, 14.0, 20.0, 21.0, 26.0, 24.0, 27.0, 26.0, 40.0, 32.0, 42.0, 42.0, 46.0, 38.0, 31.0, 49.0, 42.0, 52.0, 45.0, 39.0, 40.0, 38.0, 33.0, 31.0, 27.0, 22.0, 15.0, 22.0, 16.0, 10.0, 5.0, 13.0, 6.0, 9.0, 3.0, 3.0, 6.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.890625, -23.07861328125, -22.2666015625, -21.45458984375, -20.642578125, -19.83056640625, -19.0185546875, -18.20654296875, -17.39453125, -16.58251953125, -15.7705078125, -14.95849609375, -14.146484375, -13.33447265625, -12.5224609375, -11.71044921875, -10.8984375, -10.08642578125, -9.2744140625, -8.46240234375, -7.650390625, -6.83837890625, -6.0263671875, -5.21435546875, -4.40234375, -3.59033203125, -2.7783203125, -1.96630859375, -1.154296875, -0.34228515625, 0.4697265625, 1.28173828125, 2.09375, 2.90576171875, 3.7177734375, 4.52978515625, 5.341796875, 6.15380859375, 6.9658203125, 7.77783203125, 8.58984375, 9.40185546875, 10.2138671875, 11.02587890625, 11.837890625, 12.64990234375, 13.4619140625, 14.27392578125, 15.0859375, 15.89794921875, 16.7099609375, 17.52197265625, 18.333984375, 19.14599609375, 19.9580078125, 20.77001953125, 21.58203125, 22.39404296875, 23.2060546875, 24.01806640625, 24.830078125, 25.64208984375, 26.4541015625, 27.26611328125, 28.078125]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 5.0, 5.0, 0.0, 3.0, 6.0, 8.0, 9.0, 16.0, 38.0, 44.0, 55.0, 75.0, 74.0, 118.0, 145.0, 189.0, 272.0, 384.0, 578.0, 928.0, 1457.0, 2521.0, 5073.0, 11188.0, 30406.0, 117177.0, 600904.0, 202329.0, 44917.0, 15188.0, 6359.0, 3079.0, 1641.0, 1138.0, 640.0, 426.0, 331.0, 234.0, 137.0, 120.0, 82.0, 55.0, 55.0, 34.0, 33.0, 21.0, 13.0, 20.0, 11.0, 7.0, 9.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-33.65625, -32.48193359375, -31.3076171875, -30.13330078125, -28.958984375, -27.78466796875, -26.6103515625, -25.43603515625, -24.26171875, -23.08740234375, -21.9130859375, -20.73876953125, -19.564453125, -18.39013671875, -17.2158203125, -16.04150390625, -14.8671875, -13.69287109375, -12.5185546875, -11.34423828125, -10.169921875, -8.99560546875, -7.8212890625, -6.64697265625, -5.47265625, -4.29833984375, -3.1240234375, -1.94970703125, -0.775390625, 0.39892578125, 1.5732421875, 2.74755859375, 3.921875, 5.09619140625, 6.2705078125, 7.44482421875, 8.619140625, 9.79345703125, 10.9677734375, 12.14208984375, 13.31640625, 14.49072265625, 15.6650390625, 16.83935546875, 18.013671875, 19.18798828125, 20.3623046875, 21.53662109375, 22.7109375, 23.88525390625, 25.0595703125, 26.23388671875, 27.408203125, 28.58251953125, 29.7568359375, 30.93115234375, 32.10546875, 33.27978515625, 34.4541015625, 35.62841796875, 36.802734375, 37.97705078125, 39.1513671875, 40.32568359375, 41.5]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 6.0, 2.0, 2.0, 6.0, 7.0, 3.0, 15.0, 23.0, 24.0, 21.0, 29.0, 49.0, 42.0, 65.0, 68.0, 107.0, 342.0, 1650.0, 170.0, 87.0, 67.0, 48.0, 58.0, 39.0, 28.0, 20.0, 22.0, 12.0, 15.0, 6.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.25, -60.1181640625, -57.986328125, -55.8544921875, -53.72265625, -51.5908203125, -49.458984375, -47.3271484375, -45.1953125, -43.0634765625, -40.931640625, -38.7998046875, -36.66796875, -34.5361328125, -32.404296875, -30.2724609375, -28.140625, -26.0087890625, -23.876953125, -21.7451171875, -19.61328125, -17.4814453125, -15.349609375, -13.2177734375, -11.0859375, -8.9541015625, -6.822265625, -4.6904296875, -2.55859375, -0.4267578125, 1.705078125, 3.8369140625, 5.96875, 8.1005859375, 10.232421875, 12.3642578125, 14.49609375, 16.6279296875, 18.759765625, 20.8916015625, 23.0234375, 25.1552734375, 27.287109375, 29.4189453125, 31.55078125, 33.6826171875, 35.814453125, 37.9462890625, 40.078125, 42.2099609375, 44.341796875, 46.4736328125, 48.60546875, 50.7373046875, 52.869140625, 55.0009765625, 57.1328125, 59.2646484375, 61.396484375, 63.5283203125, 65.66015625, 67.7919921875, 69.923828125, 72.0556640625, 74.1875]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 3.0, 5.0, 10.0, 18.0, 24.0, 18.0, 48.0, 63.0, 69.0, 138.0, 276.0, 537.0, 1592.0, 347846.0, 2791889.0, 1841.0, 585.0, 295.0, 133.0, 120.0, 74.0, 42.0, 26.0, 16.0, 15.0, 9.0, 3.0, 2.0, 7.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-179.875, -174.59375, -169.3125, -164.03125, -158.75, -153.46875, -148.1875, -142.90625, -137.625, -132.34375, -127.0625, -121.78125, -116.5, -111.21875, -105.9375, -100.65625, -95.375, -90.09375, -84.8125, -79.53125, -74.25, -68.96875, -63.6875, -58.40625, -53.125, -47.84375, -42.5625, -37.28125, -32.0, -26.71875, -21.4375, -16.15625, -10.875, -5.59375, -0.3125, 4.96875, 10.25, 15.53125, 20.8125, 26.09375, 31.375, 36.65625, 41.9375, 47.21875, 52.5, 57.78125, 63.0625, 68.34375, 73.625, 78.90625, 84.1875, 89.46875, 94.75, 100.03125, 105.3125, 110.59375, 115.875, 121.15625, 126.4375, 131.71875, 137.0, 142.28125, 147.5625, 152.84375, 158.125]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 28.0, 588.0, 376.0, 22.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-584.1806030273438, -566.9111938476562, -549.6417846679688, -532.3723754882812, -515.1029663085938, -497.83355712890625, -480.56414794921875, -463.29473876953125, -446.02532958984375, -428.75592041015625, -411.48651123046875, -394.21710205078125, -376.94769287109375, -359.67828369140625, -342.40887451171875, -325.13946533203125, -307.87005615234375, -290.60064697265625, -273.33123779296875, -256.06182861328125, -238.79241943359375, -221.52301025390625, -204.25360107421875, -186.98419189453125, -169.71478271484375, -152.44537353515625, -135.17596435546875, -117.90655517578125, -100.63714599609375, -83.36773681640625, -66.09832763671875, -48.82891845703125, -31.5595703125, -14.2901611328125, 2.979248046875, 20.2486572265625, 37.51806640625, 54.7874755859375, 72.056884765625, 89.3262939453125, 106.595703125, 123.8651123046875, 141.134521484375, 158.4039306640625, 175.67333984375, 192.9427490234375, 210.212158203125, 227.4815673828125, 244.7509765625, 262.0203857421875, 279.289794921875, 296.5592041015625, 313.82861328125, 331.0980224609375, 348.367431640625, 365.6368408203125, 382.90625, 400.1756591796875, 417.445068359375, 434.7144775390625, 451.98388671875, 469.2532958984375, 486.522705078125, 503.7921142578125, 521.0615234375]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 6.0, 11.0, 2.0, 10.0, 11.0, 10.0, 21.0, 17.0, 22.0, 28.0, 22.0, 22.0, 30.0, 39.0, 40.0, 47.0, 33.0, 29.0, 42.0, 44.0, 39.0, 37.0, 37.0, 42.0, 44.0, 39.0, 35.0, 33.0, 26.0, 32.0, 35.0, 20.0, 18.0, 14.0, 15.0, 10.0, 9.0, 9.0, 5.0, 2.0, 3.0, 3.0, 5.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-101.70568084716797, -97.85025024414062, -93.99481964111328, -90.13938903808594, -86.28396606445312, -82.42853546142578, -78.57310485839844, -74.7176742553711, -70.86224365234375, -67.0068130493164, -63.15138626098633, -59.295955657958984, -55.440528869628906, -51.58509826660156, -47.72966766357422, -43.874237060546875, -40.01881408691406, -36.16338348388672, -32.30795669555664, -28.452526092529297, -24.597097396850586, -20.741668701171875, -16.88623809814453, -13.03080940246582, -9.17538070678711, -5.31995153427124, -1.464522361755371, 2.3909072875976562, 6.246335983276367, 10.101764678955078, 13.957195281982422, 17.812623977661133, 21.668060302734375, 25.523488998413086, 29.378917694091797, 33.23434829711914, 37.08977508544922, 40.94520568847656, 44.800636291503906, 48.65606689453125, 52.51149368286133, 56.36692428588867, 60.22235107421875, 64.0777816772461, 67.93321228027344, 71.78863525390625, 75.64407348632812, 79.49949645996094, 83.35492706298828, 87.21035766601562, 91.06578826904297, 94.92121887207031, 98.77664184570312, 102.63207244873047, 106.48750305175781, 110.34293365478516, 114.1983642578125, 118.05379486083984, 121.90922546386719, 125.7646484375, 129.62008666992188, 133.4755096435547, 137.3309326171875, 141.18637084960938, 145.0417938232422]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 2.0, 10.0, 13.0, 10.0, 12.0, 16.0, 17.0, 18.0, 23.0, 30.0, 33.0, 27.0, 33.0, 42.0, 37.0, 44.0, 50.0, 39.0, 39.0, 52.0, 42.0, 36.0, 47.0, 30.0, 33.0, 34.0, 33.0, 25.0, 31.0, 25.0, 20.0, 21.0, 14.0, 11.0, 10.0, 12.0, 9.0, 7.0, 5.0, 7.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.21875, -23.29736328125, -22.3759765625, -21.45458984375, -20.533203125, -19.61181640625, -18.6904296875, -17.76904296875, -16.84765625, -15.92626953125, -15.0048828125, -14.08349609375, -13.162109375, -12.24072265625, -11.3193359375, -10.39794921875, -9.4765625, -8.55517578125, -7.6337890625, -6.71240234375, -5.791015625, -4.86962890625, -3.9482421875, -3.02685546875, -2.10546875, -1.18408203125, -0.2626953125, 0.65869140625, 1.580078125, 2.50146484375, 3.4228515625, 4.34423828125, 5.265625, 6.18701171875, 7.1083984375, 8.02978515625, 8.951171875, 9.87255859375, 10.7939453125, 11.71533203125, 12.63671875, 13.55810546875, 14.4794921875, 15.40087890625, 16.322265625, 17.24365234375, 18.1650390625, 19.08642578125, 20.0078125, 20.92919921875, 21.8505859375, 22.77197265625, 23.693359375, 24.61474609375, 25.5361328125, 26.45751953125, 27.37890625, 28.30029296875, 29.2216796875, 30.14306640625, 31.064453125, 31.98583984375, 32.9072265625, 33.82861328125, 34.75]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 6.0, 8.0, 18.0, 13.0, 28.0, 41.0, 46.0, 66.0, 70.0, 114.0, 186.0, 230.0, 339.0, 489.0, 844.0, 1659.0, 3795.0, 10754.0, 44465.0, 2248876.0, 1828552.0, 36894.0, 9357.0, 3480.0, 1494.0, 804.0, 479.0, 308.0, 225.0, 155.0, 131.0, 100.0, 74.0, 45.0, 39.0, 21.0, 25.0, 21.0, 10.0, 5.0, 8.0, 2.0, 1.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-116.25, -111.7734375, -107.296875, -102.8203125, -98.34375, -93.8671875, -89.390625, -84.9140625, -80.4375, -75.9609375, -71.484375, -67.0078125, -62.53125, -58.0546875, -53.578125, -49.1015625, -44.625, -40.1484375, -35.671875, -31.1953125, -26.71875, -22.2421875, -17.765625, -13.2890625, -8.8125, -4.3359375, 0.140625, 4.6171875, 9.09375, 13.5703125, 18.046875, 22.5234375, 27.0, 31.4765625, 35.953125, 40.4296875, 44.90625, 49.3828125, 53.859375, 58.3359375, 62.8125, 67.2890625, 71.765625, 76.2421875, 80.71875, 85.1953125, 89.671875, 94.1484375, 98.625, 103.1015625, 107.578125, 112.0546875, 116.53125, 121.0078125, 125.484375, 129.9609375, 134.4375, 138.9140625, 143.390625, 147.8671875, 152.34375, 156.8203125, 161.296875, 165.7734375, 170.25]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 5.0, 2.0, 6.0, 4.0, 10.0, 14.0, 25.0, 38.0, 37.0, 66.0, 93.0, 197.0, 433.0, 1140.0, 1130.0, 411.0, 162.0, 111.0, 50.0, 48.0, 33.0, 15.0, 15.0, 14.0, 7.0, 3.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.9375, -78.3759765625, -74.814453125, -71.2529296875, -67.69140625, -64.1298828125, -60.568359375, -57.0068359375, -53.4453125, -49.8837890625, -46.322265625, -42.7607421875, -39.19921875, -35.6376953125, -32.076171875, -28.5146484375, -24.953125, -21.3916015625, -17.830078125, -14.2685546875, -10.70703125, -7.1455078125, -3.583984375, -0.0224609375, 3.5390625, 7.1005859375, 10.662109375, 14.2236328125, 17.78515625, 21.3466796875, 24.908203125, 28.4697265625, 32.03125, 35.5927734375, 39.154296875, 42.7158203125, 46.27734375, 49.8388671875, 53.400390625, 56.9619140625, 60.5234375, 64.0849609375, 67.646484375, 71.2080078125, 74.76953125, 78.3310546875, 81.892578125, 85.4541015625, 89.015625, 92.5771484375, 96.138671875, 99.7001953125, 103.26171875, 106.8232421875, 110.384765625, 113.9462890625, 117.5078125, 121.0693359375, 124.630859375, 128.1923828125, 131.75390625, 135.3154296875, 138.876953125, 142.4384765625, 146.0]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 0.0, 4.0, 2.0, 8.0, 7.0, 10.0, 20.0, 23.0, 53.0, 77.0, 126.0, 203.0, 274.0, 504.0, 957.0, 1741.0, 3306.0, 6786.0, 15507.0, 39942.0, 152622.0, 2858484.0, 963615.0, 96854.0, 29620.0, 11914.0, 5493.0, 2761.0, 1437.0, 749.0, 418.0, 285.0, 180.0, 108.0, 55.0, 36.0, 36.0, 24.0, 8.0, 11.0, 8.0, 8.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-74.6875, -72.3427734375, -69.998046875, -67.6533203125, -65.30859375, -62.9638671875, -60.619140625, -58.2744140625, -55.9296875, -53.5849609375, -51.240234375, -48.8955078125, -46.55078125, -44.2060546875, -41.861328125, -39.5166015625, -37.171875, -34.8271484375, -32.482421875, -30.1376953125, -27.79296875, -25.4482421875, -23.103515625, -20.7587890625, -18.4140625, -16.0693359375, -13.724609375, -11.3798828125, -9.03515625, -6.6904296875, -4.345703125, -2.0009765625, 0.34375, 2.6884765625, 5.033203125, 7.3779296875, 9.72265625, 12.0673828125, 14.412109375, 16.7568359375, 19.1015625, 21.4462890625, 23.791015625, 26.1357421875, 28.48046875, 30.8251953125, 33.169921875, 35.5146484375, 37.859375, 40.2041015625, 42.548828125, 44.8935546875, 47.23828125, 49.5830078125, 51.927734375, 54.2724609375, 56.6171875, 58.9619140625, 61.306640625, 63.6513671875, 65.99609375, 68.3408203125, 70.685546875, 73.0302734375, 75.375]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 8.0, 3.0, 4.0, 9.0, 7.0, 13.0, 18.0, 16.0, 37.0, 29.0, 42.0, 65.0, 105.0, 144.0, 131.0, 96.0, 68.0, 59.0, 34.0, 23.0, 20.0, 22.0, 8.0, 11.0, 14.0, 7.0, 4.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-446.7537841796875, -432.40869140625, -418.0636291503906, -403.7185363769531, -389.37347412109375, -375.02838134765625, -360.68328857421875, -346.3382263183594, -331.9931335449219, -317.6480407714844, -303.302978515625, -288.9578857421875, -274.6128234863281, -260.2677307128906, -245.9226531982422, -231.57757568359375, -217.2324981689453, -202.88742065429688, -188.54234313964844, -174.197265625, -159.8521728515625, -145.50709533691406, -131.16201782226562, -116.81693267822266, -102.47185516357422, -88.12677764892578, -73.78169250488281, -59.436614990234375, -45.09153366088867, -30.74645233154297, -16.40137481689453, -2.0562896728515625, 12.288787841796875, 26.633869171142578, 40.97895050048828, 55.32402801513672, 69.66911315917969, 84.01419067382812, 98.35926818847656, 112.70435333251953, 127.04943084716797, 141.39451599121094, 155.73959350585938, 170.0846710205078, 184.42974853515625, 198.77484130859375, 213.11990356445312, 227.46499633789062, 241.81007385253906, 256.1551513671875, 270.500244140625, 284.8453063964844, 299.1903991699219, 313.53546142578125, 327.88055419921875, 342.22564697265625, 356.5707092285156, 370.9158020019531, 385.2608642578125, 399.60595703125, 413.9510192871094, 428.2961120605469, 442.64117431640625, 456.98626708984375, 471.33135986328125]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 4.0, 5.0, 8.0, 11.0, 12.0, 14.0, 16.0, 16.0, 13.0, 26.0, 26.0, 20.0, 25.0, 32.0, 38.0, 35.0, 48.0, 38.0, 53.0, 37.0, 38.0, 34.0, 39.0, 44.0, 32.0, 52.0, 26.0, 30.0, 31.0, 44.0, 28.0, 17.0, 18.0, 11.0, 13.0, 18.0, 11.0, 6.0, 4.0, 7.0, 5.0, 5.0, 4.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-283.0593566894531, -274.0446472167969, -265.02996826171875, -256.0152587890625, -247.00057983398438, -237.98587036132812, -228.97117614746094, -219.95648193359375, -210.94178771972656, -201.92709350585938, -192.9123992919922, -183.897705078125, -174.88299560546875, -165.86831665039062, -156.85360717773438, -147.8389129638672, -138.82421875, -129.8095245361328, -120.79483032226562, -111.7801284790039, -102.76543426513672, -93.75074005126953, -84.73603820800781, -75.72134399414062, -66.70664978027344, -57.69195556640625, -48.6772575378418, -39.662559509277344, -30.647865295410156, -21.63317108154297, -12.618473052978516, -3.6037750244140625, 5.41094970703125, 14.42564582824707, 23.44034194946289, 32.455039978027344, 41.46973419189453, 50.48442840576172, 59.49912643432617, 68.51382446289062, 77.52851867675781, 86.543212890625, 95.55790710449219, 104.5726089477539, 113.5873031616211, 122.60199737548828, 131.61669921875, 140.6313934326172, 149.64608764648438, 158.66078186035156, 167.67547607421875, 176.69017028808594, 185.70486450195312, 194.71957397460938, 203.73426818847656, 212.74896240234375, 221.76365661621094, 230.77835083007812, 239.7930450439453, 248.8077392578125, 257.82244873046875, 266.8371276855469, 275.8518371582031, 284.86651611328125, 293.8812255859375]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 4.0, 1.0, 5.0, 6.0, 10.0, 15.0, 6.0, 17.0, 19.0, 16.0, 14.0, 26.0, 22.0, 28.0, 21.0, 40.0, 37.0, 47.0, 48.0, 41.0, 49.0, 45.0, 45.0, 40.0, 39.0, 38.0, 44.0, 38.0, 30.0, 28.0, 43.0, 30.0, 20.0, 14.0, 10.0, 13.0, 14.0, 9.0, 6.0, 7.0, 7.0, 2.0, 4.0, 4.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-520.5, -504.046875, -487.59375, -471.140625, -454.6875, -438.234375, -421.78125, -405.328125, -388.875, -372.421875, -355.96875, -339.515625, -323.0625, -306.609375, -290.15625, -273.703125, -257.25, -240.796875, -224.34375, -207.890625, -191.4375, -174.984375, -158.53125, -142.078125, -125.625, -109.171875, -92.71875, -76.265625, -59.8125, -43.359375, -26.90625, -10.453125, 6.0, 22.453125, 38.90625, 55.359375, 71.8125, 88.265625, 104.71875, 121.171875, 137.625, 154.078125, 170.53125, 186.984375, 203.4375, 219.890625, 236.34375, 252.796875, 269.25, 285.703125, 302.15625, 318.609375, 335.0625, 351.515625, 367.96875, 384.421875, 400.875, 417.328125, 433.78125, 450.234375, 466.6875, 483.140625, 499.59375, 516.046875, 532.5]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 6.0, 1.0, 10.0, 13.0, 22.0, 32.0, 36.0, 48.0, 75.0, 113.0, 151.0, 217.0, 268.0, 449.0, 567.0, 857.0, 1153.0, 1691.0, 2406.0, 3543.0, 5058.0, 7446.0, 10813.0, 16692.0, 25385.0, 41282.0, 69844.0, 127106.0, 240968.0, 212120.0, 110619.0, 62207.0, 36922.0, 23075.0, 15331.0, 9992.0, 6746.0, 4593.0, 3139.0, 2275.0, 1584.0, 1046.0, 803.0, 527.0, 416.0, 270.0, 183.0, 142.0, 95.0, 74.0, 46.0, 32.0, 18.0, 25.0, 12.0, 6.0, 4.0, 6.0, 2.0, 4.0, 3.0], "bins": [-27.0, -26.1533203125, -25.306640625, -24.4599609375, -23.61328125, -22.7666015625, -21.919921875, -21.0732421875, -20.2265625, -19.3798828125, -18.533203125, -17.6865234375, -16.83984375, -15.9931640625, -15.146484375, -14.2998046875, -13.453125, -12.6064453125, -11.759765625, -10.9130859375, -10.06640625, -9.2197265625, -8.373046875, -7.5263671875, -6.6796875, -5.8330078125, -4.986328125, -4.1396484375, -3.29296875, -2.4462890625, -1.599609375, -0.7529296875, 0.09375, 0.9404296875, 1.787109375, 2.6337890625, 3.48046875, 4.3271484375, 5.173828125, 6.0205078125, 6.8671875, 7.7138671875, 8.560546875, 9.4072265625, 10.25390625, 11.1005859375, 11.947265625, 12.7939453125, 13.640625, 14.4873046875, 15.333984375, 16.1806640625, 17.02734375, 17.8740234375, 18.720703125, 19.5673828125, 20.4140625, 21.2607421875, 22.107421875, 22.9541015625, 23.80078125, 24.6474609375, 25.494140625, 26.3408203125, 27.1875]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 2.0, 8.0, 2.0, 6.0, 7.0, 8.0, 10.0, 8.0, 13.0, 20.0, 21.0, 23.0, 22.0, 28.0, 26.0, 38.0, 44.0, 30.0, 22.0, 32.0, 43.0, 41.0, 1067.0, 42.0, 51.0, 41.0, 47.0, 36.0, 35.0, 31.0, 34.0, 26.0, 24.0, 25.0, 25.0, 14.0, 16.0, 12.0, 12.0, 4.0, 7.0, 3.0, 4.0, 5.0, 4.0, 1.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-336.5, -326.26171875, -316.0234375, -305.78515625, -295.546875, -285.30859375, -275.0703125, -264.83203125, -254.59375, -244.35546875, -234.1171875, -223.87890625, -213.640625, -203.40234375, -193.1640625, -182.92578125, -172.6875, -162.44921875, -152.2109375, -141.97265625, -131.734375, -121.49609375, -111.2578125, -101.01953125, -90.78125, -80.54296875, -70.3046875, -60.06640625, -49.828125, -39.58984375, -29.3515625, -19.11328125, -8.875, 1.36328125, 11.6015625, 21.83984375, 32.078125, 42.31640625, 52.5546875, 62.79296875, 73.03125, 83.26953125, 93.5078125, 103.74609375, 113.984375, 124.22265625, 134.4609375, 144.69921875, 154.9375, 165.17578125, 175.4140625, 185.65234375, 195.890625, 206.12890625, 216.3671875, 226.60546875, 236.84375, 247.08203125, 257.3203125, 267.55859375, 277.796875, 288.03515625, 298.2734375, 308.51171875, 318.75]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 5.0, 5.0, 13.0, 11.0, 22.0, 25.0, 46.0, 74.0, 105.0, 144.0, 208.0, 249.0, 412.0, 548.0, 752.0, 998.0, 1440.0, 1952.0, 2781.0, 3933.0, 5519.0, 8107.0, 11892.0, 17288.0, 25933.0, 39841.0, 63058.0, 107289.0, 208280.0, 1261416.0, 125841.0, 72031.0, 44866.0, 29353.0, 19358.0, 13124.0, 8949.0, 6242.0, 4291.0, 3075.0, 2127.0, 1570.0, 1141.0, 768.0, 567.0, 440.0, 330.0, 229.0, 164.0, 117.0, 62.0, 58.0, 38.0, 24.0, 13.0, 9.0, 7.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-19.109375, -18.49560546875, -17.8818359375, -17.26806640625, -16.654296875, -16.04052734375, -15.4267578125, -14.81298828125, -14.19921875, -13.58544921875, -12.9716796875, -12.35791015625, -11.744140625, -11.13037109375, -10.5166015625, -9.90283203125, -9.2890625, -8.67529296875, -8.0615234375, -7.44775390625, -6.833984375, -6.22021484375, -5.6064453125, -4.99267578125, -4.37890625, -3.76513671875, -3.1513671875, -2.53759765625, -1.923828125, -1.31005859375, -0.6962890625, -0.08251953125, 0.53125, 1.14501953125, 1.7587890625, 2.37255859375, 2.986328125, 3.60009765625, 4.2138671875, 4.82763671875, 5.44140625, 6.05517578125, 6.6689453125, 7.28271484375, 7.896484375, 8.51025390625, 9.1240234375, 9.73779296875, 10.3515625, 10.96533203125, 11.5791015625, 12.19287109375, 12.806640625, 13.42041015625, 14.0341796875, 14.64794921875, 15.26171875, 15.87548828125, 16.4892578125, 17.10302734375, 17.716796875, 18.33056640625, 18.9443359375, 19.55810546875, 20.171875]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 6.0, 7.0, 8.0, 15.0, 17.0, 21.0, 35.0, 43.0, 45.0, 58.0, 39.0, 58.0, 64.0, 51.0, 73.0, 64.0, 67.0, 52.0, 54.0, 31.0, 41.0, 27.0, 30.0, 21.0, 16.0, 5.0, 13.0, 7.0, 7.0, 5.0, 5.0, 2.0, 1.0, 5.0, 0.0, 2.0, 3.0, 6.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10699462890625, -0.10355663299560547, -0.10011863708496094, -0.0966806411743164, -0.09324264526367188, -0.08980464935302734, -0.08636665344238281, -0.08292865753173828, -0.07949066162109375, -0.07605266571044922, -0.07261466979980469, -0.06917667388916016, -0.06573867797851562, -0.062300682067871094, -0.05886268615722656, -0.05542469024658203, -0.0519866943359375, -0.04854869842529297, -0.04511070251464844, -0.041672706604003906, -0.038234710693359375, -0.034796714782714844, -0.03135871887207031, -0.02792072296142578, -0.02448272705078125, -0.02104473114013672, -0.017606735229492188, -0.014168739318847656, -0.010730743408203125, -0.007292747497558594, -0.0038547515869140625, -0.00041675567626953125, 0.003021240234375, 0.006459236145019531, 0.009897232055664062, 0.013335227966308594, 0.016773223876953125, 0.020211219787597656, 0.023649215698242188, 0.02708721160888672, 0.03052520751953125, 0.03396320343017578, 0.03740119934082031, 0.040839195251464844, 0.044277191162109375, 0.047715187072753906, 0.05115318298339844, 0.05459117889404297, 0.0580291748046875, 0.06146717071533203, 0.06490516662597656, 0.0683431625366211, 0.07178115844726562, 0.07521915435791016, 0.07865715026855469, 0.08209514617919922, 0.08553314208984375, 0.08897113800048828, 0.09240913391113281, 0.09584712982177734, 0.09928512573242188, 0.1027231216430664, 0.10616111755371094, 0.10959911346435547, 0.113037109375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 7.0, 3.0, 8.0, 12.0, 11.0, 18.0, 19.0, 14.0, 28.0, 42.0, 66.0, 76.0, 96.0, 193.0, 365.0, 517.0, 1018.0, 1964.0, 4338.0, 10777.0, 34959.0, 139004.0, 476753.0, 280154.0, 66545.0, 18646.0, 6760.0, 2888.0, 1401.0, 747.0, 412.0, 242.0, 143.0, 87.0, 63.0, 50.0, 37.0, 24.0, 14.0, 12.0, 9.0, 11.0, 4.0, 4.0, 3.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.61376953125, -0.5950241088867188, -0.5762786865234375, -0.5575332641601562, -0.538787841796875, -0.5200424194335938, -0.5012969970703125, -0.48255157470703125, -0.46380615234375, -0.44506072998046875, -0.4263153076171875, -0.40756988525390625, -0.388824462890625, -0.37007904052734375, -0.3513336181640625, -0.33258819580078125, -0.3138427734375, -0.29509735107421875, -0.2763519287109375, -0.25760650634765625, -0.238861083984375, -0.22011566162109375, -0.2013702392578125, -0.18262481689453125, -0.16387939453125, -0.14513397216796875, -0.1263885498046875, -0.10764312744140625, -0.088897705078125, -0.07015228271484375, -0.0514068603515625, -0.03266143798828125, -0.013916015625, 0.00482940673828125, 0.0235748291015625, 0.04232025146484375, 0.061065673828125, 0.07981109619140625, 0.0985565185546875, 0.11730194091796875, 0.13604736328125, 0.15479278564453125, 0.1735382080078125, 0.19228363037109375, 0.211029052734375, 0.22977447509765625, 0.2485198974609375, 0.26726531982421875, 0.2860107421875, 0.30475616455078125, 0.3235015869140625, 0.34224700927734375, 0.360992431640625, 0.37973785400390625, 0.3984832763671875, 0.41722869873046875, 0.43597412109375, 0.45471954345703125, 0.4734649658203125, 0.49221038818359375, 0.510955810546875, 0.5297012329101562, 0.5484466552734375, 0.5671920776367188, 0.5859375]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 6.0, 22.0, 24.0, 44.0, 86.0, 108.0, 133.0, 146.0, 103.0, 90.0, 69.0, 41.0, 32.0, 29.0, 15.0, 18.0, 8.0, 8.0, 5.0, 7.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.07617875933647156, -0.07196757197380066, -0.06775639206171036, -0.06354521214962006, -0.05933402478694916, -0.05512284114956856, -0.05091165751218796, -0.04670047387480736, -0.04248929023742676, -0.03827810660004616, -0.03406692296266556, -0.029855739325284958, -0.025644555687904358, -0.021433372050523758, -0.017222188413143158, -0.013011004775762558, -0.008799821138381958, -0.004588637501001358, -0.00037745386362075806, 0.003833729773759842, 0.008044913411140442, 0.012256097048521042, 0.016467280685901642, 0.020678464323282242, 0.024889647960662842, 0.029100831598043442, 0.03331201523542404, 0.03752319887280464, 0.04173438251018524, 0.04594556614756584, 0.05015674978494644, 0.05436793342232704, 0.05857910215854645, 0.06279028952121735, 0.06700146943330765, 0.07121264934539795, 0.07542383670806885, 0.07963502407073975, 0.08384620398283005, 0.08805738389492035, 0.09226857125759125, 0.09647975862026215, 0.10069093853235245, 0.10490211844444275, 0.10911330580711365, 0.11332449316978455, 0.11753567308187485, 0.12174685299396515, 0.12595804035663605, 0.13016922771930695, 0.13438040018081665, 0.13859158754348755, 0.14280277490615845, 0.14701396226882935, 0.15122514963150024, 0.15543632209300995, 0.15964750945568085, 0.16385869681835175, 0.16806986927986145, 0.17228105664253235, 0.17649224400520325, 0.18070343136787415, 0.18491461873054504, 0.18912579119205475, 0.19333697855472565]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 4.0, 8.0, 3.0, 3.0, 9.0, 6.0, 10.0, 12.0, 16.0, 18.0, 20.0, 18.0, 16.0, 23.0, 35.0, 31.0, 43.0, 29.0, 27.0, 27.0, 35.0, 39.0, 47.0, 37.0, 39.0, 38.0, 36.0, 37.0, 32.0, 45.0, 35.0, 29.0, 34.0, 22.0, 21.0, 24.0, 20.0, 10.0, 8.0, 14.0, 8.0, 7.0, 10.0, 4.0, 4.0, 9.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.06549620628356934, -0.06358537077903748, -0.06167452782392502, -0.05976369231939316, -0.057852853089571, -0.05594201385974884, -0.05403117835521698, -0.05212033912539482, -0.05020949989557266, -0.048298660665750504, -0.046387821435928345, -0.044476985931396484, -0.042566146701574326, -0.04065530747175217, -0.038744471967220306, -0.03683363273739815, -0.03492279350757599, -0.03301195427775383, -0.03110111691057682, -0.02919027954339981, -0.027279440313577652, -0.025368601083755493, -0.023457763716578484, -0.021546926349401474, -0.019636087119579315, -0.017725247889757156, -0.015814410522580147, -0.013903572224080563, -0.011992733925580978, -0.010081895627081394, -0.00817105732858181, -0.006260219030082226, -0.004349380731582642, -0.0024385424330830574, -0.0005277041345834732, 0.001383134163916111, 0.003293972462415695, 0.005204810760915279, 0.007115649059414864, 0.009026487357914448, 0.010937325656414032, 0.012848163954913616, 0.0147590022534132, 0.01666983962059021, 0.01858067885041237, 0.020491518080234528, 0.022402355447411537, 0.024313192814588547, 0.026224032044410706, 0.028134871274232864, 0.030045708641409874, 0.031956546008586884, 0.03386738523840904, 0.0357782244682312, 0.03768905997276306, 0.03959989920258522, 0.04151073843240738, 0.04342157766222954, 0.0453324168920517, 0.04724325239658356, 0.049154091626405716, 0.051064930856227875, 0.052975766360759735, 0.054886605590581894, 0.05679744482040405]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 4.0, 1.0, 5.0, 6.0, 10.0, 15.0, 6.0, 17.0, 19.0, 15.0, 15.0, 26.0, 22.0, 28.0, 21.0, 40.0, 37.0, 47.0, 49.0, 40.0, 49.0, 45.0, 46.0, 39.0, 38.0, 38.0, 45.0, 37.0, 31.0, 28.0, 43.0, 29.0, 20.0, 15.0, 10.0, 13.0, 14.0, 9.0, 6.0, 7.0, 7.0, 2.0, 4.0, 4.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-520.5, -504.046875, -487.59375, -471.140625, -454.6875, -438.234375, -421.78125, -405.328125, -388.875, -372.421875, -355.96875, -339.515625, -323.0625, -306.609375, -290.15625, -273.703125, -257.25, -240.796875, -224.34375, -207.890625, -191.4375, -174.984375, -158.53125, -142.078125, -125.625, -109.171875, -92.71875, -76.265625, -59.8125, -43.359375, -26.90625, -10.453125, 6.0, 22.453125, 38.90625, 55.359375, 71.8125, 88.265625, 104.71875, 121.171875, 137.625, 154.078125, 170.53125, 186.984375, 203.4375, 219.890625, 236.34375, 252.796875, 269.25, 285.703125, 302.15625, 318.609375, 335.0625, 351.515625, 367.96875, 384.421875, 400.875, 417.328125, 433.78125, 450.234375, 466.6875, 483.140625, 499.59375, 516.046875, 532.5]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 5.0, 1.0, 5.0, 6.0, 9.0, 5.0, 14.0, 13.0, 24.0, 37.0, 36.0, 53.0, 70.0, 94.0, 143.0, 185.0, 260.0, 380.0, 596.0, 935.0, 1687.0, 3370.0, 8601.0, 26749.0, 115967.0, 640848.0, 189496.0, 38107.0, 11266.0, 4316.0, 2036.0, 1125.0, 652.0, 417.0, 306.0, 209.0, 148.0, 98.0, 70.0, 57.0, 45.0, 38.0, 21.0, 12.0, 20.0, 7.0, 6.0, 7.0, 5.0, 5.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-97.0, -93.93359375, -90.8671875, -87.80078125, -84.734375, -81.66796875, -78.6015625, -75.53515625, -72.46875, -69.40234375, -66.3359375, -63.26953125, -60.203125, -57.13671875, -54.0703125, -51.00390625, -47.9375, -44.87109375, -41.8046875, -38.73828125, -35.671875, -32.60546875, -29.5390625, -26.47265625, -23.40625, -20.33984375, -17.2734375, -14.20703125, -11.140625, -8.07421875, -5.0078125, -1.94140625, 1.125, 4.19140625, 7.2578125, 10.32421875, 13.390625, 16.45703125, 19.5234375, 22.58984375, 25.65625, 28.72265625, 31.7890625, 34.85546875, 37.921875, 40.98828125, 44.0546875, 47.12109375, 50.1875, 53.25390625, 56.3203125, 59.38671875, 62.453125, 65.51953125, 68.5859375, 71.65234375, 74.71875, 77.78515625, 80.8515625, 83.91796875, 86.984375, 90.05078125, 93.1171875, 96.18359375, 99.25]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 6.0, 10.0, 7.0, 9.0, 11.0, 15.0, 26.0, 31.0, 23.0, 25.0, 27.0, 38.0, 47.0, 48.0, 47.0, 47.0, 2018.0, 137.0, 34.0, 38.0, 57.0, 49.0, 45.0, 47.0, 43.0, 29.0, 24.0, 32.0, 12.0, 21.0, 12.0, 7.0, 4.0, 4.0, 5.0, 4.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-626.5, -604.0234375, -581.546875, -559.0703125, -536.59375, -514.1171875, -491.640625, -469.1640625, -446.6875, -424.2109375, -401.734375, -379.2578125, -356.78125, -334.3046875, -311.828125, -289.3515625, -266.875, -244.3984375, -221.921875, -199.4453125, -176.96875, -154.4921875, -132.015625, -109.5390625, -87.0625, -64.5859375, -42.109375, -19.6328125, 2.84375, 25.3203125, 47.796875, 70.2734375, 92.75, 115.2265625, 137.703125, 160.1796875, 182.65625, 205.1328125, 227.609375, 250.0859375, 272.5625, 295.0390625, 317.515625, 339.9921875, 362.46875, 384.9453125, 407.421875, 429.8984375, 452.375, 474.8515625, 497.328125, 519.8046875, 542.28125, 564.7578125, 587.234375, 609.7109375, 632.1875, 654.6640625, 677.140625, 699.6171875, 722.09375, 744.5703125, 767.046875, 789.5234375, 812.0]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 0.0, 1.0, 4.0, 3.0, 5.0, 5.0, 12.0, 8.0, 12.0, 16.0, 23.0, 33.0, 50.0, 55.0, 84.0, 103.0, 170.0, 231.0, 329.0, 502.0, 886.0, 1677.0, 4315.0, 17994.0, 139190.0, 2841737.0, 114873.0, 15427.0, 4029.0, 1590.0, 838.0, 465.0, 319.0, 198.0, 162.0, 103.0, 74.0, 53.0, 42.0, 32.0, 18.0, 14.0, 7.0, 6.0, 4.0, 4.0, 2.0, 4.0, 2.0, 4.0, 1.0, 2.0], "bins": [-142.25, -138.4521484375, -134.654296875, -130.8564453125, -127.05859375, -123.2607421875, -119.462890625, -115.6650390625, -111.8671875, -108.0693359375, -104.271484375, -100.4736328125, -96.67578125, -92.8779296875, -89.080078125, -85.2822265625, -81.484375, -77.6865234375, -73.888671875, -70.0908203125, -66.29296875, -62.4951171875, -58.697265625, -54.8994140625, -51.1015625, -47.3037109375, -43.505859375, -39.7080078125, -35.91015625, -32.1123046875, -28.314453125, -24.5166015625, -20.71875, -16.9208984375, -13.123046875, -9.3251953125, -5.52734375, -1.7294921875, 2.068359375, 5.8662109375, 9.6640625, 13.4619140625, 17.259765625, 21.0576171875, 24.85546875, 28.6533203125, 32.451171875, 36.2490234375, 40.046875, 43.8447265625, 47.642578125, 51.4404296875, 55.23828125, 59.0361328125, 62.833984375, 66.6318359375, 70.4296875, 74.2275390625, 78.025390625, 81.8232421875, 85.62109375, 89.4189453125, 93.216796875, 97.0146484375, 100.8125]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 8.0, 4.0, 6.0, 14.0, 33.0, 94.0, 280.0, 334.0, 151.0, 45.0, 17.0, 6.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3685.001220703125, -3614.29296875, -3543.5849609375, -3472.876708984375, -3402.16845703125, -3331.460205078125, -3260.752197265625, -3190.0439453125, -3119.335693359375, -3048.62744140625, -2977.91943359375, -2907.211181640625, -2836.5029296875, -2765.794677734375, -2695.086669921875, -2624.37841796875, -2553.67041015625, -2482.962158203125, -2412.254150390625, -2341.5458984375, -2270.837646484375, -2200.12939453125, -2129.42138671875, -2058.713134765625, -1988.0048828125, -1917.2967529296875, -1846.5885009765625, -1775.88037109375, -1705.172119140625, -1634.4639892578125, -1563.755859375, -1493.047607421875, -1422.3394775390625, -1351.63134765625, -1280.923095703125, -1210.2149658203125, -1139.5067138671875, -1068.798583984375, -998.0903930664062, -927.3822021484375, -856.6740112304688, -785.9658203125, -715.2576293945312, -644.5494384765625, -573.84130859375, -503.1330871582031, -432.4249267578125, -361.71673583984375, -291.008544921875, -220.30035400390625, -149.59217834472656, -78.88400268554688, -8.175811767578125, 62.532379150390625, 133.24053955078125, 203.94873046875, 274.65692138671875, 345.3651123046875, 416.07330322265625, 486.7814636230469, 557.4896240234375, 628.1978759765625, 698.906005859375, 769.6141967773438, 840.3223876953125]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 4.0, 3.0, 3.0, 6.0, 6.0, 8.0, 6.0, 11.0, 9.0, 26.0, 19.0, 34.0, 25.0, 36.0, 46.0, 45.0, 38.0, 39.0, 43.0, 44.0, 39.0, 40.0, 48.0, 48.0, 41.0, 43.0, 40.0, 43.0, 29.0, 30.0, 20.0, 19.0, 16.0, 17.0, 13.0, 12.0, 13.0, 7.0, 5.0, 4.0, 11.0, 8.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-780.2860107421875, -751.8855590820312, -723.485107421875, -695.0846557617188, -666.6842041015625, -638.2838134765625, -609.8833618164062, -581.48291015625, -553.0824584960938, -524.6820068359375, -496.28155517578125, -467.8811340332031, -439.4806823730469, -411.0802307128906, -382.6798095703125, -354.27935791015625, -325.87890625, -297.47845458984375, -269.0780029296875, -240.67758178710938, -212.27713012695312, -183.87667846679688, -155.4762420654297, -127.0758056640625, -98.67535400390625, -70.27490997314453, -41.87446594238281, -13.474021911621094, 14.926422119140625, 43.326873779296875, 71.72731018066406, 100.12774658203125, 128.5281982421875, 156.92864990234375, 185.32908630371094, 213.72952270507812, 242.12997436523438, 270.5304260253906, 298.93084716796875, 327.331298828125, 355.73175048828125, 384.1322021484375, 412.53265380859375, 440.9330749511719, 469.3335266113281, 497.7339782714844, 526.1343994140625, 554.5348510742188, 582.935302734375, 611.3357543945312, 639.7362060546875, 668.1366577148438, 696.537109375, 724.9375, 753.3379516601562, 781.7384033203125, 810.1388549804688, 838.539306640625, 866.9397583007812, 895.3402099609375, 923.7406005859375, 952.14111328125, 980.54150390625, 1008.9419555664062, 1037.3424072265625]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 0.0, 3.0, 0.0, 6.0, 4.0, 4.0, 7.0, 9.0, 5.0, 20.0, 13.0, 15.0, 21.0, 24.0, 20.0, 22.0, 34.0, 35.0, 52.0, 89.0, 168.0, 294.0, 553.0, 1162.0, 1041946.0, 1808.0, 988.0, 485.0, 251.0, 150.0, 80.0, 49.0, 38.0, 39.0, 24.0, 22.0, 22.0, 18.0, 13.0, 14.0, 10.0, 8.0, 5.0, 8.0, 3.0, 4.0, 4.0, 4.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-451.31146240234375, -437.1623840332031, -423.0133361816406, -408.8642578125, -394.7151794433594, -380.56610107421875, -366.41705322265625, -352.2679748535156, -338.118896484375, -323.9698181152344, -309.8207702636719, -295.67169189453125, -281.5226135253906, -267.37353515625, -253.2244873046875, -239.07540893554688, -224.92636108398438, -210.7772979736328, -196.6282196044922, -182.47915649414062, -168.330078125, -154.18101501464844, -140.03195190429688, -125.88288116455078, -111.73381042480469, -97.5847396850586, -83.4356689453125, -69.28660583496094, -55.137535095214844, -40.98846435546875, -26.839401245117188, -12.690330505371094, 1.458740234375, 15.607809066772461, 29.756877899169922, 43.90594482421875, 58.055015563964844, 72.20408630371094, 86.3531494140625, 100.5022201538086, 114.65129089355469, 128.80035400390625, 142.94943237304688, 157.09849548339844, 171.24755859375, 185.39663696289062, 199.5457000732422, 213.69476318359375, 227.84384155273438, 241.99290466308594, 256.1419677734375, 270.2910461425781, 284.44012451171875, 298.58917236328125, 312.7382507324219, 326.8873291015625, 341.036376953125, 355.1854553222656, 369.3345031738281, 383.48358154296875, 397.6326599121094, 411.78173828125, 425.9307861328125, 440.0798645019531, 454.22894287109375]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 3.0, 7.0, 11.0, 16.0, 23.0, 24.0, 61.0, 182.0, 1149.0, 51460976.0, 477.0, 113.0, 44.0, 15.0, 10.0, 11.0, 4.0, 1.0, 2.0, 2.0, 0.0, 5.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3681.113525390625, -3559.976318359375, -3438.83935546875, -3317.7021484375, -3196.56494140625, -3075.427734375, -2954.29052734375, -2833.153564453125, -2712.016357421875, -2590.879150390625, -2469.7421875, -2348.60498046875, -2227.4677734375, -2106.33056640625, -1985.1934814453125, -1864.056396484375, -1742.919189453125, -1621.781982421875, -1500.6448974609375, -1379.5078125, -1258.37060546875, -1137.2333984375, -1016.0963134765625, -894.9591674804688, -773.822021484375, -652.6848754882812, -531.5477294921875, -410.41058349609375, -289.2734375, -168.13629150390625, -46.9991455078125, 74.13800048828125, 195.275390625, 316.41253662109375, 437.5496826171875, 558.6868286132812, 679.823974609375, 800.9611206054688, 922.0982666015625, 1043.2353515625, 1164.37255859375, 1285.509765625, 1406.6468505859375, 1527.783935546875, 1648.921142578125, 1770.058349609375, 1891.1954345703125, 2012.33251953125, 2133.4697265625, 2254.60693359375, 2375.744140625, 2496.881103515625, 2618.018310546875, 2739.155517578125, 2860.29248046875, 2981.4296875, 3102.56689453125, 3223.7041015625, 3344.84130859375, 3465.978271484375, 3587.115478515625, 3708.252685546875, 3829.3896484375, 3950.52685546875, 4071.6640625]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 7.0, 11.0, 17.0, 17.0, 21.0, 46.0, 79.0, 103.0, 165.0, 204.0, 324.0, 502.0, 767.0, 1043.0, 1531.0, 2345.0, 3402.0, 5015.0, 7283.0, 10586.0, 15626.0, 23421.0, 34335.0, 52150.0, 79041.0, 125825.0, 213365.0, 393452.0, 3722641.0, 779755.0, 322017.0, 180537.0, 109051.0, 68945.0, 45186.0, 29803.0, 19891.0, 13851.0, 9064.0, 6287.0, 4326.0, 2982.0, 2059.0, 1407.0, 961.0, 640.0, 452.0, 318.0, 199.0, 127.0, 86.0, 55.0, 47.0, 27.0, 18.0, 12.0, 7.0, 4.0, 4.0, 5.0], "bins": [-8.6796875, -8.4154052734375, -8.151123046875, -7.8868408203125, -7.62255859375, -7.3582763671875, -7.093994140625, -6.8297119140625, -6.5654296875, -6.3011474609375, -6.036865234375, -5.7725830078125, -5.50830078125, -5.2440185546875, -4.979736328125, -4.7154541015625, -4.451171875, -4.1868896484375, -3.922607421875, -3.6583251953125, -3.39404296875, -3.1297607421875, -2.865478515625, -2.6011962890625, -2.3369140625, -2.0726318359375, -1.808349609375, -1.5440673828125, -1.27978515625, -1.0155029296875, -0.751220703125, -0.4869384765625, -0.22265625, 0.0416259765625, 0.305908203125, 0.5701904296875, 0.83447265625, 1.0987548828125, 1.363037109375, 1.6273193359375, 1.8916015625, 2.1558837890625, 2.420166015625, 2.6844482421875, 2.94873046875, 3.2130126953125, 3.477294921875, 3.7415771484375, 4.005859375, 4.2701416015625, 4.534423828125, 4.7987060546875, 5.06298828125, 5.3272705078125, 5.591552734375, 5.8558349609375, 6.1201171875, 6.3843994140625, 6.648681640625, 6.9129638671875, 7.17724609375, 7.4415283203125, 7.705810546875, 7.9700927734375, 8.234375]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 4.0, 7.0, 14.0, 6.0, 10.0, 10.0, 12.0, 17.0, 23.0, 19.0, 19.0, 17.0, 26.0, 28.0, 25.0, 30.0, 24.0, 31.0, 36.0, 34.0, 40.0, 34.0, 749.0, 362.0, 47.0, 40.0, 33.0, 42.0, 30.0, 31.0, 26.0, 30.0, 23.0, 16.0, 26.0, 21.0, 14.0, 13.0, 15.0, 8.0, 10.0, 5.0, 9.0, 2.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-113.125, -109.689453125, -106.25390625, -102.818359375, -99.3828125, -95.947265625, -92.51171875, -89.076171875, -85.640625, -82.205078125, -78.76953125, -75.333984375, -71.8984375, -68.462890625, -65.02734375, -61.591796875, -58.15625, -54.720703125, -51.28515625, -47.849609375, -44.4140625, -40.978515625, -37.54296875, -34.107421875, -30.671875, -27.236328125, -23.80078125, -20.365234375, -16.9296875, -13.494140625, -10.05859375, -6.623046875, -3.1875, 0.248046875, 3.68359375, 7.119140625, 10.5546875, 13.990234375, 17.42578125, 20.861328125, 24.296875, 27.732421875, 31.16796875, 34.603515625, 38.0390625, 41.474609375, 44.91015625, 48.345703125, 51.78125, 55.216796875, 58.65234375, 62.087890625, 65.5234375, 68.958984375, 72.39453125, 75.830078125, 79.265625, 82.701171875, 86.13671875, 89.572265625, 93.0078125, 96.443359375, 99.87890625, 103.314453125, 106.75]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 8.0, 5.0, 14.0, 19.0, 20.0, 36.0, 51.0, 100.0, 150.0, 222.0, 384.0, 548.0, 793.0, 1179.0, 1847.0, 2678.0, 4094.0, 6282.0, 9472.0, 14530.0, 22500.0, 35155.0, 56193.0, 91646.0, 152174.0, 263524.0, 454771.0, 3695626.0, 643998.0, 334211.0, 192408.0, 114311.0, 69575.0, 43432.0, 27706.0, 17784.0, 11565.0, 7807.0, 4946.0, 3250.0, 2146.0, 1421.0, 928.0, 652.0, 446.0, 298.0, 188.0, 121.0, 85.0, 58.0, 30.0, 24.0, 15.0, 8.0, 4.0, 8.0, 1.0, 1.0, 0.0, 2.0], "bins": [-7.9140625, -7.66455078125, -7.4150390625, -7.16552734375, -6.916015625, -6.66650390625, -6.4169921875, -6.16748046875, -5.91796875, -5.66845703125, -5.4189453125, -5.16943359375, -4.919921875, -4.67041015625, -4.4208984375, -4.17138671875, -3.921875, -3.67236328125, -3.4228515625, -3.17333984375, -2.923828125, -2.67431640625, -2.4248046875, -2.17529296875, -1.92578125, -1.67626953125, -1.4267578125, -1.17724609375, -0.927734375, -0.67822265625, -0.4287109375, -0.17919921875, 0.0703125, 0.31982421875, 0.5693359375, 0.81884765625, 1.068359375, 1.31787109375, 1.5673828125, 1.81689453125, 2.06640625, 2.31591796875, 2.5654296875, 2.81494140625, 3.064453125, 3.31396484375, 3.5634765625, 3.81298828125, 4.0625, 4.31201171875, 4.5615234375, 4.81103515625, 5.060546875, 5.31005859375, 5.5595703125, 5.80908203125, 6.05859375, 6.30810546875, 6.5576171875, 6.80712890625, 7.056640625, 7.30615234375, 7.5556640625, 7.80517578125, 8.0546875]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 3.0, 2.0, 5.0, 5.0, 7.0, 11.0, 10.0, 9.0, 17.0, 15.0, 18.0, 22.0, 27.0, 24.0, 26.0, 34.0, 30.0, 45.0, 34.0, 43.0, 43.0, 129.0, 974.0, 46.0, 46.0, 51.0, 32.0, 31.0, 43.0, 29.0, 28.0, 32.0, 30.0, 19.0, 22.0, 14.0, 16.0, 13.0, 8.0, 12.0, 9.0, 4.0, 1.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.375, -81.4912109375, -78.607421875, -75.7236328125, -72.83984375, -69.9560546875, -67.072265625, -64.1884765625, -61.3046875, -58.4208984375, -55.537109375, -52.6533203125, -49.76953125, -46.8857421875, -44.001953125, -41.1181640625, -38.234375, -35.3505859375, -32.466796875, -29.5830078125, -26.69921875, -23.8154296875, -20.931640625, -18.0478515625, -15.1640625, -12.2802734375, -9.396484375, -6.5126953125, -3.62890625, -0.7451171875, 2.138671875, 5.0224609375, 7.90625, 10.7900390625, 13.673828125, 16.5576171875, 19.44140625, 22.3251953125, 25.208984375, 28.0927734375, 30.9765625, 33.8603515625, 36.744140625, 39.6279296875, 42.51171875, 45.3955078125, 48.279296875, 51.1630859375, 54.046875, 56.9306640625, 59.814453125, 62.6982421875, 65.58203125, 68.4658203125, 71.349609375, 74.2333984375, 77.1171875, 80.0009765625, 82.884765625, 85.7685546875, 88.65234375, 91.5361328125, 94.419921875, 97.3037109375, 100.1875]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 3.0, 4.0, 3.0, 0.0, 0.0, 8.0, 11.0, 7.0, 15.0, 26.0, 25.0, 35.0, 53.0, 62.0, 97.0, 106.0, 133.0, 185.0, 309.0, 407.0, 560.0, 870.0, 1255.0, 2018.0, 3478.0, 5630.0, 9888.0, 17078.0, 31388.0, 59766.0, 130299.0, 5716849.0, 160701.0, 67949.0, 35339.0, 19260.0, 10944.0, 6215.0, 3718.0, 2228.0, 1493.0, 876.0, 609.0, 385.0, 321.0, 212.0, 146.0, 137.0, 99.0, 73.0, 43.0, 34.0, 32.0, 16.0, 15.0, 11.0, 7.0, 5.0, 4.0, 7.0, 1.0, 3.0, 2.0], "bins": [-21.015625, -20.370849609375, -19.72607421875, -19.081298828125, -18.4365234375, -17.791748046875, -17.14697265625, -16.502197265625, -15.857421875, -15.212646484375, -14.56787109375, -13.923095703125, -13.2783203125, -12.633544921875, -11.98876953125, -11.343994140625, -10.69921875, -10.054443359375, -9.40966796875, -8.764892578125, -8.1201171875, -7.475341796875, -6.83056640625, -6.185791015625, -5.541015625, -4.896240234375, -4.25146484375, -3.606689453125, -2.9619140625, -2.317138671875, -1.67236328125, -1.027587890625, -0.3828125, 0.261962890625, 0.90673828125, 1.551513671875, 2.1962890625, 2.841064453125, 3.48583984375, 4.130615234375, 4.775390625, 5.420166015625, 6.06494140625, 6.709716796875, 7.3544921875, 7.999267578125, 8.64404296875, 9.288818359375, 9.93359375, 10.578369140625, 11.22314453125, 11.867919921875, 12.5126953125, 13.157470703125, 13.80224609375, 14.447021484375, 15.091796875, 15.736572265625, 16.38134765625, 17.026123046875, 17.6708984375, 18.315673828125, 18.96044921875, 19.605224609375, 20.25]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 7.0, 8.0, 3.0, 18.0, 8.0, 9.0, 13.0, 9.0, 18.0, 21.0, 28.0, 33.0, 31.0, 31.0, 34.0, 37.0, 35.0, 30.0, 38.0, 66.0, 1013.0, 80.0, 39.0, 37.0, 44.0, 32.0, 37.0, 40.0, 38.0, 31.0, 20.0, 23.0, 22.0, 19.0, 11.0, 12.0, 3.0, 10.0, 13.0, 5.0, 7.0, 2.0, 5.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.875, -64.6064453125, -62.337890625, -60.0693359375, -57.80078125, -55.5322265625, -53.263671875, -50.9951171875, -48.7265625, -46.4580078125, -44.189453125, -41.9208984375, -39.65234375, -37.3837890625, -35.115234375, -32.8466796875, -30.578125, -28.3095703125, -26.041015625, -23.7724609375, -21.50390625, -19.2353515625, -16.966796875, -14.6982421875, -12.4296875, -10.1611328125, -7.892578125, -5.6240234375, -3.35546875, -1.0869140625, 1.181640625, 3.4501953125, 5.71875, 7.9873046875, 10.255859375, 12.5244140625, 14.79296875, 17.0615234375, 19.330078125, 21.5986328125, 23.8671875, 26.1357421875, 28.404296875, 30.6728515625, 32.94140625, 35.2099609375, 37.478515625, 39.7470703125, 42.015625, 44.2841796875, 46.552734375, 48.8212890625, 51.08984375, 53.3583984375, 55.626953125, 57.8955078125, 60.1640625, 62.4326171875, 64.701171875, 66.9697265625, 69.23828125, 71.5068359375, 73.775390625, 76.0439453125, 78.3125]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 15.0, 32.0, 76.0, 260.0, 423.0, 116.0, 47.0, 25.0, 6.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-498.89581298828125, -487.05743408203125, -475.2190856933594, -463.3807067871094, -451.5423583984375, -439.7039794921875, -427.8656311035156, -416.0272521972656, -404.18890380859375, -392.35052490234375, -380.5121765136719, -368.6737976074219, -356.83544921875, -344.9970703125, -333.1587219238281, -321.3203430175781, -309.48199462890625, -297.64361572265625, -285.8052673339844, -273.9668884277344, -262.1285400390625, -250.29017639160156, -238.45181274414062, -226.61343383789062, -214.77505493164062, -202.9366912841797, -191.09832763671875, -179.2599639892578, -167.42160034179688, -155.58323669433594, -143.744873046875, -131.906494140625, -120.06814575195312, -108.22978210449219, -96.39141845703125, -84.55305480957031, -72.71469116210938, -60.87632369995117, -49.03795623779297, -37.19959259033203, -25.361228942871094, -13.52286434173584, -1.684499740600586, 10.153865814208984, 21.992229461669922, 33.83059310913086, 45.66896057128906, 57.50732421875, 69.34568786621094, 81.18405151367188, 93.02241516113281, 104.86077880859375, 116.69914245605469, 128.53750610351562, 140.37588500976562, 152.2142333984375, 164.0526123046875, 175.89097595214844, 187.72933959960938, 199.5677032470703, 211.40606689453125, 223.2444305419922, 235.08279418945312, 246.92117309570312, 258.759521484375]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 4.0, 6.0, 10.0, 8.0, 10.0, 12.0, 8.0, 10.0, 19.0, 23.0, 13.0, 27.0, 26.0, 25.0, 32.0, 29.0, 39.0, 41.0, 35.0, 44.0, 44.0, 38.0, 46.0, 58.0, 43.0, 35.0, 38.0, 37.0, 23.0, 21.0, 27.0, 27.0, 19.0, 25.0, 17.0, 16.0, 17.0, 13.0, 10.0, 10.0, 10.0, 5.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-171.00814819335938, -166.32424926757812, -161.64035034179688, -156.95645141601562, -152.27255249023438, -147.5886688232422, -142.90476989746094, -138.2208709716797, -133.53697204589844, -128.8530731201172, -124.16917419433594, -119.48528289794922, -114.80138397216797, -110.11748504638672, -105.43359375, -100.74969482421875, -96.0657958984375, -91.38189697265625, -86.697998046875, -82.01410675048828, -77.33020782470703, -72.64630889892578, -67.96241760253906, -63.27851867675781, -58.59461975097656, -53.91072082519531, -49.22682571411133, -44.542930603027344, -39.859031677246094, -35.175132751464844, -30.49123764038086, -25.807342529296875, -21.123458862304688, -16.43956184387207, -11.755664825439453, -7.071767807006836, -2.3878707885742188, 2.2960262298583984, 6.979923248291016, 11.663818359375, 16.34771728515625, 21.031614303588867, 25.715511322021484, 30.3994083404541, 35.08330535888672, 39.76720428466797, 44.45109939575195, 49.13499450683594, 53.81889343261719, 58.50279235839844, 63.18668746948242, 67.8705825805664, 72.55448150634766, 77.2383804321289, 81.92227172851562, 86.60617065429688, 91.29006958007812, 95.97396850585938, 100.65786743164062, 105.34175872802734, 110.0256576538086, 114.70955657958984, 119.39344787597656, 124.07734680175781, 128.76124572753906]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 3.0, 6.0, 4.0, 1.0, 2.0, 9.0, 5.0, 9.0, 7.0, 18.0, 14.0, 15.0, 33.0, 34.0, 35.0, 47.0, 64.0, 75.0, 110.0, 156.0, 189.0, 288.0, 430.0, 618.0, 964.0, 1570.0, 3066.0, 7250.0, 30568.0, 4088915.0, 44389.0, 7998.0, 2957.0, 1581.0, 944.0, 581.0, 414.0, 241.0, 197.0, 127.0, 97.0, 75.0, 52.0, 29.0, 31.0, 16.0, 17.0, 12.0, 8.0, 6.0, 4.0, 2.0, 5.0, 2.0, 3.0], "bins": [-3.162109375, -3.08013916015625, -2.9981689453125, -2.91619873046875, -2.834228515625, -2.75225830078125, -2.6702880859375, -2.58831787109375, -2.50634765625, -2.42437744140625, -2.3424072265625, -2.26043701171875, -2.178466796875, -2.09649658203125, -2.0145263671875, -1.93255615234375, -1.8505859375, -1.76861572265625, -1.6866455078125, -1.60467529296875, -1.522705078125, -1.44073486328125, -1.3587646484375, -1.27679443359375, -1.19482421875, -1.11285400390625, -1.0308837890625, -0.94891357421875, -0.866943359375, -0.78497314453125, -0.7030029296875, -0.62103271484375, -0.5390625, -0.45709228515625, -0.3751220703125, -0.29315185546875, -0.211181640625, -0.12921142578125, -0.0472412109375, 0.03472900390625, 0.11669921875, 0.19866943359375, 0.2806396484375, 0.36260986328125, 0.444580078125, 0.52655029296875, 0.6085205078125, 0.69049072265625, 0.7724609375, 0.85443115234375, 0.9364013671875, 1.01837158203125, 1.100341796875, 1.18231201171875, 1.2642822265625, 1.34625244140625, 1.42822265625, 1.51019287109375, 1.5921630859375, 1.67413330078125, 1.756103515625, 1.83807373046875, 1.9200439453125, 2.00201416015625, 2.083984375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 8.0, 6.0, 4.0, 4.0, 2.0, 8.0, 5.0, 14.0, 12.0, 9.0, 26.0, 727.0, 77.0, 20.0, 23.0, 6.0, 6.0, 6.0, 8.0, 7.0, 3.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.99609375, -0.9704437255859375, -0.944793701171875, -0.9191436767578125, -0.89349365234375, -0.8678436279296875, -0.842193603515625, -0.8165435791015625, -0.7908935546875, -0.7652435302734375, -0.739593505859375, -0.7139434814453125, -0.68829345703125, -0.6626434326171875, -0.636993408203125, -0.6113433837890625, -0.585693359375, -0.5600433349609375, -0.534393310546875, -0.5087432861328125, -0.48309326171875, -0.4574432373046875, -0.431793212890625, -0.4061431884765625, -0.3804931640625, -0.3548431396484375, -0.329193115234375, -0.3035430908203125, -0.27789306640625, -0.2522430419921875, -0.226593017578125, -0.2009429931640625, -0.17529296875, -0.1496429443359375, -0.123992919921875, -0.0983428955078125, -0.07269287109375, -0.0470428466796875, -0.021392822265625, 0.0042572021484375, 0.0299072265625, 0.0555572509765625, 0.081207275390625, 0.1068572998046875, 0.13250732421875, 0.1581573486328125, 0.183807373046875, 0.2094573974609375, 0.235107421875, 0.2607574462890625, 0.286407470703125, 0.3120574951171875, 0.33770751953125, 0.3633575439453125, 0.389007568359375, 0.4146575927734375, 0.4403076171875, 0.4659576416015625, 0.491607666015625, 0.5172576904296875, 0.54290771484375, 0.5685577392578125, 0.594207763671875, 0.6198577880859375, 0.6455078125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 9.0, 4.0, 6.0, 14.0, 9.0, 19.0, 34.0, 41.0, 44.0, 79.0, 145.0, 182.0, 362.0, 502.0, 879.0, 1356.0, 2487.0, 4572.0, 9979.0, 26473.0, 160955.0, 3793198.0, 147147.0, 26041.0, 9552.0, 4540.0, 2358.0, 1311.0, 796.0, 432.0, 290.0, 167.0, 117.0, 68.0, 43.0, 27.0, 18.0, 16.0, 6.0, 5.0, 4.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.212890625, -2.1522369384765625, -2.091583251953125, -2.0309295654296875, -1.97027587890625, -1.9096221923828125, -1.848968505859375, -1.7883148193359375, -1.7276611328125, -1.6670074462890625, -1.606353759765625, -1.5457000732421875, -1.48504638671875, -1.4243927001953125, -1.363739013671875, -1.3030853271484375, -1.242431640625, -1.1817779541015625, -1.121124267578125, -1.0604705810546875, -0.99981689453125, -0.9391632080078125, -0.878509521484375, -0.8178558349609375, -0.7572021484375, -0.6965484619140625, -0.635894775390625, -0.5752410888671875, -0.51458740234375, -0.4539337158203125, -0.393280029296875, -0.3326263427734375, -0.27197265625, -0.2113189697265625, -0.150665283203125, -0.0900115966796875, -0.02935791015625, 0.0312957763671875, 0.091949462890625, 0.1526031494140625, 0.2132568359375, 0.2739105224609375, 0.334564208984375, 0.3952178955078125, 0.45587158203125, 0.5165252685546875, 0.577178955078125, 0.6378326416015625, 0.698486328125, 0.7591400146484375, 0.819793701171875, 0.8804473876953125, 0.94110107421875, 1.0017547607421875, 1.062408447265625, 1.1230621337890625, 1.1837158203125, 1.2443695068359375, 1.305023193359375, 1.3656768798828125, 1.42633056640625, 1.4869842529296875, 1.547637939453125, 1.6082916259765625, 1.6689453125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 10.0, 6.0, 9.0, 13.0, 12.0, 14.0, 12.0, 33.0, 51.0, 134.0, 323.0, 2206.0, 818.0, 157.0, 75.0, 62.0, 33.0, 15.0, 20.0, 6.0, 8.0, 6.0, 5.0, 4.0, 6.0, 5.0, 3.0, 1.0, 0.0, 2.0, 3.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.150390625, -1.1173095703125, -1.084228515625, -1.0511474609375, -1.01806640625, -0.9849853515625, -0.951904296875, -0.9188232421875, -0.8857421875, -0.8526611328125, -0.819580078125, -0.7864990234375, -0.75341796875, -0.7203369140625, -0.687255859375, -0.6541748046875, -0.62109375, -0.5880126953125, -0.554931640625, -0.5218505859375, -0.48876953125, -0.4556884765625, -0.422607421875, -0.3895263671875, -0.3564453125, -0.3233642578125, -0.290283203125, -0.2572021484375, -0.22412109375, -0.1910400390625, -0.157958984375, -0.1248779296875, -0.091796875, -0.0587158203125, -0.025634765625, 0.0074462890625, 0.04052734375, 0.0736083984375, 0.106689453125, 0.1397705078125, 0.1728515625, 0.2059326171875, 0.239013671875, 0.2720947265625, 0.30517578125, 0.3382568359375, 0.371337890625, 0.4044189453125, 0.4375, 0.4705810546875, 0.503662109375, 0.5367431640625, 0.56982421875, 0.6029052734375, 0.635986328125, 0.6690673828125, 0.7021484375, 0.7352294921875, 0.768310546875, 0.8013916015625, 0.83447265625, 0.8675537109375, 0.900634765625, 0.9337158203125, 0.966796875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 8.0, 6.0, 16.0, 62.0, 312.0, 430.0, 121.0, 37.0, 9.0, 6.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.919100284576416, -6.682254791259766, -6.445409774780273, -6.208564758300781, -5.971719264984131, -5.7348737716674805, -5.498028755187988, -5.261183738708496, -5.024338245391846, -4.787492752075195, -4.550647735595703, -4.313802719116211, -4.0769572257995605, -3.8401119709014893, -3.603266716003418, -3.3664214611053467, -3.1295762062072754, -2.892730951309204, -2.655885696411133, -2.4190404415130615, -2.1821951866149902, -1.945349931716919, -1.7085046768188477, -1.4716594219207764, -1.234814167022705, -0.9979689121246338, -0.7611236572265625, -0.5242784023284912, -0.2874331474304199, -0.05058789253234863, 0.18625736236572266, 0.42310261726379395, 0.6599483489990234, 0.8967936038970947, 1.133638858795166, 1.3704841136932373, 1.6073293685913086, 1.8441746234893799, 2.081019878387451, 2.3178651332855225, 2.5547103881835938, 2.791555643081665, 3.0284008979797363, 3.2652461528778076, 3.502091407775879, 3.73893666267395, 3.9757819175720215, 4.212627410888672, 4.449472427368164, 4.686317443847656, 4.923162937164307, 5.160008430480957, 5.396853446960449, 5.633698463439941, 5.870543956756592, 6.107389450073242, 6.344234466552734, 6.581079483032227, 6.817924976348877, 7.054770469665527, 7.2916154861450195, 7.528460502624512, 7.765305995941162, 8.002151489257812, 8.238996505737305]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 3.0, 5.0, 7.0, 2.0, 2.0, 5.0, 10.0, 9.0, 18.0, 20.0, 21.0, 38.0, 50.0, 54.0, 65.0, 86.0, 94.0, 98.0, 67.0, 79.0, 65.0, 42.0, 45.0, 21.0, 20.0, 10.0, 12.0, 11.0, 7.0, 7.0, 3.0, 7.0, 6.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9708611965179443, -2.8577542304992676, -2.744647264480591, -2.631540298461914, -2.518433094024658, -2.4053263664245605, -2.2922191619873047, -2.179112195968628, -2.066005229949951, -1.9528982639312744, -1.8397912979125977, -1.7266842126846313, -1.6135772466659546, -1.5004702806472778, -1.3873631954193115, -1.2742562294006348, -1.161149263381958, -1.0480422973632812, -0.9349352717399597, -0.8218282461166382, -0.7087212800979614, -0.5956143140792847, -0.48250728845596313, -0.3694002628326416, -0.25629329681396484, -0.1431863009929657, -0.030079305171966553, 0.08302769064903259, 0.19613468647003174, 0.3092416524887085, 0.42234867811203003, 0.5354557037353516, 0.6485629081726074, 0.7616698741912842, 0.8747768998146057, 0.9878839254379272, 1.100990891456604, 1.2140978574752808, 1.327204942703247, 1.4403119087219238, 1.5534188747406006, 1.6665258407592773, 1.779632806777954, 1.8927398920059204, 2.0058469772338867, 2.1189537048339844, 2.2320609092712402, 2.345167875289917, 2.4582748413085938, 2.5713818073272705, 2.6844887733459473, 2.797595739364624, 2.910702705383301, 3.0238099098205566, 3.1369168758392334, 3.25002384185791, 3.363130807876587, 3.4762377738952637, 3.5893447399139404, 3.702451705932617, 3.815558910369873, 3.9286656379699707, 4.041772842407227, 4.154879570007324, 4.26798677444458]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 6.0, 6.0, 11.0, 13.0, 22.0, 29.0, 31.0, 51.0, 67.0, 98.0, 139.0, 212.0, 301.0, 456.0, 711.0, 1016.0, 1703.0, 2877.0, 5166.0, 10216.0, 26254.0, 902338.0, 63504.0, 16011.0, 7302.0, 3756.0, 2246.0, 1410.0, 872.0, 561.0, 363.0, 239.0, 153.0, 137.0, 79.0, 58.0, 36.0, 28.0, 29.0, 10.0, 12.0, 14.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 3.0], "bins": [-5.296875, -5.152801513671875, -5.00872802734375, -4.864654541015625, -4.7205810546875, -4.576507568359375, -4.43243408203125, -4.288360595703125, -4.144287109375, -4.000213623046875, -3.85614013671875, -3.712066650390625, -3.5679931640625, -3.423919677734375, -3.27984619140625, -3.135772705078125, -2.99169921875, -2.847625732421875, -2.70355224609375, -2.559478759765625, -2.4154052734375, -2.271331787109375, -2.12725830078125, -1.983184814453125, -1.839111328125, -1.695037841796875, -1.55096435546875, -1.406890869140625, -1.2628173828125, -1.118743896484375, -0.97467041015625, -0.830596923828125, -0.6865234375, -0.542449951171875, -0.39837646484375, -0.254302978515625, -0.1102294921875, 0.033843994140625, 0.17791748046875, 0.321990966796875, 0.466064453125, 0.610137939453125, 0.75421142578125, 0.898284912109375, 1.0423583984375, 1.186431884765625, 1.33050537109375, 1.474578857421875, 1.61865234375, 1.762725830078125, 1.90679931640625, 2.050872802734375, 2.1949462890625, 2.339019775390625, 2.48309326171875, 2.627166748046875, 2.771240234375, 2.915313720703125, 3.05938720703125, 3.203460693359375, 3.3475341796875, 3.491607666015625, 3.63568115234375, 3.779754638671875, 3.923828125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 4.0, 2.0, 5.0, 3.0, 5.0, 7.0, 4.0, 11.0, 15.0, 12.0, 15.0, 44.0, 709.0, 70.0, 21.0, 18.0, 6.0, 7.0, 10.0, 5.0, 3.0, 4.0, 3.0, 1.0, 4.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.92724609375, -0.9031448364257812, -0.8790435791015625, -0.8549423217773438, -0.830841064453125, -0.8067398071289062, -0.7826385498046875, -0.7585372924804688, -0.73443603515625, -0.7103347778320312, -0.6862335205078125, -0.6621322631835938, -0.638031005859375, -0.6139297485351562, -0.5898284912109375, -0.5657272338867188, -0.5416259765625, -0.5175247192382812, -0.4934234619140625, -0.46932220458984375, -0.445220947265625, -0.42111968994140625, -0.3970184326171875, -0.37291717529296875, -0.34881591796875, -0.32471466064453125, -0.3006134033203125, -0.27651214599609375, -0.252410888671875, -0.22830963134765625, -0.2042083740234375, -0.18010711669921875, -0.156005859375, -0.13190460205078125, -0.1078033447265625, -0.08370208740234375, -0.059600830078125, -0.03549957275390625, -0.0113983154296875, 0.01270294189453125, 0.03680419921875, 0.06090545654296875, 0.0850067138671875, 0.10910797119140625, 0.133209228515625, 0.15731048583984375, 0.1814117431640625, 0.20551300048828125, 0.2296142578125, 0.25371551513671875, 0.2778167724609375, 0.30191802978515625, 0.326019287109375, 0.35012054443359375, 0.3742218017578125, 0.39832305908203125, 0.42242431640625, 0.44652557373046875, 0.4706268310546875, 0.49472808837890625, 0.518829345703125, 0.5429306030273438, 0.5670318603515625, 0.5911331176757812, 0.615234375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 6.0, 6.0, 8.0, 12.0, 6.0, 14.0, 23.0, 20.0, 32.0, 45.0, 74.0, 99.0, 160.0, 291.0, 460.0, 985.0, 1948.0, 4354.0, 11497.0, 36098.0, 149976.0, 613271.0, 168122.0, 39586.0, 12367.0, 4702.0, 2053.0, 1028.0, 514.0, 255.0, 180.0, 114.0, 73.0, 50.0, 29.0, 31.0, 17.0, 18.0, 14.0, 8.0, 5.0, 6.0, 4.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.375, -2.294586181640625, -2.21417236328125, -2.133758544921875, -2.0533447265625, -1.972930908203125, -1.89251708984375, -1.812103271484375, -1.731689453125, -1.651275634765625, -1.57086181640625, -1.490447998046875, -1.4100341796875, -1.329620361328125, -1.24920654296875, -1.168792724609375, -1.08837890625, -1.007965087890625, -0.92755126953125, -0.847137451171875, -0.7667236328125, -0.686309814453125, -0.60589599609375, -0.525482177734375, -0.445068359375, -0.364654541015625, -0.28424072265625, -0.203826904296875, -0.1234130859375, -0.042999267578125, 0.03741455078125, 0.117828369140625, 0.1982421875, 0.278656005859375, 0.35906982421875, 0.439483642578125, 0.5198974609375, 0.600311279296875, 0.68072509765625, 0.761138916015625, 0.841552734375, 0.921966552734375, 1.00238037109375, 1.082794189453125, 1.1632080078125, 1.243621826171875, 1.32403564453125, 1.404449462890625, 1.48486328125, 1.565277099609375, 1.64569091796875, 1.726104736328125, 1.8065185546875, 1.886932373046875, 1.96734619140625, 2.047760009765625, 2.128173828125, 2.208587646484375, 2.28900146484375, 2.369415283203125, 2.4498291015625, 2.530242919921875, 2.61065673828125, 2.691070556640625, 2.771484375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 2.0, 1.0, 4.0, 7.0, 2.0, 3.0, 7.0, 4.0, 5.0, 12.0, 11.0, 14.0, 16.0, 16.0, 14.0, 14.0, 22.0, 25.0, 33.0, 31.0, 38.0, 32.0, 31.0, 33.0, 42.0, 33.0, 37.0, 33.0, 32.0, 41.0, 33.0, 30.0, 30.0, 35.0, 33.0, 34.0, 27.0, 26.0, 29.0, 20.0, 23.0, 14.0, 20.0, 8.0, 6.0, 8.0, 8.0, 9.0, 2.0, 3.0, 6.0, 3.0, 3.0, 2.0, 4.0, 0.0, 0.0, 4.0, 1.0, 0.0, 2.0], "bins": [-2.287109375, -2.21209716796875, -2.1370849609375, -2.06207275390625, -1.987060546875, -1.91204833984375, -1.8370361328125, -1.76202392578125, -1.68701171875, -1.61199951171875, -1.5369873046875, -1.46197509765625, -1.386962890625, -1.31195068359375, -1.2369384765625, -1.16192626953125, -1.0869140625, -1.01190185546875, -0.9368896484375, -0.86187744140625, -0.786865234375, -0.71185302734375, -0.6368408203125, -0.56182861328125, -0.48681640625, -0.41180419921875, -0.3367919921875, -0.26177978515625, -0.186767578125, -0.11175537109375, -0.0367431640625, 0.03826904296875, 0.11328125, 0.18829345703125, 0.2633056640625, 0.33831787109375, 0.413330078125, 0.48834228515625, 0.5633544921875, 0.63836669921875, 0.71337890625, 0.78839111328125, 0.8634033203125, 0.93841552734375, 1.013427734375, 1.08843994140625, 1.1634521484375, 1.23846435546875, 1.3134765625, 1.38848876953125, 1.4635009765625, 1.53851318359375, 1.613525390625, 1.68853759765625, 1.7635498046875, 1.83856201171875, 1.91357421875, 1.98858642578125, 2.0635986328125, 2.13861083984375, 2.213623046875, 2.28863525390625, 2.3636474609375, 2.43865966796875, 2.513671875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 8.0, 14.0, 12.0, 14.0, 30.0, 32.0, 51.0, 80.0, 137.0, 252.0, 459.0, 986.0, 2850.0, 10837.0, 137551.0, 856846.0, 30058.0, 5233.0, 1634.0, 672.0, 321.0, 170.0, 102.0, 69.0, 33.0, 26.0, 21.0, 11.0, 13.0, 2.0, 3.0, 8.0, 3.0, 6.0, 1.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2578125, -3.1654052734375, -3.072998046875, -2.9805908203125, -2.88818359375, -2.7957763671875, -2.703369140625, -2.6109619140625, -2.5185546875, -2.4261474609375, -2.333740234375, -2.2413330078125, -2.14892578125, -2.0565185546875, -1.964111328125, -1.8717041015625, -1.779296875, -1.6868896484375, -1.594482421875, -1.5020751953125, -1.40966796875, -1.3172607421875, -1.224853515625, -1.1324462890625, -1.0400390625, -0.9476318359375, -0.855224609375, -0.7628173828125, -0.67041015625, -0.5780029296875, -0.485595703125, -0.3931884765625, -0.30078125, -0.2083740234375, -0.115966796875, -0.0235595703125, 0.06884765625, 0.1612548828125, 0.253662109375, 0.3460693359375, 0.4384765625, 0.5308837890625, 0.623291015625, 0.7156982421875, 0.80810546875, 0.9005126953125, 0.992919921875, 1.0853271484375, 1.177734375, 1.2701416015625, 1.362548828125, 1.4549560546875, 1.54736328125, 1.6397705078125, 1.732177734375, 1.8245849609375, 1.9169921875, 2.0093994140625, 2.101806640625, 2.1942138671875, 2.28662109375, 2.3790283203125, 2.471435546875, 2.5638427734375, 2.65625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 5.0, 9.0, 8.0, 8.0, 3.0, 8.0, 8.0, 16.0, 23.0, 30.0, 31.0, 40.0, 41.0, 51.0, 56.0, 80.0, 83.0, 81.0, 84.0, 63.0, 50.0, 39.0, 32.0, 39.0, 23.0, 21.0, 18.0, 12.0, 12.0, 6.0, 6.0, 5.0, 4.0, 6.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.52346420288086e-05, -8.207559585571289e-05, -7.891654968261719e-05, -7.575750350952148e-05, -7.259845733642578e-05, -6.943941116333008e-05, -6.628036499023438e-05, -6.312131881713867e-05, -5.996227264404297e-05, -5.6803226470947266e-05, -5.364418029785156e-05, -5.048513412475586e-05, -4.7326087951660156e-05, -4.416704177856445e-05, -4.100799560546875e-05, -3.784894943237305e-05, -3.4689903259277344e-05, -3.153085708618164e-05, -2.8371810913085938e-05, -2.5212764739990234e-05, -2.205371856689453e-05, -1.8894672393798828e-05, -1.5735626220703125e-05, -1.2576580047607422e-05, -9.417533874511719e-06, -6.258487701416016e-06, -3.0994415283203125e-06, 5.960464477539063e-08, 3.2186508178710938e-06, 6.377696990966797e-06, 9.5367431640625e-06, 1.2695789337158203e-05, 1.5854835510253906e-05, 1.901388168334961e-05, 2.2172927856445312e-05, 2.5331974029541016e-05, 2.849102020263672e-05, 3.165006637573242e-05, 3.4809112548828125e-05, 3.796815872192383e-05, 4.112720489501953e-05, 4.4286251068115234e-05, 4.744529724121094e-05, 5.060434341430664e-05, 5.3763389587402344e-05, 5.692243576049805e-05, 6.008148193359375e-05, 6.324052810668945e-05, 6.639957427978516e-05, 6.955862045288086e-05, 7.271766662597656e-05, 7.587671279907227e-05, 7.903575897216797e-05, 8.219480514526367e-05, 8.535385131835938e-05, 8.851289749145508e-05, 9.167194366455078e-05, 9.483098983764648e-05, 9.799003601074219e-05, 0.00010114908218383789, 0.0001043081283569336, 0.0001074671745300293, 0.000110626220703125, 0.0001137852668762207, 0.0001169443130493164]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 5.0, 7.0, 8.0, 16.0, 22.0, 34.0, 47.0, 83.0, 115.0, 219.0, 333.0, 651.0, 1537.0, 4024.0, 13972.0, 79150.0, 719401.0, 193273.0, 25095.0, 6339.0, 2169.0, 926.0, 473.0, 226.0, 159.0, 95.0, 59.0, 34.0, 19.0, 17.0, 13.0, 3.0, 6.0, 7.0, 6.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.40625, -2.3424072265625, -2.278564453125, -2.2147216796875, -2.15087890625, -2.0870361328125, -2.023193359375, -1.9593505859375, -1.8955078125, -1.8316650390625, -1.767822265625, -1.7039794921875, -1.64013671875, -1.5762939453125, -1.512451171875, -1.4486083984375, -1.384765625, -1.3209228515625, -1.257080078125, -1.1932373046875, -1.12939453125, -1.0655517578125, -1.001708984375, -0.9378662109375, -0.8740234375, -0.8101806640625, -0.746337890625, -0.6824951171875, -0.61865234375, -0.5548095703125, -0.490966796875, -0.4271240234375, -0.36328125, -0.2994384765625, -0.235595703125, -0.1717529296875, -0.10791015625, -0.0440673828125, 0.019775390625, 0.0836181640625, 0.1474609375, 0.2113037109375, 0.275146484375, 0.3389892578125, 0.40283203125, 0.4666748046875, 0.530517578125, 0.5943603515625, 0.658203125, 0.7220458984375, 0.785888671875, 0.8497314453125, 0.91357421875, 0.9774169921875, 1.041259765625, 1.1051025390625, 1.1689453125, 1.2327880859375, 1.296630859375, 1.3604736328125, 1.42431640625, 1.4881591796875, 1.552001953125, 1.6158447265625, 1.6796875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 7.0, 12.0, 15.0, 23.0, 31.0, 42.0, 59.0, 67.0, 79.0, 88.0, 110.0, 101.0, 89.0, 72.0, 51.0, 40.0, 26.0, 24.0, 23.0, 15.0, 9.0, 4.0, 5.0, 5.0, 4.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9443359375, -1.8684844970703125, -1.792633056640625, -1.7167816162109375, -1.64093017578125, -1.5650787353515625, -1.489227294921875, -1.4133758544921875, -1.3375244140625, -1.2616729736328125, -1.185821533203125, -1.1099700927734375, -1.03411865234375, -0.9582672119140625, -0.882415771484375, -0.8065643310546875, -0.730712890625, -0.6548614501953125, -0.579010009765625, -0.5031585693359375, -0.42730712890625, -0.3514556884765625, -0.275604248046875, -0.1997528076171875, -0.1239013671875, -0.0480499267578125, 0.027801513671875, 0.1036529541015625, 0.17950439453125, 0.2553558349609375, 0.331207275390625, 0.4070587158203125, 0.48291015625, 0.5587615966796875, 0.634613037109375, 0.7104644775390625, 0.78631591796875, 0.8621673583984375, 0.938018798828125, 1.0138702392578125, 1.0897216796875, 1.1655731201171875, 1.241424560546875, 1.3172760009765625, 1.39312744140625, 1.4689788818359375, 1.544830322265625, 1.6206817626953125, 1.696533203125, 1.7723846435546875, 1.848236083984375, 1.9240875244140625, 1.99993896484375, 2.0757904052734375, 2.151641845703125, 2.2274932861328125, 2.3033447265625, 2.3791961669921875, 2.455047607421875, 2.5308990478515625, 2.60675048828125, 2.6826019287109375, 2.758453369140625, 2.8343048095703125, 2.91015625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 5.0, 7.0, 17.0, 38.0, 117.0, 443.0, 247.0, 74.0, 25.0, 10.0, 9.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-33.22264099121094, -31.816661834716797, -30.410682678222656, -29.004703521728516, -27.598724365234375, -26.192745208740234, -24.78676414489746, -23.38078498840332, -21.97480583190918, -20.56882667541504, -19.1628475189209, -17.756866455078125, -16.350887298583984, -14.94490909576416, -13.538928985595703, -12.132949829101562, -10.726970672607422, -9.320991516113281, -7.915011882781982, -6.509032249450684, -5.103053092956543, -3.6970739364624023, -2.2910938262939453, -0.8851146697998047, 0.5208644866943359, 1.9268438816070557, 3.3328232765197754, 4.738802909851074, 6.144782066345215, 7.5507612228393555, 8.956741333007812, 10.362720489501953, 11.768699645996094, 13.174678802490234, 14.580657958984375, 15.986638069152832, 17.392616271972656, 18.798595428466797, 20.20457649230957, 21.61055564880371, 23.01653480529785, 24.422513961791992, 25.828493118286133, 27.234474182128906, 28.640453338623047, 30.046432495117188, 31.452411651611328, 32.85839080810547, 34.26436996459961, 35.67034912109375, 37.07632827758789, 38.48230743408203, 39.88828659057617, 41.29426574707031, 42.70024871826172, 44.106224060058594, 45.51220703125, 46.91818618774414, 48.32416534423828, 49.73014450073242, 51.13612365722656, 52.5421028137207, 53.948081970214844, 55.35406494140625, 56.760040283203125]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 4.0, 2.0, 3.0, 3.0, 6.0, 6.0, 4.0, 11.0, 7.0, 12.0, 14.0, 23.0, 48.0, 65.0, 96.0, 122.0, 120.0, 105.0, 97.0, 84.0, 43.0, 32.0, 25.0, 19.0, 9.0, 11.0, 10.0, 2.0, 2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-43.21520233154297, -41.7050895690918, -40.194976806640625, -38.68486404418945, -37.17475128173828, -35.664634704589844, -34.15452575683594, -32.6444091796875, -31.134296417236328, -29.624183654785156, -28.114070892333984, -26.603958129882812, -25.093843460083008, -23.583730697631836, -22.073617935180664, -20.56350326538086, -19.05339241027832, -17.54327964782715, -16.033166885375977, -14.523053169250488, -13.012939453125, -11.502826690673828, -9.992713928222656, -8.482600212097168, -6.972487449645996, -5.462374210357666, -3.952261209487915, -2.442148208618164, -0.932034969329834, 0.5780782699584961, 2.088191032409668, 3.5983047485351562, 5.108417510986328, 6.618530750274658, 8.128643989562988, 9.63875675201416, 11.148870468139648, 12.65898323059082, 14.169095993041992, 15.67920970916748, 17.18932342529297, 18.69943618774414, 20.209548950195312, 21.719661712646484, 23.22977638244629, 24.73988914489746, 26.250001907348633, 27.760116577148438, 29.270227432250977, 30.78034019470215, 32.29045486450195, 33.800567626953125, 35.3106803894043, 36.82079315185547, 38.33090591430664, 39.84101867675781, 41.351131439208984, 42.861244201660156, 44.37135696411133, 45.8814697265625, 47.39158248901367, 48.901695251464844, 50.41181182861328, 51.92192459106445, 53.432037353515625]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 4.0, 2.0, 5.0, 14.0, 13.0, 23.0, 32.0, 51.0, 74.0, 116.0, 149.0, 227.0, 414.0, 640.0, 969.0, 1656.0, 3096.0, 6093.0, 13926.0, 44575.0, 3462082.0, 605907.0, 33714.0, 10166.0, 4638.0, 2353.0, 1254.0, 755.0, 506.0, 274.0, 186.0, 116.0, 82.0, 53.0, 35.0, 35.0, 14.0, 10.0, 8.0, 5.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.8359375, -5.647216796875, -5.45849609375, -5.269775390625, -5.0810546875, -4.892333984375, -4.70361328125, -4.514892578125, -4.326171875, -4.137451171875, -3.94873046875, -3.760009765625, -3.5712890625, -3.382568359375, -3.19384765625, -3.005126953125, -2.81640625, -2.627685546875, -2.43896484375, -2.250244140625, -2.0615234375, -1.872802734375, -1.68408203125, -1.495361328125, -1.306640625, -1.117919921875, -0.92919921875, -0.740478515625, -0.5517578125, -0.363037109375, -0.17431640625, 0.014404296875, 0.203125, 0.391845703125, 0.58056640625, 0.769287109375, 0.9580078125, 1.146728515625, 1.33544921875, 1.524169921875, 1.712890625, 1.901611328125, 2.09033203125, 2.279052734375, 2.4677734375, 2.656494140625, 2.84521484375, 3.033935546875, 3.22265625, 3.411376953125, 3.60009765625, 3.788818359375, 3.9775390625, 4.166259765625, 4.35498046875, 4.543701171875, 4.732421875, 4.921142578125, 5.10986328125, 5.298583984375, 5.4873046875, 5.676025390625, 5.86474609375, 6.053466796875, 6.2421875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 4.0, 0.0, 5.0, 4.0, 8.0, 2.0, 6.0, 9.0, 8.0, 8.0, 11.0, 13.0, 13.0, 38.0, 110.0, 239.0, 268.0, 113.0, 38.0, 30.0, 11.0, 14.0, 8.0, 6.0, 4.0, 6.0, 1.0, 6.0, 2.0, 3.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50244140625, -0.4861907958984375, -0.469940185546875, -0.4536895751953125, -0.43743896484375, -0.4211883544921875, -0.404937744140625, -0.3886871337890625, -0.3724365234375, -0.3561859130859375, -0.339935302734375, -0.3236846923828125, -0.30743408203125, -0.2911834716796875, -0.274932861328125, -0.2586822509765625, -0.242431640625, -0.2261810302734375, -0.209930419921875, -0.1936798095703125, -0.17742919921875, -0.1611785888671875, -0.144927978515625, -0.1286773681640625, -0.1124267578125, -0.0961761474609375, -0.079925537109375, -0.0636749267578125, -0.04742431640625, -0.0311737060546875, -0.014923095703125, 0.0013275146484375, 0.017578125, 0.0338287353515625, 0.050079345703125, 0.0663299560546875, 0.08258056640625, 0.0988311767578125, 0.115081787109375, 0.1313323974609375, 0.1475830078125, 0.1638336181640625, 0.180084228515625, 0.1963348388671875, 0.21258544921875, 0.2288360595703125, 0.245086669921875, 0.2613372802734375, 0.277587890625, 0.2938385009765625, 0.310089111328125, 0.3263397216796875, 0.34259033203125, 0.3588409423828125, 0.375091552734375, 0.3913421630859375, 0.4075927734375, 0.4238433837890625, 0.440093994140625, 0.4563446044921875, 0.47259521484375, 0.4888458251953125, 0.505096435546875, 0.5213470458984375, 0.53759765625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 6.0, 7.0, 12.0, 11.0, 10.0, 29.0, 39.0, 67.0, 88.0, 121.0, 223.0, 359.0, 622.0, 1057.0, 2243.0, 5402.0, 15357.0, 65279.0, 2052538.0, 1960792.0, 63996.0, 15338.0, 5397.0, 2349.0, 1186.0, 630.0, 384.0, 215.0, 172.0, 106.0, 88.0, 41.0, 23.0, 25.0, 12.0, 10.0, 11.0, 8.0, 6.0, 7.0, 3.0, 3.0, 4.0, 2.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.513671875, -3.39654541015625, -3.2794189453125, -3.16229248046875, -3.045166015625, -2.92803955078125, -2.8109130859375, -2.69378662109375, -2.57666015625, -2.45953369140625, -2.3424072265625, -2.22528076171875, -2.108154296875, -1.99102783203125, -1.8739013671875, -1.75677490234375, -1.6396484375, -1.52252197265625, -1.4053955078125, -1.28826904296875, -1.171142578125, -1.05401611328125, -0.9368896484375, -0.81976318359375, -0.70263671875, -0.58551025390625, -0.4683837890625, -0.35125732421875, -0.234130859375, -0.11700439453125, 0.0001220703125, 0.11724853515625, 0.234375, 0.35150146484375, 0.4686279296875, 0.58575439453125, 0.702880859375, 0.82000732421875, 0.9371337890625, 1.05426025390625, 1.17138671875, 1.28851318359375, 1.4056396484375, 1.52276611328125, 1.639892578125, 1.75701904296875, 1.8741455078125, 1.99127197265625, 2.1083984375, 2.22552490234375, 2.3426513671875, 2.45977783203125, 2.576904296875, 2.69403076171875, 2.8111572265625, 2.92828369140625, 3.04541015625, 3.16253662109375, 3.2796630859375, 3.39678955078125, 3.513916015625, 3.63104248046875, 3.7481689453125, 3.86529541015625, 3.982421875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 6.0, 3.0, 3.0, 6.0, 8.0, 17.0, 15.0, 24.0, 25.0, 38.0, 59.0, 125.0, 224.0, 953.0, 1890.0, 324.0, 126.0, 81.0, 45.0, 19.0, 20.0, 17.0, 14.0, 7.0, 5.0, 8.0, 4.0, 4.0, 3.0, 6.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.74365234375, -0.7152328491210938, -0.6868133544921875, -0.6583938598632812, -0.629974365234375, -0.6015548706054688, -0.5731353759765625, -0.5447158813476562, -0.51629638671875, -0.48787689208984375, -0.4594573974609375, -0.43103790283203125, -0.402618408203125, -0.37419891357421875, -0.3457794189453125, -0.31735992431640625, -0.2889404296875, -0.26052093505859375, -0.2321014404296875, -0.20368194580078125, -0.175262451171875, -0.14684295654296875, -0.1184234619140625, -0.09000396728515625, -0.06158447265625, -0.03316497802734375, -0.0047454833984375, 0.02367401123046875, 0.052093505859375, 0.08051300048828125, 0.1089324951171875, 0.13735198974609375, 0.165771484375, 0.19419097900390625, 0.2226104736328125, 0.25102996826171875, 0.279449462890625, 0.30786895751953125, 0.3362884521484375, 0.36470794677734375, 0.39312744140625, 0.42154693603515625, 0.4499664306640625, 0.47838592529296875, 0.506805419921875, 0.5352249145507812, 0.5636444091796875, 0.5920639038085938, 0.6204833984375, 0.6489028930664062, 0.6773223876953125, 0.7057418823242188, 0.734161376953125, 0.7625808715820312, 0.7910003662109375, 0.8194198608398438, 0.84783935546875, 0.8762588500976562, 0.9046783447265625, 0.9330978393554688, 0.961517333984375, 0.9899368286132812, 1.0183563232421875, 1.0467758178710938, 1.0751953125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 21.0, 192.0, 677.0, 83.0, 18.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.153841972351074, -6.766066551208496, -6.37829065322876, -5.990515232086182, -5.602739334106445, -5.214963912963867, -4.827188491821289, -4.439413070678711, -4.051637172698975, -3.6638615131378174, -3.27608585357666, -2.888310432434082, -2.500534772872925, -2.1127591133117676, -1.7249836921691895, -1.3372080326080322, -0.949432373046875, -0.5616567730903625, -0.1738811731338501, 0.21389436721801758, 0.6016700267791748, 0.989445686340332, 1.3772211074829102, 1.7649967670440674, 2.1527724266052246, 2.540548086166382, 2.928323745727539, 3.316099166870117, 3.7038748264312744, 4.091650485992432, 4.47942590713501, 4.867201805114746, 5.254976272583008, 5.642751693725586, 6.030527591705322, 6.4183030128479, 6.806078910827637, 7.193854331970215, 7.581629753112793, 7.969405174255371, 8.357181549072266, 8.744956970214844, 9.132732391357422, 9.5205078125, 9.908284187316895, 10.296059608459473, 10.68383502960205, 11.071610450744629, 11.459385871887207, 11.847161293029785, 12.234936714172363, 12.622713088989258, 13.010488510131836, 13.398263931274414, 13.786039352416992, 14.17381477355957, 14.561590194702148, 14.949365615844727, 15.337141036987305, 15.724916458129883, 16.11269187927246, 16.500469207763672, 16.88824462890625, 17.276020050048828, 17.663795471191406]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 5.0, 6.0, 5.0, 13.0, 8.0, 16.0, 24.0, 29.0, 47.0, 57.0, 75.0, 106.0, 94.0, 98.0, 104.0, 67.0, 62.0, 41.0, 41.0, 27.0, 11.0, 11.0, 5.0, 8.0, 10.0, 2.0, 5.0, 3.0, 4.0, 1.0, 5.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.241288185119629, -4.114683151245117, -3.9880785942077637, -3.861473798751831, -3.7348690032958984, -3.6082639694213867, -3.481659173965454, -3.3550543785095215, -3.228449583053589, -3.1018447875976562, -2.9752399921417236, -2.848635196685791, -2.7220301628112793, -2.595425605773926, -2.468820571899414, -2.3422157764434814, -2.215610980987549, -2.089006185531616, -1.9624013900756836, -1.8357964754104614, -1.7091916799545288, -1.5825868844985962, -1.455981969833374, -1.3293771743774414, -1.2027723789215088, -1.0761675834655762, -0.9495627284049988, -0.8229578733444214, -0.6963530778884888, -0.5697482824325562, -0.44314342737197876, -0.31653857231140137, -0.18993377685546875, -0.06332895159721375, 0.06327587366104126, 0.18988069891929626, 0.31648552417755127, 0.4430903196334839, 0.5696951746940613, 0.6963000297546387, 0.8229048252105713, 0.9495096206665039, 1.0761144161224365, 1.2027193307876587, 1.3293241262435913, 1.455928921699524, 1.582533836364746, 1.7091386318206787, 1.8357434272766113, 1.962348222732544, 2.0889530181884766, 2.215557813644409, 2.342162609100342, 2.4687676429748535, 2.595372438430786, 2.7219772338867188, 2.8485820293426514, 2.975186824798584, 3.1017916202545166, 3.228396415710449, 3.355001449584961, 3.4816060066223145, 3.608211040496826, 3.734815835952759, 3.8614206314086914]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 10.0, 6.0, 19.0, 29.0, 33.0, 70.0, 87.0, 101.0, 185.0, 252.0, 354.0, 546.0, 948.0, 1546.0, 2656.0, 4506.0, 8996.0, 19621.0, 69580.0, 752967.0, 134894.0, 26592.0, 11111.0, 5476.0, 3088.0, 1823.0, 1120.0, 614.0, 426.0, 280.0, 189.0, 129.0, 95.0, 59.0, 50.0, 31.0, 18.0, 15.0, 11.0, 8.0, 3.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0], "bins": [-3.26171875, -3.17022705078125, -3.0787353515625, -2.98724365234375, -2.895751953125, -2.80426025390625, -2.7127685546875, -2.62127685546875, -2.52978515625, -2.43829345703125, -2.3468017578125, -2.25531005859375, -2.163818359375, -2.07232666015625, -1.9808349609375, -1.88934326171875, -1.7978515625, -1.70635986328125, -1.6148681640625, -1.52337646484375, -1.431884765625, -1.34039306640625, -1.2489013671875, -1.15740966796875, -1.06591796875, -0.97442626953125, -0.8829345703125, -0.79144287109375, -0.699951171875, -0.60845947265625, -0.5169677734375, -0.42547607421875, -0.333984375, -0.24249267578125, -0.1510009765625, -0.05950927734375, 0.031982421875, 0.12347412109375, 0.2149658203125, 0.30645751953125, 0.39794921875, 0.48944091796875, 0.5809326171875, 0.67242431640625, 0.763916015625, 0.85540771484375, 0.9468994140625, 1.03839111328125, 1.1298828125, 1.22137451171875, 1.3128662109375, 1.40435791015625, 1.495849609375, 1.58734130859375, 1.6788330078125, 1.77032470703125, 1.86181640625, 1.95330810546875, 2.0447998046875, 2.13629150390625, 2.227783203125, 2.31927490234375, 2.4107666015625, 2.50225830078125, 2.59375]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 10.0, 4.0, 2.0, 3.0, 3.0, 8.0, 8.0, 8.0, 10.0, 15.0, 15.0, 24.0, 39.0, 109.0, 161.0, 233.0, 144.0, 73.0, 37.0, 24.0, 18.0, 12.0, 5.0, 10.0, 6.0, 7.0, 3.0, 3.0, 1.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.5205078125, -0.5061302185058594, -0.49175262451171875, -0.4773750305175781, -0.4629974365234375, -0.4486198425292969, -0.43424224853515625, -0.4198646545410156, -0.405487060546875, -0.3911094665527344, -0.37673187255859375, -0.3623542785644531, -0.3479766845703125, -0.3335990905761719, -0.31922149658203125, -0.3048439025878906, -0.29046630859375, -0.2760887145996094, -0.26171112060546875, -0.24733352661132812, -0.2329559326171875, -0.21857833862304688, -0.20420074462890625, -0.18982315063476562, -0.175445556640625, -0.16106796264648438, -0.14669036865234375, -0.13231277465820312, -0.1179351806640625, -0.10355758666992188, -0.08917999267578125, -0.07480239868164062, -0.0604248046875, -0.046047210693359375, -0.03166961669921875, -0.017292022705078125, -0.0029144287109375, 0.011463165283203125, 0.02584075927734375, 0.040218353271484375, 0.054595947265625, 0.06897354125976562, 0.08335113525390625, 0.09772872924804688, 0.1121063232421875, 0.12648391723632812, 0.14086151123046875, 0.15523910522460938, 0.16961669921875, 0.18399429321289062, 0.19837188720703125, 0.21274948120117188, 0.2271270751953125, 0.24150466918945312, 0.25588226318359375, 0.2702598571777344, 0.284637451171875, 0.2990150451660156, 0.31339263916015625, 0.3277702331542969, 0.3421478271484375, 0.3565254211425781, 0.37090301513671875, 0.3852806091308594, 0.399658203125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 3.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 18.0, 65.0, 304.0, 2074.0, 33456.0, 897863.0, 109327.0, 4705.0, 528.0, 124.0, 35.0, 12.0, 11.0, 3.0, 1.0, 2.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.11328125, -4.9140625, -4.71484375, -4.515625, -4.31640625, -4.1171875, -3.91796875, -3.71875, -3.51953125, -3.3203125, -3.12109375, -2.921875, -2.72265625, -2.5234375, -2.32421875, -2.125, -1.92578125, -1.7265625, -1.52734375, -1.328125, -1.12890625, -0.9296875, -0.73046875, -0.53125, -0.33203125, -0.1328125, 0.06640625, 0.265625, 0.46484375, 0.6640625, 0.86328125, 1.0625, 1.26171875, 1.4609375, 1.66015625, 1.859375, 2.05859375, 2.2578125, 2.45703125, 2.65625, 2.85546875, 3.0546875, 3.25390625, 3.453125, 3.65234375, 3.8515625, 4.05078125, 4.25, 4.44921875, 4.6484375, 4.84765625, 5.046875, 5.24609375, 5.4453125, 5.64453125, 5.84375, 6.04296875, 6.2421875, 6.44140625, 6.640625, 6.83984375, 7.0390625, 7.23828125, 7.4375, 7.63671875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 7.0, 2.0, 3.0, 3.0, 2.0, 5.0, 7.0, 9.0, 10.0, 11.0, 10.0, 19.0, 20.0, 23.0, 20.0, 28.0, 25.0, 27.0, 35.0, 29.0, 36.0, 41.0, 40.0, 27.0, 37.0, 42.0, 40.0, 45.0, 40.0, 37.0, 37.0, 26.0, 39.0, 26.0, 34.0, 19.0, 22.0, 14.0, 17.0, 18.0, 15.0, 18.0, 10.0, 7.0, 5.0, 5.0, 6.0, 3.0, 6.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.32421875, -1.2821807861328125, -1.240142822265625, -1.1981048583984375, -1.15606689453125, -1.1140289306640625, -1.071990966796875, -1.0299530029296875, -0.9879150390625, -0.9458770751953125, -0.903839111328125, -0.8618011474609375, -0.81976318359375, -0.7777252197265625, -0.735687255859375, -0.6936492919921875, -0.651611328125, -0.6095733642578125, -0.567535400390625, -0.5254974365234375, -0.48345947265625, -0.4414215087890625, -0.399383544921875, -0.3573455810546875, -0.3153076171875, -0.2732696533203125, -0.231231689453125, -0.1891937255859375, -0.14715576171875, -0.1051177978515625, -0.063079833984375, -0.0210418701171875, 0.02099609375, 0.0630340576171875, 0.105072021484375, 0.1471099853515625, 0.18914794921875, 0.2311859130859375, 0.273223876953125, 0.3152618408203125, 0.3572998046875, 0.3993377685546875, 0.441375732421875, 0.4834136962890625, 0.52545166015625, 0.5674896240234375, 0.609527587890625, 0.6515655517578125, 0.693603515625, 0.7356414794921875, 0.777679443359375, 0.8197174072265625, 0.86175537109375, 0.9037933349609375, 0.945831298828125, 0.9878692626953125, 1.0299072265625, 1.0719451904296875, 1.113983154296875, 1.1560211181640625, 1.19805908203125, 1.2400970458984375, 1.282135009765625, 1.3241729736328125, 1.3662109375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 3.0, 1.0, 2.0, 5.0, 0.0, 2.0, 7.0, 4.0, 13.0, 16.0, 21.0, 34.0, 48.0, 93.0, 162.0, 389.0, 951.0, 3354.0, 21749.0, 815893.0, 193488.0, 9091.0, 1993.0, 663.0, 262.0, 122.0, 68.0, 36.0, 25.0, 11.0, 7.0, 10.0, 6.0, 5.0, 7.0, 7.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.21484375, -5.083831787109375, -4.95281982421875, -4.821807861328125, -4.6907958984375, -4.559783935546875, -4.42877197265625, -4.297760009765625, -4.166748046875, -4.035736083984375, -3.90472412109375, -3.773712158203125, -3.6427001953125, -3.511688232421875, -3.38067626953125, -3.249664306640625, -3.11865234375, -2.987640380859375, -2.85662841796875, -2.725616455078125, -2.5946044921875, -2.463592529296875, -2.33258056640625, -2.201568603515625, -2.070556640625, -1.939544677734375, -1.80853271484375, -1.677520751953125, -1.5465087890625, -1.415496826171875, -1.28448486328125, -1.153472900390625, -1.0224609375, -0.891448974609375, -0.76043701171875, -0.629425048828125, -0.4984130859375, -0.367401123046875, -0.23638916015625, -0.105377197265625, 0.025634765625, 0.156646728515625, 0.28765869140625, 0.418670654296875, 0.5496826171875, 0.680694580078125, 0.81170654296875, 0.942718505859375, 1.07373046875, 1.204742431640625, 1.33575439453125, 1.466766357421875, 1.5977783203125, 1.728790283203125, 1.85980224609375, 1.990814208984375, 2.121826171875, 2.252838134765625, 2.38385009765625, 2.514862060546875, 2.6458740234375, 2.776885986328125, 2.90789794921875, 3.038909912109375, 3.169921875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 0.0, 4.0, 8.0, 8.0, 14.0, 16.0, 24.0, 45.0, 52.0, 87.0, 110.0, 160.0, 117.0, 92.0, 78.0, 63.0, 49.0, 25.0, 20.0, 12.0, 5.0, 3.0, 5.0, 1.0, 7.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020968914031982422, -0.00020331144332885742, -0.00019693374633789062, -0.00019055604934692383, -0.00018417835235595703, -0.00017780065536499023, -0.00017142295837402344, -0.00016504526138305664, -0.00015866756439208984, -0.00015228986740112305, -0.00014591217041015625, -0.00013953447341918945, -0.00013315677642822266, -0.00012677907943725586, -0.00012040138244628906, -0.00011402368545532227, -0.00010764598846435547, -0.00010126829147338867, -9.489059448242188e-05, -8.851289749145508e-05, -8.213520050048828e-05, -7.575750350952148e-05, -6.937980651855469e-05, -6.300210952758789e-05, -5.6624412536621094e-05, -5.02467155456543e-05, -4.38690185546875e-05, -3.74913215637207e-05, -3.1113624572753906e-05, -2.473592758178711e-05, -1.8358230590820312e-05, -1.1980533599853516e-05, -5.602836608886719e-06, 7.748603820800781e-07, 7.152557373046875e-06, 1.3530254364013672e-05, 1.990795135498047e-05, 2.6285648345947266e-05, 3.266334533691406e-05, 3.904104232788086e-05, 4.5418739318847656e-05, 5.179643630981445e-05, 5.817413330078125e-05, 6.455183029174805e-05, 7.092952728271484e-05, 7.730722427368164e-05, 8.368492126464844e-05, 9.006261825561523e-05, 9.644031524658203e-05, 0.00010281801223754883, 0.00010919570922851562, 0.00011557340621948242, 0.00012195110321044922, 0.00012832880020141602, 0.0001347064971923828, 0.0001410841941833496, 0.0001474618911743164, 0.0001538395881652832, 0.00016021728515625, 0.0001665949821472168, 0.0001729726791381836, 0.0001793503761291504, 0.0001857280731201172, 0.00019210577011108398, 0.00019848346710205078]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 7.0, 12.0, 12.0, 16.0, 24.0, 39.0, 75.0, 125.0, 226.0, 460.0, 1045.0, 2910.0, 11668.0, 98934.0, 787308.0, 127976.0, 12785.0, 2934.0, 1097.0, 431.0, 216.0, 125.0, 54.0, 24.0, 21.0, 11.0, 12.0, 4.0, 2.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.53515625, -2.457275390625, -2.37939453125, -2.301513671875, -2.2236328125, -2.145751953125, -2.06787109375, -1.989990234375, -1.912109375, -1.834228515625, -1.75634765625, -1.678466796875, -1.6005859375, -1.522705078125, -1.44482421875, -1.366943359375, -1.2890625, -1.211181640625, -1.13330078125, -1.055419921875, -0.9775390625, -0.899658203125, -0.82177734375, -0.743896484375, -0.666015625, -0.588134765625, -0.51025390625, -0.432373046875, -0.3544921875, -0.276611328125, -0.19873046875, -0.120849609375, -0.04296875, 0.034912109375, 0.11279296875, 0.190673828125, 0.2685546875, 0.346435546875, 0.42431640625, 0.502197265625, 0.580078125, 0.657958984375, 0.73583984375, 0.813720703125, 0.8916015625, 0.969482421875, 1.04736328125, 1.125244140625, 1.203125, 1.281005859375, 1.35888671875, 1.436767578125, 1.5146484375, 1.592529296875, 1.67041015625, 1.748291015625, 1.826171875, 1.904052734375, 1.98193359375, 2.059814453125, 2.1376953125, 2.215576171875, 2.29345703125, 2.371337890625, 2.44921875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 5.0, 10.0, 6.0, 10.0, 14.0, 19.0, 34.0, 61.0, 90.0, 113.0, 137.0, 117.0, 123.0, 78.0, 78.0, 42.0, 27.0, 16.0, 10.0, 6.0, 4.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.380859375, -2.3187713623046875, -2.256683349609375, -2.1945953369140625, -2.13250732421875, -2.0704193115234375, -2.008331298828125, -1.9462432861328125, -1.8841552734375, -1.8220672607421875, -1.759979248046875, -1.6978912353515625, -1.63580322265625, -1.5737152099609375, -1.511627197265625, -1.4495391845703125, -1.387451171875, -1.3253631591796875, -1.263275146484375, -1.2011871337890625, -1.13909912109375, -1.0770111083984375, -1.014923095703125, -0.9528350830078125, -0.8907470703125, -0.8286590576171875, -0.766571044921875, -0.7044830322265625, -0.64239501953125, -0.5803070068359375, -0.518218994140625, -0.4561309814453125, -0.39404296875, -0.3319549560546875, -0.269866943359375, -0.2077789306640625, -0.14569091796875, -0.0836029052734375, -0.021514892578125, 0.0405731201171875, 0.1026611328125, 0.1647491455078125, 0.226837158203125, 0.2889251708984375, 0.35101318359375, 0.4131011962890625, 0.475189208984375, 0.5372772216796875, 0.599365234375, 0.6614532470703125, 0.723541259765625, 0.7856292724609375, 0.84771728515625, 0.9098052978515625, 0.971893310546875, 1.0339813232421875, 1.0960693359375, 1.1581573486328125, 1.220245361328125, 1.2823333740234375, 1.34442138671875, 1.4065093994140625, 1.468597412109375, 1.5306854248046875, 1.5927734375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 8.0, 12.0, 19.0, 46.0, 161.0, 394.0, 223.0, 82.0, 36.0, 14.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-29.46117401123047, -28.699419021606445, -27.93766212463379, -27.175907135009766, -26.414152145385742, -25.65239715576172, -24.890640258789062, -24.12888526916504, -23.367130279541016, -22.605375289916992, -21.843618392944336, -21.081863403320312, -20.32010841369629, -19.558353424072266, -18.79659652709961, -18.034841537475586, -17.27308464050293, -16.511329650878906, -15.749573707580566, -14.987817764282227, -14.226062774658203, -13.464306831359863, -12.702550888061523, -11.9407958984375, -11.17903995513916, -10.41728401184082, -9.655529022216797, -8.893773078918457, -8.132017135620117, -7.370262145996094, -6.608506202697754, -5.846750736236572, -5.084995269775391, -4.323239803314209, -3.5614840984344482, -2.7997283935546875, -2.037972927093506, -1.2762174606323242, -0.5144615173339844, 0.24729394912719727, 1.009049415588379, 1.77080500125885, 2.5325605869293213, 3.294316291809082, 4.056071758270264, 4.817827224731445, 5.579583168029785, 6.341338634490967, 7.103094100952148, 7.86484956741333, 8.626605033874512, 9.388360977172852, 10.150115966796875, 10.911871910095215, 11.673627853393555, 12.435382843017578, 13.197138786315918, 13.958894729614258, 14.720649719238281, 15.482405662536621, 16.24416160583496, 17.005916595458984, 17.76767349243164, 18.529428482055664, 19.291183471679688]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 5.0, 3.0, 4.0, 5.0, 4.0, 7.0, 5.0, 15.0, 18.0, 18.0, 33.0, 47.0, 51.0, 76.0, 97.0, 105.0, 105.0, 86.0, 86.0, 76.0, 45.0, 32.0, 17.0, 17.0, 14.0, 9.0, 6.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.15813446044922, -19.52935791015625, -18.900583267211914, -18.271808624267578, -17.64303207397461, -17.01425552368164, -16.385480880737305, -15.756705284118652, -15.1279296875, -14.499154090881348, -13.870378494262695, -13.241602897644043, -12.61282730102539, -11.984051704406738, -11.355276107788086, -10.726500511169434, -10.097724914550781, -9.468949317932129, -8.840173721313477, -8.211398124694824, -7.582622528076172, -6.9538469314575195, -6.325071334838867, -5.696295738220215, -5.0675201416015625, -4.43874454498291, -3.809968948364258, -3.1811933517456055, -2.552417755126953, -1.9236421585083008, -1.2948665618896484, -0.6660909652709961, -0.03731727600097656, 0.5914583206176758, 1.2202339172363281, 1.8490095138549805, 2.477785110473633, 3.106560707092285, 3.7353363037109375, 4.36411190032959, 4.992887496948242, 5.6216630935668945, 6.250438690185547, 6.879214286804199, 7.507989883422852, 8.136765480041504, 8.765541076660156, 9.394316673278809, 10.023092269897461, 10.651867866516113, 11.280643463134766, 11.909419059753418, 12.53819465637207, 13.166970252990723, 13.795745849609375, 14.424521446228027, 15.05329704284668, 15.682072639465332, 16.310848236083984, 16.939624786376953, 17.56839942932129, 18.197174072265625, 18.825950622558594, 19.454727172851562, 20.0835018157959]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 2.0, 5.0, 6.0, 5.0, 7.0, 16.0, 13.0, 13.0, 26.0, 26.0, 28.0, 52.0, 49.0, 74.0, 112.0, 144.0, 198.0, 334.0, 563.0, 952.0, 1866.0, 3933.0, 11357.0, 77121.0, 4014981.0, 64959.0, 10363.0, 3380.0, 1503.0, 811.0, 482.0, 283.0, 201.0, 132.0, 90.0, 62.0, 51.0, 32.0, 14.0, 11.0, 10.0, 4.0, 7.0, 2.0, 2.0, 2.0], "bins": [-11.7578125, -11.48095703125, -11.2041015625, -10.92724609375, -10.650390625, -10.37353515625, -10.0966796875, -9.81982421875, -9.54296875, -9.26611328125, -8.9892578125, -8.71240234375, -8.435546875, -8.15869140625, -7.8818359375, -7.60498046875, -7.328125, -7.05126953125, -6.7744140625, -6.49755859375, -6.220703125, -5.94384765625, -5.6669921875, -5.39013671875, -5.11328125, -4.83642578125, -4.5595703125, -4.28271484375, -4.005859375, -3.72900390625, -3.4521484375, -3.17529296875, -2.8984375, -2.62158203125, -2.3447265625, -2.06787109375, -1.791015625, -1.51416015625, -1.2373046875, -0.96044921875, -0.68359375, -0.40673828125, -0.1298828125, 0.14697265625, 0.423828125, 0.70068359375, 0.9775390625, 1.25439453125, 1.53125, 1.80810546875, 2.0849609375, 2.36181640625, 2.638671875, 2.91552734375, 3.1923828125, 3.46923828125, 3.74609375, 4.02294921875, 4.2998046875, 4.57666015625, 4.853515625, 5.13037109375, 5.4072265625, 5.68408203125, 5.9609375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 7.0, 9.0, 11.0, 19.0, 13.0, 28.0, 30.0, 58.0, 120.0, 158.0, 171.0, 138.0, 80.0, 54.0, 31.0, 10.0, 17.0, 7.0, 7.0, 5.0, 4.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0], "bins": [-0.58837890625, -0.5743942260742188, -0.5604095458984375, -0.5464248657226562, -0.532440185546875, -0.5184555053710938, -0.5044708251953125, -0.49048614501953125, -0.47650146484375, -0.46251678466796875, -0.4485321044921875, -0.43454742431640625, -0.420562744140625, -0.40657806396484375, -0.3925933837890625, -0.37860870361328125, -0.3646240234375, -0.35063934326171875, -0.3366546630859375, -0.32266998291015625, -0.308685302734375, -0.29470062255859375, -0.2807159423828125, -0.26673126220703125, -0.25274658203125, -0.23876190185546875, -0.2247772216796875, -0.21079254150390625, -0.196807861328125, -0.18282318115234375, -0.1688385009765625, -0.15485382080078125, -0.140869140625, -0.12688446044921875, -0.1128997802734375, -0.09891510009765625, -0.084930419921875, -0.07094573974609375, -0.0569610595703125, -0.04297637939453125, -0.02899169921875, -0.01500701904296875, -0.0010223388671875, 0.01296234130859375, 0.026947021484375, 0.04093170166015625, 0.0549163818359375, 0.06890106201171875, 0.0828857421875, 0.09687042236328125, 0.1108551025390625, 0.12483978271484375, 0.138824462890625, 0.15280914306640625, 0.1667938232421875, 0.18077850341796875, 0.19476318359375, 0.20874786376953125, 0.2227325439453125, 0.23671722412109375, 0.250701904296875, 0.26468658447265625, 0.2786712646484375, 0.29265594482421875, 0.306640625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 0.0, 8.0, 7.0, 8.0, 12.0, 12.0, 19.0, 23.0, 49.0, 88.0, 270.0, 1897.0, 289073.0, 3899070.0, 3198.0, 326.0, 79.0, 43.0, 22.0, 20.0, 10.0, 19.0, 6.0, 10.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3984375, -11.8372802734375, -11.276123046875, -10.7149658203125, -10.15380859375, -9.5926513671875, -9.031494140625, -8.4703369140625, -7.9091796875, -7.3480224609375, -6.786865234375, -6.2257080078125, -5.66455078125, -5.1033935546875, -4.542236328125, -3.9810791015625, -3.419921875, -2.8587646484375, -2.297607421875, -1.7364501953125, -1.17529296875, -0.6141357421875, -0.052978515625, 0.5081787109375, 1.0693359375, 1.6304931640625, 2.191650390625, 2.7528076171875, 3.31396484375, 3.8751220703125, 4.436279296875, 4.9974365234375, 5.55859375, 6.1197509765625, 6.680908203125, 7.2420654296875, 7.80322265625, 8.3643798828125, 8.925537109375, 9.4866943359375, 10.0478515625, 10.6090087890625, 11.170166015625, 11.7313232421875, 12.29248046875, 12.8536376953125, 13.414794921875, 13.9759521484375, 14.537109375, 15.0982666015625, 15.659423828125, 16.2205810546875, 16.78173828125, 17.3428955078125, 17.904052734375, 18.4652099609375, 19.0263671875, 19.5875244140625, 20.148681640625, 20.7098388671875, 21.27099609375, 21.8321533203125, 22.393310546875, 22.9544677734375, 23.515625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 6.0, 2.0, 6.0, 6.0, 9.0, 12.0, 12.0, 21.0, 21.0, 37.0, 39.0, 83.0, 159.0, 404.0, 1728.0, 842.0, 311.0, 144.0, 67.0, 48.0, 23.0, 27.0, 17.0, 11.0, 16.0, 4.0, 8.0, 2.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 4.0], "bins": [-0.95703125, -0.9341201782226562, -0.9112091064453125, -0.8882980346679688, -0.865386962890625, -0.8424758911132812, -0.8195648193359375, -0.7966537475585938, -0.77374267578125, -0.7508316040039062, -0.7279205322265625, -0.7050094604492188, -0.682098388671875, -0.6591873168945312, -0.6362762451171875, -0.6133651733398438, -0.5904541015625, -0.5675430297851562, -0.5446319580078125, -0.5217208862304688, -0.498809814453125, -0.47589874267578125, -0.4529876708984375, -0.43007659912109375, -0.40716552734375, -0.38425445556640625, -0.3613433837890625, -0.33843231201171875, -0.315521240234375, -0.29261016845703125, -0.2696990966796875, -0.24678802490234375, -0.223876953125, -0.20096588134765625, -0.1780548095703125, -0.15514373779296875, -0.132232666015625, -0.10932159423828125, -0.0864105224609375, -0.06349945068359375, -0.04058837890625, -0.01767730712890625, 0.0052337646484375, 0.02814483642578125, 0.051055908203125, 0.07396697998046875, 0.0968780517578125, 0.11978912353515625, 0.1427001953125, 0.16561126708984375, 0.1885223388671875, 0.21143341064453125, 0.234344482421875, 0.25725555419921875, 0.2801666259765625, 0.30307769775390625, 0.32598876953125, 0.34889984130859375, 0.3718109130859375, 0.39472198486328125, 0.417633056640625, 0.44054412841796875, 0.4634552001953125, 0.48636627197265625, 0.50927734375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 5.0, 8.0, 19.0, 43.0, 104.0, 239.0, 294.0, 172.0, 62.0, 28.0, 12.0, 7.0, 5.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.606807231903076, -5.447340488433838, -5.287873268127441, -5.128406524658203, -4.968939781188965, -4.809473037719727, -4.65000581741333, -4.490539073944092, -4.331071853637695, -4.171605110168457, -4.0121378898620605, -3.8526711463928223, -3.693204402923584, -3.5337374210357666, -3.374270439147949, -3.214803695678711, -3.0553369522094727, -2.8958699703216553, -2.736403226852417, -2.5769362449645996, -2.4174695014953613, -2.258002519607544, -2.0985355377197266, -1.9390686750411987, -1.779601812362671, -1.620134949684143, -1.4606680870056152, -1.3012011051177979, -1.14173424243927, -0.9822673797607422, -0.8228004574775696, -0.663333535194397, -0.5038671493530273, -0.3444002568721771, -0.1849333643913269, -0.025466471910476685, 0.13400042057037354, 0.29346728324890137, 0.452934205532074, 0.6124011278152466, 0.7718679904937744, 0.9313348531723022, 1.09080171585083, 1.2502686977386475, 1.4097355604171753, 1.5692024230957031, 1.7286694049835205, 1.8881362676620483, 2.047603130340576, 2.2070701122283936, 2.366536855697632, 2.526003837585449, 2.6854705810546875, 2.844937562942505, 3.0044045448303223, 3.1638712882995605, 3.323338270187378, 3.4828052520751953, 3.6422719955444336, 3.801738977432251, 3.9612059593200684, 4.120672702789307, 4.280139446258545, 4.439606666564941, 4.59907341003418]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 4.0, 1.0, 7.0, 3.0, 3.0, 9.0, 6.0, 7.0, 19.0, 40.0, 60.0, 59.0, 88.0, 99.0, 130.0, 129.0, 83.0, 80.0, 52.0, 43.0, 27.0, 19.0, 13.0, 9.0, 7.0, 5.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4642257690429688, -2.3253109455108643, -2.1863961219787598, -2.0474812984466553, -1.9085664749145508, -1.7696516513824463, -1.6307368278503418, -1.4918220043182373, -1.3529071807861328, -1.2139923572540283, -1.0750775337219238, -0.9361627101898193, -0.7972478866577148, -0.6583330631256104, -0.5194182395935059, -0.38050341606140137, -0.24158859252929688, -0.10267376899719238, 0.03624105453491211, 0.1751558780670166, 0.3140707015991211, 0.4529855251312256, 0.5919003486633301, 0.7308151721954346, 0.8697299957275391, 1.0086448192596436, 1.147559642791748, 1.2864744663238525, 1.425389289855957, 1.5643041133880615, 1.703218936920166, 1.8421337604522705, 1.9810481071472168, 2.1199629306793213, 2.258877754211426, 2.3977925777435303, 2.5367074012756348, 2.6756222248077393, 2.8145370483398438, 2.9534518718719482, 3.0923666954040527, 3.2312815189361572, 3.3701963424682617, 3.509111166000366, 3.6480259895324707, 3.786940813064575, 3.9258556365966797, 4.064770698547363, 4.203685283660889, 4.342599868774414, 4.481514930725098, 4.620429992675781, 4.759344577789307, 4.898259162902832, 5.037174224853516, 5.176089286804199, 5.315003871917725, 5.45391845703125, 5.592833518981934, 5.731748580932617, 5.870663166046143, 6.009577751159668, 6.148492813110352, 6.287407875061035, 6.4263224601745605]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 6.0, 4.0, 1.0, 5.0, 9.0, 5.0, 17.0, 22.0, 26.0, 51.0, 93.0, 132.0, 227.0, 454.0, 814.0, 1745.0, 4550.0, 18620.0, 232932.0, 734437.0, 41866.0, 7556.0, 2612.0, 1093.0, 520.0, 312.0, 148.0, 107.0, 77.0, 32.0, 30.0, 21.0, 10.0, 14.0, 4.0, 2.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3515625, -3.23272705078125, -3.1138916015625, -2.99505615234375, -2.876220703125, -2.75738525390625, -2.6385498046875, -2.51971435546875, -2.40087890625, -2.28204345703125, -2.1632080078125, -2.04437255859375, -1.925537109375, -1.80670166015625, -1.6878662109375, -1.56903076171875, -1.4501953125, -1.33135986328125, -1.2125244140625, -1.09368896484375, -0.974853515625, -0.85601806640625, -0.7371826171875, -0.61834716796875, -0.49951171875, -0.38067626953125, -0.2618408203125, -0.14300537109375, -0.024169921875, 0.09466552734375, 0.2135009765625, 0.33233642578125, 0.451171875, 0.57000732421875, 0.6888427734375, 0.80767822265625, 0.926513671875, 1.04534912109375, 1.1641845703125, 1.28302001953125, 1.40185546875, 1.52069091796875, 1.6395263671875, 1.75836181640625, 1.877197265625, 1.99603271484375, 2.1148681640625, 2.23370361328125, 2.3525390625, 2.47137451171875, 2.5902099609375, 2.70904541015625, 2.827880859375, 2.94671630859375, 3.0655517578125, 3.18438720703125, 3.30322265625, 3.42205810546875, 3.5408935546875, 3.65972900390625, 3.778564453125, 3.89739990234375, 4.0162353515625, 4.13507080078125, 4.25390625]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 3.0, 7.0, 8.0, 9.0, 16.0, 21.0, 43.0, 77.0, 124.0, 167.0, 177.0, 134.0, 81.0, 45.0, 39.0, 19.0, 9.0, 4.0, 5.0, 3.0, 3.0, 2.0, 3.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.493408203125, -0.4811134338378906, -0.46881866455078125, -0.4565238952636719, -0.4442291259765625, -0.4319343566894531, -0.41963958740234375, -0.4073448181152344, -0.395050048828125, -0.3827552795410156, -0.37046051025390625, -0.3581657409667969, -0.3458709716796875, -0.3335762023925781, -0.32128143310546875, -0.3089866638183594, -0.29669189453125, -0.2843971252441406, -0.27210235595703125, -0.2598075866699219, -0.2475128173828125, -0.23521804809570312, -0.22292327880859375, -0.21062850952148438, -0.198333740234375, -0.18603897094726562, -0.17374420166015625, -0.16144943237304688, -0.1491546630859375, -0.13685989379882812, -0.12456512451171875, -0.11227035522460938, -0.0999755859375, -0.08768081665039062, -0.07538604736328125, -0.06309127807617188, -0.0507965087890625, -0.038501739501953125, -0.02620697021484375, -0.013912200927734375, -0.001617431640625, 0.010677337646484375, 0.02297210693359375, 0.035266876220703125, 0.0475616455078125, 0.059856414794921875, 0.07215118408203125, 0.08444595336914062, 0.09674072265625, 0.10903549194335938, 0.12133026123046875, 0.13362503051757812, 0.1459197998046875, 0.15821456909179688, 0.17050933837890625, 0.18280410766601562, 0.195098876953125, 0.20739364624023438, 0.21968841552734375, 0.23198318481445312, 0.2442779541015625, 0.2565727233886719, 0.26886749267578125, 0.2811622619628906, 0.29345703125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 0.0, 8.0, 6.0, 8.0, 16.0, 13.0, 11.0, 25.0, 28.0, 39.0, 48.0, 67.0, 89.0, 145.0, 174.0, 291.0, 408.0, 603.0, 1049.0, 1817.0, 3080.0, 5678.0, 10867.0, 22659.0, 50517.0, 125428.0, 309762.0, 299386.0, 121223.0, 48788.0, 22175.0, 10604.0, 5738.0, 3053.0, 1726.0, 1043.0, 628.0, 388.0, 258.0, 205.0, 124.0, 80.0, 84.0, 67.0, 45.0, 29.0, 17.0, 22.0, 10.0, 5.0, 8.0, 6.0, 7.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0], "bins": [-1.015625, -0.9828338623046875, -0.950042724609375, -0.9172515869140625, -0.88446044921875, -0.8516693115234375, -0.818878173828125, -0.7860870361328125, -0.7532958984375, -0.7205047607421875, -0.687713623046875, -0.6549224853515625, -0.62213134765625, -0.5893402099609375, -0.556549072265625, -0.5237579345703125, -0.490966796875, -0.4581756591796875, -0.425384521484375, -0.3925933837890625, -0.35980224609375, -0.3270111083984375, -0.294219970703125, -0.2614288330078125, -0.2286376953125, -0.1958465576171875, -0.163055419921875, -0.1302642822265625, -0.09747314453125, -0.0646820068359375, -0.031890869140625, 0.0009002685546875, 0.03369140625, 0.0664825439453125, 0.099273681640625, 0.1320648193359375, 0.16485595703125, 0.1976470947265625, 0.230438232421875, 0.2632293701171875, 0.2960205078125, 0.3288116455078125, 0.361602783203125, 0.3943939208984375, 0.42718505859375, 0.4599761962890625, 0.492767333984375, 0.5255584716796875, 0.558349609375, 0.5911407470703125, 0.623931884765625, 0.6567230224609375, 0.68951416015625, 0.7223052978515625, 0.755096435546875, 0.7878875732421875, 0.8206787109375, 0.8534698486328125, 0.886260986328125, 0.9190521240234375, 0.95184326171875, 0.9846343994140625, 1.017425537109375, 1.0502166748046875, 1.0830078125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 3.0, 5.0, 9.0, 5.0, 6.0, 11.0, 8.0, 13.0, 11.0, 9.0, 18.0, 22.0, 23.0, 26.0, 30.0, 24.0, 29.0, 28.0, 34.0, 47.0, 40.0, 50.0, 46.0, 46.0, 35.0, 46.0, 36.0, 39.0, 41.0, 31.0, 35.0, 23.0, 20.0, 30.0, 25.0, 16.0, 9.0, 11.0, 18.0, 7.0, 7.0, 6.0, 6.0, 11.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.947265625, -0.9164886474609375, -0.885711669921875, -0.8549346923828125, -0.82415771484375, -0.7933807373046875, -0.762603759765625, -0.7318267822265625, -0.7010498046875, -0.6702728271484375, -0.639495849609375, -0.6087188720703125, -0.57794189453125, -0.5471649169921875, -0.516387939453125, -0.4856109619140625, -0.454833984375, -0.4240570068359375, -0.393280029296875, -0.3625030517578125, -0.33172607421875, -0.3009490966796875, -0.270172119140625, -0.2393951416015625, -0.2086181640625, -0.1778411865234375, -0.147064208984375, -0.1162872314453125, -0.08551025390625, -0.0547332763671875, -0.023956298828125, 0.0068206787109375, 0.03759765625, 0.0683746337890625, 0.099151611328125, 0.1299285888671875, 0.16070556640625, 0.1914825439453125, 0.222259521484375, 0.2530364990234375, 0.2838134765625, 0.3145904541015625, 0.345367431640625, 0.3761444091796875, 0.40692138671875, 0.4376983642578125, 0.468475341796875, 0.4992523193359375, 0.530029296875, 0.5608062744140625, 0.591583251953125, 0.6223602294921875, 0.65313720703125, 0.6839141845703125, 0.714691162109375, 0.7454681396484375, 0.7762451171875, 0.8070220947265625, 0.837799072265625, 0.8685760498046875, 0.89935302734375, 0.9301300048828125, 0.960906982421875, 0.9916839599609375, 1.0224609375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 2.0, 6.0, 4.0, 9.0, 10.0, 23.0, 21.0, 25.0, 62.0, 138.0, 231.0, 562.0, 1595.0, 6556.0, 65489.0, 691168.0, 261055.0, 17164.0, 2826.0, 844.0, 368.0, 160.0, 103.0, 42.0, 33.0, 27.0, 10.0, 10.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4814453125, -1.4260406494140625, -1.370635986328125, -1.3152313232421875, -1.25982666015625, -1.2044219970703125, -1.149017333984375, -1.0936126708984375, -1.0382080078125, -0.9828033447265625, -0.927398681640625, -0.8719940185546875, -0.81658935546875, -0.7611846923828125, -0.705780029296875, -0.6503753662109375, -0.594970703125, -0.5395660400390625, -0.484161376953125, -0.4287567138671875, -0.37335205078125, -0.3179473876953125, -0.262542724609375, -0.2071380615234375, -0.1517333984375, -0.0963287353515625, -0.040924072265625, 0.0144805908203125, 0.06988525390625, 0.1252899169921875, 0.180694580078125, 0.2360992431640625, 0.29150390625, 0.3469085693359375, 0.402313232421875, 0.4577178955078125, 0.51312255859375, 0.5685272216796875, 0.623931884765625, 0.6793365478515625, 0.7347412109375, 0.7901458740234375, 0.845550537109375, 0.9009552001953125, 0.95635986328125, 1.0117645263671875, 1.067169189453125, 1.1225738525390625, 1.177978515625, 1.2333831787109375, 1.288787841796875, 1.3441925048828125, 1.39959716796875, 1.4550018310546875, 1.510406494140625, 1.5658111572265625, 1.6212158203125, 1.6766204833984375, 1.732025146484375, 1.7874298095703125, 1.84283447265625, 1.8982391357421875, 1.953643798828125, 2.0090484619140625, 2.064453125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 6.0, 4.0, 7.0, 6.0, 18.0, 17.0, 27.0, 22.0, 31.0, 42.0, 52.0, 70.0, 68.0, 66.0, 84.0, 74.0, 86.0, 61.0, 65.0, 47.0, 32.0, 25.0, 28.0, 12.0, 7.0, 10.0, 11.0, 8.0, 3.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012993812561035156, -0.00012583285570144653, -0.0001217275857925415, -0.00011762231588363647, -0.00011351704597473145, -0.00010941177606582642, -0.00010530650615692139, -0.00010120123624801636, -9.709596633911133e-05, -9.29906964302063e-05, -8.888542652130127e-05, -8.478015661239624e-05, -8.067488670349121e-05, -7.656961679458618e-05, -7.246434688568115e-05, -6.835907697677612e-05, -6.42538070678711e-05, -6.0148537158966064e-05, -5.6043267250061035e-05, -5.1937997341156006e-05, -4.7832727432250977e-05, -4.372745752334595e-05, -3.962218761444092e-05, -3.551691770553589e-05, -3.141164779663086e-05, -2.730637788772583e-05, -2.32011079788208e-05, -1.909583806991577e-05, -1.4990568161010742e-05, -1.0885298252105713e-05, -6.780028343200684e-06, -2.6747584342956543e-06, 1.430511474609375e-06, 5.535781383514404e-06, 9.641051292419434e-06, 1.3746321201324463e-05, 1.7851591110229492e-05, 2.195686101913452e-05, 2.606213092803955e-05, 3.016740083694458e-05, 3.427267074584961e-05, 3.837794065475464e-05, 4.248321056365967e-05, 4.65884804725647e-05, 5.0693750381469727e-05, 5.4799020290374756e-05, 5.8904290199279785e-05, 6.300956010818481e-05, 6.711483001708984e-05, 7.122009992599487e-05, 7.53253698348999e-05, 7.943063974380493e-05, 8.353590965270996e-05, 8.764117956161499e-05, 9.174644947052002e-05, 9.585171937942505e-05, 9.995698928833008e-05, 0.00010406225919723511, 0.00010816752910614014, 0.00011227279901504517, 0.0001163780689239502, 0.00012048333883285522, 0.00012458860874176025, 0.00012869387865066528, 0.0001327991485595703]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 6.0, 3.0, 4.0, 4.0, 8.0, 13.0, 12.0, 19.0, 23.0, 36.0, 55.0, 86.0, 125.0, 220.0, 366.0, 707.0, 1742.0, 4896.0, 19900.0, 118131.0, 543254.0, 298186.0, 45907.0, 9506.0, 2870.0, 1136.0, 495.0, 312.0, 159.0, 116.0, 65.0, 38.0, 39.0, 41.0, 14.0, 14.0, 23.0, 8.0, 5.0, 4.0, 6.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.3095703125, -1.2729339599609375, -1.236297607421875, -1.1996612548828125, -1.16302490234375, -1.1263885498046875, -1.089752197265625, -1.0531158447265625, -1.0164794921875, -0.9798431396484375, -0.943206787109375, -0.9065704345703125, -0.86993408203125, -0.8332977294921875, -0.796661376953125, -0.7600250244140625, -0.723388671875, -0.6867523193359375, -0.650115966796875, -0.6134796142578125, -0.57684326171875, -0.5402069091796875, -0.503570556640625, -0.4669342041015625, -0.4302978515625, -0.3936614990234375, -0.357025146484375, -0.3203887939453125, -0.28375244140625, -0.2471160888671875, -0.210479736328125, -0.1738433837890625, -0.13720703125, -0.1005706787109375, -0.063934326171875, -0.0272979736328125, 0.00933837890625, 0.0459747314453125, 0.082611083984375, 0.1192474365234375, 0.1558837890625, 0.1925201416015625, 0.229156494140625, 0.2657928466796875, 0.30242919921875, 0.3390655517578125, 0.375701904296875, 0.4123382568359375, 0.448974609375, 0.4856109619140625, 0.522247314453125, 0.5588836669921875, 0.59552001953125, 0.6321563720703125, 0.668792724609375, 0.7054290771484375, 0.7420654296875, 0.7787017822265625, 0.815338134765625, 0.8519744873046875, 0.88861083984375, 0.9252471923828125, 0.961883544921875, 0.9985198974609375, 1.03515625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 5.0, 10.0, 6.0, 15.0, 22.0, 31.0, 41.0, 61.0, 86.0, 100.0, 117.0, 134.0, 96.0, 88.0, 70.0, 35.0, 32.0, 17.0, 14.0, 9.0, 7.0, 3.0, 4.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5458984375, -0.519683837890625, -0.49346923828125, -0.467254638671875, -0.4410400390625, -0.414825439453125, -0.38861083984375, -0.362396240234375, -0.336181640625, -0.309967041015625, -0.28375244140625, -0.257537841796875, -0.2313232421875, -0.205108642578125, -0.17889404296875, -0.152679443359375, -0.12646484375, -0.100250244140625, -0.07403564453125, -0.047821044921875, -0.0216064453125, 0.004608154296875, 0.03082275390625, 0.057037353515625, 0.083251953125, 0.109466552734375, 0.13568115234375, 0.161895751953125, 0.1881103515625, 0.214324951171875, 0.24053955078125, 0.266754150390625, 0.29296875, 0.319183349609375, 0.34539794921875, 0.371612548828125, 0.3978271484375, 0.424041748046875, 0.45025634765625, 0.476470947265625, 0.502685546875, 0.528900146484375, 0.55511474609375, 0.581329345703125, 0.6075439453125, 0.633758544921875, 0.65997314453125, 0.686187744140625, 0.71240234375, 0.738616943359375, 0.76483154296875, 0.791046142578125, 0.8172607421875, 0.843475341796875, 0.86968994140625, 0.895904541015625, 0.922119140625, 0.948333740234375, 0.97454833984375, 1.000762939453125, 1.0269775390625, 1.053192138671875, 1.07940673828125, 1.105621337890625, 1.1318359375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 8.0, 13.0, 27.0, 75.0, 190.0, 323.0, 233.0, 86.0, 28.0, 12.0, 9.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.391127586364746, -13.728572845458984, -13.066018104553223, -12.403463363647461, -11.7409086227417, -11.078353881835938, -10.415800094604492, -9.753244400024414, -9.090690612792969, -8.428135871887207, -7.765581130981445, -7.103026390075684, -6.440471649169922, -5.77791690826416, -5.115362644195557, -4.452807903289795, -3.790252685546875, -3.1276979446411133, -2.4651432037353516, -1.802588701248169, -1.1400339603424072, -0.4774792194366455, 0.1850752830505371, 0.8476300239562988, 1.5101847648620605, 2.1727395057678223, 2.835294246673584, 3.4978487491607666, 4.160403251647949, 4.822957992553711, 5.485512733459473, 6.148067474365234, 6.81062126159668, 7.473176002502441, 8.135730743408203, 8.798285484313965, 9.460840225219727, 10.123394966125488, 10.78594970703125, 11.448503494262695, 12.111059188842773, 12.773613929748535, 13.436168670654297, 14.098723411560059, 14.76127815246582, 15.423832893371582, 16.086387634277344, 16.74894142150879, 17.411495208740234, 18.07404899597168, 18.736604690551758, 19.399158477783203, 20.06171417236328, 20.724267959594727, 21.386823654174805, 22.04937744140625, 22.711933135986328, 23.374486923217773, 24.03704261779785, 24.699596405029297, 25.362152099609375, 26.02470588684082, 26.6872615814209, 27.349815368652344, 28.012371063232422]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 6.0, 3.0, 7.0, 9.0, 6.0, 15.0, 14.0, 23.0, 25.0, 27.0, 41.0, 50.0, 49.0, 53.0, 69.0, 62.0, 69.0, 63.0, 53.0, 52.0, 59.0, 40.0, 41.0, 40.0, 24.0, 32.0, 23.0, 15.0, 10.0, 10.0, 9.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.59659194946289, -10.22994613647461, -9.863299369812012, -9.496652603149414, -9.130006790161133, -8.763360977172852, -8.396714210510254, -8.030067443847656, -7.663421630859375, -7.2967753410339355, -6.930129051208496, -6.563482761383057, -6.196836471557617, -5.830190181732178, -5.463543891906738, -5.096897602081299, -4.730251312255859, -4.36360502243042, -3.9969587326049805, -3.630312442779541, -3.2636661529541016, -2.897019863128662, -2.5303735733032227, -2.163727283477783, -1.7970809936523438, -1.4304347038269043, -1.0637884140014648, -0.6971421241760254, -0.33049583435058594, 0.036150455474853516, 0.40279674530029297, 0.7694430351257324, 1.1360893249511719, 1.5027356147766113, 1.8693819046020508, 2.2360281944274902, 2.6026744842529297, 2.969320774078369, 3.3359670639038086, 3.702613353729248, 4.0692596435546875, 4.435905933380127, 4.802552223205566, 5.169198513031006, 5.535844802856445, 5.902491092681885, 6.269137382507324, 6.635783672332764, 7.002429962158203, 7.369076251983643, 7.735722541809082, 8.10236930847168, 8.469015121459961, 8.835660934448242, 9.20230770111084, 9.568954467773438, 9.935600280761719, 10.30224609375, 10.668892860412598, 11.035539627075195, 11.402185440063477, 11.768831253051758, 12.135478019714355, 12.502124786376953, 12.868770599365234]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 4.0, 6.0, 9.0, 19.0, 33.0, 75.0, 181.0, 506.0, 3009.0, 3817357.0, 370493.0, 1997.0, 352.0, 117.0, 70.0, 25.0, 11.0, 6.0, 5.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.3125, -25.600341796875, -24.88818359375, -24.176025390625, -23.4638671875, -22.751708984375, -22.03955078125, -21.327392578125, -20.615234375, -19.903076171875, -19.19091796875, -18.478759765625, -17.7666015625, -17.054443359375, -16.34228515625, -15.630126953125, -14.91796875, -14.205810546875, -13.49365234375, -12.781494140625, -12.0693359375, -11.357177734375, -10.64501953125, -9.932861328125, -9.220703125, -8.508544921875, -7.79638671875, -7.084228515625, -6.3720703125, -5.659912109375, -4.94775390625, -4.235595703125, -3.5234375, -2.811279296875, -2.09912109375, -1.386962890625, -0.6748046875, 0.037353515625, 0.74951171875, 1.461669921875, 2.173828125, 2.885986328125, 3.59814453125, 4.310302734375, 5.0224609375, 5.734619140625, 6.44677734375, 7.158935546875, 7.87109375, 8.583251953125, 9.29541015625, 10.007568359375, 10.7197265625, 11.431884765625, 12.14404296875, 12.856201171875, 13.568359375, 14.280517578125, 14.99267578125, 15.704833984375, 16.4169921875, 17.129150390625, 17.84130859375, 18.553466796875, 19.265625]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 16.0, 16.0, 44.0, 63.0, 96.0, 147.0, 141.0, 141.0, 114.0, 82.0, 47.0, 40.0, 16.0, 9.0, 2.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6357421875, -0.6184234619140625, -0.601104736328125, -0.5837860107421875, -0.56646728515625, -0.5491485595703125, -0.531829833984375, -0.5145111083984375, -0.4971923828125, -0.4798736572265625, -0.462554931640625, -0.4452362060546875, -0.42791748046875, -0.4105987548828125, -0.393280029296875, -0.3759613037109375, -0.358642578125, -0.3413238525390625, -0.324005126953125, -0.3066864013671875, -0.28936767578125, -0.2720489501953125, -0.254730224609375, -0.2374114990234375, -0.2200927734375, -0.2027740478515625, -0.185455322265625, -0.1681365966796875, -0.15081787109375, -0.1334991455078125, -0.116180419921875, -0.0988616943359375, -0.08154296875, -0.0642242431640625, -0.046905517578125, -0.0295867919921875, -0.01226806640625, 0.0050506591796875, 0.022369384765625, 0.0396881103515625, 0.0570068359375, 0.0743255615234375, 0.091644287109375, 0.1089630126953125, 0.12628173828125, 0.1436004638671875, 0.160919189453125, 0.1782379150390625, 0.195556640625, 0.2128753662109375, 0.230194091796875, 0.2475128173828125, 0.26483154296875, 0.2821502685546875, 0.299468994140625, 0.3167877197265625, 0.3341064453125, 0.3514251708984375, 0.368743896484375, 0.3860626220703125, 0.40338134765625, 0.4207000732421875, 0.438018798828125, 0.4553375244140625, 0.47265625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 9.0, 5.0, 4.0, 15.0, 14.0, 25.0, 29.0, 55.0, 117.0, 192.0, 368.0, 805.0, 2056.0, 7070.0, 49591.0, 3427200.0, 674325.0, 25126.0, 4557.0, 1446.0, 607.0, 268.0, 169.0, 86.0, 58.0, 28.0, 26.0, 16.0, 8.0, 5.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.765625, -4.62890625, -4.4921875, -4.35546875, -4.21875, -4.08203125, -3.9453125, -3.80859375, -3.671875, -3.53515625, -3.3984375, -3.26171875, -3.125, -2.98828125, -2.8515625, -2.71484375, -2.578125, -2.44140625, -2.3046875, -2.16796875, -2.03125, -1.89453125, -1.7578125, -1.62109375, -1.484375, -1.34765625, -1.2109375, -1.07421875, -0.9375, -0.80078125, -0.6640625, -0.52734375, -0.390625, -0.25390625, -0.1171875, 0.01953125, 0.15625, 0.29296875, 0.4296875, 0.56640625, 0.703125, 0.83984375, 0.9765625, 1.11328125, 1.25, 1.38671875, 1.5234375, 1.66015625, 1.796875, 1.93359375, 2.0703125, 2.20703125, 2.34375, 2.48046875, 2.6171875, 2.75390625, 2.890625, 3.02734375, 3.1640625, 3.30078125, 3.4375, 3.57421875, 3.7109375, 3.84765625, 3.984375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 5.0, 6.0, 4.0, 6.0, 4.0, 5.0, 15.0, 18.0, 29.0, 42.0, 68.0, 76.0, 149.0, 301.0, 816.0, 1530.0, 442.0, 196.0, 113.0, 72.0, 50.0, 33.0, 22.0, 13.0, 17.0, 13.0, 4.0, 6.0, 3.0, 3.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.497802734375, -0.4801521301269531, -0.46250152587890625, -0.4448509216308594, -0.4272003173828125, -0.4095497131347656, -0.39189910888671875, -0.3742485046386719, -0.356597900390625, -0.3389472961425781, -0.32129669189453125, -0.3036460876464844, -0.2859954833984375, -0.2683448791503906, -0.25069427490234375, -0.23304367065429688, -0.21539306640625, -0.19774246215820312, -0.18009185791015625, -0.16244125366210938, -0.1447906494140625, -0.12714004516601562, -0.10948944091796875, -0.09183883666992188, -0.074188232421875, -0.056537628173828125, -0.03888702392578125, -0.021236419677734375, -0.0035858154296875, 0.014064788818359375, 0.03171539306640625, 0.049365997314453125, 0.0670166015625, 0.08466720581054688, 0.10231781005859375, 0.11996841430664062, 0.1376190185546875, 0.15526962280273438, 0.17292022705078125, 0.19057083129882812, 0.208221435546875, 0.22587203979492188, 0.24352264404296875, 0.2611732482910156, 0.2788238525390625, 0.2964744567871094, 0.31412506103515625, 0.3317756652832031, 0.34942626953125, 0.3670768737792969, 0.38472747802734375, 0.4023780822753906, 0.4200286865234375, 0.4376792907714844, 0.45532989501953125, 0.4729804992675781, 0.490631103515625, 0.5082817077636719, 0.5259323120117188, 0.5435829162597656, 0.5612335205078125, 0.5788841247558594, 0.5965347290039062, 0.6141853332519531, 0.6318359375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 9.0, 6.0, 21.0, 39.0, 101.0, 136.0, 181.0, 175.0, 141.0, 88.0, 49.0, 25.0, 14.0, 5.0, 3.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.852826118469238, -4.728435516357422, -4.6040449142456055, -4.479654312133789, -4.355263710021973, -4.2308735847473145, -4.106482982635498, -3.9820923805236816, -3.8577017784118652, -3.733311176300049, -3.6089205741882324, -3.484530210494995, -3.3601396083831787, -3.2357490062713623, -3.111358642578125, -2.9869680404663086, -2.862577438354492, -2.738186836242676, -2.6137962341308594, -2.489405870437622, -2.3650152683258057, -2.2406246662139893, -2.116234302520752, -1.9918437004089355, -1.8674530982971191, -1.7430624961853027, -1.6186720132827759, -1.494281530380249, -1.3698909282684326, -1.2455003261566162, -1.1211098432540894, -0.9967193007469177, -0.8723289966583252, -0.7479384541511536, -0.6235479116439819, -0.4991573691368103, -0.37476682662963867, -0.25037628412246704, -0.1259857416152954, -0.0015951991081237793, 0.12279534339904785, 0.24718588590621948, 0.3715764284133911, 0.49596697092056274, 0.6203575134277344, 0.744748055934906, 0.8691385984420776, 0.9935291409492493, 1.117919683456421, 1.2423102855682373, 1.3667007684707642, 1.491091251373291, 1.6154818534851074, 1.7398724555969238, 1.8642629384994507, 1.9886534214019775, 2.113044023513794, 2.2374346256256104, 2.3618249893188477, 2.486215591430664, 2.6106061935424805, 2.734996795654297, 2.8593873977661133, 2.9837777614593506, 3.108168363571167]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 6.0, 11.0, 11.0, 27.0, 19.0, 42.0, 48.0, 53.0, 57.0, 72.0, 71.0, 74.0, 92.0, 68.0, 64.0, 76.0, 63.0, 38.0, 32.0, 23.0, 12.0, 13.0, 14.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.997781276702881, -2.899254322052002, -2.800727367401123, -2.702200412750244, -2.603673219680786, -2.5051462650299072, -2.4066193103790283, -2.3080923557281494, -2.2095651626586914, -2.1110382080078125, -2.0125112533569336, -1.9139841794967651, -1.8154571056365967, -1.7169301509857178, -1.6184031963348389, -1.51987624168396, -1.421349287033081, -1.3228223323822021, -1.2242952585220337, -1.1257683038711548, -1.0272412300109863, -0.9287142753601074, -0.8301873207092285, -0.7316603064537048, -0.6331332921981812, -0.5346062779426575, -0.4360792934894562, -0.3375523090362549, -0.2390252947807312, -0.14049828052520752, -0.04197132587432861, 0.05655568838119507, 0.15508294105529785, 0.25360995531082153, 0.3521369397640228, 0.4506639242172241, 0.5491909384727478, 0.6477179527282715, 0.7462449073791504, 0.8447719216346741, 0.9432989358901978, 1.0418258905410767, 1.1403529644012451, 1.238879919052124, 1.337406873703003, 1.4359339475631714, 1.5344609022140503, 1.6329879760742188, 1.7315149307250977, 1.8300418853759766, 1.928568959236145, 2.0270957946777344, 2.1256229877471924, 2.2241499423980713, 2.32267689704895, 2.421203851699829, 2.519731044769287, 2.618257999420166, 2.716784954071045, 2.815311908721924, 2.913839101791382, 3.0123660564422607, 3.1108930110931396, 3.2094199657440186, 3.3079469203948975]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 4.0, 7.0, 14.0, 10.0, 21.0, 30.0, 36.0, 45.0, 60.0, 124.0, 206.0, 311.0, 537.0, 1024.0, 1908.0, 4868.0, 19311.0, 199123.0, 710148.0, 91483.0, 12036.0, 3611.0, 1577.0, 826.0, 478.0, 266.0, 162.0, 109.0, 57.0, 58.0, 29.0, 17.0, 16.0, 12.0, 8.0, 7.0, 6.0, 1.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.791015625, -2.699066162109375, -2.60711669921875, -2.515167236328125, -2.4232177734375, -2.331268310546875, -2.23931884765625, -2.147369384765625, -2.055419921875, -1.963470458984375, -1.87152099609375, -1.779571533203125, -1.6876220703125, -1.595672607421875, -1.50372314453125, -1.411773681640625, -1.31982421875, -1.227874755859375, -1.13592529296875, -1.043975830078125, -0.9520263671875, -0.860076904296875, -0.76812744140625, -0.676177978515625, -0.584228515625, -0.492279052734375, -0.40032958984375, -0.308380126953125, -0.2164306640625, -0.124481201171875, -0.03253173828125, 0.059417724609375, 0.1513671875, 0.243316650390625, 0.33526611328125, 0.427215576171875, 0.5191650390625, 0.611114501953125, 0.70306396484375, 0.795013427734375, 0.886962890625, 0.978912353515625, 1.07086181640625, 1.162811279296875, 1.2547607421875, 1.346710205078125, 1.43865966796875, 1.530609130859375, 1.62255859375, 1.714508056640625, 1.80645751953125, 1.898406982421875, 1.9903564453125, 2.082305908203125, 2.17425537109375, 2.266204833984375, 2.358154296875, 2.450103759765625, 2.54205322265625, 2.634002685546875, 2.7259521484375, 2.817901611328125, 2.90985107421875, 3.001800537109375, 3.09375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 5.0, 14.0, 24.0, 57.0, 91.0, 123.0, 166.0, 168.0, 134.0, 99.0, 50.0, 23.0, 20.0, 8.0, 5.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51220703125, -0.49456787109375, -0.4769287109375, -0.45928955078125, -0.441650390625, -0.42401123046875, -0.4063720703125, -0.38873291015625, -0.37109375, -0.35345458984375, -0.3358154296875, -0.31817626953125, -0.300537109375, -0.28289794921875, -0.2652587890625, -0.24761962890625, -0.22998046875, -0.21234130859375, -0.1947021484375, -0.17706298828125, -0.159423828125, -0.14178466796875, -0.1241455078125, -0.10650634765625, -0.0888671875, -0.07122802734375, -0.0535888671875, -0.03594970703125, -0.018310546875, -0.00067138671875, 0.0169677734375, 0.03460693359375, 0.05224609375, 0.06988525390625, 0.0875244140625, 0.10516357421875, 0.122802734375, 0.14044189453125, 0.1580810546875, 0.17572021484375, 0.193359375, 0.21099853515625, 0.2286376953125, 0.24627685546875, 0.263916015625, 0.28155517578125, 0.2991943359375, 0.31683349609375, 0.33447265625, 0.35211181640625, 0.3697509765625, 0.38739013671875, 0.405029296875, 0.42266845703125, 0.4403076171875, 0.45794677734375, 0.4755859375, 0.49322509765625, 0.5108642578125, 0.52850341796875, 0.546142578125, 0.56378173828125, 0.5814208984375, 0.59906005859375, 0.61669921875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 3.0, 12.0, 16.0, 16.0, 26.0, 26.0, 64.0, 102.0, 149.0, 209.0, 370.0, 587.0, 1231.0, 2554.0, 6381.0, 21002.0, 103018.0, 556303.0, 290447.0, 46836.0, 11453.0, 3994.0, 1704.0, 841.0, 487.0, 277.0, 149.0, 98.0, 56.0, 40.0, 27.0, 26.0, 12.0, 11.0, 6.0, 3.0, 6.0, 4.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.10546875, -2.043121337890625, -1.98077392578125, -1.918426513671875, -1.8560791015625, -1.793731689453125, -1.73138427734375, -1.669036865234375, -1.606689453125, -1.544342041015625, -1.48199462890625, -1.419647216796875, -1.3572998046875, -1.294952392578125, -1.23260498046875, -1.170257568359375, -1.10791015625, -1.045562744140625, -0.98321533203125, -0.920867919921875, -0.8585205078125, -0.796173095703125, -0.73382568359375, -0.671478271484375, -0.609130859375, -0.546783447265625, -0.48443603515625, -0.422088623046875, -0.3597412109375, -0.297393798828125, -0.23504638671875, -0.172698974609375, -0.1103515625, -0.048004150390625, 0.01434326171875, 0.076690673828125, 0.1390380859375, 0.201385498046875, 0.26373291015625, 0.326080322265625, 0.388427734375, 0.450775146484375, 0.51312255859375, 0.575469970703125, 0.6378173828125, 0.700164794921875, 0.76251220703125, 0.824859619140625, 0.88720703125, 0.949554443359375, 1.01190185546875, 1.074249267578125, 1.1365966796875, 1.198944091796875, 1.26129150390625, 1.323638916015625, 1.385986328125, 1.448333740234375, 1.51068115234375, 1.573028564453125, 1.6353759765625, 1.697723388671875, 1.76007080078125, 1.822418212890625, 1.884765625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 7.0, 4.0, 10.0, 12.0, 15.0, 30.0, 38.0, 35.0, 61.0, 70.0, 97.0, 100.0, 89.0, 109.0, 81.0, 53.0, 62.0, 35.0, 34.0, 28.0, 16.0, 6.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6875, -2.61358642578125, -2.5396728515625, -2.46575927734375, -2.391845703125, -2.31793212890625, -2.2440185546875, -2.17010498046875, -2.09619140625, -2.02227783203125, -1.9483642578125, -1.87445068359375, -1.800537109375, -1.72662353515625, -1.6527099609375, -1.57879638671875, -1.5048828125, -1.43096923828125, -1.3570556640625, -1.28314208984375, -1.209228515625, -1.13531494140625, -1.0614013671875, -0.98748779296875, -0.91357421875, -0.83966064453125, -0.7657470703125, -0.69183349609375, -0.617919921875, -0.54400634765625, -0.4700927734375, -0.39617919921875, -0.322265625, -0.24835205078125, -0.1744384765625, -0.10052490234375, -0.026611328125, 0.04730224609375, 0.1212158203125, 0.19512939453125, 0.26904296875, 0.34295654296875, 0.4168701171875, 0.49078369140625, 0.564697265625, 0.63861083984375, 0.7125244140625, 0.78643798828125, 0.8603515625, 0.93426513671875, 1.0081787109375, 1.08209228515625, 1.156005859375, 1.22991943359375, 1.3038330078125, 1.37774658203125, 1.45166015625, 1.52557373046875, 1.5994873046875, 1.67340087890625, 1.747314453125, 1.82122802734375, 1.8951416015625, 1.96905517578125, 2.04296875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 8.0, 23.0, 42.0, 89.0, 218.0, 746.0, 19820.0, 1021442.0, 5434.0, 444.0, 138.0, 72.0, 31.0, 17.0, 11.0, 11.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.28125, -4.080810546875, -3.88037109375, -3.679931640625, -3.4794921875, -3.279052734375, -3.07861328125, -2.878173828125, -2.677734375, -2.477294921875, -2.27685546875, -2.076416015625, -1.8759765625, -1.675537109375, -1.47509765625, -1.274658203125, -1.07421875, -0.873779296875, -0.67333984375, -0.472900390625, -0.2724609375, -0.072021484375, 0.12841796875, 0.328857421875, 0.529296875, 0.729736328125, 0.93017578125, 1.130615234375, 1.3310546875, 1.531494140625, 1.73193359375, 1.932373046875, 2.1328125, 2.333251953125, 2.53369140625, 2.734130859375, 2.9345703125, 3.135009765625, 3.33544921875, 3.535888671875, 3.736328125, 3.936767578125, 4.13720703125, 4.337646484375, 4.5380859375, 4.738525390625, 4.93896484375, 5.139404296875, 5.33984375, 5.540283203125, 5.74072265625, 5.941162109375, 6.1416015625, 6.342041015625, 6.54248046875, 6.742919921875, 6.943359375, 7.143798828125, 7.34423828125, 7.544677734375, 7.7451171875, 7.945556640625, 8.14599609375, 8.346435546875, 8.546875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 3.0, 6.0, 4.0, 6.0, 10.0, 13.0, 14.0, 36.0, 52.0, 80.0, 100.0, 133.0, 135.0, 137.0, 86.0, 70.0, 42.0, 23.0, 15.0, 10.0, 7.0, 2.0, 4.0, 3.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0], "bins": [-0.00028777122497558594, -0.0002812780439853668, -0.0002747848629951477, -0.0002682916820049286, -0.00026179850101470947, -0.00025530532002449036, -0.00024881213903427124, -0.00024231895804405212, -0.000235825777053833, -0.0002293325960636139, -0.00022283941507339478, -0.00021634623408317566, -0.00020985305309295654, -0.00020335987210273743, -0.0001968666911125183, -0.0001903735101222992, -0.00018388032913208008, -0.00017738714814186096, -0.00017089396715164185, -0.00016440078616142273, -0.0001579076051712036, -0.0001514144241809845, -0.00014492124319076538, -0.00013842806220054626, -0.00013193488121032715, -0.00012544170022010803, -0.00011894851922988892, -0.0001124553382396698, -0.00010596215724945068, -9.946897625923157e-05, -9.297579526901245e-05, -8.648261427879333e-05, -7.998943328857422e-05, -7.34962522983551e-05, -6.700307130813599e-05, -6.050989031791687e-05, -5.4016709327697754e-05, -4.752352833747864e-05, -4.103034734725952e-05, -3.4537166357040405e-05, -2.804398536682129e-05, -2.1550804376602173e-05, -1.5057623386383057e-05, -8.56444239616394e-06, -2.0712614059448242e-06, 4.421919584274292e-06, 1.0915100574493408e-05, 1.7408281564712524e-05, 2.390146255493164e-05, 3.0394643545150757e-05, 3.688782453536987e-05, 4.338100552558899e-05, 4.9874186515808105e-05, 5.636736750602722e-05, 6.286054849624634e-05, 6.935372948646545e-05, 7.584691047668457e-05, 8.234009146690369e-05, 8.88332724571228e-05, 9.532645344734192e-05, 0.00010181963443756104, 0.00010831281542778015, 0.00011480599641799927, 0.00012129917740821838, 0.0001277923583984375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 3.0, 3.0, 4.0, 10.0, 7.0, 10.0, 20.0, 24.0, 34.0, 54.0, 110.0, 196.0, 448.0, 1142.0, 3401.0, 15122.0, 228185.0, 747568.0, 42781.0, 6463.0, 1752.0, 626.0, 253.0, 121.0, 76.0, 52.0, 27.0, 13.0, 14.0, 7.0, 6.0, 13.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9541015625, -1.89703369140625, -1.8399658203125, -1.78289794921875, -1.725830078125, -1.66876220703125, -1.6116943359375, -1.55462646484375, -1.49755859375, -1.44049072265625, -1.3834228515625, -1.32635498046875, -1.269287109375, -1.21221923828125, -1.1551513671875, -1.09808349609375, -1.041015625, -0.98394775390625, -0.9268798828125, -0.86981201171875, -0.812744140625, -0.75567626953125, -0.6986083984375, -0.64154052734375, -0.58447265625, -0.52740478515625, -0.4703369140625, -0.41326904296875, -0.356201171875, -0.29913330078125, -0.2420654296875, -0.18499755859375, -0.1279296875, -0.07086181640625, -0.0137939453125, 0.04327392578125, 0.100341796875, 0.15740966796875, 0.2144775390625, 0.27154541015625, 0.32861328125, 0.38568115234375, 0.4427490234375, 0.49981689453125, 0.556884765625, 0.61395263671875, 0.6710205078125, 0.72808837890625, 0.78515625, 0.84222412109375, 0.8992919921875, 0.95635986328125, 1.013427734375, 1.07049560546875, 1.1275634765625, 1.18463134765625, 1.24169921875, 1.29876708984375, 1.3558349609375, 1.41290283203125, 1.469970703125, 1.52703857421875, 1.5841064453125, 1.64117431640625, 1.6982421875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 10.0, 2.0, 6.0, 9.0, 10.0, 8.0, 18.0, 37.0, 52.0, 49.0, 87.0, 115.0, 123.0, 121.0, 90.0, 91.0, 56.0, 32.0, 23.0, 10.0, 12.0, 11.0, 6.0, 5.0, 3.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75048828125, -0.7267532348632812, -0.7030181884765625, -0.6792831420898438, -0.655548095703125, -0.6318130493164062, -0.6080780029296875, -0.5843429565429688, -0.56060791015625, -0.5368728637695312, -0.5131378173828125, -0.48940277099609375, -0.465667724609375, -0.44193267822265625, -0.4181976318359375, -0.39446258544921875, -0.3707275390625, -0.34699249267578125, -0.3232574462890625, -0.29952239990234375, -0.275787353515625, -0.25205230712890625, -0.2283172607421875, -0.20458221435546875, -0.18084716796875, -0.15711212158203125, -0.1333770751953125, -0.10964202880859375, -0.085906982421875, -0.06217193603515625, -0.0384368896484375, -0.01470184326171875, 0.009033203125, 0.03276824951171875, 0.0565032958984375, 0.08023834228515625, 0.103973388671875, 0.12770843505859375, 0.1514434814453125, 0.17517852783203125, 0.19891357421875, 0.22264862060546875, 0.2463836669921875, 0.27011871337890625, 0.293853759765625, 0.31758880615234375, 0.3413238525390625, 0.36505889892578125, 0.3887939453125, 0.41252899169921875, 0.4362640380859375, 0.45999908447265625, 0.483734130859375, 0.5074691772460938, 0.5312042236328125, 0.5549392700195312, 0.57867431640625, 0.6024093627929688, 0.6261444091796875, 0.6498794555664062, 0.673614501953125, 0.6973495483398438, 0.7210845947265625, 0.7448196411132812, 0.7685546875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 7.0, 21.0, 37.0, 117.0, 283.0, 314.0, 144.0, 43.0, 29.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.469057083129883, -17.835643768310547, -17.20223045349121, -16.568817138671875, -15.935403823852539, -15.301990509033203, -14.668578147888184, -14.035164833068848, -13.401751518249512, -12.768338203430176, -12.13492488861084, -11.501511573791504, -10.868099212646484, -10.234685897827148, -9.601272583007812, -8.967859268188477, -8.33444595336914, -7.701032638549805, -7.067619323730469, -6.434206485748291, -5.800793170928955, -5.167379856109619, -4.533967018127441, -3.9005537033081055, -3.2671403884887695, -2.6337270736694336, -2.0003139972686768, -1.3669008016586304, -0.733487606048584, -0.10007429122924805, 0.5333387851715088, 1.1667518615722656, 1.8001632690429688, 2.4335765838623047, 3.0669896602630615, 3.7004027366638184, 4.333816051483154, 4.96722936630249, 5.600642204284668, 6.234055519104004, 6.86746883392334, 7.500882148742676, 8.134295463562012, 8.767708778381348, 9.401121139526367, 10.034534454345703, 10.667947769165039, 11.301361083984375, 11.934774398803711, 12.568187713623047, 13.201601028442383, 13.835014343261719, 14.468427658081055, 15.10184097290039, 15.73525333404541, 16.368667602539062, 17.002079010009766, 17.6354923248291, 18.268905639648438, 18.902318954467773, 19.53573226928711, 20.169145584106445, 20.80255889892578, 21.435970306396484, 22.069385528564453]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 4.0, 4.0, 6.0, 8.0, 4.0, 8.0, 12.0, 11.0, 12.0, 25.0, 27.0, 40.0, 29.0, 34.0, 41.0, 51.0, 53.0, 43.0, 57.0, 56.0, 54.0, 58.0, 42.0, 45.0, 49.0, 44.0, 33.0, 20.0, 27.0, 19.0, 16.0, 16.0, 14.0, 13.0, 12.0, 4.0, 4.0, 5.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.135211944580078, -9.859474182128906, -9.583736419677734, -9.307998657226562, -9.03226089477539, -8.756524085998535, -8.480786323547363, -8.205048561096191, -7.9293107986450195, -7.653573036193848, -7.377835273742676, -7.102097988128662, -6.82636022567749, -6.550622463226318, -6.274885177612305, -5.999147415161133, -5.723409652709961, -5.447671890258789, -5.171934127807617, -4.8961968421936035, -4.620459079742432, -4.34472131729126, -4.068984031677246, -3.793246269226074, -3.5175085067749023, -3.2417707443237305, -2.9660332202911377, -2.690295696258545, -2.414557933807373, -2.138820171356201, -1.8630826473236084, -1.587345004081726, -1.3116064071655273, -1.035868763923645, -0.7601311206817627, -0.48439347743988037, -0.20865583419799805, 0.06708180904388428, 0.3428194522857666, 0.6185570955276489, 0.8942947387695312, 1.1700323820114136, 1.445770025253296, 1.7215076684951782, 1.9972453117370605, 2.2729830741882324, 2.548720598220825, 2.824458122253418, 3.10019588470459, 3.3759336471557617, 3.6516711711883545, 3.9274086952209473, 4.203146457672119, 4.478884220123291, 4.754621505737305, 5.030359268188477, 5.306097030639648, 5.58183479309082, 5.857572555541992, 6.133309841156006, 6.409047603607178, 6.68478536605835, 6.960522651672363, 7.236260414123535, 7.511998176574707]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 4.0, 7.0, 9.0, 10.0, 16.0, 14.0, 27.0, 34.0, 50.0, 68.0, 132.0, 166.0, 310.0, 487.0, 967.0, 1965.0, 5055.0, 18695.0, 137610.0, 3833458.0, 166658.0, 20104.0, 4997.0, 1729.0, 773.0, 413.0, 222.0, 124.0, 57.0, 36.0, 26.0, 16.0, 14.0, 6.0, 6.0, 7.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.962890625, -3.854400634765625, -3.74591064453125, -3.637420654296875, -3.5289306640625, -3.420440673828125, -3.31195068359375, -3.203460693359375, -3.094970703125, -2.986480712890625, -2.87799072265625, -2.769500732421875, -2.6610107421875, -2.552520751953125, -2.44403076171875, -2.335540771484375, -2.22705078125, -2.118560791015625, -2.01007080078125, -1.901580810546875, -1.7930908203125, -1.684600830078125, -1.57611083984375, -1.467620849609375, -1.359130859375, -1.250640869140625, -1.14215087890625, -1.033660888671875, -0.9251708984375, -0.816680908203125, -0.70819091796875, -0.599700927734375, -0.4912109375, -0.382720947265625, -0.27423095703125, -0.165740966796875, -0.0572509765625, 0.051239013671875, 0.15972900390625, 0.268218994140625, 0.376708984375, 0.485198974609375, 0.59368896484375, 0.702178955078125, 0.8106689453125, 0.919158935546875, 1.02764892578125, 1.136138916015625, 1.24462890625, 1.353118896484375, 1.46160888671875, 1.570098876953125, 1.6785888671875, 1.787078857421875, 1.89556884765625, 2.004058837890625, 2.112548828125, 2.221038818359375, 2.32952880859375, 2.438018798828125, 2.5465087890625, 2.654998779296875, 2.76348876953125, 2.871978759765625, 2.98046875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 6.0, 6.0, 15.0, 17.0, 28.0, 32.0, 55.0, 72.0, 85.0, 88.0, 89.0, 108.0, 97.0, 89.0, 66.0, 44.0, 28.0, 30.0, 14.0, 15.0, 7.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.484130859375, -0.4709587097167969, -0.45778656005859375, -0.4446144104003906, -0.4314422607421875, -0.4182701110839844, -0.40509796142578125, -0.3919258117675781, -0.378753662109375, -0.3655815124511719, -0.35240936279296875, -0.3392372131347656, -0.3260650634765625, -0.3128929138183594, -0.29972076416015625, -0.2865486145019531, -0.27337646484375, -0.2602043151855469, -0.24703216552734375, -0.23386001586914062, -0.2206878662109375, -0.20751571655273438, -0.19434356689453125, -0.18117141723632812, -0.167999267578125, -0.15482711791992188, -0.14165496826171875, -0.12848281860351562, -0.1153106689453125, -0.10213851928710938, -0.08896636962890625, -0.07579421997070312, -0.0626220703125, -0.049449920654296875, -0.03627777099609375, -0.023105621337890625, -0.0099334716796875, 0.003238677978515625, 0.01641082763671875, 0.029582977294921875, 0.042755126953125, 0.055927276611328125, 0.06909942626953125, 0.08227157592773438, 0.0954437255859375, 0.10861587524414062, 0.12178802490234375, 0.13496017456054688, 0.14813232421875, 0.16130447387695312, 0.17447662353515625, 0.18764877319335938, 0.2008209228515625, 0.21399307250976562, 0.22716522216796875, 0.24033737182617188, 0.253509521484375, 0.2666816711425781, 0.27985382080078125, 0.2930259704589844, 0.3061981201171875, 0.3193702697753906, 0.33254241943359375, 0.3457145690917969, 0.35888671875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 7.0, 6.0, 13.0, 13.0, 18.0, 35.0, 50.0, 110.0, 162.0, 327.0, 605.0, 1446.0, 4736.0, 24648.0, 496852.0, 3589149.0, 63357.0, 8666.0, 2281.0, 860.0, 373.0, 226.0, 127.0, 84.0, 42.0, 34.0, 15.0, 12.0, 6.0, 8.0, 6.0, 3.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.064453125, -2.96624755859375, -2.8680419921875, -2.76983642578125, -2.671630859375, -2.57342529296875, -2.4752197265625, -2.37701416015625, -2.27880859375, -2.18060302734375, -2.0823974609375, -1.98419189453125, -1.885986328125, -1.78778076171875, -1.6895751953125, -1.59136962890625, -1.4931640625, -1.39495849609375, -1.2967529296875, -1.19854736328125, -1.100341796875, -1.00213623046875, -0.9039306640625, -0.80572509765625, -0.70751953125, -0.60931396484375, -0.5111083984375, -0.41290283203125, -0.314697265625, -0.21649169921875, -0.1182861328125, -0.02008056640625, 0.078125, 0.17633056640625, 0.2745361328125, 0.37274169921875, 0.470947265625, 0.56915283203125, 0.6673583984375, 0.76556396484375, 0.86376953125, 0.96197509765625, 1.0601806640625, 1.15838623046875, 1.256591796875, 1.35479736328125, 1.4530029296875, 1.55120849609375, 1.6494140625, 1.74761962890625, 1.8458251953125, 1.94403076171875, 2.042236328125, 2.14044189453125, 2.2386474609375, 2.33685302734375, 2.43505859375, 2.53326416015625, 2.6314697265625, 2.72967529296875, 2.827880859375, 2.92608642578125, 3.0242919921875, 3.12249755859375, 3.220703125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 2.0, 3.0, 8.0, 12.0, 5.0, 12.0, 24.0, 31.0, 38.0, 69.0, 139.0, 276.0, 732.0, 1803.0, 450.0, 206.0, 95.0, 52.0, 34.0, 22.0, 20.0, 9.0, 4.0, 9.0, 8.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64892578125, -0.6299819946289062, -0.6110382080078125, -0.5920944213867188, -0.573150634765625, -0.5542068481445312, -0.5352630615234375, -0.5163192749023438, -0.49737548828125, -0.47843170166015625, -0.4594879150390625, -0.44054412841796875, -0.421600341796875, -0.40265655517578125, -0.3837127685546875, -0.36476898193359375, -0.3458251953125, -0.32688140869140625, -0.3079376220703125, -0.28899383544921875, -0.270050048828125, -0.25110626220703125, -0.2321624755859375, -0.21321868896484375, -0.19427490234375, -0.17533111572265625, -0.1563873291015625, -0.13744354248046875, -0.118499755859375, -0.09955596923828125, -0.0806121826171875, -0.06166839599609375, -0.042724609375, -0.02378082275390625, -0.0048370361328125, 0.01410675048828125, 0.033050537109375, 0.05199432373046875, 0.0709381103515625, 0.08988189697265625, 0.10882568359375, 0.12776947021484375, 0.1467132568359375, 0.16565704345703125, 0.184600830078125, 0.20354461669921875, 0.2224884033203125, 0.24143218994140625, 0.2603759765625, 0.27931976318359375, 0.2982635498046875, 0.31720733642578125, 0.336151123046875, 0.35509490966796875, 0.3740386962890625, 0.39298248291015625, 0.41192626953125, 0.43087005615234375, 0.4498138427734375, 0.46875762939453125, 0.487701416015625, 0.5066452026367188, 0.5255889892578125, 0.5445327758789062, 0.5634765625]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 13.0, 47.0, 134.0, 257.0, 260.0, 178.0, 57.0, 31.0, 8.0, 6.0, 5.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5511512756347656, -2.382310628890991, -2.213470220565796, -2.0446295738220215, -1.8757890462875366, -1.7069485187530518, -1.5381078720092773, -1.3692673444747925, -1.2004268169403076, -1.0315862894058228, -0.8627457022666931, -0.6939051151275635, -0.5250645875930786, -0.35622406005859375, -0.18738341331481934, -0.018542885780334473, 0.1502976417541504, 0.31913819909095764, 0.4879787564277649, 0.6568193435668945, 0.8256598711013794, 0.9945003986358643, 1.1633410453796387, 1.3321815729141235, 1.5010221004486084, 1.6698626279830933, 1.8387031555175781, 2.0075438022613525, 2.176384449005127, 2.3452248573303223, 2.5140655040740967, 2.682906150817871, 2.8517465591430664, 3.020587205886841, 3.189427614212036, 3.3582682609558105, 3.527108669281006, 3.6959493160247803, 3.8647899627685547, 4.03363037109375, 4.202470779418945, 4.371311187744141, 4.540152072906494, 4.7089924812316895, 4.877832889556885, 5.046673774719238, 5.215514183044434, 5.384354591369629, 5.553195476531982, 5.722035884857178, 5.890876770019531, 6.059717178344727, 6.228557586669922, 6.397397994995117, 6.566238880157471, 6.735079288482666, 6.9039201736450195, 7.072760581970215, 7.241601467132568, 7.410441875457764, 7.579282283782959, 7.7481231689453125, 7.916963577270508, 8.085803985595703, 8.254644393920898]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 5.0, 9.0, 5.0, 10.0, 9.0, 17.0, 16.0, 25.0, 18.0, 26.0, 47.0, 47.0, 52.0, 43.0, 57.0, 53.0, 65.0, 64.0, 67.0, 46.0, 55.0, 41.0, 37.0, 28.0, 43.0, 24.0, 25.0, 17.0, 19.0, 8.0, 7.0, 9.0, 4.0, 2.0, 5.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.040316343307495, -1.9751049280166626, -1.9098936319351196, -1.844682216644287, -1.7794709205627441, -1.7142595052719116, -1.649048089981079, -1.5838367938995361, -1.5186253786087036, -1.453413963317871, -1.3882026672363281, -1.3229912519454956, -1.257779836654663, -1.1925685405731201, -1.1273571252822876, -1.062145709991455, -0.9969344139099121, -0.9317230582237244, -0.8665117025375366, -0.8013002872467041, -0.7360889315605164, -0.6708775758743286, -0.6056661605834961, -0.5404548048973083, -0.4752434492111206, -0.41003209352493286, -0.34482070803642273, -0.2796093225479126, -0.21439796686172485, -0.1491866111755371, -0.08397522568702698, -0.018763840198516846, 0.04644775390625, 0.11165912449359894, 0.17687049508094788, 0.24208186566829681, 0.30729323625564575, 0.3725045919418335, 0.43771597743034363, 0.5029273629188538, 0.5681387186050415, 0.6333500742912292, 0.698561429977417, 0.7637728452682495, 0.8289842009544373, 0.894195556640625, 0.9594069719314575, 1.02461838722229, 1.089829683303833, 1.1550410985946655, 1.2202523946762085, 1.285463809967041, 1.350675106048584, 1.4158865213394165, 1.481097936630249, 1.546309232711792, 1.6115206480026245, 1.676732063293457, 1.741943359375, 1.8071547746658325, 1.872366189956665, 1.937577486038208, 2.002788782119751, 2.068000316619873, 2.133211612701416]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 9.0, 5.0, 10.0, 11.0, 21.0, 41.0, 47.0, 61.0, 102.0, 138.0, 198.0, 299.0, 448.0, 685.0, 1143.0, 2098.0, 4350.0, 11168.0, 35411.0, 128959.0, 396040.0, 327161.0, 95874.0, 27140.0, 8865.0, 3680.0, 1752.0, 998.0, 617.0, 396.0, 248.0, 187.0, 124.0, 86.0, 65.0, 35.0, 31.0, 24.0, 14.0, 10.0, 4.0, 1.0, 4.0, 3.0, 3.0, 0.0, 1.0], "bins": [-1.4990234375, -1.4594573974609375, -1.419891357421875, -1.3803253173828125, -1.34075927734375, -1.3011932373046875, -1.261627197265625, -1.2220611572265625, -1.1824951171875, -1.1429290771484375, -1.103363037109375, -1.0637969970703125, -1.02423095703125, -0.9846649169921875, -0.945098876953125, -0.9055328369140625, -0.865966796875, -0.8264007568359375, -0.786834716796875, -0.7472686767578125, -0.70770263671875, -0.6681365966796875, -0.628570556640625, -0.5890045166015625, -0.5494384765625, -0.5098724365234375, -0.470306396484375, -0.4307403564453125, -0.39117431640625, -0.3516082763671875, -0.312042236328125, -0.2724761962890625, -0.23291015625, -0.1933441162109375, -0.153778076171875, -0.1142120361328125, -0.07464599609375, -0.0350799560546875, 0.004486083984375, 0.0440521240234375, 0.0836181640625, 0.1231842041015625, 0.162750244140625, 0.2023162841796875, 0.24188232421875, 0.2814483642578125, 0.321014404296875, 0.3605804443359375, 0.400146484375, 0.4397125244140625, 0.479278564453125, 0.5188446044921875, 0.55841064453125, 0.5979766845703125, 0.637542724609375, 0.6771087646484375, 0.7166748046875, 0.7562408447265625, 0.795806884765625, 0.8353729248046875, 0.87493896484375, 0.9145050048828125, 0.954071044921875, 0.9936370849609375, 1.033203125]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 7.0, 7.0, 12.0, 8.0, 28.0, 45.0, 62.0, 62.0, 79.0, 88.0, 99.0, 123.0, 96.0, 97.0, 58.0, 46.0, 33.0, 14.0, 12.0, 12.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39697265625, -0.3840370178222656, -0.37110137939453125, -0.3581657409667969, -0.3452301025390625, -0.3322944641113281, -0.31935882568359375, -0.3064231872558594, -0.293487548828125, -0.2805519104003906, -0.26761627197265625, -0.2546806335449219, -0.2417449951171875, -0.22880935668945312, -0.21587371826171875, -0.20293807983398438, -0.19000244140625, -0.17706680297851562, -0.16413116455078125, -0.15119552612304688, -0.1382598876953125, -0.12532424926757812, -0.11238861083984375, -0.09945297241210938, -0.086517333984375, -0.07358169555664062, -0.06064605712890625, -0.047710418701171875, -0.0347747802734375, -0.021839141845703125, -0.00890350341796875, 0.004032135009765625, 0.0169677734375, 0.029903411865234375, 0.04283905029296875, 0.055774688720703125, 0.0687103271484375, 0.08164596557617188, 0.09458160400390625, 0.10751724243164062, 0.120452880859375, 0.13338851928710938, 0.14632415771484375, 0.15925979614257812, 0.1721954345703125, 0.18513107299804688, 0.19806671142578125, 0.21100234985351562, 0.22393798828125, 0.23687362670898438, 0.24980926513671875, 0.2627449035644531, 0.2756805419921875, 0.2886161804199219, 0.30155181884765625, 0.3144874572753906, 0.327423095703125, 0.3403587341308594, 0.35329437255859375, 0.3662300109863281, 0.3791656494140625, 0.3921012878417969, 0.40503692626953125, 0.4179725646972656, 0.430908203125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 7.0, 4.0, 7.0, 12.0, 20.0, 34.0, 33.0, 56.0, 54.0, 84.0, 148.0, 198.0, 349.0, 563.0, 1027.0, 1766.0, 3527.0, 7324.0, 16835.0, 45535.0, 142009.0, 372215.0, 298608.0, 99821.0, 33161.0, 12944.0, 5875.0, 2753.0, 1481.0, 817.0, 490.0, 286.0, 163.0, 111.0, 76.0, 52.0, 37.0, 21.0, 21.0, 13.0, 3.0, 9.0, 4.0, 5.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.041015625, -1.0093231201171875, -0.977630615234375, -0.9459381103515625, -0.91424560546875, -0.8825531005859375, -0.850860595703125, -0.8191680908203125, -0.7874755859375, -0.7557830810546875, -0.724090576171875, -0.6923980712890625, -0.66070556640625, -0.6290130615234375, -0.597320556640625, -0.5656280517578125, -0.533935546875, -0.5022430419921875, -0.470550537109375, -0.4388580322265625, -0.40716552734375, -0.3754730224609375, -0.343780517578125, -0.3120880126953125, -0.2803955078125, -0.2487030029296875, -0.217010498046875, -0.1853179931640625, -0.15362548828125, -0.1219329833984375, -0.090240478515625, -0.0585479736328125, -0.02685546875, 0.0048370361328125, 0.036529541015625, 0.0682220458984375, 0.09991455078125, 0.1316070556640625, 0.163299560546875, 0.1949920654296875, 0.2266845703125, 0.2583770751953125, 0.290069580078125, 0.3217620849609375, 0.35345458984375, 0.3851470947265625, 0.416839599609375, 0.4485321044921875, 0.480224609375, 0.5119171142578125, 0.543609619140625, 0.5753021240234375, 0.60699462890625, 0.6386871337890625, 0.670379638671875, 0.7020721435546875, 0.7337646484375, 0.7654571533203125, 0.797149658203125, 0.8288421630859375, 0.86053466796875, 0.8922271728515625, 0.923919677734375, 0.9556121826171875, 0.9873046875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 2.0, 12.0, 6.0, 3.0, 13.0, 14.0, 17.0, 14.0, 26.0, 18.0, 32.0, 18.0, 35.0, 27.0, 43.0, 49.0, 42.0, 45.0, 43.0, 44.0, 50.0, 51.0, 35.0, 55.0, 30.0, 36.0, 25.0, 33.0, 25.0, 22.0, 26.0, 19.0, 12.0, 8.0, 8.0, 10.0, 5.0, 10.0, 3.0, 8.0, 4.0, 1.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.0859375, -1.0537033081054688, -1.0214691162109375, -0.9892349243164062, -0.957000732421875, -0.9247665405273438, -0.8925323486328125, -0.8602981567382812, -0.82806396484375, -0.7958297729492188, -0.7635955810546875, -0.7313613891601562, -0.699127197265625, -0.6668930053710938, -0.6346588134765625, -0.6024246215820312, -0.5701904296875, -0.5379562377929688, -0.5057220458984375, -0.47348785400390625, -0.441253662109375, -0.40901947021484375, -0.3767852783203125, -0.34455108642578125, -0.31231689453125, -0.28008270263671875, -0.2478485107421875, -0.21561431884765625, -0.183380126953125, -0.15114593505859375, -0.1189117431640625, -0.08667755126953125, -0.054443359375, -0.02220916748046875, 0.0100250244140625, 0.04225921630859375, 0.074493408203125, 0.10672760009765625, 0.1389617919921875, 0.17119598388671875, 0.20343017578125, 0.23566436767578125, 0.2678985595703125, 0.30013275146484375, 0.332366943359375, 0.36460113525390625, 0.3968353271484375, 0.42906951904296875, 0.4613037109375, 0.49353790283203125, 0.5257720947265625, 0.5580062866210938, 0.590240478515625, 0.6224746704101562, 0.6547088623046875, 0.6869430541992188, 0.71917724609375, 0.7514114379882812, 0.7836456298828125, 0.8158798217773438, 0.848114013671875, 0.8803482055664062, 0.9125823974609375, 0.9448165893554688, 0.97705078125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 6.0, 6.0, 2.0, 7.0, 6.0, 16.0, 21.0, 25.0, 31.0, 64.0, 129.0, 212.0, 502.0, 1349.0, 4279.0, 19453.0, 191497.0, 713626.0, 99174.0, 12973.0, 3254.0, 1058.0, 394.0, 204.0, 90.0, 60.0, 41.0, 22.0, 18.0, 6.0, 15.0, 3.0, 2.0, 8.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.9384765625, -0.9119491577148438, -0.8854217529296875, -0.8588943481445312, -0.832366943359375, -0.8058395385742188, -0.7793121337890625, -0.7527847290039062, -0.72625732421875, -0.6997299194335938, -0.6732025146484375, -0.6466751098632812, -0.620147705078125, -0.5936203002929688, -0.5670928955078125, -0.5405654907226562, -0.5140380859375, -0.48751068115234375, -0.4609832763671875, -0.43445587158203125, -0.407928466796875, -0.38140106201171875, -0.3548736572265625, -0.32834625244140625, -0.30181884765625, -0.27529144287109375, -0.2487640380859375, -0.22223663330078125, -0.195709228515625, -0.16918182373046875, -0.1426544189453125, -0.11612701416015625, -0.089599609375, -0.06307220458984375, -0.0365447998046875, -0.01001739501953125, 0.016510009765625, 0.04303741455078125, 0.0695648193359375, 0.09609222412109375, 0.12261962890625, 0.14914703369140625, 0.1756744384765625, 0.20220184326171875, 0.228729248046875, 0.25525665283203125, 0.2817840576171875, 0.30831146240234375, 0.3348388671875, 0.36136627197265625, 0.3878936767578125, 0.41442108154296875, 0.440948486328125, 0.46747589111328125, 0.4940032958984375, 0.5205307006835938, 0.54705810546875, 0.5735855102539062, 0.6001129150390625, 0.6266403198242188, 0.653167724609375, 0.6796951293945312, 0.7062225341796875, 0.7327499389648438, 0.75927734375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 7.0, 7.0, 9.0, 14.0, 9.0, 21.0, 19.0, 26.0, 32.0, 49.0, 67.0, 63.0, 72.0, 91.0, 63.0, 81.0, 70.0, 59.0, 44.0, 52.0, 30.0, 25.0, 23.0, 13.0, 13.0, 12.0, 6.0, 7.0, 1.0, 3.0, 3.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.28640365600586e-05, -9.023398160934448e-05, -8.760392665863037e-05, -8.497387170791626e-05, -8.234381675720215e-05, -7.971376180648804e-05, -7.708370685577393e-05, -7.445365190505981e-05, -7.18235969543457e-05, -6.919354200363159e-05, -6.656348705291748e-05, -6.393343210220337e-05, -6.130337715148926e-05, -5.8673322200775146e-05, -5.6043267250061035e-05, -5.3413212299346924e-05, -5.078315734863281e-05, -4.81531023979187e-05, -4.552304744720459e-05, -4.289299249649048e-05, -4.026293754577637e-05, -3.7632882595062256e-05, -3.5002827644348145e-05, -3.237277269363403e-05, -2.9742717742919922e-05, -2.711266279220581e-05, -2.44826078414917e-05, -2.1852552890777588e-05, -1.9222497940063477e-05, -1.6592442989349365e-05, -1.3962388038635254e-05, -1.1332333087921143e-05, -8.702278137207031e-06, -6.07222318649292e-06, -3.4421682357788086e-06, -8.121132850646973e-07, 1.817941665649414e-06, 4.447996616363525e-06, 7.078051567077637e-06, 9.708106517791748e-06, 1.233816146850586e-05, 1.496821641921997e-05, 1.7598271369934082e-05, 2.0228326320648193e-05, 2.2858381271362305e-05, 2.5488436222076416e-05, 2.8118491172790527e-05, 3.074854612350464e-05, 3.337860107421875e-05, 3.600865602493286e-05, 3.863871097564697e-05, 4.1268765926361084e-05, 4.3898820877075195e-05, 4.652887582778931e-05, 4.915893077850342e-05, 5.178898572921753e-05, 5.441904067993164e-05, 5.704909563064575e-05, 5.967915058135986e-05, 6.230920553207397e-05, 6.493926048278809e-05, 6.75693154335022e-05, 7.019937038421631e-05, 7.282942533493042e-05, 7.545948028564453e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 8.0, 9.0, 9.0, 11.0, 34.0, 27.0, 62.0, 92.0, 172.0, 276.0, 575.0, 1433.0, 4419.0, 16536.0, 122334.0, 725472.0, 150519.0, 18755.0, 4823.0, 1606.0, 657.0, 278.0, 154.0, 94.0, 65.0, 42.0, 32.0, 20.0, 14.0, 7.0, 8.0, 2.0, 6.0, 3.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.72998046875, -0.7052688598632812, -0.6805572509765625, -0.6558456420898438, -0.631134033203125, -0.6064224243164062, -0.5817108154296875, -0.5569992065429688, -0.53228759765625, -0.5075759887695312, -0.4828643798828125, -0.45815277099609375, -0.433441162109375, -0.40872955322265625, -0.3840179443359375, -0.35930633544921875, -0.3345947265625, -0.30988311767578125, -0.2851715087890625, -0.26045989990234375, -0.235748291015625, -0.21103668212890625, -0.1863250732421875, -0.16161346435546875, -0.13690185546875, -0.11219024658203125, -0.0874786376953125, -0.06276702880859375, -0.038055419921875, -0.01334381103515625, 0.0113677978515625, 0.03607940673828125, 0.060791015625, 0.08550262451171875, 0.1102142333984375, 0.13492584228515625, 0.159637451171875, 0.18434906005859375, 0.2090606689453125, 0.23377227783203125, 0.25848388671875, 0.28319549560546875, 0.3079071044921875, 0.33261871337890625, 0.357330322265625, 0.38204193115234375, 0.4067535400390625, 0.43146514892578125, 0.4561767578125, 0.48088836669921875, 0.5055999755859375, 0.5303115844726562, 0.555023193359375, 0.5797348022460938, 0.6044464111328125, 0.6291580200195312, 0.65386962890625, 0.6785812377929688, 0.7032928466796875, 0.7280044555664062, 0.752716064453125, 0.7774276733398438, 0.8021392822265625, 0.8268508911132812, 0.8515625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 6.0, 0.0, 2.0, 9.0, 5.0, 7.0, 7.0, 15.0, 16.0, 32.0, 47.0, 51.0, 80.0, 104.0, 108.0, 110.0, 109.0, 73.0, 62.0, 44.0, 21.0, 20.0, 16.0, 13.0, 6.0, 10.0, 5.0, 4.0, 6.0, 1.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.48779296875, -0.4734382629394531, -0.45908355712890625, -0.4447288513183594, -0.4303741455078125, -0.4160194396972656, -0.40166473388671875, -0.3873100280761719, -0.372955322265625, -0.3586006164550781, -0.34424591064453125, -0.3298912048339844, -0.3155364990234375, -0.3011817932128906, -0.28682708740234375, -0.2724723815917969, -0.25811767578125, -0.24376296997070312, -0.22940826416015625, -0.21505355834960938, -0.2006988525390625, -0.18634414672851562, -0.17198944091796875, -0.15763473510742188, -0.143280029296875, -0.12892532348632812, -0.11457061767578125, -0.10021591186523438, -0.0858612060546875, -0.07150650024414062, -0.05715179443359375, -0.042797088623046875, -0.0284423828125, -0.014087677001953125, 0.00026702880859375, 0.014621734619140625, 0.0289764404296875, 0.043331146240234375, 0.05768585205078125, 0.07204055786132812, 0.086395263671875, 0.10074996948242188, 0.11510467529296875, 0.12945938110351562, 0.1438140869140625, 0.15816879272460938, 0.17252349853515625, 0.18687820434570312, 0.20123291015625, 0.21558761596679688, 0.22994232177734375, 0.24429702758789062, 0.2586517333984375, 0.2730064392089844, 0.28736114501953125, 0.3017158508300781, 0.316070556640625, 0.3304252624511719, 0.34477996826171875, 0.3591346740722656, 0.3734893798828125, 0.3878440856933594, 0.40219879150390625, 0.4165534973144531, 0.430908203125]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 8.0, 6.0, 14.0, 42.0, 96.0, 177.0, 249.0, 205.0, 121.0, 43.0, 16.0, 12.0, 3.0, 5.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.439359664916992, -10.046066284179688, -9.652771949768066, -9.259478569030762, -8.86618423461914, -8.472890853881836, -8.079597473144531, -7.68630313873291, -7.293009281158447, -6.899715423583984, -6.5064215660095215, -6.113127708435059, -5.719834327697754, -5.326539993286133, -4.933246612548828, -4.539952754974365, -4.146658897399902, -3.7533650398254395, -3.3600711822509766, -2.9667775630950928, -2.57348370552063, -2.180189847946167, -1.7868962287902832, -1.3936023712158203, -1.0003085136413574, -0.6070147156715393, -0.2137209177017212, 0.17957282066345215, 0.572866678237915, 0.9661605358123779, 1.3594541549682617, 1.7527480125427246, 2.146042823791504, 2.539336681365967, 2.9326305389404297, 3.3259241580963135, 3.7192180156707764, 4.11251163482666, 4.505805492401123, 4.899099349975586, 5.292393207550049, 5.685687065124512, 6.078980922698975, 6.4722747802734375, 6.865568161010742, 7.258862495422363, 7.652155876159668, 8.045450210571289, 8.438743591308594, 8.832036972045898, 9.22533130645752, 9.618624687194824, 10.011919021606445, 10.40521240234375, 10.798505783081055, 11.191800117492676, 11.585094451904297, 11.978387832641602, 12.371682167053223, 12.764975547790527, 13.158269882202148, 13.551563262939453, 13.944856643676758, 14.338150978088379, 14.731444358825684]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 1.0, 3.0, 2.0, 4.0, 5.0, 7.0, 9.0, 8.0, 17.0, 11.0, 16.0, 19.0, 20.0, 17.0, 30.0, 37.0, 34.0, 37.0, 45.0, 42.0, 39.0, 36.0, 47.0, 34.0, 42.0, 28.0, 46.0, 47.0, 35.0, 36.0, 35.0, 22.0, 24.0, 29.0, 19.0, 18.0, 19.0, 13.0, 16.0, 10.0, 8.0, 11.0, 3.0, 7.0, 3.0, 4.0, 1.0, 3.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.281522750854492, -5.109341144561768, -4.937159538269043, -4.76497745513916, -4.5927958488464355, -4.420614242553711, -4.248432636260986, -4.076251029968262, -3.904069423675537, -3.7318878173828125, -3.559705972671509, -3.387524366378784, -3.2153427600860596, -3.043160915374756, -2.8709793090820312, -2.6987977027893066, -2.526615858078003, -2.3544342517852783, -2.1822524070739746, -2.01007080078125, -1.8378891944885254, -1.6657074689865112, -1.493525743484497, -1.3213441371917725, -1.1491624116897583, -0.9769807457923889, -0.8047990798950195, -0.6326173543930054, -0.460435688495636, -0.2882540225982666, -0.11607229709625244, 0.05610930919647217, 0.22829103469848633, 0.4004727005958557, 0.5726543664932251, 0.7448360919952393, 0.9170177578926086, 1.089199423789978, 1.2613811492919922, 1.4335627555847168, 1.605744481086731, 1.7779262065887451, 1.9501078128814697, 2.1222896575927734, 2.294471263885498, 2.4666528701782227, 2.6388344764709473, 2.811016082763672, 2.9831979274749756, 3.1553795337677, 3.327561378479004, 3.4997429847717285, 3.671924591064453, 3.8441061973571777, 4.016287803649902, 4.188469886779785, 4.36065149307251, 4.532833099365234, 4.705014705657959, 4.877196311950684, 5.049378395080566, 5.221560001373291, 5.393741607666016, 5.56592321395874, 5.738104820251465]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 6.0, 8.0, 6.0, 10.0, 15.0, 13.0, 33.0, 29.0, 45.0, 62.0, 105.0, 85.0, 152.0, 282.0, 451.0, 697.0, 1359.0, 2619.0, 6422.0, 18194.0, 78815.0, 1057207.0, 2894476.0, 98457.0, 20806.0, 7187.0, 3093.0, 1451.0, 823.0, 443.0, 277.0, 191.0, 128.0, 94.0, 63.0, 50.0, 33.0, 24.0, 17.0, 17.0, 10.0, 9.0, 5.0, 6.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.328125, -1.2824249267578125, -1.236724853515625, -1.1910247802734375, -1.14532470703125, -1.0996246337890625, -1.053924560546875, -1.0082244873046875, -0.9625244140625, -0.9168243408203125, -0.871124267578125, -0.8254241943359375, -0.77972412109375, -0.7340240478515625, -0.688323974609375, -0.6426239013671875, -0.596923828125, -0.5512237548828125, -0.505523681640625, -0.4598236083984375, -0.41412353515625, -0.3684234619140625, -0.322723388671875, -0.2770233154296875, -0.2313232421875, -0.1856231689453125, -0.139923095703125, -0.0942230224609375, -0.04852294921875, -0.0028228759765625, 0.042877197265625, 0.0885772705078125, 0.13427734375, 0.1799774169921875, 0.225677490234375, 0.2713775634765625, 0.31707763671875, 0.3627777099609375, 0.408477783203125, 0.4541778564453125, 0.4998779296875, 0.5455780029296875, 0.591278076171875, 0.6369781494140625, 0.68267822265625, 0.7283782958984375, 0.774078369140625, 0.8197784423828125, 0.865478515625, 0.9111785888671875, 0.956878662109375, 1.0025787353515625, 1.04827880859375, 1.0939788818359375, 1.139678955078125, 1.1853790283203125, 1.2310791015625, 1.2767791748046875, 1.322479248046875, 1.3681793212890625, 1.41387939453125, 1.4595794677734375, 1.505279541015625, 1.5509796142578125, 1.5966796875]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 6.0, 6.0, 3.0, 5.0, 22.0, 26.0, 28.0, 40.0, 57.0, 61.0, 72.0, 66.0, 96.0, 83.0, 74.0, 76.0, 71.0, 53.0, 39.0, 32.0, 26.0, 17.0, 11.0, 5.0, 9.0, 6.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.337158203125, -0.3263435363769531, -0.31552886962890625, -0.3047142028808594, -0.2938995361328125, -0.2830848693847656, -0.27227020263671875, -0.2614555358886719, -0.250640869140625, -0.23982620239257812, -0.22901153564453125, -0.21819686889648438, -0.2073822021484375, -0.19656753540039062, -0.18575286865234375, -0.17493820190429688, -0.16412353515625, -0.15330886840820312, -0.14249420166015625, -0.13167953491210938, -0.1208648681640625, -0.11005020141601562, -0.09923553466796875, -0.08842086791992188, -0.077606201171875, -0.06679153442382812, -0.05597686767578125, -0.045162200927734375, -0.0343475341796875, -0.023532867431640625, -0.01271820068359375, -0.001903533935546875, 0.0089111328125, 0.019725799560546875, 0.03054046630859375, 0.041355133056640625, 0.0521697998046875, 0.06298446655273438, 0.07379913330078125, 0.08461380004882812, 0.095428466796875, 0.10624313354492188, 0.11705780029296875, 0.12787246704101562, 0.1386871337890625, 0.14950180053710938, 0.16031646728515625, 0.17113113403320312, 0.18194580078125, 0.19276046752929688, 0.20357513427734375, 0.21438980102539062, 0.2252044677734375, 0.23601913452148438, 0.24683380126953125, 0.2576484680175781, 0.268463134765625, 0.2792778015136719, 0.29009246826171875, 0.3009071350097656, 0.3117218017578125, 0.3225364685058594, 0.33335113525390625, 0.3441658020019531, 0.35498046875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 3.0, 4.0, 10.0, 18.0, 22.0, 32.0, 52.0, 97.0, 139.0, 229.0, 458.0, 1166.0, 3680.0, 16582.0, 172258.0, 3748826.0, 226760.0, 18433.0, 3475.0, 1108.0, 436.0, 199.0, 105.0, 78.0, 27.0, 28.0, 20.0, 15.0, 8.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.09765625, -2.03692626953125, -1.9761962890625, -1.91546630859375, -1.854736328125, -1.79400634765625, -1.7332763671875, -1.67254638671875, -1.61181640625, -1.55108642578125, -1.4903564453125, -1.42962646484375, -1.368896484375, -1.30816650390625, -1.2474365234375, -1.18670654296875, -1.1259765625, -1.06524658203125, -1.0045166015625, -0.94378662109375, -0.883056640625, -0.82232666015625, -0.7615966796875, -0.70086669921875, -0.64013671875, -0.57940673828125, -0.5186767578125, -0.45794677734375, -0.397216796875, -0.33648681640625, -0.2757568359375, -0.21502685546875, -0.154296875, -0.09356689453125, -0.0328369140625, 0.02789306640625, 0.088623046875, 0.14935302734375, 0.2100830078125, 0.27081298828125, 0.33154296875, 0.39227294921875, 0.4530029296875, 0.51373291015625, 0.574462890625, 0.63519287109375, 0.6959228515625, 0.75665283203125, 0.8173828125, 0.87811279296875, 0.9388427734375, 0.99957275390625, 1.060302734375, 1.12103271484375, 1.1817626953125, 1.24249267578125, 1.30322265625, 1.36395263671875, 1.4246826171875, 1.48541259765625, 1.546142578125, 1.60687255859375, 1.6676025390625, 1.72833251953125, 1.7890625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 4.0, 4.0, 6.0, 9.0, 11.0, 24.0, 21.0, 30.0, 77.0, 98.0, 171.0, 437.0, 1496.0, 887.0, 365.0, 184.0, 93.0, 63.0, 33.0, 20.0, 17.0, 7.0, 6.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.50634765625, -0.4936408996582031, -0.48093414306640625, -0.4682273864746094, -0.4555206298828125, -0.4428138732910156, -0.43010711669921875, -0.4174003601074219, -0.404693603515625, -0.3919868469238281, -0.37928009033203125, -0.3665733337402344, -0.3538665771484375, -0.3411598205566406, -0.32845306396484375, -0.3157463073730469, -0.30303955078125, -0.2903327941894531, -0.27762603759765625, -0.2649192810058594, -0.2522125244140625, -0.23950576782226562, -0.22679901123046875, -0.21409225463867188, -0.201385498046875, -0.18867874145507812, -0.17597198486328125, -0.16326522827148438, -0.1505584716796875, -0.13785171508789062, -0.12514495849609375, -0.11243820190429688, -0.0997314453125, -0.08702468872070312, -0.07431793212890625, -0.061611175537109375, -0.0489044189453125, -0.036197662353515625, -0.02349090576171875, -0.010784149169921875, 0.001922607421875, 0.014629364013671875, 0.02733612060546875, 0.040042877197265625, 0.0527496337890625, 0.06545639038085938, 0.07816314697265625, 0.09086990356445312, 0.10357666015625, 0.11628341674804688, 0.12899017333984375, 0.14169692993164062, 0.1544036865234375, 0.16711044311523438, 0.17981719970703125, 0.19252395629882812, 0.205230712890625, 0.21793746948242188, 0.23064422607421875, 0.24335098266601562, 0.2560577392578125, 0.2687644958496094, 0.28147125244140625, 0.2941780090332031, 0.306884765625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 7.0, 6.0, 26.0, 72.0, 156.0, 182.0, 193.0, 177.0, 105.0, 44.0, 23.0, 6.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.639739990234375, -4.539134502410889, -4.438528537750244, -4.337923049926758, -4.237317085266113, -4.136711597442627, -4.036106109619141, -3.935500144958496, -3.8348946571350098, -3.7342889308929443, -3.633683204650879, -3.5330777168273926, -3.432471990585327, -3.3318662643432617, -3.2312605381011963, -3.130654811859131, -3.0300493240356445, -2.929443597793579, -2.8288378715515137, -2.7282323837280273, -2.627626657485962, -2.5270209312438965, -2.426415205001831, -2.3258094787597656, -2.2252037525177, -2.1245980262756348, -2.0239923000335693, -1.9233866930007935, -1.8227810859680176, -1.7221753597259521, -1.6215696334838867, -1.5209640264511108, -1.420358419418335, -1.3197526931762695, -1.2191470861434937, -1.1185413599014282, -1.0179357528686523, -0.9173300266265869, -0.8167243599891663, -0.7161186933517456, -0.615513026714325, -0.5149073600769043, -0.41430169343948364, -0.3136959969997406, -0.21309033036231995, -0.1124846339225769, -0.01187896728515625, 0.0887266993522644, 0.18933236598968506, 0.2899380326271057, 0.39054369926452637, 0.4911493957042694, 0.5917550325393677, 0.6923607587814331, 0.7929664254188538, 0.8935720920562744, 0.9941777586936951, 1.0947834253311157, 1.1953891515731812, 1.295994758605957, 1.3966004848480225, 1.497206211090088, 1.5978118181228638, 1.6984174251556396, 1.799023151397705]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 4.0, 6.0, 7.0, 4.0, 8.0, 10.0, 9.0, 10.0, 13.0, 25.0, 16.0, 24.0, 16.0, 31.0, 35.0, 41.0, 39.0, 34.0, 34.0, 41.0, 46.0, 56.0, 35.0, 43.0, 38.0, 46.0, 37.0, 36.0, 35.0, 37.0, 33.0, 29.0, 10.0, 21.0, 17.0, 22.0, 15.0, 10.0, 6.0, 7.0, 6.0, 7.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.938157320022583, -0.9063146114349365, -0.87447190284729, -0.8426291942596436, -0.8107865452766418, -0.7789438366889954, -0.7471011281013489, -0.7152584195137024, -0.6834157705307007, -0.6515730619430542, -0.6197303533554077, -0.5878876447677612, -0.5560449957847595, -0.524202287197113, -0.49235957860946655, -0.46051687002182007, -0.4286741614341736, -0.3968314528465271, -0.364988774061203, -0.3331460654735565, -0.3013033866882324, -0.26946067810058594, -0.23761796951293945, -0.20577527582645416, -0.17393258213996887, -0.14208988845348358, -0.1102471873164177, -0.0784044861793518, -0.046561792492866516, -0.014719098806381226, 0.01712360978126526, 0.04896630346775055, 0.08080899715423584, 0.11265169084072113, 0.14449438452720642, 0.1763370931148529, 0.2081797868013382, 0.2400224804878235, 0.27186518907546997, 0.30370789766311646, 0.33555057644844055, 0.36739328503608704, 0.39923596382141113, 0.4310786724090576, 0.4629213809967041, 0.4947640597820282, 0.5266067981719971, 0.5584494471549988, 0.5902921557426453, 0.6221348643302917, 0.6539775729179382, 0.6858202219009399, 0.7176629304885864, 0.7495056390762329, 0.7813483476638794, 0.8131910562515259, 0.8450337648391724, 0.8768764734268188, 0.9087191820144653, 0.9405618906021118, 0.9724045395851135, 1.0042471885681152, 1.0360898971557617, 1.0679326057434082, 1.0997753143310547]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 5.0, 2.0, 7.0, 6.0, 7.0, 15.0, 14.0, 20.0, 34.0, 43.0, 72.0, 95.0, 134.0, 198.0, 301.0, 462.0, 713.0, 1170.0, 2001.0, 3642.0, 8026.0, 21909.0, 71728.0, 238188.0, 411015.0, 197377.0, 58344.0, 17936.0, 6900.0, 3349.0, 1814.0, 1028.0, 688.0, 399.0, 296.0, 184.0, 136.0, 101.0, 61.0, 35.0, 27.0, 13.0, 19.0, 14.0, 7.0, 6.0, 1.0, 2.0, 2.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.099609375, -1.064605712890625, -1.02960205078125, -0.994598388671875, -0.9595947265625, -0.924591064453125, -0.88958740234375, -0.854583740234375, -0.819580078125, -0.784576416015625, -0.74957275390625, -0.714569091796875, -0.6795654296875, -0.644561767578125, -0.60955810546875, -0.574554443359375, -0.53955078125, -0.504547119140625, -0.46954345703125, -0.434539794921875, -0.3995361328125, -0.364532470703125, -0.32952880859375, -0.294525146484375, -0.259521484375, -0.224517822265625, -0.18951416015625, -0.154510498046875, -0.1195068359375, -0.084503173828125, -0.04949951171875, -0.014495849609375, 0.0205078125, 0.055511474609375, 0.09051513671875, 0.125518798828125, 0.1605224609375, 0.195526123046875, 0.23052978515625, 0.265533447265625, 0.300537109375, 0.335540771484375, 0.37054443359375, 0.405548095703125, 0.4405517578125, 0.475555419921875, 0.51055908203125, 0.545562744140625, 0.58056640625, 0.615570068359375, 0.65057373046875, 0.685577392578125, 0.7205810546875, 0.755584716796875, 0.79058837890625, 0.825592041015625, 0.860595703125, 0.895599365234375, 0.93060302734375, 0.965606689453125, 1.0006103515625, 1.035614013671875, 1.07061767578125, 1.105621337890625, 1.140625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 5.0, 4.0, 3.0, 14.0, 20.0, 24.0, 36.0, 40.0, 47.0, 71.0, 69.0, 74.0, 91.0, 96.0, 81.0, 74.0, 67.0, 57.0, 31.0, 31.0, 19.0, 17.0, 8.0, 3.0, 6.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.333740234375, -0.3229331970214844, -0.31212615966796875, -0.3013191223144531, -0.2905120849609375, -0.2797050476074219, -0.26889801025390625, -0.2580909729003906, -0.247283935546875, -0.23647689819335938, -0.22566986083984375, -0.21486282348632812, -0.2040557861328125, -0.19324874877929688, -0.18244171142578125, -0.17163467407226562, -0.16082763671875, -0.15002059936523438, -0.13921356201171875, -0.12840652465820312, -0.1175994873046875, -0.10679244995117188, -0.09598541259765625, -0.08517837524414062, -0.074371337890625, -0.06356430053710938, -0.05275726318359375, -0.041950225830078125, -0.0311431884765625, -0.020336151123046875, -0.00952911376953125, 0.001277923583984375, 0.0120849609375, 0.022891998291015625, 0.03369903564453125, 0.044506072998046875, 0.0553131103515625, 0.06612014770507812, 0.07692718505859375, 0.08773422241210938, 0.098541259765625, 0.10934829711914062, 0.12015533447265625, 0.13096237182617188, 0.1417694091796875, 0.15257644653320312, 0.16338348388671875, 0.17419052124023438, 0.18499755859375, 0.19580459594726562, 0.20661163330078125, 0.21741867065429688, 0.2282257080078125, 0.23903274536132812, 0.24983978271484375, 0.2606468200683594, 0.271453857421875, 0.2822608947753906, 0.29306793212890625, 0.3038749694824219, 0.3146820068359375, 0.3254890441894531, 0.33629608154296875, 0.3471031188964844, 0.35791015625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 10.0, 5.0, 12.0, 9.0, 27.0, 29.0, 55.0, 74.0, 157.0, 232.0, 402.0, 836.0, 1929.0, 5086.0, 16341.0, 67130.0, 303163.0, 470838.0, 137765.0, 30562.0, 8469.0, 2942.0, 1206.0, 584.0, 301.0, 156.0, 86.0, 52.0, 42.0, 16.0, 20.0, 15.0, 5.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-1.6181640625, -1.57794189453125, -1.5377197265625, -1.49749755859375, -1.457275390625, -1.41705322265625, -1.3768310546875, -1.33660888671875, -1.29638671875, -1.25616455078125, -1.2159423828125, -1.17572021484375, -1.135498046875, -1.09527587890625, -1.0550537109375, -1.01483154296875, -0.974609375, -0.93438720703125, -0.8941650390625, -0.85394287109375, -0.813720703125, -0.77349853515625, -0.7332763671875, -0.69305419921875, -0.65283203125, -0.61260986328125, -0.5723876953125, -0.53216552734375, -0.491943359375, -0.45172119140625, -0.4114990234375, -0.37127685546875, -0.3310546875, -0.29083251953125, -0.2506103515625, -0.21038818359375, -0.170166015625, -0.12994384765625, -0.0897216796875, -0.04949951171875, -0.00927734375, 0.03094482421875, 0.0711669921875, 0.11138916015625, 0.151611328125, 0.19183349609375, 0.2320556640625, 0.27227783203125, 0.3125, 0.35272216796875, 0.3929443359375, 0.43316650390625, 0.473388671875, 0.51361083984375, 0.5538330078125, 0.59405517578125, 0.63427734375, 0.67449951171875, 0.7147216796875, 0.75494384765625, 0.795166015625, 0.83538818359375, 0.8756103515625, 0.91583251953125, 0.9560546875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 7.0, 5.0, 5.0, 3.0, 5.0, 11.0, 6.0, 15.0, 9.0, 11.0, 24.0, 21.0, 24.0, 18.0, 27.0, 30.0, 28.0, 36.0, 57.0, 42.0, 37.0, 32.0, 46.0, 34.0, 47.0, 32.0, 41.0, 45.0, 32.0, 36.0, 34.0, 29.0, 19.0, 28.0, 27.0, 19.0, 12.0, 16.0, 12.0, 9.0, 7.0, 10.0, 4.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.90087890625, -0.8718948364257812, -0.8429107666015625, -0.8139266967773438, -0.784942626953125, -0.7559585571289062, -0.7269744873046875, -0.6979904174804688, -0.66900634765625, -0.6400222778320312, -0.6110382080078125, -0.5820541381835938, -0.553070068359375, -0.5240859985351562, -0.4951019287109375, -0.46611785888671875, -0.4371337890625, -0.40814971923828125, -0.3791656494140625, -0.35018157958984375, -0.321197509765625, -0.29221343994140625, -0.2632293701171875, -0.23424530029296875, -0.20526123046875, -0.17627716064453125, -0.1472930908203125, -0.11830902099609375, -0.089324951171875, -0.06034088134765625, -0.0313568115234375, -0.00237274169921875, 0.026611328125, 0.05559539794921875, 0.0845794677734375, 0.11356353759765625, 0.142547607421875, 0.17153167724609375, 0.2005157470703125, 0.22949981689453125, 0.25848388671875, 0.28746795654296875, 0.3164520263671875, 0.34543609619140625, 0.374420166015625, 0.40340423583984375, 0.4323883056640625, 0.46137237548828125, 0.4903564453125, 0.5193405151367188, 0.5483245849609375, 0.5773086547851562, 0.606292724609375, 0.6352767944335938, 0.6642608642578125, 0.6932449340820312, 0.72222900390625, 0.7512130737304688, 0.7801971435546875, 0.8091812133789062, 0.838165283203125, 0.8671493530273438, 0.8961334228515625, 0.9251174926757812, 0.9541015625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 3.0, 4.0, 7.0, 11.0, 22.0, 18.0, 41.0, 49.0, 104.0, 154.0, 323.0, 671.0, 1641.0, 5235.0, 23802.0, 202467.0, 664756.0, 125802.0, 16670.0, 4124.0, 1463.0, 573.0, 300.0, 125.0, 65.0, 45.0, 22.0, 14.0, 12.0, 9.0, 7.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.74755859375, -0.7264404296875, -0.705322265625, -0.6842041015625, -0.6630859375, -0.6419677734375, -0.620849609375, -0.5997314453125, -0.57861328125, -0.5574951171875, -0.536376953125, -0.5152587890625, -0.494140625, -0.4730224609375, -0.451904296875, -0.4307861328125, -0.40966796875, -0.3885498046875, -0.367431640625, -0.3463134765625, -0.3251953125, -0.3040771484375, -0.282958984375, -0.2618408203125, -0.24072265625, -0.2196044921875, -0.198486328125, -0.1773681640625, -0.15625, -0.1351318359375, -0.114013671875, -0.0928955078125, -0.07177734375, -0.0506591796875, -0.029541015625, -0.0084228515625, 0.0126953125, 0.0338134765625, 0.054931640625, 0.0760498046875, 0.09716796875, 0.1182861328125, 0.139404296875, 0.1605224609375, 0.181640625, 0.2027587890625, 0.223876953125, 0.2449951171875, 0.26611328125, 0.2872314453125, 0.308349609375, 0.3294677734375, 0.3505859375, 0.3717041015625, 0.392822265625, 0.4139404296875, 0.43505859375, 0.4561767578125, 0.477294921875, 0.4984130859375, 0.51953125, 0.5406494140625, 0.561767578125, 0.5828857421875, 0.60400390625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 6.0, 6.0, 9.0, 13.0, 21.0, 30.0, 44.0, 58.0, 76.0, 112.0, 121.0, 89.0, 126.0, 77.0, 50.0, 47.0, 32.0, 21.0, 13.0, 11.0, 16.0, 5.0, 8.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0001442432403564453, -0.00014064554125070572, -0.00013704784214496613, -0.00013345014303922653, -0.00012985244393348694, -0.00012625474482774734, -0.00012265704572200775, -0.00011905934661626816, -0.00011546164751052856, -0.00011186394840478897, -0.00010826624929904938, -0.00010466855019330978, -0.00010107085108757019, -9.74731519818306e-05, -9.3875452876091e-05, -9.027775377035141e-05, -8.668005466461182e-05, -8.308235555887222e-05, -7.948465645313263e-05, -7.588695734739304e-05, -7.228925824165344e-05, -6.869155913591385e-05, -6.509386003017426e-05, -6.149616092443466e-05, -5.789846181869507e-05, -5.4300762712955475e-05, -5.070306360721588e-05, -4.710536450147629e-05, -4.3507665395736694e-05, -3.99099662899971e-05, -3.631226718425751e-05, -3.2714568078517914e-05, -2.911686897277832e-05, -2.5519169867038727e-05, -2.1921470761299133e-05, -1.832377165555954e-05, -1.4726072549819946e-05, -1.1128373444080353e-05, -7.530674338340759e-06, -3.932975232601166e-06, -3.3527612686157227e-07, 3.2624229788780212e-06, 6.860122084617615e-06, 1.0457821190357208e-05, 1.4055520296096802e-05, 1.7653219401836395e-05, 2.125091850757599e-05, 2.4848617613315582e-05, 2.8446316719055176e-05, 3.204401582479477e-05, 3.564171493053436e-05, 3.9239414036273956e-05, 4.283711314201355e-05, 4.643481224775314e-05, 5.003251135349274e-05, 5.363021045923233e-05, 5.7227909564971924e-05, 6.082560867071152e-05, 6.442330777645111e-05, 6.80210068821907e-05, 7.16187059879303e-05, 7.521640509366989e-05, 7.881410419940948e-05, 8.241180330514908e-05, 8.600950241088867e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 4.0, 5.0, 7.0, 12.0, 18.0, 28.0, 28.0, 55.0, 76.0, 131.0, 266.0, 468.0, 911.0, 2225.0, 6488.0, 26760.0, 179855.0, 612595.0, 181145.0, 26556.0, 6489.0, 2298.0, 1017.0, 473.0, 234.0, 143.0, 93.0, 51.0, 44.0, 20.0, 19.0, 11.0, 9.0, 8.0, 1.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.609375, -0.5917129516601562, -0.5740509033203125, -0.5563888549804688, -0.538726806640625, -0.5210647583007812, -0.5034027099609375, -0.48574066162109375, -0.46807861328125, -0.45041656494140625, -0.4327545166015625, -0.41509246826171875, -0.397430419921875, -0.37976837158203125, -0.3621063232421875, -0.34444427490234375, -0.3267822265625, -0.30912017822265625, -0.2914581298828125, -0.27379608154296875, -0.256134033203125, -0.23847198486328125, -0.2208099365234375, -0.20314788818359375, -0.18548583984375, -0.16782379150390625, -0.1501617431640625, -0.13249969482421875, -0.114837646484375, -0.09717559814453125, -0.0795135498046875, -0.06185150146484375, -0.044189453125, -0.02652740478515625, -0.0088653564453125, 0.00879669189453125, 0.026458740234375, 0.04412078857421875, 0.0617828369140625, 0.07944488525390625, 0.09710693359375, 0.11476898193359375, 0.1324310302734375, 0.15009307861328125, 0.167755126953125, 0.18541717529296875, 0.2030792236328125, 0.22074127197265625, 0.2384033203125, 0.25606536865234375, 0.2737274169921875, 0.29138946533203125, 0.309051513671875, 0.32671356201171875, 0.3443756103515625, 0.36203765869140625, 0.37969970703125, 0.39736175537109375, 0.4150238037109375, 0.43268585205078125, 0.450347900390625, 0.46800994873046875, 0.4856719970703125, 0.5033340454101562, 0.52099609375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 7.0, 7.0, 6.0, 12.0, 12.0, 19.0, 22.0, 34.0, 30.0, 47.0, 77.0, 73.0, 80.0, 114.0, 94.0, 89.0, 73.0, 56.0, 48.0, 33.0, 20.0, 14.0, 9.0, 7.0, 7.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.384521484375, -0.3719673156738281, -0.35941314697265625, -0.3468589782714844, -0.3343048095703125, -0.3217506408691406, -0.30919647216796875, -0.2966423034667969, -0.284088134765625, -0.2715339660644531, -0.25897979736328125, -0.24642562866210938, -0.2338714599609375, -0.22131729125976562, -0.20876312255859375, -0.19620895385742188, -0.18365478515625, -0.17110061645507812, -0.15854644775390625, -0.14599227905273438, -0.1334381103515625, -0.12088394165039062, -0.10832977294921875, -0.09577560424804688, -0.083221435546875, -0.07066726684570312, -0.05811309814453125, -0.045558929443359375, -0.0330047607421875, -0.020450592041015625, -0.00789642333984375, 0.004657745361328125, 0.0172119140625, 0.029766082763671875, 0.04232025146484375, 0.054874420166015625, 0.0674285888671875, 0.07998275756835938, 0.09253692626953125, 0.10509109497070312, 0.117645263671875, 0.13019943237304688, 0.14275360107421875, 0.15530776977539062, 0.1678619384765625, 0.18041610717773438, 0.19297027587890625, 0.20552444458007812, 0.21807861328125, 0.23063278198242188, 0.24318695068359375, 0.2557411193847656, 0.2682952880859375, 0.2808494567871094, 0.29340362548828125, 0.3059577941894531, 0.318511962890625, 0.3310661315917969, 0.34362030029296875, 0.3561744689941406, 0.3687286376953125, 0.3812828063964844, 0.39383697509765625, 0.4063911437988281, 0.4189453125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 5.0, 10.0, 10.0, 17.0, 37.0, 85.0, 132.0, 158.0, 183.0, 167.0, 77.0, 56.0, 30.0, 17.0, 11.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.751825332641602, -15.44526195526123, -15.13869857788086, -14.832135200500488, -14.525571823120117, -14.21900749206543, -13.912444114685059, -13.605880737304688, -13.299317359924316, -12.992753982543945, -12.686190605163574, -12.379627227783203, -12.073062896728516, -11.766499519348145, -11.459936141967773, -11.153372764587402, -10.846809387207031, -10.54024600982666, -10.233682632446289, -9.927119255065918, -9.620555877685547, -9.31399154663086, -9.007428169250488, -8.700864791870117, -8.394301414489746, -8.087738037109375, -7.781174659729004, -7.474610805511475, -7.1680474281311035, -6.861484050750732, -6.554920196533203, -6.248356819152832, -5.941794395446777, -5.635231018066406, -5.328667640686035, -5.022103786468506, -4.715540409088135, -4.408977031707764, -4.102413177490234, -3.7958498001098633, -3.489286422729492, -3.182723045349121, -2.876159429550171, -2.5695958137512207, -2.2630324363708496, -1.956468939781189, -1.6499054431915283, -1.3433418273925781, -1.036778450012207, -0.7302149534225464, -0.42365145683288574, -0.1170879602432251, 0.18947553634643555, 0.4960390329360962, 0.8026025295257568, 1.109166145324707, 1.4157295227050781, 1.7222930192947388, 2.0288565158843994, 2.3354201316833496, 2.6419835090637207, 2.948546886444092, 3.255110502243042, 3.561674118041992, 3.8682374954223633]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 8.0, 6.0, 10.0, 9.0, 18.0, 22.0, 14.0, 24.0, 43.0, 35.0, 50.0, 49.0, 61.0, 70.0, 61.0, 68.0, 64.0, 56.0, 62.0, 48.0, 42.0, 47.0, 33.0, 23.0, 19.0, 15.0, 13.0, 15.0, 4.0, 7.0, 2.0, 5.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.669235229492188, -8.42377758026123, -8.17832088470459, -7.932863235473633, -7.687406063079834, -7.441948890686035, -7.196491241455078, -6.951034069061279, -6.7055768966674805, -6.460119724273682, -6.214662075042725, -5.969204902648926, -5.723747730255127, -5.478290557861328, -5.232832908630371, -4.987375736236572, -4.741918563842773, -4.496461391448975, -4.251003742218018, -4.005546569824219, -3.76008939743042, -3.514631986618042, -3.269174575805664, -3.0237174034118652, -2.778259754180908, -2.5328023433685303, -2.2873451709747314, -2.0418877601623535, -1.7964305877685547, -1.5509731769561768, -1.3055158853530884, -1.06005859375, -0.8146014213562012, -0.5691441297531128, -0.323686808347702, -0.07822948694229126, 0.16722780466079712, 0.4126851558685303, 0.6581424474716187, 0.903599739074707, 1.1490570306777954, 1.3945143222808838, 1.6399716138839722, 1.8854289054870605, 2.1308863162994385, 2.3763437271118164, 2.6218008995056152, 2.867258071899414, 3.112715482711792, 3.35817289352417, 3.6036300659179688, 3.8490874767303467, 4.094544887542725, 4.340002059936523, 4.585459232330322, 4.830916404724121, 5.076374053955078, 5.321831226348877, 5.567288875579834, 5.812746047973633, 6.058203220367432, 6.3036603927612305, 6.5491180419921875, 6.794575214385986, 7.040032386779785]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 5.0, 1.0, 2.0, 2.0, 6.0, 4.0, 2.0, 6.0, 5.0, 8.0, 12.0, 18.0, 23.0, 30.0, 56.0, 73.0, 119.0, 190.0, 347.0, 659.0, 1304.0, 2822.0, 8086.0, 36410.0, 439722.0, 3555571.0, 121322.0, 17875.0, 5197.0, 2104.0, 981.0, 489.0, 284.0, 199.0, 109.0, 72.0, 44.0, 33.0, 27.0, 15.0, 18.0, 7.0, 4.0, 3.0, 11.0, 3.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8994140625, -1.8345489501953125, -1.769683837890625, -1.7048187255859375, -1.63995361328125, -1.5750885009765625, -1.510223388671875, -1.4453582763671875, -1.3804931640625, -1.3156280517578125, -1.250762939453125, -1.1858978271484375, -1.12103271484375, -1.0561676025390625, -0.991302490234375, -0.9264373779296875, -0.861572265625, -0.7967071533203125, -0.731842041015625, -0.6669769287109375, -0.60211181640625, -0.5372467041015625, -0.472381591796875, -0.4075164794921875, -0.3426513671875, -0.2777862548828125, -0.212921142578125, -0.1480560302734375, -0.08319091796875, -0.0183258056640625, 0.046539306640625, 0.1114044189453125, 0.17626953125, 0.2411346435546875, 0.305999755859375, 0.3708648681640625, 0.43572998046875, 0.5005950927734375, 0.565460205078125, 0.6303253173828125, 0.6951904296875, 0.7600555419921875, 0.824920654296875, 0.8897857666015625, 0.95465087890625, 1.0195159912109375, 1.084381103515625, 1.1492462158203125, 1.214111328125, 1.2789764404296875, 1.343841552734375, 1.4087066650390625, 1.47357177734375, 1.5384368896484375, 1.603302001953125, 1.6681671142578125, 1.7330322265625, 1.7978973388671875, 1.862762451171875, 1.9276275634765625, 1.99249267578125, 2.0573577880859375, 2.122222900390625, 2.1870880126953125, 2.251953125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 3.0, 10.0, 8.0, 13.0, 32.0, 36.0, 51.0, 64.0, 75.0, 90.0, 82.0, 100.0, 105.0, 81.0, 65.0, 60.0, 41.0, 21.0, 13.0, 12.0, 15.0, 4.0, 2.0, 8.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.387939453125, -0.3755149841308594, -0.36309051513671875, -0.3506660461425781, -0.3382415771484375, -0.3258171081542969, -0.31339263916015625, -0.3009681701660156, -0.288543701171875, -0.2761192321777344, -0.26369476318359375, -0.2512702941894531, -0.2388458251953125, -0.22642135620117188, -0.21399688720703125, -0.20157241821289062, -0.18914794921875, -0.17672348022460938, -0.16429901123046875, -0.15187454223632812, -0.1394500732421875, -0.12702560424804688, -0.11460113525390625, -0.10217666625976562, -0.089752197265625, -0.07732772827148438, -0.06490325927734375, -0.052478790283203125, -0.0400543212890625, -0.027629852294921875, -0.01520538330078125, -0.002780914306640625, 0.0096435546875, 0.022068023681640625, 0.03449249267578125, 0.046916961669921875, 0.0593414306640625, 0.07176589965820312, 0.08419036865234375, 0.09661483764648438, 0.109039306640625, 0.12146377563476562, 0.13388824462890625, 0.14631271362304688, 0.1587371826171875, 0.17116165161132812, 0.18358612060546875, 0.19601058959960938, 0.20843505859375, 0.22085952758789062, 0.23328399658203125, 0.24570846557617188, 0.2581329345703125, 0.2705574035644531, 0.28298187255859375, 0.2954063415527344, 0.307830810546875, 0.3202552795410156, 0.33267974853515625, 0.3451042175292969, 0.3575286865234375, 0.3699531555175781, 0.38237762451171875, 0.3948020935058594, 0.4072265625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 3.0, 4.0, 3.0, 6.0, 11.0, 22.0, 24.0, 46.0, 60.0, 158.0, 326.0, 764.0, 2221.0, 8743.0, 82119.0, 3901128.0, 182185.0, 12193.0, 2783.0, 854.0, 320.0, 138.0, 75.0, 25.0, 24.0, 17.0, 12.0, 6.0, 7.0, 2.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.19140625, -2.09857177734375, -2.0057373046875, -1.91290283203125, -1.820068359375, -1.72723388671875, -1.6343994140625, -1.54156494140625, -1.44873046875, -1.35589599609375, -1.2630615234375, -1.17022705078125, -1.077392578125, -0.98455810546875, -0.8917236328125, -0.79888916015625, -0.7060546875, -0.61322021484375, -0.5203857421875, -0.42755126953125, -0.334716796875, -0.24188232421875, -0.1490478515625, -0.05621337890625, 0.03662109375, 0.12945556640625, 0.2222900390625, 0.31512451171875, 0.407958984375, 0.50079345703125, 0.5936279296875, 0.68646240234375, 0.779296875, 0.87213134765625, 0.9649658203125, 1.05780029296875, 1.150634765625, 1.24346923828125, 1.3363037109375, 1.42913818359375, 1.52197265625, 1.61480712890625, 1.7076416015625, 1.80047607421875, 1.893310546875, 1.98614501953125, 2.0789794921875, 2.17181396484375, 2.2646484375, 2.35748291015625, 2.4503173828125, 2.54315185546875, 2.635986328125, 2.72882080078125, 2.8216552734375, 2.91448974609375, 3.00732421875, 3.10015869140625, 3.1929931640625, 3.28582763671875, 3.378662109375, 3.47149658203125, 3.5643310546875, 3.65716552734375, 3.75]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 8.0, 11.0, 15.0, 23.0, 32.0, 42.0, 102.0, 191.0, 444.0, 1305.0, 1074.0, 403.0, 167.0, 92.0, 57.0, 34.0, 20.0, 8.0, 7.0, 12.0, 4.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.8203125, -0.7974929809570312, -0.7746734619140625, -0.7518539428710938, -0.729034423828125, -0.7062149047851562, -0.6833953857421875, -0.6605758666992188, -0.63775634765625, -0.6149368286132812, -0.5921173095703125, -0.5692977905273438, -0.546478271484375, -0.5236587524414062, -0.5008392333984375, -0.47801971435546875, -0.4552001953125, -0.43238067626953125, -0.4095611572265625, -0.38674163818359375, -0.363922119140625, -0.34110260009765625, -0.3182830810546875, -0.29546356201171875, -0.27264404296875, -0.24982452392578125, -0.2270050048828125, -0.20418548583984375, -0.181365966796875, -0.15854644775390625, -0.1357269287109375, -0.11290740966796875, -0.090087890625, -0.06726837158203125, -0.0444488525390625, -0.02162933349609375, 0.001190185546875, 0.02400970458984375, 0.0468292236328125, 0.06964874267578125, 0.09246826171875, 0.11528778076171875, 0.1381072998046875, 0.16092681884765625, 0.183746337890625, 0.20656585693359375, 0.2293853759765625, 0.25220489501953125, 0.2750244140625, 0.29784393310546875, 0.3206634521484375, 0.34348297119140625, 0.366302490234375, 0.38912200927734375, 0.4119415283203125, 0.43476104736328125, 0.45758056640625, 0.48040008544921875, 0.5032196044921875, 0.5260391235351562, 0.548858642578125, 0.5716781616210938, 0.5944976806640625, 0.6173171997070312, 0.64013671875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 2.0, 4.0, 8.0, 16.0, 49.0, 115.0, 225.0, 266.0, 184.0, 79.0, 33.0, 13.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.487597465515137, -8.282448768615723, -8.077301025390625, -7.872152328491211, -7.667003631591797, -7.461855411529541, -7.256707191467285, -7.051558494567871, -6.846410274505615, -6.641262054443359, -6.436113357543945, -6.2309651374816895, -6.025816917419434, -5.8206682205200195, -5.615520000457764, -5.410371780395508, -5.205223083496094, -5.000074863433838, -4.794926166534424, -4.589777946472168, -4.384629249572754, -4.179481029510498, -3.974332809448242, -3.7691843509674072, -3.5640358924865723, -3.3588874340057373, -3.1537389755249023, -2.9485907554626465, -2.7434422969818115, -2.5382938385009766, -2.3331456184387207, -2.1279971599578857, -1.922849178314209, -1.717700719833374, -1.5125523805618286, -1.3074040412902832, -1.1022555828094482, -0.8971071243286133, -0.6919587850570679, -0.48681044578552246, -0.2816619873046875, -0.07651358842849731, 0.12863481044769287, 0.33378320932388306, 0.5389316082000732, 0.7440800666809082, 0.9492284059524536, 1.154376745223999, 1.359525203704834, 1.564673662185669, 1.7698220014572144, 1.9749703407287598, 2.1801187992095947, 2.3852672576904297, 2.5904154777526855, 2.7955639362335205, 3.0007123947143555, 3.2058608531951904, 3.4110093116760254, 3.6161575317382812, 3.821305990219116, 4.026454448699951, 4.231602668762207, 4.436751365661621, 4.641899585723877]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 7.0, 3.0, 3.0, 8.0, 5.0, 10.0, 19.0, 29.0, 34.0, 40.0, 48.0, 63.0, 56.0, 82.0, 59.0, 61.0, 57.0, 59.0, 60.0, 59.0, 49.0, 48.0, 33.0, 32.0, 17.0, 23.0, 11.0, 15.0, 6.0, 2.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0690722465515137, -1.9785453081130981, -1.888018250465393, -1.7974913120269775, -1.706964373588562, -1.6164374351501465, -1.5259103775024414, -1.4353834390640259, -1.3448565006256104, -1.2543295621871948, -1.1638025045394897, -1.0732755661010742, -0.9827486276626587, -0.8922216296195984, -0.8016946315765381, -0.7111676931381226, -0.6206406354904175, -0.5301136374473572, -0.43958669900894165, -0.34905970096588135, -0.25853273272514343, -0.16800576448440552, -0.07747876644134521, 0.013048171997070312, 0.10357517004013062, 0.19410213828086853, 0.28462910652160645, 0.37515610456466675, 0.46568307280540466, 0.5562100410461426, 0.6467370390892029, 0.7372639775276184, 0.8277909755706787, 0.918317973613739, 1.0088449716567993, 1.0993719100952148, 1.1898988485336304, 1.280425786972046, 1.370952844619751, 1.4614797830581665, 1.552006721496582, 1.6425336599349976, 1.7330607175827026, 1.8235876560211182, 1.9141145944595337, 2.004641532897949, 2.0951685905456543, 2.1856956481933594, 2.2762227058410645, 2.3667497634887695, 2.4572765827178955, 2.5478036403656006, 2.6383306980133057, 2.7288575172424316, 2.8193845748901367, 2.909911632537842, 3.0004384517669678, 3.090965509414673, 3.181492328643799, 3.272019386291504, 3.362546443939209, 3.453073263168335, 3.54360032081604, 3.634127140045166, 3.724654197692871]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 8.0, 7.0, 12.0, 15.0, 14.0, 18.0, 31.0, 46.0, 70.0, 60.0, 129.0, 159.0, 199.0, 290.0, 438.0, 621.0, 1060.0, 1828.0, 3520.0, 8827.0, 31936.0, 156665.0, 516001.0, 253181.0, 50638.0, 12659.0, 4437.0, 2109.0, 1184.0, 767.0, 477.0, 337.0, 228.0, 152.0, 121.0, 105.0, 59.0, 40.0, 32.0, 19.0, 18.0, 10.0, 9.0, 7.0, 8.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.349609375, -1.3040924072265625, -1.258575439453125, -1.2130584716796875, -1.16754150390625, -1.1220245361328125, -1.076507568359375, -1.0309906005859375, -0.9854736328125, -0.9399566650390625, -0.894439697265625, -0.8489227294921875, -0.80340576171875, -0.7578887939453125, -0.712371826171875, -0.6668548583984375, -0.621337890625, -0.5758209228515625, -0.530303955078125, -0.4847869873046875, -0.43927001953125, -0.3937530517578125, -0.348236083984375, -0.3027191162109375, -0.2572021484375, -0.2116851806640625, -0.166168212890625, -0.1206512451171875, -0.07513427734375, -0.0296173095703125, 0.015899658203125, 0.0614166259765625, 0.10693359375, 0.1524505615234375, 0.197967529296875, 0.2434844970703125, 0.28900146484375, 0.3345184326171875, 0.380035400390625, 0.4255523681640625, 0.4710693359375, 0.5165863037109375, 0.562103271484375, 0.6076202392578125, 0.65313720703125, 0.6986541748046875, 0.744171142578125, 0.7896881103515625, 0.835205078125, 0.8807220458984375, 0.926239013671875, 0.9717559814453125, 1.01727294921875, 1.0627899169921875, 1.108306884765625, 1.1538238525390625, 1.1993408203125, 1.2448577880859375, 1.290374755859375, 1.3358917236328125, 1.38140869140625, 1.4269256591796875, 1.472442626953125, 1.5179595947265625, 1.5634765625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 5.0, 3.0, 21.0, 23.0, 46.0, 77.0, 80.0, 123.0, 121.0, 135.0, 114.0, 85.0, 61.0, 44.0, 24.0, 13.0, 9.0, 6.0, 4.0, 4.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.46435546875, -0.44835662841796875, -0.4323577880859375, -0.41635894775390625, -0.400360107421875, -0.38436126708984375, -0.3683624267578125, -0.35236358642578125, -0.33636474609375, -0.32036590576171875, -0.3043670654296875, -0.28836822509765625, -0.272369384765625, -0.25637054443359375, -0.2403717041015625, -0.22437286376953125, -0.2083740234375, -0.19237518310546875, -0.1763763427734375, -0.16037750244140625, -0.144378662109375, -0.12837982177734375, -0.1123809814453125, -0.09638214111328125, -0.08038330078125, -0.06438446044921875, -0.0483856201171875, -0.03238677978515625, -0.016387939453125, -0.00038909912109375, 0.0156097412109375, 0.03160858154296875, 0.047607421875, 0.06360626220703125, 0.0796051025390625, 0.09560394287109375, 0.111602783203125, 0.12760162353515625, 0.1436004638671875, 0.15959930419921875, 0.17559814453125, 0.19159698486328125, 0.2075958251953125, 0.22359466552734375, 0.239593505859375, 0.25559234619140625, 0.2715911865234375, 0.28759002685546875, 0.3035888671875, 0.31958770751953125, 0.3355865478515625, 0.35158538818359375, 0.367584228515625, 0.38358306884765625, 0.3995819091796875, 0.41558074951171875, 0.43157958984375, 0.44757843017578125, 0.4635772705078125, 0.47957611083984375, 0.495574951171875, 0.5115737915039062, 0.5275726318359375, 0.5435714721679688, 0.5595703125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 7.0, 10.0, 5.0, 13.0, 15.0, 22.0, 42.0, 45.0, 62.0, 100.0, 142.0, 241.0, 386.0, 628.0, 1182.0, 2246.0, 4624.0, 11057.0, 29884.0, 86979.0, 246435.0, 371403.0, 189262.0, 64689.0, 22433.0, 8564.0, 3864.0, 1787.0, 953.0, 560.0, 328.0, 198.0, 104.0, 87.0, 52.0, 51.0, 20.0, 14.0, 14.0, 19.0, 5.0, 9.0, 3.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.81982421875, -0.7952499389648438, -0.7706756591796875, -0.7461013793945312, -0.721527099609375, -0.6969528198242188, -0.6723785400390625, -0.6478042602539062, -0.62322998046875, -0.5986557006835938, -0.5740814208984375, -0.5495071411132812, -0.524932861328125, -0.5003585815429688, -0.4757843017578125, -0.45121002197265625, -0.4266357421875, -0.40206146240234375, -0.3774871826171875, -0.35291290283203125, -0.328338623046875, -0.30376434326171875, -0.2791900634765625, -0.25461578369140625, -0.23004150390625, -0.20546722412109375, -0.1808929443359375, -0.15631866455078125, -0.131744384765625, -0.10717010498046875, -0.0825958251953125, -0.05802154541015625, -0.033447265625, -0.00887298583984375, 0.0157012939453125, 0.04027557373046875, 0.064849853515625, 0.08942413330078125, 0.1139984130859375, 0.13857269287109375, 0.16314697265625, 0.18772125244140625, 0.2122955322265625, 0.23686981201171875, 0.261444091796875, 0.28601837158203125, 0.3105926513671875, 0.33516693115234375, 0.3597412109375, 0.38431549072265625, 0.4088897705078125, 0.43346405029296875, 0.458038330078125, 0.48261260986328125, 0.5071868896484375, 0.5317611694335938, 0.55633544921875, 0.5809097290039062, 0.6054840087890625, 0.6300582885742188, 0.654632568359375, 0.6792068481445312, 0.7037811279296875, 0.7283554077148438, 0.7529296875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 7.0, 5.0, 4.0, 5.0, 14.0, 12.0, 18.0, 24.0, 21.0, 21.0, 36.0, 26.0, 37.0, 42.0, 41.0, 30.0, 52.0, 60.0, 36.0, 45.0, 61.0, 36.0, 56.0, 38.0, 27.0, 37.0, 23.0, 26.0, 26.0, 26.0, 28.0, 13.0, 14.0, 15.0, 8.0, 6.0, 6.0, 4.0, 1.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.90185546875, -0.8738174438476562, -0.8457794189453125, -0.8177413940429688, -0.789703369140625, -0.7616653442382812, -0.7336273193359375, -0.7055892944335938, -0.67755126953125, -0.6495132446289062, -0.6214752197265625, -0.5934371948242188, -0.565399169921875, -0.5373611450195312, -0.5093231201171875, -0.48128509521484375, -0.4532470703125, -0.42520904541015625, -0.3971710205078125, -0.36913299560546875, -0.341094970703125, -0.31305694580078125, -0.2850189208984375, -0.25698089599609375, -0.22894287109375, -0.20090484619140625, -0.1728668212890625, -0.14482879638671875, -0.116790771484375, -0.08875274658203125, -0.0607147216796875, -0.03267669677734375, -0.004638671875, 0.02339935302734375, 0.0514373779296875, 0.07947540283203125, 0.107513427734375, 0.13555145263671875, 0.1635894775390625, 0.19162750244140625, 0.21966552734375, 0.24770355224609375, 0.2757415771484375, 0.30377960205078125, 0.331817626953125, 0.35985565185546875, 0.3878936767578125, 0.41593170166015625, 0.4439697265625, 0.47200775146484375, 0.5000457763671875, 0.5280838012695312, 0.556121826171875, 0.5841598510742188, 0.6121978759765625, 0.6402359008789062, 0.66827392578125, 0.6963119506835938, 0.7243499755859375, 0.7523880004882812, 0.780426025390625, 0.8084640502929688, 0.8365020751953125, 0.8645401000976562, 0.892578125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 6.0, 11.0, 16.0, 33.0, 37.0, 57.0, 83.0, 147.0, 218.0, 347.0, 795.0, 1837.0, 4748.0, 17159.0, 83231.0, 419187.0, 413852.0, 81780.0, 16837.0, 4727.0, 1665.0, 737.0, 398.0, 250.0, 136.0, 84.0, 52.0, 37.0, 24.0, 18.0, 11.0, 11.0, 9.0, 3.0, 2.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.50634765625, -0.48888397216796875, -0.4714202880859375, -0.45395660400390625, -0.436492919921875, -0.41902923583984375, -0.4015655517578125, -0.38410186767578125, -0.36663818359375, -0.34917449951171875, -0.3317108154296875, -0.31424713134765625, -0.296783447265625, -0.27931976318359375, -0.2618560791015625, -0.24439239501953125, -0.2269287109375, -0.20946502685546875, -0.1920013427734375, -0.17453765869140625, -0.157073974609375, -0.13961029052734375, -0.1221466064453125, -0.10468292236328125, -0.08721923828125, -0.06975555419921875, -0.0522918701171875, -0.03482818603515625, -0.017364501953125, 9.918212890625e-05, 0.0175628662109375, 0.03502655029296875, 0.052490234375, 0.06995391845703125, 0.0874176025390625, 0.10488128662109375, 0.122344970703125, 0.13980865478515625, 0.1572723388671875, 0.17473602294921875, 0.19219970703125, 0.20966339111328125, 0.2271270751953125, 0.24459075927734375, 0.262054443359375, 0.27951812744140625, 0.2969818115234375, 0.31444549560546875, 0.3319091796875, 0.34937286376953125, 0.3668365478515625, 0.38430023193359375, 0.401763916015625, 0.41922760009765625, 0.4366912841796875, 0.45415496826171875, 0.47161865234375, 0.48908233642578125, 0.5065460205078125, 0.5240097045898438, 0.541473388671875, 0.5589370727539062, 0.5764007568359375, 0.5938644409179688, 0.611328125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 2.0, 7.0, 6.0, 2.0, 2.0, 15.0, 17.0, 26.0, 20.0, 32.0, 27.0, 44.0, 41.0, 55.0, 71.0, 80.0, 76.0, 68.0, 76.0, 83.0, 57.0, 47.0, 34.0, 27.0, 20.0, 18.0, 11.0, 12.0, 9.0, 5.0, 7.0, 3.0, 3.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-9.530782699584961e-05, -9.285192936658859e-05, -9.039603173732758e-05, -8.794013410806656e-05, -8.548423647880554e-05, -8.302833884954453e-05, -8.057244122028351e-05, -7.811654359102249e-05, -7.566064596176147e-05, -7.320474833250046e-05, -7.074885070323944e-05, -6.829295307397842e-05, -6.583705544471741e-05, -6.338115781545639e-05, -6.0925260186195374e-05, -5.846936255693436e-05, -5.601346492767334e-05, -5.355756729841232e-05, -5.1101669669151306e-05, -4.864577203989029e-05, -4.618987441062927e-05, -4.3733976781368256e-05, -4.127807915210724e-05, -3.882218152284622e-05, -3.6366283893585205e-05, -3.391038626432419e-05, -3.145448863506317e-05, -2.8998591005802155e-05, -2.6542693376541138e-05, -2.408679574728012e-05, -2.1630898118019104e-05, -1.9175000488758087e-05, -1.671910285949707e-05, -1.4263205230236053e-05, -1.1807307600975037e-05, -9.35140997171402e-06, -6.895512342453003e-06, -4.439614713191986e-06, -1.9837170839309692e-06, 4.721805453300476e-07, 2.9280781745910645e-06, 5.383975803852081e-06, 7.839873433113098e-06, 1.0295771062374115e-05, 1.2751668691635132e-05, 1.5207566320896149e-05, 1.7663463950157166e-05, 2.0119361579418182e-05, 2.25752592086792e-05, 2.5031156837940216e-05, 2.7487054467201233e-05, 2.994295209646225e-05, 3.2398849725723267e-05, 3.4854747354984283e-05, 3.73106449842453e-05, 3.976654261350632e-05, 4.2222440242767334e-05, 4.467833787202835e-05, 4.713423550128937e-05, 4.9590133130550385e-05, 5.20460307598114e-05, 5.450192838907242e-05, 5.6957826018333435e-05, 5.941372364759445e-05, 6.186962127685547e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 7.0, 13.0, 10.0, 19.0, 27.0, 39.0, 70.0, 88.0, 153.0, 247.0, 601.0, 1370.0, 3886.0, 14157.0, 82080.0, 482245.0, 388911.0, 57976.0, 10925.0, 3269.0, 1206.0, 546.0, 266.0, 149.0, 107.0, 50.0, 55.0, 26.0, 21.0, 19.0, 5.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 4.0], "bins": [-0.76123046875, -0.7430686950683594, -0.7249069213867188, -0.7067451477050781, -0.6885833740234375, -0.6704216003417969, -0.6522598266601562, -0.6340980529785156, -0.615936279296875, -0.5977745056152344, -0.5796127319335938, -0.5614509582519531, -0.5432891845703125, -0.5251274108886719, -0.5069656372070312, -0.4888038635253906, -0.47064208984375, -0.4524803161621094, -0.43431854248046875, -0.4161567687988281, -0.3979949951171875, -0.3798332214355469, -0.36167144775390625, -0.3435096740722656, -0.325347900390625, -0.3071861267089844, -0.28902435302734375, -0.2708625793457031, -0.2527008056640625, -0.23453903198242188, -0.21637725830078125, -0.19821548461914062, -0.1800537109375, -0.16189193725585938, -0.14373016357421875, -0.12556838989257812, -0.1074066162109375, -0.08924484252929688, -0.07108306884765625, -0.052921295166015625, -0.034759521484375, -0.016597747802734375, 0.00156402587890625, 0.019725799560546875, 0.0378875732421875, 0.056049346923828125, 0.07421112060546875, 0.09237289428710938, 0.11053466796875, 0.12869644165039062, 0.14685821533203125, 0.16501998901367188, 0.1831817626953125, 0.20134353637695312, 0.21950531005859375, 0.23766708374023438, 0.255828857421875, 0.2739906311035156, 0.29215240478515625, 0.3103141784667969, 0.3284759521484375, 0.3466377258300781, 0.36479949951171875, 0.3829612731933594, 0.401123046875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 10.0, 14.0, 12.0, 21.0, 32.0, 48.0, 64.0, 99.0, 102.0, 120.0, 137.0, 85.0, 68.0, 53.0, 48.0, 31.0, 26.0, 13.0, 6.0, 4.0, 5.0, 4.0, 6.0], "bins": [-0.7978515625, -0.7821407318115234, -0.7664299011230469, -0.7507190704345703, -0.7350082397460938, -0.7192974090576172, -0.7035865783691406, -0.6878757476806641, -0.6721649169921875, -0.6564540863037109, -0.6407432556152344, -0.6250324249267578, -0.6093215942382812, -0.5936107635498047, -0.5778999328613281, -0.5621891021728516, -0.546478271484375, -0.5307674407958984, -0.5150566101074219, -0.4993457794189453, -0.48363494873046875, -0.4679241180419922, -0.4522132873535156, -0.43650245666503906, -0.4207916259765625, -0.40508079528808594, -0.3893699645996094, -0.3736591339111328, -0.35794830322265625, -0.3422374725341797, -0.3265266418457031, -0.31081581115722656, -0.29510498046875, -0.27939414978027344, -0.2636833190917969, -0.2479724884033203, -0.23226165771484375, -0.2165508270263672, -0.20083999633789062, -0.18512916564941406, -0.1694183349609375, -0.15370750427246094, -0.13799667358398438, -0.12228584289550781, -0.10657501220703125, -0.09086418151855469, -0.07515335083007812, -0.05944252014160156, -0.043731689453125, -0.028020858764648438, -0.012310028076171875, 0.0034008026123046875, 0.01911163330078125, 0.03482246398925781, 0.050533294677734375, 0.06624412536621094, 0.0819549560546875, 0.09766578674316406, 0.11337661743164062, 0.1290874481201172, 0.14479827880859375, 0.1605091094970703, 0.17621994018554688, 0.19193077087402344, 0.2076416015625]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 7.0, 11.0, 34.0, 40.0, 46.0, 80.0, 126.0, 126.0, 146.0, 118.0, 92.0, 67.0, 31.0, 27.0, 18.0, 13.0, 2.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-7.7641825675964355, -7.555502414703369, -7.346822261810303, -7.138142108917236, -6.92946195602417, -6.7207818031311035, -6.512101173400879, -6.3034210205078125, -6.094740867614746, -5.88606071472168, -5.677380561828613, -5.468700408935547, -5.2600202560424805, -5.051340103149414, -4.842659950256348, -4.633979797363281, -4.425299644470215, -4.216619491577148, -4.007939338684082, -3.7992591857910156, -3.590579032897949, -3.381898880004883, -3.1732184886932373, -2.964538335800171, -2.7558581829071045, -2.547178030014038, -2.3384978771209717, -2.129817485809326, -1.9211374521255493, -1.712457299232483, -1.503777027130127, -1.2950968742370605, -1.0864171981811523, -0.8777370452880859, -0.6690568327903748, -0.4603766202926636, -0.25169646739959717, -0.04301631450653076, 0.1656639575958252, 0.3743441104888916, 0.583024263381958, 0.7917044162750244, 1.0003845691680908, 1.2090648412704468, 1.4177449941635132, 1.6264251470565796, 1.8351054191589355, 2.043785572052002, 2.2524657249450684, 2.4611458778381348, 2.669826030731201, 2.8785061836242676, 3.087186336517334, 3.2958664894104004, 3.504546880722046, 3.7132270336151123, 3.9219071865081787, 4.130587577819824, 4.339267730712891, 4.547947883605957, 4.756628036499023, 4.96530818939209, 5.173988342285156, 5.382668495178223, 5.591348648071289]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 2.0, 0.0, 3.0, 8.0, 10.0, 12.0, 7.0, 9.0, 13.0, 19.0, 23.0, 24.0, 29.0, 27.0, 31.0, 35.0, 25.0, 47.0, 51.0, 49.0, 40.0, 48.0, 42.0, 46.0, 32.0, 59.0, 42.0, 45.0, 21.0, 32.0, 31.0, 19.0, 23.0, 23.0, 11.0, 13.0, 10.0, 9.0, 9.0, 11.0, 7.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.498128414154053, -4.342016696929932, -4.185905456542969, -4.029793739318848, -3.8736822605133057, -3.7175707817077637, -3.5614593029022217, -3.4053478240966797, -3.2492361068725586, -3.0931246280670166, -2.9370131492614746, -2.7809014320373535, -2.6247899532318115, -2.4686784744262695, -2.3125669956207275, -2.1564555168151855, -2.0003440380096436, -1.8442325592041016, -1.68812096118927, -1.532009482383728, -1.3758978843688965, -1.2197864055633545, -1.0636749267578125, -0.907563328742981, -0.751451849937439, -0.5953403115272522, -0.4392288029193878, -0.28311729431152344, -0.12700575590133667, 0.029105782508850098, 0.1852172613143921, 0.34132885932922363, 0.4974403381347656, 0.6535518765449524, 0.8096634149551392, 0.9657748937606812, 1.1218864917755127, 1.2779979705810547, 1.4341094493865967, 1.5902210474014282, 1.7463325262069702, 1.9024440050125122, 2.0585556030273438, 2.2146670818328857, 2.3707785606384277, 2.526890277862549, 2.6830015182495117, 2.839113235473633, 2.995224714279175, 3.151336193084717, 3.307447671890259, 3.463559150695801, 3.619670867919922, 3.775782346725464, 3.931893825531006, 4.088005542755127, 4.24411678314209, 4.400228500366211, 4.556339740753174, 4.712451457977295, 4.868562698364258, 5.024674415588379, 5.1807861328125, 5.336897373199463, 5.493009090423584]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 5.0, 4.0, 3.0, 8.0, 6.0, 18.0, 20.0, 41.0, 58.0, 95.0, 140.0, 250.0, 429.0, 894.0, 2024.0, 6688.0, 33658.0, 474468.0, 3577227.0, 79649.0, 12038.0, 3502.0, 1345.0, 680.0, 381.0, 207.0, 142.0, 98.0, 73.0, 47.0, 30.0, 15.0, 15.0, 8.0, 8.0, 4.0, 3.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.490234375, -1.435455322265625, -1.38067626953125, -1.325897216796875, -1.2711181640625, -1.216339111328125, -1.16156005859375, -1.106781005859375, -1.052001953125, -0.997222900390625, -0.94244384765625, -0.887664794921875, -0.8328857421875, -0.778106689453125, -0.72332763671875, -0.668548583984375, -0.61376953125, -0.558990478515625, -0.50421142578125, -0.449432373046875, -0.3946533203125, -0.339874267578125, -0.28509521484375, -0.230316162109375, -0.175537109375, -0.120758056640625, -0.06597900390625, -0.011199951171875, 0.0435791015625, 0.098358154296875, 0.15313720703125, 0.207916259765625, 0.2626953125, 0.317474365234375, 0.37225341796875, 0.427032470703125, 0.4818115234375, 0.536590576171875, 0.59136962890625, 0.646148681640625, 0.700927734375, 0.755706787109375, 0.81048583984375, 0.865264892578125, 0.9200439453125, 0.974822998046875, 1.02960205078125, 1.084381103515625, 1.13916015625, 1.193939208984375, 1.24871826171875, 1.303497314453125, 1.3582763671875, 1.413055419921875, 1.46783447265625, 1.522613525390625, 1.577392578125, 1.632171630859375, 1.68695068359375, 1.741729736328125, 1.7965087890625, 1.851287841796875, 1.90606689453125, 1.960845947265625, 2.015625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 4.0, 6.0, 15.0, 22.0, 45.0, 50.0, 79.0, 100.0, 93.0, 115.0, 126.0, 93.0, 74.0, 77.0, 38.0, 31.0, 15.0, 10.0, 5.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.46337890625, -0.44725799560546875, -0.4311370849609375, -0.41501617431640625, -0.398895263671875, -0.38277435302734375, -0.3666534423828125, -0.35053253173828125, -0.33441162109375, -0.31829071044921875, -0.3021697998046875, -0.28604888916015625, -0.269927978515625, -0.25380706787109375, -0.2376861572265625, -0.22156524658203125, -0.2054443359375, -0.18932342529296875, -0.1732025146484375, -0.15708160400390625, -0.140960693359375, -0.12483978271484375, -0.1087188720703125, -0.09259796142578125, -0.07647705078125, -0.06035614013671875, -0.0442352294921875, -0.02811431884765625, -0.011993408203125, 0.00412750244140625, 0.0202484130859375, 0.03636932373046875, 0.052490234375, 0.06861114501953125, 0.0847320556640625, 0.10085296630859375, 0.116973876953125, 0.13309478759765625, 0.1492156982421875, 0.16533660888671875, 0.18145751953125, 0.19757843017578125, 0.2136993408203125, 0.22982025146484375, 0.245941162109375, 0.26206207275390625, 0.2781829833984375, 0.29430389404296875, 0.3104248046875, 0.32654571533203125, 0.3426666259765625, 0.35878753662109375, 0.374908447265625, 0.39102935791015625, 0.4071502685546875, 0.42327117919921875, 0.43939208984375, 0.45551300048828125, 0.4716339111328125, 0.48775482177734375, 0.503875732421875, 0.5199966430664062, 0.5361175537109375, 0.5522384643554688, 0.568359375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 3.0, 5.0, 4.0, 6.0, 16.0, 21.0, 48.0, 115.0, 295.0, 800.0, 2695.0, 14193.0, 161982.0, 3784692.0, 208571.0, 16433.0, 3033.0, 819.0, 297.0, 137.0, 62.0, 18.0, 13.0, 11.0, 3.0, 3.0, 4.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.435546875, -1.37933349609375, -1.3231201171875, -1.26690673828125, -1.210693359375, -1.15447998046875, -1.0982666015625, -1.04205322265625, -0.98583984375, -0.92962646484375, -0.8734130859375, -0.81719970703125, -0.760986328125, -0.70477294921875, -0.6485595703125, -0.59234619140625, -0.5361328125, -0.47991943359375, -0.4237060546875, -0.36749267578125, -0.311279296875, -0.25506591796875, -0.1988525390625, -0.14263916015625, -0.08642578125, -0.03021240234375, 0.0260009765625, 0.08221435546875, 0.138427734375, 0.19464111328125, 0.2508544921875, 0.30706787109375, 0.36328125, 0.41949462890625, 0.4757080078125, 0.53192138671875, 0.588134765625, 0.64434814453125, 0.7005615234375, 0.75677490234375, 0.81298828125, 0.86920166015625, 0.9254150390625, 0.98162841796875, 1.037841796875, 1.09405517578125, 1.1502685546875, 1.20648193359375, 1.2626953125, 1.31890869140625, 1.3751220703125, 1.43133544921875, 1.487548828125, 1.54376220703125, 1.5999755859375, 1.65618896484375, 1.71240234375, 1.76861572265625, 1.8248291015625, 1.88104248046875, 1.937255859375, 1.99346923828125, 2.0496826171875, 2.10589599609375, 2.162109375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 1.0, 4.0, 7.0, 12.0, 11.0, 10.0, 19.0, 29.0, 45.0, 96.0, 128.0, 248.0, 551.0, 1640.0, 604.0, 260.0, 142.0, 97.0, 52.0, 39.0, 22.0, 19.0, 15.0, 7.0, 9.0, 1.0, 5.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.409423828125, -0.3960151672363281, -0.38260650634765625, -0.3691978454589844, -0.3557891845703125, -0.3423805236816406, -0.32897186279296875, -0.3155632019042969, -0.302154541015625, -0.2887458801269531, -0.27533721923828125, -0.2619285583496094, -0.2485198974609375, -0.23511123657226562, -0.22170257568359375, -0.20829391479492188, -0.19488525390625, -0.18147659301757812, -0.16806793212890625, -0.15465927124023438, -0.1412506103515625, -0.12784194946289062, -0.11443328857421875, -0.10102462768554688, -0.087615966796875, -0.07420730590820312, -0.06079864501953125, -0.047389984130859375, -0.0339813232421875, -0.020572662353515625, -0.00716400146484375, 0.006244659423828125, 0.0196533203125, 0.033061981201171875, 0.04647064208984375, 0.059879302978515625, 0.0732879638671875, 0.08669662475585938, 0.10010528564453125, 0.11351394653320312, 0.126922607421875, 0.14033126831054688, 0.15373992919921875, 0.16714859008789062, 0.1805572509765625, 0.19396591186523438, 0.20737457275390625, 0.22078323364257812, 0.23419189453125, 0.24760055541992188, 0.26100921630859375, 0.2744178771972656, 0.2878265380859375, 0.3012351989746094, 0.31464385986328125, 0.3280525207519531, 0.341461181640625, 0.3548698425292969, 0.36827850341796875, 0.3816871643066406, 0.3950958251953125, 0.4085044860839844, 0.42191314697265625, 0.4353218078613281, 0.44873046875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 3.0, 11.0, 24.0, 97.0, 167.0, 257.0, 230.0, 121.0, 60.0, 25.0, 3.0, 4.0, 0.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.573794364929199, -6.42956018447876, -6.2853264808654785, -6.141092300415039, -5.9968581199646, -5.85262393951416, -5.708390235900879, -5.5641560554504395, -5.419921875, -5.2756876945495605, -5.131453990936279, -4.98721981048584, -4.8429856300354, -4.698751449584961, -4.55451774597168, -4.41028356552124, -4.266049385070801, -4.121815204620361, -3.977581262588501, -3.8333473205566406, -3.689113140106201, -3.544879198074341, -3.4006452560424805, -3.256411075592041, -3.1121773719787598, -2.9679434299468994, -2.82370924949646, -2.6794753074645996, -2.53524112701416, -2.3910071849823, -2.2467732429504395, -2.1025390625, -1.9583046436309814, -1.8140705823898315, -1.6698365211486816, -1.5256025791168213, -1.3813683986663818, -1.2371344566345215, -1.0929003953933716, -0.9486663341522217, -0.8044322729110718, -0.6601982116699219, -0.515964150428772, -0.37173014879226685, -0.22749608755111694, -0.08326202630996704, 0.060971975326538086, 0.205206036567688, 0.3494400978088379, 0.4936741590499878, 0.6379082202911377, 0.7821422219276428, 0.9263762831687927, 1.0706102848052979, 1.2148443460464478, 1.3590784072875977, 1.5033124685287476, 1.6475465297698975, 1.7917805910110474, 1.9360146522521973, 2.0802485942840576, 2.224482774734497, 2.3687167167663574, 2.512950897216797, 2.6571848392486572]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 6.0, 7.0, 18.0, 16.0, 22.0, 24.0, 41.0, 35.0, 47.0, 47.0, 68.0, 59.0, 81.0, 56.0, 73.0, 68.0, 64.0, 63.0, 51.0, 44.0, 35.0, 21.0, 20.0, 18.0, 8.0, 1.0, 6.0, 0.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6214098930358887, -1.563547134399414, -1.505684494972229, -1.447821855545044, -1.3899590969085693, -1.3320963382720947, -1.2742336988449097, -1.2163710594177246, -1.15850830078125, -1.1006455421447754, -1.0427829027175903, -0.9849202036857605, -0.9270575046539307, -0.8691948056221008, -0.811332106590271, -0.7534694075584412, -0.6956067085266113, -0.6377440094947815, -0.5798813104629517, -0.5220186114311218, -0.464155912399292, -0.40629321336746216, -0.3484305143356323, -0.2905678153038025, -0.23270511627197266, -0.17484241724014282, -0.11697971820831299, -0.059117019176483154, -0.0012543201446533203, 0.056608378887176514, 0.11447107791900635, 0.17233377695083618, 0.23019647598266602, 0.28805917501449585, 0.3459218740463257, 0.4037845730781555, 0.46164727210998535, 0.5195099711418152, 0.577372670173645, 0.6352353692054749, 0.6930980682373047, 0.7509607672691345, 0.8088234663009644, 0.8666861653327942, 0.924548864364624, 0.9824115633964539, 1.0402742624282837, 1.0981369018554688, 1.1559996604919434, 1.213862419128418, 1.271725058555603, 1.329587697982788, 1.3874504566192627, 1.4453132152557373, 1.5031758546829224, 1.5610384941101074, 1.618901252746582, 1.6767640113830566, 1.7346266508102417, 1.7924892902374268, 1.8503520488739014, 1.908214807510376, 1.966077446937561, 2.023940086364746, 2.0818028450012207]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 2.0, 9.0, 12.0, 11.0, 24.0, 19.0, 33.0, 14.0, 48.0, 41.0, 74.0, 129.0, 146.0, 165.0, 256.0, 353.0, 485.0, 738.0, 1142.0, 2071.0, 4202.0, 10851.0, 35233.0, 135600.0, 417104.0, 313490.0, 86785.0, 23613.0, 7687.0, 3304.0, 1622.0, 1009.0, 634.0, 434.0, 369.0, 215.0, 152.0, 125.0, 97.0, 59.0, 48.0, 43.0, 32.0, 21.0, 12.0, 14.0, 7.0, 5.0, 11.0, 3.0, 3.0, 2.0, 2.0, 0.0, 3.0], "bins": [-1.2958984375, -1.257598876953125, -1.21929931640625, -1.180999755859375, -1.1427001953125, -1.104400634765625, -1.06610107421875, -1.027801513671875, -0.989501953125, -0.951202392578125, -0.91290283203125, -0.874603271484375, -0.8363037109375, -0.798004150390625, -0.75970458984375, -0.721405029296875, -0.68310546875, -0.644805908203125, -0.60650634765625, -0.568206787109375, -0.5299072265625, -0.491607666015625, -0.45330810546875, -0.415008544921875, -0.376708984375, -0.338409423828125, -0.30010986328125, -0.261810302734375, -0.2235107421875, -0.185211181640625, -0.14691162109375, -0.108612060546875, -0.0703125, -0.032012939453125, 0.00628662109375, 0.044586181640625, 0.0828857421875, 0.121185302734375, 0.15948486328125, 0.197784423828125, 0.236083984375, 0.274383544921875, 0.31268310546875, 0.350982666015625, 0.3892822265625, 0.427581787109375, 0.46588134765625, 0.504180908203125, 0.54248046875, 0.580780029296875, 0.61907958984375, 0.657379150390625, 0.6956787109375, 0.733978271484375, 0.77227783203125, 0.810577392578125, 0.848876953125, 0.887176513671875, 0.92547607421875, 0.963775634765625, 1.0020751953125, 1.040374755859375, 1.07867431640625, 1.116973876953125, 1.1552734375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 13.0, 14.0, 31.0, 37.0, 59.0, 86.0, 109.0, 106.0, 133.0, 110.0, 82.0, 83.0, 59.0, 26.0, 19.0, 12.0, 9.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47998046875, -0.4636077880859375, -0.447235107421875, -0.4308624267578125, -0.41448974609375, -0.3981170654296875, -0.381744384765625, -0.3653717041015625, -0.3489990234375, -0.3326263427734375, -0.316253662109375, -0.2998809814453125, -0.28350830078125, -0.2671356201171875, -0.250762939453125, -0.2343902587890625, -0.218017578125, -0.2016448974609375, -0.185272216796875, -0.1688995361328125, -0.15252685546875, -0.1361541748046875, -0.119781494140625, -0.1034088134765625, -0.0870361328125, -0.0706634521484375, -0.054290771484375, -0.0379180908203125, -0.02154541015625, -0.0051727294921875, 0.011199951171875, 0.0275726318359375, 0.0439453125, 0.0603179931640625, 0.076690673828125, 0.0930633544921875, 0.10943603515625, 0.1258087158203125, 0.142181396484375, 0.1585540771484375, 0.1749267578125, 0.1912994384765625, 0.207672119140625, 0.2240447998046875, 0.24041748046875, 0.2567901611328125, 0.273162841796875, 0.2895355224609375, 0.305908203125, 0.3222808837890625, 0.338653564453125, 0.3550262451171875, 0.37139892578125, 0.3877716064453125, 0.404144287109375, 0.4205169677734375, 0.4368896484375, 0.4532623291015625, 0.469635009765625, 0.4860076904296875, 0.50238037109375, 0.5187530517578125, 0.535125732421875, 0.5514984130859375, 0.56787109375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 7.0, 2.0, 5.0, 10.0, 9.0, 22.0, 27.0, 24.0, 58.0, 82.0, 123.0, 188.0, 288.0, 547.0, 1153.0, 2392.0, 6404.0, 18212.0, 56155.0, 178567.0, 398459.0, 258548.0, 85150.0, 26675.0, 8896.0, 3422.0, 1475.0, 691.0, 371.0, 228.0, 110.0, 83.0, 51.0, 37.0, 30.0, 17.0, 6.0, 9.0, 4.0, 7.0, 4.0, 1.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75732421875, -0.7318038940429688, -0.7062835693359375, -0.6807632446289062, -0.655242919921875, -0.6297225952148438, -0.6042022705078125, -0.5786819458007812, -0.55316162109375, -0.5276412963867188, -0.5021209716796875, -0.47660064697265625, -0.451080322265625, -0.42555999755859375, -0.4000396728515625, -0.37451934814453125, -0.3489990234375, -0.32347869873046875, -0.2979583740234375, -0.27243804931640625, -0.246917724609375, -0.22139739990234375, -0.1958770751953125, -0.17035675048828125, -0.14483642578125, -0.11931610107421875, -0.0937957763671875, -0.06827545166015625, -0.042755126953125, -0.01723480224609375, 0.0082855224609375, 0.03380584716796875, 0.059326171875, 0.08484649658203125, 0.1103668212890625, 0.13588714599609375, 0.161407470703125, 0.18692779541015625, 0.2124481201171875, 0.23796844482421875, 0.26348876953125, 0.28900909423828125, 0.3145294189453125, 0.34004974365234375, 0.365570068359375, 0.39109039306640625, 0.4166107177734375, 0.44213104248046875, 0.4676513671875, 0.49317169189453125, 0.5186920166015625, 0.5442123413085938, 0.569732666015625, 0.5952529907226562, 0.6207733154296875, 0.6462936401367188, 0.67181396484375, 0.6973342895507812, 0.7228546142578125, 0.7483749389648438, 0.773895263671875, 0.7994155883789062, 0.8249359130859375, 0.8504562377929688, 0.8759765625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 6.0, 11.0, 4.0, 4.0, 9.0, 13.0, 12.0, 12.0, 20.0, 22.0, 18.0, 26.0, 30.0, 31.0, 35.0, 37.0, 40.0, 34.0, 42.0, 42.0, 48.0, 47.0, 50.0, 43.0, 36.0, 38.0, 27.0, 30.0, 34.0, 37.0, 26.0, 22.0, 21.0, 16.0, 16.0, 12.0, 11.0, 7.0, 9.0, 9.0, 5.0, 3.0, 5.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.88525390625, -0.8585433959960938, -0.8318328857421875, -0.8051223754882812, -0.778411865234375, -0.7517013549804688, -0.7249908447265625, -0.6982803344726562, -0.67156982421875, -0.6448593139648438, -0.6181488037109375, -0.5914382934570312, -0.564727783203125, -0.5380172729492188, -0.5113067626953125, -0.48459625244140625, -0.4578857421875, -0.43117523193359375, -0.4044647216796875, -0.37775421142578125, -0.351043701171875, -0.32433319091796875, -0.2976226806640625, -0.27091217041015625, -0.24420166015625, -0.21749114990234375, -0.1907806396484375, -0.16407012939453125, -0.137359619140625, -0.11064910888671875, -0.0839385986328125, -0.05722808837890625, -0.030517578125, -0.00380706787109375, 0.0229034423828125, 0.04961395263671875, 0.076324462890625, 0.10303497314453125, 0.1297454833984375, 0.15645599365234375, 0.18316650390625, 0.20987701416015625, 0.2365875244140625, 0.26329803466796875, 0.290008544921875, 0.31671905517578125, 0.3434295654296875, 0.37014007568359375, 0.3968505859375, 0.42356109619140625, 0.4502716064453125, 0.47698211669921875, 0.503692626953125, 0.5304031372070312, 0.5571136474609375, 0.5838241577148438, 0.61053466796875, 0.6372451782226562, 0.6639556884765625, 0.6906661987304688, 0.717376708984375, 0.7440872192382812, 0.7707977294921875, 0.7975082397460938, 0.82421875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 2.0, 2.0, 5.0, 7.0, 9.0, 12.0, 15.0, 21.0, 26.0, 33.0, 55.0, 94.0, 172.0, 288.0, 654.0, 1362.0, 3616.0, 15237.0, 218425.0, 741377.0, 55455.0, 7340.0, 2376.0, 925.0, 426.0, 230.0, 112.0, 79.0, 46.0, 31.0, 31.0, 26.0, 19.0, 10.0, 4.0, 14.0, 2.0, 2.0, 2.0, 4.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0615234375, -1.0305557250976562, -0.9995880126953125, -0.9686203002929688, -0.937652587890625, -0.9066848754882812, -0.8757171630859375, -0.8447494506835938, -0.81378173828125, -0.7828140258789062, -0.7518463134765625, -0.7208786010742188, -0.689910888671875, -0.6589431762695312, -0.6279754638671875, -0.5970077514648438, -0.5660400390625, -0.5350723266601562, -0.5041046142578125, -0.47313690185546875, -0.442169189453125, -0.41120147705078125, -0.3802337646484375, -0.34926605224609375, -0.31829833984375, -0.28733062744140625, -0.2563629150390625, -0.22539520263671875, -0.194427490234375, -0.16345977783203125, -0.1324920654296875, -0.10152435302734375, -0.070556640625, -0.03958892822265625, -0.0086212158203125, 0.02234649658203125, 0.053314208984375, 0.08428192138671875, 0.1152496337890625, 0.14621734619140625, 0.17718505859375, 0.20815277099609375, 0.2391204833984375, 0.27008819580078125, 0.301055908203125, 0.33202362060546875, 0.3629913330078125, 0.39395904541015625, 0.4249267578125, 0.45589447021484375, 0.4868621826171875, 0.5178298950195312, 0.548797607421875, 0.5797653198242188, 0.6107330322265625, 0.6417007446289062, 0.67266845703125, 0.7036361694335938, 0.7346038818359375, 0.7655715942382812, 0.796539306640625, 0.8275070190429688, 0.8584747314453125, 0.8894424438476562, 0.92041015625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 10.0, 6.0, 10.0, 14.0, 25.0, 50.0, 68.0, 117.0, 191.0, 189.0, 142.0, 63.0, 51.0, 31.0, 14.0, 7.0, 4.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014710426330566406, -0.0001412220299243927, -0.00013533979654312134, -0.00012945756316184998, -0.0001235753297805786, -0.00011769309639930725, -0.00011181086301803589, -0.00010592862963676453, -0.00010004639625549316, -9.41641628742218e-05, -8.828192949295044e-05, -8.239969611167908e-05, -7.651746273040771e-05, -7.063522934913635e-05, -6.475299596786499e-05, -5.887076258659363e-05, -5.2988529205322266e-05, -4.71062958240509e-05, -4.122406244277954e-05, -3.534182906150818e-05, -2.9459595680236816e-05, -2.3577362298965454e-05, -1.7695128917694092e-05, -1.181289553642273e-05, -5.930662155151367e-06, -4.842877388000488e-08, 5.833804607391357e-06, 1.171603798866272e-05, 1.7598271369934082e-05, 2.3480504751205444e-05, 2.9362738132476807e-05, 3.524497151374817e-05, 4.112720489501953e-05, 4.7009438276290894e-05, 5.2891671657562256e-05, 5.877390503883362e-05, 6.465613842010498e-05, 7.053837180137634e-05, 7.64206051826477e-05, 8.230283856391907e-05, 8.818507194519043e-05, 9.406730532646179e-05, 9.994953870773315e-05, 0.00010583177208900452, 0.00011171400547027588, 0.00011759623885154724, 0.0001234784722328186, 0.00012936070561408997, 0.00013524293899536133, 0.0001411251723766327, 0.00014700740575790405, 0.00015288963913917542, 0.00015877187252044678, 0.00016465410590171814, 0.0001705363392829895, 0.00017641857266426086, 0.00018230080604553223, 0.0001881830394268036, 0.00019406527280807495, 0.0001999475061893463, 0.00020582973957061768, 0.00021171197295188904, 0.0002175942063331604, 0.00022347643971443176, 0.00022935867309570312]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 5.0, 6.0, 5.0, 13.0, 18.0, 16.0, 40.0, 38.0, 60.0, 102.0, 170.0, 307.0, 592.0, 1095.0, 2387.0, 5987.0, 18732.0, 82982.0, 378388.0, 423920.0, 99839.0, 21992.0, 6652.0, 2584.0, 1170.0, 614.0, 311.0, 205.0, 108.0, 59.0, 47.0, 32.0, 30.0, 13.0, 13.0, 10.0, 5.0, 4.0, 1.0, 0.0, 4.0, 2.0, 0.0, 3.0, 2.0], "bins": [-0.57373046875, -0.55865478515625, -0.5435791015625, -0.52850341796875, -0.513427734375, -0.49835205078125, -0.4832763671875, -0.46820068359375, -0.453125, -0.43804931640625, -0.4229736328125, -0.40789794921875, -0.392822265625, -0.37774658203125, -0.3626708984375, -0.34759521484375, -0.33251953125, -0.31744384765625, -0.3023681640625, -0.28729248046875, -0.272216796875, -0.25714111328125, -0.2420654296875, -0.22698974609375, -0.2119140625, -0.19683837890625, -0.1817626953125, -0.16668701171875, -0.151611328125, -0.13653564453125, -0.1214599609375, -0.10638427734375, -0.09130859375, -0.07623291015625, -0.0611572265625, -0.04608154296875, -0.031005859375, -0.01593017578125, -0.0008544921875, 0.01422119140625, 0.029296875, 0.04437255859375, 0.0594482421875, 0.07452392578125, 0.089599609375, 0.10467529296875, 0.1197509765625, 0.13482666015625, 0.14990234375, 0.16497802734375, 0.1800537109375, 0.19512939453125, 0.210205078125, 0.22528076171875, 0.2403564453125, 0.25543212890625, 0.2705078125, 0.28558349609375, 0.3006591796875, 0.31573486328125, 0.330810546875, 0.34588623046875, 0.3609619140625, 0.37603759765625, 0.39111328125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 4.0, 4.0, 10.0, 5.0, 4.0, 12.0, 14.0, 16.0, 23.0, 19.0, 38.0, 46.0, 58.0, 71.0, 84.0, 93.0, 80.0, 76.0, 74.0, 61.0, 39.0, 50.0, 38.0, 27.0, 14.0, 11.0, 11.0, 9.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.431396484375, -0.41977691650390625, -0.4081573486328125, -0.39653778076171875, -0.384918212890625, -0.37329864501953125, -0.3616790771484375, -0.35005950927734375, -0.33843994140625, -0.32682037353515625, -0.3152008056640625, -0.30358123779296875, -0.291961669921875, -0.28034210205078125, -0.2687225341796875, -0.25710296630859375, -0.2454833984375, -0.23386383056640625, -0.2222442626953125, -0.21062469482421875, -0.199005126953125, -0.18738555908203125, -0.1757659912109375, -0.16414642333984375, -0.15252685546875, -0.14090728759765625, -0.1292877197265625, -0.11766815185546875, -0.106048583984375, -0.09442901611328125, -0.0828094482421875, -0.07118988037109375, -0.0595703125, -0.04795074462890625, -0.0363311767578125, -0.02471160888671875, -0.013092041015625, -0.00147247314453125, 0.0101470947265625, 0.02176666259765625, 0.03338623046875, 0.04500579833984375, 0.0566253662109375, 0.06824493408203125, 0.079864501953125, 0.09148406982421875, 0.1031036376953125, 0.11472320556640625, 0.1263427734375, 0.13796234130859375, 0.1495819091796875, 0.16120147705078125, 0.172821044921875, 0.18444061279296875, 0.1960601806640625, 0.20767974853515625, 0.21929931640625, 0.23091888427734375, 0.2425384521484375, 0.25415802001953125, 0.265777587890625, 0.27739715576171875, 0.2890167236328125, 0.30063629150390625, 0.312255859375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 0.0, 7.0, 5.0, 17.0, 26.0, 57.0, 83.0, 141.0, 180.0, 180.0, 142.0, 91.0, 38.0, 18.0, 11.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.774497032165527, -9.476940155029297, -9.179384231567383, -8.881827354431152, -8.584270477294922, -8.286714553833008, -7.989157676696777, -7.691601276397705, -7.394044876098633, -7.0964884757995605, -6.79893159866333, -6.501375198364258, -6.2038187980651855, -5.906262397766113, -5.608705520629883, -5.3111491203308105, -5.01359224319458, -4.716035842895508, -4.418478965759277, -4.120922565460205, -3.823366165161133, -3.5258095264434814, -3.22825288772583, -2.930696487426758, -2.6331398487091064, -2.335583209991455, -2.038026809692383, -1.7404701709747314, -1.4429136514663696, -1.1453571319580078, -0.8478004932403564, -0.5502440929412842, -0.2526874542236328, 0.04486909508705139, 0.3424256443977356, 0.6399822235107422, 0.937538743019104, 1.2350952625274658, 1.5326519012451172, 1.8302083015441895, 2.127764940261841, 2.425321578979492, 2.7228779792785645, 3.020434617996216, 3.317991256713867, 3.6155476570129395, 3.913104295730591, 4.210660934448242, 4.5082173347473145, 4.805773735046387, 5.103330612182617, 5.4008870124816895, 5.698443412780762, 5.996000289916992, 6.2935566902160645, 6.591113090515137, 6.888669967651367, 7.1862263679504395, 7.48378324508667, 7.781339645385742, 8.078896522521973, 8.376452445983887, 8.674009323120117, 8.971565246582031, 9.269122123718262]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 2.0, 5.0, 9.0, 8.0, 7.0, 6.0, 16.0, 10.0, 23.0, 15.0, 25.0, 27.0, 27.0, 36.0, 36.0, 48.0, 38.0, 38.0, 46.0, 35.0, 44.0, 42.0, 40.0, 44.0, 48.0, 41.0, 31.0, 36.0, 34.0, 34.0, 19.0, 20.0, 18.0, 11.0, 17.0, 16.0, 13.0, 9.0, 6.0, 5.0, 5.0, 5.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.13310432434082, -4.980539321899414, -4.827974796295166, -4.67540979385376, -4.522845268249512, -4.3702802658081055, -4.217715263366699, -4.065150260925293, -3.912585735321045, -3.7600209712982178, -3.6074562072753906, -3.4548912048339844, -3.3023264408111572, -3.14976167678833, -2.997196674346924, -2.8446319103240967, -2.6920671463012695, -2.5395023822784424, -2.3869376182556152, -2.234372615814209, -2.081807851791382, -1.9292430877685547, -1.776678204536438, -1.6241133213043213, -1.4715485572814941, -1.318983793258667, -1.1664189100265503, -1.0138540267944336, -0.8612892627716064, -0.7087244391441345, -0.5561596155166626, -0.4035947322845459, -0.25102996826171875, -0.09846514463424683, 0.0540996789932251, 0.20666450262069702, 0.35922932624816895, 0.5117941498756409, 0.6643589735031128, 0.8169238567352295, 0.9694886207580566, 1.1220533847808838, 1.2746182680130005, 1.4271831512451172, 1.5797479152679443, 1.7323126792907715, 1.8848775625228882, 2.037442445755005, 2.190007209777832, 2.342571973800659, 2.4951367378234863, 2.6477017402648926, 2.8002665042877197, 2.952831268310547, 3.105396270751953, 3.2579610347747803, 3.4105257987976074, 3.5630905628204346, 3.7156553268432617, 3.868220329284668, 4.020785331726074, 4.173349857330322, 4.3259148597717285, 4.478479385375977, 4.631044387817383]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 5.0, 7.0, 13.0, 10.0, 25.0, 33.0, 57.0, 111.0, 195.0, 402.0, 788.0, 2269.0, 9100.0, 92455.0, 3893900.0, 176099.0, 13359.0, 3133.0, 1116.0, 554.0, 264.0, 145.0, 86.0, 49.0, 44.0, 18.0, 12.0, 5.0, 4.0, 3.0, 3.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.33984375, -2.26806640625, -2.1962890625, -2.12451171875, -2.052734375, -1.98095703125, -1.9091796875, -1.83740234375, -1.765625, -1.69384765625, -1.6220703125, -1.55029296875, -1.478515625, -1.40673828125, -1.3349609375, -1.26318359375, -1.19140625, -1.11962890625, -1.0478515625, -0.97607421875, -0.904296875, -0.83251953125, -0.7607421875, -0.68896484375, -0.6171875, -0.54541015625, -0.4736328125, -0.40185546875, -0.330078125, -0.25830078125, -0.1865234375, -0.11474609375, -0.04296875, 0.02880859375, 0.1005859375, 0.17236328125, 0.244140625, 0.31591796875, 0.3876953125, 0.45947265625, 0.53125, 0.60302734375, 0.6748046875, 0.74658203125, 0.818359375, 0.89013671875, 0.9619140625, 1.03369140625, 1.10546875, 1.17724609375, 1.2490234375, 1.32080078125, 1.392578125, 1.46435546875, 1.5361328125, 1.60791015625, 1.6796875, 1.75146484375, 1.8232421875, 1.89501953125, 1.966796875, 2.03857421875, 2.1103515625, 2.18212890625, 2.25390625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 1.0, 13.0, 32.0, 35.0, 51.0, 62.0, 96.0, 116.0, 108.0, 122.0, 95.0, 91.0, 75.0, 39.0, 20.0, 12.0, 10.0, 8.0, 6.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51220703125, -0.49501800537109375, -0.4778289794921875, -0.46063995361328125, -0.443450927734375, -0.42626190185546875, -0.4090728759765625, -0.39188385009765625, -0.37469482421875, -0.35750579833984375, -0.3403167724609375, -0.32312774658203125, -0.305938720703125, -0.28874969482421875, -0.2715606689453125, -0.25437164306640625, -0.2371826171875, -0.21999359130859375, -0.2028045654296875, -0.18561553955078125, -0.168426513671875, -0.15123748779296875, -0.1340484619140625, -0.11685943603515625, -0.09967041015625, -0.08248138427734375, -0.0652923583984375, -0.04810333251953125, -0.030914306640625, -0.01372528076171875, 0.0034637451171875, 0.02065277099609375, 0.037841796875, 0.05503082275390625, 0.0722198486328125, 0.08940887451171875, 0.106597900390625, 0.12378692626953125, 0.1409759521484375, 0.15816497802734375, 0.17535400390625, 0.19254302978515625, 0.2097320556640625, 0.22692108154296875, 0.244110107421875, 0.26129913330078125, 0.2784881591796875, 0.29567718505859375, 0.3128662109375, 0.33005523681640625, 0.3472442626953125, 0.36443328857421875, 0.381622314453125, 0.39881134033203125, 0.4160003662109375, 0.43318939208984375, 0.45037841796875, 0.46756744384765625, 0.4847564697265625, 0.5019454956054688, 0.519134521484375, 0.5363235473632812, 0.5535125732421875, 0.5707015991210938, 0.587890625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 4.0, 16.0, 24.0, 35.0, 61.0, 198.0, 520.0, 1731.0, 7214.0, 47547.0, 1197863.0, 2861966.0, 65215.0, 8830.0, 2010.0, 623.0, 228.0, 98.0, 45.0, 16.0, 14.0, 9.0, 5.0, 1.0, 7.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8251953125, -1.7731475830078125, -1.721099853515625, -1.6690521240234375, -1.61700439453125, -1.5649566650390625, -1.512908935546875, -1.4608612060546875, -1.4088134765625, -1.3567657470703125, -1.304718017578125, -1.2526702880859375, -1.20062255859375, -1.1485748291015625, -1.096527099609375, -1.0444793701171875, -0.992431640625, -0.9403839111328125, -0.888336181640625, -0.8362884521484375, -0.78424072265625, -0.7321929931640625, -0.680145263671875, -0.6280975341796875, -0.5760498046875, -0.5240020751953125, -0.471954345703125, -0.4199066162109375, -0.36785888671875, -0.3158111572265625, -0.263763427734375, -0.2117156982421875, -0.15966796875, -0.1076202392578125, -0.055572509765625, -0.0035247802734375, 0.04852294921875, 0.1005706787109375, 0.152618408203125, 0.2046661376953125, 0.2567138671875, 0.3087615966796875, 0.360809326171875, 0.4128570556640625, 0.46490478515625, 0.5169525146484375, 0.569000244140625, 0.6210479736328125, 0.673095703125, 0.7251434326171875, 0.777191162109375, 0.8292388916015625, 0.88128662109375, 0.9333343505859375, 0.985382080078125, 1.0374298095703125, 1.0894775390625, 1.1415252685546875, 1.193572998046875, 1.2456207275390625, 1.29766845703125, 1.3497161865234375, 1.401763916015625, 1.4538116455078125, 1.505859375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 4.0, 5.0, 7.0, 5.0, 8.0, 13.0, 14.0, 28.0, 43.0, 52.0, 81.0, 119.0, 203.0, 358.0, 902.0, 1124.0, 443.0, 237.0, 135.0, 85.0, 51.0, 39.0, 24.0, 25.0, 18.0, 10.0, 9.0, 6.0, 7.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.437744140625, -0.4240989685058594, -0.41045379638671875, -0.3968086242675781, -0.3831634521484375, -0.3695182800292969, -0.35587310791015625, -0.3422279357910156, -0.328582763671875, -0.3149375915527344, -0.30129241943359375, -0.2876472473144531, -0.2740020751953125, -0.2603569030761719, -0.24671173095703125, -0.23306655883789062, -0.21942138671875, -0.20577621459960938, -0.19213104248046875, -0.17848587036132812, -0.1648406982421875, -0.15119552612304688, -0.13755035400390625, -0.12390518188476562, -0.110260009765625, -0.09661483764648438, -0.08296966552734375, -0.06932449340820312, -0.0556793212890625, -0.042034149169921875, -0.02838897705078125, -0.014743804931640625, -0.0010986328125, 0.012546539306640625, 0.02619171142578125, 0.039836883544921875, 0.0534820556640625, 0.06712722778320312, 0.08077239990234375, 0.09441757202148438, 0.108062744140625, 0.12170791625976562, 0.13535308837890625, 0.14899826049804688, 0.1626434326171875, 0.17628860473632812, 0.18993377685546875, 0.20357894897460938, 0.21722412109375, 0.23086929321289062, 0.24451446533203125, 0.2581596374511719, 0.2718048095703125, 0.2854499816894531, 0.29909515380859375, 0.3127403259277344, 0.326385498046875, 0.3400306701660156, 0.35367584228515625, 0.3673210144042969, 0.3809661865234375, 0.3946113586425781, 0.40825653076171875, 0.4219017028808594, 0.435546875]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 4.0, 4.0, 8.0, 22.0, 61.0, 115.0, 197.0, 265.0, 169.0, 91.0, 32.0, 25.0, 10.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.444695949554443, -6.2917890548706055, -6.138882160186768, -5.9859747886657715, -5.833067893981934, -5.680160999298096, -5.527254104614258, -5.37434720993042, -5.221440315246582, -5.068533420562744, -4.915626525878906, -4.76271915435791, -4.609812259674072, -4.456905364990234, -4.3039984703063965, -4.151091575622559, -3.9981842041015625, -3.8452773094177246, -3.6923701763153076, -3.5394632816314697, -3.3865561485290527, -3.233649253845215, -3.080742359161377, -2.927835464477539, -2.774928331375122, -2.622021436691284, -2.469114303588867, -2.3162074089050293, -2.1633005142211914, -2.0103933811187744, -1.8574864864349365, -1.704579472541809, -1.5516724586486816, -1.3987654447555542, -1.2458584308624268, -1.0929515361785889, -0.9400445222854614, -0.787137508392334, -0.6342305541038513, -0.48132359981536865, -0.3284165859222412, -0.17550960183143616, -0.022602617740631104, 0.13030436635017395, 0.283211350440979, 0.43611836433410645, 0.5890253186225891, 0.7419322729110718, 0.8948392868041992, 1.0477463006973267, 1.200653314590454, 1.353560209274292, 1.5064672231674194, 1.6593742370605469, 1.8122811317443848, 1.9651881456375122, 2.1180951595306396, 2.2710020542144775, 2.4239091873168945, 2.5768160820007324, 2.7297229766845703, 2.8826301097869873, 3.035537004470825, 3.188444137573242, 3.34135103225708]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 6.0, 7.0, 14.0, 11.0, 18.0, 11.0, 25.0, 29.0, 40.0, 40.0, 44.0, 53.0, 50.0, 62.0, 53.0, 41.0, 62.0, 60.0, 55.0, 46.0, 46.0, 38.0, 33.0, 25.0, 34.0, 21.0, 20.0, 14.0, 11.0, 6.0, 12.0, 4.0, 7.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.924283504486084, -1.8664038181304932, -1.8085241317749023, -1.7506444454193115, -1.6927646398544312, -1.6348849534988403, -1.5770052671432495, -1.5191255807876587, -1.4612458944320679, -1.403366208076477, -1.3454865217208862, -1.2876067161560059, -1.229727029800415, -1.1718473434448242, -1.1139676570892334, -1.0560879707336426, -0.998208224773407, -0.9403285384178162, -0.8824487924575806, -0.8245691061019897, -0.7666894197463989, -0.7088097333908081, -0.6509299874305725, -0.5930503010749817, -0.5351705551147461, -0.4772908389568329, -0.41941115260124207, -0.36153143644332886, -0.30365175008773804, -0.24577203392982483, -0.18789231777191162, -0.1300126314163208, -0.07213294506072998, -0.014253240078687668, 0.043626464903354645, 0.10150617361068726, 0.15938587486743927, 0.21726557612419128, 0.2751452922821045, 0.3330249786376953, 0.3909046947956085, 0.44878441095352173, 0.5066640973091125, 0.5645438432693481, 0.622423529624939, 0.6803032159805298, 0.7381829023361206, 0.7960625886917114, 0.853942334651947, 0.9118220210075378, 0.9697017669677734, 1.0275814533233643, 1.085461139678955, 1.143340826034546, 1.2012205123901367, 1.2591001987457275, 1.316980004310608, 1.3748596906661987, 1.4327393770217896, 1.49061918258667, 1.5484988689422607, 1.6063785552978516, 1.6642582416534424, 1.7221379280090332, 1.780017614364624]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 6.0, 4.0, 5.0, 7.0, 5.0, 12.0, 16.0, 24.0, 44.0, 44.0, 66.0, 105.0, 194.0, 335.0, 528.0, 1010.0, 2176.0, 5646.0, 25224.0, 213144.0, 683062.0, 95718.0, 13800.0, 3848.0, 1573.0, 798.0, 427.0, 277.0, 155.0, 97.0, 74.0, 45.0, 24.0, 15.0, 12.0, 11.0, 5.0, 2.0, 8.0, 5.0, 3.0, 3.0, 2.0, 6.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8564453125, -1.7909088134765625, -1.725372314453125, -1.6598358154296875, -1.59429931640625, -1.5287628173828125, -1.463226318359375, -1.3976898193359375, -1.3321533203125, -1.2666168212890625, -1.201080322265625, -1.1355438232421875, -1.07000732421875, -1.0044708251953125, -0.938934326171875, -0.8733978271484375, -0.807861328125, -0.7423248291015625, -0.676788330078125, -0.6112518310546875, -0.54571533203125, -0.4801788330078125, -0.414642333984375, -0.3491058349609375, -0.2835693359375, -0.2180328369140625, -0.152496337890625, -0.0869598388671875, -0.02142333984375, 0.0441131591796875, 0.109649658203125, 0.1751861572265625, 0.24072265625, 0.3062591552734375, 0.371795654296875, 0.4373321533203125, 0.50286865234375, 0.5684051513671875, 0.633941650390625, 0.6994781494140625, 0.7650146484375, 0.8305511474609375, 0.896087646484375, 0.9616241455078125, 1.02716064453125, 1.0926971435546875, 1.158233642578125, 1.2237701416015625, 1.289306640625, 1.3548431396484375, 1.420379638671875, 1.4859161376953125, 1.55145263671875, 1.6169891357421875, 1.682525634765625, 1.7480621337890625, 1.8135986328125, 1.8791351318359375, 1.944671630859375, 2.0102081298828125, 2.07574462890625, 2.1412811279296875, 2.206817626953125, 2.2723541259765625, 2.337890625]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 5.0, 6.0, 6.0, 16.0, 32.0, 44.0, 53.0, 71.0, 121.0, 98.0, 118.0, 119.0, 100.0, 84.0, 50.0, 31.0, 22.0, 12.0, 5.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51318359375, -0.4957275390625, -0.478271484375, -0.4608154296875, -0.443359375, -0.4259033203125, -0.408447265625, -0.3909912109375, -0.37353515625, -0.3560791015625, -0.338623046875, -0.3211669921875, -0.3037109375, -0.2862548828125, -0.268798828125, -0.2513427734375, -0.23388671875, -0.2164306640625, -0.198974609375, -0.1815185546875, -0.1640625, -0.1466064453125, -0.129150390625, -0.1116943359375, -0.09423828125, -0.0767822265625, -0.059326171875, -0.0418701171875, -0.0244140625, -0.0069580078125, 0.010498046875, 0.0279541015625, 0.04541015625, 0.0628662109375, 0.080322265625, 0.0977783203125, 0.115234375, 0.1326904296875, 0.150146484375, 0.1676025390625, 0.18505859375, 0.2025146484375, 0.219970703125, 0.2374267578125, 0.2548828125, 0.2723388671875, 0.289794921875, 0.3072509765625, 0.32470703125, 0.3421630859375, 0.359619140625, 0.3770751953125, 0.39453125, 0.4119873046875, 0.429443359375, 0.4468994140625, 0.46435546875, 0.4818115234375, 0.499267578125, 0.5167236328125, 0.5341796875, 0.5516357421875, 0.569091796875, 0.5865478515625, 0.60400390625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 4.0, 9.0, 7.0, 8.0, 16.0, 18.0, 18.0, 21.0, 30.0, 52.0, 59.0, 80.0, 142.0, 243.0, 457.0, 916.0, 2545.0, 7918.0, 31010.0, 151015.0, 528928.0, 254657.0, 51626.0, 12271.0, 3580.0, 1362.0, 610.0, 324.0, 205.0, 110.0, 81.0, 60.0, 41.0, 32.0, 20.0, 21.0, 9.0, 12.0, 9.0, 9.0, 3.0, 2.0, 6.0, 2.0, 3.0, 5.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.083984375, -1.0507965087890625, -1.017608642578125, -0.9844207763671875, -0.95123291015625, -0.9180450439453125, -0.884857177734375, -0.8516693115234375, -0.8184814453125, -0.7852935791015625, -0.752105712890625, -0.7189178466796875, -0.68572998046875, -0.6525421142578125, -0.619354248046875, -0.5861663818359375, -0.552978515625, -0.5197906494140625, -0.486602783203125, -0.4534149169921875, -0.42022705078125, -0.3870391845703125, -0.353851318359375, -0.3206634521484375, -0.2874755859375, -0.2542877197265625, -0.221099853515625, -0.1879119873046875, -0.15472412109375, -0.1215362548828125, -0.088348388671875, -0.0551605224609375, -0.02197265625, 0.0112152099609375, 0.044403076171875, 0.0775909423828125, 0.11077880859375, 0.1439666748046875, 0.177154541015625, 0.2103424072265625, 0.2435302734375, 0.2767181396484375, 0.309906005859375, 0.3430938720703125, 0.37628173828125, 0.4094696044921875, 0.442657470703125, 0.4758453369140625, 0.509033203125, 0.5422210693359375, 0.575408935546875, 0.6085968017578125, 0.64178466796875, 0.6749725341796875, 0.708160400390625, 0.7413482666015625, 0.7745361328125, 0.8077239990234375, 0.840911865234375, 0.8740997314453125, 0.90728759765625, 0.9404754638671875, 0.973663330078125, 1.0068511962890625, 1.0400390625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 5.0, 3.0, 2.0, 4.0, 11.0, 11.0, 12.0, 11.0, 17.0, 25.0, 43.0, 30.0, 46.0, 68.0, 50.0, 46.0, 59.0, 52.0, 51.0, 44.0, 47.0, 47.0, 39.0, 44.0, 38.0, 32.0, 29.0, 31.0, 19.0, 12.0, 19.0, 16.0, 12.0, 8.0, 10.0, 4.0, 6.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.970703125, -0.9362030029296875, -0.901702880859375, -0.8672027587890625, -0.83270263671875, -0.7982025146484375, -0.763702392578125, -0.7292022705078125, -0.6947021484375, -0.6602020263671875, -0.625701904296875, -0.5912017822265625, -0.55670166015625, -0.5222015380859375, -0.487701416015625, -0.4532012939453125, -0.418701171875, -0.3842010498046875, -0.349700927734375, -0.3152008056640625, -0.28070068359375, -0.2462005615234375, -0.211700439453125, -0.1772003173828125, -0.1427001953125, -0.1082000732421875, -0.073699951171875, -0.0391998291015625, -0.00469970703125, 0.0298004150390625, 0.064300537109375, 0.0988006591796875, 0.13330078125, 0.1678009033203125, 0.202301025390625, 0.2368011474609375, 0.27130126953125, 0.3058013916015625, 0.340301513671875, 0.3748016357421875, 0.4093017578125, 0.4438018798828125, 0.478302001953125, 0.5128021240234375, 0.54730224609375, 0.5818023681640625, 0.616302490234375, 0.6508026123046875, 0.685302734375, 0.7198028564453125, 0.754302978515625, 0.7888031005859375, 0.82330322265625, 0.8578033447265625, 0.892303466796875, 0.9268035888671875, 0.9613037109375, 0.9958038330078125, 1.030303955078125, 1.0648040771484375, 1.09930419921875, 1.1338043212890625, 1.168304443359375, 1.2028045654296875, 1.2373046875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 3.0, 4.0, 8.0, 8.0, 7.0, 12.0, 22.0, 29.0, 52.0, 66.0, 100.0, 157.0, 276.0, 551.0, 1279.0, 3766.0, 17632.0, 164650.0, 709518.0, 129907.0, 14820.0, 3286.0, 1131.0, 541.0, 290.0, 151.0, 84.0, 58.0, 47.0, 34.0, 22.0, 14.0, 12.0, 6.0, 12.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6376953125, -0.6160430908203125, -0.594390869140625, -0.5727386474609375, -0.55108642578125, -0.5294342041015625, -0.507781982421875, -0.4861297607421875, -0.4644775390625, -0.4428253173828125, -0.421173095703125, -0.3995208740234375, -0.37786865234375, -0.3562164306640625, -0.334564208984375, -0.3129119873046875, -0.291259765625, -0.2696075439453125, -0.247955322265625, -0.2263031005859375, -0.20465087890625, -0.1829986572265625, -0.161346435546875, -0.1396942138671875, -0.1180419921875, -0.0963897705078125, -0.074737548828125, -0.0530853271484375, -0.03143310546875, -0.0097808837890625, 0.011871337890625, 0.0335235595703125, 0.05517578125, 0.0768280029296875, 0.098480224609375, 0.1201324462890625, 0.14178466796875, 0.1634368896484375, 0.185089111328125, 0.2067413330078125, 0.2283935546875, 0.2500457763671875, 0.271697998046875, 0.2933502197265625, 0.31500244140625, 0.3366546630859375, 0.358306884765625, 0.3799591064453125, 0.401611328125, 0.4232635498046875, 0.444915771484375, 0.4665679931640625, 0.48822021484375, 0.5098724365234375, 0.531524658203125, 0.5531768798828125, 0.5748291015625, 0.5964813232421875, 0.618133544921875, 0.6397857666015625, 0.66143798828125, 0.6830902099609375, 0.704742431640625, 0.7263946533203125, 0.748046875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 4.0, 8.0, 4.0, 3.0, 15.0, 16.0, 40.0, 54.0, 81.0, 138.0, 174.0, 147.0, 126.0, 85.0, 40.0, 31.0, 17.0, 8.0, 7.0, 6.0, 0.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010389089584350586, -9.838584810495377e-05, -9.288080036640167e-05, -8.737575262784958e-05, -8.187070488929749e-05, -7.636565715074539e-05, -7.08606094121933e-05, -6.53555616736412e-05, -5.985051393508911e-05, -5.434546619653702e-05, -4.8840418457984924e-05, -4.333537071943283e-05, -3.783032298088074e-05, -3.2325275242328644e-05, -2.682022750377655e-05, -2.1315179765224457e-05, -1.5810132026672363e-05, -1.030508428812027e-05, -4.800036549568176e-06, 7.050111889839172e-07, 6.210058927536011e-06, 1.1715106666088104e-05, 1.7220154404640198e-05, 2.272520214319229e-05, 2.8230249881744385e-05, 3.373529762029648e-05, 3.924034535884857e-05, 4.4745393097400665e-05, 5.025044083595276e-05, 5.575548857450485e-05, 6.126053631305695e-05, 6.676558405160904e-05, 7.227063179016113e-05, 7.777567952871323e-05, 8.328072726726532e-05, 8.878577500581741e-05, 9.429082274436951e-05, 9.97958704829216e-05, 0.0001053009182214737, 0.00011080596596002579, 0.00011631101369857788, 0.00012181606143712997, 0.00012732110917568207, 0.00013282615691423416, 0.00013833120465278625, 0.00014383625239133835, 0.00014934130012989044, 0.00015484634786844254, 0.00016035139560699463, 0.00016585644334554672, 0.00017136149108409882, 0.0001768665388226509, 0.000182371586561203, 0.0001878766342997551, 0.0001933816820383072, 0.00019888672977685928, 0.00020439177751541138, 0.00020989682525396347, 0.00021540187299251556, 0.00022090692073106766, 0.00022641196846961975, 0.00023191701620817184, 0.00023742206394672394, 0.00024292711168527603, 0.0002484321594238281]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 7.0, 11.0, 15.0, 32.0, 45.0, 71.0, 117.0, 219.0, 517.0, 1403.0, 5707.0, 61908.0, 799258.0, 165502.0, 10438.0, 1974.0, 670.0, 279.0, 147.0, 87.0, 49.0, 21.0, 24.0, 14.0, 10.0, 8.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.89599609375, -0.8676910400390625, -0.839385986328125, -0.8110809326171875, -0.78277587890625, -0.7544708251953125, -0.726165771484375, -0.6978607177734375, -0.6695556640625, -0.6412506103515625, -0.612945556640625, -0.5846405029296875, -0.55633544921875, -0.5280303955078125, -0.499725341796875, -0.4714202880859375, -0.443115234375, -0.4148101806640625, -0.386505126953125, -0.3582000732421875, -0.32989501953125, -0.3015899658203125, -0.273284912109375, -0.2449798583984375, -0.2166748046875, -0.1883697509765625, -0.160064697265625, -0.1317596435546875, -0.10345458984375, -0.0751495361328125, -0.046844482421875, -0.0185394287109375, 0.009765625, 0.0380706787109375, 0.066375732421875, 0.0946807861328125, 0.12298583984375, 0.1512908935546875, 0.179595947265625, 0.2079010009765625, 0.2362060546875, 0.2645111083984375, 0.292816162109375, 0.3211212158203125, 0.34942626953125, 0.3777313232421875, 0.406036376953125, 0.4343414306640625, 0.462646484375, 0.4909515380859375, 0.519256591796875, 0.5475616455078125, 0.57586669921875, 0.6041717529296875, 0.632476806640625, 0.6607818603515625, 0.6890869140625, 0.7173919677734375, 0.745697021484375, 0.7740020751953125, 0.80230712890625, 0.8306121826171875, 0.858917236328125, 0.8872222900390625, 0.91552734375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 0.0, 5.0, 3.0, 6.0, 5.0, 9.0, 14.0, 37.0, 41.0, 62.0, 92.0, 99.0, 116.0, 120.0, 117.0, 81.0, 60.0, 50.0, 28.0, 20.0, 11.0, 5.0, 8.0, 7.0, 2.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.46337890625, -0.4463653564453125, -0.429351806640625, -0.4123382568359375, -0.39532470703125, -0.3783111572265625, -0.361297607421875, -0.3442840576171875, -0.3272705078125, -0.3102569580078125, -0.293243408203125, -0.2762298583984375, -0.25921630859375, -0.2422027587890625, -0.225189208984375, -0.2081756591796875, -0.191162109375, -0.1741485595703125, -0.157135009765625, -0.1401214599609375, -0.12310791015625, -0.1060943603515625, -0.089080810546875, -0.0720672607421875, -0.0550537109375, -0.0380401611328125, -0.021026611328125, -0.0040130615234375, 0.01300048828125, 0.0300140380859375, 0.047027587890625, 0.0640411376953125, 0.0810546875, 0.0980682373046875, 0.115081787109375, 0.1320953369140625, 0.14910888671875, 0.1661224365234375, 0.183135986328125, 0.2001495361328125, 0.2171630859375, 0.2341766357421875, 0.251190185546875, 0.2682037353515625, 0.28521728515625, 0.3022308349609375, 0.319244384765625, 0.3362579345703125, 0.353271484375, 0.3702850341796875, 0.387298583984375, 0.4043121337890625, 0.42132568359375, 0.4383392333984375, 0.455352783203125, 0.4723663330078125, 0.4893798828125, 0.5063934326171875, 0.523406982421875, 0.5404205322265625, 0.55743408203125, 0.5744476318359375, 0.591461181640625, 0.6084747314453125, 0.62548828125]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 12.0, 17.0, 24.0, 75.0, 121.0, 173.0, 205.0, 189.0, 86.0, 52.0, 24.0, 15.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.511625289916992, -12.199226379394531, -11.886826515197754, -11.574427604675293, -11.262028694152832, -10.949628829956055, -10.637229919433594, -10.324831008911133, -10.012432098388672, -9.700033187866211, -9.387633323669434, -9.075234413146973, -8.762835502624512, -8.450435638427734, -8.138036727905273, -7.8256378173828125, -7.513237953186035, -7.200838565826416, -6.888439655303955, -6.576040267944336, -6.263641357421875, -5.951241970062256, -5.638842582702637, -5.326443672180176, -5.014044284820557, -4.7016448974609375, -4.389245986938477, -4.076846599578857, -3.7644474506378174, -3.4520483016967773, -3.139648914337158, -2.827249765396118, -2.5148496627807617, -2.2024505138397217, -1.890051245689392, -1.5776519775390625, -1.2652528285980225, -0.9528536796569824, -0.6404544115066528, -0.32805514335632324, -0.015655994415283203, 0.2967432141304016, 0.6091424226760864, 0.9215416312217712, 1.233940839767456, 1.546339988708496, 1.8587392568588257, 2.1711385250091553, 2.4835376739501953, 2.7959368228912354, 3.1083359718322754, 3.4207353591918945, 3.7331345081329346, 4.045533657073975, 4.357933044433594, 4.670331954956055, 4.982731342315674, 5.295130729675293, 5.607529640197754, 5.919929027557373, 6.232328414916992, 6.544727325439453, 6.857126712799072, 7.169526100158691, 7.481925010681152]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 6.0, 2.0, 4.0, 9.0, 6.0, 14.0, 16.0, 18.0, 25.0, 23.0, 27.0, 45.0, 29.0, 55.0, 47.0, 47.0, 60.0, 59.0, 60.0, 53.0, 48.0, 45.0, 41.0, 45.0, 26.0, 28.0, 31.0, 31.0, 28.0, 19.0, 26.0, 12.0, 4.0, 4.0, 6.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.699517726898193, -6.519691467285156, -6.339865207672119, -6.160038948059082, -5.980213165283203, -5.800386905670166, -5.620560646057129, -5.440734386444092, -5.260908126831055, -5.081081867218018, -4.9012556076049805, -4.721429347991943, -4.541603088378906, -4.361777305603027, -4.18195104598999, -4.002124786376953, -3.822298526763916, -3.642472267150879, -3.462646007537842, -3.282819986343384, -3.1029937267303467, -2.9231674671173096, -2.7433414459228516, -2.5635151863098145, -2.3836889266967773, -2.2038626670837402, -2.024036407470703, -1.8442103862762451, -1.664384126663208, -1.484557867050171, -1.3047317266464233, -1.1249055862426758, -0.9450788497924805, -0.7652526497840881, -0.5854264497756958, -0.40560024976730347, -0.22577404975891113, -0.0459478497505188, 0.13387835025787354, 0.3137044906616211, 0.4935307502746582, 0.6733569502830505, 0.8531831502914429, 1.0330092906951904, 1.2128355503082275, 1.3926618099212646, 1.5724879503250122, 1.7523140907287598, 1.9321403503417969, 2.111966609954834, 2.291792869567871, 2.471618890762329, 2.651445150375366, 2.8312714099884033, 3.0110974311828613, 3.1909236907958984, 3.3707499504089355, 3.5505762100219727, 3.7304024696350098, 3.9102284908294678, 4.090054512023926, 4.269880771636963, 4.44970703125, 4.629533290863037, 4.809359550476074]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 7.0, 11.0, 11.0, 17.0, 15.0, 32.0, 50.0, 49.0, 84.0, 120.0, 196.0, 374.0, 762.0, 1740.0, 5156.0, 20360.0, 157991.0, 3823744.0, 154804.0, 19600.0, 5194.0, 1857.0, 841.0, 428.0, 291.0, 171.0, 108.0, 88.0, 56.0, 42.0, 24.0, 16.0, 6.0, 8.0, 6.0, 8.0, 7.0, 1.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.69140625, -1.6409149169921875, -1.590423583984375, -1.5399322509765625, -1.48944091796875, -1.4389495849609375, -1.388458251953125, -1.3379669189453125, -1.2874755859375, -1.2369842529296875, -1.186492919921875, -1.1360015869140625, -1.08551025390625, -1.0350189208984375, -0.984527587890625, -0.9340362548828125, -0.883544921875, -0.8330535888671875, -0.782562255859375, -0.7320709228515625, -0.68157958984375, -0.6310882568359375, -0.580596923828125, -0.5301055908203125, -0.4796142578125, -0.4291229248046875, -0.378631591796875, -0.3281402587890625, -0.27764892578125, -0.2271575927734375, -0.176666259765625, -0.1261749267578125, -0.07568359375, -0.0251922607421875, 0.025299072265625, 0.0757904052734375, 0.12628173828125, 0.1767730712890625, 0.227264404296875, 0.2777557373046875, 0.3282470703125, 0.3787384033203125, 0.429229736328125, 0.4797210693359375, 0.53021240234375, 0.5807037353515625, 0.631195068359375, 0.6816864013671875, 0.732177734375, 0.7826690673828125, 0.833160400390625, 0.8836517333984375, 0.93414306640625, 0.9846343994140625, 1.035125732421875, 1.0856170654296875, 1.1361083984375, 1.1865997314453125, 1.237091064453125, 1.2875823974609375, 1.33807373046875, 1.3885650634765625, 1.439056396484375, 1.4895477294921875, 1.5400390625]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 6.0, 4.0, 9.0, 13.0, 18.0, 36.0, 62.0, 104.0, 104.0, 114.0, 126.0, 132.0, 93.0, 65.0, 55.0, 21.0, 16.0, 15.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58740234375, -0.5686264038085938, -0.5498504638671875, -0.5310745239257812, -0.512298583984375, -0.49352264404296875, -0.4747467041015625, -0.45597076416015625, -0.43719482421875, -0.41841888427734375, -0.3996429443359375, -0.38086700439453125, -0.362091064453125, -0.34331512451171875, -0.3245391845703125, -0.30576324462890625, -0.2869873046875, -0.26821136474609375, -0.2494354248046875, -0.23065948486328125, -0.211883544921875, -0.19310760498046875, -0.1743316650390625, -0.15555572509765625, -0.13677978515625, -0.11800384521484375, -0.0992279052734375, -0.08045196533203125, -0.061676025390625, -0.04290008544921875, -0.0241241455078125, -0.00534820556640625, 0.013427734375, 0.03220367431640625, 0.0509796142578125, 0.06975555419921875, 0.088531494140625, 0.10730743408203125, 0.1260833740234375, 0.14485931396484375, 0.16363525390625, 0.18241119384765625, 0.2011871337890625, 0.21996307373046875, 0.238739013671875, 0.25751495361328125, 0.2762908935546875, 0.29506683349609375, 0.3138427734375, 0.33261871337890625, 0.3513946533203125, 0.37017059326171875, 0.388946533203125, 0.40772247314453125, 0.4264984130859375, 0.44527435302734375, 0.46405029296875, 0.48282623291015625, 0.5016021728515625, 0.5203781127929688, 0.539154052734375, 0.5579299926757812, 0.5767059326171875, 0.5954818725585938, 0.6142578125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 4.0, 3.0, 7.0, 11.0, 17.0, 26.0, 50.0, 126.0, 203.0, 353.0, 779.0, 1751.0, 4516.0, 15077.0, 73758.0, 2116064.0, 1887014.0, 72136.0, 14806.0, 4473.0, 1616.0, 764.0, 341.0, 173.0, 97.0, 53.0, 27.0, 21.0, 8.0, 2.0, 1.0, 6.0, 2.0, 1.0, 1.0], "bins": [-1.791015625, -1.7512130737304688, -1.7114105224609375, -1.6716079711914062, -1.631805419921875, -1.5920028686523438, -1.5522003173828125, -1.5123977661132812, -1.47259521484375, -1.4327926635742188, -1.3929901123046875, -1.3531875610351562, -1.313385009765625, -1.2735824584960938, -1.2337799072265625, -1.1939773559570312, -1.1541748046875, -1.1143722534179688, -1.0745697021484375, -1.0347671508789062, -0.994964599609375, -0.9551620483398438, -0.9153594970703125, -0.8755569458007812, -0.83575439453125, -0.7959518432617188, -0.7561492919921875, -0.7163467407226562, -0.676544189453125, -0.6367416381835938, -0.5969390869140625, -0.5571365356445312, -0.517333984375, -0.47753143310546875, -0.4377288818359375, -0.39792633056640625, -0.358123779296875, -0.31832122802734375, -0.2785186767578125, -0.23871612548828125, -0.19891357421875, -0.15911102294921875, -0.1193084716796875, -0.07950592041015625, -0.039703369140625, 9.918212890625e-05, 0.0399017333984375, 0.07970428466796875, 0.1195068359375, 0.15930938720703125, 0.1991119384765625, 0.23891448974609375, 0.278717041015625, 0.31851959228515625, 0.3583221435546875, 0.39812469482421875, 0.43792724609375, 0.47772979736328125, 0.5175323486328125, 0.5573348999023438, 0.597137451171875, 0.6369400024414062, 0.6767425537109375, 0.7165451049804688, 0.75634765625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 2.0, 4.0, 6.0, 2.0, 8.0, 15.0, 15.0, 13.0, 39.0, 47.0, 65.0, 82.0, 175.0, 308.0, 1280.0, 1256.0, 337.0, 173.0, 91.0, 47.0, 35.0, 19.0, 17.0, 6.0, 9.0, 7.0, 4.0, 2.0, 4.0, 2.0, 2.0, 0.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.53369140625, -0.5200042724609375, -0.506317138671875, -0.4926300048828125, -0.47894287109375, -0.4652557373046875, -0.451568603515625, -0.4378814697265625, -0.4241943359375, -0.4105072021484375, -0.396820068359375, -0.3831329345703125, -0.36944580078125, -0.3557586669921875, -0.342071533203125, -0.3283843994140625, -0.314697265625, -0.3010101318359375, -0.287322998046875, -0.2736358642578125, -0.25994873046875, -0.2462615966796875, -0.232574462890625, -0.2188873291015625, -0.2052001953125, -0.1915130615234375, -0.177825927734375, -0.1641387939453125, -0.15045166015625, -0.1367645263671875, -0.123077392578125, -0.1093902587890625, -0.095703125, -0.0820159912109375, -0.068328857421875, -0.0546417236328125, -0.04095458984375, -0.0272674560546875, -0.013580322265625, 0.0001068115234375, 0.0137939453125, 0.0274810791015625, 0.041168212890625, 0.0548553466796875, 0.06854248046875, 0.0822296142578125, 0.095916748046875, 0.1096038818359375, 0.123291015625, 0.1369781494140625, 0.150665283203125, 0.1643524169921875, 0.17803955078125, 0.1917266845703125, 0.205413818359375, 0.2191009521484375, 0.2327880859375, 0.2464752197265625, 0.260162353515625, 0.2738494873046875, 0.28753662109375, 0.3012237548828125, 0.314910888671875, 0.3285980224609375, 0.34228515625]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 0.0, 3.0, 3.0, 16.0, 65.0, 164.0, 297.0, 283.0, 116.0, 38.0, 12.0, 6.0, 6.0], "bins": [-10.268869400024414, -10.091272354125977, -9.913675308227539, -9.736079216003418, -9.55848217010498, -9.380885124206543, -9.203288078308105, -9.025691986083984, -8.848094940185547, -8.67049789428711, -8.492900848388672, -8.31530475616455, -8.137707710266113, -7.960110664367676, -7.7825140953063965, -7.604917049407959, -7.42732048034668, -7.249723434448242, -7.072126865386963, -6.894529819488525, -6.716933250427246, -6.539336204528809, -6.361739635467529, -6.184142589569092, -6.006545543670654, -5.828948497772217, -5.6513519287109375, -5.4737548828125, -5.296158313751221, -5.118561267852783, -4.940964698791504, -4.763367652893066, -4.585771560668945, -4.408174514770508, -4.2305779457092285, -4.052980899810791, -3.8753843307495117, -3.6977875232696533, -3.520190715789795, -3.3425936698913574, -3.16499662399292, -2.9873998165130615, -2.809803009033203, -2.6322062015533447, -2.4546093940734863, -2.277012586593628, -2.0994157791137695, -1.9218188524246216, -1.7442221641540527, -1.5666253566741943, -1.389028549194336, -1.2114317417144775, -1.0338349342346191, -0.856238067150116, -0.6786412000656128, -0.5010443925857544, -0.323447585105896, -0.1458507627248764, 0.03174605965614319, 0.20934289693832397, 0.3869397044181824, 0.5645365118980408, 0.742133378982544, 0.9197301864624023, 1.0973269939422607]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 8.0, 11.0, 17.0, 21.0, 20.0, 37.0, 39.0, 48.0, 56.0, 65.0, 69.0, 79.0, 77.0, 81.0, 66.0, 50.0, 49.0, 54.0, 45.0, 32.0, 27.0, 16.0, 11.0, 8.0, 5.0, 7.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.4956579208374023, -2.4305272102355957, -2.36539626121521, -2.3002655506134033, -2.2351346015930176, -2.170003890991211, -2.1048731803894043, -2.0397422313690186, -1.974611520767212, -1.9094806909561157, -1.8443498611450195, -1.779219150543213, -1.7140883207321167, -1.6489574909210205, -1.5838267803192139, -1.5186959505081177, -1.4535651206970215, -1.3884342908859253, -1.323303461074829, -1.2581727504730225, -1.1930419206619263, -1.12791109085083, -1.0627803802490234, -0.9976495504379272, -0.932518720626831, -0.8673878908157349, -0.8022571206092834, -0.737126350402832, -0.6719955205917358, -0.6068646907806396, -0.5417339205741882, -0.47660312056541443, -0.4114725589752197, -0.3463417589664459, -0.2812109589576721, -0.21608015894889832, -0.1509493589401245, -0.08581855893135071, -0.020687758922576904, 0.0444430410861969, 0.1095738410949707, 0.1747046411037445, 0.2398354411125183, 0.3049662411212921, 0.3700970411300659, 0.4352278411388397, 0.5003586411476135, 0.5654894113540649, 0.6306202411651611, 0.6957510709762573, 0.7608818411827087, 0.8260126113891602, 0.8911434412002563, 0.9562742710113525, 1.0214049816131592, 1.0865358114242554, 1.1516666412353516, 1.2167974710464478, 1.281928300857544, 1.3470590114593506, 1.4121898412704468, 1.477320671081543, 1.5424513816833496, 1.6075822114944458, 1.672713041305542]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 3.0, 11.0, 19.0, 28.0, 39.0, 68.0, 138.0, 257.0, 486.0, 915.0, 2183.0, 8406.0, 82226.0, 767870.0, 166882.0, 13792.0, 2909.0, 1144.0, 525.0, 276.0, 146.0, 91.0, 41.0, 34.0, 19.0, 14.0, 8.0, 5.0, 4.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.341796875, -2.27215576171875, -2.2025146484375, -2.13287353515625, -2.063232421875, -1.99359130859375, -1.9239501953125, -1.85430908203125, -1.78466796875, -1.71502685546875, -1.6453857421875, -1.57574462890625, -1.506103515625, -1.43646240234375, -1.3668212890625, -1.29718017578125, -1.2275390625, -1.15789794921875, -1.0882568359375, -1.01861572265625, -0.948974609375, -0.87933349609375, -0.8096923828125, -0.74005126953125, -0.67041015625, -0.60076904296875, -0.5311279296875, -0.46148681640625, -0.391845703125, -0.32220458984375, -0.2525634765625, -0.18292236328125, -0.11328125, -0.04364013671875, 0.0260009765625, 0.09564208984375, 0.165283203125, 0.23492431640625, 0.3045654296875, 0.37420654296875, 0.44384765625, 0.51348876953125, 0.5831298828125, 0.65277099609375, 0.722412109375, 0.79205322265625, 0.8616943359375, 0.93133544921875, 1.0009765625, 1.07061767578125, 1.1402587890625, 1.20989990234375, 1.279541015625, 1.34918212890625, 1.4188232421875, 1.48846435546875, 1.55810546875, 1.62774658203125, 1.6973876953125, 1.76702880859375, 1.836669921875, 1.90631103515625, 1.9759521484375, 2.04559326171875, 2.115234375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 4.0, 14.0, 20.0, 36.0, 53.0, 98.0, 117.0, 113.0, 142.0, 128.0, 94.0, 75.0, 41.0, 33.0, 19.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69921875, -0.6788406372070312, -0.6584625244140625, -0.6380844116210938, -0.617706298828125, -0.5973281860351562, -0.5769500732421875, -0.5565719604492188, -0.53619384765625, -0.5158157348632812, -0.4954376220703125, -0.47505950927734375, -0.454681396484375, -0.43430328369140625, -0.4139251708984375, -0.39354705810546875, -0.3731689453125, -0.35279083251953125, -0.3324127197265625, -0.31203460693359375, -0.291656494140625, -0.27127838134765625, -0.2509002685546875, -0.23052215576171875, -0.21014404296875, -0.18976593017578125, -0.1693878173828125, -0.14900970458984375, -0.128631591796875, -0.10825347900390625, -0.0878753662109375, -0.06749725341796875, -0.047119140625, -0.02674102783203125, -0.0063629150390625, 0.01401519775390625, 0.034393310546875, 0.05477142333984375, 0.0751495361328125, 0.09552764892578125, 0.11590576171875, 0.13628387451171875, 0.1566619873046875, 0.17704010009765625, 0.197418212890625, 0.21779632568359375, 0.2381744384765625, 0.25855255126953125, 0.2789306640625, 0.29930877685546875, 0.3196868896484375, 0.34006500244140625, 0.360443115234375, 0.38082122802734375, 0.4011993408203125, 0.42157745361328125, 0.44195556640625, 0.46233367919921875, 0.4827117919921875, 0.5030899047851562, 0.523468017578125, 0.5438461303710938, 0.5642242431640625, 0.5846023559570312, 0.60498046875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 11.0, 10.0, 11.0, 18.0, 18.0, 22.0, 28.0, 54.0, 64.0, 73.0, 110.0, 156.0, 255.0, 437.0, 1102.0, 3322.0, 11312.0, 41561.0, 164282.0, 483023.0, 253700.0, 64072.0, 16876.0, 4873.0, 1612.0, 609.0, 307.0, 175.0, 115.0, 78.0, 64.0, 43.0, 38.0, 32.0, 24.0, 8.0, 13.0, 14.0, 5.0, 8.0, 1.0, 6.0, 2.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.87158203125, -0.8448944091796875, -0.818206787109375, -0.7915191650390625, -0.76483154296875, -0.7381439208984375, -0.711456298828125, -0.6847686767578125, -0.6580810546875, -0.6313934326171875, -0.604705810546875, -0.5780181884765625, -0.55133056640625, -0.5246429443359375, -0.497955322265625, -0.4712677001953125, -0.444580078125, -0.4178924560546875, -0.391204833984375, -0.3645172119140625, -0.33782958984375, -0.3111419677734375, -0.284454345703125, -0.2577667236328125, -0.2310791015625, -0.2043914794921875, -0.177703857421875, -0.1510162353515625, -0.12432861328125, -0.0976409912109375, -0.070953369140625, -0.0442657470703125, -0.017578125, 0.0091094970703125, 0.035797119140625, 0.0624847412109375, 0.08917236328125, 0.1158599853515625, 0.142547607421875, 0.1692352294921875, 0.1959228515625, 0.2226104736328125, 0.249298095703125, 0.2759857177734375, 0.30267333984375, 0.3293609619140625, 0.356048583984375, 0.3827362060546875, 0.409423828125, 0.4361114501953125, 0.462799072265625, 0.4894866943359375, 0.51617431640625, 0.5428619384765625, 0.569549560546875, 0.5962371826171875, 0.6229248046875, 0.6496124267578125, 0.676300048828125, 0.7029876708984375, 0.72967529296875, 0.7563629150390625, 0.783050537109375, 0.8097381591796875, 0.83642578125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 7.0, 4.0, 6.0, 2.0, 7.0, 10.0, 11.0, 5.0, 12.0, 12.0, 13.0, 17.0, 21.0, 16.0, 22.0, 35.0, 31.0, 32.0, 43.0, 41.0, 28.0, 50.0, 49.0, 38.0, 45.0, 38.0, 32.0, 35.0, 32.0, 34.0, 32.0, 41.0, 29.0, 20.0, 22.0, 20.0, 21.0, 14.0, 12.0, 10.0, 14.0, 9.0, 3.0, 5.0, 9.0, 4.0, 2.0, 7.0, 6.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7744140625, -0.7495346069335938, -0.7246551513671875, -0.6997756958007812, -0.674896240234375, -0.6500167846679688, -0.6251373291015625, -0.6002578735351562, -0.57537841796875, -0.5504989624023438, -0.5256195068359375, -0.5007400512695312, -0.475860595703125, -0.45098114013671875, -0.4261016845703125, -0.40122222900390625, -0.3763427734375, -0.35146331787109375, -0.3265838623046875, -0.30170440673828125, -0.276824951171875, -0.25194549560546875, -0.2270660400390625, -0.20218658447265625, -0.17730712890625, -0.15242767333984375, -0.1275482177734375, -0.10266876220703125, -0.077789306640625, -0.05290985107421875, -0.0280303955078125, -0.00315093994140625, 0.021728515625, 0.04660797119140625, 0.0714874267578125, 0.09636688232421875, 0.121246337890625, 0.14612579345703125, 0.1710052490234375, 0.19588470458984375, 0.22076416015625, 0.24564361572265625, 0.2705230712890625, 0.29540252685546875, 0.320281982421875, 0.34516143798828125, 0.3700408935546875, 0.39492034912109375, 0.4197998046875, 0.44467926025390625, 0.4695587158203125, 0.49443817138671875, 0.519317626953125, 0.5441970825195312, 0.5690765380859375, 0.5939559936523438, 0.61883544921875, 0.6437149047851562, 0.6685943603515625, 0.6934738159179688, 0.718353271484375, 0.7432327270507812, 0.7681121826171875, 0.7929916381835938, 0.81787109375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 4.0, 4.0, 8.0, 14.0, 17.0, 35.0, 59.0, 83.0, 111.0, 156.0, 219.0, 380.0, 778.0, 1714.0, 5006.0, 20803.0, 133972.0, 607704.0, 232121.0, 33818.0, 7106.0, 2268.0, 933.0, 496.0, 265.0, 176.0, 109.0, 60.0, 45.0, 30.0, 26.0, 9.0, 13.0, 8.0, 1.0, 2.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.310791015625, -0.2964286804199219, -0.28206634521484375, -0.2677040100097656, -0.2533416748046875, -0.23897933959960938, -0.22461700439453125, -0.21025466918945312, -0.195892333984375, -0.18152999877929688, -0.16716766357421875, -0.15280532836914062, -0.1384429931640625, -0.12408065795898438, -0.10971832275390625, -0.09535598754882812, -0.08099365234375, -0.06663131713867188, -0.05226898193359375, -0.037906646728515625, -0.0235443115234375, -0.009181976318359375, 0.00518035888671875, 0.019542694091796875, 0.033905029296875, 0.048267364501953125, 0.06262969970703125, 0.07699203491210938, 0.0913543701171875, 0.10571670532226562, 0.12007904052734375, 0.13444137573242188, 0.1488037109375, 0.16316604614257812, 0.17752838134765625, 0.19189071655273438, 0.2062530517578125, 0.22061538696289062, 0.23497772216796875, 0.24934005737304688, 0.263702392578125, 0.2780647277832031, 0.29242706298828125, 0.3067893981933594, 0.3211517333984375, 0.3355140686035156, 0.34987640380859375, 0.3642387390136719, 0.37860107421875, 0.3929634094238281, 0.40732574462890625, 0.4216880798339844, 0.4360504150390625, 0.4504127502441406, 0.46477508544921875, 0.4791374206542969, 0.493499755859375, 0.5078620910644531, 0.5222244262695312, 0.5365867614746094, 0.5509490966796875, 0.5653114318847656, 0.5796737670898438, 0.5940361022949219, 0.6083984375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 2.0, 6.0, 5.0, 9.0, 27.0, 31.0, 41.0, 65.0, 90.0, 81.0, 118.0, 115.0, 102.0, 81.0, 72.0, 47.0, 35.0, 20.0, 21.0, 6.0, 9.0, 10.0, 4.0, 2.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.232759475708008e-05, -8.917786180973053e-05, -8.602812886238098e-05, -8.287839591503143e-05, -7.972866296768188e-05, -7.657893002033234e-05, -7.342919707298279e-05, -7.027946412563324e-05, -6.712973117828369e-05, -6.397999823093414e-05, -6.0830265283584595e-05, -5.7680532336235046e-05, -5.45307993888855e-05, -5.138106644153595e-05, -4.82313334941864e-05, -4.508160054683685e-05, -4.1931867599487305e-05, -3.8782134652137756e-05, -3.563240170478821e-05, -3.248266875743866e-05, -2.933293581008911e-05, -2.6183202862739563e-05, -2.3033469915390015e-05, -1.9883736968040466e-05, -1.6734004020690918e-05, -1.358427107334137e-05, -1.0434538125991821e-05, -7.284805178642273e-06, -4.135072231292725e-06, -9.853392839431763e-07, 2.164393663406372e-06, 5.31412661075592e-06, 8.463859558105469e-06, 1.1613592505455017e-05, 1.4763325452804565e-05, 1.7913058400154114e-05, 2.1062791347503662e-05, 2.421252429485321e-05, 2.736225724220276e-05, 3.0511990189552307e-05, 3.3661723136901855e-05, 3.6811456084251404e-05, 3.996118903160095e-05, 4.31109219789505e-05, 4.626065492630005e-05, 4.94103878736496e-05, 5.2560120820999146e-05, 5.5709853768348694e-05, 5.885958671569824e-05, 6.200931966304779e-05, 6.515905261039734e-05, 6.830878555774689e-05, 7.145851850509644e-05, 7.460825145244598e-05, 7.775798439979553e-05, 8.090771734714508e-05, 8.405745029449463e-05, 8.720718324184418e-05, 9.035691618919373e-05, 9.350664913654327e-05, 9.665638208389282e-05, 9.980611503124237e-05, 0.00010295584797859192, 0.00010610558092594147, 0.00010925531387329102]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 5.0, 6.0, 15.0, 34.0, 45.0, 100.0, 228.0, 536.0, 1579.0, 5784.0, 45591.0, 659843.0, 309537.0, 19887.0, 3485.0, 1150.0, 389.0, 179.0, 70.0, 44.0, 19.0, 10.0, 6.0, 5.0, 5.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.79052734375, -0.7696304321289062, -0.7487335205078125, -0.7278366088867188, -0.706939697265625, -0.6860427856445312, -0.6651458740234375, -0.6442489624023438, -0.62335205078125, -0.6024551391601562, -0.5815582275390625, -0.5606613159179688, -0.539764404296875, -0.5188674926757812, -0.4979705810546875, -0.47707366943359375, -0.4561767578125, -0.43527984619140625, -0.4143829345703125, -0.39348602294921875, -0.372589111328125, -0.35169219970703125, -0.3307952880859375, -0.30989837646484375, -0.28900146484375, -0.26810455322265625, -0.2472076416015625, -0.22631072998046875, -0.205413818359375, -0.18451690673828125, -0.1636199951171875, -0.14272308349609375, -0.121826171875, -0.10092926025390625, -0.0800323486328125, -0.05913543701171875, -0.038238525390625, -0.01734161376953125, 0.0035552978515625, 0.02445220947265625, 0.04534912109375, 0.06624603271484375, 0.0871429443359375, 0.10803985595703125, 0.128936767578125, 0.14983367919921875, 0.1707305908203125, 0.19162750244140625, 0.2125244140625, 0.23342132568359375, 0.2543182373046875, 0.27521514892578125, 0.296112060546875, 0.31700897216796875, 0.3379058837890625, 0.35880279541015625, 0.37969970703125, 0.40059661865234375, 0.4214935302734375, 0.44239044189453125, 0.463287353515625, 0.48418426513671875, 0.5050811767578125, 0.5259780883789062, 0.546875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 5.0, 6.0, 5.0, 19.0, 11.0, 25.0, 26.0, 41.0, 49.0, 52.0, 69.0, 98.0, 70.0, 81.0, 85.0, 69.0, 76.0, 57.0, 38.0, 29.0, 26.0, 18.0, 12.0, 8.0, 7.0, 4.0, 6.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.40625, -0.39566802978515625, -0.3850860595703125, -0.37450408935546875, -0.363922119140625, -0.35334014892578125, -0.3427581787109375, -0.33217620849609375, -0.32159423828125, -0.31101226806640625, -0.3004302978515625, -0.28984832763671875, -0.279266357421875, -0.26868438720703125, -0.2581024169921875, -0.24752044677734375, -0.2369384765625, -0.22635650634765625, -0.2157745361328125, -0.20519256591796875, -0.194610595703125, -0.18402862548828125, -0.1734466552734375, -0.16286468505859375, -0.15228271484375, -0.14170074462890625, -0.1311187744140625, -0.12053680419921875, -0.109954833984375, -0.09937286376953125, -0.0887908935546875, -0.07820892333984375, -0.067626953125, -0.05704498291015625, -0.0464630126953125, -0.03588104248046875, -0.025299072265625, -0.01471710205078125, -0.0041351318359375, 0.00644683837890625, 0.01702880859375, 0.02761077880859375, 0.0381927490234375, 0.04877471923828125, 0.059356689453125, 0.06993865966796875, 0.0805206298828125, 0.09110260009765625, 0.1016845703125, 0.11226654052734375, 0.1228485107421875, 0.13343048095703125, 0.144012451171875, 0.15459442138671875, 0.1651763916015625, 0.17575836181640625, 0.18634033203125, 0.19692230224609375, 0.2075042724609375, 0.21808624267578125, 0.228668212890625, 0.23925018310546875, 0.2498321533203125, 0.26041412353515625, 0.27099609375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 39.0, 79.0, 156.0, 264.0, 224.0, 133.0, 66.0, 25.0, 11.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.559551239013672, -12.207952499389648, -11.856354713439941, -11.504755973815918, -11.153157234191895, -10.801559448242188, -10.449960708618164, -10.09836196899414, -9.746763229370117, -9.395164489746094, -9.043566703796387, -8.691967964172363, -8.34036922454834, -7.988770961761475, -7.637172698974609, -7.285573959350586, -6.933976173400879, -6.582377910614014, -6.23077917098999, -5.879180908203125, -5.527582168579102, -5.175983905792236, -4.824385643005371, -4.472786903381348, -4.121188640594482, -3.769590139389038, -3.4179916381835938, -3.0663933753967285, -2.714794874191284, -2.36319637298584, -2.0115981101989746, -1.6599996089935303, -1.3084001541137695, -0.95680171251297, -0.6052032709121704, -0.2536048889160156, 0.09799361228942871, 0.44959211349487305, 0.8011903762817383, 1.1527888774871826, 1.504387378692627, 1.8559858798980713, 2.2075843811035156, 2.559182643890381, 2.910781145095825, 3.2623796463012695, 3.6139779090881348, 3.965576410293579, 4.317174911499023, 4.668773174285889, 5.020371913909912, 5.371970176696777, 5.723568916320801, 6.075167179107666, 6.426765441894531, 6.778364181518555, 7.12996244430542, 7.481560707092285, 7.833159446716309, 8.184757232666016, 8.536355972290039, 8.887954711914062, 9.239553451538086, 9.591151237487793, 9.942749977111816]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 5.0, 7.0, 17.0, 11.0, 16.0, 16.0, 13.0, 25.0, 27.0, 30.0, 41.0, 41.0, 30.0, 45.0, 44.0, 35.0, 43.0, 57.0, 44.0, 41.0, 50.0, 36.0, 44.0, 36.0, 32.0, 35.0, 33.0, 33.0, 19.0, 24.0, 12.0, 11.0, 14.0, 15.0, 10.0, 7.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.811568737030029, -4.672929286956787, -4.534289836883545, -4.395650386810303, -4.257011413574219, -4.118371963500977, -3.9797325134277344, -3.841093063354492, -3.70245361328125, -3.563814163208008, -3.4251747131347656, -3.2865355014801025, -3.1478960514068604, -3.009256601333618, -2.870617389678955, -2.731977939605713, -2.5933384895324707, -2.4546990394592285, -2.3160595893859863, -2.1774203777313232, -2.038780927658081, -1.9001414775848389, -1.7615021467208862, -1.6228628158569336, -1.4842233657836914, -1.3455839157104492, -1.2069445848464966, -1.068305253982544, -0.9296658039093018, -0.7910264134407043, -0.6523870229721069, -0.5137476325035095, -0.3751077651977539, -0.2364683747291565, -0.09782898426055908, 0.04081040620803833, 0.17944979667663574, 0.31808918714523315, 0.45672857761383057, 0.595367968082428, 0.7340073585510254, 0.8726467490196228, 1.0112861394882202, 1.1499254703521729, 1.288564920425415, 1.4272043704986572, 1.5658437013626099, 1.7044830322265625, 1.8431224822998047, 1.9817619323730469, 2.120401382446289, 2.259040594100952, 2.3976800441741943, 2.5363194942474365, 2.6749587059020996, 2.813598155975342, 2.952237606048584, 3.090877056121826, 3.2295165061950684, 3.3681557178497314, 3.5067951679229736, 3.645434617996216, 3.784073829650879, 3.922713279724121, 4.061352729797363]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 6.0, 12.0, 20.0, 27.0, 36.0, 64.0, 133.0, 216.0, 374.0, 864.0, 2516.0, 11537.0, 180052.0, 3950300.0, 39404.0, 5496.0, 1659.0, 704.0, 335.0, 192.0, 136.0, 66.0, 45.0, 34.0, 10.0, 8.0, 3.0, 5.0, 4.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.146484375, -3.05975341796875, -2.9730224609375, -2.88629150390625, -2.799560546875, -2.71282958984375, -2.6260986328125, -2.53936767578125, -2.45263671875, -2.36590576171875, -2.2791748046875, -2.19244384765625, -2.105712890625, -2.01898193359375, -1.9322509765625, -1.84552001953125, -1.7587890625, -1.67205810546875, -1.5853271484375, -1.49859619140625, -1.411865234375, -1.32513427734375, -1.2384033203125, -1.15167236328125, -1.06494140625, -0.97821044921875, -0.8914794921875, -0.80474853515625, -0.718017578125, -0.63128662109375, -0.5445556640625, -0.45782470703125, -0.37109375, -0.28436279296875, -0.1976318359375, -0.11090087890625, -0.024169921875, 0.06256103515625, 0.1492919921875, 0.23602294921875, 0.32275390625, 0.40948486328125, 0.4962158203125, 0.58294677734375, 0.669677734375, 0.75640869140625, 0.8431396484375, 0.92987060546875, 1.0166015625, 1.10333251953125, 1.1900634765625, 1.27679443359375, 1.363525390625, 1.45025634765625, 1.5369873046875, 1.62371826171875, 1.71044921875, 1.79718017578125, 1.8839111328125, 1.97064208984375, 2.057373046875, 2.14410400390625, 2.2308349609375, 2.31756591796875, 2.404296875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 6.0, 5.0, 20.0, 27.0, 45.0, 77.0, 107.0, 112.0, 130.0, 112.0, 112.0, 97.0, 64.0, 44.0, 24.0, 6.0, 9.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6796875, -0.6596145629882812, -0.6395416259765625, -0.6194686889648438, -0.599395751953125, -0.5793228149414062, -0.5592498779296875, -0.5391769409179688, -0.51910400390625, -0.49903106689453125, -0.4789581298828125, -0.45888519287109375, -0.438812255859375, -0.41873931884765625, -0.3986663818359375, -0.37859344482421875, -0.3585205078125, -0.33844757080078125, -0.3183746337890625, -0.29830169677734375, -0.278228759765625, -0.25815582275390625, -0.2380828857421875, -0.21800994873046875, -0.19793701171875, -0.17786407470703125, -0.1577911376953125, -0.13771820068359375, -0.117645263671875, -0.09757232666015625, -0.0774993896484375, -0.05742645263671875, -0.037353515625, -0.01728057861328125, 0.0027923583984375, 0.02286529541015625, 0.042938232421875, 0.06301116943359375, 0.0830841064453125, 0.10315704345703125, 0.12322998046875, 0.14330291748046875, 0.1633758544921875, 0.18344879150390625, 0.203521728515625, 0.22359466552734375, 0.2436676025390625, 0.26374053955078125, 0.2838134765625, 0.30388641357421875, 0.3239593505859375, 0.34403228759765625, 0.364105224609375, 0.38417816162109375, 0.4042510986328125, 0.42432403564453125, 0.44439697265625, 0.46446990966796875, 0.4845428466796875, 0.5046157836914062, 0.524688720703125, 0.5447616577148438, 0.5648345947265625, 0.5849075317382812, 0.60498046875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 9.0, 14.0, 23.0, 38.0, 73.0, 102.0, 170.0, 288.0, 527.0, 996.0, 1968.0, 4502.0, 12091.0, 46979.0, 412169.0, 3553822.0, 123132.0, 23651.0, 7478.0, 3019.0, 1456.0, 742.0, 439.0, 215.0, 173.0, 72.0, 50.0, 34.0, 17.0, 8.0, 10.0, 7.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0966796875, -1.0592041015625, -1.021728515625, -0.9842529296875, -0.94677734375, -0.9093017578125, -0.871826171875, -0.8343505859375, -0.796875, -0.7593994140625, -0.721923828125, -0.6844482421875, -0.64697265625, -0.6094970703125, -0.572021484375, -0.5345458984375, -0.4970703125, -0.4595947265625, -0.422119140625, -0.3846435546875, -0.34716796875, -0.3096923828125, -0.272216796875, -0.2347412109375, -0.197265625, -0.1597900390625, -0.122314453125, -0.0848388671875, -0.04736328125, -0.0098876953125, 0.027587890625, 0.0650634765625, 0.1025390625, 0.1400146484375, 0.177490234375, 0.2149658203125, 0.25244140625, 0.2899169921875, 0.327392578125, 0.3648681640625, 0.40234375, 0.4398193359375, 0.477294921875, 0.5147705078125, 0.55224609375, 0.5897216796875, 0.627197265625, 0.6646728515625, 0.7021484375, 0.7396240234375, 0.777099609375, 0.8145751953125, 0.85205078125, 0.8895263671875, 0.927001953125, 0.9644775390625, 1.001953125, 1.0394287109375, 1.076904296875, 1.1143798828125, 1.15185546875, 1.1893310546875, 1.226806640625, 1.2642822265625, 1.3017578125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 5.0, 4.0, 1.0, 11.0, 25.0, 25.0, 46.0, 79.0, 170.0, 484.0, 2445.0, 399.0, 150.0, 90.0, 44.0, 22.0, 25.0, 15.0, 9.0, 7.0, 6.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.5205078125, -0.5022048950195312, -0.4839019775390625, -0.46559906005859375, -0.447296142578125, -0.42899322509765625, -0.4106903076171875, -0.39238739013671875, -0.37408447265625, -0.35578155517578125, -0.3374786376953125, -0.31917572021484375, -0.300872802734375, -0.28256988525390625, -0.2642669677734375, -0.24596405029296875, -0.2276611328125, -0.20935821533203125, -0.1910552978515625, -0.17275238037109375, -0.154449462890625, -0.13614654541015625, -0.1178436279296875, -0.09954071044921875, -0.08123779296875, -0.06293487548828125, -0.0446319580078125, -0.02632904052734375, -0.008026123046875, 0.01027679443359375, 0.0285797119140625, 0.04688262939453125, 0.065185546875, 0.08348846435546875, 0.1017913818359375, 0.12009429931640625, 0.138397216796875, 0.15670013427734375, 0.1750030517578125, 0.19330596923828125, 0.21160888671875, 0.22991180419921875, 0.2482147216796875, 0.26651763916015625, 0.284820556640625, 0.30312347412109375, 0.3214263916015625, 0.33972930908203125, 0.3580322265625, 0.37633514404296875, 0.3946380615234375, 0.41294097900390625, 0.431243896484375, 0.44954681396484375, 0.4678497314453125, 0.48615264892578125, 0.50445556640625, 0.5227584838867188, 0.5410614013671875, 0.5593643188476562, 0.577667236328125, 0.5959701538085938, 0.6142730712890625, 0.6325759887695312, 0.65087890625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 12.0, 46.0, 510.0, 388.0, 36.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.754898548126221, -4.38496732711792, -4.015035629272461, -3.64510440826416, -3.2751729488372803, -2.9052414894104004, -2.5353102684020996, -2.1653788089752197, -1.7954473495483398, -1.42551589012146, -1.0555845499038696, -0.6856532096862793, -0.3157217502593994, 0.05420970916748047, 0.42414093017578125, 0.7940723896026611, 1.164003849029541, 1.533935308456421, 1.9038666486740112, 2.2737979888916016, 2.6437294483184814, 3.0136609077453613, 3.383592128753662, 3.753523588180542, 4.123455047607422, 4.493386268615723, 4.863317966461182, 5.233249187469482, 5.603180885314941, 5.973112106323242, 6.343043327331543, 6.712974548339844, 7.082906723022461, 7.452837944030762, 7.822769641876221, 8.19270133972168, 8.56263256072998, 8.932563781738281, 9.302495002746582, 9.672426223754883, 10.0423583984375, 10.4122896194458, 10.782220840454102, 11.152153015136719, 11.52208423614502, 11.89201545715332, 12.261946678161621, 12.631877899169922, 13.001809120178223, 13.371740341186523, 13.741671562194824, 14.111602783203125, 14.481534957885742, 14.851466178894043, 15.221397399902344, 15.591328620910645, 15.961259841918945, 16.331192016601562, 16.701122283935547, 17.071054458618164, 17.44098472595215, 17.810916900634766, 18.18084716796875, 18.550779342651367, 18.920711517333984]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 8.0, 6.0, 8.0, 9.0, 12.0, 14.0, 14.0, 27.0, 28.0, 27.0, 32.0, 48.0, 48.0, 54.0, 48.0, 69.0, 37.0, 62.0, 65.0, 49.0, 41.0, 46.0, 48.0, 46.0, 35.0, 21.0, 20.0, 14.0, 18.0, 9.0, 11.0, 6.0, 6.0, 3.0, 5.0, 2.0, 1.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3293942213058472, -1.2811225652694702, -1.2328509092330933, -1.1845792531967163, -1.1363075971603394, -1.0880359411239624, -1.039764165878296, -0.9914925694465637, -0.9432209134101868, -0.8949492573738098, -0.8466776013374329, -0.7984058856964111, -0.7501342296600342, -0.7018625736236572, -0.6535909175872803, -0.6053192615509033, -0.5570476055145264, -0.5087759494781494, -0.46050429344177246, -0.4122326076030731, -0.36396095156669617, -0.3156892955303192, -0.2674176096916199, -0.21914595365524292, -0.17087429761886597, -0.12260263413190842, -0.07433097064495087, -0.02605929970741272, 0.022212356328964233, 0.07048401236534119, 0.11875569820404053, 0.16702735424041748, 0.21529912948608398, 0.26357078552246094, 0.3118424415588379, 0.36011412739753723, 0.4083857834339142, 0.45665743947029114, 0.5049291253089905, 0.5532007813453674, 0.6014724373817444, 0.6497440934181213, 0.6980157494544983, 0.74628746509552, 0.794559121131897, 0.8428307771682739, 0.8911024332046509, 0.9393740892410278, 0.9876457452774048, 1.0359174013137817, 1.0841890573501587, 1.1324607133865356, 1.1807323694229126, 1.2290040254592896, 1.277275800704956, 1.325547456741333, 1.37381911277771, 1.422090768814087, 1.4703624248504639, 1.5186340808868408, 1.5669057369232178, 1.6151773929595947, 1.6634490489959717, 1.7117207050323486, 1.7599923610687256]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 4.0, 3.0, 14.0, 18.0, 21.0, 23.0, 30.0, 57.0, 54.0, 98.0, 123.0, 194.0, 278.0, 395.0, 561.0, 914.0, 1525.0, 3153.0, 9156.0, 38188.0, 187048.0, 529433.0, 215330.0, 43817.0, 10264.0, 3465.0, 1573.0, 928.0, 595.0, 400.0, 259.0, 189.0, 137.0, 100.0, 53.0, 36.0, 32.0, 25.0, 18.0, 16.0, 11.0, 8.0, 5.0, 7.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.37890625, -1.3389892578125, -1.299072265625, -1.2591552734375, -1.21923828125, -1.1793212890625, -1.139404296875, -1.0994873046875, -1.0595703125, -1.0196533203125, -0.979736328125, -0.9398193359375, -0.89990234375, -0.8599853515625, -0.820068359375, -0.7801513671875, -0.740234375, -0.7003173828125, -0.660400390625, -0.6204833984375, -0.58056640625, -0.5406494140625, -0.500732421875, -0.4608154296875, -0.4208984375, -0.3809814453125, -0.341064453125, -0.3011474609375, -0.26123046875, -0.2213134765625, -0.181396484375, -0.1414794921875, -0.1015625, -0.0616455078125, -0.021728515625, 0.0181884765625, 0.05810546875, 0.0980224609375, 0.137939453125, 0.1778564453125, 0.2177734375, 0.2576904296875, 0.297607421875, 0.3375244140625, 0.37744140625, 0.4173583984375, 0.457275390625, 0.4971923828125, 0.537109375, 0.5770263671875, 0.616943359375, 0.6568603515625, 0.69677734375, 0.7366943359375, 0.776611328125, 0.8165283203125, 0.8564453125, 0.8963623046875, 0.936279296875, 0.9761962890625, 1.01611328125, 1.0560302734375, 1.095947265625, 1.1358642578125, 1.17578125]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 6.0, 13.0, 30.0, 42.0, 66.0, 91.0, 109.0, 149.0, 130.0, 104.0, 103.0, 63.0, 36.0, 27.0, 11.0, 12.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.72216796875, -0.7009735107421875, -0.679779052734375, -0.6585845947265625, -0.63739013671875, -0.6161956787109375, -0.595001220703125, -0.5738067626953125, -0.5526123046875, -0.5314178466796875, -0.510223388671875, -0.4890289306640625, -0.46783447265625, -0.4466400146484375, -0.425445556640625, -0.4042510986328125, -0.383056640625, -0.3618621826171875, -0.340667724609375, -0.3194732666015625, -0.29827880859375, -0.2770843505859375, -0.255889892578125, -0.2346954345703125, -0.2135009765625, -0.1923065185546875, -0.171112060546875, -0.1499176025390625, -0.12872314453125, -0.1075286865234375, -0.086334228515625, -0.0651397705078125, -0.0439453125, -0.0227508544921875, -0.001556396484375, 0.0196380615234375, 0.04083251953125, 0.0620269775390625, 0.083221435546875, 0.1044158935546875, 0.1256103515625, 0.1468048095703125, 0.167999267578125, 0.1891937255859375, 0.21038818359375, 0.2315826416015625, 0.252777099609375, 0.2739715576171875, 0.295166015625, 0.3163604736328125, 0.337554931640625, 0.3587493896484375, 0.37994384765625, 0.4011383056640625, 0.422332763671875, 0.4435272216796875, 0.4647216796875, 0.4859161376953125, 0.507110595703125, 0.5283050537109375, 0.54949951171875, 0.5706939697265625, 0.591888427734375, 0.6130828857421875, 0.63427734375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 2.0, 5.0, 1.0, 7.0, 6.0, 10.0, 18.0, 21.0, 23.0, 28.0, 40.0, 66.0, 88.0, 134.0, 195.0, 323.0, 558.0, 1174.0, 2693.0, 7412.0, 22412.0, 69799.0, 206345.0, 390587.0, 228052.0, 78706.0, 25362.0, 8489.0, 3119.0, 1233.0, 595.0, 337.0, 207.0, 126.0, 102.0, 79.0, 47.0, 36.0, 33.0, 22.0, 18.0, 14.0, 9.0, 7.0, 3.0, 5.0, 5.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.642578125, -0.6215438842773438, -0.6005096435546875, -0.5794754028320312, -0.558441162109375, -0.5374069213867188, -0.5163726806640625, -0.49533843994140625, -0.47430419921875, -0.45326995849609375, -0.4322357177734375, -0.41120147705078125, -0.390167236328125, -0.36913299560546875, -0.3480987548828125, -0.32706451416015625, -0.3060302734375, -0.28499603271484375, -0.2639617919921875, -0.24292755126953125, -0.221893310546875, -0.20085906982421875, -0.1798248291015625, -0.15879058837890625, -0.13775634765625, -0.11672210693359375, -0.0956878662109375, -0.07465362548828125, -0.053619384765625, -0.03258514404296875, -0.0115509033203125, 0.00948333740234375, 0.030517578125, 0.05155181884765625, 0.0725860595703125, 0.09362030029296875, 0.114654541015625, 0.13568878173828125, 0.1567230224609375, 0.17775726318359375, 0.19879150390625, 0.21982574462890625, 0.2408599853515625, 0.26189422607421875, 0.282928466796875, 0.30396270751953125, 0.3249969482421875, 0.34603118896484375, 0.3670654296875, 0.38809967041015625, 0.4091339111328125, 0.43016815185546875, 0.451202392578125, 0.47223663330078125, 0.4932708740234375, 0.5143051147460938, 0.53533935546875, 0.5563735961914062, 0.5774078369140625, 0.5984420776367188, 0.619476318359375, 0.6405105590820312, 0.6615447998046875, 0.6825790405273438, 0.70361328125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 4.0, 7.0, 4.0, 8.0, 14.0, 12.0, 11.0, 20.0, 19.0, 23.0, 20.0, 26.0, 34.0, 39.0, 37.0, 32.0, 36.0, 39.0, 51.0, 52.0, 49.0, 52.0, 35.0, 38.0, 35.0, 32.0, 42.0, 36.0, 22.0, 24.0, 23.0, 23.0, 20.0, 20.0, 15.0, 11.0, 4.0, 8.0, 6.0, 6.0, 1.0, 3.0, 1.0, 4.0, 2.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.0107421875, -0.9805374145507812, -0.9503326416015625, -0.9201278686523438, -0.889923095703125, -0.8597183227539062, -0.8295135498046875, -0.7993087768554688, -0.76910400390625, -0.7388992309570312, -0.7086944580078125, -0.6784896850585938, -0.648284912109375, -0.6180801391601562, -0.5878753662109375, -0.5576705932617188, -0.5274658203125, -0.49726104736328125, -0.4670562744140625, -0.43685150146484375, -0.406646728515625, -0.37644195556640625, -0.3462371826171875, -0.31603240966796875, -0.28582763671875, -0.25562286376953125, -0.2254180908203125, -0.19521331787109375, -0.165008544921875, -0.13480377197265625, -0.1045989990234375, -0.07439422607421875, -0.044189453125, -0.01398468017578125, 0.0162200927734375, 0.04642486572265625, 0.076629638671875, 0.10683441162109375, 0.1370391845703125, 0.16724395751953125, 0.19744873046875, 0.22765350341796875, 0.2578582763671875, 0.28806304931640625, 0.318267822265625, 0.34847259521484375, 0.3786773681640625, 0.40888214111328125, 0.4390869140625, 0.46929168701171875, 0.4994964599609375, 0.5297012329101562, 0.559906005859375, 0.5901107788085938, 0.6203155517578125, 0.6505203247070312, 0.68072509765625, 0.7109298706054688, 0.7411346435546875, 0.7713394165039062, 0.801544189453125, 0.8317489624023438, 0.8619537353515625, 0.8921585083007812, 0.92236328125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 3.0, 5.0, 7.0, 9.0, 10.0, 18.0, 36.0, 44.0, 93.0, 168.0, 348.0, 777.0, 2087.0, 7075.0, 43723.0, 424502.0, 502879.0, 54650.0, 8181.0, 2222.0, 877.0, 395.0, 200.0, 87.0, 62.0, 40.0, 26.0, 14.0, 8.0, 1.0, 3.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5029296875, -0.48673248291015625, -0.4705352783203125, -0.45433807373046875, -0.438140869140625, -0.42194366455078125, -0.4057464599609375, -0.38954925537109375, -0.37335205078125, -0.35715484619140625, -0.3409576416015625, -0.32476043701171875, -0.308563232421875, -0.29236602783203125, -0.2761688232421875, -0.25997161865234375, -0.2437744140625, -0.22757720947265625, -0.2113800048828125, -0.19518280029296875, -0.178985595703125, -0.16278839111328125, -0.1465911865234375, -0.13039398193359375, -0.11419677734375, -0.09799957275390625, -0.0818023681640625, -0.06560516357421875, -0.049407958984375, -0.03321075439453125, -0.0170135498046875, -0.00081634521484375, 0.015380859375, 0.03157806396484375, 0.0477752685546875, 0.06397247314453125, 0.080169677734375, 0.09636688232421875, 0.1125640869140625, 0.12876129150390625, 0.14495849609375, 0.16115570068359375, 0.1773529052734375, 0.19355010986328125, 0.209747314453125, 0.22594451904296875, 0.2421417236328125, 0.25833892822265625, 0.2745361328125, 0.29073333740234375, 0.3069305419921875, 0.32312774658203125, 0.339324951171875, 0.35552215576171875, 0.3717193603515625, 0.38791656494140625, 0.40411376953125, 0.42031097412109375, 0.4365081787109375, 0.45270538330078125, 0.468902587890625, 0.48509979248046875, 0.5012969970703125, 0.5174942016601562, 0.53369140625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 6.0, 10.0, 6.0, 12.0, 13.0, 22.0, 21.0, 22.0, 32.0, 41.0, 55.0, 60.0, 55.0, 71.0, 62.0, 79.0, 81.0, 57.0, 62.0, 50.0, 35.0, 27.0, 23.0, 23.0, 16.0, 19.0, 9.0, 9.0, 6.0, 5.0, 4.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4405460357666016e-05, -4.2557716369628906e-05, -4.07099723815918e-05, -3.886222839355469e-05, -3.701448440551758e-05, -3.516674041748047e-05, -3.331899642944336e-05, -3.147125244140625e-05, -2.962350845336914e-05, -2.777576446533203e-05, -2.5928020477294922e-05, -2.4080276489257812e-05, -2.2232532501220703e-05, -2.0384788513183594e-05, -1.8537044525146484e-05, -1.6689300537109375e-05, -1.4841556549072266e-05, -1.2993812561035156e-05, -1.1146068572998047e-05, -9.298324584960938e-06, -7.450580596923828e-06, -5.602836608886719e-06, -3.7550926208496094e-06, -1.9073486328125e-06, -5.960464477539063e-08, 1.7881393432617188e-06, 3.635883331298828e-06, 5.4836273193359375e-06, 7.331371307373047e-06, 9.179115295410156e-06, 1.1026859283447266e-05, 1.2874603271484375e-05, 1.4722347259521484e-05, 1.6570091247558594e-05, 1.8417835235595703e-05, 2.0265579223632812e-05, 2.2113323211669922e-05, 2.396106719970703e-05, 2.580881118774414e-05, 2.765655517578125e-05, 2.950429916381836e-05, 3.135204315185547e-05, 3.319978713989258e-05, 3.504753112792969e-05, 3.68952751159668e-05, 3.8743019104003906e-05, 4.0590763092041016e-05, 4.2438507080078125e-05, 4.4286251068115234e-05, 4.6133995056152344e-05, 4.798173904418945e-05, 4.982948303222656e-05, 5.167722702026367e-05, 5.352497100830078e-05, 5.537271499633789e-05, 5.7220458984375e-05, 5.906820297241211e-05, 6.091594696044922e-05, 6.276369094848633e-05, 6.461143493652344e-05, 6.645917892456055e-05, 6.830692291259766e-05, 7.015466690063477e-05, 7.200241088867188e-05, 7.385015487670898e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 4.0, 16.0, 20.0, 38.0, 49.0, 108.0, 164.0, 419.0, 1386.0, 6663.0, 52815.0, 536656.0, 406214.0, 37009.0, 5054.0, 1188.0, 371.0, 154.0, 93.0, 47.0, 31.0, 32.0, 18.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.76904296875, -0.7476348876953125, -0.726226806640625, -0.7048187255859375, -0.68341064453125, -0.6620025634765625, -0.640594482421875, -0.6191864013671875, -0.5977783203125, -0.5763702392578125, -0.554962158203125, -0.5335540771484375, -0.51214599609375, -0.4907379150390625, -0.469329833984375, -0.4479217529296875, -0.426513671875, -0.4051055908203125, -0.383697509765625, -0.3622894287109375, -0.34088134765625, -0.3194732666015625, -0.298065185546875, -0.2766571044921875, -0.2552490234375, -0.2338409423828125, -0.212432861328125, -0.1910247802734375, -0.16961669921875, -0.1482086181640625, -0.126800537109375, -0.1053924560546875, -0.083984375, -0.0625762939453125, -0.041168212890625, -0.0197601318359375, 0.00164794921875, 0.0230560302734375, 0.044464111328125, 0.0658721923828125, 0.0872802734375, 0.1086883544921875, 0.130096435546875, 0.1515045166015625, 0.17291259765625, 0.1943206787109375, 0.215728759765625, 0.2371368408203125, 0.258544921875, 0.2799530029296875, 0.301361083984375, 0.3227691650390625, 0.34417724609375, 0.3655853271484375, 0.386993408203125, 0.4084014892578125, 0.4298095703125, 0.4512176513671875, 0.472625732421875, 0.4940338134765625, 0.51544189453125, 0.5368499755859375, 0.558258056640625, 0.5796661376953125, 0.60107421875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 9.0, 5.0, 16.0, 14.0, 11.0, 20.0, 13.0, 24.0, 23.0, 43.0, 34.0, 43.0, 55.0, 70.0, 81.0, 70.0, 69.0, 75.0, 55.0, 50.0, 39.0, 25.0, 35.0, 23.0, 20.0, 11.0, 19.0, 9.0, 7.0, 8.0, 3.0, 3.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.341552734375, -0.330291748046875, -0.31903076171875, -0.307769775390625, -0.2965087890625, -0.285247802734375, -0.27398681640625, -0.262725830078125, -0.25146484375, -0.240203857421875, -0.22894287109375, -0.217681884765625, -0.2064208984375, -0.195159912109375, -0.18389892578125, -0.172637939453125, -0.161376953125, -0.150115966796875, -0.13885498046875, -0.127593994140625, -0.1163330078125, -0.105072021484375, -0.09381103515625, -0.082550048828125, -0.0712890625, -0.060028076171875, -0.04876708984375, -0.037506103515625, -0.0262451171875, -0.014984130859375, -0.00372314453125, 0.007537841796875, 0.018798828125, 0.030059814453125, 0.04132080078125, 0.052581787109375, 0.0638427734375, 0.075103759765625, 0.08636474609375, 0.097625732421875, 0.10888671875, 0.120147705078125, 0.13140869140625, 0.142669677734375, 0.1539306640625, 0.165191650390625, 0.17645263671875, 0.187713623046875, 0.198974609375, 0.210235595703125, 0.22149658203125, 0.232757568359375, 0.2440185546875, 0.255279541015625, 0.26654052734375, 0.277801513671875, 0.2890625, 0.300323486328125, 0.31158447265625, 0.322845458984375, 0.3341064453125, 0.345367431640625, 0.35662841796875, 0.367889404296875, 0.379150390625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 9.0, 26.0, 79.0, 209.0, 276.0, 213.0, 124.0, 40.0, 19.0, 7.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.354331970214844, -11.903773307800293, -11.453214645385742, -11.002655982971191, -10.55209732055664, -10.10153865814209, -9.650979995727539, -9.200422286987305, -8.749862670898438, -8.299304008483887, -7.848745346069336, -7.398186683654785, -6.947628021240234, -6.497069358825684, -6.046511173248291, -5.59595251083374, -5.145394325256348, -4.694835662841797, -4.244277000427246, -3.7937185764312744, -3.3431599140167236, -2.892601251602173, -2.442042827606201, -1.9914841651916504, -1.5409255027770996, -1.0903668403625488, -0.6398082971572876, -0.18924975395202637, 0.2613089084625244, 0.7118675708770752, 1.1624259948730469, 1.6129846572875977, 2.0635433197021484, 2.514101982116699, 2.96466064453125, 3.4152190685272217, 3.8657777309417725, 4.316336631774902, 4.766894817352295, 5.217453479766846, 5.6680121421813965, 6.118570804595947, 6.569129467010498, 7.019687652587891, 7.470246315002441, 7.920804977416992, 8.371363639831543, 8.821922302246094, 9.272480964660645, 9.723039627075195, 10.173598289489746, 10.624156951904297, 11.074715614318848, 11.525274276733398, 11.975831985473633, 12.4263916015625, 12.876949310302734, 13.327507972717285, 13.778066635131836, 14.228625297546387, 14.679183959960938, 15.129742622375488, 15.580301284790039, 16.030858993530273, 16.48141860961914]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 2.0, 0.0, 6.0, 5.0, 9.0, 7.0, 9.0, 14.0, 11.0, 11.0, 14.0, 19.0, 16.0, 26.0, 20.0, 20.0, 34.0, 28.0, 42.0, 38.0, 41.0, 35.0, 40.0, 37.0, 46.0, 37.0, 36.0, 38.0, 31.0, 36.0, 35.0, 27.0, 29.0, 28.0, 22.0, 24.0, 21.0, 21.0, 13.0, 5.0, 21.0, 9.0, 10.0, 11.0, 4.0, 6.0, 3.0, 2.0, 0.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.773796081542969, -4.630876541137695, -4.487957000732422, -4.345037460327148, -4.202117919921875, -4.059198379516602, -3.9162790775299072, -3.773359537124634, -3.6304399967193604, -3.487520456314087, -3.3446009159088135, -3.20168137550354, -3.0587620735168457, -2.9158425331115723, -2.772922992706299, -2.6300034523010254, -2.487083911895752, -2.3441643714904785, -2.201244831085205, -2.0583252906799316, -1.9154058694839478, -1.7724863290786743, -1.6295669078826904, -1.486647367477417, -1.3437278270721436, -1.2008082866668701, -1.0578887462615967, -0.9149693250656128, -0.7720497846603394, -0.6291302442550659, -0.48621076345443726, -0.3432912826538086, -0.20037174224853516, -0.057452231645584106, 0.08546727895736694, 0.228386789560318, 0.37130630016326904, 0.5142258405685425, 0.6571453213691711, 0.8000648021697998, 0.9429843425750732, 1.0859038829803467, 1.2288234233856201, 1.371742844581604, 1.5146623849868774, 1.6575819253921509, 1.8005013465881348, 1.9434208869934082, 2.0863404273986816, 2.229259967803955, 2.3721795082092285, 2.515099048614502, 2.6580185890197754, 2.800938129425049, 2.943857431411743, 3.0867769718170166, 3.22969651222229, 3.3726160526275635, 3.515535593032837, 3.6584551334381104, 3.8013744354248047, 3.944293975830078, 4.087213516235352, 4.230133056640625, 4.373052597045898]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 3.0, 11.0, 11.0, 11.0, 12.0, 11.0, 21.0, 31.0, 50.0, 67.0, 81.0, 123.0, 207.0, 356.0, 639.0, 1535.0, 3959.0, 14122.0, 82710.0, 3882832.0, 176342.0, 20955.0, 5584.0, 2077.0, 972.0, 521.0, 349.0, 224.0, 147.0, 99.0, 64.0, 50.0, 21.0, 27.0, 13.0, 13.0, 7.0, 6.0, 4.0, 7.0, 8.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9013671875, -1.8431243896484375, -1.784881591796875, -1.7266387939453125, -1.66839599609375, -1.6101531982421875, -1.551910400390625, -1.4936676025390625, -1.4354248046875, -1.3771820068359375, -1.318939208984375, -1.2606964111328125, -1.20245361328125, -1.1442108154296875, -1.085968017578125, -1.0277252197265625, -0.969482421875, -0.9112396240234375, -0.852996826171875, -0.7947540283203125, -0.73651123046875, -0.6782684326171875, -0.620025634765625, -0.5617828369140625, -0.5035400390625, -0.4452972412109375, -0.387054443359375, -0.3288116455078125, -0.27056884765625, -0.2123260498046875, -0.154083251953125, -0.0958404541015625, -0.03759765625, 0.0206451416015625, 0.078887939453125, 0.1371307373046875, 0.19537353515625, 0.2536163330078125, 0.311859130859375, 0.3701019287109375, 0.4283447265625, 0.4865875244140625, 0.544830322265625, 0.6030731201171875, 0.66131591796875, 0.7195587158203125, 0.777801513671875, 0.8360443115234375, 0.894287109375, 0.9525299072265625, 1.010772705078125, 1.0690155029296875, 1.12725830078125, 1.1855010986328125, 1.243743896484375, 1.3019866943359375, 1.3602294921875, 1.4184722900390625, 1.476715087890625, 1.5349578857421875, 1.59320068359375, 1.6514434814453125, 1.709686279296875, 1.7679290771484375, 1.826171875]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 1.0, 6.0, 16.0, 30.0, 53.0, 69.0, 106.0, 129.0, 119.0, 139.0, 115.0, 75.0, 66.0, 32.0, 19.0, 9.0, 8.0, 3.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.767578125, -0.7455215454101562, -0.7234649658203125, -0.7014083862304688, -0.679351806640625, -0.6572952270507812, -0.6352386474609375, -0.6131820678710938, -0.59112548828125, -0.5690689086914062, -0.5470123291015625, -0.5249557495117188, -0.502899169921875, -0.48084259033203125, -0.4587860107421875, -0.43672943115234375, -0.4146728515625, -0.39261627197265625, -0.3705596923828125, -0.34850311279296875, -0.326446533203125, -0.30438995361328125, -0.2823333740234375, -0.26027679443359375, -0.23822021484375, -0.21616363525390625, -0.1941070556640625, -0.17205047607421875, -0.149993896484375, -0.12793731689453125, -0.1058807373046875, -0.08382415771484375, -0.061767578125, -0.03971099853515625, -0.0176544189453125, 0.00440216064453125, 0.026458740234375, 0.04851531982421875, 0.0705718994140625, 0.09262847900390625, 0.11468505859375, 0.13674163818359375, 0.1587982177734375, 0.18085479736328125, 0.202911376953125, 0.22496795654296875, 0.2470245361328125, 0.26908111572265625, 0.2911376953125, 0.31319427490234375, 0.3352508544921875, 0.35730743408203125, 0.379364013671875, 0.40142059326171875, 0.4234771728515625, 0.44553375244140625, 0.46759033203125, 0.48964691162109375, 0.5117034912109375, 0.5337600708007812, 0.555816650390625, 0.5778732299804688, 0.5999298095703125, 0.6219863891601562, 0.64404296875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 10.0, 9.0, 15.0, 30.0, 38.0, 57.0, 81.0, 173.0, 285.0, 414.0, 730.0, 1342.0, 2481.0, 5198.0, 13637.0, 46751.0, 301498.0, 3601738.0, 167222.0, 32786.0, 10347.0, 4413.0, 2194.0, 1148.0, 715.0, 379.0, 254.0, 116.0, 90.0, 50.0, 30.0, 19.0, 12.0, 9.0, 5.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1875, -1.1539306640625, -1.120361328125, -1.0867919921875, -1.05322265625, -1.0196533203125, -0.986083984375, -0.9525146484375, -0.9189453125, -0.8853759765625, -0.851806640625, -0.8182373046875, -0.78466796875, -0.7510986328125, -0.717529296875, -0.6839599609375, -0.650390625, -0.6168212890625, -0.583251953125, -0.5496826171875, -0.51611328125, -0.4825439453125, -0.448974609375, -0.4154052734375, -0.3818359375, -0.3482666015625, -0.314697265625, -0.2811279296875, -0.24755859375, -0.2139892578125, -0.180419921875, -0.1468505859375, -0.11328125, -0.0797119140625, -0.046142578125, -0.0125732421875, 0.02099609375, 0.0545654296875, 0.088134765625, 0.1217041015625, 0.1552734375, 0.1888427734375, 0.222412109375, 0.2559814453125, 0.28955078125, 0.3231201171875, 0.356689453125, 0.3902587890625, 0.423828125, 0.4573974609375, 0.490966796875, 0.5245361328125, 0.55810546875, 0.5916748046875, 0.625244140625, 0.6588134765625, 0.6923828125, 0.7259521484375, 0.759521484375, 0.7930908203125, 0.82666015625, 0.8602294921875, 0.893798828125, 0.9273681640625, 0.9609375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 5.0, 14.0, 12.0, 11.0, 18.0, 34.0, 32.0, 93.0, 207.0, 993.0, 2079.0, 286.0, 117.0, 64.0, 34.0, 18.0, 17.0, 17.0, 5.0, 7.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6611328125, -0.6384048461914062, -0.6156768798828125, -0.5929489135742188, -0.570220947265625, -0.5474929809570312, -0.5247650146484375, -0.5020370483398438, -0.47930908203125, -0.45658111572265625, -0.4338531494140625, -0.41112518310546875, -0.388397216796875, -0.36566925048828125, -0.3429412841796875, -0.32021331787109375, -0.2974853515625, -0.27475738525390625, -0.2520294189453125, -0.22930145263671875, -0.206573486328125, -0.18384552001953125, -0.1611175537109375, -0.13838958740234375, -0.11566162109375, -0.09293365478515625, -0.0702056884765625, -0.04747772216796875, -0.024749755859375, -0.00202178955078125, 0.0207061767578125, 0.04343414306640625, 0.066162109375, 0.08889007568359375, 0.1116180419921875, 0.13434600830078125, 0.157073974609375, 0.17980194091796875, 0.2025299072265625, 0.22525787353515625, 0.24798583984375, 0.27071380615234375, 0.2934417724609375, 0.31616973876953125, 0.338897705078125, 0.36162567138671875, 0.3843536376953125, 0.40708160400390625, 0.4298095703125, 0.45253753662109375, 0.4752655029296875, 0.49799346923828125, 0.520721435546875, 0.5434494018554688, 0.5661773681640625, 0.5889053344726562, 0.61163330078125, 0.6343612670898438, 0.6570892333984375, 0.6798171997070312, 0.702545166015625, 0.7252731323242188, 0.7480010986328125, 0.7707290649414062, 0.79345703125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 4.0, 8.0, 12.0, 38.0, 133.0, 281.0, 274.0, 155.0, 60.0, 22.0, 8.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.252060890197754, -3.0498206615448, -2.8475801944732666, -2.6453399658203125, -2.4430997371673584, -2.2408595085144043, -2.038619041442871, -1.836378812789917, -1.6341384649276733, -1.4318981170654297, -1.2296578884124756, -1.027417540550232, -0.8251772522926331, -0.6229369640350342, -0.4206966161727905, -0.21845638751983643, -0.016216039657592773, 0.1860242635011673, 0.38826456665992737, 0.5905048847198486, 0.7927451729774475, 0.9949854612350464, 1.19722580909729, 1.3994660377502441, 1.6017063856124878, 1.8039467334747314, 2.0061869621276855, 2.2084274291992188, 2.410667657852173, 2.612907886505127, 2.81514835357666, 3.017388343811035, 3.2196288108825684, 3.4218690395355225, 3.6241095066070557, 3.8263497352600098, 4.028590202331543, 4.230830192565918, 4.433070659637451, 4.635311126708984, 4.837551116943359, 5.039791584014893, 5.242031574249268, 5.444272041320801, 5.646512508392334, 5.848752498626709, 6.050992965698242, 6.253232955932617, 6.455473899841309, 6.657714366912842, 6.859954357147217, 7.06219482421875, 7.264435291290283, 7.466675281524658, 7.668915748596191, 7.871155738830566, 8.073395729064941, 8.275635719299316, 8.477876663208008, 8.680116653442383, 8.882356643676758, 9.08459758758545, 9.286837577819824, 9.4890775680542, 9.69131851196289]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 8.0, 11.0, 6.0, 23.0, 17.0, 28.0, 27.0, 33.0, 32.0, 38.0, 37.0, 50.0, 57.0, 60.0, 57.0, 53.0, 58.0, 53.0, 43.0, 55.0, 45.0, 38.0, 29.0, 30.0, 21.0, 28.0, 18.0, 14.0, 9.0, 5.0, 3.0, 1.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-2.105159282684326, -2.0450165271759033, -1.984873652458191, -1.924730896949768, -1.8645880222320557, -1.8044452667236328, -1.74430251121521, -1.6841596364974976, -1.6240167617797852, -1.5638740062713623, -1.50373113155365, -1.443588376045227, -1.3834455013275146, -1.3233027458190918, -1.263159990310669, -1.2030171155929565, -1.1428743600845337, -1.0827316045761108, -1.0225887298583984, -0.9624459743499756, -0.9023030996322632, -0.8421603441238403, -0.7820175290107727, -0.7218747138977051, -0.6617318987846375, -0.6015890836715698, -0.5414462685585022, -0.48130348324775696, -0.42116066813468933, -0.3610178530216217, -0.30087506771087646, -0.24073225259780884, -0.1805894374847412, -0.12044662982225418, -0.06030382215976715, -0.00016102194786071777, 0.05998179316520691, 0.12012460827827454, 0.18026739358901978, 0.2404102087020874, 0.30055302381515503, 0.36069583892822266, 0.4208386540412903, 0.4809814393520355, 0.5411242246627808, 0.6012670993804932, 0.661409854888916, 0.7215526700019836, 0.7816954851150513, 0.8418383002281189, 0.9019811153411865, 0.9621238708496094, 1.0222667455673218, 1.0824095010757446, 1.142552375793457, 1.2026951313018799, 1.2628378868103027, 1.3229806423187256, 1.383123517036438, 1.4432662725448608, 1.5034091472625732, 1.563551902770996, 1.623694658279419, 1.6838375329971313, 1.7439804077148438]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 2.0, 7.0, 7.0, 20.0, 13.0, 33.0, 44.0, 63.0, 85.0, 159.0, 239.0, 395.0, 678.0, 1276.0, 2534.0, 7341.0, 37224.0, 297865.0, 579933.0, 97891.0, 14745.0, 4039.0, 1775.0, 880.0, 459.0, 297.0, 188.0, 113.0, 74.0, 58.0, 36.0, 27.0, 12.0, 9.0, 8.0, 7.0, 6.0, 4.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0], "bins": [-2.013671875, -1.9595947265625, -1.905517578125, -1.8514404296875, -1.79736328125, -1.7432861328125, -1.689208984375, -1.6351318359375, -1.5810546875, -1.5269775390625, -1.472900390625, -1.4188232421875, -1.36474609375, -1.3106689453125, -1.256591796875, -1.2025146484375, -1.1484375, -1.0943603515625, -1.040283203125, -0.9862060546875, -0.93212890625, -0.8780517578125, -0.823974609375, -0.7698974609375, -0.7158203125, -0.6617431640625, -0.607666015625, -0.5535888671875, -0.49951171875, -0.4454345703125, -0.391357421875, -0.3372802734375, -0.283203125, -0.2291259765625, -0.175048828125, -0.1209716796875, -0.06689453125, -0.0128173828125, 0.041259765625, 0.0953369140625, 0.1494140625, 0.2034912109375, 0.257568359375, 0.3116455078125, 0.36572265625, 0.4197998046875, 0.473876953125, 0.5279541015625, 0.58203125, 0.6361083984375, 0.690185546875, 0.7442626953125, 0.79833984375, 0.8524169921875, 0.906494140625, 0.9605712890625, 1.0146484375, 1.0687255859375, 1.122802734375, 1.1768798828125, 1.23095703125, 1.2850341796875, 1.339111328125, 1.3931884765625, 1.447265625]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 8.0, 4.0, 6.0, 21.0, 32.0, 56.0, 75.0, 112.0, 142.0, 102.0, 127.0, 104.0, 88.0, 46.0, 41.0, 19.0, 8.0, 7.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7783203125, -0.7558517456054688, -0.7333831787109375, -0.7109146118164062, -0.688446044921875, -0.6659774780273438, -0.6435089111328125, -0.6210403442382812, -0.59857177734375, -0.5761032104492188, -0.5536346435546875, -0.5311660766601562, -0.508697509765625, -0.48622894287109375, -0.4637603759765625, -0.44129180908203125, -0.4188232421875, -0.39635467529296875, -0.3738861083984375, -0.35141754150390625, -0.328948974609375, -0.30648040771484375, -0.2840118408203125, -0.26154327392578125, -0.23907470703125, -0.21660614013671875, -0.1941375732421875, -0.17166900634765625, -0.149200439453125, -0.12673187255859375, -0.1042633056640625, -0.08179473876953125, -0.059326171875, -0.03685760498046875, -0.0143890380859375, 0.00807952880859375, 0.030548095703125, 0.05301666259765625, 0.0754852294921875, 0.09795379638671875, 0.12042236328125, 0.14289093017578125, 0.1653594970703125, 0.18782806396484375, 0.210296630859375, 0.23276519775390625, 0.2552337646484375, 0.27770233154296875, 0.3001708984375, 0.32263946533203125, 0.3451080322265625, 0.36757659912109375, 0.390045166015625, 0.41251373291015625, 0.4349822998046875, 0.45745086669921875, 0.47991943359375, 0.5023880004882812, 0.5248565673828125, 0.5473251342773438, 0.569793701171875, 0.5922622680664062, 0.6147308349609375, 0.6371994018554688, 0.65966796875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 3.0, 8.0, 6.0, 6.0, 14.0, 27.0, 41.0, 65.0, 92.0, 128.0, 188.0, 429.0, 824.0, 1967.0, 5845.0, 21703.0, 115195.0, 540182.0, 295588.0, 49181.0, 10955.0, 3424.0, 1254.0, 595.0, 307.0, 175.0, 115.0, 83.0, 50.0, 41.0, 20.0, 13.0, 12.0, 5.0, 4.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.181640625, -1.14556884765625, -1.1094970703125, -1.07342529296875, -1.037353515625, -1.00128173828125, -0.9652099609375, -0.92913818359375, -0.89306640625, -0.85699462890625, -0.8209228515625, -0.78485107421875, -0.748779296875, -0.71270751953125, -0.6766357421875, -0.64056396484375, -0.6044921875, -0.56842041015625, -0.5323486328125, -0.49627685546875, -0.460205078125, -0.42413330078125, -0.3880615234375, -0.35198974609375, -0.31591796875, -0.27984619140625, -0.2437744140625, -0.20770263671875, -0.171630859375, -0.13555908203125, -0.0994873046875, -0.06341552734375, -0.02734375, 0.00872802734375, 0.0447998046875, 0.08087158203125, 0.116943359375, 0.15301513671875, 0.1890869140625, 0.22515869140625, 0.26123046875, 0.29730224609375, 0.3333740234375, 0.36944580078125, 0.405517578125, 0.44158935546875, 0.4776611328125, 0.51373291015625, 0.5498046875, 0.58587646484375, 0.6219482421875, 0.65802001953125, 0.694091796875, 0.73016357421875, 0.7662353515625, 0.80230712890625, 0.83837890625, 0.87445068359375, 0.9105224609375, 0.94659423828125, 0.982666015625, 1.01873779296875, 1.0548095703125, 1.09088134765625, 1.126953125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 2.0, 9.0, 5.0, 7.0, 18.0, 14.0, 24.0, 27.0, 38.0, 42.0, 44.0, 53.0, 61.0, 62.0, 69.0, 63.0, 67.0, 67.0, 53.0, 56.0, 49.0, 38.0, 26.0, 22.0, 21.0, 15.0, 14.0, 7.0, 10.0, 7.0, 6.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9267578125, -1.8786163330078125, -1.830474853515625, -1.7823333740234375, -1.73419189453125, -1.6860504150390625, -1.637908935546875, -1.5897674560546875, -1.5416259765625, -1.4934844970703125, -1.445343017578125, -1.3972015380859375, -1.34906005859375, -1.3009185791015625, -1.252777099609375, -1.2046356201171875, -1.156494140625, -1.1083526611328125, -1.060211181640625, -1.0120697021484375, -0.96392822265625, -0.9157867431640625, -0.867645263671875, -0.8195037841796875, -0.7713623046875, -0.7232208251953125, -0.675079345703125, -0.6269378662109375, -0.57879638671875, -0.5306549072265625, -0.482513427734375, -0.4343719482421875, -0.38623046875, -0.3380889892578125, -0.289947509765625, -0.2418060302734375, -0.19366455078125, -0.1455230712890625, -0.097381591796875, -0.0492401123046875, -0.0010986328125, 0.0470428466796875, 0.095184326171875, 0.1433258056640625, 0.19146728515625, 0.2396087646484375, 0.287750244140625, 0.3358917236328125, 0.384033203125, 0.4321746826171875, 0.480316162109375, 0.5284576416015625, 0.57659912109375, 0.6247406005859375, 0.672882080078125, 0.7210235595703125, 0.7691650390625, 0.8173065185546875, 0.865447998046875, 0.9135894775390625, 0.96173095703125, 1.0098724365234375, 1.058013916015625, 1.1061553955078125, 1.154296875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 4.0, 4.0, 3.0, 8.0, 5.0, 12.0, 18.0, 21.0, 17.0, 35.0, 59.0, 76.0, 127.0, 216.0, 371.0, 706.0, 1461.0, 3618.0, 10475.0, 39126.0, 179177.0, 494593.0, 243182.0, 53388.0, 13597.0, 4560.0, 1755.0, 823.0, 415.0, 256.0, 143.0, 108.0, 49.0, 42.0, 33.0, 12.0, 13.0, 14.0, 11.0, 6.0, 6.0, 2.0, 4.0, 1.0, 0.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.384765625, -0.37131500244140625, -0.3578643798828125, -0.34441375732421875, -0.330963134765625, -0.31751251220703125, -0.3040618896484375, -0.29061126708984375, -0.27716064453125, -0.26371002197265625, -0.2502593994140625, -0.23680877685546875, -0.223358154296875, -0.20990753173828125, -0.1964569091796875, -0.18300628662109375, -0.1695556640625, -0.15610504150390625, -0.1426544189453125, -0.12920379638671875, -0.115753173828125, -0.10230255126953125, -0.0888519287109375, -0.07540130615234375, -0.06195068359375, -0.04850006103515625, -0.0350494384765625, -0.02159881591796875, -0.008148193359375, 0.00530242919921875, 0.0187530517578125, 0.03220367431640625, 0.045654296875, 0.05910491943359375, 0.0725555419921875, 0.08600616455078125, 0.099456787109375, 0.11290740966796875, 0.1263580322265625, 0.13980865478515625, 0.15325927734375, 0.16670989990234375, 0.1801605224609375, 0.19361114501953125, 0.207061767578125, 0.22051239013671875, 0.2339630126953125, 0.24741363525390625, 0.2608642578125, 0.27431488037109375, 0.2877655029296875, 0.30121612548828125, 0.314666748046875, 0.32811737060546875, 0.3415679931640625, 0.35501861572265625, 0.36846923828125, 0.38191986083984375, 0.3953704833984375, 0.40882110595703125, 0.422271728515625, 0.43572235107421875, 0.4491729736328125, 0.46262359619140625, 0.47607421875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 3.0, 9.0, 2.0, 9.0, 11.0, 14.0, 29.0, 39.0, 57.0, 57.0, 95.0, 91.0, 111.0, 112.0, 95.0, 73.0, 57.0, 28.0, 33.0, 26.0, 12.0, 13.0, 9.0, 5.0, 5.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011366605758666992, -0.00011045299470424652, -0.00010723993182182312, -0.00010402686893939972, -0.00010081380605697632, -9.760074317455292e-05, -9.438768029212952e-05, -9.117461740970612e-05, -8.796155452728271e-05, -8.474849164485931e-05, -8.153542876243591e-05, -7.832236588001251e-05, -7.510930299758911e-05, -7.189624011516571e-05, -6.868317723274231e-05, -6.547011435031891e-05, -6.225705146789551e-05, -5.904398858547211e-05, -5.5830925703048706e-05, -5.2617862820625305e-05, -4.9404799938201904e-05, -4.6191737055778503e-05, -4.29786741733551e-05, -3.97656112909317e-05, -3.65525484085083e-05, -3.33394855260849e-05, -3.01264226436615e-05, -2.6913359761238098e-05, -2.3700296878814697e-05, -2.0487233996391296e-05, -1.7274171113967896e-05, -1.4061108231544495e-05, -1.0848045349121094e-05, -7.634982466697693e-06, -4.421919584274292e-06, -1.2088567018508911e-06, 2.0042061805725098e-06, 5.217269062995911e-06, 8.430331945419312e-06, 1.1643394827842712e-05, 1.4856457710266113e-05, 1.8069520592689514e-05, 2.1282583475112915e-05, 2.4495646357536316e-05, 2.7708709239959717e-05, 3.092177212238312e-05, 3.413483500480652e-05, 3.734789788722992e-05, 4.056096076965332e-05, 4.377402365207672e-05, 4.698708653450012e-05, 5.020014941692352e-05, 5.3413212299346924e-05, 5.6626275181770325e-05, 5.9839338064193726e-05, 6.305240094661713e-05, 6.626546382904053e-05, 6.947852671146393e-05, 7.269158959388733e-05, 7.590465247631073e-05, 7.911771535873413e-05, 8.233077824115753e-05, 8.554384112358093e-05, 8.875690400600433e-05, 9.196996688842773e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 5.0, 5.0, 10.0, 9.0, 24.0, 42.0, 55.0, 114.0, 209.0, 421.0, 1042.0, 2821.0, 10953.0, 73902.0, 514715.0, 385156.0, 47384.0, 7821.0, 2234.0, 825.0, 373.0, 170.0, 121.0, 52.0, 37.0, 23.0, 8.0, 9.0, 6.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.541015625, -0.5216217041015625, -0.502227783203125, -0.4828338623046875, -0.46343994140625, -0.4440460205078125, -0.424652099609375, -0.4052581787109375, -0.3858642578125, -0.3664703369140625, -0.347076416015625, -0.3276824951171875, -0.30828857421875, -0.2888946533203125, -0.269500732421875, -0.2501068115234375, -0.230712890625, -0.2113189697265625, -0.191925048828125, -0.1725311279296875, -0.15313720703125, -0.1337432861328125, -0.114349365234375, -0.0949554443359375, -0.0755615234375, -0.0561676025390625, -0.036773681640625, -0.0173797607421875, 0.00201416015625, 0.0214080810546875, 0.040802001953125, 0.0601959228515625, 0.07958984375, 0.0989837646484375, 0.118377685546875, 0.1377716064453125, 0.15716552734375, 0.1765594482421875, 0.195953369140625, 0.2153472900390625, 0.2347412109375, 0.2541351318359375, 0.273529052734375, 0.2929229736328125, 0.31231689453125, 0.3317108154296875, 0.351104736328125, 0.3704986572265625, 0.389892578125, 0.4092864990234375, 0.428680419921875, 0.4480743408203125, 0.46746826171875, 0.4868621826171875, 0.506256103515625, 0.5256500244140625, 0.5450439453125, 0.5644378662109375, 0.583831787109375, 0.6032257080078125, 0.62261962890625, 0.6420135498046875, 0.661407470703125, 0.6808013916015625, 0.7001953125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 6.0, 7.0, 9.0, 10.0, 20.0, 26.0, 42.0, 54.0, 86.0, 108.0, 122.0, 134.0, 100.0, 73.0, 59.0, 45.0, 30.0, 19.0, 22.0, 13.0, 3.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.748046875, -0.7260818481445312, -0.7041168212890625, -0.6821517944335938, -0.660186767578125, -0.6382217407226562, -0.6162567138671875, -0.5942916870117188, -0.57232666015625, -0.5503616333007812, -0.5283966064453125, -0.5064315795898438, -0.484466552734375, -0.46250152587890625, -0.4405364990234375, -0.41857147216796875, -0.3966064453125, -0.37464141845703125, -0.3526763916015625, -0.33071136474609375, -0.308746337890625, -0.28678131103515625, -0.2648162841796875, -0.24285125732421875, -0.22088623046875, -0.19892120361328125, -0.1769561767578125, -0.15499114990234375, -0.133026123046875, -0.11106109619140625, -0.0890960693359375, -0.06713104248046875, -0.045166015625, -0.02320098876953125, -0.0012359619140625, 0.02072906494140625, 0.042694091796875, 0.06465911865234375, 0.0866241455078125, 0.10858917236328125, 0.13055419921875, 0.15251922607421875, 0.1744842529296875, 0.19644927978515625, 0.218414306640625, 0.24037933349609375, 0.2623443603515625, 0.28430938720703125, 0.3062744140625, 0.32823944091796875, 0.3502044677734375, 0.37216949462890625, 0.394134521484375, 0.41609954833984375, 0.4380645751953125, 0.46002960205078125, 0.48199462890625, 0.5039596557617188, 0.5259246826171875, 0.5478897094726562, 0.569854736328125, 0.5918197631835938, 0.6137847900390625, 0.6357498168945312, 0.65771484375]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 6.0, 11.0, 16.0, 32.0, 53.0, 97.0, 137.0, 150.0, 149.0, 129.0, 80.0, 62.0, 36.0, 19.0, 14.0, 8.0, 2.0, 7.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.51634407043457, -13.23917007446289, -12.961997032165527, -12.684823036193848, -12.407649040222168, -12.130475997924805, -11.853302001953125, -11.576128005981445, -11.298954963684082, -11.021780967712402, -10.744607925415039, -10.46743392944336, -10.19025993347168, -9.913086891174316, -9.635912895202637, -9.358738899230957, -9.081565856933594, -8.804391860961914, -8.52721881866455, -8.250044822692871, -7.97287130355835, -7.695697784423828, -7.418523788452148, -7.141350269317627, -6.864175796508789, -6.587002277374268, -6.309828281402588, -6.032654762268066, -5.755481243133545, -5.478307723999023, -5.201133728027344, -4.923960208892822, -4.646786689758301, -4.369613170623779, -4.0924391746521, -3.815265655517578, -3.5380921363830566, -3.260918378829956, -2.9837446212768555, -2.706571102142334, -2.4293973445892334, -2.152223587036133, -1.8750500679016113, -1.5978763103485107, -1.3207026720046997, -1.0435290336608887, -0.7663552761077881, -0.48918163776397705, -0.21200799942016602, 0.06516566872596741, 0.34233933687210083, 0.6195130348205566, 0.8966866731643677, 1.1738603115081787, 1.4510340690612793, 1.7282077074050903, 2.0053813457489014, 2.282555103302002, 2.5597286224365234, 2.836902379989624, 3.1140761375427246, 3.391249656677246, 3.6684234142303467, 3.9455971717834473, 4.222770690917969]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 6.0, 5.0, 10.0, 9.0, 20.0, 14.0, 11.0, 22.0, 27.0, 14.0, 21.0, 29.0, 26.0, 35.0, 34.0, 41.0, 47.0, 41.0, 51.0, 42.0, 49.0, 58.0, 52.0, 34.0, 26.0, 31.0, 34.0, 25.0, 27.0, 21.0, 16.0, 17.0, 14.0, 9.0, 17.0, 14.0, 15.0, 8.0, 5.0, 8.0, 5.0, 3.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-6.450253486633301, -6.266421794891357, -6.082590103149414, -5.898758888244629, -5.7149271965026855, -5.531095504760742, -5.347263813018799, -5.1634321212768555, -4.97960090637207, -4.795769214630127, -4.611937522888184, -4.428106307983398, -4.244274616241455, -4.060442924499512, -3.8766112327575684, -3.692779541015625, -3.5089478492736816, -3.3251161575317383, -3.141284704208374, -2.9574530124664307, -2.7736215591430664, -2.589789867401123, -2.4059581756591797, -2.2221264839172363, -2.038295030593872, -1.8544634580612183, -1.6706318855285645, -1.486800193786621, -1.3029686212539673, -1.1191370487213135, -0.9353053569793701, -0.7514737844467163, -0.5676422119140625, -0.3838106095790863, -0.1999790072441101, -0.016147375106811523, 0.16768419742584229, 0.3515157699584961, 0.5353474617004395, 0.7191790342330933, 0.9030106067657471, 1.0868421792984009, 1.2706737518310547, 1.454505443572998, 1.6383370161056519, 1.8221685886383057, 2.006000280380249, 2.1898317337036133, 2.3736634254455566, 2.5574951171875, 2.7413265705108643, 2.9251582622528076, 3.108989715576172, 3.2928214073181152, 3.4766530990600586, 3.660484790802002, 3.844316244125366, 4.0281476974487305, 4.211979389190674, 4.395811080932617, 4.5796427726745605, 4.763474464416504, 4.947305679321289, 5.131137371063232, 5.314969062805176]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 7.0, 3.0, 7.0, 13.0, 18.0, 29.0, 38.0, 58.0, 117.0, 169.0, 351.0, 825.0, 3324.0, 32504.0, 4142067.0, 11544.0, 1880.0, 604.0, 289.0, 182.0, 83.0, 62.0, 38.0, 22.0, 14.0, 17.0, 7.0, 6.0, 8.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.44921875, -5.323455810546875, -5.19769287109375, -5.071929931640625, -4.9461669921875, -4.820404052734375, -4.69464111328125, -4.568878173828125, -4.443115234375, -4.317352294921875, -4.19158935546875, -4.065826416015625, -3.9400634765625, -3.814300537109375, -3.68853759765625, -3.562774658203125, -3.43701171875, -3.311248779296875, -3.18548583984375, -3.059722900390625, -2.9339599609375, -2.808197021484375, -2.68243408203125, -2.556671142578125, -2.430908203125, -2.305145263671875, -2.17938232421875, -2.053619384765625, -1.9278564453125, -1.802093505859375, -1.67633056640625, -1.550567626953125, -1.4248046875, -1.299041748046875, -1.17327880859375, -1.047515869140625, -0.9217529296875, -0.795989990234375, -0.67022705078125, -0.544464111328125, -0.418701171875, -0.292938232421875, -0.16717529296875, -0.041412353515625, 0.0843505859375, 0.210113525390625, 0.33587646484375, 0.461639404296875, 0.58740234375, 0.713165283203125, 0.83892822265625, 0.964691162109375, 1.0904541015625, 1.216217041015625, 1.34197998046875, 1.467742919921875, 1.593505859375, 1.719268798828125, 1.84503173828125, 1.970794677734375, 2.0965576171875, 2.222320556640625, 2.34808349609375, 2.473846435546875, 2.599609375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 11.0, 8.0, 22.0, 36.0, 55.0, 67.0, 102.0, 106.0, 107.0, 113.0, 104.0, 94.0, 67.0, 42.0, 22.0, 15.0, 13.0, 11.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8203125, -0.7968292236328125, -0.773345947265625, -0.7498626708984375, -0.72637939453125, -0.7028961181640625, -0.679412841796875, -0.6559295654296875, -0.6324462890625, -0.6089630126953125, -0.585479736328125, -0.5619964599609375, -0.53851318359375, -0.5150299072265625, -0.491546630859375, -0.4680633544921875, -0.444580078125, -0.4210968017578125, -0.397613525390625, -0.3741302490234375, -0.35064697265625, -0.3271636962890625, -0.303680419921875, -0.2801971435546875, -0.2567138671875, -0.2332305908203125, -0.209747314453125, -0.1862640380859375, -0.16278076171875, -0.1392974853515625, -0.115814208984375, -0.0923309326171875, -0.06884765625, -0.0453643798828125, -0.021881103515625, 0.0016021728515625, 0.02508544921875, 0.0485687255859375, 0.072052001953125, 0.0955352783203125, 0.1190185546875, 0.1425018310546875, 0.165985107421875, 0.1894683837890625, 0.21295166015625, 0.2364349365234375, 0.259918212890625, 0.2834014892578125, 0.306884765625, 0.3303680419921875, 0.353851318359375, 0.3773345947265625, 0.40081787109375, 0.4243011474609375, 0.447784423828125, 0.4712677001953125, 0.4947509765625, 0.5182342529296875, 0.541717529296875, 0.5652008056640625, 0.58868408203125, 0.6121673583984375, 0.635650634765625, 0.6591339111328125, 0.6826171875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 8.0, 5.0, 6.0, 9.0, 11.0, 16.0, 23.0, 37.0, 46.0, 61.0, 74.0, 74.0, 101.0, 172.0, 246.0, 457.0, 1010.0, 3111.0, 14192.0, 3940284.0, 218498.0, 10944.0, 2557.0, 970.0, 436.0, 252.0, 171.0, 94.0, 83.0, 92.0, 54.0, 40.0, 37.0, 31.0, 20.0, 14.0, 9.0, 6.0, 10.0, 8.0, 4.0, 3.0, 2.0, 3.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0, -1.92572021484375, -1.8514404296875, -1.77716064453125, -1.702880859375, -1.62860107421875, -1.5543212890625, -1.48004150390625, -1.40576171875, -1.33148193359375, -1.2572021484375, -1.18292236328125, -1.108642578125, -1.03436279296875, -0.9600830078125, -0.88580322265625, -0.8115234375, -0.73724365234375, -0.6629638671875, -0.58868408203125, -0.514404296875, -0.44012451171875, -0.3658447265625, -0.29156494140625, -0.21728515625, -0.14300537109375, -0.0687255859375, 0.00555419921875, 0.079833984375, 0.15411376953125, 0.2283935546875, 0.30267333984375, 0.376953125, 0.45123291015625, 0.5255126953125, 0.59979248046875, 0.674072265625, 0.74835205078125, 0.8226318359375, 0.89691162109375, 0.97119140625, 1.04547119140625, 1.1197509765625, 1.19403076171875, 1.268310546875, 1.34259033203125, 1.4168701171875, 1.49114990234375, 1.5654296875, 1.63970947265625, 1.7139892578125, 1.78826904296875, 1.862548828125, 1.93682861328125, 2.0111083984375, 2.08538818359375, 2.15966796875, 2.23394775390625, 2.3082275390625, 2.38250732421875, 2.456787109375, 2.53106689453125, 2.6053466796875, 2.67962646484375, 2.75390625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 9.0, 32.0, 65.0, 3523.0, 353.0, 55.0, 18.0, 8.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1925048828125, -0.1731243133544922, -0.15374374389648438, -0.13436317443847656, -0.11498260498046875, -0.09560203552246094, -0.07622146606445312, -0.05684089660644531, -0.0374603271484375, -0.018079757690429688, 0.001300811767578125, 0.020681381225585938, 0.04006195068359375, 0.05944252014160156, 0.07882308959960938, 0.09820365905761719, 0.117584228515625, 0.1369647979736328, 0.15634536743164062, 0.17572593688964844, 0.19510650634765625, 0.21448707580566406, 0.23386764526367188, 0.2532482147216797, 0.2726287841796875, 0.2920093536376953, 0.3113899230957031, 0.33077049255371094, 0.35015106201171875, 0.36953163146972656, 0.3889122009277344, 0.4082927703857422, 0.42767333984375, 0.4470539093017578, 0.4664344787597656, 0.48581504821777344, 0.5051956176757812, 0.5245761871337891, 0.5439567565917969, 0.5633373260498047, 0.5827178955078125, 0.6020984649658203, 0.6214790344238281, 0.6408596038818359, 0.6602401733398438, 0.6796207427978516, 0.6990013122558594, 0.7183818817138672, 0.737762451171875, 0.7571430206298828, 0.7765235900878906, 0.7959041595458984, 0.8152847290039062, 0.8346652984619141, 0.8540458679199219, 0.8734264373779297, 0.8928070068359375, 0.9121875762939453, 0.9315681457519531, 0.9509487152099609, 0.9703292846679688, 0.9897098541259766, 1.0090904235839844, 1.0284709930419922, 1.0478515625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 4.0, 7.0, 28.0, 38.0, 94.0, 142.0, 173.0, 193.0, 127.0, 87.0, 48.0, 27.0, 15.0, 6.0, 12.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6181740760803223, -1.5613782405853271, -1.5045825242996216, -1.4477866888046265, -1.390990972518921, -1.3341951370239258, -1.2773993015289307, -1.2206034660339355, -1.16380774974823, -1.1070119142532349, -1.0502161979675293, -0.9934203624725342, -0.9366245865821838, -0.8798288106918335, -0.8230329751968384, -0.766237199306488, -0.7094414234161377, -0.6526456475257874, -0.595849871635437, -0.5390540361404419, -0.48225826025009155, -0.4254624843597412, -0.3686666786670685, -0.31187087297439575, -0.2550750970840454, -0.19827930629253387, -0.14148351550102234, -0.0846877247095108, -0.027891933917999268, 0.028903841972351074, 0.0856996476650238, 0.14249545335769653, 0.19929122924804688, 0.2560870051383972, 0.31288281083106995, 0.3696786165237427, 0.426474392414093, 0.48327016830444336, 0.5400660037994385, 0.5968617796897888, 0.6536575555801392, 0.7104533314704895, 0.7672491073608398, 0.824044942855835, 0.8808407187461853, 0.9376364946365356, 0.9944323301315308, 1.0512280464172363, 1.1080238819122314, 1.1648197174072266, 1.2216154336929321, 1.2784112691879272, 1.3352069854736328, 1.392002820968628, 1.448798656463623, 1.5055944919586182, 1.5623902082443237, 1.6191860437393188, 1.6759817600250244, 1.7327775955200195, 1.7895734310150146, 1.8463691473007202, 1.9031649827957153, 1.959960699081421, 2.016756534576416]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 9.0, 9.0, 9.0, 15.0, 16.0, 14.0, 25.0, 30.0, 28.0, 42.0, 27.0, 36.0, 37.0, 35.0, 39.0, 41.0, 51.0, 45.0, 51.0, 51.0, 37.0, 45.0, 40.0, 39.0, 35.0, 29.0, 26.0, 18.0, 26.0, 20.0, 17.0, 15.0, 12.0, 7.0, 6.0, 6.0, 2.0, 3.0, 5.0, 1.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.782922625541687, -0.7577028870582581, -0.7324832081794739, -0.7072634696960449, -0.682043731212616, -0.656823992729187, -0.6316043138504028, -0.6063845753669739, -0.5811648368835449, -0.555945098400116, -0.5307254195213318, -0.5055056810379028, -0.4802859425544739, -0.4550662338733673, -0.42984652519226074, -0.4046267867088318, -0.3794070780277252, -0.35418736934661865, -0.3289676308631897, -0.30374792218208313, -0.2785281836986542, -0.2533084750175476, -0.22808875143527985, -0.20286902785301208, -0.17764930427074432, -0.15242958068847656, -0.1272098571062088, -0.10199014097452164, -0.07677041739225388, -0.05155070126056671, -0.02633097767829895, -0.001111254096031189, 0.024108469486236572, 0.049328193068504333, 0.0745479166507721, 0.09976763278245926, 0.12498735636472702, 0.15020707249641418, 0.17542679607868195, 0.2006465196609497, 0.22586624324321747, 0.25108596682548523, 0.2763056755065918, 0.30152541399002075, 0.3267451226711273, 0.3519648313522339, 0.37718456983566284, 0.4024043083190918, 0.42762401700019836, 0.45284372568130493, 0.4780634641647339, 0.5032832026481628, 0.528502881526947, 0.553722620010376, 0.5789423584938049, 0.6041620969772339, 0.6293817758560181, 0.654601514339447, 0.6798211932182312, 0.7050409317016602, 0.7302606701850891, 0.7554804086685181, 0.7807000875473022, 0.8059198260307312, 0.8311395645141602]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 8.0, 10.0, 12.0, 25.0, 48.0, 81.0, 128.0, 223.0, 456.0, 881.0, 2001.0, 6031.0, 32415.0, 244881.0, 587826.0, 146298.0, 19596.0, 4355.0, 1599.0, 754.0, 412.0, 207.0, 122.0, 83.0, 41.0, 23.0, 12.0, 12.0, 6.0, 4.0, 1.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.08984375, -2.0290374755859375, -1.968231201171875, -1.9074249267578125, -1.84661865234375, -1.7858123779296875, -1.725006103515625, -1.6641998291015625, -1.6033935546875, -1.5425872802734375, -1.481781005859375, -1.4209747314453125, -1.36016845703125, -1.2993621826171875, -1.238555908203125, -1.1777496337890625, -1.116943359375, -1.0561370849609375, -0.995330810546875, -0.9345245361328125, -0.87371826171875, -0.8129119873046875, -0.752105712890625, -0.6912994384765625, -0.6304931640625, -0.5696868896484375, -0.508880615234375, -0.4480743408203125, -0.38726806640625, -0.3264617919921875, -0.265655517578125, -0.2048492431640625, -0.14404296875, -0.0832366943359375, -0.022430419921875, 0.0383758544921875, 0.09918212890625, 0.1599884033203125, 0.220794677734375, 0.2816009521484375, 0.3424072265625, 0.4032135009765625, 0.464019775390625, 0.5248260498046875, 0.58563232421875, 0.6464385986328125, 0.707244873046875, 0.7680511474609375, 0.828857421875, 0.8896636962890625, 0.950469970703125, 1.0112762451171875, 1.07208251953125, 1.1328887939453125, 1.193695068359375, 1.2545013427734375, 1.3153076171875, 1.3761138916015625, 1.436920166015625, 1.4977264404296875, 1.55853271484375, 1.6193389892578125, 1.680145263671875, 1.7409515380859375, 1.8017578125]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 16.0, 18.0, 24.0, 35.0, 56.0, 72.0, 86.0, 99.0, 110.0, 86.0, 91.0, 79.0, 67.0, 52.0, 39.0, 28.0, 13.0, 15.0, 2.0, 5.0, 6.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.822265625, -0.7988052368164062, -0.7753448486328125, -0.7518844604492188, -0.728424072265625, -0.7049636840820312, -0.6815032958984375, -0.6580429077148438, -0.63458251953125, -0.6111221313476562, -0.5876617431640625, -0.5642013549804688, -0.540740966796875, -0.5172805786132812, -0.4938201904296875, -0.47035980224609375, -0.4468994140625, -0.42343902587890625, -0.3999786376953125, -0.37651824951171875, -0.353057861328125, -0.32959747314453125, -0.3061370849609375, -0.28267669677734375, -0.25921630859375, -0.23575592041015625, -0.2122955322265625, -0.18883514404296875, -0.165374755859375, -0.14191436767578125, -0.1184539794921875, -0.09499359130859375, -0.071533203125, -0.04807281494140625, -0.0246124267578125, -0.00115203857421875, 0.022308349609375, 0.04576873779296875, 0.0692291259765625, 0.09268951416015625, 0.11614990234375, 0.13961029052734375, 0.1630706787109375, 0.18653106689453125, 0.209991455078125, 0.23345184326171875, 0.2569122314453125, 0.28037261962890625, 0.3038330078125, 0.32729339599609375, 0.3507537841796875, 0.37421417236328125, 0.397674560546875, 0.42113494873046875, 0.4445953369140625, 0.46805572509765625, 0.49151611328125, 0.5149765014648438, 0.5384368896484375, 0.5618972778320312, 0.585357666015625, 0.6088180541992188, 0.6322784423828125, 0.6557388305664062, 0.67919921875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 7.0, 4.0, 10.0, 15.0, 15.0, 21.0, 21.0, 29.0, 39.0, 43.0, 83.0, 91.0, 130.0, 212.0, 305.0, 492.0, 983.0, 1893.0, 4123.0, 10051.0, 26722.0, 76251.0, 218860.0, 392576.0, 202971.0, 70345.0, 24795.0, 9361.0, 3849.0, 1796.0, 977.0, 543.0, 307.0, 184.0, 127.0, 77.0, 52.0, 51.0, 44.0, 34.0, 19.0, 12.0, 10.0, 11.0, 6.0, 6.0, 3.0, 1.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.76416015625, -0.73907470703125, -0.7139892578125, -0.68890380859375, -0.663818359375, -0.63873291015625, -0.6136474609375, -0.58856201171875, -0.5634765625, -0.53839111328125, -0.5133056640625, -0.48822021484375, -0.463134765625, -0.43804931640625, -0.4129638671875, -0.38787841796875, -0.36279296875, -0.33770751953125, -0.3126220703125, -0.28753662109375, -0.262451171875, -0.23736572265625, -0.2122802734375, -0.18719482421875, -0.162109375, -0.13702392578125, -0.1119384765625, -0.08685302734375, -0.061767578125, -0.03668212890625, -0.0115966796875, 0.01348876953125, 0.03857421875, 0.06365966796875, 0.0887451171875, 0.11383056640625, 0.138916015625, 0.16400146484375, 0.1890869140625, 0.21417236328125, 0.2392578125, 0.26434326171875, 0.2894287109375, 0.31451416015625, 0.339599609375, 0.36468505859375, 0.3897705078125, 0.41485595703125, 0.43994140625, 0.46502685546875, 0.4901123046875, 0.51519775390625, 0.540283203125, 0.56536865234375, 0.5904541015625, 0.61553955078125, 0.640625, 0.66571044921875, 0.6907958984375, 0.71588134765625, 0.740966796875, 0.76605224609375, 0.7911376953125, 0.81622314453125, 0.84130859375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 5.0, 1.0, 5.0, 2.0, 3.0, 7.0, 9.0, 10.0, 11.0, 14.0, 24.0, 19.0, 26.0, 28.0, 38.0, 34.0, 44.0, 34.0, 53.0, 39.0, 59.0, 41.0, 39.0, 57.0, 51.0, 51.0, 43.0, 38.0, 35.0, 25.0, 26.0, 23.0, 14.0, 23.0, 17.0, 13.0, 12.0, 6.0, 7.0, 6.0, 6.0, 5.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.505859375, -1.453125, -1.400390625, -1.34765625, -1.294921875, -1.2421875, -1.189453125, -1.13671875, -1.083984375, -1.03125, -0.978515625, -0.92578125, -0.873046875, -0.8203125, -0.767578125, -0.71484375, -0.662109375, -0.609375, -0.556640625, -0.50390625, -0.451171875, -0.3984375, -0.345703125, -0.29296875, -0.240234375, -0.1875, -0.134765625, -0.08203125, -0.029296875, 0.0234375, 0.076171875, 0.12890625, 0.181640625, 0.234375, 0.287109375, 0.33984375, 0.392578125, 0.4453125, 0.498046875, 0.55078125, 0.603515625, 0.65625, 0.708984375, 0.76171875, 0.814453125, 0.8671875, 0.919921875, 0.97265625, 1.025390625, 1.078125, 1.130859375, 1.18359375, 1.236328125, 1.2890625, 1.341796875, 1.39453125, 1.447265625, 1.5, 1.552734375, 1.60546875, 1.658203125, 1.7109375, 1.763671875, 1.81640625, 1.869140625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 7.0, 16.0, 30.0, 50.0, 77.0, 192.0, 545.0, 3599.0, 164118.0, 868558.0, 9865.0, 965.0, 284.0, 120.0, 53.0, 36.0, 12.0, 9.0, 6.0, 8.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.59375, -1.52191162109375, -1.4500732421875, -1.37823486328125, -1.306396484375, -1.23455810546875, -1.1627197265625, -1.09088134765625, -1.01904296875, -0.94720458984375, -0.8753662109375, -0.80352783203125, -0.731689453125, -0.65985107421875, -0.5880126953125, -0.51617431640625, -0.4443359375, -0.37249755859375, -0.3006591796875, -0.22882080078125, -0.156982421875, -0.08514404296875, -0.0133056640625, 0.05853271484375, 0.13037109375, 0.20220947265625, 0.2740478515625, 0.34588623046875, 0.417724609375, 0.48956298828125, 0.5614013671875, 0.63323974609375, 0.705078125, 0.77691650390625, 0.8487548828125, 0.92059326171875, 0.992431640625, 1.06427001953125, 1.1361083984375, 1.20794677734375, 1.27978515625, 1.35162353515625, 1.4234619140625, 1.49530029296875, 1.567138671875, 1.63897705078125, 1.7108154296875, 1.78265380859375, 1.8544921875, 1.92633056640625, 1.9981689453125, 2.07000732421875, 2.141845703125, 2.21368408203125, 2.2855224609375, 2.35736083984375, 2.42919921875, 2.50103759765625, 2.5728759765625, 2.64471435546875, 2.716552734375, 2.78839111328125, 2.8602294921875, 2.93206787109375, 3.00390625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 6.0, 2.0, 4.0, 2.0, 2.0, 7.0, 9.0, 7.0, 16.0, 11.0, 19.0, 19.0, 29.0, 35.0, 50.0, 61.0, 53.0, 66.0, 89.0, 78.0, 78.0, 69.0, 48.0, 63.0, 43.0, 26.0, 25.0, 21.0, 14.0, 11.0, 13.0, 3.0, 5.0, 2.0, 8.0, 5.0, 2.0, 2.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.666515350341797e-05, -8.389260619878769e-05, -8.112005889415741e-05, -7.834751158952713e-05, -7.557496428489685e-05, -7.280241698026657e-05, -7.002986967563629e-05, -6.725732237100601e-05, -6.448477506637573e-05, -6.171222776174545e-05, -5.893968045711517e-05, -5.6167133152484894e-05, -5.3394585847854614e-05, -5.0622038543224335e-05, -4.7849491238594055e-05, -4.5076943933963776e-05, -4.2304396629333496e-05, -3.9531849324703217e-05, -3.675930202007294e-05, -3.398675471544266e-05, -3.121420741081238e-05, -2.84416601061821e-05, -2.566911280155182e-05, -2.289656549692154e-05, -2.012401819229126e-05, -1.735147088766098e-05, -1.45789235830307e-05, -1.1806376278400421e-05, -9.033828973770142e-06, -6.261281669139862e-06, -3.4887343645095825e-06, -7.16187059879303e-07, 2.0563602447509766e-06, 4.828907549381256e-06, 7.601454854011536e-06, 1.0374002158641815e-05, 1.3146549463272095e-05, 1.5919096767902374e-05, 1.8691644072532654e-05, 2.1464191377162933e-05, 2.4236738681793213e-05, 2.7009285986423492e-05, 2.9781833291053772e-05, 3.255438059568405e-05, 3.532692790031433e-05, 3.809947520494461e-05, 4.087202250957489e-05, 4.364456981420517e-05, 4.641711711883545e-05, 4.918966442346573e-05, 5.196221172809601e-05, 5.473475903272629e-05, 5.750730633735657e-05, 6.027985364198685e-05, 6.305240094661713e-05, 6.58249482512474e-05, 6.859749555587769e-05, 7.137004286050797e-05, 7.414259016513824e-05, 7.691513746976852e-05, 7.96876847743988e-05, 8.246023207902908e-05, 8.523277938365936e-05, 8.800532668828964e-05, 9.077787399291992e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 6.0, 3.0, 16.0, 14.0, 28.0, 38.0, 84.0, 173.0, 348.0, 800.0, 2114.0, 7382.0, 37640.0, 349258.0, 570353.0, 64709.0, 10756.0, 2882.0, 1039.0, 420.0, 218.0, 116.0, 60.0, 26.0, 20.0, 14.0, 8.0, 12.0, 4.0, 2.0, 3.0, 3.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.947265625, -0.9203033447265625, -0.893341064453125, -0.8663787841796875, -0.83941650390625, -0.8124542236328125, -0.785491943359375, -0.7585296630859375, -0.7315673828125, -0.7046051025390625, -0.677642822265625, -0.6506805419921875, -0.62371826171875, -0.5967559814453125, -0.569793701171875, -0.5428314208984375, -0.515869140625, -0.4889068603515625, -0.461944580078125, -0.4349822998046875, -0.40802001953125, -0.3810577392578125, -0.354095458984375, -0.3271331787109375, -0.3001708984375, -0.2732086181640625, -0.246246337890625, -0.2192840576171875, -0.19232177734375, -0.1653594970703125, -0.138397216796875, -0.1114349365234375, -0.08447265625, -0.0575103759765625, -0.030548095703125, -0.0035858154296875, 0.02337646484375, 0.0503387451171875, 0.077301025390625, 0.1042633056640625, 0.1312255859375, 0.1581878662109375, 0.185150146484375, 0.2121124267578125, 0.23907470703125, 0.2660369873046875, 0.292999267578125, 0.3199615478515625, 0.346923828125, 0.3738861083984375, 0.400848388671875, 0.4278106689453125, 0.45477294921875, 0.4817352294921875, 0.508697509765625, 0.5356597900390625, 0.5626220703125, 0.5895843505859375, 0.616546630859375, 0.6435089111328125, 0.67047119140625, 0.6974334716796875, 0.724395751953125, 0.7513580322265625, 0.7783203125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 3.0, 3.0, 0.0, 2.0, 4.0, 8.0, 7.0, 20.0, 17.0, 25.0, 43.0, 74.0, 114.0, 125.0, 144.0, 116.0, 103.0, 72.0, 42.0, 32.0, 21.0, 10.0, 4.0, 2.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2060546875, -1.166412353515625, -1.12677001953125, -1.087127685546875, -1.0474853515625, -1.007843017578125, -0.96820068359375, -0.928558349609375, -0.888916015625, -0.849273681640625, -0.80963134765625, -0.769989013671875, -0.7303466796875, -0.690704345703125, -0.65106201171875, -0.611419677734375, -0.57177734375, -0.532135009765625, -0.49249267578125, -0.452850341796875, -0.4132080078125, -0.373565673828125, -0.33392333984375, -0.294281005859375, -0.254638671875, -0.214996337890625, -0.17535400390625, -0.135711669921875, -0.0960693359375, -0.056427001953125, -0.01678466796875, 0.022857666015625, 0.0625, 0.102142333984375, 0.14178466796875, 0.181427001953125, 0.2210693359375, 0.260711669921875, 0.30035400390625, 0.339996337890625, 0.379638671875, 0.419281005859375, 0.45892333984375, 0.498565673828125, 0.5382080078125, 0.577850341796875, 0.61749267578125, 0.657135009765625, 0.69677734375, 0.736419677734375, 0.77606201171875, 0.815704345703125, 0.8553466796875, 0.894989013671875, 0.93463134765625, 0.974273681640625, 1.013916015625, 1.053558349609375, 1.09320068359375, 1.132843017578125, 1.1724853515625, 1.212127685546875, 1.25177001953125, 1.291412353515625, 1.3310546875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 6.0, 9.0, 8.0, 27.0, 36.0, 63.0, 112.0, 140.0, 155.0, 146.0, 110.0, 78.0, 47.0, 33.0, 24.0, 11.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.92661190032959, -4.4984130859375, -4.07021427154541, -3.6420156955718994, -3.2138168811798096, -2.7856180667877197, -2.357419490814209, -1.9292206764221191, -1.5010218620300293, -1.0728230476379395, -0.6446243524551392, -0.21642565727233887, 0.21177315711975098, 0.6399719715118408, 1.0681705474853516, 1.4963693618774414, 1.9245681762695312, 2.352766990661621, 2.780965805053711, 3.2091643810272217, 3.6373631954193115, 4.0655622482299805, 4.493760585784912, 4.921959400177002, 5.350158214569092, 5.778357028961182, 6.2065558433532715, 6.634754180908203, 7.062952995300293, 7.491151809692383, 7.919350624084473, 8.347549438476562, 8.775747299194336, 9.203946113586426, 9.632144927978516, 10.060343742370605, 10.488542556762695, 10.916741371154785, 11.344940185546875, 11.773138046264648, 12.201337814331055, 12.629536628723145, 13.057735443115234, 13.485934257507324, 13.914133071899414, 14.342331886291504, 14.770530700683594, 15.198728561401367, 15.626927375793457, 16.055126190185547, 16.48332405090332, 16.911523818969727, 17.3397216796875, 17.767921447753906, 18.19611930847168, 18.624319076538086, 19.05251693725586, 19.480714797973633, 19.90891456604004, 20.337112426757812, 20.76531219482422, 21.193510055541992, 21.6217098236084, 22.049907684326172, 22.478107452392578]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 6.0, 5.0, 5.0, 7.0, 4.0, 4.0, 4.0, 13.0, 18.0, 16.0, 17.0, 22.0, 28.0, 28.0, 28.0, 26.0, 42.0, 39.0, 39.0, 41.0, 40.0, 48.0, 56.0, 41.0, 51.0, 39.0, 40.0, 51.0, 36.0, 32.0, 27.0, 25.0, 26.0, 19.0, 19.0, 9.0, 6.0, 10.0, 9.0, 6.0, 4.0, 5.0, 9.0, 6.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.880712509155273, -8.599197387695312, -8.317683219909668, -8.036168098449707, -7.754653453826904, -7.473138809204102, -7.191623687744141, -6.910109043121338, -6.628594398498535, -6.347079753875732, -6.06556510925293, -5.784049987792969, -5.502535343170166, -5.221020698547363, -4.939505577087402, -4.6579909324646, -4.376476287841797, -4.094961643218994, -3.8134467601776123, -3.5319318771362305, -3.2504172325134277, -2.968902587890625, -2.687387704849243, -2.4058728218078613, -2.1243581771850586, -1.8428434133529663, -1.561328649520874, -1.2798138856887817, -0.9982991218566895, -0.7167843580245972, -0.4352695941925049, -0.1537548303604126, 0.1277608871459961, 0.4092756509780884, 0.6907904148101807, 0.972305178642273, 1.2538199424743652, 1.5353347063064575, 1.8168494701385498, 2.0983643531799316, 2.3798789978027344, 2.661393642425537, 2.942908525466919, 3.224423408508301, 3.5059380531311035, 3.7874526977539062, 4.068967819213867, 4.35048246383667, 4.631997108459473, 4.913511753082275, 5.195026397705078, 5.476541519165039, 5.758056163787842, 6.0395708084106445, 6.3210859298706055, 6.602600574493408, 6.884115219116211, 7.165629863739014, 7.447144508361816, 7.728659629821777, 8.010173797607422, 8.291688919067383, 8.573204040527344, 8.854718208312988, 9.13623332977295]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 8.0, 9.0, 9.0, 20.0, 38.0, 59.0, 90.0, 172.0, 309.0, 572.0, 1179.0, 3188.0, 10581.0, 58461.0, 4036051.0, 66516.0, 11208.0, 3254.0, 1253.0, 566.0, 295.0, 182.0, 81.0, 70.0, 34.0, 29.0, 16.0, 8.0, 8.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.515625, -2.4519805908203125, -2.388336181640625, -2.3246917724609375, -2.26104736328125, -2.1974029541015625, -2.133758544921875, -2.0701141357421875, -2.0064697265625, -1.9428253173828125, -1.879180908203125, -1.8155364990234375, -1.75189208984375, -1.6882476806640625, -1.624603271484375, -1.5609588623046875, -1.497314453125, -1.4336700439453125, -1.370025634765625, -1.3063812255859375, -1.24273681640625, -1.1790924072265625, -1.115447998046875, -1.0518035888671875, -0.9881591796875, -0.9245147705078125, -0.860870361328125, -0.7972259521484375, -0.73358154296875, -0.6699371337890625, -0.606292724609375, -0.5426483154296875, -0.47900390625, -0.4153594970703125, -0.351715087890625, -0.2880706787109375, -0.22442626953125, -0.1607818603515625, -0.097137451171875, -0.0334930419921875, 0.0301513671875, 0.0937957763671875, 0.157440185546875, 0.2210845947265625, 0.28472900390625, 0.3483734130859375, 0.412017822265625, 0.4756622314453125, 0.539306640625, 0.6029510498046875, 0.666595458984375, 0.7302398681640625, 0.79388427734375, 0.8575286865234375, 0.921173095703125, 0.9848175048828125, 1.0484619140625, 1.1121063232421875, 1.175750732421875, 1.2393951416015625, 1.30303955078125, 1.3666839599609375, 1.430328369140625, 1.4939727783203125, 1.5576171875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 6.0, 5.0, 13.0, 16.0, 24.0, 33.0, 41.0, 47.0, 56.0, 93.0, 75.0, 93.0, 96.0, 66.0, 85.0, 74.0, 54.0, 39.0, 27.0, 15.0, 16.0, 14.0, 6.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.82177734375, -0.7982406616210938, -0.7747039794921875, -0.7511672973632812, -0.727630615234375, -0.7040939331054688, -0.6805572509765625, -0.6570205688476562, -0.63348388671875, -0.6099472045898438, -0.5864105224609375, -0.5628738403320312, -0.539337158203125, -0.5158004760742188, -0.4922637939453125, -0.46872711181640625, -0.4451904296875, -0.42165374755859375, -0.3981170654296875, -0.37458038330078125, -0.351043701171875, -0.32750701904296875, -0.3039703369140625, -0.28043365478515625, -0.25689697265625, -0.23336029052734375, -0.2098236083984375, -0.18628692626953125, -0.162750244140625, -0.13921356201171875, -0.1156768798828125, -0.09214019775390625, -0.068603515625, -0.04506683349609375, -0.0215301513671875, 0.00200653076171875, 0.025543212890625, 0.04907989501953125, 0.0726165771484375, 0.09615325927734375, 0.11968994140625, 0.14322662353515625, 0.1667633056640625, 0.19029998779296875, 0.213836669921875, 0.23737335205078125, 0.2609100341796875, 0.28444671630859375, 0.3079833984375, 0.33152008056640625, 0.3550567626953125, 0.37859344482421875, 0.402130126953125, 0.42566680908203125, 0.4492034912109375, 0.47274017333984375, 0.49627685546875, 0.5198135375976562, 0.5433502197265625, 0.5668869018554688, 0.590423583984375, 0.6139602661132812, 0.6374969482421875, 0.6610336303710938, 0.6845703125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 0.0, 1.0, 3.0, 7.0, 7.0, 7.0, 14.0, 21.0, 12.0, 27.0, 25.0, 32.0, 47.0, 68.0, 78.0, 134.0, 165.0, 196.0, 289.0, 407.0, 560.0, 922.0, 1607.0, 2966.0, 5980.0, 14054.0, 45808.0, 389918.0, 3640810.0, 58188.0, 16915.0, 6775.0, 3324.0, 1687.0, 1042.0, 608.0, 435.0, 284.0, 192.0, 164.0, 123.0, 68.0, 71.0, 56.0, 48.0, 36.0, 37.0, 14.0, 18.0, 8.0, 11.0, 9.0, 0.0, 2.0, 6.0, 0.0, 4.0, 4.0, 0.0, 0.0, 3.0], "bins": [-1.306640625, -1.2646026611328125, -1.222564697265625, -1.1805267333984375, -1.13848876953125, -1.0964508056640625, -1.054412841796875, -1.0123748779296875, -0.9703369140625, -0.9282989501953125, -0.886260986328125, -0.8442230224609375, -0.80218505859375, -0.7601470947265625, -0.718109130859375, -0.6760711669921875, -0.634033203125, -0.5919952392578125, -0.549957275390625, -0.5079193115234375, -0.46588134765625, -0.4238433837890625, -0.381805419921875, -0.3397674560546875, -0.2977294921875, -0.2556915283203125, -0.213653564453125, -0.1716156005859375, -0.12957763671875, -0.0875396728515625, -0.045501708984375, -0.0034637451171875, 0.03857421875, 0.0806121826171875, 0.122650146484375, 0.1646881103515625, 0.20672607421875, 0.2487640380859375, 0.290802001953125, 0.3328399658203125, 0.3748779296875, 0.4169158935546875, 0.458953857421875, 0.5009918212890625, 0.54302978515625, 0.5850677490234375, 0.627105712890625, 0.6691436767578125, 0.711181640625, 0.7532196044921875, 0.795257568359375, 0.8372955322265625, 0.87933349609375, 0.9213714599609375, 0.963409423828125, 1.0054473876953125, 1.0474853515625, 1.0895233154296875, 1.131561279296875, 1.1735992431640625, 1.21563720703125, 1.2576751708984375, 1.299713134765625, 1.3417510986328125, 1.3837890625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 5.0, 1.0, 2.0, 3.0, 1.0, 4.0, 12.0, 12.0, 21.0, 24.0, 83.0, 134.0, 2886.0, 647.0, 113.0, 49.0, 25.0, 17.0, 8.0, 9.0, 8.0, 2.0, 7.0, 3.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.262939453125, -0.24744796752929688, -0.23195648193359375, -0.21646499633789062, -0.2009735107421875, -0.18548202514648438, -0.16999053955078125, -0.15449905395507812, -0.139007568359375, -0.12351608276367188, -0.10802459716796875, -0.09253311157226562, -0.0770416259765625, -0.061550140380859375, -0.04605865478515625, -0.030567169189453125, -0.01507568359375, 0.000415802001953125, 0.01590728759765625, 0.031398773193359375, 0.0468902587890625, 0.062381744384765625, 0.07787322998046875, 0.09336471557617188, 0.108856201171875, 0.12434768676757812, 0.13983917236328125, 0.15533065795898438, 0.1708221435546875, 0.18631362915039062, 0.20180511474609375, 0.21729660034179688, 0.2327880859375, 0.24827957153320312, 0.26377105712890625, 0.2792625427246094, 0.2947540283203125, 0.3102455139160156, 0.32573699951171875, 0.3412284851074219, 0.356719970703125, 0.3722114562988281, 0.38770294189453125, 0.4031944274902344, 0.4186859130859375, 0.4341773986816406, 0.44966888427734375, 0.4651603698730469, 0.48065185546875, 0.4961433410644531, 0.5116348266601562, 0.5271263122558594, 0.5426177978515625, 0.5581092834472656, 0.5736007690429688, 0.5890922546386719, 0.604583740234375, 0.6200752258300781, 0.6355667114257812, 0.6510581970214844, 0.6665496826171875, 0.6820411682128906, 0.6975326538085938, 0.7130241394042969, 0.728515625]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 1.0, 6.0, 10.0, 9.0, 5.0, 20.0, 49.0, 67.0, 112.0, 129.0, 139.0, 113.0, 111.0, 60.0, 63.0, 38.0, 31.0, 15.0, 12.0, 4.0, 2.0, 2.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.53227961063385, -1.471066951751709, -1.4098541736602783, -1.3486413955688477, -1.2874287366867065, -1.2262160778045654, -1.1650032997131348, -1.103790521621704, -1.042577862739563, -0.9813651442527771, -0.9201524257659912, -0.8589397072792053, -0.7977269887924194, -0.7365142703056335, -0.6753015518188477, -0.6140888333320618, -0.5528761148452759, -0.49166339635849, -0.4304506778717041, -0.3692379593849182, -0.3080252408981323, -0.24681252241134644, -0.18559980392456055, -0.12438708543777466, -0.06317436695098877, -0.001961648464202881, 0.05925107002258301, 0.1204637885093689, 0.18167650699615479, 0.24288922548294067, 0.30410194396972656, 0.36531466245651245, 0.4265275001525879, 0.4877402186393738, 0.5489529371261597, 0.6101656556129456, 0.6713783740997314, 0.7325910925865173, 0.7938038110733032, 0.8550165295600891, 0.916229248046875, 0.9774419665336609, 1.0386546850204468, 1.099867343902588, 1.1610801219940186, 1.2222929000854492, 1.2835055589675903, 1.3447182178497314, 1.405930995941162, 1.4671437740325928, 1.5283564329147339, 1.589569091796875, 1.6507818698883057, 1.7119946479797363, 1.7732073068618774, 1.8344199657440186, 1.8956327438354492, 1.9568455219268799, 2.0180583000183105, 2.079270839691162, 2.1404836177825928, 2.2016963958740234, 2.262908935546875, 2.3241217136383057, 2.3853344917297363]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 5.0, 14.0, 7.0, 13.0, 13.0, 20.0, 25.0, 32.0, 45.0, 44.0, 45.0, 48.0, 46.0, 82.0, 65.0, 57.0, 57.0, 57.0, 57.0, 52.0, 42.0, 35.0, 40.0, 25.0, 27.0, 11.0, 10.0, 10.0, 10.0, 2.0, 2.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3468122482299805, -1.3013062477111816, -1.2558001279830933, -1.2102941274642944, -1.164788007736206, -1.1192820072174072, -1.0737760066986084, -1.0282700061798096, -0.9827638864517212, -0.9372578263282776, -0.891751766204834, -0.8462457656860352, -0.8007397055625916, -0.755233645439148, -0.7097276449203491, -0.6642215847969055, -0.6187155246734619, -0.5732094645500183, -0.5277034044265747, -0.4821974039077759, -0.4366913437843323, -0.39118528366088867, -0.34567925333976746, -0.30017322301864624, -0.25466716289520264, -0.20916111767292023, -0.16365507245063782, -0.11814902722835541, -0.072642982006073, -0.02713693678379059, 0.01836910843849182, 0.06387513875961304, 0.10938107967376709, 0.1548871248960495, 0.2003931701183319, 0.24589921534061432, 0.29140526056289673, 0.33691132068634033, 0.38241735100746155, 0.42792338132858276, 0.47342944145202637, 0.51893550157547, 0.5644415616989136, 0.6099475622177124, 0.655453622341156, 0.7009596824645996, 0.7464656829833984, 0.791971743106842, 0.8374778032302856, 0.8829838633537292, 0.9284899234771729, 0.9739959239959717, 1.0195019245147705, 1.0650080442428589, 1.1105140447616577, 1.156020164489746, 1.201526165008545, 1.2470321655273438, 1.2925382852554321, 1.338044285774231, 1.3835504055023193, 1.4290564060211182, 1.474562406539917, 1.5200684070587158, 1.5655745267868042]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 0.0, 1.0, 4.0, 7.0, 10.0, 18.0, 25.0, 44.0, 76.0, 122.0, 211.0, 344.0, 714.0, 1508.0, 3962.0, 12528.0, 47480.0, 196917.0, 452984.0, 246570.0, 61254.0, 15358.0, 4726.0, 1833.0, 850.0, 469.0, 227.0, 119.0, 73.0, 48.0, 29.0, 19.0, 11.0, 7.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.3115234375, -1.2724761962890625, -1.233428955078125, -1.1943817138671875, -1.15533447265625, -1.1162872314453125, -1.077239990234375, -1.0381927490234375, -0.9991455078125, -0.9600982666015625, -0.921051025390625, -0.8820037841796875, -0.84295654296875, -0.8039093017578125, -0.764862060546875, -0.7258148193359375, -0.686767578125, -0.6477203369140625, -0.608673095703125, -0.5696258544921875, -0.53057861328125, -0.4915313720703125, -0.452484130859375, -0.4134368896484375, -0.3743896484375, -0.3353424072265625, -0.296295166015625, -0.2572479248046875, -0.21820068359375, -0.1791534423828125, -0.140106201171875, -0.1010589599609375, -0.06201171875, -0.0229644775390625, 0.016082763671875, 0.0551300048828125, 0.09417724609375, 0.1332244873046875, 0.172271728515625, 0.2113189697265625, 0.2503662109375, 0.2894134521484375, 0.328460693359375, 0.3675079345703125, 0.40655517578125, 0.4456024169921875, 0.484649658203125, 0.5236968994140625, 0.562744140625, 0.6017913818359375, 0.640838623046875, 0.6798858642578125, 0.71893310546875, 0.7579803466796875, 0.797027587890625, 0.8360748291015625, 0.8751220703125, 0.9141693115234375, 0.953216552734375, 0.9922637939453125, 1.03131103515625, 1.0703582763671875, 1.109405517578125, 1.1484527587890625, 1.1875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 10.0, 16.0, 17.0, 23.0, 34.0, 27.0, 42.0, 60.0, 84.0, 68.0, 76.0, 81.0, 88.0, 87.0, 66.0, 60.0, 50.0, 32.0, 24.0, 20.0, 15.0, 7.0, 9.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.828125, -0.804046630859375, -0.77996826171875, -0.755889892578125, -0.7318115234375, -0.707733154296875, -0.68365478515625, -0.659576416015625, -0.635498046875, -0.611419677734375, -0.58734130859375, -0.563262939453125, -0.5391845703125, -0.515106201171875, -0.49102783203125, -0.466949462890625, -0.44287109375, -0.418792724609375, -0.39471435546875, -0.370635986328125, -0.3465576171875, -0.322479248046875, -0.29840087890625, -0.274322509765625, -0.250244140625, -0.226165771484375, -0.20208740234375, -0.178009033203125, -0.1539306640625, -0.129852294921875, -0.10577392578125, -0.081695556640625, -0.0576171875, -0.033538818359375, -0.00946044921875, 0.014617919921875, 0.0386962890625, 0.062774658203125, 0.08685302734375, 0.110931396484375, 0.135009765625, 0.159088134765625, 0.18316650390625, 0.207244873046875, 0.2313232421875, 0.255401611328125, 0.27947998046875, 0.303558349609375, 0.32763671875, 0.351715087890625, 0.37579345703125, 0.399871826171875, 0.4239501953125, 0.448028564453125, 0.47210693359375, 0.496185302734375, 0.520263671875, 0.544342041015625, 0.56842041015625, 0.592498779296875, 0.6165771484375, 0.640655517578125, 0.66473388671875, 0.688812255859375, 0.712890625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 4.0, 10.0, 15.0, 16.0, 16.0, 50.0, 87.0, 153.0, 266.0, 596.0, 1569.0, 6290.0, 49622.0, 628318.0, 331380.0, 24078.0, 3932.0, 1180.0, 474.0, 210.0, 122.0, 57.0, 37.0, 18.0, 17.0, 11.0, 7.0, 6.0, 5.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.091796875, -2.02398681640625, -1.9561767578125, -1.88836669921875, -1.820556640625, -1.75274658203125, -1.6849365234375, -1.61712646484375, -1.54931640625, -1.48150634765625, -1.4136962890625, -1.34588623046875, -1.278076171875, -1.21026611328125, -1.1424560546875, -1.07464599609375, -1.0068359375, -0.93902587890625, -0.8712158203125, -0.80340576171875, -0.735595703125, -0.66778564453125, -0.5999755859375, -0.53216552734375, -0.46435546875, -0.39654541015625, -0.3287353515625, -0.26092529296875, -0.193115234375, -0.12530517578125, -0.0574951171875, 0.01031494140625, 0.078125, 0.14593505859375, 0.2137451171875, 0.28155517578125, 0.349365234375, 0.41717529296875, 0.4849853515625, 0.55279541015625, 0.62060546875, 0.68841552734375, 0.7562255859375, 0.82403564453125, 0.891845703125, 0.95965576171875, 1.0274658203125, 1.09527587890625, 1.1630859375, 1.23089599609375, 1.2987060546875, 1.36651611328125, 1.434326171875, 1.50213623046875, 1.5699462890625, 1.63775634765625, 1.70556640625, 1.77337646484375, 1.8411865234375, 1.90899658203125, 1.976806640625, 2.04461669921875, 2.1124267578125, 2.18023681640625, 2.248046875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 8.0, 16.0, 15.0, 19.0, 34.0, 38.0, 47.0, 68.0, 75.0, 82.0, 99.0, 90.0, 98.0, 69.0, 70.0, 59.0, 49.0, 20.0, 15.0, 15.0, 4.0, 2.0, 6.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-5.16015625, -5.039031982421875, -4.91790771484375, -4.796783447265625, -4.6756591796875, -4.554534912109375, -4.43341064453125, -4.312286376953125, -4.191162109375, -4.070037841796875, -3.94891357421875, -3.827789306640625, -3.7066650390625, -3.585540771484375, -3.46441650390625, -3.343292236328125, -3.22216796875, -3.101043701171875, -2.97991943359375, -2.858795166015625, -2.7376708984375, -2.616546630859375, -2.49542236328125, -2.374298095703125, -2.253173828125, -2.132049560546875, -2.01092529296875, -1.889801025390625, -1.7686767578125, -1.647552490234375, -1.52642822265625, -1.405303955078125, -1.2841796875, -1.163055419921875, -1.04193115234375, -0.920806884765625, -0.7996826171875, -0.678558349609375, -0.55743408203125, -0.436309814453125, -0.315185546875, -0.194061279296875, -0.07293701171875, 0.048187255859375, 0.1693115234375, 0.290435791015625, 0.41156005859375, 0.532684326171875, 0.65380859375, 0.774932861328125, 0.89605712890625, 1.017181396484375, 1.1383056640625, 1.259429931640625, 1.38055419921875, 1.501678466796875, 1.622802734375, 1.743927001953125, 1.86505126953125, 1.986175537109375, 2.1072998046875, 2.228424072265625, 2.34954833984375, 2.470672607421875, 2.591796875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 5.0, 8.0, 21.0, 25.0, 57.0, 99.0, 248.0, 920.0, 5133.0, 97288.0, 911362.0, 29801.0, 2690.0, 521.0, 195.0, 85.0, 40.0, 20.0, 18.0, 14.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6640625, -2.5996246337890625, -2.535186767578125, -2.4707489013671875, -2.40631103515625, -2.3418731689453125, -2.277435302734375, -2.2129974365234375, -2.1485595703125, -2.0841217041015625, -2.019683837890625, -1.9552459716796875, -1.89080810546875, -1.8263702392578125, -1.761932373046875, -1.6974945068359375, -1.633056640625, -1.5686187744140625, -1.504180908203125, -1.4397430419921875, -1.37530517578125, -1.3108673095703125, -1.246429443359375, -1.1819915771484375, -1.1175537109375, -1.0531158447265625, -0.988677978515625, -0.9242401123046875, -0.85980224609375, -0.7953643798828125, -0.730926513671875, -0.6664886474609375, -0.60205078125, -0.5376129150390625, -0.473175048828125, -0.4087371826171875, -0.34429931640625, -0.2798614501953125, -0.215423583984375, -0.1509857177734375, -0.0865478515625, -0.0221099853515625, 0.042327880859375, 0.1067657470703125, 0.17120361328125, 0.2356414794921875, 0.300079345703125, 0.3645172119140625, 0.428955078125, 0.4933929443359375, 0.557830810546875, 0.6222686767578125, 0.68670654296875, 0.7511444091796875, 0.815582275390625, 0.8800201416015625, 0.9444580078125, 1.0088958740234375, 1.073333740234375, 1.1377716064453125, 1.20220947265625, 1.2666473388671875, 1.331085205078125, 1.3955230712890625, 1.4599609375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 7.0, 3.0, 6.0, 10.0, 16.0, 22.0, 36.0, 70.0, 90.0, 130.0, 146.0, 136.0, 115.0, 68.0, 48.0, 33.0, 20.0, 12.0, 13.0, 7.0, 6.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019121170043945312, -0.00018480047583580017, -0.00017838925123214722, -0.00017197802662849426, -0.0001655668020248413, -0.00015915557742118835, -0.0001527443528175354, -0.00014633312821388245, -0.0001399219036102295, -0.00013351067900657654, -0.00012709945440292358, -0.00012068822979927063, -0.00011427700519561768, -0.00010786578059196472, -0.00010145455598831177, -9.504333138465881e-05, -8.863210678100586e-05, -8.22208821773529e-05, -7.580965757369995e-05, -6.9398432970047e-05, -6.298720836639404e-05, -5.657598376274109e-05, -5.0164759159088135e-05, -4.375353455543518e-05, -3.7342309951782227e-05, -3.093108534812927e-05, -2.451986074447632e-05, -1.8108636140823364e-05, -1.169741153717041e-05, -5.286186933517456e-06, 1.125037670135498e-06, 7.536262273788452e-06, 1.3947486877441406e-05, 2.035871148109436e-05, 2.6769936084747314e-05, 3.318116068840027e-05, 3.959238529205322e-05, 4.600360989570618e-05, 5.241483449935913e-05, 5.8826059103012085e-05, 6.523728370666504e-05, 7.164850831031799e-05, 7.805973291397095e-05, 8.44709575176239e-05, 9.088218212127686e-05, 9.729340672492981e-05, 0.00010370463132858276, 0.00011011585593223572, 0.00011652708053588867, 0.00012293830513954163, 0.00012934952974319458, 0.00013576075434684753, 0.0001421719789505005, 0.00014858320355415344, 0.0001549944281578064, 0.00016140565276145935, 0.0001678168773651123, 0.00017422810196876526, 0.0001806393265724182, 0.00018705055117607117, 0.00019346177577972412, 0.00019987300038337708, 0.00020628422498703003, 0.00021269544959068298, 0.00021910667419433594]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 8.0, 13.0, 13.0, 39.0, 74.0, 139.0, 464.0, 2387.0, 31336.0, 932239.0, 77196.0, 3605.0, 659.0, 205.0, 79.0, 47.0, 22.0, 19.0, 5.0, 2.0, 5.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1328125, -2.067413330078125, -2.00201416015625, -1.936614990234375, -1.8712158203125, -1.805816650390625, -1.74041748046875, -1.675018310546875, -1.609619140625, -1.544219970703125, -1.47882080078125, -1.413421630859375, -1.3480224609375, -1.282623291015625, -1.21722412109375, -1.151824951171875, -1.08642578125, -1.021026611328125, -0.95562744140625, -0.890228271484375, -0.8248291015625, -0.759429931640625, -0.69403076171875, -0.628631591796875, -0.563232421875, -0.497833251953125, -0.43243408203125, -0.367034912109375, -0.3016357421875, -0.236236572265625, -0.17083740234375, -0.105438232421875, -0.0400390625, 0.025360107421875, 0.09075927734375, 0.156158447265625, 0.2215576171875, 0.286956787109375, 0.35235595703125, 0.417755126953125, 0.483154296875, 0.548553466796875, 0.61395263671875, 0.679351806640625, 0.7447509765625, 0.810150146484375, 0.87554931640625, 0.940948486328125, 1.00634765625, 1.071746826171875, 1.13714599609375, 1.202545166015625, 1.2679443359375, 1.333343505859375, 1.39874267578125, 1.464141845703125, 1.529541015625, 1.594940185546875, 1.66033935546875, 1.725738525390625, 1.7911376953125, 1.856536865234375, 1.92193603515625, 1.987335205078125, 2.052734375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 12.0, 6.0, 12.0, 23.0, 46.0, 72.0, 111.0, 139.0, 172.0, 134.0, 96.0, 71.0, 49.0, 25.0, 13.0, 9.0, 7.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.87353515625, -0.8232650756835938, -0.7729949951171875, -0.7227249145507812, -0.672454833984375, -0.6221847534179688, -0.5719146728515625, -0.5216445922851562, -0.47137451171875, -0.42110443115234375, -0.3708343505859375, -0.32056427001953125, -0.270294189453125, -0.22002410888671875, -0.1697540283203125, -0.11948394775390625, -0.0692138671875, -0.01894378662109375, 0.0313262939453125, 0.08159637451171875, 0.131866455078125, 0.18213653564453125, 0.2324066162109375, 0.28267669677734375, 0.33294677734375, 0.38321685791015625, 0.4334869384765625, 0.48375701904296875, 0.534027099609375, 0.5842971801757812, 0.6345672607421875, 0.6848373413085938, 0.735107421875, 0.7853775024414062, 0.8356475830078125, 0.8859176635742188, 0.936187744140625, 0.9864578247070312, 1.0367279052734375, 1.0869979858398438, 1.13726806640625, 1.1875381469726562, 1.2378082275390625, 1.2880783081054688, 1.338348388671875, 1.3886184692382812, 1.4388885498046875, 1.4891586303710938, 1.5394287109375, 1.5896987915039062, 1.6399688720703125, 1.6902389526367188, 1.740509033203125, 1.7907791137695312, 1.8410491943359375, 1.8913192749023438, 1.94158935546875, 1.9918594360351562, 2.0421295166015625, 2.0923995971679688, 2.142669677734375, 2.1929397583007812, 2.2432098388671875, 2.2934799194335938, 2.34375]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 10.0, 21.0, 40.0, 97.0, 131.0, 173.0, 200.0, 154.0, 92.0, 41.0, 17.0, 13.0, 8.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.484781265258789, -10.873579025268555, -10.26237678527832, -9.651174545288086, -9.039972305297852, -8.428770065307617, -7.817568778991699, -7.206366539001465, -6.5951642990112305, -5.983962059020996, -5.372759819030762, -4.7615580558776855, -4.150355815887451, -3.539153575897217, -2.9279515743255615, -2.3167495727539062, -1.7055473327636719, -1.094345211982727, -0.4831430912017822, 0.1280590295791626, 0.7392611503601074, 1.3504633903503418, 1.961665391921997, 2.5728673934936523, 3.1840696334838867, 3.795271873474121, 4.4064741134643555, 5.017675876617432, 5.628878116607666, 6.2400803565979, 6.851282119750977, 7.462484359741211, 8.073688507080078, 8.684890747070312, 9.296092987060547, 9.907295227050781, 10.518497467041016, 11.12969970703125, 11.740900993347168, 12.352103233337402, 12.963305473327637, 13.574507713317871, 14.185709953308105, 14.79691219329834, 15.408113479614258, 16.019315719604492, 16.630517959594727, 17.24172019958496, 17.852922439575195, 18.46412467956543, 19.075326919555664, 19.6865291595459, 20.297731399536133, 20.908933639526367, 21.5201358795166, 22.131336212158203, 22.742538452148438, 23.353740692138672, 23.964942932128906, 24.57614517211914, 25.187347412109375, 25.79854965209961, 26.409751892089844, 27.020954132080078, 27.632156372070312]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 3.0, 11.0, 9.0, 9.0, 20.0, 24.0, 25.0, 31.0, 38.0, 31.0, 37.0, 36.0, 50.0, 56.0, 44.0, 64.0, 58.0, 54.0, 61.0, 45.0, 43.0, 37.0, 41.0, 34.0, 29.0, 28.0, 15.0, 20.0, 12.0, 7.0, 9.0, 5.0, 3.0, 2.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.89755916595459, -10.513012886047363, -10.128466606140137, -9.74392032623291, -9.359374046325684, -8.974827766418457, -8.590280532836914, -8.205734252929688, -7.821188449859619, -7.436642169952393, -7.052095890045166, -6.667549133300781, -6.283002853393555, -5.898456573486328, -5.513910293579102, -5.129364013671875, -4.744817733764648, -4.360271453857422, -3.9757251739501953, -3.5911786556243896, -3.206632375717163, -2.8220860958099365, -2.437539577484131, -2.0529932975769043, -1.6684470176696777, -1.2839007377624512, -0.8993543386459351, -0.514807939529419, -0.13026165962219238, 0.2542846202850342, 0.6388311386108398, 1.0233774185180664, 1.4079227447509766, 1.7924690246582031, 2.1770153045654297, 2.5615618228912354, 2.946108102798462, 3.3306543827056885, 3.715200901031494, 4.099747180938721, 4.484293460845947, 4.868839740753174, 5.2533860206604, 5.637932777404785, 6.022479057312012, 6.407025337219238, 6.791571617126465, 7.176117897033691, 7.560664176940918, 7.9452104568481445, 8.329756736755371, 8.714303016662598, 9.098849296569824, 9.48339557647705, 9.867942810058594, 10.25248908996582, 10.637035369873047, 11.021581649780273, 11.4061279296875, 11.790674209594727, 12.175220489501953, 12.55976676940918, 12.944313049316406, 13.328859329223633, 13.71340560913086]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 7.0, 13.0, 9.0, 23.0, 22.0, 29.0, 47.0, 91.0, 130.0, 195.0, 344.0, 587.0, 1190.0, 2730.0, 7827.0, 39597.0, 4091889.0, 36892.0, 7507.0, 2668.0, 1122.0, 557.0, 282.0, 173.0, 129.0, 71.0, 43.0, 33.0, 28.0, 13.0, 12.0, 6.0, 5.0, 2.0, 2.0, 0.0, 3.0, 4.0], "bins": [-3.244140625, -3.1677703857421875, -3.091400146484375, -3.0150299072265625, -2.93865966796875, -2.8622894287109375, -2.785919189453125, -2.7095489501953125, -2.6331787109375, -2.5568084716796875, -2.480438232421875, -2.4040679931640625, -2.32769775390625, -2.2513275146484375, -2.174957275390625, -2.0985870361328125, -2.022216796875, -1.9458465576171875, -1.869476318359375, -1.7931060791015625, -1.71673583984375, -1.6403656005859375, -1.563995361328125, -1.4876251220703125, -1.4112548828125, -1.3348846435546875, -1.258514404296875, -1.1821441650390625, -1.10577392578125, -1.0294036865234375, -0.953033447265625, -0.8766632080078125, -0.80029296875, -0.7239227294921875, -0.647552490234375, -0.5711822509765625, -0.49481201171875, -0.4184417724609375, -0.342071533203125, -0.2657012939453125, -0.1893310546875, -0.1129608154296875, -0.036590576171875, 0.0397796630859375, 0.11614990234375, 0.1925201416015625, 0.268890380859375, 0.3452606201171875, 0.421630859375, 0.4980010986328125, 0.574371337890625, 0.6507415771484375, 0.72711181640625, 0.8034820556640625, 0.879852294921875, 0.9562225341796875, 1.0325927734375, 1.1089630126953125, 1.185333251953125, 1.2617034912109375, 1.33807373046875, 1.4144439697265625, 1.490814208984375, 1.5671844482421875, 1.6435546875]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 5.0, 6.0, 7.0, 10.0, 20.0, 27.0, 29.0, 36.0, 36.0, 44.0, 60.0, 62.0, 69.0, 76.0, 87.0, 70.0, 66.0, 50.0, 55.0, 49.0, 31.0, 27.0, 20.0, 17.0, 14.0, 3.0, 2.0, 4.0, 4.0, 3.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.80224609375, -0.7787017822265625, -0.755157470703125, -0.7316131591796875, -0.70806884765625, -0.6845245361328125, -0.660980224609375, -0.6374359130859375, -0.6138916015625, -0.5903472900390625, -0.566802978515625, -0.5432586669921875, -0.51971435546875, -0.4961700439453125, -0.472625732421875, -0.4490814208984375, -0.425537109375, -0.4019927978515625, -0.378448486328125, -0.3549041748046875, -0.33135986328125, -0.3078155517578125, -0.284271240234375, -0.2607269287109375, -0.2371826171875, -0.2136383056640625, -0.190093994140625, -0.1665496826171875, -0.14300537109375, -0.1194610595703125, -0.095916748046875, -0.0723724365234375, -0.048828125, -0.0252838134765625, -0.001739501953125, 0.0218048095703125, 0.04534912109375, 0.0688934326171875, 0.092437744140625, 0.1159820556640625, 0.1395263671875, 0.1630706787109375, 0.186614990234375, 0.2101593017578125, 0.23370361328125, 0.2572479248046875, 0.280792236328125, 0.3043365478515625, 0.327880859375, 0.3514251708984375, 0.374969482421875, 0.3985137939453125, 0.42205810546875, 0.4456024169921875, 0.469146728515625, 0.4926910400390625, 0.5162353515625, 0.5397796630859375, 0.563323974609375, 0.5868682861328125, 0.61041259765625, 0.6339569091796875, 0.657501220703125, 0.6810455322265625, 0.70458984375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 7.0, 3.0, 2.0, 2.0, 5.0, 11.0, 9.0, 12.0, 15.0, 9.0, 28.0, 34.0, 25.0, 50.0, 73.0, 111.0, 209.0, 433.0, 1083.0, 3757.0, 25840.0, 4121180.0, 34556.0, 4451.0, 1229.0, 463.0, 244.0, 128.0, 67.0, 63.0, 38.0, 24.0, 22.0, 26.0, 17.0, 6.0, 4.0, 6.0, 6.0, 12.0, 7.0, 4.0, 10.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.982421875, -3.852081298828125, -3.72174072265625, -3.591400146484375, -3.4610595703125, -3.330718994140625, -3.20037841796875, -3.070037841796875, -2.939697265625, -2.809356689453125, -2.67901611328125, -2.548675537109375, -2.4183349609375, -2.287994384765625, -2.15765380859375, -2.027313232421875, -1.89697265625, -1.766632080078125, -1.63629150390625, -1.505950927734375, -1.3756103515625, -1.245269775390625, -1.11492919921875, -0.984588623046875, -0.854248046875, -0.723907470703125, -0.59356689453125, -0.463226318359375, -0.3328857421875, -0.202545166015625, -0.07220458984375, 0.058135986328125, 0.1884765625, 0.318817138671875, 0.44915771484375, 0.579498291015625, 0.7098388671875, 0.840179443359375, 0.97052001953125, 1.100860595703125, 1.231201171875, 1.361541748046875, 1.49188232421875, 1.622222900390625, 1.7525634765625, 1.882904052734375, 2.01324462890625, 2.143585205078125, 2.27392578125, 2.404266357421875, 2.53460693359375, 2.664947509765625, 2.7952880859375, 2.925628662109375, 3.05596923828125, 3.186309814453125, 3.316650390625, 3.446990966796875, 3.57733154296875, 3.707672119140625, 3.8380126953125, 3.968353271484375, 4.09869384765625, 4.229034423828125, 4.359375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 7.0, 7.0, 11.0, 26.0, 50.0, 183.0, 3670.0, 71.0, 29.0, 10.0, 8.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.66845703125, -0.6408157348632812, -0.6131744384765625, -0.5855331420898438, -0.557891845703125, -0.5302505493164062, -0.5026092529296875, -0.47496795654296875, -0.44732666015625, -0.41968536376953125, -0.3920440673828125, -0.36440277099609375, -0.336761474609375, -0.30912017822265625, -0.2814788818359375, -0.25383758544921875, -0.2261962890625, -0.19855499267578125, -0.1709136962890625, -0.14327239990234375, -0.115631103515625, -0.08798980712890625, -0.0603485107421875, -0.03270721435546875, -0.00506591796875, 0.02257537841796875, 0.0502166748046875, 0.07785797119140625, 0.105499267578125, 0.13314056396484375, 0.1607818603515625, 0.18842315673828125, 0.216064453125, 0.24370574951171875, 0.2713470458984375, 0.29898834228515625, 0.326629638671875, 0.35427093505859375, 0.3819122314453125, 0.40955352783203125, 0.43719482421875, 0.46483612060546875, 0.4924774169921875, 0.5201187133789062, 0.547760009765625, 0.5754013061523438, 0.6030426025390625, 0.6306838989257812, 0.6583251953125, 0.6859664916992188, 0.7136077880859375, 0.7412490844726562, 0.768890380859375, 0.7965316772460938, 0.8241729736328125, 0.8518142700195312, 0.87945556640625, 0.9070968627929688, 0.9347381591796875, 0.9623794555664062, 0.990020751953125, 1.0176620483398438, 1.0453033447265625, 1.0729446411132812, 1.1005859375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 2.0, 5.0, 7.0, 14.0, 13.0, 11.0, 19.0, 35.0, 37.0, 60.0, 72.0, 92.0, 98.0, 126.0, 86.0, 64.0, 68.0, 54.0, 34.0, 33.0, 24.0, 8.0, 9.0, 6.0, 5.0, 5.0, 4.0, 6.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.9305427074432373, -1.881780982017517, -1.8330192565917969, -1.784257411956787, -1.735495686531067, -1.6867339611053467, -1.637972116470337, -1.5892103910446167, -1.5404486656188965, -1.4916869401931763, -1.442925214767456, -1.3941633701324463, -1.345401644706726, -1.2966399192810059, -1.247878074645996, -1.1991163492202759, -1.1503546237945557, -1.1015928983688354, -1.0528311729431152, -1.0040693283081055, -0.9553076028823853, -0.906545877456665, -0.8577840924263, -0.8090223073959351, -0.7602605819702148, -0.7114988565444946, -0.6627370715141296, -0.6139752864837646, -0.5652135610580444, -0.5164518356323242, -0.46769005060195923, -0.4189282953739166, -0.370166540145874, -0.3214047849178314, -0.2726430296897888, -0.22388127446174622, -0.1751195192337036, -0.126357764005661, -0.07759600877761841, -0.028834253549575806, 0.019927501678466797, 0.0686892569065094, 0.117451012134552, 0.1662127673625946, 0.2149745225906372, 0.2637362778186798, 0.3124980330467224, 0.361259788274765, 0.4100215435028076, 0.4587832987308502, 0.5075450539588928, 0.5563068389892578, 0.605068564414978, 0.6538302898406982, 0.7025920748710632, 0.7513538599014282, 0.8001155853271484, 0.8488773107528687, 0.8976390957832336, 0.9464008808135986, 0.9951626062393188, 1.043924331665039, 1.0926861763000488, 1.141447901725769, 1.1902096271514893]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 4.0, 4.0, 3.0, 3.0, 6.0, 12.0, 8.0, 15.0, 16.0, 16.0, 22.0, 16.0, 30.0, 26.0, 38.0, 32.0, 36.0, 43.0, 41.0, 48.0, 53.0, 40.0, 41.0, 47.0, 43.0, 52.0, 42.0, 42.0, 32.0, 36.0, 22.0, 18.0, 24.0, 18.0, 14.0, 19.0, 6.0, 14.0, 2.0, 7.0, 4.0, 7.0, 5.0, 2.0, 4.0, 1.0], "bins": [-1.3384265899658203, -1.3046557903289795, -1.2708848714828491, -1.2371140718460083, -1.2033432722091675, -1.169572353363037, -1.1358015537261963, -1.1020307540893555, -1.0682599544525146, -1.0344891548156738, -1.0007182359695435, -0.9669474363327026, -0.9331766366958618, -0.8994057774543762, -0.8656349182128906, -0.8318641185760498, -0.7980931997299194, -0.7643223404884338, -0.730551540851593, -0.6967806816101074, -0.6630098819732666, -0.629239022731781, -0.5954681634902954, -0.5616973638534546, -0.527926504611969, -0.4941556751728058, -0.4603848457336426, -0.426613986492157, -0.3928431570529938, -0.35907232761383057, -0.32530146837234497, -0.29153063893318176, -0.2577599287033081, -0.2239890992641449, -0.1902182549238205, -0.1564474105834961, -0.12267658114433289, -0.08890575170516968, -0.055134907364845276, -0.021364063024520874, 0.012406766414642334, 0.04617760330438614, 0.07994844019412994, 0.11371927708387375, 0.14749011397361755, 0.18126094341278076, 0.21503178775310516, 0.24880263209342957, 0.2825734615325928, 0.316344290971756, 0.3501151204109192, 0.3838859796524048, 0.417656809091568, 0.4514276385307312, 0.4851984977722168, 0.5189692974090576, 0.5527401566505432, 0.5865110158920288, 0.6202818155288696, 0.6540526747703552, 0.6878235340118408, 0.7215943336486816, 0.7553651928901672, 0.7891360521316528, 0.8229068517684937]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 2.0, 5.0, 12.0, 11.0, 22.0, 25.0, 35.0, 62.0, 114.0, 173.0, 316.0, 489.0, 911.0, 1793.0, 3588.0, 7619.0, 17206.0, 41243.0, 105611.0, 243422.0, 319040.0, 181151.0, 73260.0, 28970.0, 12272.0, 5474.0, 2619.0, 1318.0, 729.0, 420.0, 244.0, 162.0, 81.0, 48.0, 48.0, 23.0, 15.0, 13.0, 4.0, 6.0, 3.0, 1.0, 2.0, 0.0, 3.0, 3.0], "bins": [-1.0341796875, -1.0071792602539062, -0.9801788330078125, -0.9531784057617188, -0.926177978515625, -0.8991775512695312, -0.8721771240234375, -0.8451766967773438, -0.81817626953125, -0.7911758422851562, -0.7641754150390625, -0.7371749877929688, -0.710174560546875, -0.6831741333007812, -0.6561737060546875, -0.6291732788085938, -0.6021728515625, -0.5751724243164062, -0.5481719970703125, -0.5211715698242188, -0.494171142578125, -0.46717071533203125, -0.4401702880859375, -0.41316986083984375, -0.38616943359375, -0.35916900634765625, -0.3321685791015625, -0.30516815185546875, -0.278167724609375, -0.25116729736328125, -0.2241668701171875, -0.19716644287109375, -0.170166015625, -0.14316558837890625, -0.1161651611328125, -0.08916473388671875, -0.062164306640625, -0.03516387939453125, -0.0081634521484375, 0.01883697509765625, 0.04583740234375, 0.07283782958984375, 0.0998382568359375, 0.12683868408203125, 0.153839111328125, 0.18083953857421875, 0.2078399658203125, 0.23484039306640625, 0.2618408203125, 0.28884124755859375, 0.3158416748046875, 0.34284210205078125, 0.369842529296875, 0.39684295654296875, 0.4238433837890625, 0.45084381103515625, 0.47784423828125, 0.5048446655273438, 0.5318450927734375, 0.5588455200195312, 0.585845947265625, 0.6128463745117188, 0.6398468017578125, 0.6668472290039062, 0.69384765625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 5.0, 11.0, 5.0, 15.0, 18.0, 28.0, 20.0, 25.0, 30.0, 44.0, 45.0, 59.0, 59.0, 61.0, 85.0, 63.0, 47.0, 54.0, 52.0, 53.0, 37.0, 33.0, 25.0, 34.0, 18.0, 20.0, 9.0, 13.0, 5.0, 4.0, 5.0, 3.0, 7.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.78857421875, -0.7654647827148438, -0.7423553466796875, -0.7192459106445312, -0.696136474609375, -0.6730270385742188, -0.6499176025390625, -0.6268081665039062, -0.60369873046875, -0.5805892944335938, -0.5574798583984375, -0.5343704223632812, -0.511260986328125, -0.48815155029296875, -0.4650421142578125, -0.44193267822265625, -0.4188232421875, -0.39571380615234375, -0.3726043701171875, -0.34949493408203125, -0.326385498046875, -0.30327606201171875, -0.2801666259765625, -0.25705718994140625, -0.23394775390625, -0.21083831787109375, -0.1877288818359375, -0.16461944580078125, -0.141510009765625, -0.11840057373046875, -0.0952911376953125, -0.07218170166015625, -0.049072265625, -0.02596282958984375, -0.0028533935546875, 0.02025604248046875, 0.043365478515625, 0.06647491455078125, 0.0895843505859375, 0.11269378662109375, 0.13580322265625, 0.15891265869140625, 0.1820220947265625, 0.20513153076171875, 0.228240966796875, 0.25135040283203125, 0.2744598388671875, 0.29756927490234375, 0.3206787109375, 0.34378814697265625, 0.3668975830078125, 0.39000701904296875, 0.413116455078125, 0.43622589111328125, 0.4593353271484375, 0.48244476318359375, 0.50555419921875, 0.5286636352539062, 0.5517730712890625, 0.5748825073242188, 0.597991943359375, 0.6211013793945312, 0.6442108154296875, 0.6673202514648438, 0.6904296875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 7.0, 7.0, 4.0, 12.0, 18.0, 22.0, 26.0, 47.0, 55.0, 75.0, 114.0, 187.0, 318.0, 614.0, 1460.0, 4375.0, 18701.0, 114995.0, 609957.0, 249982.0, 36141.0, 7358.0, 2127.0, 828.0, 413.0, 204.0, 154.0, 85.0, 71.0, 41.0, 29.0, 31.0, 25.0, 18.0, 8.0, 11.0, 11.0, 7.0, 4.0, 4.0, 2.0, 4.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.66796875, -1.6153411865234375, -1.562713623046875, -1.5100860595703125, -1.45745849609375, -1.4048309326171875, -1.352203369140625, -1.2995758056640625, -1.2469482421875, -1.1943206787109375, -1.141693115234375, -1.0890655517578125, -1.03643798828125, -0.9838104248046875, -0.931182861328125, -0.8785552978515625, -0.825927734375, -0.7733001708984375, -0.720672607421875, -0.6680450439453125, -0.61541748046875, -0.5627899169921875, -0.510162353515625, -0.4575347900390625, -0.4049072265625, -0.3522796630859375, -0.299652099609375, -0.2470245361328125, -0.19439697265625, -0.1417694091796875, -0.089141845703125, -0.0365142822265625, 0.01611328125, 0.0687408447265625, 0.121368408203125, 0.1739959716796875, 0.22662353515625, 0.2792510986328125, 0.331878662109375, 0.3845062255859375, 0.4371337890625, 0.4897613525390625, 0.542388916015625, 0.5950164794921875, 0.64764404296875, 0.7002716064453125, 0.752899169921875, 0.8055267333984375, 0.858154296875, 0.9107818603515625, 0.963409423828125, 1.0160369873046875, 1.06866455078125, 1.1212921142578125, 1.173919677734375, 1.2265472412109375, 1.2791748046875, 1.3318023681640625, 1.384429931640625, 1.4370574951171875, 1.48968505859375, 1.5423126220703125, 1.594940185546875, 1.6475677490234375, 1.7001953125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 0.0, 5.0, 7.0, 5.0, 4.0, 10.0, 19.0, 26.0, 22.0, 24.0, 34.0, 33.0, 41.0, 45.0, 49.0, 56.0, 44.0, 60.0, 61.0, 57.0, 60.0, 38.0, 42.0, 45.0, 40.0, 30.0, 29.0, 28.0, 24.0, 15.0, 13.0, 12.0, 5.0, 6.0, 2.0, 5.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.30078125, -3.197723388671875, -3.09466552734375, -2.991607666015625, -2.8885498046875, -2.785491943359375, -2.68243408203125, -2.579376220703125, -2.476318359375, -2.373260498046875, -2.27020263671875, -2.167144775390625, -2.0640869140625, -1.961029052734375, -1.85797119140625, -1.754913330078125, -1.65185546875, -1.548797607421875, -1.44573974609375, -1.342681884765625, -1.2396240234375, -1.136566162109375, -1.03350830078125, -0.930450439453125, -0.827392578125, -0.724334716796875, -0.62127685546875, -0.518218994140625, -0.4151611328125, -0.312103271484375, -0.20904541015625, -0.105987548828125, -0.0029296875, 0.100128173828125, 0.20318603515625, 0.306243896484375, 0.4093017578125, 0.512359619140625, 0.61541748046875, 0.718475341796875, 0.821533203125, 0.924591064453125, 1.02764892578125, 1.130706787109375, 1.2337646484375, 1.336822509765625, 1.43988037109375, 1.542938232421875, 1.64599609375, 1.749053955078125, 1.85211181640625, 1.955169677734375, 2.0582275390625, 2.161285400390625, 2.26434326171875, 2.367401123046875, 2.470458984375, 2.573516845703125, 2.67657470703125, 2.779632568359375, 2.8826904296875, 2.985748291015625, 3.08880615234375, 3.191864013671875, 3.294921875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 6.0, 1.0, 4.0, 2.0, 4.0, 14.0, 17.0, 18.0, 50.0, 102.0, 283.0, 1054.0, 7289.0, 764220.0, 269615.0, 4620.0, 838.0, 239.0, 70.0, 49.0, 21.0, 18.0, 9.0, 11.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8125, -2.73193359375, -2.6513671875, -2.57080078125, -2.490234375, -2.40966796875, -2.3291015625, -2.24853515625, -2.16796875, -2.08740234375, -2.0068359375, -1.92626953125, -1.845703125, -1.76513671875, -1.6845703125, -1.60400390625, -1.5234375, -1.44287109375, -1.3623046875, -1.28173828125, -1.201171875, -1.12060546875, -1.0400390625, -0.95947265625, -0.87890625, -0.79833984375, -0.7177734375, -0.63720703125, -0.556640625, -0.47607421875, -0.3955078125, -0.31494140625, -0.234375, -0.15380859375, -0.0732421875, 0.00732421875, 0.087890625, 0.16845703125, 0.2490234375, 0.32958984375, 0.41015625, 0.49072265625, 0.5712890625, 0.65185546875, 0.732421875, 0.81298828125, 0.8935546875, 0.97412109375, 1.0546875, 1.13525390625, 1.2158203125, 1.29638671875, 1.376953125, 1.45751953125, 1.5380859375, 1.61865234375, 1.69921875, 1.77978515625, 1.8603515625, 1.94091796875, 2.021484375, 2.10205078125, 2.1826171875, 2.26318359375, 2.34375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 6.0, 6.0, 14.0, 11.0, 28.0, 31.0, 57.0, 65.0, 92.0, 110.0, 110.0, 115.0, 101.0, 88.0, 60.0, 36.0, 17.0, 21.0, 9.0, 4.0, 6.0, 3.0, 5.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0001811981201171875, -0.00017610937356948853, -0.00017102062702178955, -0.00016593188047409058, -0.0001608431339263916, -0.00015575438737869263, -0.00015066564083099365, -0.00014557689428329468, -0.0001404881477355957, -0.00013539940118789673, -0.00013031065464019775, -0.00012522190809249878, -0.0001201331615447998, -0.00011504441499710083, -0.00010995566844940186, -0.00010486692190170288, -9.97781753540039e-05, -9.468942880630493e-05, -8.960068225860596e-05, -8.451193571090698e-05, -7.942318916320801e-05, -7.433444261550903e-05, -6.924569606781006e-05, -6.415694952011108e-05, -5.906820297241211e-05, -5.3979456424713135e-05, -4.889070987701416e-05, -4.3801963329315186e-05, -3.871321678161621e-05, -3.3624470233917236e-05, -2.8535723686218262e-05, -2.3446977138519287e-05, -1.8358230590820312e-05, -1.3269484043121338e-05, -8.180737495422363e-06, -3.0919909477233887e-06, 1.996755599975586e-06, 7.0855021476745605e-06, 1.2174248695373535e-05, 1.726299524307251e-05, 2.2351741790771484e-05, 2.744048833847046e-05, 3.2529234886169434e-05, 3.761798143386841e-05, 4.270672798156738e-05, 4.779547452926636e-05, 5.288422107696533e-05, 5.797296762466431e-05, 6.306171417236328e-05, 6.815046072006226e-05, 7.323920726776123e-05, 7.83279538154602e-05, 8.341670036315918e-05, 8.850544691085815e-05, 9.359419345855713e-05, 9.86829400062561e-05, 0.00010377168655395508, 0.00010886043310165405, 0.00011394917964935303, 0.000119037926197052, 0.00012412667274475098, 0.00012921541929244995, 0.00013430416584014893, 0.0001393929123878479, 0.00014448165893554688]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 8.0, 9.0, 22.0, 20.0, 52.0, 116.0, 190.0, 497.0, 1536.0, 6567.0, 66924.0, 887791.0, 75285.0, 6947.0, 1647.0, 494.0, 215.0, 102.0, 59.0, 28.0, 14.0, 13.0, 3.0, 8.0, 4.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.951171875, -1.90301513671875, -1.8548583984375, -1.80670166015625, -1.758544921875, -1.71038818359375, -1.6622314453125, -1.61407470703125, -1.56591796875, -1.51776123046875, -1.4696044921875, -1.42144775390625, -1.373291015625, -1.32513427734375, -1.2769775390625, -1.22882080078125, -1.1806640625, -1.13250732421875, -1.0843505859375, -1.03619384765625, -0.988037109375, -0.93988037109375, -0.8917236328125, -0.84356689453125, -0.79541015625, -0.74725341796875, -0.6990966796875, -0.65093994140625, -0.602783203125, -0.55462646484375, -0.5064697265625, -0.45831298828125, -0.41015625, -0.36199951171875, -0.3138427734375, -0.26568603515625, -0.217529296875, -0.16937255859375, -0.1212158203125, -0.07305908203125, -0.02490234375, 0.02325439453125, 0.0714111328125, 0.11956787109375, 0.167724609375, 0.21588134765625, 0.2640380859375, 0.31219482421875, 0.3603515625, 0.40850830078125, 0.4566650390625, 0.50482177734375, 0.552978515625, 0.60113525390625, 0.6492919921875, 0.69744873046875, 0.74560546875, 0.79376220703125, 0.8419189453125, 0.89007568359375, 0.938232421875, 0.98638916015625, 1.0345458984375, 1.08270263671875, 1.130859375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 2.0, 1.0, 5.0, 7.0, 3.0, 5.0, 5.0, 8.0, 23.0, 29.0, 58.0, 97.0, 180.0, 197.0, 139.0, 103.0, 52.0, 28.0, 10.0, 12.0, 7.0, 3.0, 3.0, 4.0, 5.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.5322265625, -1.4740447998046875, -1.415863037109375, -1.3576812744140625, -1.29949951171875, -1.2413177490234375, -1.183135986328125, -1.1249542236328125, -1.0667724609375, -1.0085906982421875, -0.950408935546875, -0.8922271728515625, -0.83404541015625, -0.7758636474609375, -0.717681884765625, -0.6595001220703125, -0.601318359375, -0.5431365966796875, -0.484954833984375, -0.4267730712890625, -0.36859130859375, -0.3104095458984375, -0.252227783203125, -0.1940460205078125, -0.1358642578125, -0.0776824951171875, -0.019500732421875, 0.0386810302734375, 0.09686279296875, 0.1550445556640625, 0.213226318359375, 0.2714080810546875, 0.32958984375, 0.3877716064453125, 0.445953369140625, 0.5041351318359375, 0.56231689453125, 0.6204986572265625, 0.678680419921875, 0.7368621826171875, 0.7950439453125, 0.8532257080078125, 0.911407470703125, 0.9695892333984375, 1.02777099609375, 1.0859527587890625, 1.144134521484375, 1.2023162841796875, 1.260498046875, 1.3186798095703125, 1.376861572265625, 1.4350433349609375, 1.49322509765625, 1.5514068603515625, 1.609588623046875, 1.6677703857421875, 1.7259521484375, 1.7841339111328125, 1.842315673828125, 1.9004974365234375, 1.95867919921875, 2.0168609619140625, 2.075042724609375, 2.1332244873046875, 2.19140625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 0.0, 10.0, 26.0, 58.0, 142.0, 236.0, 247.0, 170.0, 70.0, 30.0, 10.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.619155883789062, -25.79039192199707, -24.96162986755371, -24.13286590576172, -23.304101943969727, -22.475339889526367, -21.646575927734375, -20.817813873291016, -19.989049911499023, -19.16028594970703, -18.331523895263672, -17.50275993347168, -16.673995971679688, -15.845233917236328, -15.016469955444336, -14.18770694732666, -13.358942985534668, -12.530179977416992, -11.701416015625, -10.872653007507324, -10.043889999389648, -9.215126037597656, -8.38636302947998, -7.557600021362305, -6.728836536407471, -5.900073051452637, -5.071310043334961, -4.242546558380127, -3.413783311843872, -2.585020065307617, -1.7562565803527832, -0.9274935722351074, -0.09873008728027344, 0.7300332188606262, 1.5587965250015259, 2.3875598907470703, 3.216323137283325, 4.04508638381958, 4.873849868774414, 5.70261287689209, 6.531376361846924, 7.360139846801758, 8.188902854919434, 9.01766586303711, 9.846429824829102, 10.675192832946777, 11.503955841064453, 12.332719802856445, 13.161482810974121, 13.990245819091797, 14.819009780883789, 15.647772789001465, 16.47653579711914, 17.305299758911133, 18.134063720703125, 18.962825775146484, 19.791589736938477, 20.62035369873047, 21.449115753173828, 22.27787971496582, 23.106643676757812, 23.935405731201172, 24.764169692993164, 25.592933654785156, 26.421695709228516]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 5.0, 5.0, 4.0, 10.0, 13.0, 7.0, 21.0, 20.0, 31.0, 30.0, 48.0, 56.0, 62.0, 72.0, 72.0, 77.0, 75.0, 70.0, 57.0, 49.0, 36.0, 43.0, 27.0, 26.0, 17.0, 31.0, 20.0, 10.0, 3.0, 10.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.770374298095703, -21.159971237182617, -20.54956817626953, -19.939165115356445, -19.32876205444336, -18.718360900878906, -18.10795783996582, -17.497554779052734, -16.88715171813965, -16.276748657226562, -15.666345596313477, -15.055943489074707, -14.445540428161621, -13.835137367248535, -13.224735260009766, -12.61433219909668, -12.003929138183594, -11.393526077270508, -10.783123016357422, -10.172720909118652, -9.562317848205566, -8.95191478729248, -8.341512680053711, -7.731109619140625, -7.120706558227539, -6.510303497314453, -5.899900913238525, -5.289498329162598, -4.679095268249512, -4.068692207336426, -3.458289623260498, -2.8478870391845703, -2.2374820709228516, -1.6270792484283447, -1.016676425933838, -0.40627360343933105, 0.20412921905517578, 0.8145320415496826, 1.4249348640441895, 2.035337448120117, 2.645740509033203, 3.25614333152771, 3.866546154022217, 4.4769487380981445, 5.0873517990112305, 5.697754859924316, 6.308157444000244, 6.918560028076172, 7.528963088989258, 8.139366149902344, 8.74976921081543, 9.3601713180542, 9.970574378967285, 10.580977439880371, 11.19137954711914, 11.801782608032227, 12.412185668945312, 13.022588729858398, 13.632991790771484, 14.243393898010254, 14.85379695892334, 15.464200019836426, 16.074602127075195, 16.68500518798828, 17.295408248901367]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 3.0, 10.0, 7.0, 6.0, 17.0, 22.0, 18.0, 40.0, 56.0, 41.0, 87.0, 118.0, 156.0, 262.0, 400.0, 712.0, 1286.0, 2720.0, 6732.0, 21509.0, 151597.0, 3936943.0, 51127.0, 11907.0, 4265.0, 1871.0, 953.0, 521.0, 302.0, 177.0, 108.0, 81.0, 58.0, 46.0, 27.0, 22.0, 12.0, 17.0, 15.0, 8.0, 6.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-1.9599609375, -1.9073638916015625, -1.854766845703125, -1.8021697998046875, -1.74957275390625, -1.6969757080078125, -1.644378662109375, -1.5917816162109375, -1.5391845703125, -1.4865875244140625, -1.433990478515625, -1.3813934326171875, -1.32879638671875, -1.2761993408203125, -1.223602294921875, -1.1710052490234375, -1.118408203125, -1.0658111572265625, -1.013214111328125, -0.9606170654296875, -0.90802001953125, -0.8554229736328125, -0.802825927734375, -0.7502288818359375, -0.6976318359375, -0.6450347900390625, -0.592437744140625, -0.5398406982421875, -0.48724365234375, -0.4346466064453125, -0.382049560546875, -0.3294525146484375, -0.27685546875, -0.2242584228515625, -0.171661376953125, -0.1190643310546875, -0.06646728515625, -0.0138702392578125, 0.038726806640625, 0.0913238525390625, 0.1439208984375, 0.1965179443359375, 0.249114990234375, 0.3017120361328125, 0.35430908203125, 0.4069061279296875, 0.459503173828125, 0.5121002197265625, 0.564697265625, 0.6172943115234375, 0.669891357421875, 0.7224884033203125, 0.77508544921875, 0.8276824951171875, 0.880279541015625, 0.9328765869140625, 0.9854736328125, 1.0380706787109375, 1.090667724609375, 1.1432647705078125, 1.19586181640625, 1.2484588623046875, 1.301055908203125, 1.3536529541015625, 1.40625]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 4.0, 11.0, 7.0, 7.0, 10.0, 14.0, 41.0, 50.0, 65.0, 78.0, 128.0, 127.0, 108.0, 104.0, 78.0, 59.0, 32.0, 26.0, 17.0, 15.0, 7.0, 7.0, 4.0, 4.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0], "bins": [-1.9111328125, -1.8692169189453125, -1.827301025390625, -1.7853851318359375, -1.74346923828125, -1.7015533447265625, -1.659637451171875, -1.6177215576171875, -1.5758056640625, -1.5338897705078125, -1.491973876953125, -1.4500579833984375, -1.40814208984375, -1.3662261962890625, -1.324310302734375, -1.2823944091796875, -1.240478515625, -1.1985626220703125, -1.156646728515625, -1.1147308349609375, -1.07281494140625, -1.0308990478515625, -0.988983154296875, -0.9470672607421875, -0.9051513671875, -0.8632354736328125, -0.821319580078125, -0.7794036865234375, -0.73748779296875, -0.6955718994140625, -0.653656005859375, -0.6117401123046875, -0.56982421875, -0.5279083251953125, -0.485992431640625, -0.4440765380859375, -0.40216064453125, -0.3602447509765625, -0.318328857421875, -0.2764129638671875, -0.2344970703125, -0.1925811767578125, -0.150665283203125, -0.1087493896484375, -0.06683349609375, -0.0249176025390625, 0.016998291015625, 0.0589141845703125, 0.100830078125, 0.1427459716796875, 0.184661865234375, 0.2265777587890625, 0.26849365234375, 0.3104095458984375, 0.352325439453125, 0.3942413330078125, 0.4361572265625, 0.4780731201171875, 0.519989013671875, 0.5619049072265625, 0.60382080078125, 0.6457366943359375, 0.687652587890625, 0.7295684814453125, 0.771484375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 7.0, 5.0, 7.0, 7.0, 10.0, 16.0, 18.0, 24.0, 44.0, 45.0, 69.0, 81.0, 121.0, 148.0, 227.0, 291.0, 426.0, 642.0, 1266.0, 3460.0, 14911.0, 199065.0, 3928654.0, 34572.0, 5752.0, 1816.0, 809.0, 445.0, 346.0, 252.0, 176.0, 131.0, 104.0, 85.0, 60.0, 49.0, 38.0, 25.0, 18.0, 15.0, 9.0, 11.0, 9.0, 3.0, 2.0, 6.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.5078125, -2.42193603515625, -2.3360595703125, -2.25018310546875, -2.164306640625, -2.07843017578125, -1.9925537109375, -1.90667724609375, -1.82080078125, -1.73492431640625, -1.6490478515625, -1.56317138671875, -1.477294921875, -1.39141845703125, -1.3055419921875, -1.21966552734375, -1.1337890625, -1.04791259765625, -0.9620361328125, -0.87615966796875, -0.790283203125, -0.70440673828125, -0.6185302734375, -0.53265380859375, -0.44677734375, -0.36090087890625, -0.2750244140625, -0.18914794921875, -0.103271484375, -0.01739501953125, 0.0684814453125, 0.15435791015625, 0.240234375, 0.32611083984375, 0.4119873046875, 0.49786376953125, 0.583740234375, 0.66961669921875, 0.7554931640625, 0.84136962890625, 0.92724609375, 1.01312255859375, 1.0989990234375, 1.18487548828125, 1.270751953125, 1.35662841796875, 1.4425048828125, 1.52838134765625, 1.6142578125, 1.70013427734375, 1.7860107421875, 1.87188720703125, 1.957763671875, 2.04364013671875, 2.1295166015625, 2.21539306640625, 2.30126953125, 2.38714599609375, 2.4730224609375, 2.55889892578125, 2.644775390625, 2.73065185546875, 2.8165283203125, 2.90240478515625, 2.98828125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 11.0, 23.0, 39.0, 94.0, 355.0, 3312.0, 152.0, 51.0, 18.0, 8.0, 6.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.30859375, -1.2567138671875, -1.204833984375, -1.1529541015625, -1.10107421875, -1.0491943359375, -0.997314453125, -0.9454345703125, -0.8935546875, -0.8416748046875, -0.789794921875, -0.7379150390625, -0.68603515625, -0.6341552734375, -0.582275390625, -0.5303955078125, -0.478515625, -0.4266357421875, -0.374755859375, -0.3228759765625, -0.27099609375, -0.2191162109375, -0.167236328125, -0.1153564453125, -0.0634765625, -0.0115966796875, 0.040283203125, 0.0921630859375, 0.14404296875, 0.1959228515625, 0.247802734375, 0.2996826171875, 0.3515625, 0.4034423828125, 0.455322265625, 0.5072021484375, 0.55908203125, 0.6109619140625, 0.662841796875, 0.7147216796875, 0.7666015625, 0.8184814453125, 0.870361328125, 0.9222412109375, 0.97412109375, 1.0260009765625, 1.077880859375, 1.1297607421875, 1.181640625, 1.2335205078125, 1.285400390625, 1.3372802734375, 1.38916015625, 1.4410400390625, 1.492919921875, 1.5447998046875, 1.5966796875, 1.6485595703125, 1.700439453125, 1.7523193359375, 1.80419921875, 1.8560791015625, 1.907958984375, 1.9598388671875, 2.01171875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 6.0, 6.0, 19.0, 28.0, 56.0, 77.0, 120.0, 165.0, 184.0, 161.0, 77.0, 51.0, 24.0, 15.0, 9.0, 4.0, 6.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.152436256408691, -3.9816713333129883, -3.810906171798706, -3.640141248703003, -3.4693763256073, -3.2986111640930176, -3.1278462409973145, -2.9570813179016113, -2.786316394805908, -2.615551471710205, -2.444786310195923, -2.2740213871002197, -2.1032564640045166, -1.932491421699524, -1.7617263793945312, -1.5909614562988281, -1.420196294784546, -1.2494312524795532, -1.07866632938385, -0.9079012870788574, -0.7371363043785095, -0.5663713216781616, -0.39560627937316895, -0.22484135627746582, -0.054076313972473145, 0.11668868362903595, 0.28745368123054504, 0.45821869373321533, 0.6289836764335632, 0.7997486591339111, 0.9705137014389038, 1.141278624534607, 1.3120436668395996, 1.4828087091445923, 1.6535736322402954, 1.824338674545288, 1.9951035976409912, 2.1658687591552734, 2.3366336822509766, 2.5073986053466797, 2.678163528442383, 2.848928451538086, 3.019693613052368, 3.1904585361480713, 3.3612234592437744, 3.5319886207580566, 3.7027535438537598, 3.873518466949463, 4.044283866882324, 4.215048789978027, 4.3858137130737305, 4.556578636169434, 4.727344036102295, 4.898108959197998, 5.068873882293701, 5.239638805389404, 5.410403728485107, 5.5811686515808105, 5.751933574676514, 5.922698974609375, 6.093463897705078, 6.264228820800781, 6.434993743896484, 6.6057586669921875, 6.776523590087891]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 6.0, 3.0, 4.0, 1.0, 5.0, 11.0, 7.0, 13.0, 12.0, 23.0, 31.0, 35.0, 36.0, 48.0, 44.0, 44.0, 52.0, 49.0, 57.0, 59.0, 60.0, 51.0, 53.0, 48.0, 35.0, 40.0, 33.0, 43.0, 14.0, 20.0, 19.0, 12.0, 9.0, 7.0, 2.0, 7.0, 6.0, 4.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-3.3887202739715576, -3.2974400520324707, -3.206159830093384, -3.114879608154297, -3.023599624633789, -2.932319402694702, -2.8410391807556152, -2.7497589588165283, -2.6584787368774414, -2.5671985149383545, -2.4759182929992676, -2.3846383094787598, -2.293358087539673, -2.202077865600586, -2.110797643661499, -2.019517421722412, -1.9282374382019043, -1.8369572162628174, -1.74567711353302, -1.654396891593933, -1.5631167888641357, -1.4718365669250488, -1.380556344985962, -1.289276123046875, -1.1979960203170776, -1.1067157983779907, -1.0154356956481934, -0.9241554737091064, -0.8328753113746643, -0.7415951490402222, -0.6503149271011353, -0.5590347647666931, -0.4677543640136719, -0.37647420167922974, -0.2851940095424652, -0.19391381740570068, -0.10263365507125854, -0.011353492736816406, 0.07992672920227051, 0.17120689153671265, 0.2624870538711548, 0.3537672162055969, 0.44504740834236145, 0.536327600479126, 0.6276077628135681, 0.7188879251480103, 0.8101681470870972, 0.9014483094215393, 0.9927284717559814, 1.0840086936950684, 1.1752887964248657, 1.2665690183639526, 1.35784912109375, 1.449129343032837, 1.5404095649719238, 1.6316897869110107, 1.722969889640808, 1.814250111579895, 1.9055302143096924, 1.9968104362487793, 2.088090658187866, 2.179370880126953, 2.270650863647461, 2.361931085586548, 2.4532113075256348]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 12.0, 9.0, 13.0, 24.0, 26.0, 48.0, 105.0, 179.0, 342.0, 832.0, 2472.0, 8889.0, 45698.0, 293943.0, 552096.0, 117193.0, 19543.0, 4565.0, 1496.0, 526.0, 250.0, 125.0, 71.0, 35.0, 24.0, 16.0, 9.0, 6.0, 7.0, 5.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7626953125, -1.7024383544921875, -1.642181396484375, -1.5819244384765625, -1.52166748046875, -1.4614105224609375, -1.401153564453125, -1.3408966064453125, -1.2806396484375, -1.2203826904296875, -1.160125732421875, -1.0998687744140625, -1.03961181640625, -0.9793548583984375, -0.919097900390625, -0.8588409423828125, -0.798583984375, -0.7383270263671875, -0.678070068359375, -0.6178131103515625, -0.55755615234375, -0.4972991943359375, -0.437042236328125, -0.3767852783203125, -0.3165283203125, -0.2562713623046875, -0.196014404296875, -0.1357574462890625, -0.07550048828125, -0.0152435302734375, 0.045013427734375, 0.1052703857421875, 0.16552734375, 0.2257843017578125, 0.286041259765625, 0.3462982177734375, 0.40655517578125, 0.4668121337890625, 0.527069091796875, 0.5873260498046875, 0.6475830078125, 0.7078399658203125, 0.768096923828125, 0.8283538818359375, 0.88861083984375, 0.9488677978515625, 1.009124755859375, 1.0693817138671875, 1.129638671875, 1.1898956298828125, 1.250152587890625, 1.3104095458984375, 1.37066650390625, 1.4309234619140625, 1.491180419921875, 1.5514373779296875, 1.6116943359375, 1.6719512939453125, 1.732208251953125, 1.7924652099609375, 1.85272216796875, 1.9129791259765625, 1.973236083984375, 2.0334930419921875, 2.09375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 7.0, 4.0, 11.0, 11.0, 18.0, 19.0, 45.0, 69.0, 77.0, 95.0, 87.0, 105.0, 100.0, 82.0, 70.0, 52.0, 40.0, 38.0, 25.0, 14.0, 11.0, 7.0, 3.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.6337890625, -1.5943832397460938, -1.5549774169921875, -1.5155715942382812, -1.476165771484375, -1.4367599487304688, -1.3973541259765625, -1.3579483032226562, -1.31854248046875, -1.2791366577148438, -1.2397308349609375, -1.2003250122070312, -1.160919189453125, -1.1215133666992188, -1.0821075439453125, -1.0427017211914062, -1.0032958984375, -0.9638900756835938, -0.9244842529296875, -0.8850784301757812, -0.845672607421875, -0.8062667846679688, -0.7668609619140625, -0.7274551391601562, -0.68804931640625, -0.6486434936523438, -0.6092376708984375, -0.5698318481445312, -0.530426025390625, -0.49102020263671875, -0.4516143798828125, -0.41220855712890625, -0.372802734375, -0.33339691162109375, -0.2939910888671875, -0.25458526611328125, -0.215179443359375, -0.17577362060546875, -0.1363677978515625, -0.09696197509765625, -0.05755615234375, -0.01815032958984375, 0.0212554931640625, 0.06066131591796875, 0.100067138671875, 0.13947296142578125, 0.1788787841796875, 0.21828460693359375, 0.2576904296875, 0.29709625244140625, 0.3365020751953125, 0.37590789794921875, 0.415313720703125, 0.45471954345703125, 0.4941253662109375, 0.5335311889648438, 0.57293701171875, 0.6123428344726562, 0.6517486572265625, 0.6911544799804688, 0.730560302734375, 0.7699661254882812, 0.8093719482421875, 0.8487777709960938, 0.88818359375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 11.0, 9.0, 23.0, 30.0, 56.0, 111.0, 190.0, 466.0, 1088.0, 3779.0, 28844.0, 576589.0, 411475.0, 20935.0, 3183.0, 958.0, 397.0, 187.0, 102.0, 51.0, 33.0, 20.0, 9.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.30859375, -3.219024658203125, -3.12945556640625, -3.039886474609375, -2.9503173828125, -2.860748291015625, -2.77117919921875, -2.681610107421875, -2.592041015625, -2.502471923828125, -2.41290283203125, -2.323333740234375, -2.2337646484375, -2.144195556640625, -2.05462646484375, -1.965057373046875, -1.87548828125, -1.785919189453125, -1.69635009765625, -1.606781005859375, -1.5172119140625, -1.427642822265625, -1.33807373046875, -1.248504638671875, -1.158935546875, -1.069366455078125, -0.97979736328125, -0.890228271484375, -0.8006591796875, -0.711090087890625, -0.62152099609375, -0.531951904296875, -0.4423828125, -0.352813720703125, -0.26324462890625, -0.173675537109375, -0.0841064453125, 0.005462646484375, 0.09503173828125, 0.184600830078125, 0.274169921875, 0.363739013671875, 0.45330810546875, 0.542877197265625, 0.6324462890625, 0.722015380859375, 0.81158447265625, 0.901153564453125, 0.99072265625, 1.080291748046875, 1.16986083984375, 1.259429931640625, 1.3489990234375, 1.438568115234375, 1.52813720703125, 1.617706298828125, 1.707275390625, 1.796844482421875, 1.88641357421875, 1.975982666015625, 2.0655517578125, 2.155120849609375, 2.24468994140625, 2.334259033203125, 2.423828125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 8.0, 10.0, 13.0, 12.0, 12.0, 20.0, 17.0, 22.0, 39.0, 38.0, 54.0, 49.0, 60.0, 46.0, 59.0, 64.0, 59.0, 53.0, 64.0, 45.0, 42.0, 37.0, 43.0, 31.0, 28.0, 19.0, 10.0, 12.0, 12.0, 8.0, 7.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-4.12890625, -4.028045654296875, -3.92718505859375, -3.826324462890625, -3.7254638671875, -3.624603271484375, -3.52374267578125, -3.422882080078125, -3.322021484375, -3.221160888671875, -3.12030029296875, -3.019439697265625, -2.9185791015625, -2.817718505859375, -2.71685791015625, -2.615997314453125, -2.51513671875, -2.414276123046875, -2.31341552734375, -2.212554931640625, -2.1116943359375, -2.010833740234375, -1.90997314453125, -1.809112548828125, -1.708251953125, -1.607391357421875, -1.50653076171875, -1.405670166015625, -1.3048095703125, -1.203948974609375, -1.10308837890625, -1.002227783203125, -0.9013671875, -0.800506591796875, -0.69964599609375, -0.598785400390625, -0.4979248046875, -0.397064208984375, -0.29620361328125, -0.195343017578125, -0.094482421875, 0.006378173828125, 0.10723876953125, 0.208099365234375, 0.3089599609375, 0.409820556640625, 0.51068115234375, 0.611541748046875, 0.71240234375, 0.813262939453125, 0.91412353515625, 1.014984130859375, 1.1158447265625, 1.216705322265625, 1.31756591796875, 1.418426513671875, 1.519287109375, 1.620147705078125, 1.72100830078125, 1.821868896484375, 1.9227294921875, 2.023590087890625, 2.12445068359375, 2.225311279296875, 2.326171875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 6.0, 1.0, 5.0, 8.0, 6.0, 5.0, 16.0, 13.0, 31.0, 39.0, 54.0, 113.0, 258.0, 438.0, 1113.0, 3643.0, 20107.0, 304879.0, 666572.0, 42646.0, 5718.0, 1593.0, 608.0, 295.0, 167.0, 80.0, 38.0, 30.0, 26.0, 18.0, 8.0, 4.0, 7.0, 7.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.0048828125, -0.98046875, -0.9560546875, -0.931640625, -0.9072265625, -0.8828125, -0.8583984375, -0.833984375, -0.8095703125, -0.78515625, -0.7607421875, -0.736328125, -0.7119140625, -0.6875, -0.6630859375, -0.638671875, -0.6142578125, -0.58984375, -0.5654296875, -0.541015625, -0.5166015625, -0.4921875, -0.4677734375, -0.443359375, -0.4189453125, -0.39453125, -0.3701171875, -0.345703125, -0.3212890625, -0.296875, -0.2724609375, -0.248046875, -0.2236328125, -0.19921875, -0.1748046875, -0.150390625, -0.1259765625, -0.1015625, -0.0771484375, -0.052734375, -0.0283203125, -0.00390625, 0.0205078125, 0.044921875, 0.0693359375, 0.09375, 0.1181640625, 0.142578125, 0.1669921875, 0.19140625, 0.2158203125, 0.240234375, 0.2646484375, 0.2890625, 0.3134765625, 0.337890625, 0.3623046875, 0.38671875, 0.4111328125, 0.435546875, 0.4599609375, 0.484375, 0.5087890625, 0.533203125, 0.5576171875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 5.0, 4.0, 9.0, 23.0, 21.0, 22.0, 33.0, 51.0, 73.0, 57.0, 116.0, 110.0, 97.0, 103.0, 66.0, 61.0, 39.0, 26.0, 28.0, 24.0, 10.0, 5.0, 9.0, 3.0, 5.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.00015366077423095703, -0.0001497967168688774, -0.0001459326595067978, -0.00014206860214471817, -0.00013820454478263855, -0.00013434048742055893, -0.0001304764300584793, -0.0001266123726963997, -0.00012274831533432007, -0.00011888425797224045, -0.00011502020061016083, -0.00011115614324808121, -0.00010729208588600159, -0.00010342802852392197, -9.956397116184235e-05, -9.569991379976273e-05, -9.18358564376831e-05, -8.797179907560349e-05, -8.410774171352386e-05, -8.024368435144424e-05, -7.637962698936462e-05, -7.2515569627285e-05, -6.865151226520538e-05, -6.478745490312576e-05, -6.092339754104614e-05, -5.705934017896652e-05, -5.31952828168869e-05, -4.933122545480728e-05, -4.546716809272766e-05, -4.160311073064804e-05, -3.773905336856842e-05, -3.38749960064888e-05, -3.001093864440918e-05, -2.614688128232956e-05, -2.228282392024994e-05, -1.841876655817032e-05, -1.4554709196090698e-05, -1.0690651834011078e-05, -6.8265944719314575e-06, -2.962537109851837e-06, 9.015202522277832e-07, 4.7655776143074036e-06, 8.629634976387024e-06, 1.2493692338466644e-05, 1.6357749700546265e-05, 2.0221807062625885e-05, 2.4085864424705505e-05, 2.7949921786785126e-05, 3.1813979148864746e-05, 3.5678036510944366e-05, 3.954209387302399e-05, 4.340615123510361e-05, 4.727020859718323e-05, 5.113426595926285e-05, 5.499832332134247e-05, 5.886238068342209e-05, 6.272643804550171e-05, 6.659049540758133e-05, 7.045455276966095e-05, 7.431861013174057e-05, 7.818266749382019e-05, 8.204672485589981e-05, 8.591078221797943e-05, 8.977483958005905e-05, 9.363889694213867e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 9.0, 4.0, 10.0, 14.0, 20.0, 36.0, 65.0, 114.0, 245.0, 605.0, 1566.0, 5650.0, 36874.0, 648435.0, 328270.0, 20547.0, 3946.0, 1183.0, 487.0, 198.0, 105.0, 54.0, 47.0, 23.0, 11.0, 15.0, 10.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.97802734375, -0.9491500854492188, -0.9202728271484375, -0.8913955688476562, -0.862518310546875, -0.8336410522460938, -0.8047637939453125, -0.7758865356445312, -0.74700927734375, -0.7181320190429688, -0.6892547607421875, -0.6603775024414062, -0.631500244140625, -0.6026229858398438, -0.5737457275390625, -0.5448684692382812, -0.5159912109375, -0.48711395263671875, -0.4582366943359375, -0.42935943603515625, -0.400482177734375, -0.37160491943359375, -0.3427276611328125, -0.31385040283203125, -0.28497314453125, -0.25609588623046875, -0.2272186279296875, -0.19834136962890625, -0.169464111328125, -0.14058685302734375, -0.1117095947265625, -0.08283233642578125, -0.053955078125, -0.02507781982421875, 0.0037994384765625, 0.03267669677734375, 0.061553955078125, 0.09043121337890625, 0.1193084716796875, 0.14818572998046875, 0.17706298828125, 0.20594024658203125, 0.2348175048828125, 0.26369476318359375, 0.292572021484375, 0.32144927978515625, 0.3503265380859375, 0.37920379638671875, 0.4080810546875, 0.43695831298828125, 0.4658355712890625, 0.49471282958984375, 0.523590087890625, 0.5524673461914062, 0.5813446044921875, 0.6102218627929688, 0.63909912109375, 0.6679763793945312, 0.6968536376953125, 0.7257308959960938, 0.754608154296875, 0.7834854125976562, 0.8123626708984375, 0.8412399291992188, 0.8701171875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 4.0, 3.0, 3.0, 7.0, 8.0, 12.0, 10.0, 22.0, 34.0, 25.0, 39.0, 48.0, 50.0, 88.0, 74.0, 86.0, 99.0, 80.0, 68.0, 50.0, 53.0, 47.0, 29.0, 17.0, 15.0, 13.0, 3.0, 6.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.8037109375, -0.7822647094726562, -0.7608184814453125, -0.7393722534179688, -0.717926025390625, -0.6964797973632812, -0.6750335693359375, -0.6535873413085938, -0.63214111328125, -0.6106948852539062, -0.5892486572265625, -0.5678024291992188, -0.546356201171875, -0.5249099731445312, -0.5034637451171875, -0.48201751708984375, -0.4605712890625, -0.43912506103515625, -0.4176788330078125, -0.39623260498046875, -0.374786376953125, -0.35334014892578125, -0.3318939208984375, -0.31044769287109375, -0.28900146484375, -0.26755523681640625, -0.2461090087890625, -0.22466278076171875, -0.203216552734375, -0.18177032470703125, -0.1603240966796875, -0.13887786865234375, -0.117431640625, -0.09598541259765625, -0.0745391845703125, -0.05309295654296875, -0.031646728515625, -0.01020050048828125, 0.0112457275390625, 0.03269195556640625, 0.05413818359375, 0.07558441162109375, 0.0970306396484375, 0.11847686767578125, 0.139923095703125, 0.16136932373046875, 0.1828155517578125, 0.20426177978515625, 0.2257080078125, 0.24715423583984375, 0.2686004638671875, 0.29004669189453125, 0.311492919921875, 0.33293914794921875, 0.3543853759765625, 0.37583160400390625, 0.39727783203125, 0.41872406005859375, 0.4401702880859375, 0.46161651611328125, 0.483062744140625, 0.5045089721679688, 0.5259552001953125, 0.5474014282226562, 0.56884765625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 7.0, 24.0, 55.0, 143.0, 266.0, 232.0, 148.0, 78.0, 35.0, 14.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.696379661560059, -11.946297645568848, -11.196216583251953, -10.446134567260742, -9.696052551269531, -8.94597053527832, -8.195889472961426, -7.445807456970215, -6.695725917816162, -5.945644378662109, -5.195562362670898, -4.445480823516846, -3.695399045944214, -2.945317268371582, -2.1952357292175293, -1.4451537132263184, -0.6950721740722656, 0.055009543895721436, 0.8050912618637085, 1.5551729202270508, 2.3052546977996826, 3.0553364753723145, 3.805418014526367, 4.555500030517578, 5.305581569671631, 6.055663108825684, 6.8057451248168945, 7.555826663970947, 8.305908203125, 9.055990219116211, 9.806072235107422, 10.556154251098633, 11.306234359741211, 12.056316375732422, 12.806397438049316, 13.556479454040527, 14.306561470031738, 15.056642532348633, 15.806724548339844, 16.556806564331055, 17.306888580322266, 18.056970596313477, 18.807052612304688, 19.557132720947266, 20.307214736938477, 21.057296752929688, 21.8073787689209, 22.55746078491211, 23.307540893554688, 24.0576229095459, 24.80770492553711, 25.557785034179688, 26.3078670501709, 27.05794906616211, 27.80803108215332, 28.55811309814453, 29.308195114135742, 30.058277130126953, 30.808359146118164, 31.558441162109375, 32.30852127075195, 33.0586051940918, 33.808685302734375, 34.55876922607422, 35.3088493347168]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 1.0, 11.0, 15.0, 12.0, 24.0, 20.0, 32.0, 38.0, 43.0, 52.0, 52.0, 63.0, 71.0, 63.0, 85.0, 60.0, 49.0, 52.0, 35.0, 49.0, 29.0, 25.0, 27.0, 28.0, 14.0, 12.0, 6.0, 5.0, 10.0, 7.0, 6.0, 4.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.054407119750977, -13.55333137512207, -13.052255630493164, -12.551179885864258, -12.050104141235352, -11.549028396606445, -11.047952651977539, -10.546876907348633, -10.045801162719727, -9.54472541809082, -9.043649673461914, -8.542573928833008, -8.041498184204102, -7.540422439575195, -7.039346694946289, -6.538270950317383, -6.037195205688477, -5.53611946105957, -5.035043716430664, -4.533967971801758, -4.032892227172852, -3.5318164825439453, -3.030740737915039, -2.529664993286133, -2.0285892486572266, -1.5275135040283203, -1.026437759399414, -0.5253620147705078, -0.024286270141601562, 0.4767894744873047, 0.9778652191162109, 1.4789409637451172, 1.9800148010253906, 2.481090545654297, 2.982166290283203, 3.4832420349121094, 3.9843177795410156, 4.485393524169922, 4.986469268798828, 5.487545013427734, 5.988620758056641, 6.489696502685547, 6.990772247314453, 7.491847991943359, 7.992923736572266, 8.493999481201172, 8.995075225830078, 9.496150970458984, 9.99722671508789, 10.498302459716797, 10.999378204345703, 11.50045394897461, 12.001529693603516, 12.502605438232422, 13.003681182861328, 13.504756927490234, 14.00583267211914, 14.506908416748047, 15.007984161376953, 15.50905990600586, 16.010135650634766, 16.511211395263672, 17.012287139892578, 17.513362884521484, 18.01443862915039]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 8.0, 11.0, 10.0, 12.0, 18.0, 19.0, 37.0, 50.0, 77.0, 124.0, 168.0, 259.0, 389.0, 652.0, 1178.0, 2065.0, 3675.0, 7618.0, 16978.0, 45377.0, 184570.0, 1886594.0, 1791380.0, 175690.0, 44730.0, 16656.0, 7203.0, 3677.0, 1982.0, 1171.0, 682.0, 412.0, 276.0, 182.0, 111.0, 73.0, 70.0, 39.0, 17.0, 13.0, 11.0, 7.0, 6.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.7802734375, -0.7558822631835938, -0.7314910888671875, -0.7070999145507812, -0.682708740234375, -0.6583175659179688, -0.6339263916015625, -0.6095352172851562, -0.58514404296875, -0.5607528686523438, -0.5363616943359375, -0.5119705200195312, -0.487579345703125, -0.46318817138671875, -0.4387969970703125, -0.41440582275390625, -0.3900146484375, -0.36562347412109375, -0.3412322998046875, -0.31684112548828125, -0.292449951171875, -0.26805877685546875, -0.2436676025390625, -0.21927642822265625, -0.19488525390625, -0.17049407958984375, -0.1461029052734375, -0.12171173095703125, -0.097320556640625, -0.07292938232421875, -0.0485382080078125, -0.02414703369140625, 0.000244140625, 0.02463531494140625, 0.0490264892578125, 0.07341766357421875, 0.097808837890625, 0.12220001220703125, 0.1465911865234375, 0.17098236083984375, 0.19537353515625, 0.21976470947265625, 0.2441558837890625, 0.26854705810546875, 0.292938232421875, 0.31732940673828125, 0.3417205810546875, 0.36611175537109375, 0.3905029296875, 0.41489410400390625, 0.4392852783203125, 0.46367645263671875, 0.488067626953125, 0.5124588012695312, 0.5368499755859375, 0.5612411499023438, 0.58563232421875, 0.6100234985351562, 0.6344146728515625, 0.6588058471679688, 0.683197021484375, 0.7075881958007812, 0.7319793701171875, 0.7563705444335938, 0.78076171875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 4.0, 7.0, 8.0, 19.0, 16.0, 22.0, 30.0, 36.0, 52.0, 61.0, 54.0, 46.0, 56.0, 74.0, 79.0, 65.0, 56.0, 57.0, 40.0, 38.0, 39.0, 30.0, 23.0, 20.0, 18.0, 9.0, 15.0, 6.0, 6.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.81982421875, -0.795806884765625, -0.77178955078125, -0.747772216796875, -0.7237548828125, -0.699737548828125, -0.67572021484375, -0.651702880859375, -0.627685546875, -0.603668212890625, -0.57965087890625, -0.555633544921875, -0.5316162109375, -0.507598876953125, -0.48358154296875, -0.459564208984375, -0.435546875, -0.411529541015625, -0.38751220703125, -0.363494873046875, -0.3394775390625, -0.315460205078125, -0.29144287109375, -0.267425537109375, -0.243408203125, -0.219390869140625, -0.19537353515625, -0.171356201171875, -0.1473388671875, -0.123321533203125, -0.09930419921875, -0.075286865234375, -0.05126953125, -0.027252197265625, -0.00323486328125, 0.020782470703125, 0.0447998046875, 0.068817138671875, 0.09283447265625, 0.116851806640625, 0.140869140625, 0.164886474609375, 0.18890380859375, 0.212921142578125, 0.2369384765625, 0.260955810546875, 0.28497314453125, 0.308990478515625, 0.3330078125, 0.357025146484375, 0.38104248046875, 0.405059814453125, 0.4290771484375, 0.453094482421875, 0.47711181640625, 0.501129150390625, 0.525146484375, 0.549163818359375, 0.57318115234375, 0.597198486328125, 0.6212158203125, 0.645233154296875, 0.66925048828125, 0.693267822265625, 0.71728515625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 1.0, 2.0, 3.0, 4.0, 16.0, 14.0, 26.0, 42.0, 82.0, 157.0, 389.0, 951.0, 3535.0, 21453.0, 867836.0, 3260075.0, 33426.0, 4448.0, 1106.0, 352.0, 148.0, 70.0, 54.0, 24.0, 23.0, 19.0, 8.0, 6.0, 5.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.697265625, -2.61322021484375, -2.5291748046875, -2.44512939453125, -2.361083984375, -2.27703857421875, -2.1929931640625, -2.10894775390625, -2.02490234375, -1.94085693359375, -1.8568115234375, -1.77276611328125, -1.688720703125, -1.60467529296875, -1.5206298828125, -1.43658447265625, -1.3525390625, -1.26849365234375, -1.1844482421875, -1.10040283203125, -1.016357421875, -0.93231201171875, -0.8482666015625, -0.76422119140625, -0.68017578125, -0.59613037109375, -0.5120849609375, -0.42803955078125, -0.343994140625, -0.25994873046875, -0.1759033203125, -0.09185791015625, -0.0078125, 0.07623291015625, 0.1602783203125, 0.24432373046875, 0.328369140625, 0.41241455078125, 0.4964599609375, 0.58050537109375, 0.66455078125, 0.74859619140625, 0.8326416015625, 0.91668701171875, 1.000732421875, 1.08477783203125, 1.1688232421875, 1.25286865234375, 1.3369140625, 1.42095947265625, 1.5050048828125, 1.58905029296875, 1.673095703125, 1.75714111328125, 1.8411865234375, 1.92523193359375, 2.00927734375, 2.09332275390625, 2.1773681640625, 2.26141357421875, 2.345458984375, 2.42950439453125, 2.5135498046875, 2.59759521484375, 2.681640625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 4.0, 1.0, 12.0, 4.0, 12.0, 6.0, 10.0, 11.0, 15.0, 25.0, 43.0, 45.0, 98.0, 197.0, 432.0, 1009.0, 1057.0, 511.0, 215.0, 129.0, 70.0, 45.0, 28.0, 31.0, 14.0, 14.0, 5.0, 3.0, 7.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.796875, -1.74700927734375, -1.6971435546875, -1.64727783203125, -1.597412109375, -1.54754638671875, -1.4976806640625, -1.44781494140625, -1.39794921875, -1.34808349609375, -1.2982177734375, -1.24835205078125, -1.198486328125, -1.14862060546875, -1.0987548828125, -1.04888916015625, -0.9990234375, -0.94915771484375, -0.8992919921875, -0.84942626953125, -0.799560546875, -0.74969482421875, -0.6998291015625, -0.64996337890625, -0.60009765625, -0.55023193359375, -0.5003662109375, -0.45050048828125, -0.400634765625, -0.35076904296875, -0.3009033203125, -0.25103759765625, -0.201171875, -0.15130615234375, -0.1014404296875, -0.05157470703125, -0.001708984375, 0.04815673828125, 0.0980224609375, 0.14788818359375, 0.19775390625, 0.24761962890625, 0.2974853515625, 0.34735107421875, 0.397216796875, 0.44708251953125, 0.4969482421875, 0.54681396484375, 0.5966796875, 0.64654541015625, 0.6964111328125, 0.74627685546875, 0.796142578125, 0.84600830078125, 0.8958740234375, 0.94573974609375, 0.99560546875, 1.04547119140625, 1.0953369140625, 1.14520263671875, 1.195068359375, 1.24493408203125, 1.2947998046875, 1.34466552734375, 1.39453125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 6.0, 12.0, 24.0, 48.0, 94.0, 128.0, 203.0, 175.0, 133.0, 79.0, 39.0, 19.0, 14.0, 10.0, 1.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.686397552490234, -13.26620864868164, -12.846019744873047, -12.42583179473877, -12.005642890930176, -11.585453987121582, -11.165266036987305, -10.745077133178711, -10.324888229370117, -9.904699325561523, -9.48451042175293, -9.064322471618652, -8.644133567810059, -8.223944664001465, -7.803756237030029, -7.383567810058594, -6.96337890625, -6.543190002441406, -6.123001575469971, -5.702813148498535, -5.282624244689941, -4.862435340881348, -4.442246913909912, -4.022058486938477, -3.601869583129883, -3.181680917739868, -2.7614922523498535, -2.341303586959839, -1.9211149215698242, -1.5009262561798096, -1.080737590789795, -0.6605489253997803, -0.24036026000976562, 0.17982840538024902, 0.6000170707702637, 1.0202057361602783, 1.440394401550293, 1.8605830669403076, 2.2807717323303223, 2.700960397720337, 3.1211490631103516, 3.541337728500366, 3.961526393890381, 4.381714820861816, 4.80190372467041, 5.222092628479004, 5.6422810554504395, 6.062469482421875, 6.482658386230469, 6.9028472900390625, 7.323035717010498, 7.743224143981934, 8.163413047790527, 8.583601951599121, 9.003789901733398, 9.423978805541992, 9.844167709350586, 10.26435661315918, 10.684545516967773, 11.10473346710205, 11.524922370910645, 11.945111274719238, 12.365299224853516, 12.78548812866211, 13.205677032470703]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 6.0, 5.0, 9.0, 11.0, 16.0, 20.0, 21.0, 22.0, 41.0, 42.0, 45.0, 42.0, 43.0, 52.0, 52.0, 63.0, 68.0, 46.0, 51.0, 52.0, 48.0, 49.0, 36.0, 36.0, 27.0, 26.0, 18.0, 13.0, 18.0, 9.0, 7.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.923761367797852, -6.668846607208252, -6.413931846618652, -6.159017086029053, -5.904102325439453, -5.649187088012695, -5.394272327423096, -5.139357566833496, -4.8844428062438965, -4.629528045654297, -4.374613285064697, -4.119698524475098, -3.864783525466919, -3.6098687648773193, -3.3549537658691406, -3.100039005279541, -2.8451242446899414, -2.590209484100342, -2.335294723510742, -2.0803797245025635, -1.8254649639129639, -1.5705502033233643, -1.315635323524475, -1.060720443725586, -0.8058056831359863, -0.5508908629417419, -0.29597604274749756, -0.041061222553253174, 0.2138535976409912, 0.4687683582305908, 0.72368323802948, 0.9785981178283691, 1.2335128784179688, 1.4884276390075684, 1.7433425188064575, 1.9982573986053467, 2.2531721591949463, 2.508086919784546, 2.7630019187927246, 3.017916679382324, 3.272831439971924, 3.5277462005615234, 3.782660961151123, 4.037575721740723, 4.2924909591674805, 4.547405242919922, 4.80232048034668, 5.057235240936279, 5.312150001525879, 5.5670647621154785, 5.821979522705078, 6.076894283294678, 6.331809043884277, 6.586724281311035, 6.841639041900635, 7.096553802490234, 7.351468563079834, 7.606383323669434, 7.861298084259033, 8.116212844848633, 8.37112808227539, 8.626042366027832, 8.88095760345459, 9.135871887207031, 9.390787124633789]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 4.0, 11.0, 11.0, 26.0, 32.0, 45.0, 64.0, 101.0, 155.0, 228.0, 309.0, 638.0, 992.0, 1763.0, 3229.0, 5974.0, 11640.0, 23967.0, 49854.0, 104586.0, 200588.0, 267857.0, 188762.0, 95788.0, 46253.0, 22060.0, 10733.0, 5614.0, 2996.0, 1667.0, 981.0, 584.0, 383.0, 223.0, 143.0, 96.0, 73.0, 40.0, 18.0, 15.0, 11.0, 15.0, 5.0, 2.0, 5.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.64990234375, -0.6285552978515625, -0.607208251953125, -0.5858612060546875, -0.56451416015625, -0.5431671142578125, -0.521820068359375, -0.5004730224609375, -0.4791259765625, -0.4577789306640625, -0.436431884765625, -0.4150848388671875, -0.39373779296875, -0.3723907470703125, -0.351043701171875, -0.3296966552734375, -0.308349609375, -0.2870025634765625, -0.265655517578125, -0.2443084716796875, -0.22296142578125, -0.2016143798828125, -0.180267333984375, -0.1589202880859375, -0.1375732421875, -0.1162261962890625, -0.094879150390625, -0.0735321044921875, -0.05218505859375, -0.0308380126953125, -0.009490966796875, 0.0118560791015625, 0.033203125, 0.0545501708984375, 0.075897216796875, 0.0972442626953125, 0.11859130859375, 0.1399383544921875, 0.161285400390625, 0.1826324462890625, 0.2039794921875, 0.2253265380859375, 0.246673583984375, 0.2680206298828125, 0.28936767578125, 0.3107147216796875, 0.332061767578125, 0.3534088134765625, 0.374755859375, 0.3961029052734375, 0.417449951171875, 0.4387969970703125, 0.46014404296875, 0.4814910888671875, 0.502838134765625, 0.5241851806640625, 0.5455322265625, 0.5668792724609375, 0.588226318359375, 0.6095733642578125, 0.63092041015625, 0.6522674560546875, 0.673614501953125, 0.6949615478515625, 0.71630859375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 5.0, 6.0, 12.0, 16.0, 24.0, 25.0, 30.0, 32.0, 42.0, 55.0, 41.0, 63.0, 62.0, 68.0, 76.0, 63.0, 59.0, 35.0, 54.0, 51.0, 29.0, 45.0, 22.0, 16.0, 17.0, 19.0, 4.0, 6.0, 10.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.82080078125, -0.7968368530273438, -0.7728729248046875, -0.7489089965820312, -0.724945068359375, -0.7009811401367188, -0.6770172119140625, -0.6530532836914062, -0.62908935546875, -0.6051254272460938, -0.5811614990234375, -0.5571975708007812, -0.533233642578125, -0.5092697143554688, -0.4853057861328125, -0.46134185791015625, -0.4373779296875, -0.41341400146484375, -0.3894500732421875, -0.36548614501953125, -0.341522216796875, -0.31755828857421875, -0.2935943603515625, -0.26963043212890625, -0.24566650390625, -0.22170257568359375, -0.1977386474609375, -0.17377471923828125, -0.149810791015625, -0.12584686279296875, -0.1018829345703125, -0.07791900634765625, -0.053955078125, -0.02999114990234375, -0.0060272216796875, 0.01793670654296875, 0.041900634765625, 0.06586456298828125, 0.0898284912109375, 0.11379241943359375, 0.13775634765625, 0.16172027587890625, 0.1856842041015625, 0.20964813232421875, 0.233612060546875, 0.25757598876953125, 0.2815399169921875, 0.30550384521484375, 0.3294677734375, 0.35343170166015625, 0.3773956298828125, 0.40135955810546875, 0.425323486328125, 0.44928741455078125, 0.4732513427734375, 0.49721527099609375, 0.52117919921875, 0.5451431274414062, 0.5691070556640625, 0.5930709838867188, 0.617034912109375, 0.6409988403320312, 0.6649627685546875, 0.6889266967773438, 0.712890625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 5.0, 3.0, 2.0, 4.0, 9.0, 15.0, 25.0, 29.0, 47.0, 79.0, 87.0, 169.0, 311.0, 457.0, 787.0, 1573.0, 3886.0, 15553.0, 120541.0, 696567.0, 178575.0, 21051.0, 4771.0, 1847.0, 880.0, 502.0, 299.0, 172.0, 101.0, 57.0, 50.0, 39.0, 17.0, 14.0, 10.0, 5.0, 7.0, 7.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4521484375, -1.399505615234375, -1.34686279296875, -1.294219970703125, -1.2415771484375, -1.188934326171875, -1.13629150390625, -1.083648681640625, -1.031005859375, -0.978363037109375, -0.92572021484375, -0.873077392578125, -0.8204345703125, -0.767791748046875, -0.71514892578125, -0.662506103515625, -0.60986328125, -0.557220458984375, -0.50457763671875, -0.451934814453125, -0.3992919921875, -0.346649169921875, -0.29400634765625, -0.241363525390625, -0.188720703125, -0.136077880859375, -0.08343505859375, -0.030792236328125, 0.0218505859375, 0.074493408203125, 0.12713623046875, 0.179779052734375, 0.232421875, 0.285064697265625, 0.33770751953125, 0.390350341796875, 0.4429931640625, 0.495635986328125, 0.54827880859375, 0.600921630859375, 0.653564453125, 0.706207275390625, 0.75885009765625, 0.811492919921875, 0.8641357421875, 0.916778564453125, 0.96942138671875, 1.022064208984375, 1.07470703125, 1.127349853515625, 1.17999267578125, 1.232635498046875, 1.2852783203125, 1.337921142578125, 1.39056396484375, 1.443206787109375, 1.495849609375, 1.548492431640625, 1.60113525390625, 1.653778076171875, 1.7064208984375, 1.759063720703125, 1.81170654296875, 1.864349365234375, 1.9169921875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 5.0, 2.0, 4.0, 8.0, 9.0, 11.0, 17.0, 17.0, 15.0, 14.0, 24.0, 19.0, 24.0, 21.0, 39.0, 26.0, 46.0, 37.0, 43.0, 52.0, 42.0, 47.0, 45.0, 42.0, 39.0, 44.0, 42.0, 31.0, 33.0, 36.0, 26.0, 25.0, 18.0, 19.0, 29.0, 13.0, 9.0, 11.0, 5.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.0859375, -2.021209716796875, -1.95648193359375, -1.891754150390625, -1.8270263671875, -1.762298583984375, -1.69757080078125, -1.632843017578125, -1.568115234375, -1.503387451171875, -1.43865966796875, -1.373931884765625, -1.3092041015625, -1.244476318359375, -1.17974853515625, -1.115020751953125, -1.05029296875, -0.985565185546875, -0.92083740234375, -0.856109619140625, -0.7913818359375, -0.726654052734375, -0.66192626953125, -0.597198486328125, -0.532470703125, -0.467742919921875, -0.40301513671875, -0.338287353515625, -0.2735595703125, -0.208831787109375, -0.14410400390625, -0.079376220703125, -0.0146484375, 0.050079345703125, 0.11480712890625, 0.179534912109375, 0.2442626953125, 0.308990478515625, 0.37371826171875, 0.438446044921875, 0.503173828125, 0.567901611328125, 0.63262939453125, 0.697357177734375, 0.7620849609375, 0.826812744140625, 0.89154052734375, 0.956268310546875, 1.02099609375, 1.085723876953125, 1.15045166015625, 1.215179443359375, 1.2799072265625, 1.344635009765625, 1.40936279296875, 1.474090576171875, 1.538818359375, 1.603546142578125, 1.66827392578125, 1.733001708984375, 1.7977294921875, 1.862457275390625, 1.92718505859375, 1.991912841796875, 2.056640625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 7.0, 7.0, 7.0, 6.0, 9.0, 18.0, 33.0, 31.0, 47.0, 87.0, 147.0, 280.0, 492.0, 1145.0, 3215.0, 13427.0, 140813.0, 798159.0, 76683.0, 9281.0, 2556.0, 959.0, 495.0, 239.0, 137.0, 82.0, 53.0, 38.0, 24.0, 19.0, 17.0, 11.0, 7.0, 7.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.7060546875, -0.6828231811523438, -0.6595916748046875, -0.6363601684570312, -0.613128662109375, -0.5898971557617188, -0.5666656494140625, -0.5434341430664062, -0.52020263671875, -0.49697113037109375, -0.4737396240234375, -0.45050811767578125, -0.427276611328125, -0.40404510498046875, -0.3808135986328125, -0.35758209228515625, -0.3343505859375, -0.31111907958984375, -0.2878875732421875, -0.26465606689453125, -0.241424560546875, -0.21819305419921875, -0.1949615478515625, -0.17173004150390625, -0.14849853515625, -0.12526702880859375, -0.1020355224609375, -0.07880401611328125, -0.055572509765625, -0.03234100341796875, -0.0091094970703125, 0.01412200927734375, 0.037353515625, 0.06058502197265625, 0.0838165283203125, 0.10704803466796875, 0.130279541015625, 0.15351104736328125, 0.1767425537109375, 0.19997406005859375, 0.22320556640625, 0.24643707275390625, 0.2696685791015625, 0.29290008544921875, 0.316131591796875, 0.33936309814453125, 0.3625946044921875, 0.38582611083984375, 0.4090576171875, 0.43228912353515625, 0.4555206298828125, 0.47875213623046875, 0.501983642578125, 0.5252151489257812, 0.5484466552734375, 0.5716781616210938, 0.59490966796875, 0.6181411743164062, 0.6413726806640625, 0.6646041870117188, 0.687835693359375, 0.7110671997070312, 0.7342987060546875, 0.7575302124023438, 0.78076171875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 2.0, 6.0, 2.0, 7.0, 10.0, 20.0, 32.0, 30.0, 57.0, 86.0, 107.0, 139.0, 140.0, 105.0, 71.0, 58.0, 46.0, 24.0, 22.0, 14.0, 11.0, 6.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00016045570373535156, -0.0001554153859615326, -0.00015037506818771362, -0.00014533475041389465, -0.00014029443264007568, -0.00013525411486625671, -0.00013021379709243774, -0.00012517347931861877, -0.0001201331615447998, -0.00011509284377098083, -0.00011005252599716187, -0.0001050122082233429, -9.997189044952393e-05, -9.493157267570496e-05, -8.989125490188599e-05, -8.485093712806702e-05, -7.981061935424805e-05, -7.477030158042908e-05, -6.972998380661011e-05, -6.468966603279114e-05, -5.964934825897217e-05, -5.46090304851532e-05, -4.956871271133423e-05, -4.452839493751526e-05, -3.948807716369629e-05, -3.444775938987732e-05, -2.940744161605835e-05, -2.436712384223938e-05, -1.932680606842041e-05, -1.428648829460144e-05, -9.24617052078247e-06, -4.205852746963501e-06, 8.344650268554688e-07, 5.8747828006744385e-06, 1.0915100574493408e-05, 1.5955418348312378e-05, 2.0995736122131348e-05, 2.6036053895950317e-05, 3.107637166976929e-05, 3.611668944358826e-05, 4.1157007217407227e-05, 4.6197324991226196e-05, 5.1237642765045166e-05, 5.6277960538864136e-05, 6.13182783126831e-05, 6.635859608650208e-05, 7.139891386032104e-05, 7.643923163414001e-05, 8.147954940795898e-05, 8.651986718177795e-05, 9.156018495559692e-05, 9.66005027294159e-05, 0.00010164082050323486, 0.00010668113827705383, 0.0001117214560508728, 0.00011676177382469177, 0.00012180209159851074, 0.0001268424093723297, 0.00013188272714614868, 0.00013692304491996765, 0.00014196336269378662, 0.0001470036804676056, 0.00015204399824142456, 0.00015708431601524353, 0.0001621246337890625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 4.0, 4.0, 4.0, 6.0, 6.0, 8.0, 15.0, 20.0, 30.0, 60.0, 97.0, 195.0, 400.0, 992.0, 2995.0, 14116.0, 168068.0, 783142.0, 67098.0, 7829.0, 2049.0, 762.0, 297.0, 132.0, 74.0, 41.0, 33.0, 25.0, 20.0, 9.0, 6.0, 5.0, 6.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.91357421875, -0.8884353637695312, -0.8632965087890625, -0.8381576538085938, -0.813018798828125, -0.7878799438476562, -0.7627410888671875, -0.7376022338867188, -0.71246337890625, -0.6873245239257812, -0.6621856689453125, -0.6370468139648438, -0.611907958984375, -0.5867691040039062, -0.5616302490234375, -0.5364913940429688, -0.5113525390625, -0.48621368408203125, -0.4610748291015625, -0.43593597412109375, -0.410797119140625, -0.38565826416015625, -0.3605194091796875, -0.33538055419921875, -0.31024169921875, -0.28510284423828125, -0.2599639892578125, -0.23482513427734375, -0.209686279296875, -0.18454742431640625, -0.1594085693359375, -0.13426971435546875, -0.109130859375, -0.08399200439453125, -0.0588531494140625, -0.03371429443359375, -0.008575439453125, 0.01656341552734375, 0.0417022705078125, 0.06684112548828125, 0.09197998046875, 0.11711883544921875, 0.1422576904296875, 0.16739654541015625, 0.192535400390625, 0.21767425537109375, 0.2428131103515625, 0.26795196533203125, 0.2930908203125, 0.31822967529296875, 0.3433685302734375, 0.36850738525390625, 0.393646240234375, 0.41878509521484375, 0.4439239501953125, 0.46906280517578125, 0.49420166015625, 0.5193405151367188, 0.5444793701171875, 0.5696182250976562, 0.594757080078125, 0.6198959350585938, 0.6450347900390625, 0.6701736450195312, 0.6953125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 6.0, 7.0, 6.0, 12.0, 19.0, 20.0, 36.0, 34.0, 54.0, 45.0, 62.0, 71.0, 90.0, 103.0, 74.0, 87.0, 58.0, 47.0, 50.0, 26.0, 19.0, 26.0, 13.0, 11.0, 5.0, 7.0, 1.0, 4.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.74169921875, -0.7213058471679688, -0.7009124755859375, -0.6805191040039062, -0.660125732421875, -0.6397323608398438, -0.6193389892578125, -0.5989456176757812, -0.57855224609375, -0.5581588745117188, -0.5377655029296875, -0.5173721313476562, -0.496978759765625, -0.47658538818359375, -0.4561920166015625, -0.43579864501953125, -0.4154052734375, -0.39501190185546875, -0.3746185302734375, -0.35422515869140625, -0.333831787109375, -0.31343841552734375, -0.2930450439453125, -0.27265167236328125, -0.25225830078125, -0.23186492919921875, -0.2114715576171875, -0.19107818603515625, -0.170684814453125, -0.15029144287109375, -0.1298980712890625, -0.10950469970703125, -0.089111328125, -0.06871795654296875, -0.0483245849609375, -0.02793121337890625, -0.007537841796875, 0.01285552978515625, 0.0332489013671875, 0.05364227294921875, 0.07403564453125, 0.09442901611328125, 0.1148223876953125, 0.13521575927734375, 0.155609130859375, 0.17600250244140625, 0.1963958740234375, 0.21678924560546875, 0.2371826171875, 0.25757598876953125, 0.2779693603515625, 0.29836273193359375, 0.318756103515625, 0.33914947509765625, 0.3595428466796875, 0.37993621826171875, 0.40032958984375, 0.42072296142578125, 0.4411163330078125, 0.46150970458984375, 0.481903076171875, 0.5022964477539062, 0.5226898193359375, 0.5430831909179688, 0.5634765625]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 3.0, 1.0, 8.0, 19.0, 81.0, 267.0, 394.0, 186.0, 36.0, 9.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.449127197265625, -26.548717498779297, -25.64830780029297, -24.74789810180664, -23.847488403320312, -22.947078704833984, -22.046667098999023, -21.146257400512695, -20.245847702026367, -19.34543800354004, -18.44502830505371, -17.544618606567383, -16.644207000732422, -15.74379825592041, -14.843387603759766, -13.942977905273438, -13.04256820678711, -12.142158508300781, -11.241748809814453, -10.341338157653809, -9.44092845916748, -8.540518760681152, -7.640108585357666, -6.73969841003418, -5.839288711547852, -4.938879013061523, -4.038468837738037, -3.13805890083313, -2.2376489639282227, -1.3372392654418945, -0.4368290901184082, 0.4635810852050781, 1.3639888763427734, 2.2643988132476807, 3.164808750152588, 4.065218925476074, 4.965628623962402, 5.8660383224487305, 6.766448497772217, 7.666858673095703, 8.567268371582031, 9.46767807006836, 10.368087768554688, 11.268498420715332, 12.16890811920166, 13.069317817687988, 13.969728469848633, 14.870138168334961, 15.770547866821289, 16.670957565307617, 17.571367263793945, 18.471776962280273, 19.372188568115234, 20.272598266601562, 21.17300796508789, 22.07341766357422, 22.973827362060547, 23.874237060546875, 24.774646759033203, 25.67505645751953, 26.57546615600586, 27.475875854492188, 28.37628746032715, 29.276697158813477, 30.177106857299805]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 5.0, 6.0, 7.0, 11.0, 15.0, 14.0, 29.0, 30.0, 34.0, 39.0, 54.0, 64.0, 55.0, 68.0, 82.0, 82.0, 59.0, 61.0, 55.0, 56.0, 39.0, 25.0, 25.0, 21.0, 18.0, 18.0, 13.0, 9.0, 4.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.986358642578125, -11.588202476501465, -11.190046310424805, -10.791890144348145, -10.393733978271484, -9.995576858520508, -9.597420692443848, -9.199264526367188, -8.801108360290527, -8.402952194213867, -8.004796028137207, -7.606639385223389, -7.2084832191467285, -6.810327053070068, -6.41217041015625, -6.01401424407959, -5.61585807800293, -5.2177019119262695, -4.819545745849609, -4.421389102935791, -4.023232936859131, -3.6250767707824707, -3.2269203662872314, -2.828763961791992, -2.430607795715332, -2.032451629638672, -1.6342952251434326, -1.236138939857483, -0.8379826545715332, -0.4398263692855835, -0.04167008399963379, 0.35648632049560547, 0.7546424865722656, 1.1527987718582153, 1.550955057144165, 1.9491113424301147, 2.3472676277160645, 2.7454237937927246, 3.143580198287964, 3.541736602783203, 3.9398927688598633, 4.338048934936523, 4.736205101013184, 5.134361743927002, 5.532517910003662, 5.930674076080322, 6.328830718994141, 6.726986885070801, 7.125143051147461, 7.523299217224121, 7.921455383300781, 8.319611549377441, 8.717767715454102, 9.115924835205078, 9.514081001281738, 9.912237167358398, 10.310393333435059, 10.708549499511719, 11.106705665588379, 11.504861831665039, 11.903018951416016, 12.301175117492676, 12.699331283569336, 13.097487449645996, 13.495643615722656]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 3.0, 4.0, 4.0, 10.0, 12.0, 15.0, 22.0, 34.0, 41.0, 77.0, 100.0, 168.0, 412.0, 1442.0, 9941.0, 1197001.0, 2969394.0, 13019.0, 1610.0, 449.0, 178.0, 114.0, 69.0, 44.0, 35.0, 20.0, 18.0, 13.0, 12.0, 9.0, 1.0, 2.0, 7.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.123046875, -3.033935546875, -2.94482421875, -2.855712890625, -2.7666015625, -2.677490234375, -2.58837890625, -2.499267578125, -2.41015625, -2.321044921875, -2.23193359375, -2.142822265625, -2.0537109375, -1.964599609375, -1.87548828125, -1.786376953125, -1.697265625, -1.608154296875, -1.51904296875, -1.429931640625, -1.3408203125, -1.251708984375, -1.16259765625, -1.073486328125, -0.984375, -0.895263671875, -0.80615234375, -0.717041015625, -0.6279296875, -0.538818359375, -0.44970703125, -0.360595703125, -0.271484375, -0.182373046875, -0.09326171875, -0.004150390625, 0.0849609375, 0.174072265625, 0.26318359375, 0.352294921875, 0.44140625, 0.530517578125, 0.61962890625, 0.708740234375, 0.7978515625, 0.886962890625, 0.97607421875, 1.065185546875, 1.154296875, 1.243408203125, 1.33251953125, 1.421630859375, 1.5107421875, 1.599853515625, 1.68896484375, 1.778076171875, 1.8671875, 1.956298828125, 2.04541015625, 2.134521484375, 2.2236328125, 2.312744140625, 2.40185546875, 2.490966796875, 2.580078125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 7.0, 7.0, 23.0, 21.0, 35.0, 56.0, 71.0, 73.0, 88.0, 122.0, 104.0, 78.0, 87.0, 73.0, 50.0, 46.0, 20.0, 20.0, 11.0, 7.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3134765625, -1.277099609375, -1.24072265625, -1.204345703125, -1.16796875, -1.131591796875, -1.09521484375, -1.058837890625, -1.0224609375, -0.986083984375, -0.94970703125, -0.913330078125, -0.876953125, -0.840576171875, -0.80419921875, -0.767822265625, -0.7314453125, -0.695068359375, -0.65869140625, -0.622314453125, -0.5859375, -0.549560546875, -0.51318359375, -0.476806640625, -0.4404296875, -0.404052734375, -0.36767578125, -0.331298828125, -0.294921875, -0.258544921875, -0.22216796875, -0.185791015625, -0.1494140625, -0.113037109375, -0.07666015625, -0.040283203125, -0.00390625, 0.032470703125, 0.06884765625, 0.105224609375, 0.1416015625, 0.177978515625, 0.21435546875, 0.250732421875, 0.287109375, 0.323486328125, 0.35986328125, 0.396240234375, 0.4326171875, 0.468994140625, 0.50537109375, 0.541748046875, 0.578125, 0.614501953125, 0.65087890625, 0.687255859375, 0.7236328125, 0.760009765625, 0.79638671875, 0.832763671875, 0.869140625, 0.905517578125, 0.94189453125, 0.978271484375, 1.0146484375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 6.0, 2.0, 5.0, 7.0, 14.0, 25.0, 47.0, 94.0, 153.0, 317.0, 667.0, 1472.0, 3827.0, 11879.0, 49447.0, 546451.0, 3406183.0, 140589.0, 23033.0, 6169.0, 2186.0, 900.0, 382.0, 216.0, 87.0, 57.0, 27.0, 12.0, 9.0, 8.0, 3.0, 5.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.53125, -1.491241455078125, -1.45123291015625, -1.411224365234375, -1.3712158203125, -1.331207275390625, -1.29119873046875, -1.251190185546875, -1.211181640625, -1.171173095703125, -1.13116455078125, -1.091156005859375, -1.0511474609375, -1.011138916015625, -0.97113037109375, -0.931121826171875, -0.89111328125, -0.851104736328125, -0.81109619140625, -0.771087646484375, -0.7310791015625, -0.691070556640625, -0.65106201171875, -0.611053466796875, -0.571044921875, -0.531036376953125, -0.49102783203125, -0.451019287109375, -0.4110107421875, -0.371002197265625, -0.33099365234375, -0.290985107421875, -0.2509765625, -0.210968017578125, -0.17095947265625, -0.130950927734375, -0.0909423828125, -0.050933837890625, -0.01092529296875, 0.029083251953125, 0.069091796875, 0.109100341796875, 0.14910888671875, 0.189117431640625, 0.2291259765625, 0.269134521484375, 0.30914306640625, 0.349151611328125, 0.38916015625, 0.429168701171875, 0.46917724609375, 0.509185791015625, 0.5491943359375, 0.589202880859375, 0.62921142578125, 0.669219970703125, 0.709228515625, 0.749237060546875, 0.78924560546875, 0.829254150390625, 0.8692626953125, 0.909271240234375, 0.94927978515625, 0.989288330078125, 1.029296875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 3.0, 5.0, 0.0, 3.0, 3.0, 10.0, 11.0, 14.0, 5.0, 27.0, 37.0, 43.0, 70.0, 124.0, 268.0, 554.0, 1159.0, 941.0, 371.0, 172.0, 85.0, 63.0, 40.0, 22.0, 19.0, 6.0, 9.0, 5.0, 5.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.51953125, -1.4782257080078125, -1.436920166015625, -1.3956146240234375, -1.35430908203125, -1.3130035400390625, -1.271697998046875, -1.2303924560546875, -1.1890869140625, -1.1477813720703125, -1.106475830078125, -1.0651702880859375, -1.02386474609375, -0.9825592041015625, -0.941253662109375, -0.8999481201171875, -0.858642578125, -0.8173370361328125, -0.776031494140625, -0.7347259521484375, -0.69342041015625, -0.6521148681640625, -0.610809326171875, -0.5695037841796875, -0.5281982421875, -0.4868927001953125, -0.445587158203125, -0.4042816162109375, -0.36297607421875, -0.3216705322265625, -0.280364990234375, -0.2390594482421875, -0.19775390625, -0.1564483642578125, -0.115142822265625, -0.0738372802734375, -0.03253173828125, 0.0087738037109375, 0.050079345703125, 0.0913848876953125, 0.1326904296875, 0.1739959716796875, 0.215301513671875, 0.2566070556640625, 0.29791259765625, 0.3392181396484375, 0.380523681640625, 0.4218292236328125, 0.463134765625, 0.5044403076171875, 0.545745849609375, 0.5870513916015625, 0.62835693359375, 0.6696624755859375, 0.710968017578125, 0.7522735595703125, 0.7935791015625, 0.8348846435546875, 0.876190185546875, 0.9174957275390625, 0.95880126953125, 1.0001068115234375, 1.041412353515625, 1.0827178955078125, 1.1240234375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 11.0, 21.0, 59.0, 128.0, 256.0, 260.0, 138.0, 72.0, 25.0, 7.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.50623321533203, -17.10053825378418, -16.694843292236328, -16.289148330688477, -15.883453369140625, -15.477758407592773, -15.072062492370605, -14.666367530822754, -14.260672569274902, -13.85497760772705, -13.4492826461792, -13.043587684631348, -12.63789176940918, -12.232196807861328, -11.826501846313477, -11.420806884765625, -11.015111923217773, -10.609416961669922, -10.20372200012207, -9.798027038574219, -9.392332077026367, -8.986637115478516, -8.580941200256348, -8.175246238708496, -7.7695512771606445, -7.363856315612793, -6.958161354064941, -6.552465915679932, -6.14677095413208, -5.7410759925842285, -5.335380554199219, -4.929685592651367, -4.523990631103516, -4.118295669555664, -3.7126004695892334, -3.3069052696228027, -2.901210308074951, -2.4955153465270996, -2.089820146560669, -1.6841249465942383, -1.2784299850463867, -0.8727349042892456, -0.4670398235321045, -0.06134474277496338, 0.34435033798217773, 0.7500452995300293, 1.15574049949646, 1.5614356994628906, 1.9671306610107422, 2.3728256225585938, 2.7785208225250244, 3.184216022491455, 3.5899109840393066, 3.995605945587158, 4.401301383972168, 4.8069963455200195, 5.212691307067871, 5.618386268615723, 6.024081230163574, 6.429776668548584, 6.8354716300964355, 7.241166591644287, 7.646862030029297, 8.052556991577148, 8.458251953125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 5.0, 3.0, 3.0, 2.0, 6.0, 8.0, 14.0, 15.0, 18.0, 22.0, 22.0, 23.0, 34.0, 42.0, 41.0, 41.0, 42.0, 43.0, 66.0, 47.0, 51.0, 60.0, 48.0, 54.0, 49.0, 36.0, 39.0, 35.0, 23.0, 28.0, 14.0, 18.0, 10.0, 12.0, 12.0, 5.0, 5.0, 5.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 3.0], "bins": [-5.527782440185547, -5.3810014724731445, -5.234220504760742, -5.087440013885498, -4.940659046173096, -4.793878078460693, -4.647097587585449, -4.500316619873047, -4.3535356521606445, -4.206754684448242, -4.05997371673584, -3.9131932258605957, -3.7664122581481934, -3.619631290435791, -3.4728505611419678, -3.3260698318481445, -3.179288864135742, -3.03250789642334, -2.8857271671295166, -2.7389464378356934, -2.592165470123291, -2.4453845024108887, -2.2986037731170654, -2.151823043823242, -2.00504207611084, -1.858261227607727, -1.7114803791046143, -1.5646995306015015, -1.4179186820983887, -1.2711378335952759, -1.124356985092163, -0.9775761365890503, -0.8307948112487793, -0.6840139627456665, -0.5372331142425537, -0.3904522657394409, -0.24367141723632812, -0.09689056873321533, 0.04989027976989746, 0.19667112827301025, 0.34345197677612305, 0.49023282527923584, 0.6370136737823486, 0.7837945222854614, 0.9305753707885742, 1.077356219291687, 1.2241370677947998, 1.3709179162979126, 1.5176987648010254, 1.6644796133041382, 1.811260461807251, 1.9580413103103638, 2.1048221588134766, 2.251603126525879, 2.398383855819702, 2.5451645851135254, 2.6919455528259277, 2.83872652053833, 2.9855072498321533, 3.1322879791259766, 3.279068946838379, 3.4258499145507812, 3.5726306438446045, 3.7194113731384277, 3.86619234085083]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 8.0, 4.0, 14.0, 22.0, 21.0, 41.0, 49.0, 107.0, 122.0, 194.0, 322.0, 573.0, 1061.0, 1778.0, 3593.0, 7244.0, 15533.0, 35319.0, 83785.0, 198201.0, 323872.0, 213127.0, 92010.0, 38641.0, 16803.0, 7733.0, 3800.0, 1951.0, 1019.0, 602.0, 399.0, 222.0, 137.0, 88.0, 47.0, 33.0, 24.0, 17.0, 18.0, 7.0, 4.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.861328125, -0.8356552124023438, -0.8099822998046875, -0.7843093872070312, -0.758636474609375, -0.7329635620117188, -0.7072906494140625, -0.6816177368164062, -0.65594482421875, -0.6302719116210938, -0.6045989990234375, -0.5789260864257812, -0.553253173828125, -0.5275802612304688, -0.5019073486328125, -0.47623443603515625, -0.4505615234375, -0.42488861083984375, -0.3992156982421875, -0.37354278564453125, -0.347869873046875, -0.32219696044921875, -0.2965240478515625, -0.27085113525390625, -0.24517822265625, -0.21950531005859375, -0.1938323974609375, -0.16815948486328125, -0.142486572265625, -0.11681365966796875, -0.0911407470703125, -0.06546783447265625, -0.039794921875, -0.01412200927734375, 0.0115509033203125, 0.03722381591796875, 0.062896728515625, 0.08856964111328125, 0.1142425537109375, 0.13991546630859375, 0.16558837890625, 0.19126129150390625, 0.2169342041015625, 0.24260711669921875, 0.268280029296875, 0.29395294189453125, 0.3196258544921875, 0.34529876708984375, 0.3709716796875, 0.39664459228515625, 0.4223175048828125, 0.44799041748046875, 0.473663330078125, 0.49933624267578125, 0.5250091552734375, 0.5506820678710938, 0.57635498046875, 0.6020278930664062, 0.6277008056640625, 0.6533737182617188, 0.679046630859375, 0.7047195434570312, 0.7303924560546875, 0.7560653686523438, 0.78173828125]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 5.0, 9.0, 4.0, 14.0, 18.0, 18.0, 32.0, 37.0, 46.0, 56.0, 48.0, 71.0, 79.0, 93.0, 88.0, 68.0, 63.0, 54.0, 51.0, 36.0, 32.0, 26.0, 14.0, 14.0, 13.0, 8.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.87646484375, -0.8496780395507812, -0.8228912353515625, -0.7961044311523438, -0.769317626953125, -0.7425308227539062, -0.7157440185546875, -0.6889572143554688, -0.66217041015625, -0.6353836059570312, -0.6085968017578125, -0.5818099975585938, -0.555023193359375, -0.5282363891601562, -0.5014495849609375, -0.47466278076171875, -0.4478759765625, -0.42108917236328125, -0.3943023681640625, -0.36751556396484375, -0.340728759765625, -0.31394195556640625, -0.2871551513671875, -0.26036834716796875, -0.23358154296875, -0.20679473876953125, -0.1800079345703125, -0.15322113037109375, -0.126434326171875, -0.09964752197265625, -0.0728607177734375, -0.04607391357421875, -0.019287109375, 0.00749969482421875, 0.0342864990234375, 0.06107330322265625, 0.087860107421875, 0.11464691162109375, 0.1414337158203125, 0.16822052001953125, 0.19500732421875, 0.22179412841796875, 0.2485809326171875, 0.27536773681640625, 0.302154541015625, 0.32894134521484375, 0.3557281494140625, 0.38251495361328125, 0.4093017578125, 0.43608856201171875, 0.4628753662109375, 0.48966217041015625, 0.516448974609375, 0.5432357788085938, 0.5700225830078125, 0.5968093872070312, 0.62359619140625, 0.6503829956054688, 0.6771697998046875, 0.7039566040039062, 0.730743408203125, 0.7575302124023438, 0.7843170166015625, 0.8111038208007812, 0.837890625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 5.0, 3.0, 5.0, 14.0, 14.0, 18.0, 26.0, 25.0, 52.0, 103.0, 152.0, 275.0, 538.0, 1275.0, 3899.0, 18414.0, 143086.0, 716730.0, 139751.0, 17751.0, 3820.0, 1297.0, 546.0, 308.0, 177.0, 81.0, 53.0, 42.0, 19.0, 12.0, 18.0, 14.0, 4.0, 8.0, 6.0, 2.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.10546875, -2.0477752685546875, -1.990081787109375, -1.9323883056640625, -1.87469482421875, -1.8170013427734375, -1.759307861328125, -1.7016143798828125, -1.6439208984375, -1.5862274169921875, -1.528533935546875, -1.4708404541015625, -1.41314697265625, -1.3554534912109375, -1.297760009765625, -1.2400665283203125, -1.182373046875, -1.1246795654296875, -1.066986083984375, -1.0092926025390625, -0.95159912109375, -0.8939056396484375, -0.836212158203125, -0.7785186767578125, -0.7208251953125, -0.6631317138671875, -0.605438232421875, -0.5477447509765625, -0.49005126953125, -0.4323577880859375, -0.374664306640625, -0.3169708251953125, -0.25927734375, -0.2015838623046875, -0.143890380859375, -0.0861968994140625, -0.02850341796875, 0.0291900634765625, 0.086883544921875, 0.1445770263671875, 0.2022705078125, 0.2599639892578125, 0.317657470703125, 0.3753509521484375, 0.43304443359375, 0.4907379150390625, 0.548431396484375, 0.6061248779296875, 0.663818359375, 0.7215118408203125, 0.779205322265625, 0.8368988037109375, 0.89459228515625, 0.9522857666015625, 1.009979248046875, 1.0676727294921875, 1.1253662109375, 1.1830596923828125, 1.240753173828125, 1.2984466552734375, 1.35614013671875, 1.4138336181640625, 1.471527099609375, 1.5292205810546875, 1.5869140625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 1.0, 1.0, 6.0, 3.0, 7.0, 7.0, 12.0, 12.0, 15.0, 16.0, 19.0, 18.0, 19.0, 30.0, 25.0, 37.0, 35.0, 40.0, 43.0, 44.0, 44.0, 32.0, 54.0, 50.0, 37.0, 26.0, 58.0, 37.0, 34.0, 35.0, 27.0, 26.0, 21.0, 19.0, 24.0, 16.0, 13.0, 15.0, 12.0, 7.0, 4.0, 5.0, 7.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.7890625, -1.7338409423828125, -1.678619384765625, -1.6233978271484375, -1.56817626953125, -1.5129547119140625, -1.457733154296875, -1.4025115966796875, -1.3472900390625, -1.2920684814453125, -1.236846923828125, -1.1816253662109375, -1.12640380859375, -1.0711822509765625, -1.015960693359375, -0.9607391357421875, -0.905517578125, -0.8502960205078125, -0.795074462890625, -0.7398529052734375, -0.68463134765625, -0.6294097900390625, -0.574188232421875, -0.5189666748046875, -0.4637451171875, -0.4085235595703125, -0.353302001953125, -0.2980804443359375, -0.24285888671875, -0.1876373291015625, -0.132415771484375, -0.0771942138671875, -0.02197265625, 0.0332489013671875, 0.088470458984375, 0.1436920166015625, 0.19891357421875, 0.2541351318359375, 0.309356689453125, 0.3645782470703125, 0.4197998046875, 0.4750213623046875, 0.530242919921875, 0.5854644775390625, 0.64068603515625, 0.6959075927734375, 0.751129150390625, 0.8063507080078125, 0.861572265625, 0.9167938232421875, 0.972015380859375, 1.0272369384765625, 1.08245849609375, 1.1376800537109375, 1.192901611328125, 1.2481231689453125, 1.3033447265625, 1.3585662841796875, 1.413787841796875, 1.4690093994140625, 1.52423095703125, 1.5794525146484375, 1.634674072265625, 1.6898956298828125, 1.7451171875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 9.0, 11.0, 16.0, 13.0, 19.0, 42.0, 55.0, 77.0, 183.0, 417.0, 1026.0, 4067.0, 42637.0, 914960.0, 77521.0, 5287.0, 1284.0, 447.0, 209.0, 103.0, 51.0, 29.0, 27.0, 18.0, 14.0, 13.0, 4.0, 6.0, 2.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.248046875, -1.208526611328125, -1.16900634765625, -1.129486083984375, -1.0899658203125, -1.050445556640625, -1.01092529296875, -0.971405029296875, -0.931884765625, -0.892364501953125, -0.85284423828125, -0.813323974609375, -0.7738037109375, -0.734283447265625, -0.69476318359375, -0.655242919921875, -0.61572265625, -0.576202392578125, -0.53668212890625, -0.497161865234375, -0.4576416015625, -0.418121337890625, -0.37860107421875, -0.339080810546875, -0.299560546875, -0.260040283203125, -0.22052001953125, -0.180999755859375, -0.1414794921875, -0.101959228515625, -0.06243896484375, -0.022918701171875, 0.0166015625, 0.056121826171875, 0.09564208984375, 0.135162353515625, 0.1746826171875, 0.214202880859375, 0.25372314453125, 0.293243408203125, 0.332763671875, 0.372283935546875, 0.41180419921875, 0.451324462890625, 0.4908447265625, 0.530364990234375, 0.56988525390625, 0.609405517578125, 0.64892578125, 0.688446044921875, 0.72796630859375, 0.767486572265625, 0.8070068359375, 0.846527099609375, 0.88604736328125, 0.925567626953125, 0.965087890625, 1.004608154296875, 1.04412841796875, 1.083648681640625, 1.1231689453125, 1.162689208984375, 1.20220947265625, 1.241729736328125, 1.28125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 7.0, 10.0, 41.0, 162.0, 325.0, 292.0, 102.0, 31.0, 16.0, 5.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002665519714355469, -0.00025072693824768066, -0.00023490190505981445, -0.00021907687187194824, -0.00020325183868408203, -0.00018742680549621582, -0.0001716017723083496, -0.0001557767391204834, -0.0001399517059326172, -0.00012412667274475098, -0.00010830163955688477, -9.247660636901855e-05, -7.665157318115234e-05, -6.082653999328613e-05, -4.500150680541992e-05, -2.917647361755371e-05, -1.33514404296875e-05, 2.473592758178711e-06, 1.8298625946044922e-05, 3.412365913391113e-05, 4.9948692321777344e-05, 6.577372550964355e-05, 8.159875869750977e-05, 9.742379188537598e-05, 0.00011324882507324219, 0.0001290738582611084, 0.0001448988914489746, 0.00016072392463684082, 0.00017654895782470703, 0.00019237399101257324, 0.00020819902420043945, 0.00022402405738830566, 0.00023984909057617188, 0.0002556741237640381, 0.0002714991569519043, 0.0002873241901397705, 0.0003031492233276367, 0.00031897425651550293, 0.00033479928970336914, 0.00035062432289123535, 0.00036644935607910156, 0.0003822743892669678, 0.000398099422454834, 0.0004139244556427002, 0.0004297494888305664, 0.0004455745220184326, 0.00046139955520629883, 0.00047722458839416504, 0.0004930496215820312, 0.0005088746547698975, 0.0005246996879577637, 0.0005405247211456299, 0.0005563497543334961, 0.0005721747875213623, 0.0005879998207092285, 0.0006038248538970947, 0.0006196498870849609, 0.0006354749202728271, 0.0006512999534606934, 0.0006671249866485596, 0.0006829500198364258, 0.000698775053024292, 0.0007146000862121582, 0.0007304251194000244, 0.0007462501525878906]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 6.0, 3.0, 9.0, 11.0, 8.0, 15.0, 25.0, 24.0, 41.0, 59.0, 119.0, 172.0, 320.0, 623.0, 1757.0, 5642.0, 29543.0, 306421.0, 635779.0, 55128.0, 8712.0, 2359.0, 891.0, 378.0, 195.0, 104.0, 63.0, 44.0, 28.0, 29.0, 16.0, 12.0, 8.0, 5.0, 2.0, 6.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.671875, -0.6488265991210938, -0.6257781982421875, -0.6027297973632812, -0.579681396484375, -0.5566329956054688, -0.5335845947265625, -0.5105361938476562, -0.48748779296875, -0.46443939208984375, -0.4413909912109375, -0.41834259033203125, -0.395294189453125, -0.37224578857421875, -0.3491973876953125, -0.32614898681640625, -0.3031005859375, -0.28005218505859375, -0.2570037841796875, -0.23395538330078125, -0.210906982421875, -0.18785858154296875, -0.1648101806640625, -0.14176177978515625, -0.11871337890625, -0.09566497802734375, -0.0726165771484375, -0.04956817626953125, -0.026519775390625, -0.00347137451171875, 0.0195770263671875, 0.04262542724609375, 0.065673828125, 0.08872222900390625, 0.1117706298828125, 0.13481903076171875, 0.157867431640625, 0.18091583251953125, 0.2039642333984375, 0.22701263427734375, 0.25006103515625, 0.27310943603515625, 0.2961578369140625, 0.31920623779296875, 0.342254638671875, 0.36530303955078125, 0.3883514404296875, 0.41139984130859375, 0.4344482421875, 0.45749664306640625, 0.4805450439453125, 0.5035934448242188, 0.526641845703125, 0.5496902465820312, 0.5727386474609375, 0.5957870483398438, 0.61883544921875, 0.6418838500976562, 0.6649322509765625, 0.6879806518554688, 0.711029052734375, 0.7340774536132812, 0.7571258544921875, 0.7801742553710938, 0.80322265625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 10.0, 2.0, 9.0, 10.0, 19.0, 19.0, 48.0, 48.0, 77.0, 92.0, 122.0, 123.0, 108.0, 97.0, 90.0, 55.0, 33.0, 18.0, 12.0, 4.0, 3.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2431640625, -1.2163543701171875, -1.189544677734375, -1.1627349853515625, -1.13592529296875, -1.1091156005859375, -1.082305908203125, -1.0554962158203125, -1.0286865234375, -1.0018768310546875, -0.975067138671875, -0.9482574462890625, -0.92144775390625, -0.8946380615234375, -0.867828369140625, -0.8410186767578125, -0.814208984375, -0.7873992919921875, -0.760589599609375, -0.7337799072265625, -0.70697021484375, -0.6801605224609375, -0.653350830078125, -0.6265411376953125, -0.5997314453125, -0.5729217529296875, -0.546112060546875, -0.5193023681640625, -0.49249267578125, -0.4656829833984375, -0.438873291015625, -0.4120635986328125, -0.38525390625, -0.3584442138671875, -0.331634521484375, -0.3048248291015625, -0.27801513671875, -0.2512054443359375, -0.224395751953125, -0.1975860595703125, -0.1707763671875, -0.1439666748046875, -0.117156982421875, -0.0903472900390625, -0.06353759765625, -0.0367279052734375, -0.009918212890625, 0.0168914794921875, 0.043701171875, 0.0705108642578125, 0.097320556640625, 0.1241302490234375, 0.15093994140625, 0.1777496337890625, 0.204559326171875, 0.2313690185546875, 0.2581787109375, 0.2849884033203125, 0.311798095703125, 0.3386077880859375, 0.36541748046875, 0.3922271728515625, 0.419036865234375, 0.4458465576171875, 0.47265625]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 6.0, 13.0, 28.0, 70.0, 131.0, 245.0, 225.0, 153.0, 72.0, 24.0, 17.0, 7.0, 2.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.205233097076416, -6.692345142364502, -6.179457664489746, -5.666569709777832, -5.153681755065918, -4.640794277191162, -4.127906322479248, -3.615018606185913, -3.102130889892578, -2.589243173599243, -2.076355457305908, -1.5634675025939941, -1.0505797863006592, -0.5376920700073242, -0.024804115295410156, 0.4880836009979248, 1.0009713172912598, 1.5138590335845947, 2.0267467498779297, 2.5396347045898438, 3.0525224208831787, 3.5654101371765137, 4.078298091888428, 4.591185569763184, 5.104073524475098, 5.616961479187012, 6.129848957061768, 6.642736911773682, 7.1556243896484375, 7.668512344360352, 8.181400299072266, 8.69428825378418, 9.207174301147461, 9.720062255859375, 10.232950210571289, 10.745838165283203, 11.2587251663208, 11.771613121032715, 12.284501075744629, 12.797389030456543, 13.31027603149414, 13.823163986206055, 14.336051940917969, 14.848939895629883, 15.36182689666748, 15.874714851379395, 16.387603759765625, 16.900489807128906, 17.413379669189453, 17.926267623901367, 18.43915557861328, 18.952043533325195, 19.46493148803711, 19.97781753540039, 20.490707397460938, 21.00359344482422, 21.516481399536133, 22.029369354248047, 22.54225730895996, 23.055145263671875, 23.56803321838379, 24.080921173095703, 24.593807220458984, 25.1066951751709, 25.619583129882812]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 6.0, 4.0, 6.0, 7.0, 6.0, 6.0, 10.0, 13.0, 18.0, 24.0, 24.0, 25.0, 24.0, 30.0, 35.0, 45.0, 46.0, 46.0, 40.0, 58.0, 60.0, 64.0, 51.0, 45.0, 50.0, 37.0, 37.0, 34.0, 23.0, 15.0, 18.0, 19.0, 13.0, 18.0, 11.0, 9.0, 4.0, 10.0, 2.0, 5.0, 5.0, 4.0, 1.0, 2.0, 1.0], "bins": [-10.110296249389648, -9.855095863342285, -9.599895477294922, -9.344694137573242, -9.089493751525879, -8.834293365478516, -8.579092979431152, -8.323892593383789, -8.06869125366211, -7.813490867614746, -7.558290004730225, -7.303089618682861, -7.04788875579834, -6.792688369750977, -6.537487983703613, -6.28228759765625, -6.027087211608887, -5.771886825561523, -5.516685962677002, -5.261485576629639, -5.006284713745117, -4.751084327697754, -4.495883941650391, -4.240683555603027, -3.985482692718506, -3.7302820682525635, -3.475081443786621, -3.219881057739258, -2.9646804332733154, -2.709479808807373, -2.4542794227600098, -2.1990787982940674, -1.943878173828125, -1.6886775493621826, -1.4334770441055298, -1.178276538848877, -0.9230759143829346, -0.6678752899169922, -0.41267478466033936, -0.15747427940368652, 0.09772634506225586, 0.35292690992355347, 0.6081274747848511, 0.8633280396461487, 1.1185286045074463, 1.3737292289733887, 1.6289297342300415, 1.8841302394866943, 2.1393308639526367, 2.394531488418579, 2.6497321128845215, 2.9049324989318848, 3.160133123397827, 3.4153337478637695, 3.670534133911133, 3.925734758377075, 4.180935382843018, 4.436135768890381, 4.691336631774902, 4.946537017822266, 5.201737403869629, 5.45693826675415, 5.712138652801514, 5.967339515686035, 6.222539901733398]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 5.0, 3.0, 9.0, 11.0, 23.0, 35.0, 59.0, 114.0, 156.0, 274.0, 572.0, 1079.0, 2473.0, 6352.0, 21016.0, 112675.0, 1808041.0, 2081785.0, 125901.0, 22088.0, 6550.0, 2594.0, 1150.0, 608.0, 292.0, 163.0, 97.0, 66.0, 41.0, 18.0, 10.0, 12.0, 4.0, 3.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.99853515625, -0.9682998657226562, -0.9380645751953125, -0.9078292846679688, -0.877593994140625, -0.8473587036132812, -0.8171234130859375, -0.7868881225585938, -0.75665283203125, -0.7264175415039062, -0.6961822509765625, -0.6659469604492188, -0.635711669921875, -0.6054763793945312, -0.5752410888671875, -0.5450057983398438, -0.5147705078125, -0.48453521728515625, -0.4542999267578125, -0.42406463623046875, -0.393829345703125, -0.36359405517578125, -0.3333587646484375, -0.30312347412109375, -0.27288818359375, -0.24265289306640625, -0.2124176025390625, -0.18218231201171875, -0.151947021484375, -0.12171173095703125, -0.0914764404296875, -0.06124114990234375, -0.031005859375, -0.00077056884765625, 0.0294647216796875, 0.05970001220703125, 0.089935302734375, 0.12017059326171875, 0.1504058837890625, 0.18064117431640625, 0.21087646484375, 0.24111175537109375, 0.2713470458984375, 0.30158233642578125, 0.331817626953125, 0.36205291748046875, 0.3922882080078125, 0.42252349853515625, 0.4527587890625, 0.48299407958984375, 0.5132293701171875, 0.5434646606445312, 0.573699951171875, 0.6039352416992188, 0.6341705322265625, 0.6644058227539062, 0.69464111328125, 0.7248764038085938, 0.7551116943359375, 0.7853469848632812, 0.815582275390625, 0.8458175659179688, 0.8760528564453125, 0.9062881469726562, 0.9365234375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 10.0, 7.0, 6.0, 18.0, 27.0, 32.0, 33.0, 44.0, 47.0, 50.0, 64.0, 65.0, 100.0, 91.0, 58.0, 57.0, 78.0, 43.0, 34.0, 38.0, 28.0, 22.0, 9.0, 18.0, 7.0, 5.0, 7.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.78271484375, -0.759674072265625, -0.73663330078125, -0.713592529296875, -0.6905517578125, -0.667510986328125, -0.64447021484375, -0.621429443359375, -0.598388671875, -0.575347900390625, -0.55230712890625, -0.529266357421875, -0.5062255859375, -0.483184814453125, -0.46014404296875, -0.437103271484375, -0.4140625, -0.391021728515625, -0.36798095703125, -0.344940185546875, -0.3218994140625, -0.298858642578125, -0.27581787109375, -0.252777099609375, -0.229736328125, -0.206695556640625, -0.18365478515625, -0.160614013671875, -0.1375732421875, -0.114532470703125, -0.09149169921875, -0.068450927734375, -0.04541015625, -0.022369384765625, 0.00067138671875, 0.023712158203125, 0.0467529296875, 0.069793701171875, 0.09283447265625, 0.115875244140625, 0.138916015625, 0.161956787109375, 0.18499755859375, 0.208038330078125, 0.2310791015625, 0.254119873046875, 0.27716064453125, 0.300201416015625, 0.3232421875, 0.346282958984375, 0.36932373046875, 0.392364501953125, 0.4154052734375, 0.438446044921875, 0.46148681640625, 0.484527587890625, 0.507568359375, 0.530609130859375, 0.55364990234375, 0.576690673828125, 0.5997314453125, 0.622772216796875, 0.64581298828125, 0.668853759765625, 0.69189453125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 7.0, 9.0, 12.0, 13.0, 19.0, 35.0, 39.0, 83.0, 122.0, 249.0, 513.0, 1377.0, 4646.0, 27905.0, 667185.0, 3407092.0, 72685.0, 8958.0, 2079.0, 687.0, 267.0, 142.0, 64.0, 28.0, 27.0, 16.0, 9.0, 4.0, 6.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.796875, -1.7392425537109375, -1.681610107421875, -1.6239776611328125, -1.56634521484375, -1.5087127685546875, -1.451080322265625, -1.3934478759765625, -1.3358154296875, -1.2781829833984375, -1.220550537109375, -1.1629180908203125, -1.10528564453125, -1.0476531982421875, -0.990020751953125, -0.9323883056640625, -0.874755859375, -0.8171234130859375, -0.759490966796875, -0.7018585205078125, -0.64422607421875, -0.5865936279296875, -0.528961181640625, -0.4713287353515625, -0.4136962890625, -0.3560638427734375, -0.298431396484375, -0.2407989501953125, -0.18316650390625, -0.1255340576171875, -0.067901611328125, -0.0102691650390625, 0.04736328125, 0.1049957275390625, 0.162628173828125, 0.2202606201171875, 0.27789306640625, 0.3355255126953125, 0.393157958984375, 0.4507904052734375, 0.5084228515625, 0.5660552978515625, 0.623687744140625, 0.6813201904296875, 0.73895263671875, 0.7965850830078125, 0.854217529296875, 0.9118499755859375, 0.969482421875, 1.0271148681640625, 1.084747314453125, 1.1423797607421875, 1.20001220703125, 1.2576446533203125, 1.315277099609375, 1.3729095458984375, 1.4305419921875, 1.4881744384765625, 1.545806884765625, 1.6034393310546875, 1.66107177734375, 1.7187042236328125, 1.776336669921875, 1.8339691162109375, 1.8916015625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 4.0, 8.0, 7.0, 7.0, 15.0, 17.0, 45.0, 76.0, 123.0, 291.0, 702.0, 1283.0, 796.0, 297.0, 163.0, 87.0, 50.0, 40.0, 19.0, 15.0, 17.0, 7.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.345703125, -2.28790283203125, -2.2301025390625, -2.17230224609375, -2.114501953125, -2.05670166015625, -1.9989013671875, -1.94110107421875, -1.88330078125, -1.82550048828125, -1.7677001953125, -1.70989990234375, -1.652099609375, -1.59429931640625, -1.5364990234375, -1.47869873046875, -1.4208984375, -1.36309814453125, -1.3052978515625, -1.24749755859375, -1.189697265625, -1.13189697265625, -1.0740966796875, -1.01629638671875, -0.95849609375, -0.90069580078125, -0.8428955078125, -0.78509521484375, -0.727294921875, -0.66949462890625, -0.6116943359375, -0.55389404296875, -0.49609375, -0.43829345703125, -0.3804931640625, -0.32269287109375, -0.264892578125, -0.20709228515625, -0.1492919921875, -0.09149169921875, -0.03369140625, 0.02410888671875, 0.0819091796875, 0.13970947265625, 0.197509765625, 0.25531005859375, 0.3131103515625, 0.37091064453125, 0.4287109375, 0.48651123046875, 0.5443115234375, 0.60211181640625, 0.659912109375, 0.71771240234375, 0.7755126953125, 0.83331298828125, 0.89111328125, 0.94891357421875, 1.0067138671875, 1.06451416015625, 1.122314453125, 1.18011474609375, 1.2379150390625, 1.29571533203125, 1.353515625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 11.0, 20.0, 47.0, 107.0, 212.0, 272.0, 172.0, 83.0, 34.0, 15.0, 10.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.645408630371094, -15.1768159866333, -14.708223342895508, -14.239630699157715, -13.771038055419922, -13.302445411682129, -12.833852767944336, -12.365259170532227, -11.89666748046875, -11.428074836730957, -10.959482192993164, -10.490889549255371, -10.022296905517578, -9.553704261779785, -9.085111618041992, -8.616518020629883, -8.14792537689209, -7.679332733154297, -7.210740089416504, -6.742147445678711, -6.273554801940918, -5.804962158203125, -5.336369037628174, -4.867776393890381, -4.399183750152588, -3.930591106414795, -3.461998462677002, -2.99340558052063, -2.524812936782837, -2.056220293045044, -1.5876274108886719, -1.119034767150879, -0.6504421234130859, -0.1818494200706482, 0.28674328327178955, 0.7553360462188721, 1.223928689956665, 1.692521333694458, 2.16111421585083, 2.629706859588623, 3.098299503326416, 3.566892147064209, 4.035484790802002, 4.504077911376953, 4.972670555114746, 5.441263198852539, 5.909855842590332, 6.378448486328125, 6.847041130065918, 7.315633773803711, 7.784226417541504, 8.252819061279297, 8.72141170501709, 9.190004348754883, 9.658597946166992, 10.127189636230469, 10.595783233642578, 11.064375877380371, 11.532968521118164, 12.001561164855957, 12.47015380859375, 12.938746452331543, 13.407339096069336, 13.875932693481445, 14.344524383544922]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 2.0, 2.0, 9.0, 8.0, 10.0, 16.0, 11.0, 19.0, 26.0, 17.0, 23.0, 26.0, 34.0, 30.0, 32.0, 41.0, 41.0, 46.0, 52.0, 46.0, 46.0, 49.0, 37.0, 50.0, 44.0, 42.0, 29.0, 32.0, 28.0, 31.0, 22.0, 18.0, 19.0, 13.0, 10.0, 11.0, 6.0, 9.0, 6.0, 4.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-5.679101467132568, -5.513421535491943, -5.347741603851318, -5.182061672210693, -5.016382217407227, -4.850702285766602, -4.685022354125977, -4.519342422485352, -4.353662490844727, -4.187982559204102, -4.022302627563477, -3.8566229343414307, -3.6909430027008057, -3.5252630710601807, -3.3595833778381348, -3.1939034461975098, -3.0282235145568848, -2.8625435829162598, -2.6968636512756348, -2.531183958053589, -2.365504026412964, -2.199824094772339, -2.034144401550293, -1.868464469909668, -1.702784538269043, -1.537104606628418, -1.3714247941970825, -1.205744981765747, -1.040065050125122, -0.8743851780891418, -0.7087053060531616, -0.5430254936218262, -0.37734508514404297, -0.21166521310806274, -0.04598534107208252, 0.1196945309638977, 0.28537440299987793, 0.45105427503585815, 0.6167341470718384, 0.7824139595031738, 0.9480938911437988, 1.1137738227844238, 1.2794536352157593, 1.4451334476470947, 1.6108133792877197, 1.7764933109283447, 1.9421731233596802, 2.1078529357910156, 2.2735328674316406, 2.4392127990722656, 2.6048927307128906, 2.7705724239349365, 2.9362523555755615, 3.1019322872161865, 3.2676119804382324, 3.4332919120788574, 3.5989718437194824, 3.7646517753601074, 3.9303317070007324, 4.096011638641357, 4.261691093444824, 4.427371025085449, 4.593050956726074, 4.758730888366699, 4.924410820007324]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 7.0, 16.0, 17.0, 29.0, 44.0, 54.0, 85.0, 187.0, 274.0, 547.0, 960.0, 1936.0, 4011.0, 9435.0, 23336.0, 59498.0, 149121.0, 307547.0, 280766.0, 126135.0, 49941.0, 19292.0, 8114.0, 3556.0, 1651.0, 872.0, 461.0, 269.0, 134.0, 89.0, 75.0, 36.0, 27.0, 16.0, 4.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.88134765625, -0.8553543090820312, -0.8293609619140625, -0.8033676147460938, -0.777374267578125, -0.7513809204101562, -0.7253875732421875, -0.6993942260742188, -0.67340087890625, -0.6474075317382812, -0.6214141845703125, -0.5954208374023438, -0.569427490234375, -0.5434341430664062, -0.5174407958984375, -0.49144744873046875, -0.4654541015625, -0.43946075439453125, -0.4134674072265625, -0.38747406005859375, -0.361480712890625, -0.33548736572265625, -0.3094940185546875, -0.28350067138671875, -0.25750732421875, -0.23151397705078125, -0.2055206298828125, -0.17952728271484375, -0.153533935546875, -0.12754058837890625, -0.1015472412109375, -0.07555389404296875, -0.049560546875, -0.02356719970703125, 0.0024261474609375, 0.02841949462890625, 0.054412841796875, 0.08040618896484375, 0.1063995361328125, 0.13239288330078125, 0.15838623046875, 0.18437957763671875, 0.2103729248046875, 0.23636627197265625, 0.262359619140625, 0.28835296630859375, 0.3143463134765625, 0.34033966064453125, 0.3663330078125, 0.39232635498046875, 0.4183197021484375, 0.44431304931640625, 0.470306396484375, 0.49629974365234375, 0.5222930908203125, 0.5482864379882812, 0.57427978515625, 0.6002731323242188, 0.6262664794921875, 0.6522598266601562, 0.678253173828125, 0.7042465209960938, 0.7302398681640625, 0.7562332153320312, 0.7822265625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 11.0, 8.0, 12.0, 23.0, 20.0, 34.0, 42.0, 49.0, 51.0, 59.0, 74.0, 83.0, 88.0, 77.0, 69.0, 63.0, 61.0, 45.0, 37.0, 29.0, 17.0, 14.0, 11.0, 8.0, 4.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.83642578125, -0.811981201171875, -0.78753662109375, -0.763092041015625, -0.7386474609375, -0.714202880859375, -0.68975830078125, -0.665313720703125, -0.640869140625, -0.616424560546875, -0.59197998046875, -0.567535400390625, -0.5430908203125, -0.518646240234375, -0.49420166015625, -0.469757080078125, -0.4453125, -0.420867919921875, -0.39642333984375, -0.371978759765625, -0.3475341796875, -0.323089599609375, -0.29864501953125, -0.274200439453125, -0.249755859375, -0.225311279296875, -0.20086669921875, -0.176422119140625, -0.1519775390625, -0.127532958984375, -0.10308837890625, -0.078643798828125, -0.05419921875, -0.029754638671875, -0.00531005859375, 0.019134521484375, 0.0435791015625, 0.068023681640625, 0.09246826171875, 0.116912841796875, 0.141357421875, 0.165802001953125, 0.19024658203125, 0.214691162109375, 0.2391357421875, 0.263580322265625, 0.28802490234375, 0.312469482421875, 0.3369140625, 0.361358642578125, 0.38580322265625, 0.410247802734375, 0.4346923828125, 0.459136962890625, 0.48358154296875, 0.508026123046875, 0.532470703125, 0.556915283203125, 0.58135986328125, 0.605804443359375, 0.6302490234375, 0.654693603515625, 0.67913818359375, 0.703582763671875, 0.72802734375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 4.0, 6.0, 2.0, 9.0, 11.0, 11.0, 11.0, 15.0, 28.0, 46.0, 55.0, 77.0, 86.0, 115.0, 175.0, 218.0, 353.0, 521.0, 818.0, 1395.0, 2811.0, 7787.0, 29062.0, 149717.0, 618599.0, 185060.0, 35310.0, 8971.0, 3121.0, 1536.0, 797.0, 528.0, 362.0, 268.0, 162.0, 123.0, 115.0, 74.0, 50.0, 39.0, 36.0, 26.0, 10.0, 7.0, 14.0, 8.0, 4.0, 6.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.208984375, -1.166656494140625, -1.12432861328125, -1.082000732421875, -1.0396728515625, -0.997344970703125, -0.95501708984375, -0.912689208984375, -0.870361328125, -0.828033447265625, -0.78570556640625, -0.743377685546875, -0.7010498046875, -0.658721923828125, -0.61639404296875, -0.574066162109375, -0.53173828125, -0.489410400390625, -0.44708251953125, -0.404754638671875, -0.3624267578125, -0.320098876953125, -0.27777099609375, -0.235443115234375, -0.193115234375, -0.150787353515625, -0.10845947265625, -0.066131591796875, -0.0238037109375, 0.018524169921875, 0.06085205078125, 0.103179931640625, 0.1455078125, 0.187835693359375, 0.23016357421875, 0.272491455078125, 0.3148193359375, 0.357147216796875, 0.39947509765625, 0.441802978515625, 0.484130859375, 0.526458740234375, 0.56878662109375, 0.611114501953125, 0.6534423828125, 0.695770263671875, 0.73809814453125, 0.780426025390625, 0.82275390625, 0.865081787109375, 0.90740966796875, 0.949737548828125, 0.9920654296875, 1.034393310546875, 1.07672119140625, 1.119049072265625, 1.161376953125, 1.203704833984375, 1.24603271484375, 1.288360595703125, 1.3306884765625, 1.373016357421875, 1.41534423828125, 1.457672119140625, 1.5]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 7.0, 3.0, 3.0, 3.0, 4.0, 9.0, 8.0, 14.0, 15.0, 25.0, 26.0, 18.0, 30.0, 33.0, 29.0, 28.0, 43.0, 31.0, 46.0, 48.0, 46.0, 62.0, 55.0, 46.0, 37.0, 47.0, 40.0, 42.0, 35.0, 25.0, 19.0, 17.0, 18.0, 20.0, 13.0, 18.0, 10.0, 7.0, 7.0, 5.0, 4.0, 6.0, 1.0, 2.0, 0.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.318359375, -2.248809814453125, -2.17926025390625, -2.109710693359375, -2.0401611328125, -1.970611572265625, -1.90106201171875, -1.831512451171875, -1.761962890625, -1.692413330078125, -1.62286376953125, -1.553314208984375, -1.4837646484375, -1.414215087890625, -1.34466552734375, -1.275115966796875, -1.20556640625, -1.136016845703125, -1.06646728515625, -0.996917724609375, -0.9273681640625, -0.857818603515625, -0.78826904296875, -0.718719482421875, -0.649169921875, -0.579620361328125, -0.51007080078125, -0.440521240234375, -0.3709716796875, -0.301422119140625, -0.23187255859375, -0.162322998046875, -0.0927734375, -0.023223876953125, 0.04632568359375, 0.115875244140625, 0.1854248046875, 0.254974365234375, 0.32452392578125, 0.394073486328125, 0.463623046875, 0.533172607421875, 0.60272216796875, 0.672271728515625, 0.7418212890625, 0.811370849609375, 0.88092041015625, 0.950469970703125, 1.02001953125, 1.089569091796875, 1.15911865234375, 1.228668212890625, 1.2982177734375, 1.367767333984375, 1.43731689453125, 1.506866455078125, 1.576416015625, 1.645965576171875, 1.71551513671875, 1.785064697265625, 1.8546142578125, 1.924163818359375, 1.99371337890625, 2.063262939453125, 2.1328125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 4.0, 6.0, 8.0, 21.0, 23.0, 32.0, 45.0, 105.0, 208.0, 534.0, 1429.0, 5334.0, 44471.0, 887868.0, 97309.0, 8014.0, 1946.0, 670.0, 264.0, 111.0, 64.0, 32.0, 19.0, 13.0, 9.0, 9.0, 5.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.138671875, -1.1057815551757812, -1.0728912353515625, -1.0400009155273438, -1.007110595703125, -0.9742202758789062, -0.9413299560546875, -0.9084396362304688, -0.87554931640625, -0.8426589965820312, -0.8097686767578125, -0.7768783569335938, -0.743988037109375, -0.7110977172851562, -0.6782073974609375, -0.6453170776367188, -0.6124267578125, -0.5795364379882812, -0.5466461181640625, -0.5137557983398438, -0.480865478515625, -0.44797515869140625, -0.4150848388671875, -0.38219451904296875, -0.34930419921875, -0.31641387939453125, -0.2835235595703125, -0.25063323974609375, -0.217742919921875, -0.18485260009765625, -0.1519622802734375, -0.11907196044921875, -0.086181640625, -0.05329132080078125, -0.0204010009765625, 0.01248931884765625, 0.045379638671875, 0.07826995849609375, 0.1111602783203125, 0.14405059814453125, 0.17694091796875, 0.20983123779296875, 0.2427215576171875, 0.27561187744140625, 0.308502197265625, 0.34139251708984375, 0.3742828369140625, 0.40717315673828125, 0.4400634765625, 0.47295379638671875, 0.5058441162109375, 0.5387344360351562, 0.571624755859375, 0.6045150756835938, 0.6374053955078125, 0.6702957153320312, 0.70318603515625, 0.7360763549804688, 0.7689666748046875, 0.8018569946289062, 0.834747314453125, 0.8676376342773438, 0.9005279541015625, 0.9334182739257812, 0.96630859375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 5.0, 16.0, 14.0, 16.0, 29.0, 46.0, 57.0, 73.0, 99.0, 109.0, 137.0, 110.0, 85.0, 60.0, 45.0, 29.0, 20.0, 12.0, 5.0, 6.0, 8.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00022518634796142578, -0.00021913275122642517, -0.00021307915449142456, -0.00020702555775642395, -0.00020097196102142334, -0.00019491836428642273, -0.00018886476755142212, -0.0001828111708164215, -0.0001767575740814209, -0.0001707039773464203, -0.00016465038061141968, -0.00015859678387641907, -0.00015254318714141846, -0.00014648959040641785, -0.00014043599367141724, -0.00013438239693641663, -0.00012832880020141602, -0.0001222752034664154, -0.0001162216067314148, -0.00011016800999641418, -0.00010411441326141357, -9.806081652641296e-05, -9.200721979141235e-05, -8.595362305641174e-05, -7.990002632141113e-05, -7.384642958641052e-05, -6.779283285140991e-05, -6.17392361164093e-05, -5.568563938140869e-05, -4.963204264640808e-05, -4.357844591140747e-05, -3.752484917640686e-05, -3.147125244140625e-05, -2.541765570640564e-05, -1.936405897140503e-05, -1.3310462236404419e-05, -7.256865501403809e-06, -1.2032687664031982e-06, 4.850327968597412e-06, 1.0903924703598022e-05, 1.6957521438598633e-05, 2.3011118173599243e-05, 2.9064714908599854e-05, 3.5118311643600464e-05, 4.1171908378601074e-05, 4.7225505113601685e-05, 5.3279101848602295e-05, 5.9332698583602905e-05, 6.538629531860352e-05, 7.143989205360413e-05, 7.749348878860474e-05, 8.354708552360535e-05, 8.960068225860596e-05, 9.565427899360657e-05, 0.00010170787572860718, 0.00010776147246360779, 0.0001138150691986084, 0.00011986866593360901, 0.00012592226266860962, 0.00013197585940361023, 0.00013802945613861084, 0.00014408305287361145, 0.00015013664960861206, 0.00015619024634361267, 0.00016224384307861328]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 4.0, 4.0, 10.0, 6.0, 11.0, 10.0, 14.0, 29.0, 23.0, 45.0, 66.0, 131.0, 203.0, 305.0, 646.0, 1310.0, 3517.0, 12085.0, 78135.0, 776079.0, 150084.0, 17771.0, 4584.0, 1799.0, 763.0, 386.0, 210.0, 103.0, 79.0, 47.0, 29.0, 17.0, 16.0, 9.0, 12.0, 5.0, 3.0, 4.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.8388671875, -0.8159637451171875, -0.793060302734375, -0.7701568603515625, -0.74725341796875, -0.7243499755859375, -0.701446533203125, -0.6785430908203125, -0.6556396484375, -0.6327362060546875, -0.609832763671875, -0.5869293212890625, -0.56402587890625, -0.5411224365234375, -0.518218994140625, -0.4953155517578125, -0.472412109375, -0.4495086669921875, -0.426605224609375, -0.4037017822265625, -0.38079833984375, -0.3578948974609375, -0.334991455078125, -0.3120880126953125, -0.2891845703125, -0.2662811279296875, -0.243377685546875, -0.2204742431640625, -0.19757080078125, -0.1746673583984375, -0.151763916015625, -0.1288604736328125, -0.10595703125, -0.0830535888671875, -0.060150146484375, -0.0372467041015625, -0.01434326171875, 0.0085601806640625, 0.031463623046875, 0.0543670654296875, 0.0772705078125, 0.1001739501953125, 0.123077392578125, 0.1459808349609375, 0.16888427734375, 0.1917877197265625, 0.214691162109375, 0.2375946044921875, 0.260498046875, 0.2834014892578125, 0.306304931640625, 0.3292083740234375, 0.35211181640625, 0.3750152587890625, 0.397918701171875, 0.4208221435546875, 0.4437255859375, 0.4666290283203125, 0.489532470703125, 0.5124359130859375, 0.53533935546875, 0.5582427978515625, 0.581146240234375, 0.6040496826171875, 0.626953125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 4.0, 11.0, 10.0, 12.0, 18.0, 27.0, 38.0, 58.0, 77.0, 96.0, 99.0, 110.0, 94.0, 75.0, 61.0, 64.0, 43.0, 26.0, 26.0, 13.0, 11.0, 6.0, 1.0, 7.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.73388671875, -0.7111282348632812, -0.6883697509765625, -0.6656112670898438, -0.642852783203125, -0.6200942993164062, -0.5973358154296875, -0.5745773315429688, -0.55181884765625, -0.5290603637695312, -0.5063018798828125, -0.48354339599609375, -0.460784912109375, -0.43802642822265625, -0.4152679443359375, -0.39250946044921875, -0.3697509765625, -0.34699249267578125, -0.3242340087890625, -0.30147552490234375, -0.278717041015625, -0.25595855712890625, -0.2332000732421875, -0.21044158935546875, -0.18768310546875, -0.16492462158203125, -0.1421661376953125, -0.11940765380859375, -0.096649169921875, -0.07389068603515625, -0.0511322021484375, -0.02837371826171875, -0.005615234375, 0.01714324951171875, 0.0399017333984375, 0.06266021728515625, 0.085418701171875, 0.10817718505859375, 0.1309356689453125, 0.15369415283203125, 0.17645263671875, 0.19921112060546875, 0.2219696044921875, 0.24472808837890625, 0.267486572265625, 0.29024505615234375, 0.3130035400390625, 0.33576202392578125, 0.3585205078125, 0.38127899169921875, 0.4040374755859375, 0.42679595947265625, 0.449554443359375, 0.47231292724609375, 0.4950714111328125, 0.5178298950195312, 0.54058837890625, 0.5633468627929688, 0.5861053466796875, 0.6088638305664062, 0.631622314453125, 0.6543807983398438, 0.6771392822265625, 0.6998977661132812, 0.72265625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 7.0, 9.0, 14.0, 30.0, 74.0, 142.0, 275.0, 255.0, 110.0, 52.0, 25.0, 9.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.005552291870117, -20.43624496459961, -19.86693572998047, -19.29762840270996, -18.728321075439453, -18.159013748168945, -17.589706420898438, -17.020397186279297, -16.45108985900879, -15.881782531738281, -15.312474250793457, -14.743165969848633, -14.173858642578125, -13.604551315307617, -13.035243034362793, -12.465934753417969, -11.896627426147461, -11.327320098876953, -10.758011817932129, -10.188703536987305, -9.619396209716797, -9.050088882446289, -8.480780601501465, -7.911472797393799, -7.342164993286133, -6.772857189178467, -6.203549385070801, -5.634241580963135, -5.064933776855469, -4.495625972747803, -3.9263181686401367, -3.3570103645324707, -2.787700653076172, -2.218392848968506, -1.6490850448608398, -1.0797772407531738, -0.5104694366455078, 0.0588383674621582, 0.6281461715698242, 1.1974539756774902, 1.7667617797851562, 2.3360695838928223, 2.9053773880004883, 3.4746851921081543, 4.04399299621582, 4.613300800323486, 5.182608604431152, 5.751916408538818, 6.321224212646484, 6.89053201675415, 7.459839820861816, 8.02914810180664, 8.598455429077148, 9.167762756347656, 9.73707103729248, 10.306379318237305, 10.875686645507812, 11.44499397277832, 12.014302253723145, 12.583610534667969, 13.152917861938477, 13.722225189208984, 14.291533470153809, 14.860841751098633, 15.43014907836914]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 3.0, 2.0, 4.0, 4.0, 2.0, 9.0, 6.0, 15.0, 5.0, 15.0, 14.0, 21.0, 32.0, 27.0, 22.0, 21.0, 37.0, 31.0, 44.0, 44.0, 51.0, 55.0, 84.0, 68.0, 47.0, 45.0, 37.0, 31.0, 33.0, 29.0, 22.0, 20.0, 18.0, 13.0, 20.0, 20.0, 13.0, 6.0, 10.0, 6.0, 11.0, 6.0, 1.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.886995315551758, -9.6072416305542, -9.327488899230957, -9.047735214233398, -8.767982482910156, -8.488228797912598, -8.208475112915039, -7.928721904754639, -7.648968696594238, -7.369215488433838, -7.0894622802734375, -6.809708595275879, -6.5299553871154785, -6.250202178955078, -5.9704484939575195, -5.690695285797119, -5.410942077636719, -5.131188869476318, -4.851435661315918, -4.571681976318359, -4.291928768157959, -4.012175559997559, -3.732422113418579, -3.4526686668395996, -3.172915458679199, -2.893162250518799, -2.6134088039398193, -2.33365535736084, -2.0539021492004395, -1.7741488218307495, -1.4943954944610596, -1.2146421670913696, -0.9348888397216797, -0.6551355123519897, -0.3753821849822998, -0.09562885761260986, 0.18412446975708008, 0.46387779712677, 0.74363112449646, 1.02338445186615, 1.3031377792358398, 1.5828911066055298, 1.8626444339752197, 2.142397880554199, 2.4221510887145996, 2.701904296875, 2.9816577434539795, 3.261411190032959, 3.5411643981933594, 3.8209176063537598, 4.10067081451416, 4.380424499511719, 4.660177707672119, 4.9399309158325195, 5.219684600830078, 5.4994378089904785, 5.779191017150879, 6.058944225311279, 6.33869743347168, 6.618451118469238, 6.898204326629639, 7.177957534790039, 7.457711219787598, 7.737464427947998, 8.017217636108398]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 1.0, 1.0, 6.0, 6.0, 7.0, 10.0, 15.0, 14.0, 18.0, 37.0, 48.0, 92.0, 112.0, 154.0, 230.0, 329.0, 576.0, 803.0, 1432.0, 2611.0, 5187.0, 11558.0, 29692.0, 99908.0, 469829.0, 2118270.0, 1153260.0, 210292.0, 54098.0, 18737.0, 7952.0, 3885.0, 1985.0, 1163.0, 673.0, 435.0, 277.0, 182.0, 118.0, 97.0, 61.0, 37.0, 24.0, 24.0, 8.0, 9.0, 9.0, 2.0, 6.0, 3.0, 3.0, 3.0, 2.0], "bins": [-0.57421875, -0.5585975646972656, -0.5429763793945312, -0.5273551940917969, -0.5117340087890625, -0.4961128234863281, -0.48049163818359375, -0.4648704528808594, -0.449249267578125, -0.4336280822753906, -0.41800689697265625, -0.4023857116699219, -0.3867645263671875, -0.3711433410644531, -0.35552215576171875, -0.3399009704589844, -0.32427978515625, -0.3086585998535156, -0.29303741455078125, -0.2774162292480469, -0.2617950439453125, -0.24617385864257812, -0.23055267333984375, -0.21493148803710938, -0.199310302734375, -0.18368911743164062, -0.16806793212890625, -0.15244674682617188, -0.1368255615234375, -0.12120437622070312, -0.10558319091796875, -0.08996200561523438, -0.0743408203125, -0.058719635009765625, -0.04309844970703125, -0.027477264404296875, -0.0118560791015625, 0.003765106201171875, 0.01938629150390625, 0.035007476806640625, 0.050628662109375, 0.06624984741210938, 0.08187103271484375, 0.09749221801757812, 0.1131134033203125, 0.12873458862304688, 0.14435577392578125, 0.15997695922851562, 0.17559814453125, 0.19121932983398438, 0.20684051513671875, 0.22246170043945312, 0.2380828857421875, 0.2537040710449219, 0.26932525634765625, 0.2849464416503906, 0.300567626953125, 0.3161888122558594, 0.33180999755859375, 0.3474311828613281, 0.3630523681640625, 0.3786735534667969, 0.39429473876953125, 0.4099159240722656, 0.425537109375]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 13.0, 20.0, 21.0, 18.0, 32.0, 33.0, 40.0, 64.0, 71.0, 91.0, 86.0, 87.0, 72.0, 66.0, 60.0, 43.0, 45.0, 37.0, 29.0, 21.0, 7.0, 9.0, 8.0, 11.0, 7.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.9248046875, -0.8998641967773438, -0.8749237060546875, -0.8499832153320312, -0.825042724609375, -0.8001022338867188, -0.7751617431640625, -0.7502212524414062, -0.72528076171875, -0.7003402709960938, -0.6753997802734375, -0.6504592895507812, -0.625518798828125, -0.6005783081054688, -0.5756378173828125, -0.5506973266601562, -0.5257568359375, -0.5008163452148438, -0.4758758544921875, -0.45093536376953125, -0.425994873046875, -0.40105438232421875, -0.3761138916015625, -0.35117340087890625, -0.32623291015625, -0.30129241943359375, -0.2763519287109375, -0.25141143798828125, -0.226470947265625, -0.20153045654296875, -0.1765899658203125, -0.15164947509765625, -0.126708984375, -0.10176849365234375, -0.0768280029296875, -0.05188751220703125, -0.026947021484375, -0.00200653076171875, 0.0229339599609375, 0.04787445068359375, 0.07281494140625, 0.09775543212890625, 0.1226959228515625, 0.14763641357421875, 0.172576904296875, 0.19751739501953125, 0.2224578857421875, 0.24739837646484375, 0.2723388671875, 0.29727935791015625, 0.3222198486328125, 0.34716033935546875, 0.372100830078125, 0.39704132080078125, 0.4219818115234375, 0.44692230224609375, 0.47186279296875, 0.49680328369140625, 0.5217437744140625, 0.5466842651367188, 0.571624755859375, 0.5965652465820312, 0.6215057373046875, 0.6464462280273438, 0.67138671875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 11.0, 6.0, 14.0, 18.0, 27.0, 38.0, 46.0, 65.0, 133.0, 157.0, 252.0, 470.0, 976.0, 2367.0, 7928.0, 41141.0, 712388.0, 3282073.0, 120849.0, 18187.0, 4379.0, 1415.0, 574.0, 306.0, 175.0, 106.0, 52.0, 44.0, 27.0, 11.0, 14.0, 10.0, 6.0, 7.0, 6.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.2900390625, -1.25, -1.2099609375, -1.169921875, -1.1298828125, -1.08984375, -1.0498046875, -1.009765625, -0.9697265625, -0.9296875, -0.8896484375, -0.849609375, -0.8095703125, -0.76953125, -0.7294921875, -0.689453125, -0.6494140625, -0.609375, -0.5693359375, -0.529296875, -0.4892578125, -0.44921875, -0.4091796875, -0.369140625, -0.3291015625, -0.2890625, -0.2490234375, -0.208984375, -0.1689453125, -0.12890625, -0.0888671875, -0.048828125, -0.0087890625, 0.03125, 0.0712890625, 0.111328125, 0.1513671875, 0.19140625, 0.2314453125, 0.271484375, 0.3115234375, 0.3515625, 0.3916015625, 0.431640625, 0.4716796875, 0.51171875, 0.5517578125, 0.591796875, 0.6318359375, 0.671875, 0.7119140625, 0.751953125, 0.7919921875, 0.83203125, 0.8720703125, 0.912109375, 0.9521484375, 0.9921875, 1.0322265625, 1.072265625, 1.1123046875, 1.15234375, 1.1923828125, 1.232421875, 1.2724609375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 6.0, 3.0, 10.0, 9.0, 9.0, 23.0, 29.0, 26.0, 57.0, 88.0, 196.0, 385.0, 684.0, 846.0, 731.0, 369.0, 208.0, 122.0, 77.0, 48.0, 45.0, 33.0, 25.0, 10.0, 6.0, 11.0, 6.0, 6.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.451171875, -1.4125518798828125, -1.373931884765625, -1.3353118896484375, -1.29669189453125, -1.2580718994140625, -1.219451904296875, -1.1808319091796875, -1.1422119140625, -1.1035919189453125, -1.064971923828125, -1.0263519287109375, -0.98773193359375, -0.9491119384765625, -0.910491943359375, -0.8718719482421875, -0.833251953125, -0.7946319580078125, -0.756011962890625, -0.7173919677734375, -0.67877197265625, -0.6401519775390625, -0.601531982421875, -0.5629119873046875, -0.5242919921875, -0.4856719970703125, -0.447052001953125, -0.4084320068359375, -0.36981201171875, -0.3311920166015625, -0.292572021484375, -0.2539520263671875, -0.21533203125, -0.1767120361328125, -0.138092041015625, -0.0994720458984375, -0.06085205078125, -0.0222320556640625, 0.016387939453125, 0.0550079345703125, 0.0936279296875, 0.1322479248046875, 0.170867919921875, 0.2094879150390625, 0.24810791015625, 0.2867279052734375, 0.325347900390625, 0.3639678955078125, 0.402587890625, 0.4412078857421875, 0.479827880859375, 0.5184478759765625, 0.55706787109375, 0.5956878662109375, 0.634307861328125, 0.6729278564453125, 0.7115478515625, 0.7501678466796875, 0.788787841796875, 0.8274078369140625, 0.86602783203125, 0.9046478271484375, 0.943267822265625, 0.9818878173828125, 1.0205078125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 0.0, 25.0, 88.0, 265.0, 340.0, 180.0, 65.0, 18.0, 7.0, 1.0, 4.0, 2.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.717849731445312, -15.069784164428711, -14.42171859741211, -13.773653030395508, -13.12558650970459, -12.477520942687988, -11.829455375671387, -11.181388854980469, -10.533323287963867, -9.885257720947266, -9.237192153930664, -8.589126586914062, -7.9410600662231445, -7.292994499206543, -6.644928932189941, -5.996862888336182, -5.348797798156738, -4.700732231140137, -4.052666187286377, -3.4046006202697754, -2.7565348148345947, -2.108469009399414, -1.4604034423828125, -0.8123373985290527, -0.16427183151245117, 0.4837939143180847, 1.1318596601486206, 1.7799253463745117, 2.4279911518096924, 3.076056957244873, 3.7241225242614746, 4.372188568115234, 5.020254135131836, 5.6683197021484375, 6.316385746002197, 6.964451313018799, 7.612517356872559, 8.26058292388916, 8.908648490905762, 9.55671501159668, 10.204780578613281, 10.852846145629883, 11.500911712646484, 12.148977279663086, 12.797043800354004, 13.445109367370605, 14.093174934387207, 14.741241455078125, 15.38930606842041, 16.037372589111328, 16.68543815612793, 17.33350372314453, 17.981569290161133, 18.629634857177734, 19.277700424194336, 19.925765991210938, 20.57383155822754, 21.22189712524414, 21.869962692260742, 22.518028259277344, 23.166093826293945, 23.814159393310547, 24.46222686767578, 25.110292434692383, 25.758358001708984]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 6.0, 4.0, 2.0, 5.0, 7.0, 3.0, 8.0, 6.0, 20.0, 16.0, 25.0, 41.0, 27.0, 45.0, 41.0, 48.0, 63.0, 66.0, 53.0, 59.0, 56.0, 46.0, 51.0, 54.0, 39.0, 31.0, 32.0, 30.0, 20.0, 23.0, 20.0, 19.0, 10.0, 13.0, 5.0, 6.0, 2.0, 3.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.452091217041016, -5.278045654296875, -5.104000091552734, -4.929954528808594, -4.755908966064453, -4.581862926483154, -4.407817363739014, -4.233771800994873, -4.059726238250732, -3.885680675506592, -3.711635112762451, -3.5375893115997314, -3.363543748855591, -3.18949818611145, -3.0154523849487305, -2.84140682220459, -2.667361259460449, -2.4933156967163086, -2.319270133972168, -2.1452243328094482, -1.9711787700653076, -1.797133207321167, -1.6230875253677368, -1.4490418434143066, -1.274996280670166, -1.1009507179260254, -0.9269050359725952, -0.7528594136238098, -0.5788137912750244, -0.404768168926239, -0.2307225465774536, -0.05667686462402344, 0.11736869812011719, 0.2914143204689026, 0.465459942817688, 0.6395055651664734, 0.8135511875152588, 0.9875968098640442, 1.1616424322128296, 1.3356881141662598, 1.5097336769104004, 1.683779239654541, 1.8578249216079712, 2.0318706035614014, 2.205916166305542, 2.3799617290496826, 2.5540075302124023, 2.728053092956543, 2.9020986557006836, 3.076144218444824, 3.250189781188965, 3.4242355823516846, 3.598281145095825, 3.772326707839966, 3.9463725090026855, 4.120418071746826, 4.294463634490967, 4.468509197235107, 4.642554759979248, 4.816600322723389, 4.9906463623046875, 5.164691925048828, 5.338737487792969, 5.512783050537109, 5.68682861328125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 4.0, 20.0, 4.0, 16.0, 29.0, 26.0, 64.0, 91.0, 134.0, 221.0, 324.0, 512.0, 859.0, 1397.0, 2296.0, 4122.0, 7519.0, 14305.0, 27524.0, 55244.0, 113443.0, 223348.0, 272271.0, 163133.0, 79110.0, 39086.0, 19640.0, 10175.0, 5677.0, 3166.0, 1784.0, 1099.0, 695.0, 401.0, 267.0, 174.0, 130.0, 79.0, 53.0, 40.0, 22.0, 15.0, 9.0, 10.0, 9.0, 5.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.67431640625, -0.652740478515625, -0.63116455078125, -0.609588623046875, -0.5880126953125, -0.566436767578125, -0.54486083984375, -0.523284912109375, -0.501708984375, -0.480133056640625, -0.45855712890625, -0.436981201171875, -0.4154052734375, -0.393829345703125, -0.37225341796875, -0.350677490234375, -0.3291015625, -0.307525634765625, -0.28594970703125, -0.264373779296875, -0.2427978515625, -0.221221923828125, -0.19964599609375, -0.178070068359375, -0.156494140625, -0.134918212890625, -0.11334228515625, -0.091766357421875, -0.0701904296875, -0.048614501953125, -0.02703857421875, -0.005462646484375, 0.01611328125, 0.037689208984375, 0.05926513671875, 0.080841064453125, 0.1024169921875, 0.123992919921875, 0.14556884765625, 0.167144775390625, 0.188720703125, 0.210296630859375, 0.23187255859375, 0.253448486328125, 0.2750244140625, 0.296600341796875, 0.31817626953125, 0.339752197265625, 0.361328125, 0.382904052734375, 0.40447998046875, 0.426055908203125, 0.4476318359375, 0.469207763671875, 0.49078369140625, 0.512359619140625, 0.533935546875, 0.555511474609375, 0.57708740234375, 0.598663330078125, 0.6202392578125, 0.641815185546875, 0.66339111328125, 0.684967041015625, 0.70654296875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 7.0, 16.0, 13.0, 26.0, 26.0, 34.0, 56.0, 49.0, 81.0, 68.0, 75.0, 67.0, 75.0, 80.0, 66.0, 61.0, 57.0, 35.0, 29.0, 25.0, 12.0, 11.0, 10.0, 7.0, 6.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8974609375, -0.8722152709960938, -0.8469696044921875, -0.8217239379882812, -0.796478271484375, -0.7712326049804688, -0.7459869384765625, -0.7207412719726562, -0.69549560546875, -0.6702499389648438, -0.6450042724609375, -0.6197586059570312, -0.594512939453125, -0.5692672729492188, -0.5440216064453125, -0.5187759399414062, -0.4935302734375, -0.46828460693359375, -0.4430389404296875, -0.41779327392578125, -0.392547607421875, -0.36730194091796875, -0.3420562744140625, -0.31681060791015625, -0.29156494140625, -0.26631927490234375, -0.2410736083984375, -0.21582794189453125, -0.190582275390625, -0.16533660888671875, -0.1400909423828125, -0.11484527587890625, -0.089599609375, -0.06435394287109375, -0.0391082763671875, -0.01386260986328125, 0.011383056640625, 0.03662872314453125, 0.0618743896484375, 0.08712005615234375, 0.11236572265625, 0.13761138916015625, 0.1628570556640625, 0.18810272216796875, 0.213348388671875, 0.23859405517578125, 0.2638397216796875, 0.28908538818359375, 0.3143310546875, 0.33957672119140625, 0.3648223876953125, 0.39006805419921875, 0.415313720703125, 0.44055938720703125, 0.4658050537109375, 0.49105072021484375, 0.51629638671875, 0.5415420532226562, 0.5667877197265625, 0.5920333862304688, 0.617279052734375, 0.6425247192382812, 0.6677703857421875, 0.6930160522460938, 0.71826171875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 6.0, 5.0, 5.0, 16.0, 14.0, 29.0, 39.0, 50.0, 77.0, 130.0, 196.0, 298.0, 472.0, 785.0, 1654.0, 4112.0, 17896.0, 119542.0, 700552.0, 169199.0, 24164.0, 5064.0, 1812.0, 905.0, 551.0, 328.0, 196.0, 149.0, 98.0, 59.0, 44.0, 31.0, 30.0, 16.0, 11.0, 4.0, 2.0, 8.0, 1.0, 2.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5, -1.443572998046875, -1.38714599609375, -1.330718994140625, -1.2742919921875, -1.217864990234375, -1.16143798828125, -1.105010986328125, -1.048583984375, -0.992156982421875, -0.93572998046875, -0.879302978515625, -0.8228759765625, -0.766448974609375, -0.71002197265625, -0.653594970703125, -0.59716796875, -0.540740966796875, -0.48431396484375, -0.427886962890625, -0.3714599609375, -0.315032958984375, -0.25860595703125, -0.202178955078125, -0.145751953125, -0.089324951171875, -0.03289794921875, 0.023529052734375, 0.0799560546875, 0.136383056640625, 0.19281005859375, 0.249237060546875, 0.3056640625, 0.362091064453125, 0.41851806640625, 0.474945068359375, 0.5313720703125, 0.587799072265625, 0.64422607421875, 0.700653076171875, 0.757080078125, 0.813507080078125, 0.86993408203125, 0.926361083984375, 0.9827880859375, 1.039215087890625, 1.09564208984375, 1.152069091796875, 1.20849609375, 1.264923095703125, 1.32135009765625, 1.377777099609375, 1.4342041015625, 1.490631103515625, 1.54705810546875, 1.603485107421875, 1.659912109375, 1.716339111328125, 1.77276611328125, 1.829193115234375, 1.8856201171875, 1.942047119140625, 1.99847412109375, 2.054901123046875, 2.111328125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 6.0, 1.0, 2.0, 6.0, 5.0, 7.0, 6.0, 11.0, 9.0, 18.0, 17.0, 18.0, 37.0, 30.0, 25.0, 39.0, 38.0, 37.0, 35.0, 60.0, 48.0, 49.0, 50.0, 65.0, 42.0, 49.0, 41.0, 41.0, 30.0, 25.0, 23.0, 19.0, 23.0, 13.0, 20.0, 16.0, 13.0, 10.0, 5.0, 3.0, 4.0, 3.0, 2.0, 4.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.755859375, -1.696136474609375, -1.63641357421875, -1.576690673828125, -1.5169677734375, -1.457244873046875, -1.39752197265625, -1.337799072265625, -1.278076171875, -1.218353271484375, -1.15863037109375, -1.098907470703125, -1.0391845703125, -0.979461669921875, -0.91973876953125, -0.860015869140625, -0.80029296875, -0.740570068359375, -0.68084716796875, -0.621124267578125, -0.5614013671875, -0.501678466796875, -0.44195556640625, -0.382232666015625, -0.322509765625, -0.262786865234375, -0.20306396484375, -0.143341064453125, -0.0836181640625, -0.023895263671875, 0.03582763671875, 0.095550537109375, 0.1552734375, 0.214996337890625, 0.27471923828125, 0.334442138671875, 0.3941650390625, 0.453887939453125, 0.51361083984375, 0.573333740234375, 0.633056640625, 0.692779541015625, 0.75250244140625, 0.812225341796875, 0.8719482421875, 0.931671142578125, 0.99139404296875, 1.051116943359375, 1.11083984375, 1.170562744140625, 1.23028564453125, 1.290008544921875, 1.3497314453125, 1.409454345703125, 1.46917724609375, 1.528900146484375, 1.588623046875, 1.648345947265625, 1.70806884765625, 1.767791748046875, 1.8275146484375, 1.887237548828125, 1.94696044921875, 2.006683349609375, 2.06640625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 2.0, 3.0, 11.0, 17.0, 20.0, 20.0, 25.0, 49.0, 94.0, 150.0, 287.0, 621.0, 1442.0, 3840.0, 12478.0, 50227.0, 306122.0, 579971.0, 68855.0, 16158.0, 4892.0, 1694.0, 786.0, 344.0, 157.0, 106.0, 61.0, 38.0, 26.0, 16.0, 13.0, 12.0, 6.0, 4.0, 6.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.564453125, -0.5463027954101562, -0.5281524658203125, -0.5100021362304688, -0.491851806640625, -0.47370147705078125, -0.4555511474609375, -0.43740081787109375, -0.41925048828125, -0.40110015869140625, -0.3829498291015625, -0.36479949951171875, -0.346649169921875, -0.32849884033203125, -0.3103485107421875, -0.29219818115234375, -0.2740478515625, -0.25589752197265625, -0.2377471923828125, -0.21959686279296875, -0.201446533203125, -0.18329620361328125, -0.1651458740234375, -0.14699554443359375, -0.12884521484375, -0.11069488525390625, -0.0925445556640625, -0.07439422607421875, -0.056243896484375, -0.03809356689453125, -0.0199432373046875, -0.00179290771484375, 0.016357421875, 0.03450775146484375, 0.0526580810546875, 0.07080841064453125, 0.088958740234375, 0.10710906982421875, 0.1252593994140625, 0.14340972900390625, 0.16156005859375, 0.17971038818359375, 0.1978607177734375, 0.21601104736328125, 0.234161376953125, 0.25231170654296875, 0.2704620361328125, 0.28861236572265625, 0.3067626953125, 0.32491302490234375, 0.3430633544921875, 0.36121368408203125, 0.379364013671875, 0.39751434326171875, 0.4156646728515625, 0.43381500244140625, 0.45196533203125, 0.47011566162109375, 0.4882659912109375, 0.5064163208007812, 0.524566650390625, 0.5427169799804688, 0.5608673095703125, 0.5790176391601562, 0.59716796875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 7.0, 1.0, 0.0, 4.0, 5.0, 7.0, 8.0, 8.0, 12.0, 18.0, 27.0, 36.0, 40.0, 62.0, 95.0, 120.0, 128.0, 123.0, 72.0, 53.0, 39.0, 24.0, 23.0, 21.0, 16.0, 7.0, 10.0, 4.0, 8.0, 4.0, 2.0, 6.0, 2.0, 3.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0002028942108154297, -0.00019639357924461365, -0.0001898929476737976, -0.00018339231610298157, -0.00017689168453216553, -0.0001703910529613495, -0.00016389042139053345, -0.0001573897898197174, -0.00015088915824890137, -0.00014438852667808533, -0.0001378878951072693, -0.00013138726353645325, -0.0001248866319656372, -0.00011838600039482117, -0.00011188536882400513, -0.00010538473725318909, -9.888410568237305e-05, -9.238347411155701e-05, -8.588284254074097e-05, -7.938221096992493e-05, -7.288157939910889e-05, -6.638094782829285e-05, -5.988031625747681e-05, -5.3379684686660767e-05, -4.6879053115844727e-05, -4.0378421545028687e-05, -3.3877789974212646e-05, -2.7377158403396606e-05, -2.0876526832580566e-05, -1.4375895261764526e-05, -7.875263690948486e-06, -1.3746321201324463e-06, 5.125999450683594e-06, 1.1626631021499634e-05, 1.8127262592315674e-05, 2.4627894163131714e-05, 3.1128525733947754e-05, 3.7629157304763794e-05, 4.4129788875579834e-05, 5.0630420446395874e-05, 5.7131052017211914e-05, 6.363168358802795e-05, 7.0132315158844e-05, 7.663294672966003e-05, 8.313357830047607e-05, 8.963420987129211e-05, 9.613484144210815e-05, 0.0001026354730129242, 0.00010913610458374023, 0.00011563673615455627, 0.00012213736772537231, 0.00012863799929618835, 0.0001351386308670044, 0.00014163926243782043, 0.00014813989400863647, 0.00015464052557945251, 0.00016114115715026855, 0.0001676417887210846, 0.00017414242029190063, 0.00018064305186271667, 0.00018714368343353271, 0.00019364431500434875, 0.0002001449465751648, 0.00020664557814598083, 0.00021314620971679688]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 7.0, 5.0, 6.0, 7.0, 8.0, 20.0, 16.0, 32.0, 51.0, 80.0, 134.0, 249.0, 494.0, 955.0, 2302.0, 6379.0, 25159.0, 162554.0, 707979.0, 113626.0, 19323.0, 5338.0, 1953.0, 862.0, 430.0, 252.0, 121.0, 86.0, 39.0, 19.0, 15.0, 18.0, 11.0, 7.0, 10.0, 2.0, 0.0, 4.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6513671875, -0.6318740844726562, -0.6123809814453125, -0.5928878784179688, -0.573394775390625, -0.5539016723632812, -0.5344085693359375, -0.5149154663085938, -0.49542236328125, -0.47592926025390625, -0.4564361572265625, -0.43694305419921875, -0.417449951171875, -0.39795684814453125, -0.3784637451171875, -0.35897064208984375, -0.3394775390625, -0.31998443603515625, -0.3004913330078125, -0.28099822998046875, -0.261505126953125, -0.24201202392578125, -0.2225189208984375, -0.20302581787109375, -0.18353271484375, -0.16403961181640625, -0.1445465087890625, -0.12505340576171875, -0.105560302734375, -0.08606719970703125, -0.0665740966796875, -0.04708099365234375, -0.027587890625, -0.00809478759765625, 0.0113983154296875, 0.03089141845703125, 0.050384521484375, 0.06987762451171875, 0.0893707275390625, 0.10886383056640625, 0.12835693359375, 0.14785003662109375, 0.1673431396484375, 0.18683624267578125, 0.206329345703125, 0.22582244873046875, 0.2453155517578125, 0.26480865478515625, 0.2843017578125, 0.30379486083984375, 0.3232879638671875, 0.34278106689453125, 0.362274169921875, 0.38176727294921875, 0.4012603759765625, 0.42075347900390625, 0.44024658203125, 0.45973968505859375, 0.4792327880859375, 0.49872589111328125, 0.518218994140625, 0.5377120971679688, 0.5572052001953125, 0.5766983032226562, 0.59619140625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 6.0, 7.0, 7.0, 13.0, 13.0, 21.0, 34.0, 47.0, 72.0, 83.0, 109.0, 118.0, 109.0, 92.0, 84.0, 61.0, 35.0, 19.0, 26.0, 19.0, 11.0, 7.0, 6.0, 5.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.88671875, -0.8646240234375, -0.842529296875, -0.8204345703125, -0.79833984375, -0.7762451171875, -0.754150390625, -0.7320556640625, -0.7099609375, -0.6878662109375, -0.665771484375, -0.6436767578125, -0.62158203125, -0.5994873046875, -0.577392578125, -0.5552978515625, -0.533203125, -0.5111083984375, -0.489013671875, -0.4669189453125, -0.44482421875, -0.4227294921875, -0.400634765625, -0.3785400390625, -0.3564453125, -0.3343505859375, -0.312255859375, -0.2901611328125, -0.26806640625, -0.2459716796875, -0.223876953125, -0.2017822265625, -0.1796875, -0.1575927734375, -0.135498046875, -0.1134033203125, -0.09130859375, -0.0692138671875, -0.047119140625, -0.0250244140625, -0.0029296875, 0.0191650390625, 0.041259765625, 0.0633544921875, 0.08544921875, 0.1075439453125, 0.129638671875, 0.1517333984375, 0.173828125, 0.1959228515625, 0.218017578125, 0.2401123046875, 0.26220703125, 0.2843017578125, 0.306396484375, 0.3284912109375, 0.3505859375, 0.3726806640625, 0.394775390625, 0.4168701171875, 0.43896484375, 0.4610595703125, 0.483154296875, 0.5052490234375, 0.52734375]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 0.0, 1.0, 5.0, 3.0, 9.0, 24.0, 37.0, 89.0, 144.0, 274.0, 182.0, 113.0, 60.0, 27.0, 16.0, 7.0, 4.0, 2.0, 2.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-16.544530868530273, -16.093183517456055, -15.641834259033203, -15.190485954284668, -14.739137649536133, -14.287790298461914, -13.836441040039062, -13.385093688964844, -12.933745384216309, -12.482397079467773, -12.031048774719238, -11.579700469970703, -11.128352165222168, -10.677003860473633, -10.225656509399414, -9.774308204650879, -9.322959899902344, -8.871611595153809, -8.420263290405273, -7.968914985656738, -7.517567157745361, -7.066218852996826, -6.614870548248291, -6.163522720336914, -5.7121734619140625, -5.260825157165527, -4.809476852416992, -4.358128547668457, -3.90678071975708, -3.455432415008545, -3.0040841102600098, -2.5527360439300537, -2.1013879776000977, -1.650039792060852, -1.1986916065216064, -0.7473433017730713, -0.2959951162338257, 0.15535306930541992, 0.6067013740539551, 1.0580494403839111, 1.5093977451324463, 1.960745930671692, 2.4120941162109375, 2.8634424209594727, 3.314790725708008, 3.766138792037964, 4.217487335205078, 4.668835163116455, 5.12018346786499, 5.571531772613525, 6.0228800773620605, 6.4742279052734375, 6.925576210021973, 7.376924514770508, 7.828272819519043, 8.279621124267578, 8.730969429016113, 9.182317733764648, 9.633666038513184, 10.085014343261719, 10.536362648010254, 10.987710952758789, 11.439058303833008, 11.890406608581543, 12.341754913330078]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 3.0, 4.0, 2.0, 6.0, 3.0, 11.0, 11.0, 10.0, 15.0, 15.0, 13.0, 16.0, 15.0, 23.0, 17.0, 22.0, 34.0, 36.0, 36.0, 45.0, 45.0, 75.0, 69.0, 71.0, 55.0, 37.0, 49.0, 24.0, 33.0, 42.0, 30.0, 13.0, 24.0, 18.0, 20.0, 12.0, 12.0, 8.0, 9.0, 12.0, 8.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.604677677154541, -7.371061325073242, -7.137444496154785, -6.903828144073486, -6.6702117919921875, -6.436595439910889, -6.20297908782959, -5.969362258911133, -5.735745906829834, -5.502129554748535, -5.268512725830078, -5.034896373748779, -4.8012800216674805, -4.567663669586182, -4.334047317504883, -4.100430488586426, -3.866814136505127, -3.633197784423828, -3.39958119392395, -3.1659646034240723, -2.9323482513427734, -2.6987318992614746, -2.4651153087615967, -2.2314987182617188, -1.99788236618042, -1.7642658948898315, -1.5306494235992432, -1.2970329523086548, -1.0634164810180664, -0.829800009727478, -0.5961835384368896, -0.36256706714630127, -0.1289501190185547, 0.10466635227203369, 0.33828282356262207, 0.5718992948532104, 0.8055157661437988, 1.0391322374343872, 1.2727487087249756, 1.506365180015564, 1.7399816513061523, 1.9735981225967407, 2.207214593887329, 2.440831184387207, 2.674447536468506, 2.9080638885498047, 3.1416804790496826, 3.3752970695495605, 3.6089134216308594, 3.842529773712158, 4.076146125793457, 4.309762954711914, 4.543379306793213, 4.776995658874512, 5.010612487792969, 5.244228839874268, 5.477845191955566, 5.711461544036865, 5.945077896118164, 6.178694725036621, 6.41231107711792, 6.645927429199219, 6.879544258117676, 7.113160610198975, 7.346776962280273]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 8.0, 11.0, 14.0, 9.0, 14.0, 23.0, 33.0, 39.0, 64.0, 77.0, 96.0, 125.0, 205.0, 300.0, 437.0, 727.0, 1124.0, 1924.0, 4051.0, 10384.0, 33555.0, 162232.0, 1198844.0, 2320689.0, 371189.0, 59688.0, 15744.0, 6034.0, 2710.0, 1430.0, 785.0, 505.0, 377.0, 240.0, 169.0, 113.0, 100.0, 70.0, 41.0, 30.0, 21.0, 18.0, 9.0, 14.0, 11.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.6845703125, -0.665130615234375, -0.64569091796875, -0.626251220703125, -0.6068115234375, -0.587371826171875, -0.56793212890625, -0.548492431640625, -0.529052734375, -0.509613037109375, -0.49017333984375, -0.470733642578125, -0.4512939453125, -0.431854248046875, -0.41241455078125, -0.392974853515625, -0.37353515625, -0.354095458984375, -0.33465576171875, -0.315216064453125, -0.2957763671875, -0.276336669921875, -0.25689697265625, -0.237457275390625, -0.218017578125, -0.198577880859375, -0.17913818359375, -0.159698486328125, -0.1402587890625, -0.120819091796875, -0.10137939453125, -0.081939697265625, -0.0625, -0.043060302734375, -0.02362060546875, -0.004180908203125, 0.0152587890625, 0.034698486328125, 0.05413818359375, 0.073577880859375, 0.093017578125, 0.112457275390625, 0.13189697265625, 0.151336669921875, 0.1707763671875, 0.190216064453125, 0.20965576171875, 0.229095458984375, 0.24853515625, 0.267974853515625, 0.28741455078125, 0.306854248046875, 0.3262939453125, 0.345733642578125, 0.36517333984375, 0.384613037109375, 0.404052734375, 0.423492431640625, 0.44293212890625, 0.462371826171875, 0.4818115234375, 0.501251220703125, 0.52069091796875, 0.540130615234375, 0.5595703125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 5.0, 4.0, 4.0, 12.0, 13.0, 19.0, 28.0, 39.0, 50.0, 56.0, 66.0, 72.0, 65.0, 86.0, 82.0, 79.0, 71.0, 51.0, 46.0, 37.0, 36.0, 19.0, 23.0, 11.0, 10.0, 11.0, 7.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.912109375, -0.8873443603515625, -0.862579345703125, -0.8378143310546875, -0.81304931640625, -0.7882843017578125, -0.763519287109375, -0.7387542724609375, -0.7139892578125, -0.6892242431640625, -0.664459228515625, -0.6396942138671875, -0.61492919921875, -0.5901641845703125, -0.565399169921875, -0.5406341552734375, -0.515869140625, -0.4911041259765625, -0.466339111328125, -0.4415740966796875, -0.41680908203125, -0.3920440673828125, -0.367279052734375, -0.3425140380859375, -0.3177490234375, -0.2929840087890625, -0.268218994140625, -0.2434539794921875, -0.21868896484375, -0.1939239501953125, -0.169158935546875, -0.1443939208984375, -0.11962890625, -0.0948638916015625, -0.070098876953125, -0.0453338623046875, -0.02056884765625, 0.0041961669921875, 0.028961181640625, 0.0537261962890625, 0.0784912109375, 0.1032562255859375, 0.128021240234375, 0.1527862548828125, 0.17755126953125, 0.2023162841796875, 0.227081298828125, 0.2518463134765625, 0.276611328125, 0.3013763427734375, 0.326141357421875, 0.3509063720703125, 0.37567138671875, 0.4004364013671875, 0.425201416015625, 0.4499664306640625, 0.4747314453125, 0.4994964599609375, 0.524261474609375, 0.5490264892578125, 0.57379150390625, 0.5985565185546875, 0.623321533203125, 0.6480865478515625, 0.6728515625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 4.0, 4.0, 5.0, 16.0, 14.0, 14.0, 22.0, 30.0, 54.0, 68.0, 80.0, 135.0, 231.0, 361.0, 770.0, 1747.0, 4928.0, 25187.0, 674290.0, 3408030.0, 65555.0, 8628.0, 2277.0, 874.0, 396.0, 207.0, 130.0, 70.0, 63.0, 27.0, 18.0, 15.0, 7.0, 8.0, 7.0, 7.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.630859375, -1.5802001953125, -1.529541015625, -1.4788818359375, -1.42822265625, -1.3775634765625, -1.326904296875, -1.2762451171875, -1.2255859375, -1.1749267578125, -1.124267578125, -1.0736083984375, -1.02294921875, -0.9722900390625, -0.921630859375, -0.8709716796875, -0.8203125, -0.7696533203125, -0.718994140625, -0.6683349609375, -0.61767578125, -0.5670166015625, -0.516357421875, -0.4656982421875, -0.4150390625, -0.3643798828125, -0.313720703125, -0.2630615234375, -0.21240234375, -0.1617431640625, -0.111083984375, -0.0604248046875, -0.009765625, 0.0408935546875, 0.091552734375, 0.1422119140625, 0.19287109375, 0.2435302734375, 0.294189453125, 0.3448486328125, 0.3955078125, 0.4461669921875, 0.496826171875, 0.5474853515625, 0.59814453125, 0.6488037109375, 0.699462890625, 0.7501220703125, 0.80078125, 0.8514404296875, 0.902099609375, 0.9527587890625, 1.00341796875, 1.0540771484375, 1.104736328125, 1.1553955078125, 1.2060546875, 1.2567138671875, 1.307373046875, 1.3580322265625, 1.40869140625, 1.4593505859375, 1.510009765625, 1.5606689453125, 1.611328125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 5.0, 8.0, 12.0, 9.0, 30.0, 24.0, 42.0, 78.0, 135.0, 237.0, 460.0, 752.0, 858.0, 606.0, 345.0, 182.0, 98.0, 62.0, 38.0, 22.0, 13.0, 15.0, 11.0, 3.0, 3.0, 4.0, 3.0, 4.0, 3.0, 2.0, 5.0, 0.0, 2.0, 2.0], "bins": [-1.623046875, -1.5846176147460938, -1.5461883544921875, -1.5077590942382812, -1.469329833984375, -1.4309005737304688, -1.3924713134765625, -1.3540420532226562, -1.31561279296875, -1.2771835327148438, -1.2387542724609375, -1.2003250122070312, -1.161895751953125, -1.1234664916992188, -1.0850372314453125, -1.0466079711914062, -1.0081787109375, -0.9697494506835938, -0.9313201904296875, -0.8928909301757812, -0.854461669921875, -0.8160324096679688, -0.7776031494140625, -0.7391738891601562, -0.70074462890625, -0.6623153686523438, -0.6238861083984375, -0.5854568481445312, -0.547027587890625, -0.5085983276367188, -0.4701690673828125, -0.43173980712890625, -0.393310546875, -0.35488128662109375, -0.3164520263671875, -0.27802276611328125, -0.239593505859375, -0.20116424560546875, -0.1627349853515625, -0.12430572509765625, -0.08587646484375, -0.04744720458984375, -0.0090179443359375, 0.02941131591796875, 0.067840576171875, 0.10626983642578125, 0.1446990966796875, 0.18312835693359375, 0.2215576171875, 0.25998687744140625, 0.2984161376953125, 0.33684539794921875, 0.375274658203125, 0.41370391845703125, 0.4521331787109375, 0.49056243896484375, 0.52899169921875, 0.5674209594726562, 0.6058502197265625, 0.6442794799804688, 0.682708740234375, 0.7211380004882812, 0.7595672607421875, 0.7979965209960938, 0.83642578125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 6.0, 9.0, 13.0, 17.0, 54.0, 110.0, 165.0, 173.0, 193.0, 115.0, 70.0, 29.0, 19.0, 12.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.369527816772461, -12.996055603027344, -12.62258243560791, -12.249110221862793, -11.87563705444336, -11.502164840698242, -11.128692626953125, -10.755219459533691, -10.381746292114258, -10.00827407836914, -9.634800910949707, -9.26132869720459, -8.887855529785156, -8.514383316040039, -8.140911102294922, -7.767437934875488, -7.393965721130371, -7.020493030548096, -6.64702033996582, -6.273548126220703, -5.9000749588012695, -5.526602745056152, -5.153130054473877, -4.779657363891602, -4.406184673309326, -4.032711982727051, -3.6592392921447754, -3.285766839981079, -2.9122941493988037, -2.5388214588165283, -2.165349006652832, -1.7918763160705566, -1.4184045791625977, -1.0449318885803223, -0.6714593172073364, -0.2979867458343506, 0.0754859447479248, 0.4489586353302002, 0.8224310874938965, 1.1959037780761719, 1.5693764686584473, 1.9428491592407227, 2.316321849822998, 2.6897943019866943, 3.0632669925689697, 3.436739683151245, 3.8102121353149414, 4.183684825897217, 4.557157516479492, 4.930630207061768, 5.304102897644043, 5.67757511138916, 6.051048278808594, 6.424520492553711, 6.797993183135986, 7.171465873718262, 7.544938564300537, 7.9184112548828125, 8.29188346862793, 8.665356636047363, 9.03882884979248, 9.412302017211914, 9.785774230957031, 10.159246444702148, 10.532719612121582]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 4.0, 0.0, 3.0, 4.0, 2.0, 8.0, 7.0, 10.0, 13.0, 8.0, 22.0, 18.0, 20.0, 18.0, 30.0, 35.0, 39.0, 43.0, 37.0, 49.0, 59.0, 47.0, 52.0, 49.0, 43.0, 39.0, 37.0, 43.0, 40.0, 36.0, 25.0, 25.0, 27.0, 16.0, 14.0, 15.0, 17.0, 8.0, 10.0, 11.0, 8.0, 7.0, 4.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.286811828613281, -5.130206108093262, -4.973600387573242, -4.816994667053223, -4.660388946533203, -4.503783226013184, -4.347177505493164, -4.1905717849731445, -4.033966064453125, -3.8773603439331055, -3.720754623413086, -3.5641489028930664, -3.407543182373047, -3.2509374618530273, -3.094331979751587, -2.9377262592315674, -2.781120777130127, -2.6245150566101074, -2.467909336090088, -2.3113036155700684, -2.154697895050049, -1.9980922937393188, -1.8414866924285889, -1.6848809719085693, -1.5282752513885498, -1.3716695308685303, -1.2150638103485107, -1.0584582090377808, -0.9018524885177612, -0.7452467679977417, -0.5886411070823669, -0.4320354461669922, -0.27542972564697266, -0.11882403492927551, 0.03778165578842163, 0.19438734650611877, 0.3509930372238159, 0.5075987577438354, 0.6642044186592102, 0.820810079574585, 0.9774158000946045, 1.134021520614624, 1.2906272411346436, 1.4472328424453735, 1.603838562965393, 1.7604442834854126, 1.9170498847961426, 2.073655605316162, 2.2302613258361816, 2.386867046356201, 2.5434727668762207, 2.7000784873962402, 2.8566842079162598, 3.0132899284362793, 3.1698954105377197, 3.3265011310577393, 3.483106851577759, 3.6397125720977783, 3.796318292617798, 3.9529240131378174, 4.109529495239258, 4.266135215759277, 4.422740936279297, 4.579346656799316, 4.735952377319336]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 5.0, 6.0, 10.0, 14.0, 16.0, 35.0, 42.0, 58.0, 78.0, 145.0, 234.0, 351.0, 577.0, 892.0, 1608.0, 2834.0, 5284.0, 10934.0, 23501.0, 54898.0, 129465.0, 258400.0, 281321.0, 155530.0, 66614.0, 28608.0, 13009.0, 6476.0, 3163.0, 1803.0, 990.0, 604.0, 359.0, 217.0, 164.0, 91.0, 68.0, 42.0, 40.0, 26.0, 11.0, 10.0, 12.0, 6.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.7626953125, -0.7381820678710938, -0.7136688232421875, -0.6891555786132812, -0.664642333984375, -0.6401290893554688, -0.6156158447265625, -0.5911026000976562, -0.56658935546875, -0.5420761108398438, -0.5175628662109375, -0.49304962158203125, -0.468536376953125, -0.44402313232421875, -0.4195098876953125, -0.39499664306640625, -0.3704833984375, -0.34597015380859375, -0.3214569091796875, -0.29694366455078125, -0.272430419921875, -0.24791717529296875, -0.2234039306640625, -0.19889068603515625, -0.17437744140625, -0.14986419677734375, -0.1253509521484375, -0.10083770751953125, -0.076324462890625, -0.05181121826171875, -0.0272979736328125, -0.00278472900390625, 0.021728515625, 0.04624176025390625, 0.0707550048828125, 0.09526824951171875, 0.119781494140625, 0.14429473876953125, 0.1688079833984375, 0.19332122802734375, 0.21783447265625, 0.24234771728515625, 0.2668609619140625, 0.29137420654296875, 0.315887451171875, 0.34040069580078125, 0.3649139404296875, 0.38942718505859375, 0.4139404296875, 0.43845367431640625, 0.4629669189453125, 0.48748016357421875, 0.511993408203125, 0.5365066528320312, 0.5610198974609375, 0.5855331420898438, 0.61004638671875, 0.6345596313476562, 0.6590728759765625, 0.6835861206054688, 0.708099365234375, 0.7326126098632812, 0.7571258544921875, 0.7816390991210938, 0.80615234375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 2.0, 1.0, 3.0, 8.0, 17.0, 9.0, 14.0, 21.0, 38.0, 45.0, 43.0, 55.0, 59.0, 86.0, 77.0, 77.0, 86.0, 60.0, 77.0, 50.0, 35.0, 34.0, 32.0, 19.0, 19.0, 11.0, 11.0, 7.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.93408203125, -0.9090118408203125, -0.883941650390625, -0.8588714599609375, -0.83380126953125, -0.8087310791015625, -0.783660888671875, -0.7585906982421875, -0.7335205078125, -0.7084503173828125, -0.683380126953125, -0.6583099365234375, -0.63323974609375, -0.6081695556640625, -0.583099365234375, -0.5580291748046875, -0.532958984375, -0.5078887939453125, -0.482818603515625, -0.4577484130859375, -0.43267822265625, -0.4076080322265625, -0.382537841796875, -0.3574676513671875, -0.3323974609375, -0.3073272705078125, -0.282257080078125, -0.2571868896484375, -0.23211669921875, -0.2070465087890625, -0.181976318359375, -0.1569061279296875, -0.1318359375, -0.1067657470703125, -0.081695556640625, -0.0566253662109375, -0.03155517578125, -0.0064849853515625, 0.018585205078125, 0.0436553955078125, 0.0687255859375, 0.0937957763671875, 0.118865966796875, 0.1439361572265625, 0.16900634765625, 0.1940765380859375, 0.219146728515625, 0.2442169189453125, 0.269287109375, 0.2943572998046875, 0.319427490234375, 0.3444976806640625, 0.36956787109375, 0.3946380615234375, 0.419708251953125, 0.4447784423828125, 0.4698486328125, 0.4949188232421875, 0.519989013671875, 0.5450592041015625, 0.57012939453125, 0.5951995849609375, 0.620269775390625, 0.6453399658203125, 0.67041015625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 3.0, 5.0, 13.0, 8.0, 9.0, 12.0, 17.0, 29.0, 38.0, 31.0, 61.0, 78.0, 124.0, 184.0, 305.0, 648.0, 1367.0, 3675.0, 10977.0, 40248.0, 173655.0, 599504.0, 163013.0, 37750.0, 10456.0, 3493.0, 1294.0, 612.0, 344.0, 194.0, 95.0, 77.0, 53.0, 45.0, 35.0, 27.0, 14.0, 15.0, 9.0, 9.0, 11.0, 3.0, 5.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.390625, -1.347808837890625, -1.30499267578125, -1.262176513671875, -1.2193603515625, -1.176544189453125, -1.13372802734375, -1.090911865234375, -1.048095703125, -1.005279541015625, -0.96246337890625, -0.919647216796875, -0.8768310546875, -0.834014892578125, -0.79119873046875, -0.748382568359375, -0.70556640625, -0.662750244140625, -0.61993408203125, -0.577117919921875, -0.5343017578125, -0.491485595703125, -0.44866943359375, -0.405853271484375, -0.363037109375, -0.320220947265625, -0.27740478515625, -0.234588623046875, -0.1917724609375, -0.148956298828125, -0.10614013671875, -0.063323974609375, -0.0205078125, 0.022308349609375, 0.06512451171875, 0.107940673828125, 0.1507568359375, 0.193572998046875, 0.23638916015625, 0.279205322265625, 0.322021484375, 0.364837646484375, 0.40765380859375, 0.450469970703125, 0.4932861328125, 0.536102294921875, 0.57891845703125, 0.621734619140625, 0.66455078125, 0.707366943359375, 0.75018310546875, 0.792999267578125, 0.8358154296875, 0.878631591796875, 0.92144775390625, 0.964263916015625, 1.007080078125, 1.049896240234375, 1.09271240234375, 1.135528564453125, 1.1783447265625, 1.221160888671875, 1.26397705078125, 1.306793212890625, 1.349609375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 3.0, 4.0, 3.0, 9.0, 7.0, 10.0, 10.0, 16.0, 27.0, 26.0, 34.0, 41.0, 43.0, 43.0, 44.0, 52.0, 55.0, 85.0, 67.0, 73.0, 62.0, 47.0, 41.0, 42.0, 25.0, 27.0, 18.0, 29.0, 10.0, 6.0, 8.0, 7.0, 10.0, 4.0, 5.0, 6.0, 2.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.88671875, -2.81036376953125, -2.7340087890625, -2.65765380859375, -2.581298828125, -2.50494384765625, -2.4285888671875, -2.35223388671875, -2.27587890625, -2.19952392578125, -2.1231689453125, -2.04681396484375, -1.970458984375, -1.89410400390625, -1.8177490234375, -1.74139404296875, -1.6650390625, -1.58868408203125, -1.5123291015625, -1.43597412109375, -1.359619140625, -1.28326416015625, -1.2069091796875, -1.13055419921875, -1.05419921875, -0.97784423828125, -0.9014892578125, -0.82513427734375, -0.748779296875, -0.67242431640625, -0.5960693359375, -0.51971435546875, -0.443359375, -0.36700439453125, -0.2906494140625, -0.21429443359375, -0.137939453125, -0.06158447265625, 0.0147705078125, 0.09112548828125, 0.16748046875, 0.24383544921875, 0.3201904296875, 0.39654541015625, 0.472900390625, 0.54925537109375, 0.6256103515625, 0.70196533203125, 0.7783203125, 0.85467529296875, 0.9310302734375, 1.00738525390625, 1.083740234375, 1.16009521484375, 1.2364501953125, 1.31280517578125, 1.38916015625, 1.46551513671875, 1.5418701171875, 1.61822509765625, 1.694580078125, 1.77093505859375, 1.8472900390625, 1.92364501953125, 2.0]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 7.0, 2.0, 9.0, 8.0, 15.0, 25.0, 27.0, 57.0, 102.0, 157.0, 399.0, 892.0, 2477.0, 8181.0, 32605.0, 172537.0, 682252.0, 115642.0, 23456.0, 6344.0, 1901.0, 778.0, 302.0, 167.0, 85.0, 46.0, 25.0, 20.0, 12.0, 4.0, 11.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6943359375, -0.6757659912109375, -0.657196044921875, -0.6386260986328125, -0.62005615234375, -0.6014862060546875, -0.582916259765625, -0.5643463134765625, -0.5457763671875, -0.5272064208984375, -0.508636474609375, -0.4900665283203125, -0.47149658203125, -0.4529266357421875, -0.434356689453125, -0.4157867431640625, -0.397216796875, -0.3786468505859375, -0.360076904296875, -0.3415069580078125, -0.32293701171875, -0.3043670654296875, -0.285797119140625, -0.2672271728515625, -0.2486572265625, -0.2300872802734375, -0.211517333984375, -0.1929473876953125, -0.17437744140625, -0.1558074951171875, -0.137237548828125, -0.1186676025390625, -0.10009765625, -0.0815277099609375, -0.062957763671875, -0.0443878173828125, -0.02581787109375, -0.0072479248046875, 0.011322021484375, 0.0298919677734375, 0.0484619140625, 0.0670318603515625, 0.085601806640625, 0.1041717529296875, 0.12274169921875, 0.1413116455078125, 0.159881591796875, 0.1784515380859375, 0.197021484375, 0.2155914306640625, 0.234161376953125, 0.2527313232421875, 0.27130126953125, 0.2898712158203125, 0.308441162109375, 0.3270111083984375, 0.3455810546875, 0.3641510009765625, 0.382720947265625, 0.4012908935546875, 0.41986083984375, 0.4384307861328125, 0.457000732421875, 0.4755706787109375, 0.494140625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 4.0, 4.0, 4.0, 4.0, 9.0, 13.0, 8.0, 5.0, 20.0, 20.0, 22.0, 36.0, 46.0, 63.0, 90.0, 105.0, 87.0, 93.0, 72.0, 61.0, 39.0, 41.0, 28.0, 25.0, 20.0, 13.0, 5.0, 10.0, 8.0, 8.0, 4.0, 8.0, 8.0, 0.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.0001709461212158203, -0.00016579777002334595, -0.00016064941883087158, -0.00015550106763839722, -0.00015035271644592285, -0.00014520436525344849, -0.00014005601406097412, -0.00013490766286849976, -0.0001297593116760254, -0.00012461096048355103, -0.00011946260929107666, -0.0001143142580986023, -0.00010916590690612793, -0.00010401755571365356, -9.88692045211792e-05, -9.372085332870483e-05, -8.857250213623047e-05, -8.34241509437561e-05, -7.827579975128174e-05, -7.312744855880737e-05, -6.797909736633301e-05, -6.283074617385864e-05, -5.768239498138428e-05, -5.253404378890991e-05, -4.738569259643555e-05, -4.223734140396118e-05, -3.7088990211486816e-05, -3.194063901901245e-05, -2.6792287826538086e-05, -2.164393663406372e-05, -1.6495585441589355e-05, -1.134723424911499e-05, -6.198883056640625e-06, -1.0505318641662598e-06, 4.0978193283081055e-06, 9.24617052078247e-06, 1.4394521713256836e-05, 1.95428729057312e-05, 2.4691224098205566e-05, 2.983957529067993e-05, 3.49879264831543e-05, 4.013627767562866e-05, 4.528462886810303e-05, 5.043298006057739e-05, 5.558133125305176e-05, 6.072968244552612e-05, 6.587803363800049e-05, 7.102638483047485e-05, 7.617473602294922e-05, 8.132308721542358e-05, 8.647143840789795e-05, 9.161978960037231e-05, 9.676814079284668e-05, 0.00010191649198532104, 0.00010706484317779541, 0.00011221319437026978, 0.00011736154556274414, 0.0001225098967552185, 0.00012765824794769287, 0.00013280659914016724, 0.0001379549503326416, 0.00014310330152511597, 0.00014825165271759033, 0.0001534000039100647, 0.00015854835510253906]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 7.0, 9.0, 7.0, 25.0, 39.0, 72.0, 121.0, 399.0, 1332.0, 7417.0, 68262.0, 780280.0, 172290.0, 15141.0, 2233.0, 537.0, 205.0, 74.0, 51.0, 24.0, 18.0, 10.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.1083984375, -1.0818023681640625, -1.055206298828125, -1.0286102294921875, -1.00201416015625, -0.9754180908203125, -0.948822021484375, -0.9222259521484375, -0.8956298828125, -0.8690338134765625, -0.842437744140625, -0.8158416748046875, -0.78924560546875, -0.7626495361328125, -0.736053466796875, -0.7094573974609375, -0.682861328125, -0.6562652587890625, -0.629669189453125, -0.6030731201171875, -0.57647705078125, -0.5498809814453125, -0.523284912109375, -0.4966888427734375, -0.4700927734375, -0.4434967041015625, -0.416900634765625, -0.3903045654296875, -0.36370849609375, -0.3371124267578125, -0.310516357421875, -0.2839202880859375, -0.25732421875, -0.2307281494140625, -0.204132080078125, -0.1775360107421875, -0.15093994140625, -0.1243438720703125, -0.097747802734375, -0.0711517333984375, -0.0445556640625, -0.0179595947265625, 0.008636474609375, 0.0352325439453125, 0.06182861328125, 0.0884246826171875, 0.115020751953125, 0.1416168212890625, 0.168212890625, 0.1948089599609375, 0.221405029296875, 0.2480010986328125, 0.27459716796875, 0.3011932373046875, 0.327789306640625, 0.3543853759765625, 0.3809814453125, 0.4075775146484375, 0.434173583984375, 0.4607696533203125, 0.48736572265625, 0.5139617919921875, 0.540557861328125, 0.5671539306640625, 0.59375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 9.0, 5.0, 7.0, 21.0, 28.0, 51.0, 72.0, 82.0, 145.0, 128.0, 112.0, 116.0, 77.0, 51.0, 41.0, 25.0, 16.0, 7.0, 7.0, 4.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.2216796875, -1.1960372924804688, -1.1703948974609375, -1.1447525024414062, -1.119110107421875, -1.0934677124023438, -1.0678253173828125, -1.0421829223632812, -1.01654052734375, -0.9908981323242188, -0.9652557373046875, -0.9396133422851562, -0.913970947265625, -0.8883285522460938, -0.8626861572265625, -0.8370437622070312, -0.8114013671875, -0.7857589721679688, -0.7601165771484375, -0.7344741821289062, -0.708831787109375, -0.6831893920898438, -0.6575469970703125, -0.6319046020507812, -0.60626220703125, -0.5806198120117188, -0.5549774169921875, -0.5293350219726562, -0.503692626953125, -0.47805023193359375, -0.4524078369140625, -0.42676544189453125, -0.401123046875, -0.37548065185546875, -0.3498382568359375, -0.32419586181640625, -0.298553466796875, -0.27291107177734375, -0.2472686767578125, -0.22162628173828125, -0.19598388671875, -0.17034149169921875, -0.1446990966796875, -0.11905670166015625, -0.093414306640625, -0.06777191162109375, -0.0421295166015625, -0.01648712158203125, 0.0091552734375, 0.03479766845703125, 0.0604400634765625, 0.08608245849609375, 0.111724853515625, 0.13736724853515625, 0.1630096435546875, 0.18865203857421875, 0.21429443359375, 0.23993682861328125, 0.2655792236328125, 0.29122161865234375, 0.316864013671875, 0.34250640869140625, 0.3681488037109375, 0.39379119873046875, 0.41943359375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 7.0, 4.0, 6.0, 20.0, 23.0, 71.0, 138.0, 241.0, 277.0, 117.0, 56.0, 29.0, 9.0, 9.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.208133697509766, -26.675291061401367, -26.14244842529297, -25.60960578918457, -25.076763153076172, -24.54391860961914, -24.011077880859375, -23.478233337402344, -22.945390701293945, -22.412548065185547, -21.87970542907715, -21.34686279296875, -20.81402015686035, -20.281177520751953, -19.748332977294922, -19.215490341186523, -18.682647705078125, -18.149805068969727, -17.616962432861328, -17.08411979675293, -16.55127716064453, -16.0184326171875, -15.485590934753418, -14.95274829864502, -14.419906616210938, -13.887063980102539, -13.35422134399414, -12.821378707885742, -12.288535118103027, -11.755692481994629, -11.22284984588623, -10.690007209777832, -10.157164573669434, -9.624321937561035, -9.091479301452637, -8.558635711669922, -8.025793075561523, -7.492950439453125, -6.960107803344727, -6.427265167236328, -5.8944220542907715, -5.361579418182373, -4.828736305236816, -4.295893669128418, -3.7630507946014404, -3.230207920074463, -2.6973652839660645, -2.164522409439087, -1.6316795349121094, -1.0988366603851318, -0.5659939050674438, -0.03315114974975586, 0.4996917247772217, 1.0325345993041992, 1.5653772354125977, 2.098220109939575, 2.6310629844665527, 3.1639058589935303, 3.696748733520508, 4.229591369628906, 4.762434005737305, 5.295277118682861, 5.82811975479126, 6.360962867736816, 6.893805503845215]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 4.0, 4.0, 3.0, 8.0, 9.0, 9.0, 14.0, 16.0, 14.0, 15.0, 20.0, 17.0, 25.0, 37.0, 30.0, 38.0, 33.0, 41.0, 50.0, 59.0, 84.0, 78.0, 60.0, 39.0, 33.0, 30.0, 43.0, 28.0, 25.0, 26.0, 17.0, 17.0, 11.0, 8.0, 10.0, 8.0, 10.0, 7.0, 3.0, 7.0, 8.0, 4.0, 4.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.202334880828857, -6.960450172424316, -6.718564987182617, -6.476679801940918, -6.234795093536377, -5.992910385131836, -5.751025199890137, -5.5091400146484375, -5.2672553062438965, -5.0253705978393555, -4.783485412597656, -4.541600227355957, -4.299715518951416, -4.057830810546875, -3.815945625305176, -3.5740606784820557, -3.3321757316589355, -3.0902907848358154, -2.8484058380126953, -2.606520891189575, -2.364635944366455, -2.122750997543335, -1.8808660507202148, -1.6389811038970947, -1.3970961570739746, -1.1552112102508545, -0.9133262634277344, -0.6714413166046143, -0.42955636978149414, -0.18767142295837402, 0.054213523864746094, 0.2960984706878662, 0.5379829406738281, 0.7798678874969482, 1.0217528343200684, 1.2636377811431885, 1.5055227279663086, 1.7474076747894287, 1.9892926216125488, 2.231177568435669, 2.473062515258789, 2.714947462081909, 2.9568324089050293, 3.1987173557281494, 3.4406023025512695, 3.6824872493743896, 3.9243721961975098, 4.166256904602051, 4.40814208984375, 4.650027275085449, 4.89191198348999, 5.133796691894531, 5.3756818771362305, 5.61756706237793, 5.859451770782471, 6.101336479187012, 6.343221664428711, 6.58510684967041, 6.826991558074951, 7.068876266479492, 7.310761451721191, 7.552646636962891, 7.794531345367432, 8.036416053771973, 8.278301239013672]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 6.0, 9.0, 11.0, 8.0, 21.0, 21.0, 19.0, 31.0, 37.0, 55.0, 74.0, 134.0, 167.0, 252.0, 387.0, 657.0, 1172.0, 2405.0, 7155.0, 34762.0, 306157.0, 2744876.0, 989648.0, 84770.0, 13414.0, 4044.0, 1642.0, 827.0, 494.0, 321.0, 201.0, 147.0, 98.0, 50.0, 45.0, 32.0, 19.0, 23.0, 17.0, 15.0, 13.0, 13.0, 8.0, 5.0, 5.0, 2.0, 1.0, 4.0, 2.0, 2.0, 3.0], "bins": [-0.89892578125, -0.8730392456054688, -0.8471527099609375, -0.8212661743164062, -0.795379638671875, -0.7694931030273438, -0.7436065673828125, -0.7177200317382812, -0.69183349609375, -0.6659469604492188, -0.6400604248046875, -0.6141738891601562, -0.588287353515625, -0.5624008178710938, -0.5365142822265625, -0.5106277465820312, -0.4847412109375, -0.45885467529296875, -0.4329681396484375, -0.40708160400390625, -0.381195068359375, -0.35530853271484375, -0.3294219970703125, -0.30353546142578125, -0.27764892578125, -0.25176239013671875, -0.2258758544921875, -0.19998931884765625, -0.174102783203125, -0.14821624755859375, -0.1223297119140625, -0.09644317626953125, -0.070556640625, -0.04467010498046875, -0.0187835693359375, 0.00710296630859375, 0.032989501953125, 0.05887603759765625, 0.0847625732421875, 0.11064910888671875, 0.13653564453125, 0.16242218017578125, 0.1883087158203125, 0.21419525146484375, 0.240081787109375, 0.26596832275390625, 0.2918548583984375, 0.31774139404296875, 0.3436279296875, 0.36951446533203125, 0.3954010009765625, 0.42128753662109375, 0.447174072265625, 0.47306060791015625, 0.4989471435546875, 0.5248336791992188, 0.55072021484375, 0.5766067504882812, 0.6024932861328125, 0.6283798217773438, 0.654266357421875, 0.6801528930664062, 0.7060394287109375, 0.7319259643554688, 0.7578125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 12.0, 6.0, 17.0, 11.0, 16.0, 33.0, 30.0, 50.0, 46.0, 62.0, 66.0, 74.0, 86.0, 81.0, 61.0, 72.0, 61.0, 52.0, 43.0, 28.0, 31.0, 18.0, 19.0, 10.0, 3.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.93994140625, -0.914459228515625, -0.88897705078125, -0.863494873046875, -0.8380126953125, -0.812530517578125, -0.78704833984375, -0.761566162109375, -0.736083984375, -0.710601806640625, -0.68511962890625, -0.659637451171875, -0.6341552734375, -0.608673095703125, -0.58319091796875, -0.557708740234375, -0.5322265625, -0.506744384765625, -0.48126220703125, -0.455780029296875, -0.4302978515625, -0.404815673828125, -0.37933349609375, -0.353851318359375, -0.328369140625, -0.302886962890625, -0.27740478515625, -0.251922607421875, -0.2264404296875, -0.200958251953125, -0.17547607421875, -0.149993896484375, -0.12451171875, -0.099029541015625, -0.07354736328125, -0.048065185546875, -0.0225830078125, 0.002899169921875, 0.02838134765625, 0.053863525390625, 0.079345703125, 0.104827880859375, 0.13031005859375, 0.155792236328125, 0.1812744140625, 0.206756591796875, 0.23223876953125, 0.257720947265625, 0.283203125, 0.308685302734375, 0.33416748046875, 0.359649658203125, 0.3851318359375, 0.410614013671875, 0.43609619140625, 0.461578369140625, 0.487060546875, 0.512542724609375, 0.53802490234375, 0.563507080078125, 0.5889892578125, 0.614471435546875, 0.63995361328125, 0.665435791015625, 0.69091796875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 7.0, 14.0, 26.0, 37.0, 71.0, 162.0, 335.0, 712.0, 2044.0, 11246.0, 812771.0, 3342145.0, 20659.0, 2597.0, 807.0, 306.0, 151.0, 100.0, 54.0, 13.0, 11.0, 5.0, 3.0, 1.0, 4.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.443359375, -2.367279052734375, -2.29119873046875, -2.215118408203125, -2.1390380859375, -2.062957763671875, -1.98687744140625, -1.910797119140625, -1.834716796875, -1.758636474609375, -1.68255615234375, -1.606475830078125, -1.5303955078125, -1.454315185546875, -1.37823486328125, -1.302154541015625, -1.22607421875, -1.149993896484375, -1.07391357421875, -0.997833251953125, -0.9217529296875, -0.845672607421875, -0.76959228515625, -0.693511962890625, -0.617431640625, -0.541351318359375, -0.46527099609375, -0.389190673828125, -0.3131103515625, -0.237030029296875, -0.16094970703125, -0.084869384765625, -0.0087890625, 0.067291259765625, 0.14337158203125, 0.219451904296875, 0.2955322265625, 0.371612548828125, 0.44769287109375, 0.523773193359375, 0.599853515625, 0.675933837890625, 0.75201416015625, 0.828094482421875, 0.9041748046875, 0.980255126953125, 1.05633544921875, 1.132415771484375, 1.20849609375, 1.284576416015625, 1.36065673828125, 1.436737060546875, 1.5128173828125, 1.588897705078125, 1.66497802734375, 1.741058349609375, 1.817138671875, 1.893218994140625, 1.96929931640625, 2.045379638671875, 2.1214599609375, 2.197540283203125, 2.27362060546875, 2.349700927734375, 2.42578125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 5.0, 6.0, 10.0, 11.0, 16.0, 24.0, 30.0, 59.0, 107.0, 219.0, 444.0, 734.0, 932.0, 664.0, 366.0, 169.0, 111.0, 63.0, 41.0, 19.0, 16.0, 8.0, 7.0, 8.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5146484375, -1.470611572265625, -1.42657470703125, -1.382537841796875, -1.3385009765625, -1.294464111328125, -1.25042724609375, -1.206390380859375, -1.162353515625, -1.118316650390625, -1.07427978515625, -1.030242919921875, -0.9862060546875, -0.942169189453125, -0.89813232421875, -0.854095458984375, -0.81005859375, -0.766021728515625, -0.72198486328125, -0.677947998046875, -0.6339111328125, -0.589874267578125, -0.54583740234375, -0.501800537109375, -0.457763671875, -0.413726806640625, -0.36968994140625, -0.325653076171875, -0.2816162109375, -0.237579345703125, -0.19354248046875, -0.149505615234375, -0.10546875, -0.061431884765625, -0.01739501953125, 0.026641845703125, 0.0706787109375, 0.114715576171875, 0.15875244140625, 0.202789306640625, 0.246826171875, 0.290863037109375, 0.33489990234375, 0.378936767578125, 0.4229736328125, 0.467010498046875, 0.51104736328125, 0.555084228515625, 0.59912109375, 0.643157958984375, 0.68719482421875, 0.731231689453125, 0.7752685546875, 0.819305419921875, 0.86334228515625, 0.907379150390625, 0.951416015625, 0.995452880859375, 1.03948974609375, 1.083526611328125, 1.1275634765625, 1.171600341796875, 1.21563720703125, 1.259674072265625, 1.3037109375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 7.0, 10.0, 35.0, 53.0, 88.0, 148.0, 160.0, 163.0, 114.0, 92.0, 48.0, 32.0, 15.0, 13.0, 9.0, 5.0, 5.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.978214263916016, -5.6743268966674805, -5.370439529418945, -5.06655216217041, -4.762664794921875, -4.45877742767334, -4.154890537261963, -3.8510031700134277, -3.5471158027648926, -3.2432284355163574, -2.9393410682678223, -2.635453939437866, -2.331566572189331, -2.027679204940796, -1.7237919569015503, -1.4199047088623047, -1.1160173416137695, -0.8121300339698792, -0.5082427263259888, -0.2043554186820984, 0.09953188896179199, 0.40341925621032715, 0.7073065042495728, 1.0111937522888184, 1.3150811195373535, 1.6189684867858887, 1.9228557348251343, 2.22674298286438, 2.530630350112915, 2.83451771736145, 3.1384048461914062, 3.4422922134399414, 3.7461795806884766, 4.050066947937012, 4.353954315185547, 4.657841682434082, 4.961729049682617, 5.265616416931152, 5.569503307342529, 5.8733906745910645, 6.1772780418396, 6.481165409088135, 6.78505277633667, 7.088940143585205, 7.392827033996582, 7.696714401245117, 8.000601768493652, 8.304489135742188, 8.608376502990723, 8.912263870239258, 9.216151237487793, 9.520038604736328, 9.823925971984863, 10.127813339233398, 10.431700706481934, 10.735588073730469, 11.039474487304688, 11.343361854553223, 11.647249221801758, 11.951136589050293, 12.255023956298828, 12.558911323547363, 12.862798690795898, 13.166685104370117, 13.470573425292969]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 4.0, 3.0, 7.0, 5.0, 14.0, 12.0, 13.0, 20.0, 18.0, 22.0, 19.0, 39.0, 31.0, 31.0, 41.0, 35.0, 50.0, 48.0, 41.0, 61.0, 40.0, 45.0, 56.0, 37.0, 28.0, 42.0, 41.0, 21.0, 23.0, 27.0, 22.0, 18.0, 22.0, 10.0, 14.0, 9.0, 9.0, 8.0, 3.0, 3.0, 1.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.281271457672119, -4.141806602478027, -4.002341270446777, -3.8628764152526855, -3.7234115600585938, -3.583946704864502, -3.444481611251831, -3.30501651763916, -3.1655516624450684, -3.0260868072509766, -2.8866217136383057, -2.7471566200256348, -2.607691764831543, -2.468226909637451, -2.3287618160247803, -2.1892967224121094, -2.0498318672180176, -1.9103668928146362, -1.7709019184112549, -1.6314369440078735, -1.4919719696044922, -1.3525069952011108, -1.2130420207977295, -1.0735770463943481, -0.9341120719909668, -0.7946470975875854, -0.6551821231842041, -0.5157171487808228, -0.3762521743774414, -0.23678719997406006, -0.09732222557067871, 0.04214274883270264, 0.1816082000732422, 0.32107317447662354, 0.4605381488800049, 0.6000031232833862, 0.7394680976867676, 0.8789330720901489, 1.0183980464935303, 1.1578630208969116, 1.297327995300293, 1.4367929697036743, 1.5762579441070557, 1.715722918510437, 1.8551878929138184, 1.9946528673171997, 2.134117841720581, 2.273582935333252, 2.4130477905273438, 2.5525126457214355, 2.6919777393341064, 2.8314428329467773, 2.970907688140869, 3.110372543334961, 3.249837636947632, 3.3893027305603027, 3.5287675857543945, 3.6682324409484863, 3.8076975345611572, 3.947162628173828, 4.08662748336792, 4.226092338562012, 4.365557670593262, 4.5050225257873535, 4.644487380981445]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 9.0, 4.0, 14.0, 15.0, 20.0, 27.0, 38.0, 44.0, 68.0, 94.0, 123.0, 176.0, 286.0, 537.0, 876.0, 1542.0, 2897.0, 5504.0, 11310.0, 24102.0, 53421.0, 120178.0, 247896.0, 287459.0, 159706.0, 70853.0, 31478.0, 14529.0, 7050.0, 3534.0, 1943.0, 1064.0, 611.0, 385.0, 248.0, 149.0, 109.0, 75.0, 62.0, 40.0, 11.0, 22.0, 15.0, 9.0, 8.0, 8.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 4.0], "bins": [-0.72412109375, -0.7022933959960938, -0.6804656982421875, -0.6586380004882812, -0.636810302734375, -0.6149826049804688, -0.5931549072265625, -0.5713272094726562, -0.54949951171875, -0.5276718139648438, -0.5058441162109375, -0.48401641845703125, -0.462188720703125, -0.44036102294921875, -0.4185333251953125, -0.39670562744140625, -0.3748779296875, -0.35305023193359375, -0.3312225341796875, -0.30939483642578125, -0.287567138671875, -0.26573944091796875, -0.2439117431640625, -0.22208404541015625, -0.20025634765625, -0.17842864990234375, -0.1566009521484375, -0.13477325439453125, -0.112945556640625, -0.09111785888671875, -0.0692901611328125, -0.04746246337890625, -0.025634765625, -0.00380706787109375, 0.0180206298828125, 0.03984832763671875, 0.061676025390625, 0.08350372314453125, 0.1053314208984375, 0.12715911865234375, 0.14898681640625, 0.17081451416015625, 0.1926422119140625, 0.21446990966796875, 0.236297607421875, 0.25812530517578125, 0.2799530029296875, 0.30178070068359375, 0.3236083984375, 0.34543609619140625, 0.3672637939453125, 0.38909149169921875, 0.410919189453125, 0.43274688720703125, 0.4545745849609375, 0.47640228271484375, 0.49822998046875, 0.5200576782226562, 0.5418853759765625, 0.5637130737304688, 0.585540771484375, 0.6073684692382812, 0.6291961669921875, 0.6510238647460938, 0.6728515625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 3.0, 3.0, 8.0, 5.0, 8.0, 12.0, 11.0, 25.0, 26.0, 36.0, 31.0, 48.0, 70.0, 57.0, 79.0, 85.0, 56.0, 71.0, 72.0, 63.0, 49.0, 59.0, 32.0, 33.0, 16.0, 13.0, 9.0, 12.0, 6.0, 5.0, 4.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.95556640625, -0.9297943115234375, -0.904022216796875, -0.8782501220703125, -0.85247802734375, -0.8267059326171875, -0.800933837890625, -0.7751617431640625, -0.7493896484375, -0.7236175537109375, -0.697845458984375, -0.6720733642578125, -0.64630126953125, -0.6205291748046875, -0.594757080078125, -0.5689849853515625, -0.543212890625, -0.5174407958984375, -0.491668701171875, -0.4658966064453125, -0.44012451171875, -0.4143524169921875, -0.388580322265625, -0.3628082275390625, -0.3370361328125, -0.3112640380859375, -0.285491943359375, -0.2597198486328125, -0.23394775390625, -0.2081756591796875, -0.182403564453125, -0.1566314697265625, -0.130859375, -0.1050872802734375, -0.079315185546875, -0.0535430908203125, -0.02777099609375, -0.0019989013671875, 0.023773193359375, 0.0495452880859375, 0.0753173828125, 0.1010894775390625, 0.126861572265625, 0.1526336669921875, 0.17840576171875, 0.2041778564453125, 0.229949951171875, 0.2557220458984375, 0.281494140625, 0.3072662353515625, 0.333038330078125, 0.3588104248046875, 0.38458251953125, 0.4103546142578125, 0.436126708984375, 0.4618988037109375, 0.4876708984375, 0.5134429931640625, 0.539215087890625, 0.5649871826171875, 0.59075927734375, 0.6165313720703125, 0.642303466796875, 0.6680755615234375, 0.69384765625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 6.0, 8.0, 3.0, 16.0, 19.0, 48.0, 60.0, 85.0, 162.0, 221.0, 421.0, 779.0, 1727.0, 5233.0, 24527.0, 169281.0, 720611.0, 102326.0, 16216.0, 3839.0, 1332.0, 639.0, 388.0, 217.0, 132.0, 89.0, 52.0, 30.0, 21.0, 21.0, 10.0, 7.0, 10.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.572265625, -1.5205078125, -1.46875, -1.4169921875, -1.365234375, -1.3134765625, -1.26171875, -1.2099609375, -1.158203125, -1.1064453125, -1.0546875, -1.0029296875, -0.951171875, -0.8994140625, -0.84765625, -0.7958984375, -0.744140625, -0.6923828125, -0.640625, -0.5888671875, -0.537109375, -0.4853515625, -0.43359375, -0.3818359375, -0.330078125, -0.2783203125, -0.2265625, -0.1748046875, -0.123046875, -0.0712890625, -0.01953125, 0.0322265625, 0.083984375, 0.1357421875, 0.1875, 0.2392578125, 0.291015625, 0.3427734375, 0.39453125, 0.4462890625, 0.498046875, 0.5498046875, 0.6015625, 0.6533203125, 0.705078125, 0.7568359375, 0.80859375, 0.8603515625, 0.912109375, 0.9638671875, 1.015625, 1.0673828125, 1.119140625, 1.1708984375, 1.22265625, 1.2744140625, 1.326171875, 1.3779296875, 1.4296875, 1.4814453125, 1.533203125, 1.5849609375, 1.63671875, 1.6884765625, 1.740234375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 6.0, 14.0, 17.0, 17.0, 24.0, 33.0, 42.0, 42.0, 66.0, 71.0, 67.0, 66.0, 77.0, 72.0, 73.0, 67.0, 53.0, 48.0, 26.0, 27.0, 29.0, 22.0, 10.0, 12.0, 9.0, 3.0, 6.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.314453125, -2.21923828125, -2.1240234375, -2.02880859375, -1.93359375, -1.83837890625, -1.7431640625, -1.64794921875, -1.552734375, -1.45751953125, -1.3623046875, -1.26708984375, -1.171875, -1.07666015625, -0.9814453125, -0.88623046875, -0.791015625, -0.69580078125, -0.6005859375, -0.50537109375, -0.41015625, -0.31494140625, -0.2197265625, -0.12451171875, -0.029296875, 0.06591796875, 0.1611328125, 0.25634765625, 0.3515625, 0.44677734375, 0.5419921875, 0.63720703125, 0.732421875, 0.82763671875, 0.9228515625, 1.01806640625, 1.11328125, 1.20849609375, 1.3037109375, 1.39892578125, 1.494140625, 1.58935546875, 1.6845703125, 1.77978515625, 1.875, 1.97021484375, 2.0654296875, 2.16064453125, 2.255859375, 2.35107421875, 2.4462890625, 2.54150390625, 2.63671875, 2.73193359375, 2.8271484375, 2.92236328125, 3.017578125, 3.11279296875, 3.2080078125, 3.30322265625, 3.3984375, 3.49365234375, 3.5888671875, 3.68408203125, 3.779296875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 8.0, 11.0, 13.0, 8.0, 12.0, 23.0, 26.0, 49.0, 53.0, 92.0, 127.0, 233.0, 376.0, 592.0, 1124.0, 2331.0, 5333.0, 13626.0, 39447.0, 131230.0, 606508.0, 169447.0, 48942.0, 16620.0, 6423.0, 2784.0, 1369.0, 645.0, 414.0, 220.0, 151.0, 96.0, 63.0, 43.0, 29.0, 21.0, 15.0, 20.0, 8.0, 7.0, 5.0, 5.0, 6.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.319091796875, -0.30866241455078125, -0.2982330322265625, -0.28780364990234375, -0.277374267578125, -0.26694488525390625, -0.2565155029296875, -0.24608612060546875, -0.23565673828125, -0.22522735595703125, -0.2147979736328125, -0.20436859130859375, -0.193939208984375, -0.18350982666015625, -0.1730804443359375, -0.16265106201171875, -0.1522216796875, -0.14179229736328125, -0.1313629150390625, -0.12093353271484375, -0.110504150390625, -0.10007476806640625, -0.0896453857421875, -0.07921600341796875, -0.06878662109375, -0.05835723876953125, -0.0479278564453125, -0.03749847412109375, -0.027069091796875, -0.01663970947265625, -0.0062103271484375, 0.00421905517578125, 0.0146484375, 0.02507781982421875, 0.0355072021484375, 0.04593658447265625, 0.056365966796875, 0.06679534912109375, 0.0772247314453125, 0.08765411376953125, 0.09808349609375, 0.10851287841796875, 0.1189422607421875, 0.12937164306640625, 0.139801025390625, 0.15023040771484375, 0.1606597900390625, 0.17108917236328125, 0.1815185546875, 0.19194793701171875, 0.2023773193359375, 0.21280670166015625, 0.223236083984375, 0.23366546630859375, 0.2440948486328125, 0.25452423095703125, 0.26495361328125, 0.27538299560546875, 0.2858123779296875, 0.29624176025390625, 0.306671142578125, 0.31710052490234375, 0.3275299072265625, 0.33795928955078125, 0.348388671875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 6.0, 5.0, 4.0, 6.0, 6.0, 15.0, 14.0, 19.0, 38.0, 28.0, 49.0, 56.0, 87.0, 109.0, 128.0, 116.0, 71.0, 47.0, 50.0, 26.0, 33.0, 23.0, 11.0, 19.0, 9.0, 9.0, 6.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.00016832351684570312, -0.00016340985894203186, -0.0001584962010383606, -0.00015358254313468933, -0.00014866888523101807, -0.0001437552273273468, -0.00013884156942367554, -0.00013392791152000427, -0.000129014253616333, -0.00012410059571266174, -0.00011918693780899048, -0.00011427327990531921, -0.00010935962200164795, -0.00010444596409797668, -9.953230619430542e-05, -9.461864829063416e-05, -8.970499038696289e-05, -8.479133248329163e-05, -7.987767457962036e-05, -7.49640166759491e-05, -7.005035877227783e-05, -6.513670086860657e-05, -6.02230429649353e-05, -5.530938506126404e-05, -5.0395727157592773e-05, -4.548206925392151e-05, -4.0568411350250244e-05, -3.565475344657898e-05, -3.0741095542907715e-05, -2.582743763923645e-05, -2.0913779735565186e-05, -1.600012183189392e-05, -1.1086463928222656e-05, -6.172806024551392e-06, -1.259148120880127e-06, 3.6545097827911377e-06, 8.568167686462402e-06, 1.3481825590133667e-05, 1.839548349380493e-05, 2.3309141397476196e-05, 2.822279930114746e-05, 3.3136457204818726e-05, 3.805011510848999e-05, 4.2963773012161255e-05, 4.787743091583252e-05, 5.2791088819503784e-05, 5.770474672317505e-05, 6.261840462684631e-05, 6.753206253051758e-05, 7.244572043418884e-05, 7.735937833786011e-05, 8.227303624153137e-05, 8.718669414520264e-05, 9.21003520488739e-05, 9.701400995254517e-05, 0.00010192766785621643, 0.0001068413257598877, 0.00011175498366355896, 0.00011666864156723022, 0.00012158229947090149, 0.00012649595737457275, 0.00013140961527824402, 0.00013632327318191528, 0.00014123693108558655, 0.0001461505889892578]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 7.0, 6.0, 7.0, 13.0, 8.0, 34.0, 40.0, 83.0, 97.0, 225.0, 468.0, 964.0, 2544.0, 8834.0, 36810.0, 220415.0, 674906.0, 79503.0, 16410.0, 4376.0, 1519.0, 600.0, 287.0, 162.0, 91.0, 58.0, 35.0, 23.0, 10.0, 4.0, 6.0, 8.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.40283203125, -0.38747406005859375, -0.3721160888671875, -0.35675811767578125, -0.341400146484375, -0.32604217529296875, -0.3106842041015625, -0.29532623291015625, -0.27996826171875, -0.26461029052734375, -0.2492523193359375, -0.23389434814453125, -0.218536376953125, -0.20317840576171875, -0.1878204345703125, -0.17246246337890625, -0.1571044921875, -0.14174652099609375, -0.1263885498046875, -0.11103057861328125, -0.095672607421875, -0.08031463623046875, -0.0649566650390625, -0.04959869384765625, -0.03424072265625, -0.01888275146484375, -0.0035247802734375, 0.01183319091796875, 0.027191162109375, 0.04254913330078125, 0.0579071044921875, 0.07326507568359375, 0.088623046875, 0.10398101806640625, 0.1193389892578125, 0.13469696044921875, 0.150054931640625, 0.16541290283203125, 0.1807708740234375, 0.19612884521484375, 0.21148681640625, 0.22684478759765625, 0.2422027587890625, 0.25756072998046875, 0.272918701171875, 0.28827667236328125, 0.3036346435546875, 0.31899261474609375, 0.3343505859375, 0.34970855712890625, 0.3650665283203125, 0.38042449951171875, 0.395782470703125, 0.41114044189453125, 0.4264984130859375, 0.44185638427734375, 0.45721435546875, 0.47257232666015625, 0.4879302978515625, 0.5032882690429688, 0.518646240234375, 0.5340042114257812, 0.5493621826171875, 0.5647201538085938, 0.580078125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 6.0, 3.0, 8.0, 11.0, 15.0, 24.0, 31.0, 23.0, 45.0, 56.0, 96.0, 126.0, 118.0, 124.0, 88.0, 67.0, 52.0, 37.0, 21.0, 21.0, 9.0, 14.0, 2.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5546875, -0.5359420776367188, -0.5171966552734375, -0.49845123291015625, -0.479705810546875, -0.46096038818359375, -0.4422149658203125, -0.42346954345703125, -0.40472412109375, -0.38597869873046875, -0.3672332763671875, -0.34848785400390625, -0.329742431640625, -0.31099700927734375, -0.2922515869140625, -0.27350616455078125, -0.2547607421875, -0.23601531982421875, -0.2172698974609375, -0.19852447509765625, -0.179779052734375, -0.16103363037109375, -0.1422882080078125, -0.12354278564453125, -0.10479736328125, -0.08605194091796875, -0.0673065185546875, -0.04856109619140625, -0.029815673828125, -0.01107025146484375, 0.0076751708984375, 0.02642059326171875, 0.045166015625, 0.06391143798828125, 0.0826568603515625, 0.10140228271484375, 0.120147705078125, 0.13889312744140625, 0.1576385498046875, 0.17638397216796875, 0.19512939453125, 0.21387481689453125, 0.2326202392578125, 0.25136566162109375, 0.270111083984375, 0.28885650634765625, 0.3076019287109375, 0.32634735107421875, 0.3450927734375, 0.36383819580078125, 0.3825836181640625, 0.40132904052734375, 0.420074462890625, 0.43881988525390625, 0.4575653076171875, 0.47631072998046875, 0.49505615234375, 0.5138015747070312, 0.5325469970703125, 0.5512924194335938, 0.570037841796875, 0.5887832641601562, 0.6075286865234375, 0.6262741088867188, 0.64501953125]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 4.0, 6.0, 11.0, 17.0, 29.0, 89.0, 156.0, 374.0, 174.0, 85.0, 35.0, 16.0, 5.0, 2.0, 0.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.33283519744873, -14.846481323242188, -14.360127449035645, -13.873773574829102, -13.387419700622559, -12.901065826416016, -12.414711952209473, -11.92835807800293, -11.442004203796387, -10.955650329589844, -10.4692964553833, -9.982942581176758, -9.496588706970215, -9.010234832763672, -8.523880958557129, -8.037527084350586, -7.551173210144043, -7.0648193359375, -6.578465461730957, -6.092111587524414, -5.605757713317871, -5.119403839111328, -4.633049964904785, -4.146696090698242, -3.660342216491699, -3.1739883422851562, -2.6876344680786133, -2.2012805938720703, -1.7149267196655273, -1.2285728454589844, -0.7422189712524414, -0.25586509704589844, 0.23048877716064453, 0.7168426513671875, 1.2031965255737305, 1.6895503997802734, 2.1759042739868164, 2.6622581481933594, 3.1486120223999023, 3.6349658966064453, 4.121319770812988, 4.607673645019531, 5.094027519226074, 5.580381393432617, 6.06673526763916, 6.553089141845703, 7.039443016052246, 7.525796890258789, 8.012150764465332, 8.498504638671875, 8.984858512878418, 9.471212387084961, 9.957566261291504, 10.443920135498047, 10.93027400970459, 11.416627883911133, 11.902981758117676, 12.389335632324219, 12.875689506530762, 13.362043380737305, 13.848397254943848, 14.33475112915039, 14.821105003356934, 15.307458877563477, 15.79381275177002]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 6.0, 6.0, 7.0, 8.0, 8.0, 13.0, 7.0, 15.0, 18.0, 24.0, 25.0, 27.0, 30.0, 39.0, 43.0, 40.0, 92.0, 138.0, 105.0, 55.0, 48.0, 57.0, 26.0, 31.0, 25.0, 16.0, 23.0, 11.0, 11.0, 10.0, 10.0, 9.0, 9.0, 5.0, 4.0, 2.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.881823539733887, -8.582170486450195, -8.282517433166504, -7.982863903045654, -7.683210849761963, -7.383557319641113, -7.083904266357422, -6.7842512130737305, -6.484598159790039, -6.184945106506348, -5.885291576385498, -5.585638523101807, -5.285985469818115, -4.986331939697266, -4.686678886413574, -4.387025833129883, -4.087372303009033, -3.7877190113067627, -3.4880659580230713, -3.188412666320801, -2.8887596130371094, -2.589106321334839, -2.2894530296325684, -1.989799976348877, -1.6901466846466064, -1.3904935121536255, -1.0908403396606445, -0.791187047958374, -0.49153387546539307, -0.1918807029724121, 0.1077725887298584, 0.4074256420135498, 0.7070789337158203, 1.0067321062088013, 1.3063852787017822, 1.6060385704040527, 1.9056917428970337, 2.2053449153900146, 2.504998207092285, 2.8046512603759766, 3.104304552078247, 3.4039578437805176, 3.703610897064209, 4.003264427185059, 4.30291748046875, 4.602570533752441, 4.902223587036133, 5.201876640319824, 5.501530170440674, 5.801183223724365, 6.100836753845215, 6.400489807128906, 6.700142860412598, 6.999795913696289, 7.299449443817139, 7.59910249710083, 7.89875602722168, 8.198409080505371, 8.498062133789062, 8.79771614074707, 9.097369194030762, 9.397022247314453, 9.696675300598145, 9.996328353881836, 10.295981407165527]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 1.0, 9.0, 2.0, 5.0, 5.0, 3.0, 4.0, 11.0, 16.0, 10.0, 14.0, 35.0, 30.0, 43.0, 52.0, 62.0, 98.0, 118.0, 128.0, 164.0, 204.0, 330.0, 463.0, 842.0, 2018.0, 9324.0, 92975.0, 2053423.0, 1934745.0, 85450.0, 9251.0, 1964.0, 752.0, 430.0, 291.0, 227.0, 169.0, 122.0, 103.0, 97.0, 72.0, 52.0, 33.0, 41.0, 23.0, 25.0, 15.0, 11.0, 8.0, 8.0, 8.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.2724609375, -1.2326812744140625, -1.192901611328125, -1.1531219482421875, -1.11334228515625, -1.0735626220703125, -1.033782958984375, -0.9940032958984375, -0.9542236328125, -0.9144439697265625, -0.874664306640625, -0.8348846435546875, -0.79510498046875, -0.7553253173828125, -0.715545654296875, -0.6757659912109375, -0.635986328125, -0.5962066650390625, -0.556427001953125, -0.5166473388671875, -0.47686767578125, -0.4370880126953125, -0.397308349609375, -0.3575286865234375, -0.3177490234375, -0.2779693603515625, -0.238189697265625, -0.1984100341796875, -0.15863037109375, -0.1188507080078125, -0.079071044921875, -0.0392913818359375, 0.00048828125, 0.0402679443359375, 0.080047607421875, 0.1198272705078125, 0.15960693359375, 0.1993865966796875, 0.239166259765625, 0.2789459228515625, 0.3187255859375, 0.3585052490234375, 0.398284912109375, 0.4380645751953125, 0.47784423828125, 0.5176239013671875, 0.557403564453125, 0.5971832275390625, 0.636962890625, 0.6767425537109375, 0.716522216796875, 0.7563018798828125, 0.79608154296875, 0.8358612060546875, 0.875640869140625, 0.9154205322265625, 0.9552001953125, 0.9949798583984375, 1.034759521484375, 1.0745391845703125, 1.11431884765625, 1.1540985107421875, 1.193878173828125, 1.2336578369140625, 1.2734375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 4.0, 0.0, 5.0, 7.0, 8.0, 13.0, 8.0, 21.0, 24.0, 30.0, 47.0, 58.0, 63.0, 51.0, 91.0, 79.0, 67.0, 74.0, 81.0, 48.0, 53.0, 48.0, 26.0, 37.0, 15.0, 15.0, 12.0, 7.0, 6.0, 1.0, 3.0, 4.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.94775390625, -0.922149658203125, -0.89654541015625, -0.870941162109375, -0.8453369140625, -0.819732666015625, -0.79412841796875, -0.768524169921875, -0.742919921875, -0.717315673828125, -0.69171142578125, -0.666107177734375, -0.6405029296875, -0.614898681640625, -0.58929443359375, -0.563690185546875, -0.5380859375, -0.512481689453125, -0.48687744140625, -0.461273193359375, -0.4356689453125, -0.410064697265625, -0.38446044921875, -0.358856201171875, -0.333251953125, -0.307647705078125, -0.28204345703125, -0.256439208984375, -0.2308349609375, -0.205230712890625, -0.17962646484375, -0.154022216796875, -0.12841796875, -0.102813720703125, -0.07720947265625, -0.051605224609375, -0.0260009765625, -0.000396728515625, 0.02520751953125, 0.050811767578125, 0.076416015625, 0.102020263671875, 0.12762451171875, 0.153228759765625, 0.1788330078125, 0.204437255859375, 0.23004150390625, 0.255645751953125, 0.28125, 0.306854248046875, 0.33245849609375, 0.358062744140625, 0.3836669921875, 0.409271240234375, 0.43487548828125, 0.460479736328125, 0.486083984375, 0.511688232421875, 0.53729248046875, 0.562896728515625, 0.5885009765625, 0.614105224609375, 0.63970947265625, 0.665313720703125, 0.69091796875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 13.0, 9.0, 13.0, 16.0, 33.0, 59.0, 94.0, 96.0, 239.0, 493.0, 1563.0, 9043.0, 278146.0, 3842428.0, 55996.0, 4290.0, 965.0, 336.0, 176.0, 92.0, 73.0, 44.0, 21.0, 14.0, 16.0, 5.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8779296875, -1.8037567138671875, -1.729583740234375, -1.6554107666015625, -1.58123779296875, -1.5070648193359375, -1.432891845703125, -1.3587188720703125, -1.2845458984375, -1.2103729248046875, -1.136199951171875, -1.0620269775390625, -0.98785400390625, -0.9136810302734375, -0.839508056640625, -0.7653350830078125, -0.691162109375, -0.6169891357421875, -0.542816162109375, -0.4686431884765625, -0.39447021484375, -0.3202972412109375, -0.246124267578125, -0.1719512939453125, -0.0977783203125, -0.0236053466796875, 0.050567626953125, 0.1247406005859375, 0.19891357421875, 0.2730865478515625, 0.347259521484375, 0.4214324951171875, 0.49560546875, 0.5697784423828125, 0.643951416015625, 0.7181243896484375, 0.79229736328125, 0.8664703369140625, 0.940643310546875, 1.0148162841796875, 1.0889892578125, 1.1631622314453125, 1.237335205078125, 1.3115081787109375, 1.38568115234375, 1.4598541259765625, 1.534027099609375, 1.6082000732421875, 1.682373046875, 1.7565460205078125, 1.830718994140625, 1.9048919677734375, 1.97906494140625, 2.0532379150390625, 2.127410888671875, 2.2015838623046875, 2.2757568359375, 2.3499298095703125, 2.424102783203125, 2.4982757568359375, 2.57244873046875, 2.6466217041015625, 2.720794677734375, 2.7949676513671875, 2.869140625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 10.0, 24.0, 32.0, 54.0, 123.0, 291.0, 688.0, 1196.0, 925.0, 431.0, 150.0, 79.0, 44.0, 12.0, 6.0, 4.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.29296875, -3.2158050537109375, -3.138641357421875, -3.0614776611328125, -2.98431396484375, -2.9071502685546875, -2.829986572265625, -2.7528228759765625, -2.6756591796875, -2.5984954833984375, -2.521331787109375, -2.4441680908203125, -2.36700439453125, -2.2898406982421875, -2.212677001953125, -2.1355133056640625, -2.058349609375, -1.9811859130859375, -1.904022216796875, -1.8268585205078125, -1.74969482421875, -1.6725311279296875, -1.595367431640625, -1.5182037353515625, -1.4410400390625, -1.3638763427734375, -1.286712646484375, -1.2095489501953125, -1.13238525390625, -1.0552215576171875, -0.978057861328125, -0.9008941650390625, -0.82373046875, -0.7465667724609375, -0.669403076171875, -0.5922393798828125, -0.51507568359375, -0.4379119873046875, -0.360748291015625, -0.2835845947265625, -0.2064208984375, -0.1292572021484375, -0.052093505859375, 0.0250701904296875, 0.10223388671875, 0.1793975830078125, 0.256561279296875, 0.3337249755859375, 0.410888671875, 0.4880523681640625, 0.565216064453125, 0.6423797607421875, 0.71954345703125, 0.7967071533203125, 0.873870849609375, 0.9510345458984375, 1.0281982421875, 1.1053619384765625, 1.182525634765625, 1.2596893310546875, 1.33685302734375, 1.4140167236328125, 1.491180419921875, 1.5683441162109375, 1.6455078125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 9.0, 32.0, 38.0, 88.0, 159.0, 223.0, 192.0, 115.0, 68.0, 35.0, 10.0, 12.0, 8.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.97688102722168, -17.535297393798828, -17.093713760375977, -16.652128219604492, -16.21054458618164, -15.768960952758789, -15.327377319335938, -14.88579273223877, -14.444209098815918, -14.002625465393066, -13.561040878295898, -13.119457244873047, -12.677872657775879, -12.236289024353027, -11.79470443725586, -11.353120803833008, -10.911537170410156, -10.469953536987305, -10.028368949890137, -9.586785316467285, -9.145200729370117, -8.703617095947266, -8.262033462524414, -7.820448875427246, -7.378864288330078, -6.937280178070068, -6.495696067810059, -6.054112434387207, -5.612528324127197, -5.1709442138671875, -4.729360103607178, -4.287775993347168, -3.8461923599243164, -3.4046082496643066, -2.963024377822876, -2.521440267562866, -2.0798563957214355, -1.6382722854614258, -1.196688175201416, -0.7551043033599854, -0.3135201930999756, 0.12806382775306702, 0.5696478486061096, 1.0112318992614746, 1.4528158903121948, 1.894399881362915, 2.335983991622925, 2.7775678634643555, 3.2191519737243652, 3.660736083984375, 4.102320194244385, 4.5439043045043945, 4.985487937927246, 5.427072048187256, 5.868656158447266, 6.310239791870117, 6.751824378967285, 7.193408489227295, 7.634992599487305, 8.076576232910156, 8.518160820007324, 8.959744453430176, 9.401329040527344, 9.842912673950195, 10.284496307373047]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 3.0, 6.0, 12.0, 12.0, 15.0, 18.0, 27.0, 23.0, 37.0, 47.0, 48.0, 54.0, 70.0, 102.0, 107.0, 71.0, 74.0, 56.0, 46.0, 41.0, 37.0, 30.0, 17.0, 22.0, 12.0, 13.0, 5.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.853775978088379, -4.56828498840332, -4.28279447555542, -3.9973034858703613, -3.711812734603882, -3.4263219833374023, -3.1408309936523438, -2.8553402423858643, -2.5698494911193848, -2.2843587398529053, -1.9988678693771362, -1.7133769989013672, -1.4278862476348877, -1.1423954963684082, -0.8569046258926392, -0.5714137554168701, -0.2859230041503906, -0.0004321932792663574, 0.2850586175918579, 0.5705494284629822, 0.8560402393341064, 1.141530990600586, 1.427021861076355, 1.712512731552124, 1.9980034828186035, 2.283494234085083, 2.5689849853515625, 2.854475975036621, 3.1399667263031006, 3.42545747756958, 3.7109484672546387, 3.996439218521118, 4.281930923461914, 4.567421913146973, 4.852912425994873, 5.138403415679932, 5.423893928527832, 5.709384918212891, 5.994875907897949, 6.280366897583008, 6.565857410430908, 6.851348400115967, 7.136838912963867, 7.422329902648926, 7.707820892333984, 7.993311405181885, 8.278801918029785, 8.564292907714844, 8.849783897399902, 9.135274887084961, 9.42076587677002, 9.706255912780762, 9.99174690246582, 10.277237892150879, 10.562728881835938, 10.848219871520996, 11.133710861206055, 11.419201850891113, 11.704692840576172, 11.990182876586914, 12.275673866271973, 12.561164855957031, 12.84665584564209, 13.132146835327148, 13.41763687133789]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 2.0, 8.0, 6.0, 13.0, 11.0, 16.0, 27.0, 46.0, 58.0, 74.0, 135.0, 192.0, 294.0, 485.0, 844.0, 1500.0, 2744.0, 4879.0, 9612.0, 19926.0, 44741.0, 110006.0, 273733.0, 327787.0, 144203.0, 56991.0, 24819.0, 11969.0, 5986.0, 3161.0, 1719.0, 968.0, 594.0, 344.0, 221.0, 126.0, 100.0, 69.0, 43.0, 34.0, 24.0, 13.0, 8.0, 9.0, 7.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.82470703125, -0.7982254028320312, -0.7717437744140625, -0.7452621459960938, -0.718780517578125, -0.6922988891601562, -0.6658172607421875, -0.6393356323242188, -0.61285400390625, -0.5863723754882812, -0.5598907470703125, -0.5334091186523438, -0.506927490234375, -0.48044586181640625, -0.4539642333984375, -0.42748260498046875, -0.4010009765625, -0.37451934814453125, -0.3480377197265625, -0.32155609130859375, -0.295074462890625, -0.26859283447265625, -0.2421112060546875, -0.21562957763671875, -0.18914794921875, -0.16266632080078125, -0.1361846923828125, -0.10970306396484375, -0.083221435546875, -0.05673980712890625, -0.0302581787109375, -0.00377655029296875, 0.022705078125, 0.04918670654296875, 0.0756683349609375, 0.10214996337890625, 0.128631591796875, 0.15511322021484375, 0.1815948486328125, 0.20807647705078125, 0.23455810546875, 0.26103973388671875, 0.2875213623046875, 0.31400299072265625, 0.340484619140625, 0.36696624755859375, 0.3934478759765625, 0.41992950439453125, 0.4464111328125, 0.47289276123046875, 0.4993743896484375, 0.5258560180664062, 0.552337646484375, 0.5788192749023438, 0.6053009033203125, 0.6317825317382812, 0.65826416015625, 0.6847457885742188, 0.7112274169921875, 0.7377090454101562, 0.764190673828125, 0.7906723022460938, 0.8171539306640625, 0.8436355590820312, 0.8701171875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 6.0, 1.0, 6.0, 5.0, 16.0, 13.0, 14.0, 27.0, 31.0, 31.0, 46.0, 55.0, 66.0, 70.0, 73.0, 64.0, 73.0, 76.0, 48.0, 66.0, 50.0, 34.0, 27.0, 29.0, 24.0, 16.0, 13.0, 6.0, 7.0, 3.0, 5.0, 1.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.97607421875, -0.9494476318359375, -0.922821044921875, -0.8961944580078125, -0.86956787109375, -0.8429412841796875, -0.816314697265625, -0.7896881103515625, -0.7630615234375, -0.7364349365234375, -0.709808349609375, -0.6831817626953125, -0.65655517578125, -0.6299285888671875, -0.603302001953125, -0.5766754150390625, -0.550048828125, -0.5234222412109375, -0.496795654296875, -0.4701690673828125, -0.44354248046875, -0.4169158935546875, -0.390289306640625, -0.3636627197265625, -0.3370361328125, -0.3104095458984375, -0.283782958984375, -0.2571563720703125, -0.23052978515625, -0.2039031982421875, -0.177276611328125, -0.1506500244140625, -0.1240234375, -0.0973968505859375, -0.070770263671875, -0.0441436767578125, -0.01751708984375, 0.0091094970703125, 0.035736083984375, 0.0623626708984375, 0.0889892578125, 0.1156158447265625, 0.142242431640625, 0.1688690185546875, 0.19549560546875, 0.2221221923828125, 0.248748779296875, 0.2753753662109375, 0.302001953125, 0.3286285400390625, 0.355255126953125, 0.3818817138671875, 0.40850830078125, 0.4351348876953125, 0.461761474609375, 0.4883880615234375, 0.5150146484375, 0.5416412353515625, 0.568267822265625, 0.5948944091796875, 0.62152099609375, 0.6481475830078125, 0.674774169921875, 0.7014007568359375, 0.72802734375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 5.0, 11.0, 9.0, 22.0, 27.0, 41.0, 54.0, 95.0, 141.0, 238.0, 407.0, 677.0, 1267.0, 3477.0, 17797.0, 262444.0, 724222.0, 29489.0, 4669.0, 1580.0, 757.0, 419.0, 229.0, 165.0, 95.0, 64.0, 53.0, 23.0, 33.0, 15.0, 9.0, 7.0, 4.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.5546875, -2.47979736328125, -2.4049072265625, -2.33001708984375, -2.255126953125, -2.18023681640625, -2.1053466796875, -2.03045654296875, -1.95556640625, -1.88067626953125, -1.8057861328125, -1.73089599609375, -1.656005859375, -1.58111572265625, -1.5062255859375, -1.43133544921875, -1.3564453125, -1.28155517578125, -1.2066650390625, -1.13177490234375, -1.056884765625, -0.98199462890625, -0.9071044921875, -0.83221435546875, -0.75732421875, -0.68243408203125, -0.6075439453125, -0.53265380859375, -0.457763671875, -0.38287353515625, -0.3079833984375, -0.23309326171875, -0.158203125, -0.08331298828125, -0.0084228515625, 0.06646728515625, 0.141357421875, 0.21624755859375, 0.2911376953125, 0.36602783203125, 0.44091796875, 0.51580810546875, 0.5906982421875, 0.66558837890625, 0.740478515625, 0.81536865234375, 0.8902587890625, 0.96514892578125, 1.0400390625, 1.11492919921875, 1.1898193359375, 1.26470947265625, 1.339599609375, 1.41448974609375, 1.4893798828125, 1.56427001953125, 1.63916015625, 1.71405029296875, 1.7889404296875, 1.86383056640625, 1.938720703125, 2.01361083984375, 2.0885009765625, 2.16339111328125, 2.23828125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 6.0, 8.0, 7.0, 13.0, 23.0, 25.0, 27.0, 38.0, 56.0, 73.0, 88.0, 113.0, 100.0, 97.0, 83.0, 64.0, 43.0, 45.0, 27.0, 20.0, 11.0, 13.0, 4.0, 8.0, 7.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.6875, -4.559356689453125, -4.43121337890625, -4.303070068359375, -4.1749267578125, -4.046783447265625, -3.91864013671875, -3.790496826171875, -3.662353515625, -3.534210205078125, -3.40606689453125, -3.277923583984375, -3.1497802734375, -3.021636962890625, -2.89349365234375, -2.765350341796875, -2.63720703125, -2.509063720703125, -2.38092041015625, -2.252777099609375, -2.1246337890625, -1.996490478515625, -1.86834716796875, -1.740203857421875, -1.612060546875, -1.483917236328125, -1.35577392578125, -1.227630615234375, -1.0994873046875, -0.971343994140625, -0.84320068359375, -0.715057373046875, -0.5869140625, -0.458770751953125, -0.33062744140625, -0.202484130859375, -0.0743408203125, 0.053802490234375, 0.18194580078125, 0.310089111328125, 0.438232421875, 0.566375732421875, 0.69451904296875, 0.822662353515625, 0.9508056640625, 1.078948974609375, 1.20709228515625, 1.335235595703125, 1.46337890625, 1.591522216796875, 1.71966552734375, 1.847808837890625, 1.9759521484375, 2.104095458984375, 2.23223876953125, 2.360382080078125, 2.488525390625, 2.616668701171875, 2.74481201171875, 2.872955322265625, 3.0010986328125, 3.129241943359375, 3.25738525390625, 3.385528564453125, 3.513671875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 6.0, 8.0, 10.0, 19.0, 27.0, 38.0, 52.0, 74.0, 107.0, 230.0, 409.0, 741.0, 1521.0, 3986.0, 12256.0, 51274.0, 307829.0, 591733.0, 57025.0, 13599.0, 4266.0, 1545.0, 774.0, 412.0, 219.0, 145.0, 86.0, 52.0, 29.0, 18.0, 20.0, 11.0, 9.0, 9.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.38818359375, -0.3756752014160156, -0.36316680908203125, -0.3506584167480469, -0.3381500244140625, -0.3256416320800781, -0.31313323974609375, -0.3006248474121094, -0.288116455078125, -0.2756080627441406, -0.26309967041015625, -0.2505912780761719, -0.2380828857421875, -0.22557449340820312, -0.21306610107421875, -0.20055770874023438, -0.18804931640625, -0.17554092407226562, -0.16303253173828125, -0.15052413940429688, -0.1380157470703125, -0.12550735473632812, -0.11299896240234375, -0.10049057006835938, -0.087982177734375, -0.07547378540039062, -0.06296539306640625, -0.050457000732421875, -0.0379486083984375, -0.025440216064453125, -0.01293182373046875, -0.000423431396484375, 0.0120849609375, 0.024593353271484375, 0.03710174560546875, 0.049610137939453125, 0.0621185302734375, 0.07462692260742188, 0.08713531494140625, 0.09964370727539062, 0.112152099609375, 0.12466049194335938, 0.13716888427734375, 0.14967727661132812, 0.1621856689453125, 0.17469406127929688, 0.18720245361328125, 0.19971084594726562, 0.21221923828125, 0.22472763061523438, 0.23723602294921875, 0.24974441528320312, 0.2622528076171875, 0.2747611999511719, 0.28726959228515625, 0.2997779846191406, 0.312286376953125, 0.3247947692871094, 0.33730316162109375, 0.3498115539550781, 0.3623199462890625, 0.3748283386230469, 0.38733673095703125, 0.3998451232910156, 0.412353515625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 3.0, 9.0, 5.0, 5.0, 9.0, 13.0, 8.0, 13.0, 15.0, 16.0, 21.0, 36.0, 60.0, 63.0, 71.0, 97.0, 106.0, 104.0, 73.0, 53.0, 47.0, 36.0, 29.0, 28.0, 24.0, 8.0, 13.0, 6.0, 4.0, 5.0, 8.0, 2.0, 1.0, 4.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0001575946807861328, -0.00015300512313842773, -0.00014841556549072266, -0.00014382600784301758, -0.0001392364501953125, -0.00013464689254760742, -0.00013005733489990234, -0.00012546777725219727, -0.00012087821960449219, -0.00011628866195678711, -0.00011169910430908203, -0.00010710954666137695, -0.00010251998901367188, -9.79304313659668e-05, -9.334087371826172e-05, -8.875131607055664e-05, -8.416175842285156e-05, -7.957220077514648e-05, -7.49826431274414e-05, -7.039308547973633e-05, -6.580352783203125e-05, -6.121397018432617e-05, -5.6624412536621094e-05, -5.2034854888916016e-05, -4.744529724121094e-05, -4.285573959350586e-05, -3.826618194580078e-05, -3.36766242980957e-05, -2.9087066650390625e-05, -2.4497509002685547e-05, -1.990795135498047e-05, -1.531839370727539e-05, -1.0728836059570312e-05, -6.139278411865234e-06, -1.5497207641601562e-06, 3.039836883544922e-06, 7.62939453125e-06, 1.2218952178955078e-05, 1.6808509826660156e-05, 2.1398067474365234e-05, 2.5987625122070312e-05, 3.057718276977539e-05, 3.516674041748047e-05, 3.975629806518555e-05, 4.4345855712890625e-05, 4.89354133605957e-05, 5.352497100830078e-05, 5.811452865600586e-05, 6.270408630371094e-05, 6.729364395141602e-05, 7.18832015991211e-05, 7.647275924682617e-05, 8.106231689453125e-05, 8.565187454223633e-05, 9.02414321899414e-05, 9.483098983764648e-05, 9.942054748535156e-05, 0.00010401010513305664, 0.00010859966278076172, 0.0001131892204284668, 0.00011777877807617188, 0.00012236833572387695, 0.00012695789337158203, 0.0001315474510192871, 0.0001361370086669922]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 5.0, 7.0, 7.0, 9.0, 19.0, 18.0, 33.0, 47.0, 76.0, 88.0, 180.0, 268.0, 529.0, 1114.0, 2380.0, 7066.0, 28533.0, 162430.0, 722866.0, 95574.0, 18382.0, 5120.0, 1864.0, 861.0, 454.0, 235.0, 117.0, 81.0, 64.0, 35.0, 38.0, 16.0, 16.0, 9.0, 8.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.397216796875, -0.38494110107421875, -0.3726654052734375, -0.36038970947265625, -0.348114013671875, -0.33583831787109375, -0.3235626220703125, -0.31128692626953125, -0.29901123046875, -0.28673553466796875, -0.2744598388671875, -0.26218414306640625, -0.249908447265625, -0.23763275146484375, -0.2253570556640625, -0.21308135986328125, -0.2008056640625, -0.18852996826171875, -0.1762542724609375, -0.16397857666015625, -0.151702880859375, -0.13942718505859375, -0.1271514892578125, -0.11487579345703125, -0.10260009765625, -0.09032440185546875, -0.0780487060546875, -0.06577301025390625, -0.053497314453125, -0.04122161865234375, -0.0289459228515625, -0.01667022705078125, -0.00439453125, 0.00788116455078125, 0.0201568603515625, 0.03243255615234375, 0.044708251953125, 0.05698394775390625, 0.0692596435546875, 0.08153533935546875, 0.09381103515625, 0.10608673095703125, 0.1183624267578125, 0.13063812255859375, 0.142913818359375, 0.15518951416015625, 0.1674652099609375, 0.17974090576171875, 0.1920166015625, 0.20429229736328125, 0.2165679931640625, 0.22884368896484375, 0.241119384765625, 0.25339508056640625, 0.2656707763671875, 0.27794647216796875, 0.29022216796875, 0.30249786376953125, 0.3147735595703125, 0.32704925537109375, 0.339324951171875, 0.35160064697265625, 0.3638763427734375, 0.37615203857421875, 0.388427734375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 3.0, 8.0, 15.0, 10.0, 8.0, 27.0, 32.0, 39.0, 82.0, 90.0, 114.0, 111.0, 113.0, 92.0, 65.0, 55.0, 39.0, 31.0, 22.0, 17.0, 3.0, 5.0, 6.0, 3.0, 2.0, 0.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.6279296875, -0.612213134765625, -0.59649658203125, -0.580780029296875, -0.5650634765625, -0.549346923828125, -0.53363037109375, -0.517913818359375, -0.502197265625, -0.486480712890625, -0.47076416015625, -0.455047607421875, -0.4393310546875, -0.423614501953125, -0.40789794921875, -0.392181396484375, -0.37646484375, -0.360748291015625, -0.34503173828125, -0.329315185546875, -0.3135986328125, -0.297882080078125, -0.28216552734375, -0.266448974609375, -0.250732421875, -0.235015869140625, -0.21929931640625, -0.203582763671875, -0.1878662109375, -0.172149658203125, -0.15643310546875, -0.140716552734375, -0.125, -0.109283447265625, -0.09356689453125, -0.077850341796875, -0.0621337890625, -0.046417236328125, -0.03070068359375, -0.014984130859375, 0.000732421875, 0.016448974609375, 0.03216552734375, 0.047882080078125, 0.0635986328125, 0.079315185546875, 0.09503173828125, 0.110748291015625, 0.12646484375, 0.142181396484375, 0.15789794921875, 0.173614501953125, 0.1893310546875, 0.205047607421875, 0.22076416015625, 0.236480712890625, 0.252197265625, 0.267913818359375, 0.28363037109375, 0.299346923828125, 0.3150634765625, 0.330780029296875, 0.34649658203125, 0.362213134765625, 0.3779296875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 4.0, 12.0, 15.0, 43.0, 94.0, 153.0, 429.0, 144.0, 57.0, 27.0, 14.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.384563446044922, -21.88277816772461, -21.380992889404297, -20.879207611083984, -20.377422332763672, -19.875635147094727, -19.373849868774414, -18.8720645904541, -18.37027931213379, -17.868494033813477, -17.366708755493164, -16.86492347717285, -16.363136291503906, -15.86135196685791, -15.359565734863281, -14.857780456542969, -14.355995178222656, -13.854209899902344, -13.352424621582031, -12.850638389587402, -12.34885311126709, -11.847067832946777, -11.345281600952148, -10.843496322631836, -10.341711044311523, -9.839925765991211, -9.338140487670898, -8.83635425567627, -8.334568977355957, -7.8327836990356445, -7.330997943878174, -6.829212188720703, -6.327426910400391, -5.825641632080078, -5.323855876922607, -4.822070121765137, -4.320284843444824, -3.8184993267059326, -3.316713809967041, -2.8149282932281494, -2.313142776489258, -1.8113572597503662, -1.3095717430114746, -0.807786226272583, -0.3060007095336914, 0.1957848072052002, 0.6975703239440918, 1.1993558406829834, 1.701141357421875, 2.2029268741607666, 2.704712390899658, 3.20649790763855, 3.7082834243774414, 4.210068702697754, 4.711854457855225, 5.213640213012695, 5.715425491333008, 6.21721076965332, 6.718996524810791, 7.220782279968262, 7.722567558288574, 8.224352836608887, 8.726139068603516, 9.227924346923828, 9.72970962524414]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 1.0, 2.0, 0.0, 5.0, 6.0, 7.0, 5.0, 10.0, 8.0, 11.0, 7.0, 16.0, 13.0, 21.0, 22.0, 20.0, 30.0, 22.0, 30.0, 27.0, 37.0, 67.0, 137.0, 136.0, 59.0, 43.0, 32.0, 29.0, 27.0, 26.0, 25.0, 22.0, 13.0, 18.0, 13.0, 13.0, 13.0, 7.0, 5.0, 5.0, 7.0, 2.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.575469017028809, -8.307669639587402, -8.039871215820312, -7.772071838378906, -7.5042724609375, -7.236473560333252, -6.968674659729004, -6.700875282287598, -6.43307638168335, -6.165277481079102, -5.897478103637695, -5.629679203033447, -5.361880302429199, -5.094080924987793, -4.826282024383545, -4.558483123779297, -4.290683746337891, -4.022884845733643, -3.7550854682922363, -3.4872865676879883, -3.219487428665161, -2.951688289642334, -2.683889389038086, -2.416090250015259, -2.1482911109924316, -1.8804919719696045, -1.612692952156067, -1.3448939323425293, -1.0770947933197021, -0.809295654296875, -0.5414966344833374, -0.2736976146697998, -0.005898475646972656, 0.2619006037712097, 0.5296996831893921, 0.7974987626075745, 1.0652978420257568, 1.333096981048584, 1.6008960008621216, 1.8686950206756592, 2.1364941596984863, 2.4042932987213135, 2.6720924377441406, 2.9398913383483887, 3.207690477371216, 3.475489616394043, 3.743288516998291, 4.011087417602539, 4.278886795043945, 4.546685695648193, 4.8144850730896, 5.082283973693848, 5.350083351135254, 5.617882251739502, 5.88568115234375, 6.153480529785156, 6.421279430389404, 6.689078330993652, 6.956877708435059, 7.224676609039307, 7.492475509643555, 7.760274887084961, 8.028074264526367, 8.295872688293457, 8.563672065734863]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 0.0, 6.0, 11.0, 5.0, 17.0, 19.0, 26.0, 30.0, 50.0, 73.0, 101.0, 142.0, 211.0, 350.0, 566.0, 961.0, 1751.0, 3350.0, 7161.0, 19857.0, 69576.0, 293016.0, 1089307.0, 1762328.0, 704586.0, 171265.0, 43800.0, 13659.0, 5722.0, 2645.0, 1430.0, 769.0, 528.0, 319.0, 197.0, 141.0, 92.0, 63.0, 52.0, 29.0, 28.0, 11.0, 7.0, 7.0, 5.0, 7.0, 4.0, 3.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.841796875, -0.817962646484375, -0.79412841796875, -0.770294189453125, -0.7464599609375, -0.722625732421875, -0.69879150390625, -0.674957275390625, -0.651123046875, -0.627288818359375, -0.60345458984375, -0.579620361328125, -0.5557861328125, -0.531951904296875, -0.50811767578125, -0.484283447265625, -0.46044921875, -0.436614990234375, -0.41278076171875, -0.388946533203125, -0.3651123046875, -0.341278076171875, -0.31744384765625, -0.293609619140625, -0.269775390625, -0.245941162109375, -0.22210693359375, -0.198272705078125, -0.1744384765625, -0.150604248046875, -0.12677001953125, -0.102935791015625, -0.0791015625, -0.055267333984375, -0.03143310546875, -0.007598876953125, 0.0162353515625, 0.040069580078125, 0.06390380859375, 0.087738037109375, 0.111572265625, 0.135406494140625, 0.15924072265625, 0.183074951171875, 0.2069091796875, 0.230743408203125, 0.25457763671875, 0.278411865234375, 0.30224609375, 0.326080322265625, 0.34991455078125, 0.373748779296875, 0.3975830078125, 0.421417236328125, 0.44525146484375, 0.469085693359375, 0.492919921875, 0.516754150390625, 0.54058837890625, 0.564422607421875, 0.5882568359375, 0.612091064453125, 0.63592529296875, 0.659759521484375, 0.68359375]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 1.0, 2.0, 0.0, 7.0, 14.0, 13.0, 8.0, 20.0, 34.0, 47.0, 42.0, 43.0, 65.0, 69.0, 73.0, 68.0, 62.0, 72.0, 67.0, 64.0, 49.0, 49.0, 29.0, 25.0, 16.0, 15.0, 19.0, 11.0, 5.0, 7.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.98046875, -0.9552688598632812, -0.9300689697265625, -0.9048690795898438, -0.879669189453125, -0.8544692993164062, -0.8292694091796875, -0.8040695190429688, -0.77886962890625, -0.7536697387695312, -0.7284698486328125, -0.7032699584960938, -0.678070068359375, -0.6528701782226562, -0.6276702880859375, -0.6024703979492188, -0.5772705078125, -0.5520706176757812, -0.5268707275390625, -0.5016708374023438, -0.476470947265625, -0.45127105712890625, -0.4260711669921875, -0.40087127685546875, -0.37567138671875, -0.35047149658203125, -0.3252716064453125, -0.30007171630859375, -0.274871826171875, -0.24967193603515625, -0.2244720458984375, -0.19927215576171875, -0.174072265625, -0.14887237548828125, -0.1236724853515625, -0.09847259521484375, -0.073272705078125, -0.04807281494140625, -0.0228729248046875, 0.00232696533203125, 0.02752685546875, 0.05272674560546875, 0.0779266357421875, 0.10312652587890625, 0.128326416015625, 0.15352630615234375, 0.1787261962890625, 0.20392608642578125, 0.2291259765625, 0.25432586669921875, 0.2795257568359375, 0.30472564697265625, 0.329925537109375, 0.35512542724609375, 0.3803253173828125, 0.40552520751953125, 0.43072509765625, 0.45592498779296875, 0.4811248779296875, 0.5063247680664062, 0.531524658203125, 0.5567245483398438, 0.5819244384765625, 0.6071243286132812, 0.63232421875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 3.0, 3.0, 6.0, 11.0, 17.0, 14.0, 28.0, 39.0, 47.0, 103.0, 152.0, 282.0, 515.0, 1065.0, 3236.0, 24509.0, 3801719.0, 351352.0, 7671.0, 1786.0, 811.0, 357.0, 217.0, 136.0, 62.0, 40.0, 30.0, 20.0, 21.0, 8.0, 9.0, 6.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.75, -3.628173828125, -3.50634765625, -3.384521484375, -3.2626953125, -3.140869140625, -3.01904296875, -2.897216796875, -2.775390625, -2.653564453125, -2.53173828125, -2.409912109375, -2.2880859375, -2.166259765625, -2.04443359375, -1.922607421875, -1.80078125, -1.678955078125, -1.55712890625, -1.435302734375, -1.3134765625, -1.191650390625, -1.06982421875, -0.947998046875, -0.826171875, -0.704345703125, -0.58251953125, -0.460693359375, -0.3388671875, -0.217041015625, -0.09521484375, 0.026611328125, 0.1484375, 0.270263671875, 0.39208984375, 0.513916015625, 0.6357421875, 0.757568359375, 0.87939453125, 1.001220703125, 1.123046875, 1.244873046875, 1.36669921875, 1.488525390625, 1.6103515625, 1.732177734375, 1.85400390625, 1.975830078125, 2.09765625, 2.219482421875, 2.34130859375, 2.463134765625, 2.5849609375, 2.706787109375, 2.82861328125, 2.950439453125, 3.072265625, 3.194091796875, 3.31591796875, 3.437744140625, 3.5595703125, 3.681396484375, 3.80322265625, 3.925048828125, 4.046875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 8.0, 7.0, 23.0, 24.0, 38.0, 63.0, 97.0, 159.0, 276.0, 436.0, 647.0, 778.0, 602.0, 375.0, 198.0, 120.0, 75.0, 57.0, 40.0, 24.0, 10.0, 7.0, 5.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.400390625, -3.31402587890625, -3.2276611328125, -3.14129638671875, -3.054931640625, -2.96856689453125, -2.8822021484375, -2.79583740234375, -2.70947265625, -2.62310791015625, -2.5367431640625, -2.45037841796875, -2.364013671875, -2.27764892578125, -2.1912841796875, -2.10491943359375, -2.0185546875, -1.93218994140625, -1.8458251953125, -1.75946044921875, -1.673095703125, -1.58673095703125, -1.5003662109375, -1.41400146484375, -1.32763671875, -1.24127197265625, -1.1549072265625, -1.06854248046875, -0.982177734375, -0.89581298828125, -0.8094482421875, -0.72308349609375, -0.63671875, -0.55035400390625, -0.4639892578125, -0.37762451171875, -0.291259765625, -0.20489501953125, -0.1185302734375, -0.03216552734375, 0.05419921875, 0.14056396484375, 0.2269287109375, 0.31329345703125, 0.399658203125, 0.48602294921875, 0.5723876953125, 0.65875244140625, 0.7451171875, 0.83148193359375, 0.9178466796875, 1.00421142578125, 1.090576171875, 1.17694091796875, 1.2633056640625, 1.34967041015625, 1.43603515625, 1.52239990234375, 1.6087646484375, 1.69512939453125, 1.781494140625, 1.86785888671875, 1.9542236328125, 2.04058837890625, 2.126953125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 6.0, 7.0, 3.0, 0.0, 1.0, 8.0, 16.0, 22.0, 68.0, 153.0, 295.0, 255.0, 92.0, 45.0, 23.0, 12.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-55.16006088256836, -53.98428726196289, -52.808509826660156, -51.63273620605469, -50.45696258544922, -49.28118896484375, -48.105411529541016, -46.92963790893555, -45.75386047363281, -44.578086853027344, -43.40230941772461, -42.22653579711914, -41.05076217651367, -39.87498474121094, -38.69921112060547, -37.5234375, -36.34766387939453, -35.17189025878906, -33.99611282348633, -32.82033920288086, -31.64456558227539, -30.46879005432129, -29.293014526367188, -28.11724090576172, -26.941465377807617, -25.765689849853516, -24.589916229248047, -23.414140701293945, -22.238365173339844, -21.062591552734375, -19.886816024780273, -18.711040496826172, -17.53527069091797, -16.359495162963867, -15.183721542358398, -14.007946014404297, -12.832171440124512, -11.656396865844727, -10.480621337890625, -9.30484676361084, -8.129072189331055, -6.9532976150512695, -5.777522563934326, -4.601747512817383, -3.4259729385375977, -2.2501983642578125, -1.0744233131408691, 0.10135173797607422, 1.2771263122558594, 2.4529011249542236, 3.628675937652588, 4.804450988769531, 5.980225563049316, 7.156000137329102, 8.331775665283203, 9.507550239562988, 10.683324813842773, 11.859099388122559, 13.034873962402344, 14.210649490356445, 15.38642406463623, 16.562198638916016, 17.737974166870117, 18.91374969482422, 20.089523315429688]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 9.0, 11.0, 16.0, 16.0, 39.0, 27.0, 61.0, 68.0, 79.0, 100.0, 127.0, 91.0, 79.0, 49.0, 47.0, 52.0, 37.0, 31.0, 19.0, 15.0, 15.0, 5.0, 5.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.348106384277344, -17.676523208618164, -17.00493812561035, -16.333354949951172, -15.66176986694336, -14.99018669128418, -14.318602561950684, -13.647018432617188, -12.975434303283691, -12.303850173950195, -11.6322660446167, -10.960681915283203, -10.289098739624023, -9.617513656616211, -8.945930480957031, -8.274346351623535, -7.602762222290039, -6.931178092956543, -6.259593963623047, -5.588010311126709, -4.916426181793213, -4.244842052459717, -3.573258399963379, -2.901674270629883, -2.2300901412963867, -1.5585061311721802, -0.8869221210479736, -0.21533823013305664, 0.45624589920043945, 1.1278300285339355, 1.7994136810302734, 2.4709978103637695, 3.1425819396972656, 3.8141660690307617, 4.485750198364258, 5.157333850860596, 5.828917980194092, 6.500502109527588, 7.172085762023926, 7.843669891357422, 8.515254020690918, 9.186838150024414, 9.85842227935791, 10.530006408691406, 11.201589584350586, 11.873174667358398, 12.544757843017578, 13.216341972351074, 13.88792610168457, 14.559510231018066, 15.231094360351562, 15.902677536010742, 16.574262619018555, 17.245845794677734, 17.917430877685547, 18.589014053344727, 19.260597229003906, 19.932180404663086, 20.6037654876709, 21.275348663330078, 21.94693374633789, 22.61851692199707, 23.29010009765625, 23.961685180664062, 24.633270263671875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 5.0, 10.0, 9.0, 11.0, 17.0, 25.0, 30.0, 54.0, 81.0, 153.0, 241.0, 620.0, 1531.0, 5992.0, 33942.0, 485991.0, 477474.0, 33594.0, 6008.0, 1573.0, 584.0, 261.0, 129.0, 69.0, 52.0, 29.0, 22.0, 13.0, 9.0, 9.0, 3.0, 4.0, 10.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.150390625, -2.078704833984375, -2.00701904296875, -1.935333251953125, -1.8636474609375, -1.791961669921875, -1.72027587890625, -1.648590087890625, -1.576904296875, -1.505218505859375, -1.43353271484375, -1.361846923828125, -1.2901611328125, -1.218475341796875, -1.14678955078125, -1.075103759765625, -1.00341796875, -0.931732177734375, -0.86004638671875, -0.788360595703125, -0.7166748046875, -0.644989013671875, -0.57330322265625, -0.501617431640625, -0.429931640625, -0.358245849609375, -0.28656005859375, -0.214874267578125, -0.1431884765625, -0.071502685546875, 0.00018310546875, 0.071868896484375, 0.1435546875, 0.215240478515625, 0.28692626953125, 0.358612060546875, 0.4302978515625, 0.501983642578125, 0.57366943359375, 0.645355224609375, 0.717041015625, 0.788726806640625, 0.86041259765625, 0.932098388671875, 1.0037841796875, 1.075469970703125, 1.14715576171875, 1.218841552734375, 1.29052734375, 1.362213134765625, 1.43389892578125, 1.505584716796875, 1.5772705078125, 1.648956298828125, 1.72064208984375, 1.792327880859375, 1.864013671875, 1.935699462890625, 2.00738525390625, 2.079071044921875, 2.1507568359375, 2.222442626953125, 2.29412841796875, 2.365814208984375, 2.4375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 9.0, 6.0, 18.0, 34.0, 61.0, 66.0, 106.0, 134.0, 144.0, 132.0, 103.0, 69.0, 52.0, 30.0, 24.0, 11.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7998046875, -1.7365264892578125, -1.673248291015625, -1.6099700927734375, -1.54669189453125, -1.4834136962890625, -1.420135498046875, -1.3568572998046875, -1.2935791015625, -1.2303009033203125, -1.167022705078125, -1.1037445068359375, -1.04046630859375, -0.9771881103515625, -0.913909912109375, -0.8506317138671875, -0.787353515625, -0.7240753173828125, -0.660797119140625, -0.5975189208984375, -0.53424072265625, -0.4709625244140625, -0.407684326171875, -0.3444061279296875, -0.2811279296875, -0.2178497314453125, -0.154571533203125, -0.0912933349609375, -0.02801513671875, 0.0352630615234375, 0.098541259765625, 0.1618194580078125, 0.22509765625, 0.2883758544921875, 0.351654052734375, 0.4149322509765625, 0.47821044921875, 0.5414886474609375, 0.604766845703125, 0.6680450439453125, 0.7313232421875, 0.7946014404296875, 0.857879638671875, 0.9211578369140625, 0.98443603515625, 1.0477142333984375, 1.110992431640625, 1.1742706298828125, 1.237548828125, 1.3008270263671875, 1.364105224609375, 1.4273834228515625, 1.49066162109375, 1.5539398193359375, 1.617218017578125, 1.6804962158203125, 1.7437744140625, 1.8070526123046875, 1.870330810546875, 1.9336090087890625, 1.99688720703125, 2.0601654052734375, 2.123443603515625, 2.1867218017578125, 2.25]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 7.0, 8.0, 3.0, 8.0, 13.0, 13.0, 17.0, 20.0, 35.0, 46.0, 56.0, 82.0, 111.0, 176.0, 303.0, 467.0, 988.0, 2311.0, 7858.0, 47991.0, 877114.0, 93031.0, 11987.0, 3126.0, 1202.0, 589.0, 353.0, 188.0, 125.0, 90.0, 52.0, 46.0, 38.0, 28.0, 19.0, 15.0, 11.0, 5.0, 7.0, 8.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.9072265625, -1.8537139892578125, -1.800201416015625, -1.7466888427734375, -1.69317626953125, -1.6396636962890625, -1.586151123046875, -1.5326385498046875, -1.4791259765625, -1.4256134033203125, -1.372100830078125, -1.3185882568359375, -1.26507568359375, -1.2115631103515625, -1.158050537109375, -1.1045379638671875, -1.051025390625, -0.9975128173828125, -0.944000244140625, -0.8904876708984375, -0.83697509765625, -0.7834625244140625, -0.729949951171875, -0.6764373779296875, -0.6229248046875, -0.5694122314453125, -0.515899658203125, -0.4623870849609375, -0.40887451171875, -0.3553619384765625, -0.301849365234375, -0.2483367919921875, -0.19482421875, -0.1413116455078125, -0.087799072265625, -0.0342864990234375, 0.01922607421875, 0.0727386474609375, 0.126251220703125, 0.1797637939453125, 0.2332763671875, 0.2867889404296875, 0.340301513671875, 0.3938140869140625, 0.44732666015625, 0.5008392333984375, 0.554351806640625, 0.6078643798828125, 0.661376953125, 0.7148895263671875, 0.768402099609375, 0.8219146728515625, 0.87542724609375, 0.9289398193359375, 0.982452392578125, 1.0359649658203125, 1.0894775390625, 1.1429901123046875, 1.196502685546875, 1.2500152587890625, 1.30352783203125, 1.3570404052734375, 1.410552978515625, 1.4640655517578125, 1.517578125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 3.0, 6.0, 15.0, 3.0, 8.0, 10.0, 12.0, 19.0, 21.0, 29.0, 30.0, 35.0, 51.0, 73.0, 73.0, 70.0, 113.0, 76.0, 56.0, 58.0, 42.0, 38.0, 31.0, 22.0, 23.0, 26.0, 12.0, 7.0, 8.0, 8.0, 4.0, 5.0, 2.0, 6.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.40234375, -4.29046630859375, -4.1785888671875, -4.06671142578125, -3.954833984375, -3.84295654296875, -3.7310791015625, -3.61920166015625, -3.50732421875, -3.39544677734375, -3.2835693359375, -3.17169189453125, -3.059814453125, -2.94793701171875, -2.8360595703125, -2.72418212890625, -2.6123046875, -2.50042724609375, -2.3885498046875, -2.27667236328125, -2.164794921875, -2.05291748046875, -1.9410400390625, -1.82916259765625, -1.71728515625, -1.60540771484375, -1.4935302734375, -1.38165283203125, -1.269775390625, -1.15789794921875, -1.0460205078125, -0.93414306640625, -0.822265625, -0.71038818359375, -0.5985107421875, -0.48663330078125, -0.374755859375, -0.26287841796875, -0.1510009765625, -0.03912353515625, 0.07275390625, 0.18463134765625, 0.2965087890625, 0.40838623046875, 0.520263671875, 0.63214111328125, 0.7440185546875, 0.85589599609375, 0.9677734375, 1.07965087890625, 1.1915283203125, 1.30340576171875, 1.415283203125, 1.52716064453125, 1.6390380859375, 1.75091552734375, 1.86279296875, 1.97467041015625, 2.0865478515625, 2.19842529296875, 2.310302734375, 2.42218017578125, 2.5340576171875, 2.64593505859375, 2.7578125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 3.0, 8.0, 4.0, 10.0, 12.0, 21.0, 31.0, 38.0, 71.0, 93.0, 106.0, 215.0, 357.0, 688.0, 1572.0, 3936.0, 12765.0, 56429.0, 848122.0, 96493.0, 18363.0, 5257.0, 1965.0, 896.0, 421.0, 240.0, 165.0, 80.0, 54.0, 42.0, 37.0, 19.0, 11.0, 11.0, 6.0, 8.0, 6.0, 0.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.391357421875, -0.3803749084472656, -0.36939239501953125, -0.3584098815917969, -0.3474273681640625, -0.3364448547363281, -0.32546234130859375, -0.3144798278808594, -0.303497314453125, -0.2925148010253906, -0.28153228759765625, -0.2705497741699219, -0.2595672607421875, -0.24858474731445312, -0.23760223388671875, -0.22661972045898438, -0.21563720703125, -0.20465469360351562, -0.19367218017578125, -0.18268966674804688, -0.1717071533203125, -0.16072463989257812, -0.14974212646484375, -0.13875961303710938, -0.127777099609375, -0.11679458618164062, -0.10581207275390625, -0.09482955932617188, -0.0838470458984375, -0.07286453247070312, -0.06188201904296875, -0.050899505615234375, -0.0399169921875, -0.028934478759765625, -0.01795196533203125, -0.006969451904296875, 0.0040130615234375, 0.014995574951171875, 0.02597808837890625, 0.036960601806640625, 0.047943115234375, 0.058925628662109375, 0.06990814208984375, 0.08089065551757812, 0.0918731689453125, 0.10285568237304688, 0.11383819580078125, 0.12482070922851562, 0.13580322265625, 0.14678573608398438, 0.15776824951171875, 0.16875076293945312, 0.1797332763671875, 0.19071578979492188, 0.20169830322265625, 0.21268081665039062, 0.223663330078125, 0.23464584350585938, 0.24562835693359375, 0.2566108703613281, 0.2675933837890625, 0.2785758972167969, 0.28955841064453125, 0.3005409240722656, 0.3115234375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 5.0, 5.0, 5.0, 9.0, 7.0, 7.0, 9.0, 12.0, 10.0, 22.0, 27.0, 43.0, 36.0, 69.0, 108.0, 133.0, 141.0, 100.0, 65.0, 45.0, 34.0, 31.0, 20.0, 9.0, 10.0, 8.0, 8.0, 5.0, 8.0, 4.0, 4.0, 2.0, 1.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.0001628398895263672, -0.00015853624790906906, -0.00015423260629177094, -0.0001499289646744728, -0.00014562532305717468, -0.00014132168143987656, -0.00013701803982257843, -0.0001327143982052803, -0.00012841075658798218, -0.00012410711497068405, -0.00011980347335338593, -0.0001154998317360878, -0.00011119619011878967, -0.00010689254850149155, -0.00010258890688419342, -9.82852652668953e-05, -9.398162364959717e-05, -8.967798203229904e-05, -8.537434041500092e-05, -8.107069879770279e-05, -7.676705718040466e-05, -7.246341556310654e-05, -6.815977394580841e-05, -6.385613232851028e-05, -5.955249071121216e-05, -5.524884909391403e-05, -5.0945207476615906e-05, -4.664156585931778e-05, -4.233792424201965e-05, -3.803428262472153e-05, -3.37306410074234e-05, -2.9426999390125275e-05, -2.512335777282715e-05, -2.0819716155529022e-05, -1.6516074538230896e-05, -1.221243292093277e-05, -7.908791303634644e-06, -3.6051496863365173e-06, 6.984919309616089e-07, 5.002133548259735e-06, 9.305775165557861e-06, 1.3609416782855988e-05, 1.7913058400154114e-05, 2.221670001745224e-05, 2.6520341634750366e-05, 3.082398325204849e-05, 3.512762486934662e-05, 3.9431266486644745e-05, 4.373490810394287e-05, 4.8038549721241e-05, 5.2342191338539124e-05, 5.664583295583725e-05, 6.0949474573135376e-05, 6.52531161904335e-05, 6.955675780773163e-05, 7.386039942502975e-05, 7.816404104232788e-05, 8.246768265962601e-05, 8.677132427692413e-05, 9.107496589422226e-05, 9.537860751152039e-05, 9.968224912881851e-05, 0.00010398589074611664, 0.00010828953236341476, 0.00011259317398071289]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 7.0, 10.0, 13.0, 7.0, 21.0, 17.0, 26.0, 53.0, 59.0, 120.0, 181.0, 303.0, 499.0, 990.0, 1972.0, 4321.0, 10786.0, 33436.0, 192392.0, 733436.0, 46088.0, 13759.0, 5236.0, 2262.0, 1141.0, 617.0, 315.0, 207.0, 124.0, 48.0, 30.0, 29.0, 18.0, 12.0, 7.0, 3.0, 8.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.189208984375, -0.18167495727539062, -0.17414093017578125, -0.16660690307617188, -0.1590728759765625, -0.15153884887695312, -0.14400482177734375, -0.13647079467773438, -0.128936767578125, -0.12140274047851562, -0.11386871337890625, -0.10633468627929688, -0.0988006591796875, -0.09126663208007812, -0.08373260498046875, -0.07619857788085938, -0.06866455078125, -0.061130523681640625, -0.05359649658203125, -0.046062469482421875, -0.0385284423828125, -0.030994415283203125, -0.02346038818359375, -0.015926361083984375, -0.008392333984375, -0.000858306884765625, 0.00667572021484375, 0.014209747314453125, 0.0217437744140625, 0.029277801513671875, 0.03681182861328125, 0.044345855712890625, 0.0518798828125, 0.059413909912109375, 0.06694793701171875, 0.07448196411132812, 0.0820159912109375, 0.08955001831054688, 0.09708404541015625, 0.10461807250976562, 0.112152099609375, 0.11968612670898438, 0.12722015380859375, 0.13475418090820312, 0.1422882080078125, 0.14982223510742188, 0.15735626220703125, 0.16489028930664062, 0.17242431640625, 0.17995834350585938, 0.18749237060546875, 0.19502639770507812, 0.2025604248046875, 0.21009445190429688, 0.21762847900390625, 0.22516250610351562, 0.232696533203125, 0.24023056030273438, 0.24776458740234375, 0.2552986145019531, 0.2628326416015625, 0.2703666687011719, 0.27790069580078125, 0.2854347229003906, 0.29296875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 5.0, 6.0, 3.0, 4.0, 6.0, 1.0, 3.0, 9.0, 7.0, 9.0, 11.0, 13.0, 18.0, 18.0, 25.0, 30.0, 45.0, 41.0, 77.0, 94.0, 116.0, 86.0, 92.0, 67.0, 45.0, 48.0, 21.0, 20.0, 9.0, 14.0, 6.0, 16.0, 9.0, 8.0, 3.0, 4.0, 2.0, 11.0, 2.0, 3.0, 0.0, 1.0, 3.0], "bins": [-0.3974609375, -0.3878898620605469, -0.37831878662109375, -0.3687477111816406, -0.3591766357421875, -0.3496055603027344, -0.34003448486328125, -0.3304634094238281, -0.320892333984375, -0.3113212585449219, -0.30175018310546875, -0.2921791076660156, -0.2826080322265625, -0.2730369567871094, -0.26346588134765625, -0.2538948059082031, -0.24432373046875, -0.23475265502929688, -0.22518157958984375, -0.21561050415039062, -0.2060394287109375, -0.19646835327148438, -0.18689727783203125, -0.17732620239257812, -0.167755126953125, -0.15818405151367188, -0.14861297607421875, -0.13904190063476562, -0.1294708251953125, -0.11989974975585938, -0.11032867431640625, -0.10075759887695312, -0.0911865234375, -0.08161544799804688, -0.07204437255859375, -0.062473297119140625, -0.0529022216796875, -0.043331146240234375, -0.03376007080078125, -0.024188995361328125, -0.014617919921875, -0.005046844482421875, 0.00452423095703125, 0.014095306396484375, 0.0236663818359375, 0.033237457275390625, 0.04280853271484375, 0.052379608154296875, 0.06195068359375, 0.07152175903320312, 0.08109283447265625, 0.09066390991210938, 0.1002349853515625, 0.10980606079101562, 0.11937713623046875, 0.12894821166992188, 0.138519287109375, 0.14809036254882812, 0.15766143798828125, 0.16723251342773438, 0.1768035888671875, 0.18637466430664062, 0.19594573974609375, 0.20551681518554688, 0.215087890625]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 3.0, 3.0, 8.0, 18.0, 32.0, 74.0, 197.0, 479.0, 68.0, 63.0, 29.0, 6.0, 9.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.75851058959961, -15.283124923706055, -14.807740211486816, -14.332355499267578, -13.856969833374023, -13.381584167480469, -12.90619945526123, -12.430814743041992, -11.955429077148438, -11.480043411254883, -11.004658699035645, -10.529273986816406, -10.053888320922852, -9.578502655029297, -9.103117942810059, -8.62773323059082, -8.152347564697266, -7.676962375640869, -7.201577186584473, -6.726191997528076, -6.25080680847168, -5.775421619415283, -5.300036430358887, -4.82465124130249, -4.349266052246094, -3.8738808631896973, -3.398495674133301, -2.9231104850769043, -2.447725296020508, -1.9723401069641113, -1.4969549179077148, -1.0215697288513184, -0.5461854934692383, -0.0708003044128418, 0.4045848846435547, 0.8799700736999512, 1.3553552627563477, 1.8307404518127441, 2.3061256408691406, 2.781510829925537, 3.2568960189819336, 3.73228120803833, 4.207666397094727, 4.683051586151123, 5.1584367752075195, 5.633821964263916, 6.1092071533203125, 6.584592342376709, 7.0599775314331055, 7.535362720489502, 8.010747909545898, 8.486133575439453, 8.961518287658691, 9.43690299987793, 9.912288665771484, 10.387674331665039, 10.863059043884277, 11.338443756103516, 11.81382942199707, 12.289215087890625, 12.764599800109863, 13.239984512329102, 13.715370178222656, 14.190755844116211, 14.66614055633545]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 4.0, 5.0, 3.0, 4.0, 8.0, 12.0, 8.0, 12.0, 11.0, 13.0, 23.0, 19.0, 33.0, 31.0, 33.0, 139.0, 338.0, 73.0, 37.0, 25.0, 30.0, 24.0, 24.0, 28.0, 25.0, 10.0, 10.0, 8.0, 3.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.105731964111328, -10.80048656463623, -10.495241165161133, -10.189995765686035, -9.884750366210938, -9.57950496673584, -9.274259567260742, -8.969014167785645, -8.663768768310547, -8.35852336883545, -8.053277969360352, -7.748032569885254, -7.442787170410156, -7.137541770935059, -6.832296371459961, -6.527050971984863, -6.221806049346924, -5.916560649871826, -5.6113152503967285, -5.306069850921631, -5.000824451446533, -4.6955790519714355, -4.390334129333496, -4.085088729858398, -3.7798430919647217, -3.474597692489624, -3.1693522930145264, -2.864107131958008, -2.55886173248291, -2.2536163330078125, -1.9483709335327148, -1.6431255340576172, -1.3378801345825195, -1.0326347351074219, -0.727389395236969, -0.4221440553665161, -0.11689865589141846, 0.1883467435836792, 0.4935920238494873, 0.798837423324585, 1.1040828227996826, 1.4093282222747803, 1.714573621749878, 2.0198187828063965, 2.325064182281494, 2.630309581756592, 2.9355549812316895, 3.240800380706787, 3.5460457801818848, 3.8512911796569824, 4.15653657913208, 4.461781978607178, 4.767027378082275, 5.072272777557373, 5.3775177001953125, 5.68276309967041, 5.988008499145508, 6.2932538986206055, 6.598499298095703, 6.903744697570801, 7.208990097045898, 7.514235496520996, 7.819480895996094, 8.124726295471191, 8.429971694946289]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 3.0, 6.0, 6.0, 13.0, 21.0, 9.0, 27.0, 17.0, 32.0, 27.0, 49.0, 50.0, 66.0, 218.0, 146.0, 48.0, 42.0, 34.0, 26.0, 22.0, 21.0, 15.0, 17.0, 15.0, 11.0, 12.0, 10.0, 8.0, 2.0, 3.0, 2.0, 4.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.740234375, -0.7168350219726562, -0.6934356689453125, -0.6700363159179688, -0.646636962890625, -0.6232376098632812, -0.5998382568359375, -0.5764389038085938, -0.55303955078125, -0.5296401977539062, -0.5062408447265625, -0.48284149169921875, -0.459442138671875, -0.43604278564453125, -0.4126434326171875, -0.38924407958984375, -0.3658447265625, -0.34244537353515625, -0.3190460205078125, -0.29564666748046875, -0.272247314453125, -0.24884796142578125, -0.2254486083984375, -0.20204925537109375, -0.17864990234375, -0.15525054931640625, -0.1318511962890625, -0.10845184326171875, -0.085052490234375, -0.06165313720703125, -0.0382537841796875, -0.01485443115234375, 0.008544921875, 0.03194427490234375, 0.0553436279296875, 0.07874298095703125, 0.102142333984375, 0.12554168701171875, 0.1489410400390625, 0.17234039306640625, 0.19573974609375, 0.21913909912109375, 0.2425384521484375, 0.26593780517578125, 0.289337158203125, 0.31273651123046875, 0.3361358642578125, 0.35953521728515625, 0.3829345703125, 0.40633392333984375, 0.4297332763671875, 0.45313262939453125, 0.476531982421875, 0.49993133544921875, 0.5233306884765625, 0.5467300415039062, 0.57012939453125, 0.5935287475585938, 0.6169281005859375, 0.6403274536132812, 0.663726806640625, 0.6871261596679688, 0.7105255126953125, 0.7339248657226562, 0.75732421875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 6.0, 11.0, 6.0, 4.0, 13.0, 27.0, 38.0, 63.0, 58.0, 132.0, 230.0, 606.0, 2136.0, 10770.0, 8347408.0, 22437.0, 3119.0, 814.0, 285.0, 145.0, 105.0, 56.0, 24.0, 19.0, 20.0, 14.0, 7.0, 3.0, 1.0, 3.0, 4.0, 4.0, 5.0, 7.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-6.430327415466309, -6.197672367095947, -5.965016841888428, -5.732361793518066, -5.499706745147705, -5.267051696777344, -5.034396171569824, -4.801741123199463, -4.569086074829102, -4.33643102645874, -4.103775501251221, -3.8711204528808594, -3.638465404510498, -3.4058101177215576, -3.173154830932617, -2.940499782562256, -2.7078444957733154, -2.475189208984375, -2.2425341606140137, -2.0098788738250732, -1.777223825454712, -1.5445685386657715, -1.3119133710861206, -1.0792582035064697, -0.8466030359268188, -0.613947868347168, -0.3812926709651947, -0.14863747358322144, 0.08401769399642944, 0.3166729211807251, 0.549328088760376, 0.7819832563400269, 1.0146384239196777, 1.2472935914993286, 1.4799487590789795, 1.71260404586792, 1.9452590942382812, 2.1779143810272217, 2.410569667816162, 2.6432247161865234, 2.8758797645568848, 3.108535051345825, 3.3411900997161865, 3.573845386505127, 3.8065004348754883, 4.039155960083008, 4.271811008453369, 4.5044660568237305, 4.73712158203125, 4.969776630401611, 5.202432155609131, 5.435087203979492, 5.6677422523498535, 5.900397300720215, 6.133052825927734, 6.365707874298096, 6.598362922668457, 6.831017971038818, 7.063673496246338, 7.296328544616699, 7.5289835929870605, 7.761638641357422, 7.994294166564941, 8.226949691772461, 8.459604263305664]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 0.0, 3.0, 2.0, 5.0, 3.0, 1.0, 1.0, 11.0, 5.0, 0.0, 4.0, 3.0, 4.0, 7.0, 10.0, 2.0, 4.0, 4.0, 2.0, 7.0, 4.0, 2.0, 2.0, 1.0, 3.0, 3.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.243095874786377, -5.058807373046875, -4.874518394470215, -4.690229892730713, -4.505941390991211, -4.321652889251709, -4.137364387512207, -3.953075408935547, -3.768786907196045, -3.584498405456543, -3.400209665298462, -3.215920925140381, -3.031632423400879, -2.847343921661377, -2.663055181503296, -2.478766441345215, -2.294477939605713, -2.110189437866211, -1.9259006977081299, -1.7416120767593384, -1.5573234558105469, -1.3730348348617554, -1.1887462139129639, -1.0044575929641724, -0.8201689720153809, -0.6358803510665894, -0.45159173011779785, -0.26730310916900635, -0.08301448822021484, 0.10127413272857666, 0.28556275367736816, 0.46985137462615967, 0.6541399955749512, 0.8384286165237427, 1.0227172374725342, 1.2070058584213257, 1.3912944793701172, 1.5755831003189087, 1.7598717212677002, 1.9441603422164917, 2.128448963165283, 2.312737464904785, 2.497026205062866, 2.6813149452209473, 2.865603446960449, 3.049891948699951, 3.2341806888580322, 3.4184694290161133, 3.6027579307556152, 3.787046432495117, 3.9713351726531982, 4.155623912811279, 4.339912414550781, 4.524200916290283, 4.708489418029785, 4.892778396606445, 5.077066898345947, 5.261355400085449, 5.445644378662109, 5.629932880401611, 5.814221382141113, 5.998509883880615, 6.182798385620117, 6.367087364196777, 6.551375865936279]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 10.0, 5.0, 12.0, 14.0, 18.0, 15.0, 28.0, 40.0, 50.0, 96.0, 115.0, 216.0, 289.0, 619.0, 1277.0, 3117.0, 8882.0, 27000.0, 91343.0, 226016.0, 114665.0, 33315.0, 10358.0, 3566.0, 1409.0, 677.0, 352.0, 215.0, 151.0, 102.0, 82.0, 47.0, 51.0, 26.0, 25.0, 15.0, 13.0, 7.0, 9.0, 4.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.984375, -5.79498291015625, -5.6055908203125, -5.41619873046875, -5.226806640625, -5.03741455078125, -4.8480224609375, -4.65863037109375, -4.46923828125, -4.27984619140625, -4.0904541015625, -3.90106201171875, -3.711669921875, -3.52227783203125, -3.3328857421875, -3.14349365234375, -2.9541015625, -2.76470947265625, -2.5753173828125, -2.38592529296875, -2.196533203125, -2.00714111328125, -1.8177490234375, -1.62835693359375, -1.43896484375, -1.24957275390625, -1.0601806640625, -0.87078857421875, -0.681396484375, -0.49200439453125, -0.3026123046875, -0.11322021484375, 0.076171875, 0.26556396484375, 0.4549560546875, 0.64434814453125, 0.833740234375, 1.02313232421875, 1.2125244140625, 1.40191650390625, 1.59130859375, 1.78070068359375, 1.9700927734375, 2.15948486328125, 2.348876953125, 2.53826904296875, 2.7276611328125, 2.91705322265625, 3.1064453125, 3.29583740234375, 3.4852294921875, 3.67462158203125, 3.864013671875, 4.05340576171875, 4.2427978515625, 4.43218994140625, 4.62158203125, 4.81097412109375, 5.0003662109375, 5.18975830078125, 5.379150390625, 5.56854248046875, 5.7579345703125, 5.94732666015625, 6.13671875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 8.0, 15.0, 34.0, 39.0, 76.0, 119.0, 163.0, 160.0, 145.0, 111.0, 60.0, 33.0, 31.0, 13.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.95703125, -1.888214111328125, -1.81939697265625, -1.750579833984375, -1.6817626953125, -1.612945556640625, -1.54412841796875, -1.475311279296875, -1.406494140625, -1.337677001953125, -1.26885986328125, -1.200042724609375, -1.1312255859375, -1.062408447265625, -0.99359130859375, -0.924774169921875, -0.85595703125, -0.787139892578125, -0.71832275390625, -0.649505615234375, -0.5806884765625, -0.511871337890625, -0.44305419921875, -0.374237060546875, -0.305419921875, -0.236602783203125, -0.16778564453125, -0.098968505859375, -0.0301513671875, 0.038665771484375, 0.10748291015625, 0.176300048828125, 0.2451171875, 0.313934326171875, 0.38275146484375, 0.451568603515625, 0.5203857421875, 0.589202880859375, 0.65802001953125, 0.726837158203125, 0.795654296875, 0.864471435546875, 0.93328857421875, 1.002105712890625, 1.0709228515625, 1.139739990234375, 1.20855712890625, 1.277374267578125, 1.34619140625, 1.415008544921875, 1.48382568359375, 1.552642822265625, 1.6214599609375, 1.690277099609375, 1.75909423828125, 1.827911376953125, 1.896728515625, 1.965545654296875, 2.03436279296875, 2.103179931640625, 2.1719970703125, 2.240814208984375, 2.30963134765625, 2.378448486328125, 2.447265625]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 3.0, 3.0, 7.0, 5.0, 5.0, 9.0, 17.0, 34.0, 45.0, 82.0, 77.0, 75.0, 43.0, 24.0, 12.0, 12.0, 6.0, 5.0, 7.0, 6.0, 3.0, 4.0, 3.0, 4.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.181715488433838, -5.986423015594482, -5.791130542755127, -5.5958380699157715, -5.400545597076416, -5.2052531242370605, -5.009961128234863, -4.814668655395508, -4.619376182556152, -4.424083709716797, -4.228791236877441, -4.033498764038086, -3.8382062911987305, -3.642913818359375, -3.4476215839385986, -3.252329111099243, -3.0570363998413086, -2.861743927001953, -2.6664514541625977, -2.471158981323242, -2.2758665084838867, -2.0805740356445312, -1.8852818012237549, -1.6899893283843994, -1.494696855545044, -1.2994043827056885, -1.104111909866333, -0.9088195562362671, -0.7135270833969116, -0.5182346105575562, -0.32294225692749023, -0.12764978408813477, 0.0676422119140625, 0.2629346549510956, 0.45822709798812866, 0.6535195112228394, 0.8488119840621948, 1.0441044569015503, 1.2393968105316162, 1.4346892833709717, 1.6299817562103271, 1.8252742290496826, 2.020566701889038, 2.2158589363098145, 2.41115140914917, 2.6064438819885254, 2.801736354827881, 2.9970288276672363, 3.192321300506592, 3.3876137733459473, 3.5829062461853027, 3.778198719024658, 3.9734911918640137, 4.168783664703369, 4.364075660705566, 4.559368133544922, 4.754660606384277, 4.949953079223633, 5.145245552062988, 5.340538024902344, 5.535830497741699, 5.731122970581055, 5.92641544342041, 6.121707916259766, 6.317000389099121]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 1.0, 4.0, 3.0, 5.0, 5.0, 9.0, 13.0, 33.0, 68.0, 102.0, 89.0, 55.0, 26.0, 10.0, 7.0, 7.0, 5.0, 5.0, 2.0, 3.0, 1.0, 5.0, 3.0, 6.0, 2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7101640701293945, -4.532390117645264, -4.354616641998291, -4.17684268951416, -3.9990689754486084, -3.8212952613830566, -3.643521547317505, -3.465747833251953, -3.2879738807678223, -3.1102001667022705, -2.9324264526367188, -2.754652500152588, -2.576878786087036, -2.3991050720214844, -2.2213313579559326, -2.043557643890381, -1.865783929824829, -1.6880102157592773, -1.510236382484436, -1.3324626684188843, -1.154688835144043, -0.9769151210784912, -0.7991414070129395, -0.6213675737380981, -0.4435938596725464, -0.26582008600234985, -0.08804634213447571, 0.08972740173339844, 0.26750117540359497, 0.4452749490737915, 0.6230486631393433, 0.8008224964141846, 0.9785962104797363, 1.156369924545288, 1.3341437578201294, 1.5119174718856812, 1.6896913051605225, 1.8674650192260742, 2.045238733291626, 2.2230124473571777, 2.4007863998413086, 2.5785601139068604, 2.756333827972412, 2.934107780456543, 3.1118814945220947, 3.2896552085876465, 3.4674289226531982, 3.64520263671875, 3.8229763507843018, 4.0007500648498535, 4.178524017333984, 4.356297492980957, 4.534071445465088, 4.711845397949219, 4.889618873596191, 5.067392826080322, 5.245166301727295, 5.422940254211426, 5.600713729858398, 5.778487682342529, 5.956261157989502, 6.134035110473633, 6.3118085861206055, 6.489582538604736, 6.667356491088867]}, "eval/loss": 4.671250343322754, "eval/wer": 1.9355811186037286, "eval/runtime": 785.3163, "eval/samples_per_second": 3.364, "eval/steps_per_second": 0.281} \ No newline at end of file +{"train/loss": 4.425, "train/learning_rate": 2.8011611030478957e-05, "train/epoch": 0.84, "train/global_step": 1000, "_runtime": 5740, "_timestamp": 1646185121, "_step": 1001, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 315.0, 699.0, 2.0, 0.0, 1.0], "bins": [-924.809326171875, -909.4195556640625, -894.02978515625, -878.6399536132812, -863.2501831054688, -847.8604125976562, -832.4706420898438, -817.080810546875, -801.6910400390625, -786.30126953125, -770.9114990234375, -755.5216674804688, -740.1318969726562, -724.7421264648438, -709.3523559570312, -693.9625244140625, -678.57275390625, -663.1829833984375, -647.793212890625, -632.4033813476562, -617.0136108398438, -601.6238403320312, -586.2340698242188, -570.84423828125, -555.4544677734375, -540.064697265625, -524.6749267578125, -509.2851257324219, -493.89532470703125, -478.50555419921875, -463.1157531738281, -447.7259826660156, -432.336181640625, -416.9464111328125, -401.5566101074219, -386.1668395996094, -370.77703857421875, -355.38726806640625, -339.9974670410156, -324.6076965332031, -309.2179260253906, -293.8281555175781, -278.4383544921875, -263.048583984375, -247.65878295898438, -232.26901245117188, -216.87921142578125, -201.48944091796875, -186.09963989257812, -170.70985412597656, -155.320068359375, -139.93028259277344, -124.54049682617188, -109.15071868896484, -93.76093292236328, -78.37114715576172, -62.98135757446289, -47.59157180786133, -32.20178985595703, -16.81200408935547, -1.4222183227539062, 13.96756362915039, 29.357349395751953, 44.747135162353516, 60.13692092895508]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 4.0, 4.0, 2.0, 6.0, 10.0, 5.0, 14.0, 21.0, 29.0, 35.0, 44.0, 45.0, 57.0, 57.0, 62.0, 54.0, 65.0, 84.0, 73.0, 51.0, 71.0, 53.0, 51.0, 30.0, 17.0, 24.0, 11.0, 8.0, 8.0, 6.0, 5.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-81.4429931640625, -79.00655364990234, -76.57011413574219, -74.13367462158203, -71.69723510742188, -69.26079559326172, -66.82435607910156, -64.3879165649414, -61.95147705078125, -59.515037536621094, -57.07859802246094, -54.64215850830078, -52.205718994140625, -49.76927947998047, -47.33283996582031, -44.896400451660156, -42.4599609375, -40.023521423339844, -37.58708190917969, -35.15064239501953, -32.714202880859375, -30.27776336669922, -27.841323852539062, -25.404884338378906, -22.96844482421875, -20.532005310058594, -18.095565795898438, -15.659126281738281, -13.222686767578125, -10.786247253417969, -8.349807739257812, -5.913368225097656, -3.4769287109375, -1.0404891967773438, 1.3959503173828125, 3.8323898315429688, 6.268829345703125, 8.705268859863281, 11.141708374023438, 13.578147888183594, 16.01458740234375, 18.451026916503906, 20.887466430664062, 23.32390594482422, 25.760345458984375, 28.19678497314453, 30.633224487304688, 33.069664001464844, 35.506103515625, 37.942543029785156, 40.37898254394531, 42.81542205810547, 45.251861572265625, 47.68830108642578, 50.12474060058594, 52.561180114746094, 54.99761962890625, 57.434059143066406, 59.87049865722656, 62.30693817138672, 64.74337768554688, 67.17981719970703, 69.61625671386719, 72.05269622802734, 74.4891357421875]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 8.0, 7.0, 7.0, 8.0, 6.0, 9.0, 12.0, 34.0, 24.0, 37.0, 25.0, 35.0, 31.0, 50.0, 40.0, 48.0, 45.0, 39.0, 52.0, 50.0, 55.0, 47.0, 49.0, 46.0, 41.0, 37.0, 34.0, 28.0, 28.0, 20.0, 12.0, 7.0, 12.0, 7.0, 7.0, 2.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.75390625, -1.687469482421875, -1.62103271484375, -1.554595947265625, -1.4881591796875, -1.421722412109375, -1.35528564453125, -1.288848876953125, -1.222412109375, -1.155975341796875, -1.08953857421875, -1.023101806640625, -0.9566650390625, -0.890228271484375, -0.82379150390625, -0.757354736328125, -0.69091796875, -0.624481201171875, -0.55804443359375, -0.491607666015625, -0.4251708984375, -0.358734130859375, -0.29229736328125, -0.225860595703125, -0.159423828125, -0.092987060546875, -0.02655029296875, 0.039886474609375, 0.1063232421875, 0.172760009765625, 0.23919677734375, 0.305633544921875, 0.3720703125, 0.438507080078125, 0.50494384765625, 0.571380615234375, 0.6378173828125, 0.704254150390625, 0.77069091796875, 0.837127685546875, 0.903564453125, 0.970001220703125, 1.03643798828125, 1.102874755859375, 1.1693115234375, 1.235748291015625, 1.30218505859375, 1.368621826171875, 1.43505859375, 1.501495361328125, 1.56793212890625, 1.634368896484375, 1.7008056640625, 1.767242431640625, 1.83367919921875, 1.900115966796875, 1.966552734375, 2.032989501953125, 2.09942626953125, 2.165863037109375, 2.2322998046875, 2.298736572265625, 2.36517333984375, 2.431610107421875, 2.498046875]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 8.0, 4.0, 8.0, 15.0, 19.0, 26.0, 39.0, 54.0, 76.0, 129.0, 157.0, 255.0, 384.0, 630.0, 1084.0, 2168.0, 5136.0, 18434.0, 108915.0, 1991648.0, 1932368.0, 104808.0, 17783.0, 5253.0, 2074.0, 1064.0, 605.0, 373.0, 244.0, 160.0, 115.0, 61.0, 49.0, 43.0, 26.0, 20.0, 14.0, 13.0, 5.0, 9.0, 2.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.1640625, -8.8245849609375, -8.485107421875, -8.1456298828125, -7.80615234375, -7.4666748046875, -7.127197265625, -6.7877197265625, -6.4482421875, -6.1087646484375, -5.769287109375, -5.4298095703125, -5.09033203125, -4.7508544921875, -4.411376953125, -4.0718994140625, -3.732421875, -3.3929443359375, -3.053466796875, -2.7139892578125, -2.37451171875, -2.0350341796875, -1.695556640625, -1.3560791015625, -1.0166015625, -0.6771240234375, -0.337646484375, 0.0018310546875, 0.34130859375, 0.6807861328125, 1.020263671875, 1.3597412109375, 1.69921875, 2.0386962890625, 2.378173828125, 2.7176513671875, 3.05712890625, 3.3966064453125, 3.736083984375, 4.0755615234375, 4.4150390625, 4.7545166015625, 5.093994140625, 5.4334716796875, 5.77294921875, 6.1124267578125, 6.451904296875, 6.7913818359375, 7.130859375, 7.4703369140625, 7.809814453125, 8.1492919921875, 8.48876953125, 8.8282470703125, 9.167724609375, 9.5072021484375, 9.8466796875, 10.1861572265625, 10.525634765625, 10.8651123046875, 11.20458984375, 11.5440673828125, 11.883544921875, 12.2230224609375, 12.5625]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 7.0, 17.0, 55.0, 113.0, 321.0, 722.0, 1254.0, 878.0, 418.0, 179.0, 62.0, 23.0, 15.0, 8.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-29.6875, -29.00830078125, -28.3291015625, -27.64990234375, -26.970703125, -26.29150390625, -25.6123046875, -24.93310546875, -24.25390625, -23.57470703125, -22.8955078125, -22.21630859375, -21.537109375, -20.85791015625, -20.1787109375, -19.49951171875, -18.8203125, -18.14111328125, -17.4619140625, -16.78271484375, -16.103515625, -15.42431640625, -14.7451171875, -14.06591796875, -13.38671875, -12.70751953125, -12.0283203125, -11.34912109375, -10.669921875, -9.99072265625, -9.3115234375, -8.63232421875, -7.953125, -7.27392578125, -6.5947265625, -5.91552734375, -5.236328125, -4.55712890625, -3.8779296875, -3.19873046875, -2.51953125, -1.84033203125, -1.1611328125, -0.48193359375, 0.197265625, 0.87646484375, 1.5556640625, 2.23486328125, 2.9140625, 3.59326171875, 4.2724609375, 4.95166015625, 5.630859375, 6.31005859375, 6.9892578125, 7.66845703125, 8.34765625, 9.02685546875, 9.7060546875, 10.38525390625, 11.064453125, 11.74365234375, 12.4228515625, 13.10205078125, 13.78125]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 4.0, 10.0, 22.0, 60.0, 184.0, 600.0, 2690.0, 2091270.0, 2095917.0, 2577.0, 637.0, 183.0, 72.0, 26.0, 13.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.8125, -78.287109375, -75.76171875, -73.236328125, -70.7109375, -68.185546875, -65.66015625, -63.134765625, -60.609375, -58.083984375, -55.55859375, -53.033203125, -50.5078125, -47.982421875, -45.45703125, -42.931640625, -40.40625, -37.880859375, -35.35546875, -32.830078125, -30.3046875, -27.779296875, -25.25390625, -22.728515625, -20.203125, -17.677734375, -15.15234375, -12.626953125, -10.1015625, -7.576171875, -5.05078125, -2.525390625, 0.0, 2.525390625, 5.05078125, 7.576171875, 10.1015625, 12.626953125, 15.15234375, 17.677734375, 20.203125, 22.728515625, 25.25390625, 27.779296875, 30.3046875, 32.830078125, 35.35546875, 37.880859375, 40.40625, 42.931640625, 45.45703125, 47.982421875, 50.5078125, 53.033203125, 55.55859375, 58.083984375, 60.609375, 63.134765625, 65.66015625, 68.185546875, 70.7109375, 73.236328125, 75.76171875, 78.287109375, 80.8125]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 5.0, 517.0, 481.0, 9.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.01999282836914, -24.805633544921875, -16.59127426147461, -8.376914978027344, -0.16255569458007812, 8.051803588867188, 16.266162872314453, 24.48052215576172, 32.694881439208984, 40.90924072265625, 49.123600006103516, 57.33795928955078, 65.55232238769531, 73.76667785644531, 81.98103332519531, 90.19539642333984, 98.40975952148438, 106.62411499023438, 114.8384780883789, 123.05284118652344, 131.26719665527344, 139.48155212402344, 147.6959228515625, 155.9102783203125, 164.1246337890625, 172.3389892578125, 180.5533447265625, 188.76771545410156, 196.98207092285156, 205.19642639160156, 213.41079711914062, 221.62515258789062, 229.83950805664062, 238.05386352539062, 246.26821899414062, 254.4825897216797, 262.69696044921875, 270.91131591796875, 279.12567138671875, 287.34002685546875, 295.55438232421875, 303.76873779296875, 311.98309326171875, 320.19744873046875, 328.41180419921875, 336.6261901855469, 344.8405456542969, 353.0549011230469, 361.2692565917969, 369.4836120605469, 377.6979675292969, 385.9123229980469, 394.126708984375, 402.341064453125, 410.555419921875, 418.769775390625, 426.984130859375, 435.198486328125, 443.412841796875, 451.627197265625, 459.841552734375, 468.0559387207031, 476.2702941894531, 484.4846496582031, 492.6990051269531]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 8.0, 6.0, 13.0, 9.0, 29.0, 17.0, 24.0, 30.0, 42.0, 38.0, 33.0, 46.0, 60.0, 43.0, 34.0, 57.0, 44.0, 57.0, 68.0, 37.0, 49.0, 35.0, 40.0, 33.0, 27.0, 32.0, 20.0, 15.0, 9.0, 11.0, 10.0, 11.0, 7.0, 5.0, 3.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.7867431640625, -36.5736083984375, -35.3604736328125, -34.147342681884766, -32.934207916259766, -31.721073150634766, -30.5079402923584, -29.29480743408203, -28.08167266845703, -26.86853790283203, -25.655405044555664, -24.442272186279297, -23.229137420654297, -22.016002655029297, -20.80286979675293, -19.589736938476562, -18.376602172851562, -17.163467407226562, -15.950334548950195, -14.737200736999512, -13.524066925048828, -12.310933113098145, -11.097799301147461, -9.884665489196777, -8.671531677246094, -7.45839786529541, -6.245264053344727, -5.032130241394043, -3.8189964294433594, -2.605862617492676, -1.3927288055419922, -0.1795949935913086, 1.033538818359375, 2.2466726303100586, 3.459806442260742, 4.672940254211426, 5.886074066162109, 7.099207878112793, 8.312341690063477, 9.52547550201416, 10.738609313964844, 11.951743125915527, 13.164876937866211, 14.378010749816895, 15.591144561767578, 16.804279327392578, 18.017412185668945, 19.230545043945312, 20.443679809570312, 21.656814575195312, 22.86994743347168, 24.083080291748047, 25.296215057373047, 26.509349822998047, 27.722482681274414, 28.93561553955078, 30.14875030517578, 31.36188507080078, 32.57501983642578, 33.788150787353516, 35.001285552978516, 36.214420318603516, 37.42755126953125, 38.64068603515625, 39.85382080078125]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 6.0, 4.0, 3.0, 3.0, 3.0, 9.0, 9.0, 8.0, 8.0, 13.0, 11.0, 11.0, 21.0, 27.0, 24.0, 22.0, 36.0, 31.0, 33.0, 21.0, 36.0, 30.0, 33.0, 36.0, 41.0, 38.0, 35.0, 38.0, 26.0, 39.0, 42.0, 27.0, 39.0, 34.0, 23.0, 36.0, 33.0, 21.0, 15.0, 12.0, 13.0, 16.0, 6.0, 11.0, 4.0, 7.0, 3.0, 1.0, 7.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.7119140625, -1.6591644287109375, -1.606414794921875, -1.5536651611328125, -1.50091552734375, -1.4481658935546875, -1.395416259765625, -1.3426666259765625, -1.2899169921875, -1.2371673583984375, -1.184417724609375, -1.1316680908203125, -1.07891845703125, -1.0261688232421875, -0.973419189453125, -0.9206695556640625, -0.867919921875, -0.8151702880859375, -0.762420654296875, -0.7096710205078125, -0.65692138671875, -0.6041717529296875, -0.551422119140625, -0.4986724853515625, -0.4459228515625, -0.3931732177734375, -0.340423583984375, -0.2876739501953125, -0.23492431640625, -0.1821746826171875, -0.129425048828125, -0.0766754150390625, -0.02392578125, 0.0288238525390625, 0.081573486328125, 0.1343231201171875, 0.18707275390625, 0.2398223876953125, 0.292572021484375, 0.3453216552734375, 0.3980712890625, 0.4508209228515625, 0.503570556640625, 0.5563201904296875, 0.60906982421875, 0.6618194580078125, 0.714569091796875, 0.7673187255859375, 0.820068359375, 0.8728179931640625, 0.925567626953125, 0.9783172607421875, 1.03106689453125, 1.0838165283203125, 1.136566162109375, 1.1893157958984375, 1.2420654296875, 1.2948150634765625, 1.347564697265625, 1.4003143310546875, 1.45306396484375, 1.5058135986328125, 1.558563232421875, 1.6113128662109375, 1.6640625]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 7.0, 6.0, 6.0, 14.0, 15.0, 17.0, 18.0, 39.0, 43.0, 82.0, 96.0, 132.0, 178.0, 289.0, 414.0, 624.0, 895.0, 1355.0, 1949.0, 3118.0, 4879.0, 7756.0, 12476.0, 20125.0, 32929.0, 54153.0, 88061.0, 133396.0, 179180.0, 171905.0, 124449.0, 80253.0, 49670.0, 30297.0, 18277.0, 11331.0, 7024.0, 4444.0, 2866.0, 1875.0, 1313.0, 841.0, 567.0, 386.0, 230.0, 187.0, 118.0, 87.0, 60.0, 47.0, 25.0, 22.0, 16.0, 6.0, 7.0, 5.0, 5.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.1917724609375, -0.18535995483398438, -0.17894744873046875, -0.17253494262695312, -0.1661224365234375, -0.15970993041992188, -0.15329742431640625, -0.14688491821289062, -0.140472412109375, -0.13405990600585938, -0.12764739990234375, -0.12123489379882812, -0.1148223876953125, -0.10840988159179688, -0.10199737548828125, -0.09558486938476562, -0.08917236328125, -0.08275985717773438, -0.07634735107421875, -0.06993484497070312, -0.0635223388671875, -0.057109832763671875, -0.05069732666015625, -0.044284820556640625, -0.037872314453125, -0.031459808349609375, -0.02504730224609375, -0.018634796142578125, -0.0122222900390625, -0.005809783935546875, 0.00060272216796875, 0.007015228271484375, 0.013427734375, 0.019840240478515625, 0.02625274658203125, 0.032665252685546875, 0.0390777587890625, 0.045490264892578125, 0.05190277099609375, 0.058315277099609375, 0.064727783203125, 0.07114028930664062, 0.07755279541015625, 0.08396530151367188, 0.0903778076171875, 0.09679031372070312, 0.10320281982421875, 0.10961532592773438, 0.11602783203125, 0.12244033813476562, 0.12885284423828125, 0.13526535034179688, 0.1416778564453125, 0.14809036254882812, 0.15450286865234375, 0.16091537475585938, 0.167327880859375, 0.17374038696289062, 0.18015289306640625, 0.18656539916992188, 0.1929779052734375, 0.19939041137695312, 0.20580291748046875, 0.21221542358398438, 0.2186279296875]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 4.0, 3.0, 0.0, 4.0, 5.0, 0.0, 7.0, 5.0, 10.0, 9.0, 7.0, 12.0, 14.0, 11.0, 17.0, 17.0, 26.0, 21.0, 25.0, 23.0, 38.0, 27.0, 24.0, 39.0, 38.0, 39.0, 30.0, 1063.0, 43.0, 42.0, 52.0, 52.0, 31.0, 32.0, 39.0, 26.0, 34.0, 28.0, 26.0, 21.0, 17.0, 15.0, 15.0, 10.0, 10.0, 4.0, 12.0, 5.0, 1.0, 2.0, 0.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0673828125, -1.0301361083984375, -0.992889404296875, -0.9556427001953125, -0.91839599609375, -0.8811492919921875, -0.843902587890625, -0.8066558837890625, -0.7694091796875, -0.7321624755859375, -0.694915771484375, -0.6576690673828125, -0.62042236328125, -0.5831756591796875, -0.545928955078125, -0.5086822509765625, -0.471435546875, -0.4341888427734375, -0.396942138671875, -0.3596954345703125, -0.32244873046875, -0.2852020263671875, -0.247955322265625, -0.2107086181640625, -0.1734619140625, -0.1362152099609375, -0.098968505859375, -0.0617218017578125, -0.02447509765625, 0.0127716064453125, 0.050018310546875, 0.0872650146484375, 0.12451171875, 0.1617584228515625, 0.199005126953125, 0.2362518310546875, 0.27349853515625, 0.3107452392578125, 0.347991943359375, 0.3852386474609375, 0.4224853515625, 0.4597320556640625, 0.496978759765625, 0.5342254638671875, 0.57147216796875, 0.6087188720703125, 0.645965576171875, 0.6832122802734375, 0.720458984375, 0.7577056884765625, 0.794952392578125, 0.8321990966796875, 0.86944580078125, 0.9066925048828125, 0.943939208984375, 0.9811859130859375, 1.0184326171875, 1.0556793212890625, 1.092926025390625, 1.1301727294921875, 1.16741943359375, 1.2046661376953125, 1.241912841796875, 1.2791595458984375, 1.31640625]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 2.0, 8.0, 14.0, 10.0, 21.0, 41.0, 49.0, 69.0, 101.0, 162.0, 239.0, 413.0, 665.0, 943.0, 1488.0, 2373.0, 3818.0, 5807.0, 9319.0, 14640.0, 22717.0, 35626.0, 53727.0, 80071.0, 112617.0, 211470.0, 1116423.0, 136070.0, 97470.0, 66432.0, 44427.0, 28890.0, 18489.0, 11784.0, 7540.0, 4748.0, 2993.0, 1909.0, 1277.0, 800.0, 479.0, 348.0, 213.0, 143.0, 94.0, 69.0, 45.0, 27.0, 19.0, 18.0, 8.0, 4.0, 7.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.117919921875, -0.11437511444091797, -0.11083030700683594, -0.1072854995727539, -0.10374069213867188, -0.10019588470458984, -0.09665107727050781, -0.09310626983642578, -0.08956146240234375, -0.08601665496826172, -0.08247184753417969, -0.07892704010009766, -0.07538223266601562, -0.0718374252319336, -0.06829261779785156, -0.06474781036376953, -0.0612030029296875, -0.05765819549560547, -0.05411338806152344, -0.050568580627441406, -0.047023773193359375, -0.043478965759277344, -0.03993415832519531, -0.03638935089111328, -0.03284454345703125, -0.02929973602294922, -0.025754928588867188, -0.022210121154785156, -0.018665313720703125, -0.015120506286621094, -0.011575698852539062, -0.008030891418457031, -0.004486083984375, -0.0009412765502929688, 0.0026035308837890625, 0.006148338317871094, 0.009693145751953125, 0.013237953186035156, 0.016782760620117188, 0.02032756805419922, 0.02387237548828125, 0.02741718292236328, 0.030961990356445312, 0.034506797790527344, 0.038051605224609375, 0.041596412658691406, 0.04514122009277344, 0.04868602752685547, 0.0522308349609375, 0.05577564239501953, 0.05932044982910156, 0.0628652572631836, 0.06641006469726562, 0.06995487213134766, 0.07349967956542969, 0.07704448699951172, 0.08058929443359375, 0.08413410186767578, 0.08767890930175781, 0.09122371673583984, 0.09476852416992188, 0.0983133316040039, 0.10185813903808594, 0.10540294647216797, 0.10894775390625]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 1.0, 1.0, 6.0, 6.0, 5.0, 5.0, 2.0, 11.0, 16.0, 12.0, 11.0, 18.0, 16.0, 16.0, 31.0, 22.0, 30.0, 39.0, 28.0, 44.0, 51.0, 81.0, 95.0, 74.0, 50.0, 58.0, 47.0, 30.0, 27.0, 20.0, 21.0, 18.0, 25.0, 18.0, 10.0, 12.0, 11.0, 8.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 3.0, 5.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005962371826171875, -0.005777239799499512, -0.0055921077728271484, -0.005406975746154785, -0.005221843719482422, -0.005036711692810059, -0.004851579666137695, -0.004666447639465332, -0.004481315612792969, -0.0042961835861206055, -0.004111051559448242, -0.003925919532775879, -0.0037407875061035156, -0.0035556554794311523, -0.003370523452758789, -0.0031853914260864258, -0.0030002593994140625, -0.0028151273727416992, -0.002629995346069336, -0.0024448633193969727, -0.0022597312927246094, -0.002074599266052246, -0.0018894672393798828, -0.0017043352127075195, -0.0015192031860351562, -0.001334071159362793, -0.0011489391326904297, -0.0009638071060180664, -0.0007786750793457031, -0.0005935430526733398, -0.00040841102600097656, -0.00022327899932861328, -3.814697265625e-05, 0.00014698505401611328, 0.00033211708068847656, 0.0005172491073608398, 0.0007023811340332031, 0.0008875131607055664, 0.0010726451873779297, 0.001257777214050293, 0.0014429092407226562, 0.0016280412673950195, 0.0018131732940673828, 0.001998305320739746, 0.0021834373474121094, 0.0023685693740844727, 0.002553701400756836, 0.0027388334274291992, 0.0029239654541015625, 0.0031090974807739258, 0.003294229507446289, 0.0034793615341186523, 0.0036644935607910156, 0.003849625587463379, 0.004034757614135742, 0.0042198896408081055, 0.004405021667480469, 0.004590153694152832, 0.004775285720825195, 0.004960417747497559, 0.005145549774169922, 0.005330681800842285, 0.0055158138275146484, 0.005700945854187012, 0.005886077880859375]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 2.0, 3.0, 4.0, 2.0, 3.0, 5.0, 5.0, 7.0, 9.0, 5.0, 15.0, 23.0, 33.0, 23.0, 32.0, 55.0, 87.0, 113.0, 177.0, 245.0, 401.0, 860.0, 59303.0, 983680.0, 1947.0, 530.0, 305.0, 189.0, 140.0, 78.0, 66.0, 42.0, 38.0, 16.0, 14.0, 16.0, 23.0, 12.0, 16.0, 5.0, 6.0, 7.0, 5.0, 6.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1776123046875, -0.17083168029785156, -0.16405105590820312, -0.1572704315185547, -0.15048980712890625, -0.1437091827392578, -0.13692855834960938, -0.13014793395996094, -0.1233673095703125, -0.11658668518066406, -0.10980606079101562, -0.10302543640136719, -0.09624481201171875, -0.08946418762207031, -0.08268356323242188, -0.07590293884277344, -0.069122314453125, -0.06234169006347656, -0.055561065673828125, -0.04878044128417969, -0.04199981689453125, -0.03521919250488281, -0.028438568115234375, -0.021657943725585938, -0.0148773193359375, -0.008096694946289062, -0.001316070556640625, 0.0054645538330078125, 0.01224517822265625, 0.019025802612304688, 0.025806427001953125, 0.03258705139160156, 0.03936767578125, 0.04614830017089844, 0.052928924560546875, 0.05970954895019531, 0.06649017333984375, 0.07327079772949219, 0.08005142211914062, 0.08683204650878906, 0.0936126708984375, 0.10039329528808594, 0.10717391967773438, 0.11395454406738281, 0.12073516845703125, 0.1275157928466797, 0.13429641723632812, 0.14107704162597656, 0.147857666015625, 0.15463829040527344, 0.16141891479492188, 0.1681995391845703, 0.17498016357421875, 0.1817607879638672, 0.18854141235351562, 0.19532203674316406, 0.2021026611328125, 0.20888328552246094, 0.21566390991210938, 0.2224445343017578, 0.22922515869140625, 0.2360057830810547, 0.24278640747070312, 0.24956703186035156, 0.25634765625]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 7.0, 159.0, 838.0, 8.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.3295329213142395, -0.32378077507019043, -0.31802862882614136, -0.3122764825820923, -0.3065243661403656, -0.30077221989631653, -0.29502007365226746, -0.2892679274082184, -0.2835157811641693, -0.27776363492012024, -0.27201148867607117, -0.2662593424320221, -0.2605072259902954, -0.25475507974624634, -0.24900293350219727, -0.2432507872581482, -0.23749864101409912, -0.23174649477005005, -0.22599436342716217, -0.2202422171831131, -0.21449007093906403, -0.20873792469501495, -0.20298579335212708, -0.197233647108078, -0.19148151576519012, -0.18572936952114105, -0.17997723817825317, -0.1742250919342041, -0.16847294569015503, -0.16272079944610596, -0.15696866810321808, -0.151216521859169, -0.14546436071395874, -0.13971221446990967, -0.1339600831270218, -0.12820793688297272, -0.12245579063892365, -0.11670365184545517, -0.1109515130519867, -0.10519936680793762, -0.09944723546504974, -0.09369509667158127, -0.0879429504275322, -0.08219081163406372, -0.07643866539001465, -0.07068652659654617, -0.0649343878030777, -0.059182241559028625, -0.05343009531497955, -0.04767795279622078, -0.041925810277462006, -0.03617367148399353, -0.030421527102589607, -0.024669384583830833, -0.01891724392771721, -0.013165101408958435, -0.007412958890199661, -0.0016608168371021748, 0.004091325215995312, 0.009843466803431511, 0.015595609322190285, 0.02134775184094906, 0.027099892497062683, 0.03285203501582146, 0.03860417753458023]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 5.0, 13.0, 5.0, 12.0, 13.0, 18.0, 20.0, 20.0, 28.0, 34.0, 34.0, 50.0, 48.0, 58.0, 52.0, 44.0, 56.0, 44.0, 46.0, 62.0, 43.0, 37.0, 62.0, 34.0, 30.0, 33.0, 28.0, 21.0, 11.0, 8.0, 10.0, 5.0, 8.0, 0.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0075286030769348145, -0.0073126088827848434, -0.0070966146886348724, -0.006880620494484901, -0.00666462630033493, -0.006448632106184959, -0.006232637912034988, -0.006016643717885017, -0.005800649523735046, -0.005584655329585075, -0.005368661135435104, -0.005152666941285133, -0.004936672747135162, -0.004720678552985191, -0.00450468435883522, -0.004288690164685249, -0.004072695970535278, -0.0038567017763853073, -0.0036407075822353363, -0.0034247133880853653, -0.0032087191939353943, -0.0029927249997854233, -0.0027767308056354523, -0.0025607366114854813, -0.0023447424173355103, -0.0021287482231855392, -0.0019127540290355682, -0.0016967598348855972, -0.0014807656407356262, -0.0012647714465856552, -0.0010487772524356842, -0.0008327830582857132, -0.0006167888641357422, -0.0004007946699857712, -0.00018480047583580017, 3.119371831417084e-05, 0.00024718791246414185, 0.00046318210661411285, 0.0006791763007640839, 0.0008951704949140549, 0.0011111646890640259, 0.0013271588832139969, 0.001543153077363968, 0.001759147271513939, 0.00197514146566391, 0.002191135659813881, 0.002407129853963852, 0.002623124048113823, 0.002839118242263794, 0.003055112436413765, 0.003271106630563736, 0.003487100824713707, 0.003703095018863678, 0.003919089213013649, 0.00413508340716362, 0.004351077601313591, 0.004567071795463562, 0.004783065989613533, 0.004999060183763504, 0.005215054377913475, 0.005431048572063446, 0.005647042766213417, 0.005863036960363388, 0.006079031154513359, 0.00629502534866333]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 6.0, 4.0, 3.0, 3.0, 3.0, 9.0, 9.0, 8.0, 8.0, 13.0, 11.0, 11.0, 21.0, 27.0, 24.0, 22.0, 35.0, 32.0, 33.0, 21.0, 36.0, 30.0, 33.0, 36.0, 41.0, 38.0, 35.0, 38.0, 26.0, 39.0, 42.0, 27.0, 39.0, 34.0, 23.0, 36.0, 33.0, 21.0, 15.0, 11.0, 14.0, 16.0, 6.0, 11.0, 4.0, 7.0, 3.0, 1.0, 7.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.7119140625, -1.6591644287109375, -1.606414794921875, -1.5536651611328125, -1.50091552734375, -1.4481658935546875, -1.395416259765625, -1.3426666259765625, -1.2899169921875, -1.2371673583984375, -1.184417724609375, -1.1316680908203125, -1.07891845703125, -1.0261688232421875, -0.973419189453125, -0.9206695556640625, -0.867919921875, -0.8151702880859375, -0.762420654296875, -0.7096710205078125, -0.65692138671875, -0.6041717529296875, -0.551422119140625, -0.4986724853515625, -0.4459228515625, -0.3931732177734375, -0.340423583984375, -0.2876739501953125, -0.23492431640625, -0.1821746826171875, -0.129425048828125, -0.0766754150390625, -0.02392578125, 0.0288238525390625, 0.081573486328125, 0.1343231201171875, 0.18707275390625, 0.2398223876953125, 0.292572021484375, 0.3453216552734375, 0.3980712890625, 0.4508209228515625, 0.503570556640625, 0.5563201904296875, 0.60906982421875, 0.6618194580078125, 0.714569091796875, 0.7673187255859375, 0.820068359375, 0.8728179931640625, 0.925567626953125, 0.9783172607421875, 1.03106689453125, 1.0838165283203125, 1.136566162109375, 1.1893157958984375, 1.2420654296875, 1.2948150634765625, 1.347564697265625, 1.4003143310546875, 1.45306396484375, 1.5058135986328125, 1.558563232421875, 1.6113128662109375, 1.6640625]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 5.0, 3.0, 5.0, 7.0, 14.0, 15.0, 22.0, 21.0, 36.0, 45.0, 55.0, 79.0, 111.0, 158.0, 208.0, 339.0, 423.0, 633.0, 787.0, 1168.0, 1621.0, 2233.0, 3423.0, 5167.0, 8224.0, 14527.0, 34417.0, 131603.0, 506480.0, 236784.0, 51958.0, 19152.0, 9659.0, 6007.0, 4064.0, 2620.0, 1847.0, 1374.0, 923.0, 665.0, 457.0, 340.0, 239.0, 174.0, 139.0, 91.0, 67.0, 39.0, 43.0, 28.0, 24.0, 14.0, 5.0, 12.0, 8.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0], "bins": [-6.5625, -6.3553466796875, -6.148193359375, -5.9410400390625, -5.73388671875, -5.5267333984375, -5.319580078125, -5.1124267578125, -4.9052734375, -4.6981201171875, -4.490966796875, -4.2838134765625, -4.07666015625, -3.8695068359375, -3.662353515625, -3.4552001953125, -3.248046875, -3.0408935546875, -2.833740234375, -2.6265869140625, -2.41943359375, -2.2122802734375, -2.005126953125, -1.7979736328125, -1.5908203125, -1.3836669921875, -1.176513671875, -0.9693603515625, -0.76220703125, -0.5550537109375, -0.347900390625, -0.1407470703125, 0.06640625, 0.2735595703125, 0.480712890625, 0.6878662109375, 0.89501953125, 1.1021728515625, 1.309326171875, 1.5164794921875, 1.7236328125, 1.9307861328125, 2.137939453125, 2.3450927734375, 2.55224609375, 2.7593994140625, 2.966552734375, 3.1737060546875, 3.380859375, 3.5880126953125, 3.795166015625, 4.0023193359375, 4.20947265625, 4.4166259765625, 4.623779296875, 4.8309326171875, 5.0380859375, 5.2452392578125, 5.452392578125, 5.6595458984375, 5.86669921875, 6.0738525390625, 6.281005859375, 6.4881591796875, 6.6953125]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 2.0, 3.0, 1.0, 9.0, 10.0, 12.0, 20.0, 24.0, 23.0, 20.0, 26.0, 30.0, 49.0, 36.0, 44.0, 66.0, 83.0, 121.0, 247.0, 1460.0, 233.0, 132.0, 74.0, 57.0, 34.0, 43.0, 23.0, 25.0, 33.0, 20.0, 21.0, 21.0, 17.0, 12.0, 4.0, 6.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.078125, -6.865966796875, -6.65380859375, -6.441650390625, -6.2294921875, -6.017333984375, -5.80517578125, -5.593017578125, -5.380859375, -5.168701171875, -4.95654296875, -4.744384765625, -4.5322265625, -4.320068359375, -4.10791015625, -3.895751953125, -3.68359375, -3.471435546875, -3.25927734375, -3.047119140625, -2.8349609375, -2.622802734375, -2.41064453125, -2.198486328125, -1.986328125, -1.774169921875, -1.56201171875, -1.349853515625, -1.1376953125, -0.925537109375, -0.71337890625, -0.501220703125, -0.2890625, -0.076904296875, 0.13525390625, 0.347412109375, 0.5595703125, 0.771728515625, 0.98388671875, 1.196044921875, 1.408203125, 1.620361328125, 1.83251953125, 2.044677734375, 2.2568359375, 2.468994140625, 2.68115234375, 2.893310546875, 3.10546875, 3.317626953125, 3.52978515625, 3.741943359375, 3.9541015625, 4.166259765625, 4.37841796875, 4.590576171875, 4.802734375, 5.014892578125, 5.22705078125, 5.439208984375, 5.6513671875, 5.863525390625, 6.07568359375, 6.287841796875, 6.5]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 8.0, 16.0, 11.0, 7.0, 21.0, 22.0, 19.0, 24.0, 24.0, 39.0, 40.0, 63.0, 130.0, 378.0, 1913.0, 710634.0, 2428859.0, 2544.0, 437.0, 158.0, 78.0, 53.0, 36.0, 41.0, 27.0, 22.0, 16.0, 20.0, 19.0, 8.0, 15.0, 7.0, 3.0, 2.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.53125, -27.58203125, -26.6328125, -25.68359375, -24.734375, -23.78515625, -22.8359375, -21.88671875, -20.9375, -19.98828125, -19.0390625, -18.08984375, -17.140625, -16.19140625, -15.2421875, -14.29296875, -13.34375, -12.39453125, -11.4453125, -10.49609375, -9.546875, -8.59765625, -7.6484375, -6.69921875, -5.75, -4.80078125, -3.8515625, -2.90234375, -1.953125, -1.00390625, -0.0546875, 0.89453125, 1.84375, 2.79296875, 3.7421875, 4.69140625, 5.640625, 6.58984375, 7.5390625, 8.48828125, 9.4375, 10.38671875, 11.3359375, 12.28515625, 13.234375, 14.18359375, 15.1328125, 16.08203125, 17.03125, 17.98046875, 18.9296875, 19.87890625, 20.828125, 21.77734375, 22.7265625, 23.67578125, 24.625, 25.57421875, 26.5234375, 27.47265625, 28.421875, 29.37109375, 30.3203125, 31.26953125, 32.21875]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 400.0, 617.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-253.70907592773438, -249.2605743408203, -244.81207275390625, -240.36358642578125, -235.9150848388672, -231.46658325195312, -227.01808166503906, -222.569580078125, -218.12107849121094, -213.67257690429688, -209.2240753173828, -204.77557373046875, -200.32708740234375, -195.8785858154297, -191.43008422851562, -186.98158264160156, -182.5330810546875, -178.08457946777344, -173.63607788085938, -169.18759155273438, -164.7390899658203, -160.29058837890625, -155.8420867919922, -151.39358520507812, -146.94509887695312, -142.49659729003906, -138.048095703125, -133.599609375, -129.15110778808594, -124.70260620117188, -120.25410461425781, -115.80560302734375, -111.35710906982422, -106.90860748291016, -102.46011352539062, -98.01161193847656, -93.5631103515625, -89.11460876464844, -84.6661148071289, -80.21761322021484, -75.76911926269531, -71.32061767578125, -66.87212371826172, -62.423622131347656, -57.975120544433594, -53.5266227722168, -49.078125, -44.62962341308594, -40.181121826171875, -35.73262405395508, -31.284122467041016, -26.83562469482422, -22.38712501525879, -17.93862533569336, -13.490127563476562, -9.041627883911133, -4.593128204345703, -0.14462900161743164, 4.30387020111084, 8.752368927001953, 13.200868606567383, 17.649368286132812, 22.09786605834961, 26.54636573791504, 30.99486541748047]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 2.0, 4.0, 5.0, 6.0, 8.0, 5.0, 6.0, 9.0, 15.0, 9.0, 15.0, 23.0, 14.0, 25.0, 18.0, 19.0, 30.0, 35.0, 32.0, 42.0, 53.0, 43.0, 55.0, 46.0, 47.0, 43.0, 27.0, 37.0, 32.0, 25.0, 42.0, 23.0, 28.0, 29.0, 31.0, 27.0, 17.0, 18.0, 10.0, 16.0, 17.0, 4.0, 5.0, 3.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.899330139160156, -17.330888748168945, -16.762449264526367, -16.194007873535156, -15.625568389892578, -15.057126998901367, -14.488686561584473, -13.920246124267578, -13.351805686950684, -12.783365249633789, -12.214924812316895, -11.646484375, -11.078042984008789, -10.509603500366211, -9.941162109375, -9.372721672058105, -8.804281234741211, -8.235840797424316, -7.667400360107422, -7.098959445953369, -6.530519008636475, -5.96207857131958, -5.393637657165527, -4.825197219848633, -4.256756782531738, -3.6883163452148438, -3.11987566947937, -2.5514349937438965, -1.982994556427002, -1.4145541191101074, -0.8461134433746338, -0.27767276763916016, 0.2907676696777344, 0.8592082262039185, 1.4276487827301025, 1.9960893392562866, 2.5645298957824707, 3.1329703330993652, 3.701411008834839, 4.2698516845703125, 4.838292121887207, 5.406732559204102, 5.975172996520996, 6.543613910675049, 7.112054347991943, 7.680494785308838, 8.24893569946289, 8.817376136779785, 9.38581657409668, 9.954257011413574, 10.522697448730469, 11.091137886047363, 11.659578323364258, 12.228019714355469, 12.796460151672363, 13.364900588989258, 13.933341026306152, 14.501781463623047, 15.070221900939941, 15.638662338256836, 16.207103729248047, 16.775543212890625, 17.343984603881836, 17.912425994873047, 18.480865478515625]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 5.0, 2.0, 7.0, 4.0, 2.0, 6.0, 5.0, 11.0, 13.0, 13.0, 11.0, 16.0, 22.0, 16.0, 22.0, 23.0, 34.0, 42.0, 23.0, 28.0, 26.0, 37.0, 32.0, 40.0, 33.0, 45.0, 33.0, 29.0, 25.0, 39.0, 41.0, 32.0, 30.0, 31.0, 30.0, 26.0, 31.0, 31.0, 14.0, 22.0, 9.0, 7.0, 10.0, 9.0, 9.0, 3.0, 10.0, 6.0, 1.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.76953125, -1.7151031494140625, -1.660675048828125, -1.6062469482421875, -1.55181884765625, -1.4973907470703125, -1.442962646484375, -1.3885345458984375, -1.3341064453125, -1.2796783447265625, -1.225250244140625, -1.1708221435546875, -1.11639404296875, -1.0619659423828125, -1.007537841796875, -0.9531097412109375, -0.898681640625, -0.8442535400390625, -0.789825439453125, -0.7353973388671875, -0.68096923828125, -0.6265411376953125, -0.572113037109375, -0.5176849365234375, -0.4632568359375, -0.4088287353515625, -0.354400634765625, -0.2999725341796875, -0.24554443359375, -0.1911163330078125, -0.136688232421875, -0.0822601318359375, -0.02783203125, 0.0265960693359375, 0.081024169921875, 0.1354522705078125, 0.18988037109375, 0.2443084716796875, 0.298736572265625, 0.3531646728515625, 0.4075927734375, 0.4620208740234375, 0.516448974609375, 0.5708770751953125, 0.62530517578125, 0.6797332763671875, 0.734161376953125, 0.7885894775390625, 0.843017578125, 0.8974456787109375, 0.951873779296875, 1.0063018798828125, 1.06072998046875, 1.1151580810546875, 1.169586181640625, 1.2240142822265625, 1.2784423828125, 1.3328704833984375, 1.387298583984375, 1.4417266845703125, 1.49615478515625, 1.5505828857421875, 1.605010986328125, 1.6594390869140625, 1.7138671875]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 7.0, 4.0, 3.0, 4.0, 9.0, 13.0, 13.0, 16.0, 25.0, 39.0, 44.0, 60.0, 73.0, 109.0, 155.0, 218.0, 306.0, 513.0, 843.0, 1930.0, 4881.0, 16376.0, 74737.0, 568988.0, 2975987.0, 462145.0, 63793.0, 14436.0, 4426.0, 1772.0, 839.0, 470.0, 295.0, 215.0, 151.0, 131.0, 61.0, 51.0, 48.0, 23.0, 27.0, 23.0, 6.0, 5.0, 6.0, 5.0, 0.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.4375, -9.146728515625, -8.85595703125, -8.565185546875, -8.2744140625, -7.983642578125, -7.69287109375, -7.402099609375, -7.111328125, -6.820556640625, -6.52978515625, -6.239013671875, -5.9482421875, -5.657470703125, -5.36669921875, -5.075927734375, -4.78515625, -4.494384765625, -4.20361328125, -3.912841796875, -3.6220703125, -3.331298828125, -3.04052734375, -2.749755859375, -2.458984375, -2.168212890625, -1.87744140625, -1.586669921875, -1.2958984375, -1.005126953125, -0.71435546875, -0.423583984375, -0.1328125, 0.157958984375, 0.44873046875, 0.739501953125, 1.0302734375, 1.321044921875, 1.61181640625, 1.902587890625, 2.193359375, 2.484130859375, 2.77490234375, 3.065673828125, 3.3564453125, 3.647216796875, 3.93798828125, 4.228759765625, 4.51953125, 4.810302734375, 5.10107421875, 5.391845703125, 5.6826171875, 5.973388671875, 6.26416015625, 6.554931640625, 6.845703125, 7.136474609375, 7.42724609375, 7.718017578125, 8.0087890625, 8.299560546875, 8.59033203125, 8.881103515625, 9.171875]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 4.0, 12.0, 5.0, 18.0, 31.0, 47.0, 58.0, 115.0, 144.0, 235.0, 279.0, 412.0, 569.0, 604.0, 482.0, 337.0, 248.0, 151.0, 111.0, 84.0, 44.0, 27.0, 18.0, 16.0, 7.0, 5.0, 4.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.6953125, -9.384765625, -9.07421875, -8.763671875, -8.453125, -8.142578125, -7.83203125, -7.521484375, -7.2109375, -6.900390625, -6.58984375, -6.279296875, -5.96875, -5.658203125, -5.34765625, -5.037109375, -4.7265625, -4.416015625, -4.10546875, -3.794921875, -3.484375, -3.173828125, -2.86328125, -2.552734375, -2.2421875, -1.931640625, -1.62109375, -1.310546875, -1.0, -0.689453125, -0.37890625, -0.068359375, 0.2421875, 0.552734375, 0.86328125, 1.173828125, 1.484375, 1.794921875, 2.10546875, 2.416015625, 2.7265625, 3.037109375, 3.34765625, 3.658203125, 3.96875, 4.279296875, 4.58984375, 4.900390625, 5.2109375, 5.521484375, 5.83203125, 6.142578125, 6.453125, 6.763671875, 7.07421875, 7.384765625, 7.6953125, 8.005859375, 8.31640625, 8.626953125, 8.9375, 9.248046875, 9.55859375, 9.869140625, 10.1796875]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 5.0, 4.0, 9.0, 14.0, 25.0, 30.0, 66.0, 131.0, 245.0, 559.0, 2054.0, 46336.0, 3951724.0, 188214.0, 3312.0, 856.0, 316.0, 177.0, 72.0, 54.0, 21.0, 23.0, 15.0, 9.0, 8.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.6875, -39.4775390625, -38.267578125, -37.0576171875, -35.84765625, -34.6376953125, -33.427734375, -32.2177734375, -31.0078125, -29.7978515625, -28.587890625, -27.3779296875, -26.16796875, -24.9580078125, -23.748046875, -22.5380859375, -21.328125, -20.1181640625, -18.908203125, -17.6982421875, -16.48828125, -15.2783203125, -14.068359375, -12.8583984375, -11.6484375, -10.4384765625, -9.228515625, -8.0185546875, -6.80859375, -5.5986328125, -4.388671875, -3.1787109375, -1.96875, -0.7587890625, 0.451171875, 1.6611328125, 2.87109375, 4.0810546875, 5.291015625, 6.5009765625, 7.7109375, 8.9208984375, 10.130859375, 11.3408203125, 12.55078125, 13.7607421875, 14.970703125, 16.1806640625, 17.390625, 18.6005859375, 19.810546875, 21.0205078125, 22.23046875, 23.4404296875, 24.650390625, 25.8603515625, 27.0703125, 28.2802734375, 29.490234375, 30.7001953125, 31.91015625, 33.1201171875, 34.330078125, 35.5400390625, 36.75]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 6.0, 21.0, 102.0, 196.0, 279.0, 235.0, 116.0, 46.0, 7.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.661731719970703, -28.421232223510742, -26.18073081970215, -23.940231323242188, -21.699729919433594, -19.459230422973633, -17.218730926513672, -14.978230476379395, -12.737730026245117, -10.49722957611084, -8.256729125976562, -6.016229629516602, -3.775729179382324, -1.5352287292480469, 0.7052707672119141, 2.9457712173461914, 5.186271667480469, 7.426772117614746, 9.667272567749023, 11.907772064208984, 14.148272514343262, 16.38877296447754, 18.6292724609375, 20.869773864746094, 23.110273361206055, 25.350772857666016, 27.59127426147461, 29.83177375793457, 32.07227325439453, 34.312774658203125, 36.55327606201172, 38.79377365112305, 41.034271240234375, 43.27477264404297, 45.5152702331543, 47.75577163696289, 49.996273040771484, 52.23677062988281, 54.477272033691406, 56.7177734375, 58.958274841308594, 61.19877624511719, 63.439273834228516, 65.67977905273438, 67.92027282714844, 70.16077423095703, 72.40127563476562, 74.64177703857422, 76.88227844238281, 79.1227798461914, 81.36328125, 83.60377502441406, 85.84427642822266, 88.08477783203125, 90.32527923583984, 92.56578063964844, 94.8062744140625, 97.0467758178711, 99.28727722167969, 101.52777099609375, 103.76827239990234, 106.00877380371094, 108.24927520751953, 110.48977661132812, 112.73027801513672]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 3.0, 2.0, 3.0, 6.0, 6.0, 8.0, 6.0, 14.0, 16.0, 20.0, 12.0, 17.0, 22.0, 26.0, 35.0, 35.0, 19.0, 35.0, 36.0, 37.0, 34.0, 42.0, 37.0, 37.0, 40.0, 43.0, 40.0, 30.0, 38.0, 35.0, 34.0, 38.0, 26.0, 20.0, 22.0, 27.0, 18.0, 18.0, 16.0, 10.0, 9.0, 6.0, 9.0, 6.0, 2.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.72325897216797, -25.89497947692871, -25.066699981689453, -24.238420486450195, -23.410140991210938, -22.581859588623047, -21.75358009338379, -20.92530059814453, -20.097021102905273, -19.268741607666016, -18.440462112426758, -17.6121826171875, -16.78390121459961, -15.955622673034668, -15.127342224121094, -14.299062728881836, -13.470783233642578, -12.64250373840332, -11.814224243164062, -10.985943794250488, -10.15766429901123, -9.329384803771973, -8.501104354858398, -7.672824859619141, -6.844545364379883, -6.016265869140625, -5.187985897064209, -4.359705924987793, -3.531426429748535, -2.7031469345092773, -1.8748669624328613, -1.0465869903564453, -0.2183074951171875, 0.6099722385406494, 1.4382519721984863, 2.2665317058563232, 3.09481143951416, 3.923090934753418, 4.751370906829834, 5.57965087890625, 6.407930374145508, 7.236209869384766, 8.064489364624023, 8.892769813537598, 9.721049308776855, 10.549328804016113, 11.377609252929688, 12.205888748168945, 13.034168243408203, 13.862447738647461, 14.690727233886719, 15.519007682800293, 16.347286224365234, 17.175567626953125, 18.003847122192383, 18.83212661743164, 19.6604061126709, 20.488685607910156, 21.316965103149414, 22.145244598388672, 22.973526000976562, 23.801803588867188, 24.630084991455078, 25.458364486694336, 26.286643981933594]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 10.0, 11.0, 12.0, 11.0, 8.0, 14.0, 15.0, 30.0, 25.0, 17.0, 22.0, 27.0, 35.0, 30.0, 41.0, 50.0, 41.0, 30.0, 41.0, 47.0, 45.0, 38.0, 30.0, 38.0, 31.0, 47.0, 35.0, 31.0, 25.0, 32.0, 25.0, 17.0, 23.0, 15.0, 9.0, 10.0, 8.0, 8.0, 5.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.06640625, -2.002410888671875, -1.93841552734375, -1.874420166015625, -1.8104248046875, -1.746429443359375, -1.68243408203125, -1.618438720703125, -1.554443359375, -1.490447998046875, -1.42645263671875, -1.362457275390625, -1.2984619140625, -1.234466552734375, -1.17047119140625, -1.106475830078125, -1.04248046875, -0.978485107421875, -0.91448974609375, -0.850494384765625, -0.7864990234375, -0.722503662109375, -0.65850830078125, -0.594512939453125, -0.530517578125, -0.466522216796875, -0.40252685546875, -0.338531494140625, -0.2745361328125, -0.210540771484375, -0.14654541015625, -0.082550048828125, -0.0185546875, 0.045440673828125, 0.10943603515625, 0.173431396484375, 0.2374267578125, 0.301422119140625, 0.36541748046875, 0.429412841796875, 0.493408203125, 0.557403564453125, 0.62139892578125, 0.685394287109375, 0.7493896484375, 0.813385009765625, 0.87738037109375, 0.941375732421875, 1.00537109375, 1.069366455078125, 1.13336181640625, 1.197357177734375, 1.2613525390625, 1.325347900390625, 1.38934326171875, 1.453338623046875, 1.517333984375, 1.581329345703125, 1.64532470703125, 1.709320068359375, 1.7733154296875, 1.837310791015625, 1.90130615234375, 1.965301513671875, 2.029296875]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 7.0, 10.0, 13.0, 14.0, 27.0, 35.0, 57.0, 65.0, 101.0, 142.0, 202.0, 290.0, 439.0, 644.0, 976.0, 1447.0, 2256.0, 3403.0, 5552.0, 8513.0, 13515.0, 21449.0, 34230.0, 53312.0, 82613.0, 121307.0, 158333.0, 163230.0, 128775.0, 89217.0, 57611.0, 36601.0, 23169.0, 14848.0, 9284.0, 5772.0, 3828.0, 2446.0, 1539.0, 1076.0, 678.0, 470.0, 321.0, 216.0, 174.0, 115.0, 92.0, 59.0, 24.0, 23.0, 16.0, 12.0, 13.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.1871337890625, -0.18111419677734375, -0.1750946044921875, -0.16907501220703125, -0.163055419921875, -0.15703582763671875, -0.1510162353515625, -0.14499664306640625, -0.13897705078125, -0.13295745849609375, -0.1269378662109375, -0.12091827392578125, -0.114898681640625, -0.10887908935546875, -0.1028594970703125, -0.09683990478515625, -0.0908203125, -0.08480072021484375, -0.0787811279296875, -0.07276153564453125, -0.066741943359375, -0.06072235107421875, -0.0547027587890625, -0.04868316650390625, -0.04266357421875, -0.03664398193359375, -0.0306243896484375, -0.02460479736328125, -0.018585205078125, -0.01256561279296875, -0.0065460205078125, -0.00052642822265625, 0.0054931640625, 0.01151275634765625, 0.0175323486328125, 0.02355194091796875, 0.029571533203125, 0.03559112548828125, 0.0416107177734375, 0.04763031005859375, 0.05364990234375, 0.05966949462890625, 0.0656890869140625, 0.07170867919921875, 0.077728271484375, 0.08374786376953125, 0.0897674560546875, 0.09578704833984375, 0.101806640625, 0.10782623291015625, 0.1138458251953125, 0.11986541748046875, 0.125885009765625, 0.13190460205078125, 0.1379241943359375, 0.14394378662109375, 0.14996337890625, 0.15598297119140625, 0.1620025634765625, 0.16802215576171875, 0.174041748046875, 0.18006134033203125, 0.1860809326171875, 0.19210052490234375, 0.1981201171875]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 9.0, 8.0, 8.0, 6.0, 5.0, 19.0, 17.0, 25.0, 16.0, 19.0, 34.0, 33.0, 43.0, 42.0, 37.0, 48.0, 53.0, 57.0, 1073.0, 41.0, 46.0, 43.0, 45.0, 48.0, 35.0, 28.0, 24.0, 28.0, 32.0, 20.0, 23.0, 13.0, 8.0, 8.0, 11.0, 7.0, 4.0, 3.0, 6.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.39453125, -1.3473663330078125, -1.300201416015625, -1.2530364990234375, -1.20587158203125, -1.1587066650390625, -1.111541748046875, -1.0643768310546875, -1.0172119140625, -0.9700469970703125, -0.922882080078125, -0.8757171630859375, -0.82855224609375, -0.7813873291015625, -0.734222412109375, -0.6870574951171875, -0.639892578125, -0.5927276611328125, -0.545562744140625, -0.4983978271484375, -0.45123291015625, -0.4040679931640625, -0.356903076171875, -0.3097381591796875, -0.2625732421875, -0.2154083251953125, -0.168243408203125, -0.1210784912109375, -0.07391357421875, -0.0267486572265625, 0.020416259765625, 0.0675811767578125, 0.11474609375, 0.1619110107421875, 0.209075927734375, 0.2562408447265625, 0.30340576171875, 0.3505706787109375, 0.397735595703125, 0.4449005126953125, 0.4920654296875, 0.5392303466796875, 0.586395263671875, 0.6335601806640625, 0.68072509765625, 0.7278900146484375, 0.775054931640625, 0.8222198486328125, 0.869384765625, 0.9165496826171875, 0.963714599609375, 1.0108795166015625, 1.05804443359375, 1.1052093505859375, 1.152374267578125, 1.1995391845703125, 1.2467041015625, 1.2938690185546875, 1.341033935546875, 1.3881988525390625, 1.43536376953125, 1.4825286865234375, 1.529693603515625, 1.5768585205078125, 1.6240234375]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 7.0, 13.0, 17.0, 28.0, 33.0, 69.0, 107.0, 146.0, 225.0, 371.0, 498.0, 869.0, 1341.0, 2033.0, 3163.0, 4902.0, 7767.0, 11944.0, 18922.0, 28700.0, 43129.0, 64940.0, 92264.0, 122989.0, 1048813.0, 274049.0, 114356.0, 84647.0, 59048.0, 39327.0, 25696.0, 16510.0, 10781.0, 6882.0, 4603.0, 2913.0, 1732.0, 1211.0, 742.0, 448.0, 321.0, 209.0, 133.0, 92.0, 59.0, 29.0, 22.0, 13.0, 6.0, 7.0, 3.0, 1.0, 2.0, 3.0, 0.0, 2.0], "bins": [-0.1220703125, -0.11835670471191406, -0.11464309692382812, -0.11092948913574219, -0.10721588134765625, -0.10350227355957031, -0.09978866577148438, -0.09607505798339844, -0.0923614501953125, -0.08864784240722656, -0.08493423461914062, -0.08122062683105469, -0.07750701904296875, -0.07379341125488281, -0.07007980346679688, -0.06636619567871094, -0.062652587890625, -0.05893898010253906, -0.055225372314453125, -0.05151176452636719, -0.04779815673828125, -0.04408454895019531, -0.040370941162109375, -0.03665733337402344, -0.0329437255859375, -0.029230117797851562, -0.025516510009765625, -0.021802902221679688, -0.01808929443359375, -0.014375686645507812, -0.010662078857421875, -0.0069484710693359375, -0.00323486328125, 0.0004787445068359375, 0.004192352294921875, 0.007905960083007812, 0.01161956787109375, 0.015333175659179688, 0.019046783447265625, 0.022760391235351562, 0.0264739990234375, 0.030187606811523438, 0.033901214599609375, 0.03761482238769531, 0.04132843017578125, 0.04504203796386719, 0.048755645751953125, 0.05246925354003906, 0.056182861328125, 0.05989646911621094, 0.06361007690429688, 0.06732368469238281, 0.07103729248046875, 0.07475090026855469, 0.07846450805664062, 0.08217811584472656, 0.0858917236328125, 0.08960533142089844, 0.09331893920898438, 0.09703254699707031, 0.10074615478515625, 0.10445976257324219, 0.10817337036132812, 0.11188697814941406, 0.1156005859375]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 8.0, 8.0, 8.0, 4.0, 13.0, 12.0, 14.0, 19.0, 20.0, 36.0, 38.0, 59.0, 74.0, 141.0, 181.0, 89.0, 64.0, 23.0, 34.0, 30.0, 23.0, 20.0, 13.0, 9.0, 9.0, 8.0, 5.0, 9.0, 7.0, 2.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007171630859375, -0.006925463676452637, -0.0066792964935302734, -0.00643312931060791, -0.006186962127685547, -0.005940794944763184, -0.00569462776184082, -0.005448460578918457, -0.005202293395996094, -0.0049561262130737305, -0.004709959030151367, -0.004463791847229004, -0.004217624664306641, -0.003971457481384277, -0.003725290298461914, -0.0034791231155395508, -0.0032329559326171875, -0.0029867887496948242, -0.002740621566772461, -0.0024944543838500977, -0.0022482872009277344, -0.002002120018005371, -0.0017559528350830078, -0.0015097856521606445, -0.0012636184692382812, -0.001017451286315918, -0.0007712841033935547, -0.0005251169204711914, -0.0002789497375488281, -3.2782554626464844e-05, 0.00021338462829589844, 0.0004595518112182617, 0.000705718994140625, 0.0009518861770629883, 0.0011980533599853516, 0.0014442205429077148, 0.0016903877258300781, 0.0019365549087524414, 0.0021827220916748047, 0.002428889274597168, 0.0026750564575195312, 0.0029212236404418945, 0.003167390823364258, 0.003413558006286621, 0.0036597251892089844, 0.0039058923721313477, 0.004152059555053711, 0.004398226737976074, 0.0046443939208984375, 0.004890561103820801, 0.005136728286743164, 0.005382895469665527, 0.005629062652587891, 0.005875229835510254, 0.006121397018432617, 0.0063675642013549805, 0.006613731384277344, 0.006859898567199707, 0.00710606575012207, 0.007352232933044434, 0.007598400115966797, 0.00784456729888916, 0.008090734481811523, 0.008336901664733887, 0.00858306884765625]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 3.0, 4.0, 9.0, 8.0, 13.0, 10.0, 16.0, 16.0, 19.0, 33.0, 52.0, 88.0, 131.0, 213.0, 528.0, 6422.0, 1038784.0, 1287.0, 373.0, 185.0, 112.0, 68.0, 49.0, 30.0, 16.0, 20.0, 15.0, 3.0, 18.0, 6.0, 4.0, 4.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.289306640625, -0.28061676025390625, -0.2719268798828125, -0.26323699951171875, -0.254547119140625, -0.24585723876953125, -0.2371673583984375, -0.22847747802734375, -0.21978759765625, -0.21109771728515625, -0.2024078369140625, -0.19371795654296875, -0.185028076171875, -0.17633819580078125, -0.1676483154296875, -0.15895843505859375, -0.1502685546875, -0.14157867431640625, -0.1328887939453125, -0.12419891357421875, -0.115509033203125, -0.10681915283203125, -0.0981292724609375, -0.08943939208984375, -0.08074951171875, -0.07205963134765625, -0.0633697509765625, -0.05467987060546875, -0.045989990234375, -0.03730010986328125, -0.0286102294921875, -0.01992034912109375, -0.01123046875, -0.00254058837890625, 0.0061492919921875, 0.01483917236328125, 0.023529052734375, 0.03221893310546875, 0.0409088134765625, 0.04959869384765625, 0.05828857421875, 0.06697845458984375, 0.0756683349609375, 0.08435821533203125, 0.093048095703125, 0.10173797607421875, 0.1104278564453125, 0.11911773681640625, 0.1278076171875, 0.13649749755859375, 0.1451873779296875, 0.15387725830078125, 0.162567138671875, 0.17125701904296875, 0.1799468994140625, 0.18863677978515625, 0.19732666015625, 0.20601654052734375, 0.2147064208984375, 0.22339630126953125, 0.232086181640625, 0.24077606201171875, 0.2494659423828125, 0.25815582275390625, 0.266845703125]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 16.0, 761.0, 237.0], "bins": [-0.28093189001083374, -0.27646803855895996, -0.2720041871070862, -0.26754030585289, -0.26307645440101624, -0.25861260294914246, -0.2541487514972687, -0.2496848851442337, -0.24522101879119873, -0.24075716733932495, -0.23629330098628998, -0.2318294495344162, -0.22736558318138123, -0.22290173172950745, -0.21843786537647247, -0.2139740139245987, -0.20951014757156372, -0.20504629611968994, -0.20058242976665497, -0.1961185783147812, -0.19165471196174622, -0.18719086050987244, -0.18272699415683746, -0.17826314270496368, -0.1737992912530899, -0.16933543980121613, -0.16487157344818115, -0.16040772199630737, -0.1559438556432724, -0.15148000419139862, -0.14701613783836365, -0.14255228638648987, -0.1380884349346161, -0.1336245834827423, -0.12916071712970734, -0.12469685822725296, -0.12023299932479858, -0.11576914042234421, -0.11130528151988983, -0.10684143006801605, -0.10237756371498108, -0.0979137048125267, -0.09344984591007233, -0.08898598700761795, -0.08452212810516357, -0.0800582692027092, -0.07559441030025482, -0.07113055884838104, -0.06666669994592667, -0.06220284104347229, -0.057738982141017914, -0.05327512323856354, -0.04881126433610916, -0.044347405433654785, -0.03988355025649071, -0.03541969135403633, -0.030955830588936806, -0.02649197168648243, -0.022028114646673203, -0.017564255744218826, -0.01310039684176445, -0.008636537939310074, -0.004172680899500847, 0.00029117800295352936, 0.004755036905407906]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 4.0, 1.0, 1.0, 3.0, 6.0, 13.0, 15.0, 12.0, 11.0, 24.0, 19.0, 36.0, 42.0, 42.0, 32.0, 59.0, 46.0, 41.0, 42.0, 57.0, 52.0, 49.0, 41.0, 47.0, 48.0, 40.0, 47.0, 32.0, 28.0, 23.0, 22.0, 19.0, 16.0, 11.0, 7.0, 5.0, 4.0, 7.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.006202518939971924, -0.00593939796090126, -0.005676276981830597, -0.0054131560027599335, -0.00515003502368927, -0.004886914044618607, -0.004623793065547943, -0.00436067208647728, -0.004097551107406616, -0.0038344301283359528, -0.0035713091492652893, -0.003308188170194626, -0.0030450671911239624, -0.002781946212053299, -0.0025188252329826355, -0.002255704253911972, -0.0019925832748413086, -0.0017294622957706451, -0.0014663413166999817, -0.0012032203376293182, -0.0009400993585586548, -0.0006769783794879913, -0.0004138574004173279, -0.00015073642134666443, 0.00011238455772399902, 0.0003755055367946625, 0.0006386265158653259, 0.0009017474949359894, 0.0011648684740066528, 0.0014279894530773163, 0.0016911104321479797, 0.001954231411218643, 0.0022173523902893066, 0.00248047336935997, 0.0027435943484306335, 0.003006715327501297, 0.0032698363065719604, 0.003532957285642624, 0.0037960782647132874, 0.004059199243783951, 0.004322320222854614, 0.004585441201925278, 0.004848562180995941, 0.005111683160066605, 0.005374804139137268, 0.0056379251182079315, 0.005901046097278595, 0.006164167076349258, 0.006427288055419922, 0.006690409034490585, 0.006953530013561249, 0.007216650992631912, 0.007479771971702576, 0.007742892950773239, 0.008006013929843903, 0.008269134908914566, 0.00853225588798523, 0.008795376867055893, 0.009058497846126556, 0.00932161882519722, 0.009584739804267883, 0.009847860783338547, 0.01011098176240921, 0.010374102741479874, 0.010637223720550537]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 10.0, 11.0, 12.0, 11.0, 8.0, 14.0, 15.0, 30.0, 25.0, 17.0, 22.0, 27.0, 35.0, 30.0, 41.0, 50.0, 41.0, 30.0, 41.0, 47.0, 45.0, 37.0, 31.0, 38.0, 31.0, 47.0, 35.0, 31.0, 25.0, 32.0, 26.0, 16.0, 23.0, 15.0, 9.0, 10.0, 8.0, 8.0, 5.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.06640625, -2.002410888671875, -1.93841552734375, -1.874420166015625, -1.8104248046875, -1.746429443359375, -1.68243408203125, -1.618438720703125, -1.554443359375, -1.490447998046875, -1.42645263671875, -1.362457275390625, -1.2984619140625, -1.234466552734375, -1.17047119140625, -1.106475830078125, -1.04248046875, -0.978485107421875, -0.91448974609375, -0.850494384765625, -0.7864990234375, -0.722503662109375, -0.65850830078125, -0.594512939453125, -0.530517578125, -0.466522216796875, -0.40252685546875, -0.338531494140625, -0.2745361328125, -0.210540771484375, -0.14654541015625, -0.082550048828125, -0.0185546875, 0.045440673828125, 0.10943603515625, 0.173431396484375, 0.2374267578125, 0.301422119140625, 0.36541748046875, 0.429412841796875, 0.493408203125, 0.557403564453125, 0.62139892578125, 0.685394287109375, 0.7493896484375, 0.813385009765625, 0.87738037109375, 0.941375732421875, 1.00537109375, 1.069366455078125, 1.13336181640625, 1.197357177734375, 1.2613525390625, 1.325347900390625, 1.38934326171875, 1.453338623046875, 1.517333984375, 1.581329345703125, 1.64532470703125, 1.709320068359375, 1.7733154296875, 1.837310791015625, 1.90130615234375, 1.965301513671875, 2.029296875]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 4.0, 1.0, 3.0, 4.0, 4.0, 0.0, 6.0, 19.0, 22.0, 26.0, 26.0, 37.0, 52.0, 71.0, 79.0, 131.0, 177.0, 291.0, 385.0, 748.0, 1242.0, 2454.0, 5404.0, 12601.0, 31297.0, 84443.0, 226633.0, 368865.0, 194277.0, 71695.0, 26747.0, 10797.0, 4652.0, 2232.0, 1165.0, 682.0, 372.0, 296.0, 161.0, 128.0, 98.0, 83.0, 40.0, 38.0, 12.0, 19.0, 19.0, 17.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.947265625, -1.885284423828125, -1.82330322265625, -1.761322021484375, -1.6993408203125, -1.637359619140625, -1.57537841796875, -1.513397216796875, -1.451416015625, -1.389434814453125, -1.32745361328125, -1.265472412109375, -1.2034912109375, -1.141510009765625, -1.07952880859375, -1.017547607421875, -0.95556640625, -0.893585205078125, -0.83160400390625, -0.769622802734375, -0.7076416015625, -0.645660400390625, -0.58367919921875, -0.521697998046875, -0.459716796875, -0.397735595703125, -0.33575439453125, -0.273773193359375, -0.2117919921875, -0.149810791015625, -0.08782958984375, -0.025848388671875, 0.0361328125, 0.098114013671875, 0.16009521484375, 0.222076416015625, 0.2840576171875, 0.346038818359375, 0.40802001953125, 0.470001220703125, 0.531982421875, 0.593963623046875, 0.65594482421875, 0.717926025390625, 0.7799072265625, 0.841888427734375, 0.90386962890625, 0.965850830078125, 1.02783203125, 1.089813232421875, 1.15179443359375, 1.213775634765625, 1.2757568359375, 1.337738037109375, 1.39971923828125, 1.461700439453125, 1.523681640625, 1.585662841796875, 1.64764404296875, 1.709625244140625, 1.7716064453125, 1.833587646484375, 1.89556884765625, 1.957550048828125, 2.01953125]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 2.0, 1.0, 2.0, 2.0, 7.0, 5.0, 3.0, 19.0, 14.0, 20.0, 19.0, 19.0, 21.0, 31.0, 19.0, 43.0, 27.0, 36.0, 40.0, 46.0, 66.0, 108.0, 409.0, 1496.0, 152.0, 65.0, 62.0, 38.0, 29.0, 39.0, 31.0, 34.0, 21.0, 33.0, 14.0, 18.0, 13.0, 16.0, 5.0, 6.0, 5.0, 6.0, 3.0, 1.0, 5.0, 5.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-7.8046875, -7.5758056640625, -7.346923828125, -7.1180419921875, -6.88916015625, -6.6602783203125, -6.431396484375, -6.2025146484375, -5.9736328125, -5.7447509765625, -5.515869140625, -5.2869873046875, -5.05810546875, -4.8292236328125, -4.600341796875, -4.3714599609375, -4.142578125, -3.9136962890625, -3.684814453125, -3.4559326171875, -3.22705078125, -2.9981689453125, -2.769287109375, -2.5404052734375, -2.3115234375, -2.0826416015625, -1.853759765625, -1.6248779296875, -1.39599609375, -1.1671142578125, -0.938232421875, -0.7093505859375, -0.48046875, -0.2515869140625, -0.022705078125, 0.2061767578125, 0.43505859375, 0.6639404296875, 0.892822265625, 1.1217041015625, 1.3505859375, 1.5794677734375, 1.808349609375, 2.0372314453125, 2.26611328125, 2.4949951171875, 2.723876953125, 2.9527587890625, 3.181640625, 3.4105224609375, 3.639404296875, 3.8682861328125, 4.09716796875, 4.3260498046875, 4.554931640625, 4.7838134765625, 5.0126953125, 5.2415771484375, 5.470458984375, 5.6993408203125, 5.92822265625, 6.1571044921875, 6.385986328125, 6.6148681640625, 6.84375]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 4.0, 2.0, 4.0, 2.0, 5.0, 5.0, 6.0, 14.0, 18.0, 17.0, 11.0, 23.0, 29.0, 41.0, 41.0, 39.0, 80.0, 73.0, 183.0, 374.0, 1166.0, 13615.0, 3066045.0, 60979.0, 1709.0, 493.0, 228.0, 130.0, 71.0, 54.0, 44.0, 33.0, 27.0, 25.0, 24.0, 14.0, 22.0, 20.0, 8.0, 8.0, 5.0, 4.0, 6.0, 1.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.296875, -14.8133544921875, -14.329833984375, -13.8463134765625, -13.36279296875, -12.8792724609375, -12.395751953125, -11.9122314453125, -11.4287109375, -10.9451904296875, -10.461669921875, -9.9781494140625, -9.49462890625, -9.0111083984375, -8.527587890625, -8.0440673828125, -7.560546875, -7.0770263671875, -6.593505859375, -6.1099853515625, -5.62646484375, -5.1429443359375, -4.659423828125, -4.1759033203125, -3.6923828125, -3.2088623046875, -2.725341796875, -2.2418212890625, -1.75830078125, -1.2747802734375, -0.791259765625, -0.3077392578125, 0.17578125, 0.6593017578125, 1.142822265625, 1.6263427734375, 2.10986328125, 2.5933837890625, 3.076904296875, 3.5604248046875, 4.0439453125, 4.5274658203125, 5.010986328125, 5.4945068359375, 5.97802734375, 6.4615478515625, 6.945068359375, 7.4285888671875, 7.912109375, 8.3956298828125, 8.879150390625, 9.3626708984375, 9.84619140625, 10.3297119140625, 10.813232421875, 11.2967529296875, 11.7802734375, 12.2637939453125, 12.747314453125, 13.2308349609375, 13.71435546875, 14.1978759765625, 14.681396484375, 15.1649169921875, 15.6484375]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 108.0, 562.0, 317.0, 22.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.971656799316406, -5.762825965881348, -4.553994655609131, -3.345163583755493, -2.1363325119018555, -0.9275016784667969, 0.2813296318054199, 1.4901609420776367, 2.6989917755126953, 3.907822847366333, 5.116653919219971, 6.3254852294921875, 7.534316062927246, 8.743146896362305, 9.95197868347168, 11.160809516906738, 12.369640350341797, 13.578471183776855, 14.787302017211914, 15.996133804321289, 17.20496368408203, 18.413795471191406, 19.62262725830078, 20.831459045410156, 22.0402889251709, 23.249120712280273, 24.457950592041016, 25.66678237915039, 26.875614166259766, 28.084444046020508, 29.293275833129883, 30.502105712890625, 31.7109375, 32.919769287109375, 34.12860107421875, 35.33742904663086, 36.546260833740234, 37.75509262084961, 38.963924407958984, 40.17275619506836, 41.38158416748047, 42.590415954589844, 43.79924774169922, 45.00807571411133, 46.2169075012207, 47.42573928833008, 48.63457107543945, 49.84340286254883, 51.0522346496582, 52.26106643676758, 53.46989822387695, 54.67872619628906, 55.88755798339844, 57.09638977050781, 58.30522155761719, 59.51405334472656, 60.72288513183594, 61.93171691894531, 63.14054870605469, 64.34938049316406, 65.55821228027344, 66.76704406738281, 67.97586822509766, 69.18470001220703, 70.3935317993164]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 2.0, 2.0, 5.0, 3.0, 10.0, 6.0, 13.0, 10.0, 9.0, 16.0, 10.0, 29.0, 18.0, 29.0, 22.0, 32.0, 35.0, 34.0, 36.0, 50.0, 42.0, 45.0, 41.0, 48.0, 40.0, 43.0, 36.0, 30.0, 42.0, 39.0, 33.0, 32.0, 19.0, 23.0, 19.0, 26.0, 12.0, 9.0, 10.0, 9.0, 4.0, 13.0, 3.0, 9.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-23.55523681640625, -22.84619903564453, -22.137161254882812, -21.428123474121094, -20.719085693359375, -20.010046005249023, -19.301008224487305, -18.591970443725586, -17.882932662963867, -17.17389488220215, -16.46485710144043, -15.755818367004395, -15.046780586242676, -14.337742805480957, -13.628704071044922, -12.919666290283203, -12.210628509521484, -11.501590728759766, -10.792552947998047, -10.083514213562012, -9.374476432800293, -8.665438652038574, -7.956400394439697, -7.24736213684082, -6.538324356079102, -5.829286575317383, -5.120248317718506, -4.411210060119629, -3.70217227935791, -2.9931342601776123, -2.2840962409973145, -1.5750579833984375, -0.8660202026367188, -0.1569821834564209, 0.552055835723877, 1.2610938549041748, 1.9701318740844727, 2.6791698932647705, 3.3882079124450684, 4.097246170043945, 4.806283950805664, 5.515321731567383, 6.22435998916626, 6.933398246765137, 7.6424360275268555, 8.351473808288574, 9.06051254272461, 9.769550323486328, 10.478588104248047, 11.187625885009766, 11.896663665771484, 12.60570240020752, 13.314740180969238, 14.023777961730957, 14.732816696166992, 15.441854476928711, 16.15089225769043, 16.85993003845215, 17.568967819213867, 18.278005599975586, 18.987045288085938, 19.696083068847656, 20.405120849609375, 21.114158630371094, 21.823196411132812]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 10.0, 9.0, 9.0, 10.0, 14.0, 13.0, 16.0, 17.0, 27.0, 19.0, 23.0, 21.0, 35.0, 36.0, 27.0, 45.0, 48.0, 32.0, 36.0, 45.0, 42.0, 49.0, 35.0, 26.0, 37.0, 44.0, 38.0, 32.0, 24.0, 28.0, 29.0, 24.0, 22.0, 18.0, 12.0, 11.0, 8.0, 7.0, 8.0, 8.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1328125, -2.06787109375, -2.0029296875, -1.93798828125, -1.873046875, -1.80810546875, -1.7431640625, -1.67822265625, -1.61328125, -1.54833984375, -1.4833984375, -1.41845703125, -1.353515625, -1.28857421875, -1.2236328125, -1.15869140625, -1.09375, -1.02880859375, -0.9638671875, -0.89892578125, -0.833984375, -0.76904296875, -0.7041015625, -0.63916015625, -0.57421875, -0.50927734375, -0.4443359375, -0.37939453125, -0.314453125, -0.24951171875, -0.1845703125, -0.11962890625, -0.0546875, 0.01025390625, 0.0751953125, 0.14013671875, 0.205078125, 0.27001953125, 0.3349609375, 0.39990234375, 0.46484375, 0.52978515625, 0.5947265625, 0.65966796875, 0.724609375, 0.78955078125, 0.8544921875, 0.91943359375, 0.984375, 1.04931640625, 1.1142578125, 1.17919921875, 1.244140625, 1.30908203125, 1.3740234375, 1.43896484375, 1.50390625, 1.56884765625, 1.6337890625, 1.69873046875, 1.763671875, 1.82861328125, 1.8935546875, 1.95849609375, 2.0234375]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 1.0, 2.0, 7.0, 2.0, 7.0, 12.0, 11.0, 12.0, 22.0, 30.0, 21.0, 29.0, 40.0, 51.0, 50.0, 64.0, 68.0, 113.0, 229.0, 588.0, 1873.0, 7451.0, 36612.0, 258101.0, 2544837.0, 1204600.0, 113815.0, 18920.0, 4259.0, 1274.0, 460.0, 211.0, 123.0, 91.0, 71.0, 44.0, 30.0, 30.0, 25.0, 20.0, 16.0, 18.0, 12.0, 14.0, 6.0, 4.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-8.3515625, -8.0889892578125, -7.826416015625, -7.5638427734375, -7.30126953125, -7.0386962890625, -6.776123046875, -6.5135498046875, -6.2509765625, -5.9884033203125, -5.725830078125, -5.4632568359375, -5.20068359375, -4.9381103515625, -4.675537109375, -4.4129638671875, -4.150390625, -3.8878173828125, -3.625244140625, -3.3626708984375, -3.10009765625, -2.8375244140625, -2.574951171875, -2.3123779296875, -2.0498046875, -1.7872314453125, -1.524658203125, -1.2620849609375, -0.99951171875, -0.7369384765625, -0.474365234375, -0.2117919921875, 0.05078125, 0.3133544921875, 0.575927734375, 0.8385009765625, 1.10107421875, 1.3636474609375, 1.626220703125, 1.8887939453125, 2.1513671875, 2.4139404296875, 2.676513671875, 2.9390869140625, 3.20166015625, 3.4642333984375, 3.726806640625, 3.9893798828125, 4.251953125, 4.5145263671875, 4.777099609375, 5.0396728515625, 5.30224609375, 5.5648193359375, 5.827392578125, 6.0899658203125, 6.3525390625, 6.6151123046875, 6.877685546875, 7.1402587890625, 7.40283203125, 7.6654052734375, 7.927978515625, 8.1905517578125, 8.453125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 7.0, 11.0, 10.0, 17.0, 16.0, 27.0, 37.0, 67.0, 89.0, 126.0, 168.0, 234.0, 305.0, 428.0, 477.0, 474.0, 429.0, 338.0, 242.0, 176.0, 127.0, 83.0, 54.0, 44.0, 26.0, 18.0, 11.0, 15.0, 5.0, 4.0, 3.0, 2.0, 7.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.01953125, -6.75994873046875, -6.5003662109375, -6.24078369140625, -5.981201171875, -5.72161865234375, -5.4620361328125, -5.20245361328125, -4.94287109375, -4.68328857421875, -4.4237060546875, -4.16412353515625, -3.904541015625, -3.64495849609375, -3.3853759765625, -3.12579345703125, -2.8662109375, -2.60662841796875, -2.3470458984375, -2.08746337890625, -1.827880859375, -1.56829833984375, -1.3087158203125, -1.04913330078125, -0.78955078125, -0.52996826171875, -0.2703857421875, -0.01080322265625, 0.248779296875, 0.50836181640625, 0.7679443359375, 1.02752685546875, 1.287109375, 1.54669189453125, 1.8062744140625, 2.06585693359375, 2.325439453125, 2.58502197265625, 2.8446044921875, 3.10418701171875, 3.36376953125, 3.62335205078125, 3.8829345703125, 4.14251708984375, 4.402099609375, 4.66168212890625, 4.9212646484375, 5.18084716796875, 5.4404296875, 5.70001220703125, 5.9595947265625, 6.21917724609375, 6.478759765625, 6.73834228515625, 6.9979248046875, 7.25750732421875, 7.51708984375, 7.77667236328125, 8.0362548828125, 8.29583740234375, 8.555419921875, 8.81500244140625, 9.0745849609375, 9.33416748046875, 9.59375]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 4.0, 4.0, 10.0, 16.0, 21.0, 43.0, 57.0, 92.0, 164.0, 343.0, 746.0, 1983.0, 9619.0, 109748.0, 2353032.0, 1630309.0, 77478.0, 7629.0, 1678.0, 599.0, 299.0, 153.0, 98.0, 62.0, 27.0, 17.0, 15.0, 6.0, 12.0, 9.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.96875, -21.357421875, -20.74609375, -20.134765625, -19.5234375, -18.912109375, -18.30078125, -17.689453125, -17.078125, -16.466796875, -15.85546875, -15.244140625, -14.6328125, -14.021484375, -13.41015625, -12.798828125, -12.1875, -11.576171875, -10.96484375, -10.353515625, -9.7421875, -9.130859375, -8.51953125, -7.908203125, -7.296875, -6.685546875, -6.07421875, -5.462890625, -4.8515625, -4.240234375, -3.62890625, -3.017578125, -2.40625, -1.794921875, -1.18359375, -0.572265625, 0.0390625, 0.650390625, 1.26171875, 1.873046875, 2.484375, 3.095703125, 3.70703125, 4.318359375, 4.9296875, 5.541015625, 6.15234375, 6.763671875, 7.375, 7.986328125, 8.59765625, 9.208984375, 9.8203125, 10.431640625, 11.04296875, 11.654296875, 12.265625, 12.876953125, 13.48828125, 14.099609375, 14.7109375, 15.322265625, 15.93359375, 16.544921875, 17.15625]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 19.0, 71.0, 134.0, 248.0, 256.0, 165.0, 79.0, 28.0, 8.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-39.081417083740234, -36.6553840637207, -34.229347229003906, -31.803314208984375, -29.37727928161621, -26.951244354248047, -24.525211334228516, -22.09917640686035, -19.673141479492188, -17.247106552124023, -14.821072578430176, -12.395038604736328, -9.969003677368164, -7.54296875, -5.116934776306152, -2.6909008026123047, -0.2648658752441406, 2.1611685752868652, 4.587203025817871, 7.013237476348877, 9.439271926879883, 11.865306854248047, 14.291340827941895, 16.717374801635742, 19.143409729003906, 21.56944465637207, 23.995479583740234, 26.421512603759766, 28.84754753112793, 31.273582458496094, 33.699615478515625, 36.125648498535156, 38.55168914794922, 40.97772216796875, 43.40375900268555, 45.82979202270508, 48.255828857421875, 50.681861877441406, 53.10789489746094, 55.53392791748047, 57.959964752197266, 60.3859977722168, 62.812034606933594, 65.23806762695312, 67.66410064697266, 70.09013366699219, 72.51617431640625, 74.94220733642578, 77.36824035644531, 79.79427337646484, 82.22030639648438, 84.64634704589844, 87.07238006591797, 89.4984130859375, 91.92444610595703, 94.35047912597656, 96.77651977539062, 99.20255279541016, 101.62858581542969, 104.05462646484375, 106.48065948486328, 108.90669250488281, 111.33272552490234, 113.75875854492188, 116.1847915649414]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 2.0, 0.0, 6.0, 8.0, 5.0, 3.0, 3.0, 6.0, 9.0, 16.0, 8.0, 17.0, 13.0, 18.0, 18.0, 18.0, 43.0, 27.0, 33.0, 43.0, 30.0, 54.0, 45.0, 29.0, 47.0, 39.0, 37.0, 24.0, 45.0, 32.0, 32.0, 37.0, 39.0, 30.0, 27.0, 21.0, 18.0, 21.0, 26.0, 19.0, 15.0, 11.0, 9.0, 8.0, 3.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.880813598632812, -20.142555236816406, -19.404296875, -18.666038513183594, -17.927780151367188, -17.18952178955078, -16.451263427734375, -15.713005065917969, -14.974746704101562, -14.236488342285156, -13.49822998046875, -12.759971618652344, -12.021713256835938, -11.283454895019531, -10.545196533203125, -9.806938171386719, -9.068679809570312, -8.330421447753906, -7.5921630859375, -6.853904724121094, -6.1156463623046875, -5.377388000488281, -4.639129638671875, -3.9008712768554688, -3.1626129150390625, -2.4243545532226562, -1.68609619140625, -0.9478378295898438, -0.2095794677734375, 0.5286788940429688, 1.266937255859375, 2.0051956176757812, 2.7434539794921875, 3.4817123413085938, 4.219970703125, 4.958229064941406, 5.6964874267578125, 6.434745788574219, 7.173004150390625, 7.911262512207031, 8.649520874023438, 9.387779235839844, 10.12603759765625, 10.864295959472656, 11.602554321289062, 12.340812683105469, 13.079071044921875, 13.817329406738281, 14.555587768554688, 15.293846130371094, 16.0321044921875, 16.770362854003906, 17.508621215820312, 18.24687957763672, 18.985137939453125, 19.72339630126953, 20.461654663085938, 21.199913024902344, 21.93817138671875, 22.676429748535156, 23.414688110351562, 24.15294647216797, 24.891204833984375, 25.62946319580078, 26.367721557617188]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 6.0, 8.0, 10.0, 9.0, 9.0, 16.0, 17.0, 19.0, 17.0, 22.0, 18.0, 30.0, 33.0, 26.0, 25.0, 42.0, 41.0, 30.0, 43.0, 54.0, 51.0, 47.0, 33.0, 45.0, 33.0, 46.0, 35.0, 30.0, 23.0, 27.0, 21.0, 30.0, 16.0, 17.0, 26.0, 6.0, 14.0, 8.0, 4.0, 7.0, 2.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.298828125, -2.23004150390625, -2.1612548828125, -2.09246826171875, -2.023681640625, -1.95489501953125, -1.8861083984375, -1.81732177734375, -1.74853515625, -1.67974853515625, -1.6109619140625, -1.54217529296875, -1.473388671875, -1.40460205078125, -1.3358154296875, -1.26702880859375, -1.1982421875, -1.12945556640625, -1.0606689453125, -0.99188232421875, -0.923095703125, -0.85430908203125, -0.7855224609375, -0.71673583984375, -0.64794921875, -0.57916259765625, -0.5103759765625, -0.44158935546875, -0.372802734375, -0.30401611328125, -0.2352294921875, -0.16644287109375, -0.09765625, -0.02886962890625, 0.0399169921875, 0.10870361328125, 0.177490234375, 0.24627685546875, 0.3150634765625, 0.38385009765625, 0.45263671875, 0.52142333984375, 0.5902099609375, 0.65899658203125, 0.727783203125, 0.79656982421875, 0.8653564453125, 0.93414306640625, 1.0029296875, 1.07171630859375, 1.1405029296875, 1.20928955078125, 1.278076171875, 1.34686279296875, 1.4156494140625, 1.48443603515625, 1.55322265625, 1.62200927734375, 1.6907958984375, 1.75958251953125, 1.828369140625, 1.89715576171875, 1.9659423828125, 2.03472900390625, 2.103515625]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 6.0, 4.0, 8.0, 7.0, 6.0, 5.0, 10.0, 23.0, 36.0, 50.0, 53.0, 90.0, 155.0, 195.0, 311.0, 538.0, 926.0, 1432.0, 2454.0, 4059.0, 6995.0, 12201.0, 21406.0, 37095.0, 65279.0, 109068.0, 167167.0, 201985.0, 163470.0, 105555.0, 62820.0, 36194.0, 20663.0, 11662.0, 6696.0, 3861.0, 2250.0, 1371.0, 829.0, 519.0, 390.0, 216.0, 140.0, 98.0, 80.0, 60.0, 27.0, 22.0, 23.0, 16.0, 14.0, 13.0, 10.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0], "bins": [-0.249755859375, -0.2420635223388672, -0.23437118530273438, -0.22667884826660156, -0.21898651123046875, -0.21129417419433594, -0.20360183715820312, -0.1959095001220703, -0.1882171630859375, -0.1805248260498047, -0.17283248901367188, -0.16514015197753906, -0.15744781494140625, -0.14975547790527344, -0.14206314086914062, -0.1343708038330078, -0.126678466796875, -0.11898612976074219, -0.11129379272460938, -0.10360145568847656, -0.09590911865234375, -0.08821678161621094, -0.08052444458007812, -0.07283210754394531, -0.0651397705078125, -0.05744743347167969, -0.049755096435546875, -0.04206275939941406, -0.03437042236328125, -0.026678085327148438, -0.018985748291015625, -0.011293411254882812, -0.00360107421875, 0.0040912628173828125, 0.011783599853515625, 0.019475936889648438, 0.02716827392578125, 0.03486061096191406, 0.042552947998046875, 0.05024528503417969, 0.0579376220703125, 0.06562995910644531, 0.07332229614257812, 0.08101463317871094, 0.08870697021484375, 0.09639930725097656, 0.10409164428710938, 0.11178398132324219, 0.119476318359375, 0.1271686553955078, 0.13486099243164062, 0.14255332946777344, 0.15024566650390625, 0.15793800354003906, 0.16563034057617188, 0.1733226776123047, 0.1810150146484375, 0.1887073516845703, 0.19639968872070312, 0.20409202575683594, 0.21178436279296875, 0.21947669982910156, 0.22716903686523438, 0.2348613739013672, 0.2425537109375]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 5.0, 3.0, 3.0, 7.0, 12.0, 8.0, 6.0, 14.0, 19.0, 6.0, 16.0, 6.0, 28.0, 18.0, 18.0, 24.0, 32.0, 33.0, 38.0, 37.0, 38.0, 43.0, 37.0, 39.0, 1054.0, 45.0, 36.0, 40.0, 41.0, 38.0, 24.0, 31.0, 23.0, 34.0, 23.0, 30.0, 17.0, 22.0, 17.0, 15.0, 12.0, 6.0, 10.0, 5.0, 4.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.326171875, -1.2820587158203125, -1.237945556640625, -1.1938323974609375, -1.14971923828125, -1.1056060791015625, -1.061492919921875, -1.0173797607421875, -0.9732666015625, -0.9291534423828125, -0.885040283203125, -0.8409271240234375, -0.79681396484375, -0.7527008056640625, -0.708587646484375, -0.6644744873046875, -0.620361328125, -0.5762481689453125, -0.532135009765625, -0.4880218505859375, -0.44390869140625, -0.3997955322265625, -0.355682373046875, -0.3115692138671875, -0.2674560546875, -0.2233428955078125, -0.179229736328125, -0.1351165771484375, -0.09100341796875, -0.0468902587890625, -0.002777099609375, 0.0413360595703125, 0.08544921875, 0.1295623779296875, 0.173675537109375, 0.2177886962890625, 0.26190185546875, 0.3060150146484375, 0.350128173828125, 0.3942413330078125, 0.4383544921875, 0.4824676513671875, 0.526580810546875, 0.5706939697265625, 0.61480712890625, 0.6589202880859375, 0.703033447265625, 0.7471466064453125, 0.791259765625, 0.8353729248046875, 0.879486083984375, 0.9235992431640625, 0.96771240234375, 1.0118255615234375, 1.055938720703125, 1.1000518798828125, 1.1441650390625, 1.1882781982421875, 1.232391357421875, 1.2765045166015625, 1.32061767578125, 1.3647308349609375, 1.408843994140625, 1.4529571533203125, 1.4970703125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 6.0, 5.0, 9.0, 22.0, 22.0, 32.0, 54.0, 89.0, 110.0, 192.0, 256.0, 416.0, 620.0, 914.0, 1514.0, 2233.0, 3428.0, 5151.0, 8128.0, 12722.0, 19324.0, 28964.0, 43851.0, 63639.0, 88532.0, 117569.0, 787983.0, 521285.0, 115115.0, 87754.0, 62387.0, 42753.0, 28508.0, 18707.0, 12207.0, 7958.0, 5107.0, 3372.0, 2088.0, 1381.0, 946.0, 645.0, 367.0, 263.0, 187.0, 98.0, 69.0, 59.0, 30.0, 29.0, 12.0, 15.0, 2.0, 3.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.11224365234375, -0.10849857330322266, -0.10475349426269531, -0.10100841522216797, -0.09726333618164062, -0.09351825714111328, -0.08977317810058594, -0.0860280990600586, -0.08228302001953125, -0.0785379409790039, -0.07479286193847656, -0.07104778289794922, -0.06730270385742188, -0.06355762481689453, -0.05981254577636719, -0.056067466735839844, -0.0523223876953125, -0.048577308654785156, -0.04483222961425781, -0.04108715057373047, -0.037342071533203125, -0.03359699249267578, -0.029851913452148438, -0.026106834411621094, -0.02236175537109375, -0.018616676330566406, -0.014871597290039062, -0.011126518249511719, -0.007381439208984375, -0.0036363601684570312, 0.0001087188720703125, 0.0038537979125976562, 0.007598876953125, 0.011343955993652344, 0.015089035034179688, 0.01883411407470703, 0.022579193115234375, 0.02632427215576172, 0.030069351196289062, 0.033814430236816406, 0.03755950927734375, 0.041304588317871094, 0.04504966735839844, 0.04879474639892578, 0.052539825439453125, 0.05628490447998047, 0.06002998352050781, 0.06377506256103516, 0.0675201416015625, 0.07126522064208984, 0.07501029968261719, 0.07875537872314453, 0.08250045776367188, 0.08624553680419922, 0.08999061584472656, 0.0937356948852539, 0.09748077392578125, 0.1012258529663086, 0.10497093200683594, 0.10871601104736328, 0.11246109008789062, 0.11620616912841797, 0.11995124816894531, 0.12369632720947266, 0.12744140625]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 4.0, 9.0, 7.0, 9.0, 23.0, 21.0, 27.0, 30.0, 48.0, 72.0, 136.0, 252.0, 120.0, 75.0, 30.0, 34.0, 29.0, 25.0, 10.0, 14.0, 9.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.01226043701171875, -0.011882305145263672, -0.011504173278808594, -0.011126041412353516, -0.010747909545898438, -0.01036977767944336, -0.009991645812988281, -0.009613513946533203, -0.009235382080078125, -0.008857250213623047, -0.008479118347167969, -0.00810098648071289, -0.0077228546142578125, -0.007344722747802734, -0.006966590881347656, -0.006588459014892578, -0.0062103271484375, -0.005832195281982422, -0.005454063415527344, -0.005075931549072266, -0.0046977996826171875, -0.004319667816162109, -0.003941535949707031, -0.003563404083251953, -0.003185272216796875, -0.002807140350341797, -0.0024290084838867188, -0.0020508766174316406, -0.0016727447509765625, -0.0012946128845214844, -0.0009164810180664062, -0.0005383491516113281, -0.00016021728515625, 0.00021791458129882812, 0.0005960464477539062, 0.0009741783142089844, 0.0013523101806640625, 0.0017304420471191406, 0.0021085739135742188, 0.002486705780029297, 0.002864837646484375, 0.003242969512939453, 0.0036211013793945312, 0.003999233245849609, 0.0043773651123046875, 0.004755496978759766, 0.005133628845214844, 0.005511760711669922, 0.005889892578125, 0.006268024444580078, 0.006646156311035156, 0.007024288177490234, 0.0074024200439453125, 0.007780551910400391, 0.008158683776855469, 0.008536815643310547, 0.008914947509765625, 0.009293079376220703, 0.009671211242675781, 0.01004934310913086, 0.010427474975585938, 0.010805606842041016, 0.011183738708496094, 0.011561870574951172, 0.01194000244140625]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 8.0, 6.0, 8.0, 6.0, 9.0, 11.0, 19.0, 15.0, 23.0, 17.0, 31.0, 41.0, 50.0, 92.0, 139.0, 195.0, 318.0, 710.0, 4018.0, 651953.0, 385617.0, 3622.0, 690.0, 310.0, 186.0, 122.0, 85.0, 50.0, 43.0, 27.0, 26.0, 17.0, 12.0, 13.0, 12.0, 10.0, 7.0, 8.0, 8.0, 4.0, 4.0, 2.0, 5.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.22021484375, -0.21373367309570312, -0.20725250244140625, -0.20077133178710938, -0.1942901611328125, -0.18780899047851562, -0.18132781982421875, -0.17484664916992188, -0.168365478515625, -0.16188430786132812, -0.15540313720703125, -0.14892196655273438, -0.1424407958984375, -0.13595962524414062, -0.12947845458984375, -0.12299728393554688, -0.11651611328125, -0.11003494262695312, -0.10355377197265625, -0.09707260131835938, -0.0905914306640625, -0.08411026000976562, -0.07762908935546875, -0.07114791870117188, -0.064666748046875, -0.058185577392578125, -0.05170440673828125, -0.045223236083984375, -0.0387420654296875, -0.032260894775390625, -0.02577972412109375, -0.019298553466796875, -0.0128173828125, -0.006336212158203125, 0.00014495849609375, 0.006626129150390625, 0.0131072998046875, 0.019588470458984375, 0.02606964111328125, 0.032550811767578125, 0.039031982421875, 0.045513153076171875, 0.05199432373046875, 0.058475494384765625, 0.0649566650390625, 0.07143783569335938, 0.07791900634765625, 0.08440017700195312, 0.09088134765625, 0.09736251831054688, 0.10384368896484375, 0.11032485961914062, 0.1168060302734375, 0.12328720092773438, 0.12976837158203125, 0.13624954223632812, 0.142730712890625, 0.14921188354492188, 0.15569305419921875, 0.16217422485351562, 0.1686553955078125, 0.17513656616210938, 0.18161773681640625, 0.18809890747070312, 0.194580078125]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 6.0, 24.0, 66.0, 412.0, 444.0, 55.0, 9.0], "bins": [-0.21687912940979004, -0.21332520246505737, -0.2097712755203247, -0.20621734857559204, -0.20266342163085938, -0.1991094946861267, -0.19555556774139404, -0.19200164079666138, -0.1884477138519287, -0.18489378690719604, -0.18133985996246338, -0.1777859330177307, -0.17423200607299805, -0.17067807912826538, -0.16712415218353271, -0.16357022523880005, -0.16001631319522858, -0.1564623862504959, -0.15290845930576324, -0.14935453236103058, -0.1458006054162979, -0.14224667847156525, -0.13869275152683258, -0.1351388394832611, -0.13158491253852844, -0.12803098559379578, -0.12447705864906311, -0.12092313170433044, -0.11736920475959778, -0.11381527781486511, -0.11026135832071304, -0.10670743137598038, -0.10315349698066711, -0.09959957003593445, -0.09604564309120178, -0.09249171614646912, -0.08893778920173645, -0.08538386225700378, -0.08182994276285172, -0.07827601581811905, -0.07472209632396698, -0.07116816937923431, -0.06761424243450165, -0.06406031548976898, -0.060506392270326614, -0.05695246532559395, -0.05339854210615158, -0.049844615161418915, -0.04629068449139595, -0.042736757546663284, -0.03918283432722092, -0.03562890738248825, -0.032074980437755585, -0.02852105349302292, -0.024967128410935402, -0.021413203328847885, -0.01785927638411522, -0.014305350370705128, -0.010751424357295036, -0.007197498343884945, -0.0036435723304748535, -8.96453857421875e-05, 0.0034642796963453293, 0.007018204778432846, 0.010572131723165512]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 3.0, 5.0, 2.0, 4.0, 7.0, 6.0, 10.0, 7.0, 17.0, 11.0, 16.0, 19.0, 22.0, 23.0, 17.0, 34.0, 37.0, 38.0, 34.0, 40.0, 37.0, 47.0, 44.0, 38.0, 52.0, 42.0, 42.0, 46.0, 30.0, 21.0, 37.0, 23.0, 31.0, 24.0, 22.0, 24.0, 14.0, 14.0, 12.0, 12.0, 10.0, 8.0, 6.0, 5.0, 5.0, 5.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0042945146560668945, -0.004139101132750511, -0.003983687609434128, -0.0038282740861177444, -0.003672860562801361, -0.0035174470394849777, -0.0033620335161685944, -0.003206619992852211, -0.0030512064695358276, -0.0028957929462194443, -0.002740379422903061, -0.0025849658995866776, -0.002429552376270294, -0.002274138852953911, -0.0021187253296375275, -0.001963311806321144, -0.0018078982830047607, -0.0016524847596883774, -0.001497071236371994, -0.0013416577130556107, -0.0011862441897392273, -0.001030830666422844, -0.0008754171431064606, -0.0007200036197900772, -0.0005645900964736938, -0.0004091765731573105, -0.0002537630498409271, -9.834952652454376e-05, 5.70639967918396e-05, 0.00021247752010822296, 0.0003678910434246063, 0.0005233045667409897, 0.000678718090057373, 0.0008341316133737564, 0.0009895451366901398, 0.0011449586600065231, 0.0013003721833229065, 0.0014557857066392899, 0.0016111992299556732, 0.0017666127532720566, 0.00192202627658844, 0.0020774397999048233, 0.0022328533232212067, 0.00238826684653759, 0.0025436803698539734, 0.0026990938931703568, 0.00285450741648674, 0.0030099209398031235, 0.003165334463119507, 0.00332074798643589, 0.0034761615097522736, 0.003631575033068657, 0.0037869885563850403, 0.003942402079701424, 0.004097815603017807, 0.00425322912633419, 0.004408642649650574, 0.004564056172966957, 0.0047194696962833405, 0.004874883219599724, 0.005030296742916107, 0.0051857102662324905, 0.005341123789548874, 0.005496537312865257, 0.005651950836181641]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 6.0, 8.0, 10.0, 9.0, 9.0, 16.0, 17.0, 19.0, 17.0, 22.0, 18.0, 30.0, 33.0, 26.0, 25.0, 42.0, 41.0, 30.0, 43.0, 52.0, 53.0, 47.0, 32.0, 45.0, 32.0, 45.0, 38.0, 30.0, 23.0, 27.0, 21.0, 28.0, 18.0, 17.0, 25.0, 7.0, 14.0, 8.0, 4.0, 7.0, 2.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.298828125, -2.230072021484375, -2.16131591796875, -2.092559814453125, -2.0238037109375, -1.955047607421875, -1.88629150390625, -1.817535400390625, -1.748779296875, -1.680023193359375, -1.61126708984375, -1.542510986328125, -1.4737548828125, -1.404998779296875, -1.33624267578125, -1.267486572265625, -1.19873046875, -1.129974365234375, -1.06121826171875, -0.992462158203125, -0.9237060546875, -0.854949951171875, -0.78619384765625, -0.717437744140625, -0.648681640625, -0.579925537109375, -0.51116943359375, -0.442413330078125, -0.3736572265625, -0.304901123046875, -0.23614501953125, -0.167388916015625, -0.0986328125, -0.029876708984375, 0.03887939453125, 0.107635498046875, 0.1763916015625, 0.245147705078125, 0.31390380859375, 0.382659912109375, 0.451416015625, 0.520172119140625, 0.58892822265625, 0.657684326171875, 0.7264404296875, 0.795196533203125, 0.86395263671875, 0.932708740234375, 1.00146484375, 1.070220947265625, 1.13897705078125, 1.207733154296875, 1.2764892578125, 1.345245361328125, 1.41400146484375, 1.482757568359375, 1.551513671875, 1.620269775390625, 1.68902587890625, 1.757781982421875, 1.8265380859375, 1.895294189453125, 1.96405029296875, 2.032806396484375, 2.1015625]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 7.0, 4.0, 18.0, 15.0, 41.0, 46.0, 73.0, 132.0, 187.0, 276.0, 420.0, 665.0, 994.0, 1591.0, 2431.0, 3792.0, 6061.0, 10133.0, 18502.0, 37262.0, 88424.0, 238020.0, 356693.0, 158297.0, 61065.0, 27069.0, 14335.0, 8204.0, 4800.0, 3143.0, 2028.0, 1320.0, 888.0, 589.0, 373.0, 252.0, 140.0, 100.0, 63.0, 45.0, 28.0, 13.0, 12.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0], "bins": [-1.9951171875, -1.941619873046875, -1.88812255859375, -1.834625244140625, -1.7811279296875, -1.727630615234375, -1.67413330078125, -1.620635986328125, -1.567138671875, -1.513641357421875, -1.46014404296875, -1.406646728515625, -1.3531494140625, -1.299652099609375, -1.24615478515625, -1.192657470703125, -1.13916015625, -1.085662841796875, -1.03216552734375, -0.978668212890625, -0.9251708984375, -0.871673583984375, -0.81817626953125, -0.764678955078125, -0.711181640625, -0.657684326171875, -0.60418701171875, -0.550689697265625, -0.4971923828125, -0.443695068359375, -0.39019775390625, -0.336700439453125, -0.283203125, -0.229705810546875, -0.17620849609375, -0.122711181640625, -0.0692138671875, -0.015716552734375, 0.03778076171875, 0.091278076171875, 0.144775390625, 0.198272705078125, 0.25177001953125, 0.305267333984375, 0.3587646484375, 0.412261962890625, 0.46575927734375, 0.519256591796875, 0.57275390625, 0.626251220703125, 0.67974853515625, 0.733245849609375, 0.7867431640625, 0.840240478515625, 0.89373779296875, 0.947235107421875, 1.000732421875, 1.054229736328125, 1.10772705078125, 1.161224365234375, 1.2147216796875, 1.268218994140625, 1.32171630859375, 1.375213623046875, 1.4287109375]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 4.0, 2.0, 7.0, 3.0, 5.0, 9.0, 10.0, 17.0, 17.0, 12.0, 24.0, 19.0, 22.0, 22.0, 25.0, 42.0, 33.0, 46.0, 37.0, 52.0, 61.0, 171.0, 1524.0, 350.0, 110.0, 63.0, 43.0, 37.0, 34.0, 31.0, 27.0, 27.0, 29.0, 18.0, 21.0, 16.0, 13.0, 12.0, 6.0, 12.0, 11.0, 10.0, 4.0, 7.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-7.99609375, -7.7528076171875, -7.509521484375, -7.2662353515625, -7.02294921875, -6.7796630859375, -6.536376953125, -6.2930908203125, -6.0498046875, -5.8065185546875, -5.563232421875, -5.3199462890625, -5.07666015625, -4.8333740234375, -4.590087890625, -4.3468017578125, -4.103515625, -3.8602294921875, -3.616943359375, -3.3736572265625, -3.13037109375, -2.8870849609375, -2.643798828125, -2.4005126953125, -2.1572265625, -1.9139404296875, -1.670654296875, -1.4273681640625, -1.18408203125, -0.9407958984375, -0.697509765625, -0.4542236328125, -0.2109375, 0.0323486328125, 0.275634765625, 0.5189208984375, 0.76220703125, 1.0054931640625, 1.248779296875, 1.4920654296875, 1.7353515625, 1.9786376953125, 2.221923828125, 2.4652099609375, 2.70849609375, 2.9517822265625, 3.195068359375, 3.4383544921875, 3.681640625, 3.9249267578125, 4.168212890625, 4.4114990234375, 4.65478515625, 4.8980712890625, 5.141357421875, 5.3846435546875, 5.6279296875, 5.8712158203125, 6.114501953125, 6.3577880859375, 6.60107421875, 6.8443603515625, 7.087646484375, 7.3309326171875, 7.57421875]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 5.0, 0.0, 4.0, 3.0, 6.0, 4.0, 7.0, 7.0, 11.0, 9.0, 13.0, 11.0, 24.0, 21.0, 25.0, 36.0, 43.0, 68.0, 88.0, 132.0, 235.0, 455.0, 1271.0, 8314.0, 203147.0, 2877153.0, 48882.0, 3906.0, 841.0, 365.0, 169.0, 114.0, 80.0, 44.0, 37.0, 29.0, 24.0, 25.0, 30.0, 17.0, 10.0, 11.0, 10.0, 4.0, 3.0, 9.0, 8.0, 1.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.578125, -11.1832275390625, -10.788330078125, -10.3934326171875, -9.99853515625, -9.6036376953125, -9.208740234375, -8.8138427734375, -8.4189453125, -8.0240478515625, -7.629150390625, -7.2342529296875, -6.83935546875, -6.4444580078125, -6.049560546875, -5.6546630859375, -5.259765625, -4.8648681640625, -4.469970703125, -4.0750732421875, -3.68017578125, -3.2852783203125, -2.890380859375, -2.4954833984375, -2.1005859375, -1.7056884765625, -1.310791015625, -0.9158935546875, -0.52099609375, -0.1260986328125, 0.268798828125, 0.6636962890625, 1.05859375, 1.4534912109375, 1.848388671875, 2.2432861328125, 2.63818359375, 3.0330810546875, 3.427978515625, 3.8228759765625, 4.2177734375, 4.6126708984375, 5.007568359375, 5.4024658203125, 5.79736328125, 6.1922607421875, 6.587158203125, 6.9820556640625, 7.376953125, 7.7718505859375, 8.166748046875, 8.5616455078125, 8.95654296875, 9.3514404296875, 9.746337890625, 10.1412353515625, 10.5361328125, 10.9310302734375, 11.325927734375, 11.7208251953125, 12.11572265625, 12.5106201171875, 12.905517578125, 13.3004150390625, 13.6953125]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 385.0, 631.0, 2.0, 0.0, 0.0, 1.0], "bins": [-253.60528564453125, -249.31167602539062, -245.01806640625, -240.7244415283203, -236.4308319091797, -232.13722229003906, -227.84361267089844, -223.5500030517578, -219.25637817382812, -214.9627685546875, -210.66915893554688, -206.3755340576172, -202.08192443847656, -197.78831481933594, -193.4947052001953, -189.2010955810547, -184.90748596191406, -180.61387634277344, -176.3202667236328, -172.02664184570312, -167.7330322265625, -163.43942260742188, -159.14581298828125, -154.85220336914062, -150.55859375, -146.26498413085938, -141.97137451171875, -137.67774963378906, -133.38414001464844, -129.0905303955078, -124.79692077636719, -120.50331115722656, -116.20967864990234, -111.91606903076172, -107.62245178222656, -103.32884216308594, -99.03523254394531, -94.74161529541016, -90.44800567626953, -86.15438842773438, -81.86077880859375, -77.56716918945312, -73.27355194091797, -68.97994232177734, -64.68632507324219, -60.39271545410156, -56.09910583496094, -51.80549240112305, -47.511878967285156, -43.218265533447266, -38.924652099609375, -34.63104248046875, -30.33742904663086, -26.04381561279297, -21.75020408630371, -17.456592559814453, -13.162979125976562, -8.869366645812988, -4.575754165649414, -0.28214168548583984, 4.011470794677734, 8.305084228515625, 12.598695755004883, 16.89230728149414, 21.18592071533203]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 1.0, 4.0, 6.0, 7.0, 8.0, 8.0, 11.0, 9.0, 15.0, 9.0, 12.0, 19.0, 23.0, 25.0, 37.0, 27.0, 26.0, 31.0, 47.0, 34.0, 38.0, 45.0, 32.0, 50.0, 48.0, 26.0, 36.0, 40.0, 41.0, 42.0, 26.0, 37.0, 24.0, 33.0, 20.0, 20.0, 16.0, 14.0, 11.0, 6.0, 5.0, 9.0, 10.0, 5.0, 6.0, 1.0, 3.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.641633987426758, -23.86092758178711, -23.08022117614746, -22.299514770507812, -21.518808364868164, -20.738101959228516, -19.957395553588867, -19.17668914794922, -18.39598274230957, -17.615276336669922, -16.834569931030273, -16.053863525390625, -15.273157119750977, -14.492450714111328, -13.71174430847168, -12.931037902832031, -12.150331497192383, -11.369625091552734, -10.588918685913086, -9.808212280273438, -9.027505874633789, -8.24679946899414, -7.466093063354492, -6.685386657714844, -5.904680252075195, -5.123973846435547, -4.343267440795898, -3.56256103515625, -2.7818546295166016, -2.001148223876953, -1.2204418182373047, -0.43973541259765625, 0.340972900390625, 1.1216793060302734, 1.9023857116699219, 2.6830921173095703, 3.4637985229492188, 4.244504928588867, 5.025211334228516, 5.805917739868164, 6.5866241455078125, 7.367330551147461, 8.14803695678711, 8.928743362426758, 9.709449768066406, 10.490156173706055, 11.270862579345703, 12.051568984985352, 12.832275390625, 13.612981796264648, 14.393688201904297, 15.174394607543945, 15.955101013183594, 16.735807418823242, 17.51651382446289, 18.29722023010254, 19.077926635742188, 19.858633041381836, 20.639339447021484, 21.420045852661133, 22.20075225830078, 22.98145866394043, 23.762165069580078, 24.542871475219727, 25.323577880859375]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 7.0, 1.0, 5.0, 5.0, 13.0, 10.0, 12.0, 11.0, 16.0, 11.0, 25.0, 24.0, 24.0, 22.0, 25.0, 32.0, 32.0, 36.0, 31.0, 49.0, 42.0, 49.0, 46.0, 47.0, 36.0, 32.0, 32.0, 54.0, 45.0, 23.0, 22.0, 21.0, 26.0, 29.0, 18.0, 17.0, 15.0, 20.0, 10.0, 9.0, 7.0, 4.0, 5.0, 2.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.36328125, -2.29254150390625, -2.2218017578125, -2.15106201171875, -2.080322265625, -2.00958251953125, -1.9388427734375, -1.86810302734375, -1.79736328125, -1.72662353515625, -1.6558837890625, -1.58514404296875, -1.514404296875, -1.44366455078125, -1.3729248046875, -1.30218505859375, -1.2314453125, -1.16070556640625, -1.0899658203125, -1.01922607421875, -0.948486328125, -0.87774658203125, -0.8070068359375, -0.73626708984375, -0.66552734375, -0.59478759765625, -0.5240478515625, -0.45330810546875, -0.382568359375, -0.31182861328125, -0.2410888671875, -0.17034912109375, -0.099609375, -0.02886962890625, 0.0418701171875, 0.11260986328125, 0.183349609375, 0.25408935546875, 0.3248291015625, 0.39556884765625, 0.46630859375, 0.53704833984375, 0.6077880859375, 0.67852783203125, 0.749267578125, 0.82000732421875, 0.8907470703125, 0.96148681640625, 1.0322265625, 1.10296630859375, 1.1737060546875, 1.24444580078125, 1.315185546875, 1.38592529296875, 1.4566650390625, 1.52740478515625, 1.59814453125, 1.66888427734375, 1.7396240234375, 1.81036376953125, 1.881103515625, 1.95184326171875, 2.0225830078125, 2.09332275390625, 2.1640625]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 7.0, 7.0, 12.0, 7.0, 11.0, 8.0, 14.0, 15.0, 22.0, 31.0, 23.0, 36.0, 37.0, 83.0, 98.0, 131.0, 231.0, 640.0, 2543.0, 12839.0, 85243.0, 1174053.0, 2685708.0, 201230.0, 24785.0, 4504.0, 1027.0, 316.0, 176.0, 100.0, 72.0, 60.0, 47.0, 29.0, 20.0, 24.0, 19.0, 18.0, 10.0, 14.0, 5.0, 8.0, 4.0, 5.0, 5.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 3.0], "bins": [-10.5, -10.19287109375, -9.8857421875, -9.57861328125, -9.271484375, -8.96435546875, -8.6572265625, -8.35009765625, -8.04296875, -7.73583984375, -7.4287109375, -7.12158203125, -6.814453125, -6.50732421875, -6.2001953125, -5.89306640625, -5.5859375, -5.27880859375, -4.9716796875, -4.66455078125, -4.357421875, -4.05029296875, -3.7431640625, -3.43603515625, -3.12890625, -2.82177734375, -2.5146484375, -2.20751953125, -1.900390625, -1.59326171875, -1.2861328125, -0.97900390625, -0.671875, -0.36474609375, -0.0576171875, 0.24951171875, 0.556640625, 0.86376953125, 1.1708984375, 1.47802734375, 1.78515625, 2.09228515625, 2.3994140625, 2.70654296875, 3.013671875, 3.32080078125, 3.6279296875, 3.93505859375, 4.2421875, 4.54931640625, 4.8564453125, 5.16357421875, 5.470703125, 5.77783203125, 6.0849609375, 6.39208984375, 6.69921875, 7.00634765625, 7.3134765625, 7.62060546875, 7.927734375, 8.23486328125, 8.5419921875, 8.84912109375, 9.15625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 13.0, 15.0, 18.0, 18.0, 36.0, 49.0, 64.0, 96.0, 146.0, 180.0, 235.0, 359.0, 458.0, 462.0, 498.0, 433.0, 297.0, 199.0, 147.0, 108.0, 62.0, 60.0, 37.0, 21.0, 22.0, 9.0, 10.0, 5.0, 5.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-10.765625, -10.50750732421875, -10.2493896484375, -9.99127197265625, -9.733154296875, -9.47503662109375, -9.2169189453125, -8.95880126953125, -8.70068359375, -8.44256591796875, -8.1844482421875, -7.92633056640625, -7.668212890625, -7.41009521484375, -7.1519775390625, -6.89385986328125, -6.6357421875, -6.37762451171875, -6.1195068359375, -5.86138916015625, -5.603271484375, -5.34515380859375, -5.0870361328125, -4.82891845703125, -4.57080078125, -4.31268310546875, -4.0545654296875, -3.79644775390625, -3.538330078125, -3.28021240234375, -3.0220947265625, -2.76397705078125, -2.505859375, -2.24774169921875, -1.9896240234375, -1.73150634765625, -1.473388671875, -1.21527099609375, -0.9571533203125, -0.69903564453125, -0.44091796875, -0.18280029296875, 0.0753173828125, 0.33343505859375, 0.591552734375, 0.84967041015625, 1.1077880859375, 1.36590576171875, 1.6240234375, 1.88214111328125, 2.1402587890625, 2.39837646484375, 2.656494140625, 2.91461181640625, 3.1727294921875, 3.43084716796875, 3.68896484375, 3.94708251953125, 4.2052001953125, 4.46331787109375, 4.721435546875, 4.97955322265625, 5.2376708984375, 5.49578857421875, 5.75390625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 4.0, 10.0, 7.0, 13.0, 12.0, 34.0, 53.0, 64.0, 123.0, 212.0, 381.0, 859.0, 3260.0, 37469.0, 1438805.0, 2640805.0, 65504.0, 4613.0, 964.0, 464.0, 246.0, 151.0, 68.0, 64.0, 41.0, 31.0, 11.0, 5.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-25.1875, -24.42626953125, -23.6650390625, -22.90380859375, -22.142578125, -21.38134765625, -20.6201171875, -19.85888671875, -19.09765625, -18.33642578125, -17.5751953125, -16.81396484375, -16.052734375, -15.29150390625, -14.5302734375, -13.76904296875, -13.0078125, -12.24658203125, -11.4853515625, -10.72412109375, -9.962890625, -9.20166015625, -8.4404296875, -7.67919921875, -6.91796875, -6.15673828125, -5.3955078125, -4.63427734375, -3.873046875, -3.11181640625, -2.3505859375, -1.58935546875, -0.828125, -0.06689453125, 0.6943359375, 1.45556640625, 2.216796875, 2.97802734375, 3.7392578125, 4.50048828125, 5.26171875, 6.02294921875, 6.7841796875, 7.54541015625, 8.306640625, 9.06787109375, 9.8291015625, 10.59033203125, 11.3515625, 12.11279296875, 12.8740234375, 13.63525390625, 14.396484375, 15.15771484375, 15.9189453125, 16.68017578125, 17.44140625, 18.20263671875, 18.9638671875, 19.72509765625, 20.486328125, 21.24755859375, 22.0087890625, 22.77001953125, 23.53125]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 9.0, 33.0, 92.0, 164.0, 225.0, 217.0, 150.0, 76.0, 31.0, 11.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.0709114074707, -55.74771499633789, -53.424522399902344, -51.10132598876953, -48.77812957763672, -46.454933166503906, -44.131736755371094, -41.80854415893555, -39.485347747802734, -37.16215133666992, -34.838958740234375, -32.51576232910156, -30.19256591796875, -27.869369506835938, -25.546175003051758, -23.222980499267578, -20.899784088134766, -18.576587677001953, -16.253393173217773, -13.930197715759277, -11.607002258300781, -9.283806800842285, -6.960611343383789, -4.637416839599609, -2.314220428466797, 0.008975028991699219, 2.3321704864501953, 4.655365943908691, 6.9785614013671875, 9.301756858825684, 11.62495231628418, 13.94814682006836, 16.271347045898438, 18.59454345703125, 20.91773796081543, 23.24093246459961, 25.564128875732422, 27.887325286865234, 30.210519790649414, 32.533714294433594, 34.856910705566406, 37.18010711669922, 39.50330352783203, 41.82649612426758, 44.14969253540039, 46.4728889465332, 48.79608154296875, 51.11927795410156, 53.442474365234375, 55.76567077636719, 58.0888671875, 60.41205978393555, 62.73525619506836, 65.0584487915039, 67.38164520263672, 69.70484161376953, 72.02803802490234, 74.35123443603516, 76.67443084716797, 78.99762725830078, 81.32081604003906, 83.64401245117188, 85.96720886230469, 88.2904052734375, 90.61360168457031]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 6.0, 4.0, 4.0, 4.0, 10.0, 12.0, 17.0, 13.0, 16.0, 22.0, 11.0, 26.0, 24.0, 33.0, 32.0, 35.0, 33.0, 43.0, 30.0, 49.0, 36.0, 40.0, 53.0, 30.0, 38.0, 40.0, 42.0, 36.0, 31.0, 16.0, 29.0, 17.0, 31.0, 12.0, 17.0, 18.0, 16.0, 16.0, 11.0, 7.0, 8.0, 8.0, 10.0, 5.0, 5.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-24.102630615234375, -23.330764770507812, -22.558897018432617, -21.787031173706055, -21.01516342163086, -20.243297576904297, -19.4714298248291, -18.69956398010254, -17.927696228027344, -17.15583038330078, -16.383962631225586, -15.612095832824707, -14.840229034423828, -14.06836223602295, -13.29649543762207, -12.524629592895508, -11.752762794494629, -10.98089599609375, -10.209029197692871, -9.437162399291992, -8.665295600891113, -7.893428802490234, -7.121562480926514, -6.349695682525635, -5.577828884124756, -4.805962085723877, -4.034095287322998, -3.2622287273406982, -2.4903619289398193, -1.7184951305389404, -0.9466285705566406, -0.17476177215576172, 0.5971050262451172, 1.368971824645996, 2.140838623046875, 2.912705183029175, 3.6845719814300537, 4.456439018249512, 5.228305339813232, 6.000172138214111, 6.77203893661499, 7.543905735015869, 8.31577205657959, 9.087638854980469, 9.859505653381348, 10.631372451782227, 11.403239250183105, 12.175106048583984, 12.946972846984863, 13.718839645385742, 14.490706443786621, 15.2625732421875, 16.034439086914062, 16.806306838989258, 17.57817268371582, 18.350040435791016, 19.121906280517578, 19.89377212524414, 20.665639877319336, 21.4375057220459, 22.209373474121094, 22.981239318847656, 23.75310707092285, 24.524972915649414, 25.29684066772461]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 6.0, 8.0, 5.0, 8.0, 13.0, 5.0, 19.0, 16.0, 18.0, 27.0, 23.0, 16.0, 29.0, 35.0, 34.0, 29.0, 42.0, 44.0, 54.0, 33.0, 42.0, 49.0, 34.0, 43.0, 42.0, 33.0, 37.0, 29.0, 32.0, 33.0, 29.0, 25.0, 16.0, 20.0, 18.0, 7.0, 15.0, 7.0, 5.0, 7.0, 6.0, 7.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.322265625, -2.24658203125, -2.1708984375, -2.09521484375, -2.01953125, -1.94384765625, -1.8681640625, -1.79248046875, -1.716796875, -1.64111328125, -1.5654296875, -1.48974609375, -1.4140625, -1.33837890625, -1.2626953125, -1.18701171875, -1.111328125, -1.03564453125, -0.9599609375, -0.88427734375, -0.80859375, -0.73291015625, -0.6572265625, -0.58154296875, -0.505859375, -0.43017578125, -0.3544921875, -0.27880859375, -0.203125, -0.12744140625, -0.0517578125, 0.02392578125, 0.099609375, 0.17529296875, 0.2509765625, 0.32666015625, 0.40234375, 0.47802734375, 0.5537109375, 0.62939453125, 0.705078125, 0.78076171875, 0.8564453125, 0.93212890625, 1.0078125, 1.08349609375, 1.1591796875, 1.23486328125, 1.310546875, 1.38623046875, 1.4619140625, 1.53759765625, 1.61328125, 1.68896484375, 1.7646484375, 1.84033203125, 1.916015625, 1.99169921875, 2.0673828125, 2.14306640625, 2.21875, 2.29443359375, 2.3701171875, 2.44580078125, 2.521484375]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 5.0, 2.0, 3.0, 0.0, 12.0, 14.0, 14.0, 25.0, 28.0, 35.0, 58.0, 71.0, 130.0, 224.0, 296.0, 449.0, 774.0, 1236.0, 2012.0, 3597.0, 6358.0, 11591.0, 21553.0, 40549.0, 75667.0, 135172.0, 208545.0, 216668.0, 144833.0, 81993.0, 44159.0, 23510.0, 12538.0, 6830.0, 3781.0, 2228.0, 1262.0, 817.0, 494.0, 318.0, 238.0, 133.0, 116.0, 70.0, 46.0, 46.0, 14.0, 22.0, 15.0, 6.0, 6.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.296142578125, -0.28629302978515625, -0.2764434814453125, -0.26659393310546875, -0.256744384765625, -0.24689483642578125, -0.2370452880859375, -0.22719573974609375, -0.21734619140625, -0.20749664306640625, -0.1976470947265625, -0.18779754638671875, -0.177947998046875, -0.16809844970703125, -0.1582489013671875, -0.14839935302734375, -0.1385498046875, -0.12870025634765625, -0.1188507080078125, -0.10900115966796875, -0.099151611328125, -0.08930206298828125, -0.0794525146484375, -0.06960296630859375, -0.05975341796875, -0.04990386962890625, -0.0400543212890625, -0.03020477294921875, -0.020355224609375, -0.01050567626953125, -0.0006561279296875, 0.00919342041015625, 0.01904296875, 0.02889251708984375, 0.0387420654296875, 0.04859161376953125, 0.058441162109375, 0.06829071044921875, 0.0781402587890625, 0.08798980712890625, 0.09783935546875, 0.10768890380859375, 0.1175384521484375, 0.12738800048828125, 0.137237548828125, 0.14708709716796875, 0.1569366455078125, 0.16678619384765625, 0.1766357421875, 0.18648529052734375, 0.1963348388671875, 0.20618438720703125, 0.216033935546875, 0.22588348388671875, 0.2357330322265625, 0.24558258056640625, 0.25543212890625, 0.26528167724609375, 0.2751312255859375, 0.28498077392578125, 0.294830322265625, 0.30467987060546875, 0.3145294189453125, 0.32437896728515625, 0.334228515625]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 8.0, 6.0, 9.0, 6.0, 10.0, 11.0, 15.0, 18.0, 26.0, 23.0, 30.0, 33.0, 19.0, 30.0, 32.0, 36.0, 29.0, 35.0, 31.0, 44.0, 1063.0, 41.0, 32.0, 43.0, 29.0, 40.0, 36.0, 50.0, 29.0, 33.0, 21.0, 22.0, 28.0, 17.0, 15.0, 12.0, 14.0, 10.0, 11.0, 11.0, 2.0, 7.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.5537109375, -1.5048370361328125, -1.455963134765625, -1.4070892333984375, -1.35821533203125, -1.3093414306640625, -1.260467529296875, -1.2115936279296875, -1.1627197265625, -1.1138458251953125, -1.064971923828125, -1.0160980224609375, -0.96722412109375, -0.9183502197265625, -0.869476318359375, -0.8206024169921875, -0.771728515625, -0.7228546142578125, -0.673980712890625, -0.6251068115234375, -0.57623291015625, -0.5273590087890625, -0.478485107421875, -0.4296112060546875, -0.3807373046875, -0.3318634033203125, -0.282989501953125, -0.2341156005859375, -0.18524169921875, -0.1363677978515625, -0.087493896484375, -0.0386199951171875, 0.01025390625, 0.0591278076171875, 0.108001708984375, 0.1568756103515625, 0.20574951171875, 0.2546234130859375, 0.303497314453125, 0.3523712158203125, 0.4012451171875, 0.4501190185546875, 0.498992919921875, 0.5478668212890625, 0.59674072265625, 0.6456146240234375, 0.694488525390625, 0.7433624267578125, 0.792236328125, 0.8411102294921875, 0.889984130859375, 0.9388580322265625, 0.98773193359375, 1.0366058349609375, 1.085479736328125, 1.1343536376953125, 1.1832275390625, 1.2321014404296875, 1.280975341796875, 1.3298492431640625, 1.37872314453125, 1.4275970458984375, 1.476470947265625, 1.5253448486328125, 1.57421875]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [8.0, 2.0, 5.0, 5.0, 12.0, 8.0, 16.0, 26.0, 29.0, 53.0, 67.0, 105.0, 148.0, 205.0, 326.0, 423.0, 634.0, 941.0, 1378.0, 1960.0, 2970.0, 4360.0, 6729.0, 9863.0, 15002.0, 21922.0, 32562.0, 47649.0, 68087.0, 91808.0, 123754.0, 1031802.0, 255653.0, 109352.0, 82323.0, 59437.0, 41300.0, 28192.0, 19019.0, 12817.0, 8563.0, 5684.0, 3822.0, 2590.0, 1740.0, 1183.0, 814.0, 550.0, 375.0, 275.0, 172.0, 136.0, 106.0, 64.0, 29.0, 34.0, 16.0, 10.0, 12.0, 4.0, 6.0, 10.0, 4.0, 1.0], "bins": [-0.1214599609375, -0.11764144897460938, -0.11382293701171875, -0.11000442504882812, -0.1061859130859375, -0.10236740112304688, -0.09854888916015625, -0.09473037719726562, -0.090911865234375, -0.08709335327148438, -0.08327484130859375, -0.07945632934570312, -0.0756378173828125, -0.07181930541992188, -0.06800079345703125, -0.06418228149414062, -0.06036376953125, -0.056545257568359375, -0.05272674560546875, -0.048908233642578125, -0.0450897216796875, -0.041271209716796875, -0.03745269775390625, -0.033634185791015625, -0.029815673828125, -0.025997161865234375, -0.02217864990234375, -0.018360137939453125, -0.0145416259765625, -0.010723114013671875, -0.00690460205078125, -0.003086090087890625, 0.000732421875, 0.004550933837890625, 0.00836944580078125, 0.012187957763671875, 0.0160064697265625, 0.019824981689453125, 0.02364349365234375, 0.027462005615234375, 0.031280517578125, 0.035099029541015625, 0.03891754150390625, 0.042736053466796875, 0.0465545654296875, 0.050373077392578125, 0.05419158935546875, 0.058010101318359375, 0.06182861328125, 0.06564712524414062, 0.06946563720703125, 0.07328414916992188, 0.0771026611328125, 0.08092117309570312, 0.08473968505859375, 0.08855819702148438, 0.092376708984375, 0.09619522094726562, 0.10001373291015625, 0.10383224487304688, 0.1076507568359375, 0.11146926879882812, 0.11528778076171875, 0.11910629272460938, 0.1229248046875]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 7.0, 5.0, 7.0, 7.0, 17.0, 18.0, 19.0, 30.0, 39.0, 36.0, 85.0, 192.0, 207.0, 117.0, 60.0, 42.0, 24.0, 20.0, 15.0, 10.0, 8.0, 14.0, 6.0, 4.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02410888671875, -0.02331066131591797, -0.022512435913085938, -0.021714210510253906, -0.020915985107421875, -0.020117759704589844, -0.019319534301757812, -0.01852130889892578, -0.01772308349609375, -0.01692485809326172, -0.016126632690429688, -0.015328407287597656, -0.014530181884765625, -0.013731956481933594, -0.012933731079101562, -0.012135505676269531, -0.0113372802734375, -0.010539054870605469, -0.009740829467773438, -0.008942604064941406, -0.008144378662109375, -0.007346153259277344, -0.0065479278564453125, -0.005749702453613281, -0.00495147705078125, -0.004153251647949219, -0.0033550262451171875, -0.0025568008422851562, -0.001758575439453125, -0.0009603500366210938, -0.0001621246337890625, 0.0006361007690429688, 0.001434326171875, 0.0022325515747070312, 0.0030307769775390625, 0.0038290023803710938, 0.004627227783203125, 0.005425453186035156, 0.0062236785888671875, 0.007021903991699219, 0.00782012939453125, 0.008618354797363281, 0.009416580200195312, 0.010214805603027344, 0.011013031005859375, 0.011811256408691406, 0.012609481811523438, 0.013407707214355469, 0.0142059326171875, 0.015004158020019531, 0.015802383422851562, 0.016600608825683594, 0.017398834228515625, 0.018197059631347656, 0.018995285034179688, 0.01979351043701172, 0.02059173583984375, 0.02138996124267578, 0.022188186645507812, 0.022986412048339844, 0.023784637451171875, 0.024582862854003906, 0.025381088256835938, 0.02617931365966797, 0.0269775390625]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 4.0, 4.0, 4.0, 4.0, 6.0, 9.0, 9.0, 18.0, 23.0, 32.0, 49.0, 83.0, 102.0, 142.0, 253.0, 630.0, 3947.0, 133412.0, 900243.0, 7671.0, 1072.0, 313.0, 139.0, 128.0, 67.0, 45.0, 38.0, 23.0, 15.0, 12.0, 16.0, 11.0, 6.0, 4.0, 4.0, 6.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.364013671875, -0.35193634033203125, -0.3398590087890625, -0.32778167724609375, -0.315704345703125, -0.30362701416015625, -0.2915496826171875, -0.27947235107421875, -0.26739501953125, -0.25531768798828125, -0.2432403564453125, -0.23116302490234375, -0.219085693359375, -0.20700836181640625, -0.1949310302734375, -0.18285369873046875, -0.1707763671875, -0.15869903564453125, -0.1466217041015625, -0.13454437255859375, -0.122467041015625, -0.11038970947265625, -0.0983123779296875, -0.08623504638671875, -0.07415771484375, -0.06208038330078125, -0.0500030517578125, -0.03792572021484375, -0.025848388671875, -0.01377105712890625, -0.0016937255859375, 0.01038360595703125, 0.0224609375, 0.03453826904296875, 0.0466156005859375, 0.05869293212890625, 0.070770263671875, 0.08284759521484375, 0.0949249267578125, 0.10700225830078125, 0.11907958984375, 0.13115692138671875, 0.1432342529296875, 0.15531158447265625, 0.167388916015625, 0.17946624755859375, 0.1915435791015625, 0.20362091064453125, 0.2156982421875, 0.22777557373046875, 0.2398529052734375, 0.25193023681640625, 0.264007568359375, 0.27608489990234375, 0.2881622314453125, 0.30023956298828125, 0.31231689453125, 0.32439422607421875, 0.3364715576171875, 0.34854888916015625, 0.360626220703125, 0.37270355224609375, 0.3847808837890625, 0.39685821533203125, 0.408935546875]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 21.0, 36.0, 86.0, 278.0, 419.0, 117.0, 35.0, 11.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23239365220069885, -0.2279408872127533, -0.22348812222480774, -0.21903537213802338, -0.21458260715007782, -0.21012984216213226, -0.2056770920753479, -0.20122432708740234, -0.1967715620994568, -0.19231879711151123, -0.18786603212356567, -0.1834132820367813, -0.17896051704883575, -0.1745077520608902, -0.17005500197410583, -0.16560223698616028, -0.16114947199821472, -0.15669670701026917, -0.1522439420223236, -0.14779119193553925, -0.1433384269475937, -0.13888566195964813, -0.13443291187286377, -0.1299801468849182, -0.12552738189697266, -0.1210746169090271, -0.11662185937166214, -0.11216910183429718, -0.10771633684635162, -0.10326357185840607, -0.09881081432104111, -0.09435805678367615, -0.08990529179573059, -0.08545252680778503, -0.08099976927042007, -0.07654701173305511, -0.07209424674510956, -0.067641481757164, -0.06318872421979904, -0.058735962957143784, -0.054283205419778824, -0.049830444157123566, -0.04537768289446831, -0.04092492163181305, -0.03647216036915779, -0.03201939910650253, -0.027566637843847275, -0.023113876581192017, -0.01866111531853676, -0.0142083540558815, -0.009755592793226242, -0.005302831530570984, -0.0008500702679157257, 0.0036026909947395325, 0.00805545225739479, 0.012508213520050049, 0.016960974782705307, 0.021413736045360565, 0.025866497308015823, 0.03031925857067108, 0.03477201983332634, 0.0392247810959816, 0.043677542358636856, 0.048130303621292114, 0.05258306488394737]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 4.0, 4.0, 8.0, 8.0, 12.0, 5.0, 12.0, 15.0, 19.0, 17.0, 17.0, 19.0, 35.0, 35.0, 31.0, 41.0, 34.0, 46.0, 46.0, 38.0, 39.0, 39.0, 42.0, 41.0, 41.0, 57.0, 37.0, 34.0, 37.0, 27.0, 23.0, 29.0, 20.0, 16.0, 12.0, 18.0, 10.0, 6.0, 7.0, 10.0, 3.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.026595473289489746, -0.025811992585659027, -0.02502851001918316, -0.02424502745270729, -0.02346154674887657, -0.022678066045045853, -0.021894583478569984, -0.021111100912094116, -0.020327620208263397, -0.019544139504432678, -0.01876065693795681, -0.017977174371480942, -0.017193693667650223, -0.016410212963819504, -0.015626730397343636, -0.014843248762190342, -0.014059767127037048, -0.013276285491883755, -0.012492803856730461, -0.011709322221577168, -0.010925840586423874, -0.01014235895127058, -0.009358877316117287, -0.008575395680963993, -0.0077919140458106995, -0.007008432410657406, -0.006224950775504112, -0.005441469140350819, -0.004657987505197525, -0.0038745058700442314, -0.003091024234890938, -0.002307542599737644, -0.0015240609645843506, -0.000740579329431057, 4.290230572223663e-05, 0.0008263839408755302, 0.0016098655760288239, 0.0023933472111821175, 0.003176828846335411, 0.003960310481488705, 0.004743792116641998, 0.005527273751795292, 0.0063107553869485855, 0.007094237022101879, 0.007877718657255173, 0.008661200292408466, 0.00944468192756176, 0.010228163562715054, 0.011011645197868347, 0.01179512683302164, 0.012578608468174934, 0.013362090103328228, 0.014145571738481522, 0.014929053373634815, 0.01571253500878811, 0.016496017575263977, 0.017279498279094696, 0.018062978982925415, 0.018846461549401283, 0.01962994411587715, 0.02041342481970787, 0.02119690552353859, 0.021980388090014458, 0.022763870656490326, 0.023547351360321045]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 6.0, 8.0, 5.0, 9.0, 12.0, 5.0, 20.0, 15.0, 19.0, 26.0, 24.0, 15.0, 29.0, 35.0, 36.0, 27.0, 44.0, 43.0, 53.0, 33.0, 42.0, 50.0, 35.0, 41.0, 42.0, 33.0, 37.0, 29.0, 33.0, 32.0, 29.0, 25.0, 17.0, 20.0, 17.0, 7.0, 15.0, 7.0, 5.0, 7.0, 6.0, 7.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3203125, -2.244659423828125, -2.16900634765625, -2.093353271484375, -2.0177001953125, -1.942047119140625, -1.86639404296875, -1.790740966796875, -1.715087890625, -1.639434814453125, -1.56378173828125, -1.488128662109375, -1.4124755859375, -1.336822509765625, -1.26116943359375, -1.185516357421875, -1.10986328125, -1.034210205078125, -0.95855712890625, -0.882904052734375, -0.8072509765625, -0.731597900390625, -0.65594482421875, -0.580291748046875, -0.504638671875, -0.428985595703125, -0.35333251953125, -0.277679443359375, -0.2020263671875, -0.126373291015625, -0.05072021484375, 0.024932861328125, 0.1005859375, 0.176239013671875, 0.25189208984375, 0.327545166015625, 0.4031982421875, 0.478851318359375, 0.55450439453125, 0.630157470703125, 0.705810546875, 0.781463623046875, 0.85711669921875, 0.932769775390625, 1.0084228515625, 1.084075927734375, 1.15972900390625, 1.235382080078125, 1.31103515625, 1.386688232421875, 1.46234130859375, 1.537994384765625, 1.6136474609375, 1.689300537109375, 1.76495361328125, 1.840606689453125, 1.916259765625, 1.991912841796875, 2.06756591796875, 2.143218994140625, 2.2188720703125, 2.294525146484375, 2.37017822265625, 2.445831298828125, 2.521484375]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 4.0, 5.0, 6.0, 7.0, 19.0, 28.0, 40.0, 57.0, 74.0, 152.0, 226.0, 435.0, 768.0, 1346.0, 2499.0, 4769.0, 9164.0, 19646.0, 47151.0, 146020.0, 437697.0, 252319.0, 72424.0, 27687.0, 12506.0, 6174.0, 3249.0, 1752.0, 970.0, 547.0, 323.0, 179.0, 115.0, 72.0, 50.0, 21.0, 16.0, 10.0, 9.0, 4.0, 8.0, 4.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.177734375, -2.113128662109375, -2.04852294921875, -1.983917236328125, -1.9193115234375, -1.854705810546875, -1.79010009765625, -1.725494384765625, -1.660888671875, -1.596282958984375, -1.53167724609375, -1.467071533203125, -1.4024658203125, -1.337860107421875, -1.27325439453125, -1.208648681640625, -1.14404296875, -1.079437255859375, -1.01483154296875, -0.950225830078125, -0.8856201171875, -0.821014404296875, -0.75640869140625, -0.691802978515625, -0.627197265625, -0.562591552734375, -0.49798583984375, -0.433380126953125, -0.3687744140625, -0.304168701171875, -0.23956298828125, -0.174957275390625, -0.1103515625, -0.045745849609375, 0.01885986328125, 0.083465576171875, 0.1480712890625, 0.212677001953125, 0.27728271484375, 0.341888427734375, 0.406494140625, 0.471099853515625, 0.53570556640625, 0.600311279296875, 0.6649169921875, 0.729522705078125, 0.79412841796875, 0.858734130859375, 0.92333984375, 0.987945556640625, 1.05255126953125, 1.117156982421875, 1.1817626953125, 1.246368408203125, 1.31097412109375, 1.375579833984375, 1.440185546875, 1.504791259765625, 1.56939697265625, 1.634002685546875, 1.6986083984375, 1.763214111328125, 1.82781982421875, 1.892425537109375, 1.95703125]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 5.0, 4.0, 14.0, 10.0, 14.0, 17.0, 15.0, 14.0, 12.0, 24.0, 38.0, 36.0, 38.0, 39.0, 37.0, 52.0, 58.0, 107.0, 310.0, 1637.0, 122.0, 71.0, 41.0, 48.0, 50.0, 41.0, 33.0, 26.0, 25.0, 22.0, 24.0, 9.0, 16.0, 11.0, 9.0, 4.0, 4.0, 6.0, 7.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.421875, -8.142822265625, -7.86376953125, -7.584716796875, -7.3056640625, -7.026611328125, -6.74755859375, -6.468505859375, -6.189453125, -5.910400390625, -5.63134765625, -5.352294921875, -5.0732421875, -4.794189453125, -4.51513671875, -4.236083984375, -3.95703125, -3.677978515625, -3.39892578125, -3.119873046875, -2.8408203125, -2.561767578125, -2.28271484375, -2.003662109375, -1.724609375, -1.445556640625, -1.16650390625, -0.887451171875, -0.6083984375, -0.329345703125, -0.05029296875, 0.228759765625, 0.5078125, 0.786865234375, 1.06591796875, 1.344970703125, 1.6240234375, 1.903076171875, 2.18212890625, 2.461181640625, 2.740234375, 3.019287109375, 3.29833984375, 3.577392578125, 3.8564453125, 4.135498046875, 4.41455078125, 4.693603515625, 4.97265625, 5.251708984375, 5.53076171875, 5.809814453125, 6.0888671875, 6.367919921875, 6.64697265625, 6.926025390625, 7.205078125, 7.484130859375, 7.76318359375, 8.042236328125, 8.3212890625, 8.600341796875, 8.87939453125, 9.158447265625, 9.4375]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 4.0, 6.0, 8.0, 12.0, 16.0, 13.0, 28.0, 33.0, 26.0, 46.0, 61.0, 117.0, 167.0, 340.0, 737.0, 2079.0, 10937.0, 269908.0, 2828395.0, 26871.0, 3634.0, 1155.0, 440.0, 214.0, 123.0, 86.0, 56.0, 45.0, 29.0, 13.0, 21.0, 16.0, 18.0, 8.0, 16.0, 10.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.6484375, -14.2071533203125, -13.765869140625, -13.3245849609375, -12.88330078125, -12.4420166015625, -12.000732421875, -11.5594482421875, -11.1181640625, -10.6768798828125, -10.235595703125, -9.7943115234375, -9.35302734375, -8.9117431640625, -8.470458984375, -8.0291748046875, -7.587890625, -7.1466064453125, -6.705322265625, -6.2640380859375, -5.82275390625, -5.3814697265625, -4.940185546875, -4.4989013671875, -4.0576171875, -3.6163330078125, -3.175048828125, -2.7337646484375, -2.29248046875, -1.8511962890625, -1.409912109375, -0.9686279296875, -0.52734375, -0.0860595703125, 0.355224609375, 0.7965087890625, 1.23779296875, 1.6790771484375, 2.120361328125, 2.5616455078125, 3.0029296875, 3.4442138671875, 3.885498046875, 4.3267822265625, 4.76806640625, 5.2093505859375, 5.650634765625, 6.0919189453125, 6.533203125, 6.9744873046875, 7.415771484375, 7.8570556640625, 8.29833984375, 8.7396240234375, 9.180908203125, 9.6221923828125, 10.0634765625, 10.5047607421875, 10.946044921875, 11.3873291015625, 11.82861328125, 12.2698974609375, 12.711181640625, 13.1524658203125, 13.59375]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [58.0, 813.0, 148.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.236794471740723, -2.011749029159546, 1.2132964134216309, 4.438342094421387, 7.663387298583984, 10.888432502746582, 14.113478660583496, 17.338523864746094, 20.563568115234375, 23.78861427307129, 27.01365852355957, 30.238704681396484, 33.463748931884766, 36.68879699707031, 39.913841247558594, 43.138885498046875, 46.36393356323242, 49.5889778137207, 52.81402587890625, 56.03907012939453, 59.26411437988281, 62.489158630371094, 65.71420288085938, 68.93925476074219, 72.16429901123047, 75.38934326171875, 78.61438751220703, 81.83943176269531, 85.06448364257812, 88.2895278930664, 91.51457214355469, 94.73961639404297, 97.96465301513672, 101.189697265625, 104.41474151611328, 107.63978576660156, 110.86483764648438, 114.08988189697266, 117.31492614746094, 120.53997039794922, 123.7650146484375, 126.99005889892578, 130.21510314941406, 133.44015502929688, 136.66519165039062, 139.89024353027344, 143.11529541015625, 146.34033203125, 149.5653839111328, 152.79043579101562, 156.01547241210938, 159.2405242919922, 162.46556091308594, 165.69061279296875, 168.9156494140625, 172.1407012939453, 175.36573791503906, 178.59078979492188, 181.81582641601562, 185.04087829589844, 188.2659149169922, 191.490966796875, 194.71600341796875, 197.94105529785156, 201.16610717773438]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 6.0, 10.0, 10.0, 7.0, 5.0, 12.0, 20.0, 20.0, 12.0, 24.0, 31.0, 24.0, 26.0, 21.0, 28.0, 40.0, 39.0, 37.0, 44.0, 32.0, 59.0, 49.0, 53.0, 42.0, 36.0, 41.0, 30.0, 21.0, 24.0, 27.0, 24.0, 19.0, 26.0, 21.0, 10.0, 17.0, 8.0, 6.0, 10.0, 6.0, 6.0, 5.0, 6.0, 5.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 0.0, 1.0, 2.0], "bins": [-24.72364616394043, -23.941390991210938, -23.159137725830078, -22.376882553100586, -21.594629287719727, -20.812374114990234, -20.030120849609375, -19.247865676879883, -18.46561050415039, -17.6833553314209, -16.90110206604004, -16.118846893310547, -15.336593627929688, -14.554338455200195, -13.77208423614502, -12.989830017089844, -12.207576751708984, -11.425322532653809, -10.643068313598633, -9.86081314086914, -9.078559875488281, -8.296304702758789, -7.514050483703613, -6.7317962646484375, -5.949542045593262, -5.167287826538086, -4.38503360748291, -3.602778911590576, -2.8205246925354004, -2.0382704734802246, -1.2560157775878906, -0.47376155853271484, 0.3084907531738281, 1.0907450914382935, 1.8729994297027588, 2.6552538871765137, 3.4375081062316895, 4.219762325286865, 5.002017021179199, 5.784271240234375, 6.566525459289551, 7.348779678344727, 8.131033897399902, 8.913288116455078, 9.69554328918457, 10.47779655456543, 11.260051727294922, 12.042305946350098, 12.824560165405273, 13.60681438446045, 14.389068603515625, 15.171323776245117, 15.953577041625977, 16.73583221435547, 17.518085479736328, 18.30034065246582, 19.082595825195312, 19.864850997924805, 20.647104263305664, 21.429359436035156, 22.211612701416016, 22.993867874145508, 23.776123046875, 24.55837631225586, 25.34062957763672]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 3.0, 8.0, 5.0, 8.0, 11.0, 7.0, 12.0, 15.0, 23.0, 21.0, 23.0, 16.0, 20.0, 31.0, 42.0, 35.0, 36.0, 39.0, 52.0, 35.0, 50.0, 47.0, 36.0, 54.0, 48.0, 23.0, 39.0, 30.0, 37.0, 27.0, 29.0, 25.0, 22.0, 19.0, 17.0, 8.0, 14.0, 12.0, 6.0, 7.0, 1.0, 11.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.474609375, -2.395263671875, -2.31591796875, -2.236572265625, -2.1572265625, -2.077880859375, -1.99853515625, -1.919189453125, -1.83984375, -1.760498046875, -1.68115234375, -1.601806640625, -1.5224609375, -1.443115234375, -1.36376953125, -1.284423828125, -1.205078125, -1.125732421875, -1.04638671875, -0.967041015625, -0.8876953125, -0.808349609375, -0.72900390625, -0.649658203125, -0.5703125, -0.490966796875, -0.41162109375, -0.332275390625, -0.2529296875, -0.173583984375, -0.09423828125, -0.014892578125, 0.064453125, 0.143798828125, 0.22314453125, 0.302490234375, 0.3818359375, 0.461181640625, 0.54052734375, 0.619873046875, 0.69921875, 0.778564453125, 0.85791015625, 0.937255859375, 1.0166015625, 1.095947265625, 1.17529296875, 1.254638671875, 1.333984375, 1.413330078125, 1.49267578125, 1.572021484375, 1.6513671875, 1.730712890625, 1.81005859375, 1.889404296875, 1.96875, 2.048095703125, 2.12744140625, 2.206787109375, 2.2861328125, 2.365478515625, 2.44482421875, 2.524169921875, 2.603515625]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 4.0, 2.0, 5.0, 3.0, 9.0, 8.0, 10.0, 10.0, 22.0, 30.0, 38.0, 70.0, 89.0, 157.0, 311.0, 632.0, 1368.0, 3724.0, 9869.0, 29048.0, 95279.0, 402491.0, 1883522.0, 1392218.0, 270645.0, 69992.0, 22017.0, 7617.0, 2786.0, 1132.0, 547.0, 232.0, 147.0, 76.0, 46.0, 35.0, 27.0, 24.0, 11.0, 9.0, 7.0, 9.0, 5.0, 5.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.66015625, -5.48797607421875, -5.3157958984375, -5.14361572265625, -4.971435546875, -4.79925537109375, -4.6270751953125, -4.45489501953125, -4.28271484375, -4.11053466796875, -3.9383544921875, -3.76617431640625, -3.593994140625, -3.42181396484375, -3.2496337890625, -3.07745361328125, -2.9052734375, -2.73309326171875, -2.5609130859375, -2.38873291015625, -2.216552734375, -2.04437255859375, -1.8721923828125, -1.70001220703125, -1.52783203125, -1.35565185546875, -1.1834716796875, -1.01129150390625, -0.839111328125, -0.66693115234375, -0.4947509765625, -0.32257080078125, -0.150390625, 0.02178955078125, 0.1939697265625, 0.36614990234375, 0.538330078125, 0.71051025390625, 0.8826904296875, 1.05487060546875, 1.22705078125, 1.39923095703125, 1.5714111328125, 1.74359130859375, 1.915771484375, 2.08795166015625, 2.2601318359375, 2.43231201171875, 2.6044921875, 2.77667236328125, 2.9488525390625, 3.12103271484375, 3.293212890625, 3.46539306640625, 3.6375732421875, 3.80975341796875, 3.98193359375, 4.15411376953125, 4.3262939453125, 4.49847412109375, 4.670654296875, 4.84283447265625, 5.0150146484375, 5.18719482421875, 5.359375]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 3.0, 5.0, 13.0, 13.0, 21.0, 33.0, 55.0, 83.0, 146.0, 208.0, 337.0, 479.0, 677.0, 656.0, 450.0, 347.0, 204.0, 131.0, 83.0, 54.0, 21.0, 28.0, 10.0, 5.0, 3.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.6171875, -11.263916015625, -10.91064453125, -10.557373046875, -10.2041015625, -9.850830078125, -9.49755859375, -9.144287109375, -8.791015625, -8.437744140625, -8.08447265625, -7.731201171875, -7.3779296875, -7.024658203125, -6.67138671875, -6.318115234375, -5.96484375, -5.611572265625, -5.25830078125, -4.905029296875, -4.5517578125, -4.198486328125, -3.84521484375, -3.491943359375, -3.138671875, -2.785400390625, -2.43212890625, -2.078857421875, -1.7255859375, -1.372314453125, -1.01904296875, -0.665771484375, -0.3125, 0.040771484375, 0.39404296875, 0.747314453125, 1.1005859375, 1.453857421875, 1.80712890625, 2.160400390625, 2.513671875, 2.866943359375, 3.22021484375, 3.573486328125, 3.9267578125, 4.280029296875, 4.63330078125, 4.986572265625, 5.33984375, 5.693115234375, 6.04638671875, 6.399658203125, 6.7529296875, 7.106201171875, 7.45947265625, 7.812744140625, 8.166015625, 8.519287109375, 8.87255859375, 9.225830078125, 9.5791015625, 9.932373046875, 10.28564453125, 10.638916015625, 10.9921875]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 6.0, 12.0, 14.0, 13.0, 21.0, 31.0, 43.0, 48.0, 72.0, 119.0, 184.0, 369.0, 594.0, 1315.0, 4420.0, 34572.0, 567870.0, 3276895.0, 282310.0, 19805.0, 3134.0, 1072.0, 554.0, 305.0, 161.0, 108.0, 72.0, 45.0, 32.0, 21.0, 19.0, 19.0, 10.0, 6.0, 6.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-19.140625, -18.53076171875, -17.9208984375, -17.31103515625, -16.701171875, -16.09130859375, -15.4814453125, -14.87158203125, -14.26171875, -13.65185546875, -13.0419921875, -12.43212890625, -11.822265625, -11.21240234375, -10.6025390625, -9.99267578125, -9.3828125, -8.77294921875, -8.1630859375, -7.55322265625, -6.943359375, -6.33349609375, -5.7236328125, -5.11376953125, -4.50390625, -3.89404296875, -3.2841796875, -2.67431640625, -2.064453125, -1.45458984375, -0.8447265625, -0.23486328125, 0.375, 0.98486328125, 1.5947265625, 2.20458984375, 2.814453125, 3.42431640625, 4.0341796875, 4.64404296875, 5.25390625, 5.86376953125, 6.4736328125, 7.08349609375, 7.693359375, 8.30322265625, 8.9130859375, 9.52294921875, 10.1328125, 10.74267578125, 11.3525390625, 11.96240234375, 12.572265625, 13.18212890625, 13.7919921875, 14.40185546875, 15.01171875, 15.62158203125, 16.2314453125, 16.84130859375, 17.451171875, 18.06103515625, 18.6708984375, 19.28076171875, 19.890625]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 10.0, 21.0, 49.0, 103.0, 185.0, 210.0, 228.0, 120.0, 59.0, 20.0, 7.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-115.66728210449219, -113.12980651855469, -110.59233093261719, -108.05485534667969, -105.51737976074219, -102.97990417480469, -100.44242858886719, -97.90495300292969, -95.36747741699219, -92.83000183105469, -90.29252624511719, -87.75505065917969, -85.21757507324219, -82.68009948730469, -80.14262390136719, -77.60514831542969, -75.06767272949219, -72.53019714355469, -69.99272155761719, -67.45524597167969, -64.91777038574219, -62.38029479980469, -59.84281921386719, -57.30534362792969, -54.76787567138672, -52.23040008544922, -49.69292449951172, -47.15544891357422, -44.61797332763672, -42.08049774169922, -39.54302215576172, -37.00554656982422, -34.46806716918945, -31.930591583251953, -29.393115997314453, -26.855640411376953, -24.318164825439453, -21.780689239501953, -19.243215560913086, -16.705739974975586, -14.168264389038086, -11.630788803100586, -9.093313217163086, -6.555838584899902, -4.018362998962402, -1.4808874130249023, 1.0565872192382812, 3.5940628051757812, 6.131538391113281, 8.669013977050781, 11.206489562988281, 13.743964195251465, 16.28144073486328, 18.81891632080078, 21.35638999938965, 23.89386558532715, 26.43134117126465, 28.96881675720215, 31.50629234313965, 34.043766021728516, 36.581241607666016, 39.118717193603516, 41.656192779541016, 44.193668365478516, 46.731143951416016]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 3.0, 1.0, 3.0, 8.0, 5.0, 8.0, 8.0, 8.0, 10.0, 17.0, 19.0, 19.0, 17.0, 29.0, 26.0, 35.0, 29.0, 30.0, 39.0, 32.0, 46.0, 40.0, 40.0, 33.0, 41.0, 34.0, 46.0, 31.0, 32.0, 36.0, 25.0, 27.0, 27.0, 39.0, 22.0, 21.0, 16.0, 19.0, 17.0, 15.0, 14.0, 7.0, 9.0, 7.0, 4.0, 4.0, 1.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-26.786483764648438, -25.994264602661133, -25.202043533325195, -24.40982437133789, -23.617603302001953, -22.82538414001465, -22.033164978027344, -21.240943908691406, -20.4487247467041, -19.656505584716797, -18.86428451538086, -18.072065353393555, -17.27984619140625, -16.487625122070312, -15.695405960083008, -14.903185844421387, -14.110965728759766, -13.318745613098145, -12.526525497436523, -11.734306335449219, -10.942086219787598, -10.149866104125977, -9.357646942138672, -8.56542682647705, -7.77320671081543, -6.980986595153809, -6.188766956329346, -5.396547317504883, -4.604327201843262, -3.8121073246002197, -3.0198874473571777, -2.227667808532715, -1.4354476928710938, -0.6432278156280518, 0.14899206161499023, 0.9412119388580322, 1.7334318161010742, 2.525651693344116, 3.317871570587158, 4.110091209411621, 4.902311325073242, 5.694531440734863, 6.486751079559326, 7.278970718383789, 8.07119083404541, 8.863410949707031, 9.655630111694336, 10.447850227355957, 11.240070343017578, 12.0322904586792, 12.82451057434082, 13.616729736328125, 14.408949851989746, 15.201169967651367, 15.993389129638672, 16.78561019897461, 17.577829360961914, 18.37004852294922, 19.162269592285156, 19.95448875427246, 20.746707916259766, 21.538928985595703, 22.331148147583008, 23.123367309570312, 23.91558837890625]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 4.0, 5.0, 8.0, 7.0, 7.0, 2.0, 9.0, 8.0, 17.0, 15.0, 17.0, 24.0, 23.0, 28.0, 33.0, 27.0, 42.0, 32.0, 41.0, 52.0, 44.0, 43.0, 56.0, 39.0, 53.0, 43.0, 45.0, 37.0, 41.0, 24.0, 21.0, 27.0, 22.0, 19.0, 18.0, 18.0, 16.0, 16.0, 8.0, 10.0, 4.0, 0.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4765625, -2.388671875, -2.30078125, -2.212890625, -2.125, -2.037109375, -1.94921875, -1.861328125, -1.7734375, -1.685546875, -1.59765625, -1.509765625, -1.421875, -1.333984375, -1.24609375, -1.158203125, -1.0703125, -0.982421875, -0.89453125, -0.806640625, -0.71875, -0.630859375, -0.54296875, -0.455078125, -0.3671875, -0.279296875, -0.19140625, -0.103515625, -0.015625, 0.072265625, 0.16015625, 0.248046875, 0.3359375, 0.423828125, 0.51171875, 0.599609375, 0.6875, 0.775390625, 0.86328125, 0.951171875, 1.0390625, 1.126953125, 1.21484375, 1.302734375, 1.390625, 1.478515625, 1.56640625, 1.654296875, 1.7421875, 1.830078125, 1.91796875, 2.005859375, 2.09375, 2.181640625, 2.26953125, 2.357421875, 2.4453125, 2.533203125, 2.62109375, 2.708984375, 2.796875, 2.884765625, 2.97265625, 3.060546875, 3.1484375]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 8.0, 6.0, 17.0, 18.0, 21.0, 34.0, 39.0, 75.0, 109.0, 147.0, 190.0, 342.0, 494.0, 747.0, 1302.0, 2126.0, 3620.0, 6382.0, 10831.0, 19312.0, 33285.0, 58031.0, 96771.0, 152077.0, 199700.0, 174925.0, 117629.0, 71784.0, 41786.0, 23835.0, 13599.0, 7955.0, 4561.0, 2555.0, 1573.0, 1017.0, 573.0, 359.0, 218.0, 143.0, 123.0, 64.0, 43.0, 48.0, 25.0, 21.0, 9.0, 13.0, 2.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.283203125, -0.27426910400390625, -0.2653350830078125, -0.25640106201171875, -0.247467041015625, -0.23853302001953125, -0.2295989990234375, -0.22066497802734375, -0.21173095703125, -0.20279693603515625, -0.1938629150390625, -0.18492889404296875, -0.175994873046875, -0.16706085205078125, -0.1581268310546875, -0.14919281005859375, -0.1402587890625, -0.13132476806640625, -0.1223907470703125, -0.11345672607421875, -0.104522705078125, -0.09558868408203125, -0.0866546630859375, -0.07772064208984375, -0.06878662109375, -0.05985260009765625, -0.0509185791015625, -0.04198455810546875, -0.033050537109375, -0.02411651611328125, -0.0151824951171875, -0.00624847412109375, 0.002685546875, 0.01161956787109375, 0.0205535888671875, 0.02948760986328125, 0.038421630859375, 0.04735565185546875, 0.0562896728515625, 0.06522369384765625, 0.07415771484375, 0.08309173583984375, 0.0920257568359375, 0.10095977783203125, 0.109893798828125, 0.11882781982421875, 0.1277618408203125, 0.13669586181640625, 0.1456298828125, 0.15456390380859375, 0.1634979248046875, 0.17243194580078125, 0.181365966796875, 0.19029998779296875, 0.1992340087890625, 0.20816802978515625, 0.21710205078125, 0.22603607177734375, 0.2349700927734375, 0.24390411376953125, 0.252838134765625, 0.26177215576171875, 0.2707061767578125, 0.27964019775390625, 0.28857421875]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 7.0, 4.0, 3.0, 10.0, 5.0, 4.0, 5.0, 11.0, 16.0, 8.0, 14.0, 23.0, 21.0, 24.0, 21.0, 25.0, 26.0, 28.0, 35.0, 30.0, 30.0, 38.0, 50.0, 28.0, 1062.0, 40.0, 37.0, 35.0, 36.0, 31.0, 41.0, 36.0, 27.0, 33.0, 25.0, 34.0, 21.0, 17.0, 11.0, 14.0, 14.0, 11.0, 11.0, 7.0, 5.0, 7.0, 3.0, 3.0, 0.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-1.6611328125, -1.61004638671875, -1.5589599609375, -1.50787353515625, -1.456787109375, -1.40570068359375, -1.3546142578125, -1.30352783203125, -1.25244140625, -1.20135498046875, -1.1502685546875, -1.09918212890625, -1.048095703125, -0.99700927734375, -0.9459228515625, -0.89483642578125, -0.84375, -0.79266357421875, -0.7415771484375, -0.69049072265625, -0.639404296875, -0.58831787109375, -0.5372314453125, -0.48614501953125, -0.43505859375, -0.38397216796875, -0.3328857421875, -0.28179931640625, -0.230712890625, -0.17962646484375, -0.1285400390625, -0.07745361328125, -0.0263671875, 0.02471923828125, 0.0758056640625, 0.12689208984375, 0.177978515625, 0.22906494140625, 0.2801513671875, 0.33123779296875, 0.38232421875, 0.43341064453125, 0.4844970703125, 0.53558349609375, 0.586669921875, 0.63775634765625, 0.6888427734375, 0.73992919921875, 0.791015625, 0.84210205078125, 0.8931884765625, 0.94427490234375, 0.995361328125, 1.04644775390625, 1.0975341796875, 1.14862060546875, 1.19970703125, 1.25079345703125, 1.3018798828125, 1.35296630859375, 1.404052734375, 1.45513916015625, 1.5062255859375, 1.55731201171875, 1.6083984375]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 5.0, 6.0, 8.0, 20.0, 29.0, 48.0, 79.0, 75.0, 128.0, 252.0, 367.0, 481.0, 763.0, 1144.0, 1785.0, 2723.0, 4141.0, 6336.0, 9802.0, 14873.0, 22953.0, 34989.0, 51665.0, 73258.0, 100185.0, 144784.0, 1122751.0, 163111.0, 103827.0, 76582.0, 53571.0, 36428.0, 24159.0, 15790.0, 10570.0, 6786.0, 4439.0, 2878.0, 1853.0, 1196.0, 777.0, 524.0, 346.0, 215.0, 163.0, 86.0, 73.0, 44.0, 23.0, 15.0, 13.0, 9.0, 7.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.141357421875, -0.13701629638671875, -0.1326751708984375, -0.12833404541015625, -0.123992919921875, -0.11965179443359375, -0.1153106689453125, -0.11096954345703125, -0.10662841796875, -0.10228729248046875, -0.0979461669921875, -0.09360504150390625, -0.089263916015625, -0.08492279052734375, -0.0805816650390625, -0.07624053955078125, -0.0718994140625, -0.06755828857421875, -0.0632171630859375, -0.05887603759765625, -0.054534912109375, -0.05019378662109375, -0.0458526611328125, -0.04151153564453125, -0.03717041015625, -0.03282928466796875, -0.0284881591796875, -0.02414703369140625, -0.019805908203125, -0.01546478271484375, -0.0111236572265625, -0.00678253173828125, -0.00244140625, 0.00189971923828125, 0.0062408447265625, 0.01058197021484375, 0.014923095703125, 0.01926422119140625, 0.0236053466796875, 0.02794647216796875, 0.03228759765625, 0.03662872314453125, 0.0409698486328125, 0.04531097412109375, 0.049652099609375, 0.05399322509765625, 0.0583343505859375, 0.06267547607421875, 0.0670166015625, 0.07135772705078125, 0.0756988525390625, 0.08003997802734375, 0.084381103515625, 0.08872222900390625, 0.0930633544921875, 0.09740447998046875, 0.10174560546875, 0.10608673095703125, 0.1104278564453125, 0.11476898193359375, 0.119110107421875, 0.12345123291015625, 0.1277923583984375, 0.13213348388671875, 0.136474609375]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 8.0, 1.0, 1.0, 5.0, 3.0, 3.0, 2.0, 8.0, 8.0, 9.0, 8.0, 17.0, 30.0, 35.0, 69.0, 92.0, 96.0, 177.0, 115.0, 94.0, 68.0, 47.0, 26.0, 27.0, 10.0, 7.0, 10.0, 6.0, 3.0, 1.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.0258941650390625, -0.0252077579498291, -0.024521350860595703, -0.023834943771362305, -0.023148536682128906, -0.022462129592895508, -0.02177572250366211, -0.02108931541442871, -0.020402908325195312, -0.019716501235961914, -0.019030094146728516, -0.018343687057495117, -0.01765727996826172, -0.01697087287902832, -0.016284465789794922, -0.015598058700561523, -0.014911651611328125, -0.014225244522094727, -0.013538837432861328, -0.01285243034362793, -0.012166023254394531, -0.011479616165161133, -0.010793209075927734, -0.010106801986694336, -0.009420394897460938, -0.008733987808227539, -0.00804758071899414, -0.007361173629760742, -0.006674766540527344, -0.005988359451293945, -0.005301952362060547, -0.0046155452728271484, -0.00392913818359375, -0.0032427310943603516, -0.002556324005126953, -0.0018699169158935547, -0.0011835098266601562, -0.0004971027374267578, 0.00018930435180664062, 0.0008757114410400391, 0.0015621185302734375, 0.002248525619506836, 0.0029349327087402344, 0.003621339797973633, 0.004307746887207031, 0.00499415397644043, 0.005680561065673828, 0.0063669681549072266, 0.007053375244140625, 0.0077397823333740234, 0.008426189422607422, 0.00911259651184082, 0.009799003601074219, 0.010485410690307617, 0.011171817779541016, 0.011858224868774414, 0.012544631958007812, 0.013231039047241211, 0.01391744613647461, 0.014603853225708008, 0.015290260314941406, 0.015976667404174805, 0.016663074493408203, 0.0173494815826416, 0.018035888671875]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 7.0, 3.0, 2.0, 2.0, 8.0, 9.0, 5.0, 15.0, 19.0, 18.0, 41.0, 49.0, 59.0, 92.0, 150.0, 315.0, 836.0, 8829.0, 985107.0, 50180.0, 1758.0, 464.0, 220.0, 116.0, 71.0, 45.0, 39.0, 27.0, 14.0, 11.0, 10.0, 5.0, 3.0, 8.0, 3.0, 8.0, 2.0, 4.0, 2.0, 1.0, 1.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31103515625, -0.2993888854980469, -0.28774261474609375, -0.2760963439941406, -0.2644500732421875, -0.2528038024902344, -0.24115753173828125, -0.22951126098632812, -0.217864990234375, -0.20621871948242188, -0.19457244873046875, -0.18292617797851562, -0.1712799072265625, -0.15963363647460938, -0.14798736572265625, -0.13634109497070312, -0.12469482421875, -0.11304855346679688, -0.10140228271484375, -0.08975601196289062, -0.0781097412109375, -0.06646347045898438, -0.05481719970703125, -0.043170928955078125, -0.031524658203125, -0.019878387451171875, -0.00823211669921875, 0.003414154052734375, 0.0150604248046875, 0.026706695556640625, 0.03835296630859375, 0.049999237060546875, 0.0616455078125, 0.07329177856445312, 0.08493804931640625, 0.09658432006835938, 0.1082305908203125, 0.11987686157226562, 0.13152313232421875, 0.14316940307617188, 0.154815673828125, 0.16646194458007812, 0.17810821533203125, 0.18975448608398438, 0.2014007568359375, 0.21304702758789062, 0.22469329833984375, 0.23633956909179688, 0.24798583984375, 0.2596321105957031, 0.27127838134765625, 0.2829246520996094, 0.2945709228515625, 0.3062171936035156, 0.31786346435546875, 0.3295097351074219, 0.341156005859375, 0.3528022766113281, 0.36444854736328125, 0.3760948181152344, 0.3877410888671875, 0.3993873596191406, 0.41103363037109375, 0.4226799011230469, 0.434326171875]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 20.0, 34.0, 97.0, 260.0, 468.0, 97.0, 28.0, 5.0], "bins": [-0.26065051555633545, -0.2563200891017914, -0.2519896328449249, -0.24765920639038086, -0.2433287799358368, -0.23899833858013153, -0.23466789722442627, -0.2303374707698822, -0.22600702941417694, -0.22167658805847168, -0.2173461616039276, -0.21301572024822235, -0.2086852788925171, -0.20435485243797302, -0.20002441108226776, -0.1956939846277237, -0.19136354327201843, -0.18703310191631317, -0.1827026754617691, -0.17837223410606384, -0.17404180765151978, -0.16971136629581451, -0.16538092494010925, -0.16105049848556519, -0.15672005712985992, -0.15238961577415466, -0.1480591893196106, -0.14372874796390533, -0.13939830660820007, -0.135067880153656, -0.13073743879795074, -0.12640701234340668, -0.12207657098770142, -0.11774613708257675, -0.11341570317745209, -0.10908526182174683, -0.10475482791662216, -0.1004243940114975, -0.09609395265579224, -0.09176351875066757, -0.08743308484554291, -0.08310265094041824, -0.07877221703529358, -0.07444177567958832, -0.07011134177446365, -0.06578090786933899, -0.061450470238924026, -0.057120032608509064, -0.0527895987033844, -0.048459164798259735, -0.04412872716784477, -0.03979828953742981, -0.035467855632305145, -0.03113741986453533, -0.026806984096765518, -0.022476548328995705, -0.01814611442387104, -0.013815678656101227, -0.009485242888331413, -0.0051548071205616, -0.0008243713527917862, 0.0035060644149780273, 0.007836500182747841, 0.012166935950517654, 0.016497371718287468]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 0.0, 0.0, 3.0, 2.0, 4.0, 6.0, 8.0, 7.0, 14.0, 14.0, 14.0, 20.0, 17.0, 14.0, 22.0, 26.0, 26.0, 20.0, 29.0, 31.0, 32.0, 45.0, 36.0, 35.0, 46.0, 46.0, 49.0, 40.0, 43.0, 34.0, 44.0, 44.0, 29.0, 42.0, 25.0, 18.0, 14.0, 18.0, 26.0, 15.0, 11.0, 13.0, 9.0, 7.0, 1.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.02419579029083252, -0.023412737995386124, -0.02262968383729458, -0.021846629679203033, -0.021063577383756638, -0.02028052508831024, -0.019497470930218697, -0.01871441677212715, -0.017931364476680756, -0.01714831218123436, -0.016365258023142815, -0.015582204796373844, -0.014799151569604874, -0.014016098342835903, -0.013233045116066933, -0.012449991889297962, -0.011666938662528992, -0.010883885435760021, -0.01010083220899105, -0.00931777898222208, -0.00853472575545311, -0.007751672528684139, -0.006968619301915169, -0.006185566075146198, -0.005402512848377228, -0.004619459621608257, -0.003836406394839287, -0.0030533531680703163, -0.002270299941301346, -0.0014872467145323753, -0.0007041934877634048, 7.885973900556564e-05, 0.0008619129657745361, 0.0016449661925435066, 0.002428019419312477, 0.0032110726460814476, 0.003994125872850418, 0.004777179099619389, 0.005560232326388359, 0.0063432855531573296, 0.0071263387799263, 0.00790939200669527, 0.008692445233464241, 0.009475498460233212, 0.010258551687002182, 0.011041604913771152, 0.011824658140540123, 0.012607711367309093, 0.013390764594078064, 0.014173817820847034, 0.014956871047616005, 0.01573992520570755, 0.016522977501153946, 0.017306029796600342, 0.018089083954691887, 0.018872138112783432, 0.019655190408229828, 0.020438242703676224, 0.02122129686176777, 0.022004351019859314, 0.02278740331530571, 0.023570455610752106, 0.02435350976884365, 0.025136563926935196, 0.025919616222381592]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 4.0, 5.0, 8.0, 7.0, 7.0, 2.0, 9.0, 8.0, 17.0, 15.0, 18.0, 23.0, 23.0, 28.0, 32.0, 28.0, 42.0, 33.0, 40.0, 52.0, 44.0, 43.0, 56.0, 39.0, 52.0, 44.0, 45.0, 37.0, 41.0, 24.0, 21.0, 27.0, 22.0, 18.0, 19.0, 18.0, 16.0, 16.0, 7.0, 11.0, 4.0, 0.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4765625, -2.388671875, -2.30078125, -2.212890625, -2.125, -2.037109375, -1.94921875, -1.861328125, -1.7734375, -1.685546875, -1.59765625, -1.509765625, -1.421875, -1.333984375, -1.24609375, -1.158203125, -1.0703125, -0.982421875, -0.89453125, -0.806640625, -0.71875, -0.630859375, -0.54296875, -0.455078125, -0.3671875, -0.279296875, -0.19140625, -0.103515625, -0.015625, 0.072265625, 0.16015625, 0.248046875, 0.3359375, 0.423828125, 0.51171875, 0.599609375, 0.6875, 0.775390625, 0.86328125, 0.951171875, 1.0390625, 1.126953125, 1.21484375, 1.302734375, 1.390625, 1.478515625, 1.56640625, 1.654296875, 1.7421875, 1.830078125, 1.91796875, 2.005859375, 2.09375, 2.181640625, 2.26953125, 2.357421875, 2.4453125, 2.533203125, 2.62109375, 2.708984375, 2.796875, 2.884765625, 2.97265625, 3.060546875, 3.1484375]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 6.0, 9.0, 8.0, 12.0, 23.0, 23.0, 42.0, 66.0, 105.0, 135.0, 207.0, 275.0, 548.0, 803.0, 1228.0, 1844.0, 2932.0, 5048.0, 8959.0, 16992.0, 36470.0, 88498.0, 235082.0, 364363.0, 163567.0, 62728.0, 27079.0, 13128.0, 7037.0, 4152.0, 2574.0, 1682.0, 1037.0, 635.0, 461.0, 298.0, 161.0, 126.0, 84.0, 56.0, 24.0, 21.0, 14.0, 8.0, 10.0, 6.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.1640625, -2.1009979248046875, -2.037933349609375, -1.9748687744140625, -1.91180419921875, -1.8487396240234375, -1.785675048828125, -1.7226104736328125, -1.6595458984375, -1.5964813232421875, -1.533416748046875, -1.4703521728515625, -1.40728759765625, -1.3442230224609375, -1.281158447265625, -1.2180938720703125, -1.155029296875, -1.0919647216796875, -1.028900146484375, -0.9658355712890625, -0.90277099609375, -0.8397064208984375, -0.776641845703125, -0.7135772705078125, -0.6505126953125, -0.5874481201171875, -0.524383544921875, -0.4613189697265625, -0.39825439453125, -0.3351898193359375, -0.272125244140625, -0.2090606689453125, -0.14599609375, -0.0829315185546875, -0.019866943359375, 0.0431976318359375, 0.10626220703125, 0.1693267822265625, 0.232391357421875, 0.2954559326171875, 0.3585205078125, 0.4215850830078125, 0.484649658203125, 0.5477142333984375, 0.61077880859375, 0.6738433837890625, 0.736907958984375, 0.7999725341796875, 0.863037109375, 0.9261016845703125, 0.989166259765625, 1.0522308349609375, 1.11529541015625, 1.1783599853515625, 1.241424560546875, 1.3044891357421875, 1.3675537109375, 1.4306182861328125, 1.493682861328125, 1.5567474365234375, 1.61981201171875, 1.6828765869140625, 1.745941162109375, 1.8090057373046875, 1.8720703125]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 4.0, 8.0, 8.0, 10.0, 10.0, 14.0, 9.0, 17.0, 25.0, 21.0, 34.0, 25.0, 40.0, 33.0, 48.0, 56.0, 47.0, 69.0, 215.0, 1669.0, 223.0, 80.0, 56.0, 43.0, 38.0, 36.0, 34.0, 30.0, 33.0, 27.0, 22.0, 10.0, 11.0, 10.0, 6.0, 6.0, 6.0, 5.0, 3.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.890625, -9.5660400390625, -9.241455078125, -8.9168701171875, -8.59228515625, -8.2677001953125, -7.943115234375, -7.6185302734375, -7.2939453125, -6.9693603515625, -6.644775390625, -6.3201904296875, -5.99560546875, -5.6710205078125, -5.346435546875, -5.0218505859375, -4.697265625, -4.3726806640625, -4.048095703125, -3.7235107421875, -3.39892578125, -3.0743408203125, -2.749755859375, -2.4251708984375, -2.1005859375, -1.7760009765625, -1.451416015625, -1.1268310546875, -0.80224609375, -0.4776611328125, -0.153076171875, 0.1715087890625, 0.49609375, 0.8206787109375, 1.145263671875, 1.4698486328125, 1.79443359375, 2.1190185546875, 2.443603515625, 2.7681884765625, 3.0927734375, 3.4173583984375, 3.741943359375, 4.0665283203125, 4.39111328125, 4.7156982421875, 5.040283203125, 5.3648681640625, 5.689453125, 6.0140380859375, 6.338623046875, 6.6632080078125, 6.98779296875, 7.3123779296875, 7.636962890625, 7.9615478515625, 8.2861328125, 8.6107177734375, 8.935302734375, 9.2598876953125, 9.58447265625, 9.9090576171875, 10.233642578125, 10.5582275390625, 10.8828125]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 3.0, 3.0, 5.0, 5.0, 8.0, 12.0, 8.0, 17.0, 19.0, 24.0, 46.0, 39.0, 57.0, 87.0, 112.0, 176.0, 289.0, 780.0, 4458.0, 193378.0, 2922123.0, 21231.0, 1541.0, 454.0, 244.0, 169.0, 100.0, 73.0, 49.0, 48.0, 20.0, 36.0, 21.0, 14.0, 10.0, 13.0, 7.0, 8.0, 8.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-16.734375, -16.231201171875, -15.72802734375, -15.224853515625, -14.7216796875, -14.218505859375, -13.71533203125, -13.212158203125, -12.708984375, -12.205810546875, -11.70263671875, -11.199462890625, -10.6962890625, -10.193115234375, -9.68994140625, -9.186767578125, -8.68359375, -8.180419921875, -7.67724609375, -7.174072265625, -6.6708984375, -6.167724609375, -5.66455078125, -5.161376953125, -4.658203125, -4.155029296875, -3.65185546875, -3.148681640625, -2.6455078125, -2.142333984375, -1.63916015625, -1.135986328125, -0.6328125, -0.129638671875, 0.37353515625, 0.876708984375, 1.3798828125, 1.883056640625, 2.38623046875, 2.889404296875, 3.392578125, 3.895751953125, 4.39892578125, 4.902099609375, 5.4052734375, 5.908447265625, 6.41162109375, 6.914794921875, 7.41796875, 7.921142578125, 8.42431640625, 8.927490234375, 9.4306640625, 9.933837890625, 10.43701171875, 10.940185546875, 11.443359375, 11.946533203125, 12.44970703125, 12.952880859375, 13.4560546875, 13.959228515625, 14.46240234375, 14.965576171875, 15.46875]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 104.0, 854.0, 59.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-205.0399627685547, -201.46641540527344, -197.8928680419922, -194.31932067871094, -190.7457733154297, -187.17222595214844, -183.5986785888672, -180.02511596679688, -176.45156860351562, -172.87802124023438, -169.30447387695312, -165.73092651367188, -162.15737915039062, -158.58383178710938, -155.01028442382812, -151.43673706054688, -147.86318969726562, -144.28964233398438, -140.71609497070312, -137.14254760742188, -133.56900024414062, -129.99545288085938, -126.4218978881836, -122.84835052490234, -119.2748031616211, -115.70125579833984, -112.1277084350586, -108.55416107177734, -104.98060607910156, -101.40705871582031, -97.83351135253906, -94.25996398925781, -90.68641662597656, -87.11286926269531, -83.53932189941406, -79.96577453613281, -76.39222717285156, -72.81867980957031, -69.24512481689453, -65.67157745361328, -62.09803009033203, -58.52448272705078, -54.95093536376953, -51.377384185791016, -47.803836822509766, -44.230289459228516, -40.65673828125, -37.08319091796875, -33.5096435546875, -29.93609619140625, -26.362546920776367, -22.788997650146484, -19.215450286865234, -15.641902923583984, -12.068353652954102, -8.494804382324219, -4.921257019042969, -1.3477087020874023, 2.225839614868164, 5.7993879318237305, 9.372936248779297, 12.946483612060547, 16.52003288269043, 20.093582153320312, 23.667129516601562]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 4.0, 8.0, 8.0, 5.0, 7.0, 7.0, 7.0, 11.0, 9.0, 14.0, 17.0, 22.0, 26.0, 16.0, 22.0, 32.0, 24.0, 34.0, 26.0, 27.0, 40.0, 39.0, 32.0, 38.0, 33.0, 36.0, 35.0, 39.0, 28.0, 23.0, 20.0, 33.0, 22.0, 33.0, 22.0, 25.0, 18.0, 29.0, 22.0, 18.0, 19.0, 7.0, 14.0, 12.0, 10.0, 8.0, 6.0, 8.0, 4.0, 4.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-25.193906784057617, -24.39202308654785, -23.59014129638672, -22.788257598876953, -21.986373901367188, -21.184492111206055, -20.38260841369629, -19.580726623535156, -18.77884292602539, -17.976959228515625, -17.175077438354492, -16.373193740844727, -15.571310997009277, -14.769428253173828, -13.967544555664062, -13.165661811828613, -12.363779067993164, -11.561896324157715, -10.760013580322266, -9.9581298828125, -9.15624713897705, -8.354364395141602, -7.552481174468994, -6.750597953796387, -5.9487152099609375, -5.146832466125488, -4.344949245452881, -3.5430662631988525, -2.741183280944824, -1.939300537109375, -1.1374173164367676, -0.33553409576416016, 0.46634864807128906, 1.2682316303253174, 2.0701146125793457, 2.871997594833374, 3.6738805770874023, 4.475763320922852, 5.277646541595459, 6.079529762268066, 6.881412506103516, 7.683295249938965, 8.485177993774414, 9.28706169128418, 10.088944435119629, 10.890827178955078, 11.692710876464844, 12.494593620300293, 13.296476364135742, 14.098359107971191, 14.90024185180664, 15.702125549316406, 16.504009246826172, 17.305891036987305, 18.10777473449707, 18.909656524658203, 19.71154022216797, 20.513423919677734, 21.315305709838867, 22.117189407348633, 22.919071197509766, 23.72095489501953, 24.522838592529297, 25.324722290039062, 26.126604080200195]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 2.0, 0.0, 2.0, 5.0, 5.0, 9.0, 7.0, 4.0, 9.0, 10.0, 7.0, 13.0, 20.0, 18.0, 26.0, 22.0, 35.0, 29.0, 37.0, 32.0, 26.0, 42.0, 49.0, 46.0, 46.0, 43.0, 45.0, 52.0, 47.0, 40.0, 41.0, 29.0, 33.0, 31.0, 15.0, 16.0, 18.0, 22.0, 16.0, 16.0, 16.0, 9.0, 7.0, 5.0, 6.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.447265625, -2.35968017578125, -2.2720947265625, -2.18450927734375, -2.096923828125, -2.00933837890625, -1.9217529296875, -1.83416748046875, -1.74658203125, -1.65899658203125, -1.5714111328125, -1.48382568359375, -1.396240234375, -1.30865478515625, -1.2210693359375, -1.13348388671875, -1.0458984375, -0.95831298828125, -0.8707275390625, -0.78314208984375, -0.695556640625, -0.60797119140625, -0.5203857421875, -0.43280029296875, -0.34521484375, -0.25762939453125, -0.1700439453125, -0.08245849609375, 0.005126953125, 0.09271240234375, 0.1802978515625, 0.26788330078125, 0.35546875, 0.44305419921875, 0.5306396484375, 0.61822509765625, 0.705810546875, 0.79339599609375, 0.8809814453125, 0.96856689453125, 1.05615234375, 1.14373779296875, 1.2313232421875, 1.31890869140625, 1.406494140625, 1.49407958984375, 1.5816650390625, 1.66925048828125, 1.7568359375, 1.84442138671875, 1.9320068359375, 2.01959228515625, 2.107177734375, 2.19476318359375, 2.2823486328125, 2.36993408203125, 2.45751953125, 2.54510498046875, 2.6326904296875, 2.72027587890625, 2.807861328125, 2.89544677734375, 2.9830322265625, 3.07061767578125, 3.158203125]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 7.0, 5.0, 7.0, 9.0, 13.0, 15.0, 15.0, 24.0, 17.0, 44.0, 55.0, 100.0, 158.0, 314.0, 822.0, 2445.0, 9079.0, 38092.0, 192477.0, 1506660.0, 2088717.0, 286637.0, 51744.0, 11806.0, 3147.0, 983.0, 408.0, 181.0, 93.0, 46.0, 45.0, 17.0, 27.0, 12.0, 15.0, 12.0, 12.0, 6.0, 7.0, 6.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.2578125, -7.0167236328125, -6.775634765625, -6.5345458984375, -6.29345703125, -6.0523681640625, -5.811279296875, -5.5701904296875, -5.3291015625, -5.0880126953125, -4.846923828125, -4.6058349609375, -4.36474609375, -4.1236572265625, -3.882568359375, -3.6414794921875, -3.400390625, -3.1593017578125, -2.918212890625, -2.6771240234375, -2.43603515625, -2.1949462890625, -1.953857421875, -1.7127685546875, -1.4716796875, -1.2305908203125, -0.989501953125, -0.7484130859375, -0.50732421875, -0.2662353515625, -0.025146484375, 0.2159423828125, 0.45703125, 0.6981201171875, 0.939208984375, 1.1802978515625, 1.42138671875, 1.6624755859375, 1.903564453125, 2.1446533203125, 2.3857421875, 2.6268310546875, 2.867919921875, 3.1090087890625, 3.35009765625, 3.5911865234375, 3.832275390625, 4.0733642578125, 4.314453125, 4.5555419921875, 4.796630859375, 5.0377197265625, 5.27880859375, 5.5198974609375, 5.760986328125, 6.0020751953125, 6.2431640625, 6.4842529296875, 6.725341796875, 6.9664306640625, 7.20751953125, 7.4486083984375, 7.689697265625, 7.9307861328125, 8.171875]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 4.0, 5.0, 7.0, 10.0, 17.0, 29.0, 28.0, 50.0, 90.0, 109.0, 170.0, 195.0, 305.0, 360.0, 498.0, 495.0, 463.0, 354.0, 287.0, 184.0, 122.0, 94.0, 63.0, 47.0, 28.0, 19.0, 12.0, 6.0, 7.0, 7.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.234375, -9.9361572265625, -9.637939453125, -9.3397216796875, -9.04150390625, -8.7432861328125, -8.445068359375, -8.1468505859375, -7.8486328125, -7.5504150390625, -7.252197265625, -6.9539794921875, -6.65576171875, -6.3575439453125, -6.059326171875, -5.7611083984375, -5.462890625, -5.1646728515625, -4.866455078125, -4.5682373046875, -4.27001953125, -3.9718017578125, -3.673583984375, -3.3753662109375, -3.0771484375, -2.7789306640625, -2.480712890625, -2.1824951171875, -1.88427734375, -1.5860595703125, -1.287841796875, -0.9896240234375, -0.69140625, -0.3931884765625, -0.094970703125, 0.2032470703125, 0.50146484375, 0.7996826171875, 1.097900390625, 1.3961181640625, 1.6943359375, 1.9925537109375, 2.290771484375, 2.5889892578125, 2.88720703125, 3.1854248046875, 3.483642578125, 3.7818603515625, 4.080078125, 4.3782958984375, 4.676513671875, 4.9747314453125, 5.27294921875, 5.5711669921875, 5.869384765625, 6.1676025390625, 6.4658203125, 6.7640380859375, 7.062255859375, 7.3604736328125, 7.65869140625, 7.9569091796875, 8.255126953125, 8.5533447265625, 8.8515625]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 0.0, 4.0, 3.0, 4.0, 6.0, 8.0, 12.0, 14.0, 20.0, 45.0, 47.0, 81.0, 123.0, 181.0, 348.0, 775.0, 2150.0, 9191.0, 69064.0, 956510.0, 2888561.0, 237493.0, 23085.0, 4142.0, 1231.0, 503.0, 254.0, 134.0, 81.0, 75.0, 35.0, 28.0, 17.0, 11.0, 12.0, 16.0, 6.0, 7.0, 5.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-18.71875, -18.15576171875, -17.5927734375, -17.02978515625, -16.466796875, -15.90380859375, -15.3408203125, -14.77783203125, -14.21484375, -13.65185546875, -13.0888671875, -12.52587890625, -11.962890625, -11.39990234375, -10.8369140625, -10.27392578125, -9.7109375, -9.14794921875, -8.5849609375, -8.02197265625, -7.458984375, -6.89599609375, -6.3330078125, -5.77001953125, -5.20703125, -4.64404296875, -4.0810546875, -3.51806640625, -2.955078125, -2.39208984375, -1.8291015625, -1.26611328125, -0.703125, -0.14013671875, 0.4228515625, 0.98583984375, 1.548828125, 2.11181640625, 2.6748046875, 3.23779296875, 3.80078125, 4.36376953125, 4.9267578125, 5.48974609375, 6.052734375, 6.61572265625, 7.1787109375, 7.74169921875, 8.3046875, 8.86767578125, 9.4306640625, 9.99365234375, 10.556640625, 11.11962890625, 11.6826171875, 12.24560546875, 12.80859375, 13.37158203125, 13.9345703125, 14.49755859375, 15.060546875, 15.62353515625, 16.1865234375, 16.74951171875, 17.3125]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 9.0, 15.0, 11.0, 22.0, 23.0, 32.0, 33.0, 41.0, 56.0, 69.0, 79.0, 88.0, 84.0, 94.0, 70.0, 49.0, 65.0, 40.0, 28.0, 34.0, 17.0, 12.0, 8.0, 13.0, 8.0, 1.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.96895217895508, -39.97862243652344, -38.98829650878906, -37.99796676635742, -37.00763702392578, -36.017311096191406, -35.026981353759766, -34.036651611328125, -33.04632568359375, -32.05599594116211, -31.0656681060791, -30.075340270996094, -29.085012435913086, -28.094682693481445, -27.104354858398438, -26.114025115966797, -25.123695373535156, -24.13336753845215, -23.143037796020508, -22.1527099609375, -21.162382125854492, -20.17205238342285, -19.181724548339844, -18.191394805908203, -17.201068878173828, -16.21074104309082, -15.220412254333496, -14.230083465576172, -13.239754676818848, -12.249425888061523, -11.259098052978516, -10.268769264221191, -9.278440475463867, -8.288111686706543, -7.297783374786377, -6.307455062866211, -5.317126274108887, -4.326797962188721, -3.3364696502685547, -2.3461408615112305, -1.3558125495910645, -0.3654840588569641, 0.6248444318771362, 1.6151728630065918, 2.605501413345337, 3.595829963684082, 4.586158275604248, 5.576487064361572, 6.566815376281738, 7.557143688201904, 8.54747200012207, 9.537800788879395, 10.528129577636719, 11.518457412719727, 12.50878620147705, 13.499114990234375, 14.489442825317383, 15.479771614074707, 16.47010040283203, 17.46042823791504, 18.450756072998047, 19.441085815429688, 20.431413650512695, 21.421741485595703, 22.412071228027344]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 2.0, 1.0, 2.0, 8.0, 5.0, 13.0, 10.0, 16.0, 19.0, 13.0, 18.0, 21.0, 21.0, 33.0, 31.0, 34.0, 32.0, 45.0, 35.0, 45.0, 38.0, 45.0, 47.0, 44.0, 38.0, 46.0, 42.0, 40.0, 33.0, 25.0, 29.0, 33.0, 13.0, 11.0, 20.0, 18.0, 19.0, 10.0, 9.0, 8.0, 7.0, 9.0, 6.0, 6.0, 1.0, 5.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-27.64544677734375, -26.790151596069336, -25.934856414794922, -25.079561233520508, -24.224266052246094, -23.368968963623047, -22.513673782348633, -21.65837860107422, -20.803083419799805, -19.94778823852539, -19.092493057250977, -18.237197875976562, -17.381900787353516, -16.526607513427734, -15.671310424804688, -14.816015243530273, -13.96072006225586, -13.105424880981445, -12.250129699707031, -11.3948335647583, -10.539538383483887, -9.684243202209473, -8.828947067260742, -7.973651885986328, -7.118356704711914, -6.2630615234375, -5.407765865325928, -4.5524702072143555, -3.6971750259399414, -2.8418798446655273, -1.986584186553955, -1.1312885284423828, -0.27599334716796875, 0.5793020725250244, 1.4345974922180176, 2.2898929119110107, 3.145188331604004, 4.000483512878418, 4.85577917098999, 5.7110748291015625, 6.566370010375977, 7.421665191650391, 8.276960372924805, 9.132256507873535, 9.98755168914795, 10.842846870422363, 11.698143005371094, 12.553438186645508, 13.408733367919922, 14.264028549194336, 15.11932373046875, 15.97461986541748, 16.829914093017578, 17.685211181640625, 18.54050636291504, 19.395801544189453, 20.251096725463867, 21.10639190673828, 21.961687088012695, 22.81698226928711, 23.672279357910156, 24.527572631835938, 25.382869720458984, 26.2381649017334, 27.093460083007812]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 3.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 2.0, 9.0, 11.0, 9.0, 5.0, 13.0, 19.0, 14.0, 15.0, 26.0, 24.0, 20.0, 32.0, 31.0, 40.0, 43.0, 28.0, 42.0, 35.0, 37.0, 44.0, 36.0, 47.0, 45.0, 50.0, 36.0, 30.0, 28.0, 29.0, 32.0, 27.0, 24.0, 23.0, 11.0, 19.0, 14.0, 6.0, 8.0, 8.0, 4.0, 4.0, 5.0, 4.0, 3.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.583984375, -2.499298095703125, -2.41461181640625, -2.329925537109375, -2.2452392578125, -2.160552978515625, -2.07586669921875, -1.991180419921875, -1.906494140625, -1.821807861328125, -1.73712158203125, -1.652435302734375, -1.5677490234375, -1.483062744140625, -1.39837646484375, -1.313690185546875, -1.22900390625, -1.144317626953125, -1.05963134765625, -0.974945068359375, -0.8902587890625, -0.805572509765625, -0.72088623046875, -0.636199951171875, -0.551513671875, -0.466827392578125, -0.38214111328125, -0.297454833984375, -0.2127685546875, -0.128082275390625, -0.04339599609375, 0.041290283203125, 0.1259765625, 0.210662841796875, 0.29534912109375, 0.380035400390625, 0.4647216796875, 0.549407958984375, 0.63409423828125, 0.718780517578125, 0.803466796875, 0.888153076171875, 0.97283935546875, 1.057525634765625, 1.1422119140625, 1.226898193359375, 1.31158447265625, 1.396270751953125, 1.48095703125, 1.565643310546875, 1.65032958984375, 1.735015869140625, 1.8197021484375, 1.904388427734375, 1.98907470703125, 2.073760986328125, 2.158447265625, 2.243133544921875, 2.32781982421875, 2.412506103515625, 2.4971923828125, 2.581878662109375, 2.66656494140625, 2.751251220703125, 2.8359375]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 9.0, 2.0, 11.0, 17.0, 16.0, 24.0, 38.0, 58.0, 73.0, 128.0, 183.0, 242.0, 362.0, 528.0, 814.0, 1292.0, 2181.0, 3794.0, 6861.0, 12989.0, 25007.0, 51117.0, 105546.0, 206548.0, 272404.0, 179259.0, 88920.0, 42786.0, 21735.0, 11037.0, 5903.0, 3248.0, 1942.0, 1222.0, 715.0, 486.0, 322.0, 248.0, 158.0, 104.0, 71.0, 54.0, 38.0, 26.0, 16.0, 13.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.51806640625, -0.5020675659179688, -0.4860687255859375, -0.47006988525390625, -0.454071044921875, -0.43807220458984375, -0.4220733642578125, -0.40607452392578125, -0.39007568359375, -0.37407684326171875, -0.3580780029296875, -0.34207916259765625, -0.326080322265625, -0.31008148193359375, -0.2940826416015625, -0.27808380126953125, -0.2620849609375, -0.24608612060546875, -0.2300872802734375, -0.21408843994140625, -0.198089599609375, -0.18209075927734375, -0.1660919189453125, -0.15009307861328125, -0.13409423828125, -0.11809539794921875, -0.1020965576171875, -0.08609771728515625, -0.070098876953125, -0.05410003662109375, -0.0381011962890625, -0.02210235595703125, -0.006103515625, 0.00989532470703125, 0.0258941650390625, 0.04189300537109375, 0.057891845703125, 0.07389068603515625, 0.0898895263671875, 0.10588836669921875, 0.12188720703125, 0.13788604736328125, 0.1538848876953125, 0.16988372802734375, 0.185882568359375, 0.20188140869140625, 0.2178802490234375, 0.23387908935546875, 0.2498779296875, 0.26587677001953125, 0.2818756103515625, 0.29787445068359375, 0.313873291015625, 0.32987213134765625, 0.3458709716796875, 0.36186981201171875, 0.37786865234375, 0.39386749267578125, 0.4098663330078125, 0.42586517333984375, 0.441864013671875, 0.45786285400390625, 0.4738616943359375, 0.48986053466796875, 0.505859375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 4.0, 3.0, 3.0, 4.0, 5.0, 11.0, 7.0, 15.0, 6.0, 13.0, 11.0, 13.0, 22.0, 19.0, 17.0, 29.0, 28.0, 21.0, 25.0, 32.0, 21.0, 34.0, 47.0, 38.0, 1061.0, 33.0, 45.0, 43.0, 52.0, 39.0, 36.0, 30.0, 37.0, 33.0, 23.0, 23.0, 28.0, 15.0, 15.0, 15.0, 14.0, 21.0, 9.0, 8.0, 4.0, 5.0, 4.0, 4.0, 2.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0], "bins": [-1.7939453125, -1.741058349609375, -1.68817138671875, -1.635284423828125, -1.5823974609375, -1.529510498046875, -1.47662353515625, -1.423736572265625, -1.370849609375, -1.317962646484375, -1.26507568359375, -1.212188720703125, -1.1593017578125, -1.106414794921875, -1.05352783203125, -1.000640869140625, -0.94775390625, -0.894866943359375, -0.84197998046875, -0.789093017578125, -0.7362060546875, -0.683319091796875, -0.63043212890625, -0.577545166015625, -0.524658203125, -0.471771240234375, -0.41888427734375, -0.365997314453125, -0.3131103515625, -0.260223388671875, -0.20733642578125, -0.154449462890625, -0.1015625, -0.048675537109375, 0.00421142578125, 0.057098388671875, 0.1099853515625, 0.162872314453125, 0.21575927734375, 0.268646240234375, 0.321533203125, 0.374420166015625, 0.42730712890625, 0.480194091796875, 0.5330810546875, 0.585968017578125, 0.63885498046875, 0.691741943359375, 0.74462890625, 0.797515869140625, 0.85040283203125, 0.903289794921875, 0.9561767578125, 1.009063720703125, 1.06195068359375, 1.114837646484375, 1.167724609375, 1.220611572265625, 1.27349853515625, 1.326385498046875, 1.3792724609375, 1.432159423828125, 1.48504638671875, 1.537933349609375, 1.5908203125]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 4.0, 3.0, 7.0, 2.0, 8.0, 13.0, 18.0, 28.0, 37.0, 55.0, 101.0, 128.0, 189.0, 329.0, 479.0, 878.0, 1317.0, 2340.0, 3840.0, 6812.0, 11779.0, 20758.0, 37286.0, 65183.0, 112199.0, 185956.0, 1206465.0, 181926.0, 110089.0, 64737.0, 36238.0, 20251.0, 11585.0, 6511.0, 3854.0, 2228.0, 1297.0, 837.0, 473.0, 313.0, 218.0, 112.0, 82.0, 60.0, 34.0, 28.0, 19.0, 17.0, 9.0, 2.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.220703125, -0.21346282958984375, -0.2062225341796875, -0.19898223876953125, -0.191741943359375, -0.18450164794921875, -0.1772613525390625, -0.17002105712890625, -0.16278076171875, -0.15554046630859375, -0.1483001708984375, -0.14105987548828125, -0.133819580078125, -0.12657928466796875, -0.1193389892578125, -0.11209869384765625, -0.1048583984375, -0.09761810302734375, -0.0903778076171875, -0.08313751220703125, -0.075897216796875, -0.06865692138671875, -0.0614166259765625, -0.05417633056640625, -0.04693603515625, -0.03969573974609375, -0.0324554443359375, -0.02521514892578125, -0.017974853515625, -0.01073455810546875, -0.0034942626953125, 0.00374603271484375, 0.010986328125, 0.01822662353515625, 0.0254669189453125, 0.03270721435546875, 0.039947509765625, 0.04718780517578125, 0.0544281005859375, 0.06166839599609375, 0.06890869140625, 0.07614898681640625, 0.0833892822265625, 0.09062957763671875, 0.097869873046875, 0.10511016845703125, 0.1123504638671875, 0.11959075927734375, 0.1268310546875, 0.13407135009765625, 0.1413116455078125, 0.14855194091796875, 0.155792236328125, 0.16303253173828125, 0.1702728271484375, 0.17751312255859375, 0.18475341796875, 0.19199371337890625, 0.1992340087890625, 0.20647430419921875, 0.213714599609375, 0.22095489501953125, 0.2281951904296875, 0.23543548583984375, 0.24267578125]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 3.0, 4.0, 3.0, 4.0, 3.0, 0.0, 2.0, 6.0, 1.0, 8.0, 8.0, 4.0, 13.0, 17.0, 40.0, 45.0, 61.0, 82.0, 110.0, 198.0, 117.0, 81.0, 55.0, 52.0, 25.0, 13.0, 9.0, 9.0, 1.0, 2.0, 8.0, 6.0, 5.0, 4.0, 0.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0538330078125, -0.05235576629638672, -0.05087852478027344, -0.049401283264160156, -0.047924041748046875, -0.046446800231933594, -0.04496955871582031, -0.04349231719970703, -0.04201507568359375, -0.04053783416748047, -0.03906059265136719, -0.037583351135253906, -0.036106109619140625, -0.034628868103027344, -0.03315162658691406, -0.03167438507080078, -0.0301971435546875, -0.02871990203857422, -0.027242660522460938, -0.025765419006347656, -0.024288177490234375, -0.022810935974121094, -0.021333694458007812, -0.01985645294189453, -0.01837921142578125, -0.01690196990966797, -0.015424728393554688, -0.013947486877441406, -0.012470245361328125, -0.010993003845214844, -0.009515762329101562, -0.008038520812988281, -0.006561279296875, -0.005084037780761719, -0.0036067962646484375, -0.0021295547485351562, -0.000652313232421875, 0.0008249282836914062, 0.0023021697998046875, 0.0037794113159179688, 0.00525665283203125, 0.006733894348144531, 0.008211135864257812, 0.009688377380371094, 0.011165618896484375, 0.012642860412597656, 0.014120101928710938, 0.015597343444824219, 0.0170745849609375, 0.01855182647705078, 0.020029067993164062, 0.021506309509277344, 0.022983551025390625, 0.024460792541503906, 0.025938034057617188, 0.02741527557373047, 0.02889251708984375, 0.03036975860595703, 0.03184700012207031, 0.033324241638183594, 0.034801483154296875, 0.036278724670410156, 0.03775596618652344, 0.03923320770263672, 0.04071044921875]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 5.0, 8.0, 11.0, 11.0, 16.0, 25.0, 31.0, 46.0, 57.0, 85.0, 143.0, 405.0, 1983.0, 21898.0, 973787.0, 45915.0, 3070.0, 525.0, 193.0, 112.0, 65.0, 50.0, 26.0, 20.0, 17.0, 11.0, 7.0, 7.0, 3.0, 3.0, 7.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64794921875, -0.624481201171875, -0.60101318359375, -0.577545166015625, -0.5540771484375, -0.530609130859375, -0.50714111328125, -0.483673095703125, -0.460205078125, -0.436737060546875, -0.41326904296875, -0.389801025390625, -0.3663330078125, -0.342864990234375, -0.31939697265625, -0.295928955078125, -0.2724609375, -0.248992919921875, -0.22552490234375, -0.202056884765625, -0.1785888671875, -0.155120849609375, -0.13165283203125, -0.108184814453125, -0.084716796875, -0.061248779296875, -0.03778076171875, -0.014312744140625, 0.0091552734375, 0.032623291015625, 0.05609130859375, 0.079559326171875, 0.10302734375, 0.126495361328125, 0.14996337890625, 0.173431396484375, 0.1968994140625, 0.220367431640625, 0.24383544921875, 0.267303466796875, 0.290771484375, 0.314239501953125, 0.33770751953125, 0.361175537109375, 0.3846435546875, 0.408111572265625, 0.43157958984375, 0.455047607421875, 0.478515625, 0.501983642578125, 0.52545166015625, 0.548919677734375, 0.5723876953125, 0.595855712890625, 0.61932373046875, 0.642791748046875, 0.666259765625, 0.689727783203125, 0.71319580078125, 0.736663818359375, 0.7601318359375, 0.783599853515625, 0.80706787109375, 0.830535888671875, 0.85400390625]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 9.0, 17.0, 54.0, 139.0, 481.0, 226.0, 65.0, 11.0, 7.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.37442389130592346, -0.3613996207714081, -0.3483753204345703, -0.33535104990005493, -0.32232677936553955, -0.30930250883102417, -0.2962782382965088, -0.283253937959671, -0.27022966742515564, -0.25720539689064026, -0.24418111145496368, -0.2311568260192871, -0.21813255548477173, -0.20510828495025635, -0.19208399951457977, -0.1790597140789032, -0.16603544354438782, -0.15301117300987244, -0.13998688757419586, -0.1269626021385193, -0.1139383316040039, -0.10091405361890793, -0.08788977563381195, -0.07486549764871597, -0.061841219663619995, -0.04881694167852402, -0.03579266369342804, -0.022768385708332062, -0.009744107723236084, 0.003280170261859894, 0.01630444824695587, 0.02932872623205185, 0.042353034019470215, 0.05537731200456619, 0.06840158998966217, 0.08142586797475815, 0.09445014595985413, 0.1074744239449501, 0.12049870193004608, 0.13352298736572266, 0.14654725790023804, 0.15957152843475342, 0.17259581387043, 0.18562009930610657, 0.19864436984062195, 0.21166864037513733, 0.2246929258108139, 0.23771721124649048, 0.25074148178100586, 0.26376575231552124, 0.2767900228500366, 0.2898143231868744, 0.30283859372138977, 0.31586286425590515, 0.3288871645927429, 0.3419114351272583, 0.3549357056617737, 0.36795997619628906, 0.38098424673080444, 0.3940085470676422, 0.4070328176021576, 0.420057088136673, 0.43308138847351074, 0.4461056590080261, 0.4591299295425415]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 6.0, 13.0, 12.0, 12.0, 8.0, 8.0, 12.0, 22.0, 20.0, 18.0, 20.0, 26.0, 21.0, 42.0, 23.0, 39.0, 35.0, 41.0, 37.0, 28.0, 44.0, 45.0, 37.0, 29.0, 47.0, 36.0, 34.0, 39.0, 40.0, 30.0, 21.0, 26.0, 29.0, 14.0, 11.0, 22.0, 8.0, 9.0, 10.0, 6.0, 8.0, 4.0, 7.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.07403814792633057, -0.0719212219119072, -0.06980429589748383, -0.06768736988306046, -0.06557044386863708, -0.06345351785421371, -0.061336591839790344, -0.059219665825366974, -0.057102739810943604, -0.05498581379652023, -0.05286888778209686, -0.05075196176767349, -0.04863503575325012, -0.04651810973882675, -0.04440118372440338, -0.04228425770998001, -0.04016733169555664, -0.03805040568113327, -0.0359334796667099, -0.03381655365228653, -0.03169962763786316, -0.02958270162343979, -0.02746577560901642, -0.025348849594593048, -0.023231923580169678, -0.021114997565746307, -0.018998071551322937, -0.016881145536899567, -0.014764219522476196, -0.012647293508052826, -0.010530367493629456, -0.008413441479206085, -0.006296515464782715, -0.0041795894503593445, -0.002062663435935974, 5.426257848739624e-05, 0.0021711885929107666, 0.004288114607334137, 0.006405040621757507, 0.008521966636180878, 0.010638892650604248, 0.012755818665027618, 0.014872744679450989, 0.01698967069387436, 0.01910659670829773, 0.0212235227227211, 0.02334044873714447, 0.02545737475156784, 0.02757430076599121, 0.02969122678041458, 0.03180815279483795, 0.03392507880926132, 0.03604200482368469, 0.03815893083810806, 0.04027585685253143, 0.0423927828669548, 0.044509708881378174, 0.046626634895801544, 0.048743560910224915, 0.050860486924648285, 0.052977412939071655, 0.055094338953495026, 0.057211264967918396, 0.059328190982341766, 0.06144511699676514]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 3.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 2.0, 9.0, 11.0, 8.0, 6.0, 12.0, 20.0, 14.0, 15.0, 26.0, 24.0, 20.0, 32.0, 34.0, 34.0, 43.0, 31.0, 41.0, 36.0, 36.0, 44.0, 36.0, 47.0, 46.0, 51.0, 34.0, 30.0, 29.0, 28.0, 33.0, 26.0, 25.0, 23.0, 11.0, 19.0, 14.0, 6.0, 8.0, 8.0, 4.0, 4.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.583984375, -2.49932861328125, -2.4146728515625, -2.33001708984375, -2.245361328125, -2.16070556640625, -2.0760498046875, -1.99139404296875, -1.90673828125, -1.82208251953125, -1.7374267578125, -1.65277099609375, -1.568115234375, -1.48345947265625, -1.3988037109375, -1.31414794921875, -1.2294921875, -1.14483642578125, -1.0601806640625, -0.97552490234375, -0.890869140625, -0.80621337890625, -0.7215576171875, -0.63690185546875, -0.55224609375, -0.46759033203125, -0.3829345703125, -0.29827880859375, -0.213623046875, -0.12896728515625, -0.0443115234375, 0.04034423828125, 0.125, 0.20965576171875, 0.2943115234375, 0.37896728515625, 0.463623046875, 0.54827880859375, 0.6329345703125, 0.71759033203125, 0.80224609375, 0.88690185546875, 0.9715576171875, 1.05621337890625, 1.140869140625, 1.22552490234375, 1.3101806640625, 1.39483642578125, 1.4794921875, 1.56414794921875, 1.6488037109375, 1.73345947265625, 1.818115234375, 1.90277099609375, 1.9874267578125, 2.07208251953125, 2.15673828125, 2.24139404296875, 2.3260498046875, 2.41070556640625, 2.495361328125, 2.58001708984375, 2.6646728515625, 2.74932861328125, 2.833984375]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 6.0, 1.0, 7.0, 4.0, 7.0, 6.0, 11.0, 12.0, 21.0, 29.0, 48.0, 79.0, 99.0, 126.0, 235.0, 304.0, 519.0, 747.0, 1127.0, 1861.0, 2672.0, 4259.0, 7388.0, 13999.0, 30669.0, 76629.0, 268961.0, 447266.0, 109498.0, 41046.0, 17724.0, 8941.0, 5097.0, 3162.0, 2037.0, 1330.0, 859.0, 604.0, 367.0, 260.0, 178.0, 127.0, 82.0, 52.0, 36.0, 23.0, 18.0, 10.0, 11.0, 9.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.947265625, -2.846221923828125, -2.74517822265625, -2.644134521484375, -2.5430908203125, -2.442047119140625, -2.34100341796875, -2.239959716796875, -2.138916015625, -2.037872314453125, -1.93682861328125, -1.835784912109375, -1.7347412109375, -1.633697509765625, -1.53265380859375, -1.431610107421875, -1.33056640625, -1.229522705078125, -1.12847900390625, -1.027435302734375, -0.9263916015625, -0.825347900390625, -0.72430419921875, -0.623260498046875, -0.522216796875, -0.421173095703125, -0.32012939453125, -0.219085693359375, -0.1180419921875, -0.016998291015625, 0.08404541015625, 0.185089111328125, 0.2861328125, 0.387176513671875, 0.48822021484375, 0.589263916015625, 0.6903076171875, 0.791351318359375, 0.89239501953125, 0.993438720703125, 1.094482421875, 1.195526123046875, 1.29656982421875, 1.397613525390625, 1.4986572265625, 1.599700927734375, 1.70074462890625, 1.801788330078125, 1.90283203125, 2.003875732421875, 2.10491943359375, 2.205963134765625, 2.3070068359375, 2.408050537109375, 2.50909423828125, 2.610137939453125, 2.711181640625, 2.812225341796875, 2.91326904296875, 3.014312744140625, 3.1153564453125, 3.216400146484375, 3.31744384765625, 3.418487548828125, 3.51953125]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 6.0, 3.0, 2.0, 10.0, 3.0, 3.0, 12.0, 6.0, 6.0, 10.0, 12.0, 18.0, 18.0, 25.0, 27.0, 18.0, 25.0, 38.0, 32.0, 24.0, 36.0, 43.0, 60.0, 108.0, 232.0, 1555.0, 216.0, 79.0, 61.0, 46.0, 36.0, 44.0, 40.0, 25.0, 33.0, 27.0, 19.0, 16.0, 13.0, 13.0, 10.0, 8.0, 8.0, 6.0, 8.0, 8.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.9375, -8.6619873046875, -8.386474609375, -8.1109619140625, -7.83544921875, -7.5599365234375, -7.284423828125, -7.0089111328125, -6.7333984375, -6.4578857421875, -6.182373046875, -5.9068603515625, -5.63134765625, -5.3558349609375, -5.080322265625, -4.8048095703125, -4.529296875, -4.2537841796875, -3.978271484375, -3.7027587890625, -3.42724609375, -3.1517333984375, -2.876220703125, -2.6007080078125, -2.3251953125, -2.0496826171875, -1.774169921875, -1.4986572265625, -1.22314453125, -0.9476318359375, -0.672119140625, -0.3966064453125, -0.12109375, 0.1544189453125, 0.429931640625, 0.7054443359375, 0.98095703125, 1.2564697265625, 1.531982421875, 1.8074951171875, 2.0830078125, 2.3585205078125, 2.634033203125, 2.9095458984375, 3.18505859375, 3.4605712890625, 3.736083984375, 4.0115966796875, 4.287109375, 4.5626220703125, 4.838134765625, 5.1136474609375, 5.38916015625, 5.6646728515625, 5.940185546875, 6.2156982421875, 6.4912109375, 6.7667236328125, 7.042236328125, 7.3177490234375, 7.59326171875, 7.8687744140625, 8.144287109375, 8.4197998046875, 8.6953125]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 3.0, 7.0, 5.0, 7.0, 9.0, 21.0, 12.0, 17.0, 20.0, 36.0, 59.0, 79.0, 97.0, 152.0, 225.0, 558.0, 2278.0, 16994.0, 2027140.0, 1079829.0, 14795.0, 2011.0, 523.0, 231.0, 152.0, 110.0, 83.0, 66.0, 45.0, 32.0, 22.0, 20.0, 9.0, 12.0, 13.0, 8.0, 5.0, 5.0, 5.0, 11.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.453125, -17.83740234375, -17.2216796875, -16.60595703125, -15.990234375, -15.37451171875, -14.7587890625, -14.14306640625, -13.52734375, -12.91162109375, -12.2958984375, -11.68017578125, -11.064453125, -10.44873046875, -9.8330078125, -9.21728515625, -8.6015625, -7.98583984375, -7.3701171875, -6.75439453125, -6.138671875, -5.52294921875, -4.9072265625, -4.29150390625, -3.67578125, -3.06005859375, -2.4443359375, -1.82861328125, -1.212890625, -0.59716796875, 0.0185546875, 0.63427734375, 1.25, 1.86572265625, 2.4814453125, 3.09716796875, 3.712890625, 4.32861328125, 4.9443359375, 5.56005859375, 6.17578125, 6.79150390625, 7.4072265625, 8.02294921875, 8.638671875, 9.25439453125, 9.8701171875, 10.48583984375, 11.1015625, 11.71728515625, 12.3330078125, 12.94873046875, 13.564453125, 14.18017578125, 14.7958984375, 15.41162109375, 16.02734375, 16.64306640625, 17.2587890625, 17.87451171875, 18.490234375, 19.10595703125, 19.7216796875, 20.33740234375, 20.953125]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 21.0, 169.0, 428.0, 298.0, 87.0, 8.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.80569458007812, -64.01609802246094, -62.226505279541016, -60.436912536621094, -58.647315979003906, -56.85771942138672, -55.0681266784668, -53.278533935546875, -51.48893737792969, -49.6993408203125, -47.90974807739258, -46.120155334472656, -44.33055877685547, -42.54096221923828, -40.75136947631836, -38.96177673339844, -37.17218017578125, -35.38258361816406, -33.59299087524414, -31.803396224975586, -30.01380157470703, -28.224206924438477, -26.434612274169922, -24.645017623901367, -22.855422973632812, -21.065828323364258, -19.276233673095703, -17.48663902282715, -15.697044372558594, -13.907449722290039, -12.117855072021484, -10.32826042175293, -8.53866195678711, -6.749067306518555, -4.95947265625, -3.1698780059814453, -1.3802833557128906, 0.40931129455566406, 2.1989059448242188, 3.9885005950927734, 5.778095245361328, 7.567689895629883, 9.357284545898438, 11.146879196166992, 12.936473846435547, 14.726068496704102, 16.515663146972656, 18.30525779724121, 20.094852447509766, 21.88444709777832, 23.674041748046875, 25.46363639831543, 27.253231048583984, 29.04282569885254, 30.832420349121094, 32.62201690673828, 34.4116096496582, 36.201202392578125, 37.99079895019531, 39.7803955078125, 41.56998825073242, 43.359580993652344, 45.14917755126953, 46.93877410888672, 48.72836685180664]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 0.0, 5.0, 3.0, 3.0, 3.0, 6.0, 4.0, 6.0, 10.0, 12.0, 13.0, 14.0, 15.0, 24.0, 18.0, 23.0, 17.0, 38.0, 29.0, 31.0, 30.0, 35.0, 38.0, 33.0, 41.0, 37.0, 40.0, 37.0, 38.0, 38.0, 27.0, 35.0, 23.0, 27.0, 27.0, 23.0, 26.0, 27.0, 25.0, 13.0, 13.0, 13.0, 15.0, 9.0, 13.0, 12.0, 6.0, 11.0, 7.0, 5.0, 2.0, 3.0, 2.0, 2.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-23.7745361328125, -22.986364364624023, -22.198190689086914, -21.410018920898438, -20.621845245361328, -19.83367347717285, -19.045501708984375, -18.257328033447266, -17.469154357910156, -16.68098258972168, -15.89280891418457, -15.104637145996094, -14.316463470458984, -13.528291702270508, -12.740118980407715, -11.951946258544922, -11.163774490356445, -10.375601768493652, -9.58742904663086, -8.799257278442383, -8.011083602905273, -7.222911357879639, -6.434739112854004, -5.646566390991211, -4.858393669128418, -4.070220947265625, -3.282048463821411, -2.4938759803771973, -1.7057032585144043, -0.9175305366516113, -0.12935829162597656, 0.6588144302368164, 1.4469871520996094, 2.2351598739624023, 3.023332357406616, 3.81150484085083, 4.599677562713623, 5.387850284576416, 6.176022529602051, 6.964195251464844, 7.752367973327637, 8.54054069519043, 9.328713417053223, 10.116886138916016, 10.905057907104492, 11.693231582641602, 12.481403350830078, 13.269576072692871, 14.057748794555664, 14.845921516418457, 15.63409423828125, 16.422266006469727, 17.210439682006836, 17.998611450195312, 18.786785125732422, 19.5749568939209, 20.363128662109375, 21.15130043029785, 21.93947410583496, 22.727645874023438, 23.515819549560547, 24.303991317749023, 25.0921630859375, 25.88033676147461, 26.66851043701172]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 8.0, 4.0, 7.0, 13.0, 6.0, 13.0, 8.0, 14.0, 18.0, 22.0, 18.0, 21.0, 28.0, 30.0, 29.0, 37.0, 43.0, 35.0, 29.0, 37.0, 46.0, 51.0, 38.0, 44.0, 44.0, 43.0, 34.0, 31.0, 28.0, 32.0, 31.0, 35.0, 19.0, 18.0, 14.0, 14.0, 12.0, 10.0, 7.0, 6.0, 3.0, 8.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.76171875, -2.673492431640625, -2.58526611328125, -2.497039794921875, -2.4088134765625, -2.320587158203125, -2.23236083984375, -2.144134521484375, -2.055908203125, -1.967681884765625, -1.87945556640625, -1.791229248046875, -1.7030029296875, -1.614776611328125, -1.52655029296875, -1.438323974609375, -1.35009765625, -1.261871337890625, -1.17364501953125, -1.085418701171875, -0.9971923828125, -0.908966064453125, -0.82073974609375, -0.732513427734375, -0.644287109375, -0.556060791015625, -0.46783447265625, -0.379608154296875, -0.2913818359375, -0.203155517578125, -0.11492919921875, -0.026702880859375, 0.0615234375, 0.149749755859375, 0.23797607421875, 0.326202392578125, 0.4144287109375, 0.502655029296875, 0.59088134765625, 0.679107666015625, 0.767333984375, 0.855560302734375, 0.94378662109375, 1.032012939453125, 1.1202392578125, 1.208465576171875, 1.29669189453125, 1.384918212890625, 1.47314453125, 1.561370849609375, 1.64959716796875, 1.737823486328125, 1.8260498046875, 1.914276123046875, 2.00250244140625, 2.090728759765625, 2.178955078125, 2.267181396484375, 2.35540771484375, 2.443634033203125, 2.5318603515625, 2.620086669921875, 2.70831298828125, 2.796539306640625, 2.884765625]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 6.0, 16.0, 20.0, 23.0, 27.0, 71.0, 72.0, 82.0, 137.0, 203.0, 307.0, 480.0, 829.0, 1449.0, 2613.0, 4626.0, 8957.0, 17850.0, 35473.0, 77356.0, 184494.0, 496548.0, 1182247.0, 1251447.0, 557067.0, 207864.0, 85490.0, 38688.0, 18746.0, 9659.0, 4893.0, 2701.0, 1552.0, 861.0, 536.0, 294.0, 206.0, 120.0, 80.0, 62.0, 41.0, 18.0, 29.0, 15.0, 14.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3984375, -3.285369873046875, -3.17230224609375, -3.059234619140625, -2.9461669921875, -2.833099365234375, -2.72003173828125, -2.606964111328125, -2.493896484375, -2.380828857421875, -2.26776123046875, -2.154693603515625, -2.0416259765625, -1.928558349609375, -1.81549072265625, -1.702423095703125, -1.58935546875, -1.476287841796875, -1.36322021484375, -1.250152587890625, -1.1370849609375, -1.024017333984375, -0.91094970703125, -0.797882080078125, -0.684814453125, -0.571746826171875, -0.45867919921875, -0.345611572265625, -0.2325439453125, -0.119476318359375, -0.00640869140625, 0.106658935546875, 0.2197265625, 0.332794189453125, 0.44586181640625, 0.558929443359375, 0.6719970703125, 0.785064697265625, 0.89813232421875, 1.011199951171875, 1.124267578125, 1.237335205078125, 1.35040283203125, 1.463470458984375, 1.5765380859375, 1.689605712890625, 1.80267333984375, 1.915740966796875, 2.02880859375, 2.141876220703125, 2.25494384765625, 2.368011474609375, 2.4810791015625, 2.594146728515625, 2.70721435546875, 2.820281982421875, 2.933349609375, 3.046417236328125, 3.15948486328125, 3.272552490234375, 3.3856201171875, 3.498687744140625, 3.61175537109375, 3.724822998046875, 3.837890625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 2.0, 8.0, 7.0, 6.0, 9.0, 11.0, 14.0, 30.0, 31.0, 38.0, 62.0, 97.0, 133.0, 168.0, 223.0, 287.0, 361.0, 454.0, 451.0, 398.0, 305.0, 253.0, 194.0, 141.0, 99.0, 77.0, 57.0, 48.0, 31.0, 18.0, 20.0, 12.0, 7.0, 7.0, 4.0, 5.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.671875, -9.41192626953125, -9.1519775390625, -8.89202880859375, -8.632080078125, -8.37213134765625, -8.1121826171875, -7.85223388671875, -7.59228515625, -7.33233642578125, -7.0723876953125, -6.81243896484375, -6.552490234375, -6.29254150390625, -6.0325927734375, -5.77264404296875, -5.5126953125, -5.25274658203125, -4.9927978515625, -4.73284912109375, -4.472900390625, -4.21295166015625, -3.9530029296875, -3.69305419921875, -3.43310546875, -3.17315673828125, -2.9132080078125, -2.65325927734375, -2.393310546875, -2.13336181640625, -1.8734130859375, -1.61346435546875, -1.353515625, -1.09356689453125, -0.8336181640625, -0.57366943359375, -0.313720703125, -0.05377197265625, 0.2061767578125, 0.46612548828125, 0.72607421875, 0.98602294921875, 1.2459716796875, 1.50592041015625, 1.765869140625, 2.02581787109375, 2.2857666015625, 2.54571533203125, 2.8056640625, 3.06561279296875, 3.3255615234375, 3.58551025390625, 3.845458984375, 4.10540771484375, 4.3653564453125, 4.62530517578125, 4.88525390625, 5.14520263671875, 5.4051513671875, 5.66510009765625, 5.925048828125, 6.18499755859375, 6.4449462890625, 6.70489501953125, 6.96484375]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 5.0, 2.0, 2.0, 5.0, 11.0, 10.0, 16.0, 22.0, 30.0, 46.0, 72.0, 74.0, 133.0, 228.0, 587.0, 1670.0, 6909.0, 54013.0, 774209.0, 3048161.0, 278297.0, 23881.0, 3925.0, 1063.0, 343.0, 205.0, 104.0, 70.0, 51.0, 47.0, 29.0, 16.0, 14.0, 11.0, 8.0, 7.0, 3.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-22.578125, -22.00390625, -21.4296875, -20.85546875, -20.28125, -19.70703125, -19.1328125, -18.55859375, -17.984375, -17.41015625, -16.8359375, -16.26171875, -15.6875, -15.11328125, -14.5390625, -13.96484375, -13.390625, -12.81640625, -12.2421875, -11.66796875, -11.09375, -10.51953125, -9.9453125, -9.37109375, -8.796875, -8.22265625, -7.6484375, -7.07421875, -6.5, -5.92578125, -5.3515625, -4.77734375, -4.203125, -3.62890625, -3.0546875, -2.48046875, -1.90625, -1.33203125, -0.7578125, -0.18359375, 0.390625, 0.96484375, 1.5390625, 2.11328125, 2.6875, 3.26171875, 3.8359375, 4.41015625, 4.984375, 5.55859375, 6.1328125, 6.70703125, 7.28125, 7.85546875, 8.4296875, 9.00390625, 9.578125, 10.15234375, 10.7265625, 11.30078125, 11.875, 12.44921875, 13.0234375, 13.59765625, 14.171875]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 20.0, 69.0, 121.0, 189.0, 226.0, 184.0, 124.0, 54.0, 10.0, 9.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-143.73486328125, -140.88414001464844, -138.03343200683594, -135.18270874023438, -132.3319854736328, -129.4812774658203, -126.63055419921875, -123.77983093261719, -120.92911529541016, -118.07839965820312, -115.22767639160156, -112.37696075439453, -109.5262451171875, -106.67552185058594, -103.8248062133789, -100.97409057617188, -98.12336730957031, -95.27265167236328, -92.42192840576172, -89.57121276855469, -86.72048950195312, -83.8697738647461, -81.01905822753906, -78.1683349609375, -75.31761932373047, -72.46690368652344, -69.61618041992188, -66.76546478271484, -63.91474533081055, -61.06402587890625, -58.21331024169922, -55.36259078979492, -52.511863708496094, -49.6611442565918, -46.8104248046875, -43.95970916748047, -41.10898971557617, -38.258270263671875, -35.407554626464844, -32.55683517456055, -29.70611572265625, -26.855396270751953, -24.00467872619629, -21.153961181640625, -18.303241729736328, -15.452523231506348, -12.601804733276367, -9.751087188720703, -6.900367736816406, -4.049649238586426, -1.1989307403564453, 1.6517877578735352, 4.502506256103516, 7.353224754333496, 10.203943252563477, 13.05466079711914, 15.905380249023438, 18.756099700927734, 21.6068172454834, 24.457534790039062, 27.30825424194336, 30.158973693847656, 33.00968933105469, 35.860408782958984, 38.71112823486328]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 2.0, 3.0, 6.0, 7.0, 12.0, 6.0, 11.0, 20.0, 17.0, 20.0, 19.0, 16.0, 38.0, 22.0, 32.0, 36.0, 34.0, 44.0, 48.0, 53.0, 45.0, 46.0, 48.0, 46.0, 37.0, 32.0, 49.0, 30.0, 36.0, 27.0, 30.0, 24.0, 17.0, 17.0, 14.0, 16.0, 12.0, 10.0, 7.0, 9.0, 2.0, 2.0, 2.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-29.827207565307617, -28.90460777282715, -27.982009887695312, -27.059410095214844, -26.136810302734375, -25.21421241760254, -24.29161262512207, -23.369014739990234, -22.446414947509766, -21.523815155029297, -20.60121726989746, -19.678617477416992, -18.756019592285156, -17.833419799804688, -16.91082000732422, -15.988221168518066, -15.065622329711914, -14.143023490905762, -13.22042465209961, -12.29782485961914, -11.375226020812988, -10.452627182006836, -9.530027389526367, -8.607428550720215, -7.6848297119140625, -6.76223087310791, -5.8396315574646, -4.917032241821289, -3.9944334030151367, -3.0718345642089844, -2.149235248565674, -1.2266359329223633, -0.30403900146484375, 0.6185600757598877, 1.5411591529846191, 2.4637582302093506, 3.386357307434082, 4.308956146240234, 5.231555461883545, 6.1541547775268555, 7.076753616333008, 7.99935245513916, 8.921951293945312, 9.844551086425781, 10.767149925231934, 11.689748764038086, 12.612348556518555, 13.534947395324707, 14.45754623413086, 15.380145072937012, 16.302743911743164, 17.225343704223633, 18.14794158935547, 19.070541381835938, 19.993141174316406, 20.915740966796875, 21.83833885192871, 22.76093864440918, 23.683536529541016, 24.606136322021484, 25.528736114501953, 26.45133399963379, 27.373933792114258, 28.296531677246094, 29.219131469726562]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 6.0, 3.0, 5.0, 6.0, 8.0, 6.0, 6.0, 6.0, 14.0, 11.0, 15.0, 17.0, 17.0, 26.0, 31.0, 30.0, 22.0, 24.0, 28.0, 37.0, 46.0, 35.0, 37.0, 34.0, 40.0, 39.0, 40.0, 30.0, 44.0, 45.0, 43.0, 37.0, 28.0, 23.0, 33.0, 18.0, 24.0, 17.0, 13.0, 14.0, 8.0, 7.0, 7.0, 9.0, 5.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0], "bins": [-3.08203125, -2.992523193359375, -2.90301513671875, -2.813507080078125, -2.7239990234375, -2.634490966796875, -2.54498291015625, -2.455474853515625, -2.365966796875, -2.276458740234375, -2.18695068359375, -2.097442626953125, -2.0079345703125, -1.918426513671875, -1.82891845703125, -1.739410400390625, -1.64990234375, -1.560394287109375, -1.47088623046875, -1.381378173828125, -1.2918701171875, -1.202362060546875, -1.11285400390625, -1.023345947265625, -0.933837890625, -0.844329833984375, -0.75482177734375, -0.665313720703125, -0.5758056640625, -0.486297607421875, -0.39678955078125, -0.307281494140625, -0.2177734375, -0.128265380859375, -0.03875732421875, 0.050750732421875, 0.1402587890625, 0.229766845703125, 0.31927490234375, 0.408782958984375, 0.498291015625, 0.587799072265625, 0.67730712890625, 0.766815185546875, 0.8563232421875, 0.945831298828125, 1.03533935546875, 1.124847412109375, 1.21435546875, 1.303863525390625, 1.39337158203125, 1.482879638671875, 1.5723876953125, 1.661895751953125, 1.75140380859375, 1.840911865234375, 1.930419921875, 2.019927978515625, 2.10943603515625, 2.198944091796875, 2.2884521484375, 2.377960205078125, 2.46746826171875, 2.556976318359375, 2.646484375]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 6.0, 4.0, 7.0, 6.0, 16.0, 25.0, 35.0, 50.0, 67.0, 115.0, 157.0, 269.0, 462.0, 752.0, 1348.0, 2663.0, 4834.0, 9997.0, 20850.0, 44922.0, 94461.0, 191720.0, 283800.0, 200282.0, 100493.0, 47251.0, 22005.0, 10651.0, 5167.0, 2670.0, 1414.0, 769.0, 487.0, 288.0, 177.0, 123.0, 71.0, 44.0, 32.0, 22.0, 15.0, 13.0, 7.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.5966796875, -0.578887939453125, -0.56109619140625, -0.543304443359375, -0.5255126953125, -0.507720947265625, -0.48992919921875, -0.472137451171875, -0.454345703125, -0.436553955078125, -0.41876220703125, -0.400970458984375, -0.3831787109375, -0.365386962890625, -0.34759521484375, -0.329803466796875, -0.31201171875, -0.294219970703125, -0.27642822265625, -0.258636474609375, -0.2408447265625, -0.223052978515625, -0.20526123046875, -0.187469482421875, -0.169677734375, -0.151885986328125, -0.13409423828125, -0.116302490234375, -0.0985107421875, -0.080718994140625, -0.06292724609375, -0.045135498046875, -0.02734375, -0.009552001953125, 0.00823974609375, 0.026031494140625, 0.0438232421875, 0.061614990234375, 0.07940673828125, 0.097198486328125, 0.114990234375, 0.132781982421875, 0.15057373046875, 0.168365478515625, 0.1861572265625, 0.203948974609375, 0.22174072265625, 0.239532470703125, 0.25732421875, 0.275115966796875, 0.29290771484375, 0.310699462890625, 0.3284912109375, 0.346282958984375, 0.36407470703125, 0.381866455078125, 0.399658203125, 0.417449951171875, 0.43524169921875, 0.453033447265625, 0.4708251953125, 0.488616943359375, 0.50640869140625, 0.524200439453125, 0.5419921875]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 4.0, 11.0, 7.0, 8.0, 8.0, 14.0, 13.0, 14.0, 11.0, 14.0, 22.0, 20.0, 26.0, 35.0, 32.0, 31.0, 31.0, 40.0, 40.0, 41.0, 41.0, 1058.0, 37.0, 42.0, 33.0, 43.0, 26.0, 38.0, 43.0, 28.0, 29.0, 36.0, 26.0, 22.0, 22.0, 11.0, 13.0, 13.0, 7.0, 14.0, 3.0, 4.0, 3.0, 3.0, 6.0, 2.0, 3.0, 2.0, 1.0, 2.0], "bins": [-2.072265625, -2.013580322265625, -1.95489501953125, -1.896209716796875, -1.8375244140625, -1.778839111328125, -1.72015380859375, -1.661468505859375, -1.602783203125, -1.544097900390625, -1.48541259765625, -1.426727294921875, -1.3680419921875, -1.309356689453125, -1.25067138671875, -1.191986083984375, -1.13330078125, -1.074615478515625, -1.01593017578125, -0.957244873046875, -0.8985595703125, -0.839874267578125, -0.78118896484375, -0.722503662109375, -0.663818359375, -0.605133056640625, -0.54644775390625, -0.487762451171875, -0.4290771484375, -0.370391845703125, -0.31170654296875, -0.253021240234375, -0.1943359375, -0.135650634765625, -0.07696533203125, -0.018280029296875, 0.0404052734375, 0.099090576171875, 0.15777587890625, 0.216461181640625, 0.275146484375, 0.333831787109375, 0.39251708984375, 0.451202392578125, 0.5098876953125, 0.568572998046875, 0.62725830078125, 0.685943603515625, 0.74462890625, 0.803314208984375, 0.86199951171875, 0.920684814453125, 0.9793701171875, 1.038055419921875, 1.09674072265625, 1.155426025390625, 1.214111328125, 1.272796630859375, 1.33148193359375, 1.390167236328125, 1.4488525390625, 1.507537841796875, 1.56622314453125, 1.624908447265625, 1.68359375]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 3.0, 4.0, 5.0, 16.0, 17.0, 27.0, 33.0, 71.0, 102.0, 157.0, 213.0, 298.0, 535.0, 750.0, 1181.0, 1746.0, 2607.0, 4157.0, 6378.0, 10081.0, 15378.0, 24318.0, 37077.0, 56205.0, 82852.0, 120236.0, 315583.0, 994387.0, 140391.0, 94765.0, 64685.0, 42767.0, 28185.0, 18453.0, 11744.0, 7633.0, 4930.0, 3133.0, 2038.0, 1331.0, 900.0, 555.0, 402.0, 285.0, 160.0, 125.0, 81.0, 51.0, 34.0, 29.0, 20.0, 15.0, 9.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1768798828125, -0.1712055206298828, -0.16553115844726562, -0.15985679626464844, -0.15418243408203125, -0.14850807189941406, -0.14283370971679688, -0.1371593475341797, -0.1314849853515625, -0.1258106231689453, -0.12013626098632812, -0.11446189880371094, -0.10878753662109375, -0.10311317443847656, -0.09743881225585938, -0.09176445007324219, -0.086090087890625, -0.08041572570800781, -0.07474136352539062, -0.06906700134277344, -0.06339263916015625, -0.05771827697753906, -0.052043914794921875, -0.04636955261230469, -0.0406951904296875, -0.03502082824707031, -0.029346466064453125, -0.023672103881835938, -0.01799774169921875, -0.012323379516601562, -0.006649017333984375, -0.0009746551513671875, 0.00469970703125, 0.010374069213867188, 0.016048431396484375, 0.021722793579101562, 0.02739715576171875, 0.03307151794433594, 0.038745880126953125, 0.04442024230957031, 0.0500946044921875, 0.05576896667480469, 0.061443328857421875, 0.06711769104003906, 0.07279205322265625, 0.07846641540527344, 0.08414077758789062, 0.08981513977050781, 0.095489501953125, 0.10116386413574219, 0.10683822631835938, 0.11251258850097656, 0.11818695068359375, 0.12386131286621094, 0.12953567504882812, 0.1352100372314453, 0.1408843994140625, 0.1465587615966797, 0.15223312377929688, 0.15790748596191406, 0.16358184814453125, 0.16925621032714844, 0.17493057250976562, 0.1806049346923828, 0.186279296875]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 8.0, 5.0, 9.0, 10.0, 14.0, 18.0, 28.0, 39.0, 34.0, 74.0, 93.0, 141.0, 124.0, 103.0, 91.0, 45.0, 37.0, 24.0, 26.0, 13.0, 10.0, 16.0, 9.0, 9.0, 9.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.062408447265625, -0.06041383743286133, -0.058419227600097656, -0.056424617767333984, -0.05443000793457031, -0.05243539810180664, -0.05044078826904297, -0.0484461784362793, -0.046451568603515625, -0.04445695877075195, -0.04246234893798828, -0.04046773910522461, -0.03847312927246094, -0.036478519439697266, -0.034483909606933594, -0.03248929977416992, -0.03049468994140625, -0.028500080108642578, -0.026505470275878906, -0.024510860443115234, -0.022516250610351562, -0.02052164077758789, -0.01852703094482422, -0.016532421112060547, -0.014537811279296875, -0.012543201446533203, -0.010548591613769531, -0.00855398178100586, -0.0065593719482421875, -0.004564762115478516, -0.0025701522827148438, -0.0005755424499511719, 0.0014190673828125, 0.003413677215576172, 0.005408287048339844, 0.007402896881103516, 0.009397506713867188, 0.01139211654663086, 0.013386726379394531, 0.015381336212158203, 0.017375946044921875, 0.019370555877685547, 0.02136516571044922, 0.02335977554321289, 0.025354385375976562, 0.027348995208740234, 0.029343605041503906, 0.03133821487426758, 0.03333282470703125, 0.03532743453979492, 0.037322044372558594, 0.039316654205322266, 0.04131126403808594, 0.04330587387084961, 0.04530048370361328, 0.04729509353637695, 0.049289703369140625, 0.0512843132019043, 0.05327892303466797, 0.05527353286743164, 0.05726814270019531, 0.059262752532958984, 0.061257362365722656, 0.06325197219848633, 0.06524658203125]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 9.0, 6.0, 6.0, 17.0, 14.0, 18.0, 26.0, 27.0, 48.0, 75.0, 87.0, 167.0, 455.0, 1630.0, 16537.0, 1000254.0, 26140.0, 1991.0, 489.0, 196.0, 92.0, 108.0, 49.0, 29.0, 24.0, 13.0, 9.0, 13.0, 8.0, 4.0, 5.0, 3.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.9736328125, -0.9437332153320312, -0.9138336181640625, -0.8839340209960938, -0.854034423828125, -0.8241348266601562, -0.7942352294921875, -0.7643356323242188, -0.73443603515625, -0.7045364379882812, -0.6746368408203125, -0.6447372436523438, -0.614837646484375, -0.5849380493164062, -0.5550384521484375, -0.5251388549804688, -0.4952392578125, -0.46533966064453125, -0.4354400634765625, -0.40554046630859375, -0.375640869140625, -0.34574127197265625, -0.3158416748046875, -0.28594207763671875, -0.25604248046875, -0.22614288330078125, -0.1962432861328125, -0.16634368896484375, -0.136444091796875, -0.10654449462890625, -0.0766448974609375, -0.04674530029296875, -0.016845703125, 0.01305389404296875, 0.0429534912109375, 0.07285308837890625, 0.102752685546875, 0.13265228271484375, 0.1625518798828125, 0.19245147705078125, 0.22235107421875, 0.25225067138671875, 0.2821502685546875, 0.31204986572265625, 0.341949462890625, 0.37184906005859375, 0.4017486572265625, 0.43164825439453125, 0.4615478515625, 0.49144744873046875, 0.5213470458984375, 0.5512466430664062, 0.581146240234375, 0.6110458374023438, 0.6409454345703125, 0.6708450317382812, 0.70074462890625, 0.7306442260742188, 0.7605438232421875, 0.7904434204101562, 0.820343017578125, 0.8502426147460938, 0.8801422119140625, 0.9100418090820312, 0.93994140625]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 6.0, 10.0, 18.0, 50.0, 201.0, 554.0, 132.0, 28.0, 10.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6166738271713257, -0.6017930507659912, -0.5869122743606567, -0.5720314383506775, -0.557150661945343, -0.5422698855400085, -0.5273891091346741, -0.5125083327293396, -0.49762752652168274, -0.48274675011634827, -0.4678659439086914, -0.45298516750335693, -0.4381043612957001, -0.4232235848903656, -0.40834277868270874, -0.39346200227737427, -0.3785812258720398, -0.3637004494667053, -0.34881964325904846, -0.333938866853714, -0.31905806064605713, -0.30417728424072266, -0.2892965078353882, -0.2744157016277313, -0.25953489542007446, -0.2446541041135788, -0.22977331280708313, -0.21489253640174866, -0.200011745095253, -0.18513095378875732, -0.17025016248226166, -0.155369371175766, -0.14048859477043152, -0.12560780346393585, -0.11072701960802078, -0.09584622830152512, -0.08096544444561005, -0.06608465313911438, -0.05120386183261871, -0.036323077976703644, -0.021442286670207977, -0.006561498157680035, 0.008319290354847908, 0.023200079798698425, 0.03808086737990379, 0.05296165496110916, 0.06784244626760483, 0.0827232301235199, 0.09760402143001556, 0.11248481273651123, 0.1273656040430069, 0.14224639534950256, 0.15712717175483704, 0.1720079630613327, 0.18688875436782837, 0.20176953077316284, 0.2166503369808197, 0.23153112828731537, 0.24641191959381104, 0.2612926959991455, 0.27617350220680237, 0.29105427861213684, 0.3059350848197937, 0.3208158612251282, 0.33569663763046265]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 5.0, 4.0, 4.0, 4.0, 5.0, 12.0, 13.0, 12.0, 8.0, 12.0, 20.0, 15.0, 20.0, 18.0, 32.0, 30.0, 27.0, 26.0, 28.0, 30.0, 34.0, 34.0, 34.0, 46.0, 36.0, 44.0, 31.0, 34.0, 39.0, 29.0, 35.0, 31.0, 27.0, 30.0, 26.0, 15.0, 21.0, 16.0, 22.0, 13.0, 11.0, 14.0, 12.0, 7.0, 8.0, 8.0, 6.0, 6.0, 3.0, 2.0, 3.0, 0.0, 4.0, 1.0, 2.0, 2.0, 2.0], "bins": [-0.08392399549484253, -0.08129259943962097, -0.07866121083498001, -0.07602982223033905, -0.07339842617511749, -0.07076703011989594, -0.06813564151525497, -0.06550425291061401, -0.06287285685539246, -0.0602414645254612, -0.05761007219552994, -0.05497867986559868, -0.05234728753566742, -0.04971589520573616, -0.0470845028758049, -0.04445311054587364, -0.04182171821594238, -0.039190325886011124, -0.036558933556079865, -0.033927541226148605, -0.031296148896217346, -0.028664756566286087, -0.026033364236354828, -0.02340197190642357, -0.02077057957649231, -0.01813918724656105, -0.015507794916629791, -0.012876402586698532, -0.010245010256767273, -0.007613617926836014, -0.004982225596904755, -0.0023508332669734955, 0.00028055906295776367, 0.002911951392889023, 0.005543343722820282, 0.008174736052751541, 0.0108061283826828, 0.01343752071261406, 0.01606891304254532, 0.018700305372476578, 0.021331697702407837, 0.023963090032339096, 0.026594482362270355, 0.029225874692201614, 0.031857267022132874, 0.03448865935206413, 0.03712005168199539, 0.03975144401192665, 0.04238283634185791, 0.04501422867178917, 0.04764562100172043, 0.05027701333165169, 0.05290840566158295, 0.055539797991514206, 0.058171190321445465, 0.060802582651376724, 0.06343397498130798, 0.06606537103652954, 0.0686967596411705, 0.07132814824581146, 0.07395954430103302, 0.07659094035625458, 0.07922232896089554, 0.0818537175655365, 0.08448511362075806]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 6.0, 3.0, 5.0, 6.0, 8.0, 6.0, 6.0, 7.0, 13.0, 12.0, 14.0, 17.0, 18.0, 25.0, 30.0, 33.0, 20.0, 24.0, 27.0, 39.0, 46.0, 36.0, 34.0, 35.0, 39.0, 44.0, 36.0, 29.0, 44.0, 51.0, 39.0, 36.0, 28.0, 26.0, 30.0, 18.0, 24.0, 17.0, 12.0, 16.0, 7.0, 6.0, 8.0, 9.0, 5.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0], "bins": [-3.08203125, -2.99249267578125, -2.9029541015625, -2.81341552734375, -2.723876953125, -2.63433837890625, -2.5447998046875, -2.45526123046875, -2.36572265625, -2.27618408203125, -2.1866455078125, -2.09710693359375, -2.007568359375, -1.91802978515625, -1.8284912109375, -1.73895263671875, -1.6494140625, -1.55987548828125, -1.4703369140625, -1.38079833984375, -1.291259765625, -1.20172119140625, -1.1121826171875, -1.02264404296875, -0.93310546875, -0.84356689453125, -0.7540283203125, -0.66448974609375, -0.574951171875, -0.48541259765625, -0.3958740234375, -0.30633544921875, -0.216796875, -0.12725830078125, -0.0377197265625, 0.05181884765625, 0.141357421875, 0.23089599609375, 0.3204345703125, 0.40997314453125, 0.49951171875, 0.58905029296875, 0.6785888671875, 0.76812744140625, 0.857666015625, 0.94720458984375, 1.0367431640625, 1.12628173828125, 1.2158203125, 1.30535888671875, 1.3948974609375, 1.48443603515625, 1.573974609375, 1.66351318359375, 1.7530517578125, 1.84259033203125, 1.93212890625, 2.02166748046875, 2.1112060546875, 2.20074462890625, 2.290283203125, 2.37982177734375, 2.4693603515625, 2.55889892578125, 2.6484375]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 3.0, 3.0, 3.0, 7.0, 8.0, 25.0, 23.0, 32.0, 38.0, 79.0, 94.0, 136.0, 208.0, 263.0, 401.0, 583.0, 847.0, 1246.0, 1906.0, 2927.0, 4847.0, 8974.0, 17122.0, 37591.0, 93770.0, 266215.0, 365524.0, 141602.0, 53153.0, 23090.0, 11276.0, 6156.0, 3620.0, 2297.0, 1422.0, 965.0, 626.0, 424.0, 295.0, 232.0, 155.0, 115.0, 76.0, 55.0, 38.0, 19.0, 28.0, 13.0, 10.0, 10.0, 6.0, 3.0, 2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.501953125, -2.416259765625, -2.33056640625, -2.244873046875, -2.1591796875, -2.073486328125, -1.98779296875, -1.902099609375, -1.81640625, -1.730712890625, -1.64501953125, -1.559326171875, -1.4736328125, -1.387939453125, -1.30224609375, -1.216552734375, -1.130859375, -1.045166015625, -0.95947265625, -0.873779296875, -0.7880859375, -0.702392578125, -0.61669921875, -0.531005859375, -0.4453125, -0.359619140625, -0.27392578125, -0.188232421875, -0.1025390625, -0.016845703125, 0.06884765625, 0.154541015625, 0.240234375, 0.325927734375, 0.41162109375, 0.497314453125, 0.5830078125, 0.668701171875, 0.75439453125, 0.840087890625, 0.92578125, 1.011474609375, 1.09716796875, 1.182861328125, 1.2685546875, 1.354248046875, 1.43994140625, 1.525634765625, 1.611328125, 1.697021484375, 1.78271484375, 1.868408203125, 1.9541015625, 2.039794921875, 2.12548828125, 2.211181640625, 2.296875, 2.382568359375, 2.46826171875, 2.553955078125, 2.6396484375, 2.725341796875, 2.81103515625, 2.896728515625, 2.982421875]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 3.0, 10.0, 8.0, 9.0, 8.0, 17.0, 19.0, 29.0, 33.0, 38.0, 37.0, 40.0, 40.0, 40.0, 66.0, 118.0, 406.0, 1567.0, 144.0, 77.0, 55.0, 46.0, 43.0, 46.0, 34.0, 22.0, 23.0, 20.0, 8.0, 13.0, 9.0, 8.0, 6.0, 4.0, 3.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.796875, -14.3494873046875, -13.902099609375, -13.4547119140625, -13.00732421875, -12.5599365234375, -12.112548828125, -11.6651611328125, -11.2177734375, -10.7703857421875, -10.322998046875, -9.8756103515625, -9.42822265625, -8.9808349609375, -8.533447265625, -8.0860595703125, -7.638671875, -7.1912841796875, -6.743896484375, -6.2965087890625, -5.84912109375, -5.4017333984375, -4.954345703125, -4.5069580078125, -4.0595703125, -3.6121826171875, -3.164794921875, -2.7174072265625, -2.27001953125, -1.8226318359375, -1.375244140625, -0.9278564453125, -0.48046875, -0.0330810546875, 0.414306640625, 0.8616943359375, 1.30908203125, 1.7564697265625, 2.203857421875, 2.6512451171875, 3.0986328125, 3.5460205078125, 3.993408203125, 4.4407958984375, 4.88818359375, 5.3355712890625, 5.782958984375, 6.2303466796875, 6.677734375, 7.1251220703125, 7.572509765625, 8.0198974609375, 8.46728515625, 8.9146728515625, 9.362060546875, 9.8094482421875, 10.2568359375, 10.7042236328125, 11.151611328125, 11.5989990234375, 12.04638671875, 12.4937744140625, 12.941162109375, 13.3885498046875, 13.8359375]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 8.0, 3.0, 5.0, 11.0, 11.0, 13.0, 14.0, 21.0, 33.0, 41.0, 68.0, 92.0, 128.0, 197.0, 361.0, 918.0, 11552.0, 3021584.0, 106889.0, 2430.0, 496.0, 265.0, 157.0, 105.0, 75.0, 61.0, 46.0, 30.0, 22.0, 20.0, 14.0, 10.0, 8.0, 8.0, 4.0, 2.0, 3.0, 5.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.59375, -26.696044921875, -25.79833984375, -24.900634765625, -24.0029296875, -23.105224609375, -22.20751953125, -21.309814453125, -20.412109375, -19.514404296875, -18.61669921875, -17.718994140625, -16.8212890625, -15.923583984375, -15.02587890625, -14.128173828125, -13.23046875, -12.332763671875, -11.43505859375, -10.537353515625, -9.6396484375, -8.741943359375, -7.84423828125, -6.946533203125, -6.048828125, -5.151123046875, -4.25341796875, -3.355712890625, -2.4580078125, -1.560302734375, -0.66259765625, 0.235107421875, 1.1328125, 2.030517578125, 2.92822265625, 3.825927734375, 4.7236328125, 5.621337890625, 6.51904296875, 7.416748046875, 8.314453125, 9.212158203125, 10.10986328125, 11.007568359375, 11.9052734375, 12.802978515625, 13.70068359375, 14.598388671875, 15.49609375, 16.393798828125, 17.29150390625, 18.189208984375, 19.0869140625, 19.984619140625, 20.88232421875, 21.780029296875, 22.677734375, 23.575439453125, 24.47314453125, 25.370849609375, 26.2685546875, 27.166259765625, 28.06396484375, 28.961669921875, 29.859375]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 112.0, 873.0, 31.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-274.7069396972656, -269.7449035644531, -264.78289794921875, -259.82086181640625, -254.8588409423828, -249.89682006835938, -244.93478393554688, -239.97276306152344, -235.0107421875, -230.04872131347656, -225.08670043945312, -220.12466430664062, -215.1626434326172, -210.20062255859375, -205.23858642578125, -200.2765655517578, -195.31454467773438, -190.35252380371094, -185.3905029296875, -180.428466796875, -175.46644592285156, -170.50442504882812, -165.54238891601562, -160.5803680419922, -155.61834716796875, -150.6563262939453, -145.69430541992188, -140.73226928710938, -135.77024841308594, -130.8082275390625, -125.84619903564453, -120.88417053222656, -115.9221420288086, -110.96011352539062, -105.99809265136719, -101.03607177734375, -96.07404327392578, -91.11201477050781, -86.14999389648438, -81.18797302246094, -76.22594451904297, -71.263916015625, -66.30189514160156, -61.33987045288086, -56.377845764160156, -51.41582107543945, -46.45379638671875, -41.49177169799805, -36.529747009277344, -31.56772232055664, -26.605697631835938, -21.643672943115234, -16.68164825439453, -11.719623565673828, -6.757598876953125, -1.7955741882324219, 3.1664505004882812, 8.128475189208984, 13.090499877929688, 18.05252456665039, 23.014549255371094, 27.976573944091797, 32.9385986328125, 37.9006233215332, 42.862648010253906]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 3.0, 2.0, 4.0, 13.0, 9.0, 12.0, 20.0, 16.0, 10.0, 16.0, 20.0, 27.0, 28.0, 31.0, 32.0, 29.0, 35.0, 31.0, 55.0, 40.0, 29.0, 30.0, 39.0, 30.0, 38.0, 45.0, 31.0, 39.0, 22.0, 35.0, 24.0, 25.0, 19.0, 17.0, 25.0, 20.0, 11.0, 15.0, 9.0, 12.0, 12.0, 12.0, 9.0, 4.0, 4.0, 3.0, 2.0, 1.0, 5.0, 3.0, 1.0, 3.0, 2.0, 2.0], "bins": [-26.7233943939209, -25.895402908325195, -25.06740951538086, -24.239418029785156, -23.411426544189453, -22.583433151245117, -21.755441665649414, -20.927448272705078, -20.099456787109375, -19.271465301513672, -18.443471908569336, -17.615480422973633, -16.787487030029297, -15.959495544433594, -15.13150405883789, -14.303511619567871, -13.475519180297852, -12.647526741027832, -11.819534301757812, -10.99154281616211, -10.16355037689209, -9.33555793762207, -8.507566452026367, -7.679574012756348, -6.851581573486328, -6.023589134216309, -5.195597171783447, -4.367605209350586, -3.5396127700805664, -2.711620330810547, -1.8836283683776855, -1.0556364059448242, -0.22764205932617188, 0.6003501415252686, 1.428342342376709, 2.2563345432281494, 3.08432674407959, 3.9123191833496094, 4.740311145782471, 5.568303108215332, 6.396295547485352, 7.224287986755371, 8.05228042602539, 8.880271911621094, 9.708264350891113, 10.536256790161133, 11.364248275756836, 12.192240715026855, 13.020233154296875, 13.848225593566895, 14.676218032836914, 15.504209518432617, 16.332202911376953, 17.160194396972656, 17.98818588256836, 18.816177368164062, 19.6441707611084, 20.4721622467041, 21.300155639648438, 22.12814712524414, 22.956138610839844, 23.78413200378418, 24.612123489379883, 25.44011688232422, 26.268108367919922]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 6.0, 2.0, 6.0, 8.0, 7.0, 4.0, 4.0, 10.0, 5.0, 15.0, 14.0, 17.0, 20.0, 20.0, 28.0, 25.0, 32.0, 25.0, 27.0, 24.0, 40.0, 36.0, 49.0, 35.0, 39.0, 37.0, 42.0, 41.0, 32.0, 36.0, 36.0, 44.0, 43.0, 18.0, 30.0, 25.0, 23.0, 12.0, 21.0, 16.0, 7.0, 8.0, 9.0, 9.0, 3.0, 7.0, 3.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0], "bins": [-3.12890625, -3.0364990234375, -2.944091796875, -2.8516845703125, -2.75927734375, -2.6668701171875, -2.574462890625, -2.4820556640625, -2.3896484375, -2.2972412109375, -2.204833984375, -2.1124267578125, -2.02001953125, -1.9276123046875, -1.835205078125, -1.7427978515625, -1.650390625, -1.5579833984375, -1.465576171875, -1.3731689453125, -1.28076171875, -1.1883544921875, -1.095947265625, -1.0035400390625, -0.9111328125, -0.8187255859375, -0.726318359375, -0.6339111328125, -0.54150390625, -0.4490966796875, -0.356689453125, -0.2642822265625, -0.171875, -0.0794677734375, 0.012939453125, 0.1053466796875, 0.19775390625, 0.2901611328125, 0.382568359375, 0.4749755859375, 0.5673828125, 0.6597900390625, 0.752197265625, 0.8446044921875, 0.93701171875, 1.0294189453125, 1.121826171875, 1.2142333984375, 1.306640625, 1.3990478515625, 1.491455078125, 1.5838623046875, 1.67626953125, 1.7686767578125, 1.861083984375, 1.9534912109375, 2.0458984375, 2.1383056640625, 2.230712890625, 2.3231201171875, 2.41552734375, 2.5079345703125, 2.600341796875, 2.6927490234375, 2.78515625]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 4.0, 1.0, 3.0, 8.0, 2.0, 4.0, 3.0, 5.0, 11.0, 12.0, 10.0, 15.0, 11.0, 19.0, 30.0, 42.0, 38.0, 53.0, 72.0, 91.0, 144.0, 249.0, 758.0, 2719.0, 13801.0, 106990.0, 1601750.0, 2281803.0, 160994.0, 19296.0, 3473.0, 933.0, 343.0, 159.0, 111.0, 69.0, 48.0, 48.0, 33.0, 27.0, 20.0, 22.0, 11.0, 10.0, 10.0, 12.0, 9.0, 5.0, 6.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.6328125, -11.270263671875, -10.90771484375, -10.545166015625, -10.1826171875, -9.820068359375, -9.45751953125, -9.094970703125, -8.732421875, -8.369873046875, -8.00732421875, -7.644775390625, -7.2822265625, -6.919677734375, -6.55712890625, -6.194580078125, -5.83203125, -5.469482421875, -5.10693359375, -4.744384765625, -4.3818359375, -4.019287109375, -3.65673828125, -3.294189453125, -2.931640625, -2.569091796875, -2.20654296875, -1.843994140625, -1.4814453125, -1.118896484375, -0.75634765625, -0.393798828125, -0.03125, 0.331298828125, 0.69384765625, 1.056396484375, 1.4189453125, 1.781494140625, 2.14404296875, 2.506591796875, 2.869140625, 3.231689453125, 3.59423828125, 3.956787109375, 4.3193359375, 4.681884765625, 5.04443359375, 5.406982421875, 5.76953125, 6.132080078125, 6.49462890625, 6.857177734375, 7.2197265625, 7.582275390625, 7.94482421875, 8.307373046875, 8.669921875, 9.032470703125, 9.39501953125, 9.757568359375, 10.1201171875, 10.482666015625, 10.84521484375, 11.207763671875, 11.5703125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 9.0, 14.0, 14.0, 12.0, 24.0, 34.0, 51.0, 68.0, 99.0, 128.0, 170.0, 264.0, 336.0, 394.0, 507.0, 450.0, 400.0, 290.0, 199.0, 182.0, 125.0, 69.0, 70.0, 59.0, 31.0, 26.0, 18.0, 7.0, 4.0, 10.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.9296875, -9.6448974609375, -9.360107421875, -9.0753173828125, -8.79052734375, -8.5057373046875, -8.220947265625, -7.9361572265625, -7.6513671875, -7.3665771484375, -7.081787109375, -6.7969970703125, -6.51220703125, -6.2274169921875, -5.942626953125, -5.6578369140625, -5.373046875, -5.0882568359375, -4.803466796875, -4.5186767578125, -4.23388671875, -3.9490966796875, -3.664306640625, -3.3795166015625, -3.0947265625, -2.8099365234375, -2.525146484375, -2.2403564453125, -1.95556640625, -1.6707763671875, -1.385986328125, -1.1011962890625, -0.81640625, -0.5316162109375, -0.246826171875, 0.0379638671875, 0.32275390625, 0.6075439453125, 0.892333984375, 1.1771240234375, 1.4619140625, 1.7467041015625, 2.031494140625, 2.3162841796875, 2.60107421875, 2.8858642578125, 3.170654296875, 3.4554443359375, 3.740234375, 4.0250244140625, 4.309814453125, 4.5946044921875, 4.87939453125, 5.1641845703125, 5.448974609375, 5.7337646484375, 6.0185546875, 6.3033447265625, 6.588134765625, 6.8729248046875, 7.15771484375, 7.4425048828125, 7.727294921875, 8.0120849609375, 8.296875]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 10.0, 8.0, 10.0, 15.0, 14.0, 22.0, 41.0, 51.0, 73.0, 91.0, 132.0, 201.0, 335.0, 670.0, 2216.0, 17090.0, 361152.0, 3484113.0, 309267.0, 15004.0, 2109.0, 689.0, 327.0, 190.0, 133.0, 100.0, 63.0, 44.0, 38.0, 13.0, 18.0, 15.0, 9.0, 7.0, 4.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.84375, -20.11181640625, -19.3798828125, -18.64794921875, -17.916015625, -17.18408203125, -16.4521484375, -15.72021484375, -14.98828125, -14.25634765625, -13.5244140625, -12.79248046875, -12.060546875, -11.32861328125, -10.5966796875, -9.86474609375, -9.1328125, -8.40087890625, -7.6689453125, -6.93701171875, -6.205078125, -5.47314453125, -4.7412109375, -4.00927734375, -3.27734375, -2.54541015625, -1.8134765625, -1.08154296875, -0.349609375, 0.38232421875, 1.1142578125, 1.84619140625, 2.578125, 3.31005859375, 4.0419921875, 4.77392578125, 5.505859375, 6.23779296875, 6.9697265625, 7.70166015625, 8.43359375, 9.16552734375, 9.8974609375, 10.62939453125, 11.361328125, 12.09326171875, 12.8251953125, 13.55712890625, 14.2890625, 15.02099609375, 15.7529296875, 16.48486328125, 17.216796875, 17.94873046875, 18.6806640625, 19.41259765625, 20.14453125, 20.87646484375, 21.6083984375, 22.34033203125, 23.072265625, 23.80419921875, 24.5361328125, 25.26806640625, 26.0]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 6.0, 19.0, 57.0, 125.0, 235.0, 257.0, 181.0, 90.0, 37.0, 10.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-91.6572036743164, -88.17896270751953, -84.70072174072266, -81.22248077392578, -77.74423217773438, -74.2659912109375, -70.78775024414062, -67.30950927734375, -63.831268310546875, -60.35302734375, -56.874786376953125, -53.396541595458984, -49.91830062866211, -46.440059661865234, -42.961814880371094, -39.48357391357422, -36.005332946777344, -32.52709197998047, -29.04884910583496, -25.570606231689453, -22.092365264892578, -18.614124298095703, -15.135881423950195, -11.657638549804688, -8.179397583007812, -4.701155662536621, -1.2229137420654297, 2.2553281784057617, 5.733570098876953, 9.211811065673828, 12.690053939819336, 16.168296813964844, 19.64654541015625, 23.124786376953125, 26.603029251098633, 30.08127212524414, 33.559513092041016, 37.03775405883789, 40.51599884033203, 43.994239807128906, 47.47248077392578, 50.950721740722656, 54.42896270751953, 57.90720748901367, 61.38544845581055, 64.86369323730469, 68.34193420410156, 71.82017517089844, 75.29841613769531, 78.77665710449219, 82.25489807128906, 85.73313903808594, 89.21138000488281, 92.68962097167969, 96.1678695678711, 99.64611053466797, 103.12435150146484, 106.60259246826172, 110.0808334350586, 113.55907440185547, 117.03732299804688, 120.51556396484375, 123.99380493164062, 127.4720458984375, 130.95028686523438]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 1.0, 0.0, 2.0, 4.0, 4.0, 5.0, 6.0, 7.0, 12.0, 17.0, 3.0, 14.0, 17.0, 16.0, 20.0, 23.0, 24.0, 40.0, 27.0, 31.0, 38.0, 34.0, 35.0, 47.0, 34.0, 38.0, 52.0, 37.0, 38.0, 39.0, 34.0, 27.0, 44.0, 32.0, 31.0, 24.0, 20.0, 23.0, 30.0, 15.0, 10.0, 13.0, 11.0, 14.0, 6.0, 2.0, 7.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-28.69482421875, -27.821910858154297, -26.948997497558594, -26.07608413696289, -25.203170776367188, -24.330257415771484, -23.45734405517578, -22.584430694580078, -21.711517333984375, -20.838603973388672, -19.96569061279297, -19.092777252197266, -18.219863891601562, -17.34695053100586, -16.474037170410156, -15.601123809814453, -14.72821044921875, -13.855297088623047, -12.982383728027344, -12.10947036743164, -11.236557006835938, -10.363643646240234, -9.490730285644531, -8.617816925048828, -7.744903564453125, -6.871990203857422, -5.999076843261719, -5.126163482666016, -4.2532501220703125, -3.3803367614746094, -2.5074234008789062, -1.6345100402832031, -0.7615966796875, 0.11131668090820312, 0.9842300415039062, 1.8571434020996094, 2.7300567626953125, 3.6029701232910156, 4.475883483886719, 5.348796844482422, 6.221710205078125, 7.094623565673828, 7.967536926269531, 8.840450286865234, 9.713363647460938, 10.58627700805664, 11.459190368652344, 12.332103729248047, 13.20501708984375, 14.077930450439453, 14.950843811035156, 15.82375717163086, 16.696670532226562, 17.569583892822266, 18.44249725341797, 19.315410614013672, 20.188323974609375, 21.061237335205078, 21.93415069580078, 22.807064056396484, 23.679977416992188, 24.55289077758789, 25.425804138183594, 26.298717498779297, 27.171630859375]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 5.0, 5.0, 9.0, 7.0, 10.0, 6.0, 13.0, 12.0, 24.0, 26.0, 14.0, 24.0, 27.0, 31.0, 22.0, 32.0, 29.0, 31.0, 36.0, 42.0, 35.0, 34.0, 49.0, 31.0, 41.0, 44.0, 40.0, 43.0, 31.0, 27.0, 20.0, 33.0, 28.0, 17.0, 28.0, 18.0, 16.0, 8.0, 5.0, 8.0, 5.0, 9.0, 4.0, 6.0, 2.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-2.994140625, -2.900634765625, -2.80712890625, -2.713623046875, -2.6201171875, -2.526611328125, -2.43310546875, -2.339599609375, -2.24609375, -2.152587890625, -2.05908203125, -1.965576171875, -1.8720703125, -1.778564453125, -1.68505859375, -1.591552734375, -1.498046875, -1.404541015625, -1.31103515625, -1.217529296875, -1.1240234375, -1.030517578125, -0.93701171875, -0.843505859375, -0.75, -0.656494140625, -0.56298828125, -0.469482421875, -0.3759765625, -0.282470703125, -0.18896484375, -0.095458984375, -0.001953125, 0.091552734375, 0.18505859375, 0.278564453125, 0.3720703125, 0.465576171875, 0.55908203125, 0.652587890625, 0.74609375, 0.839599609375, 0.93310546875, 1.026611328125, 1.1201171875, 1.213623046875, 1.30712890625, 1.400634765625, 1.494140625, 1.587646484375, 1.68115234375, 1.774658203125, 1.8681640625, 1.961669921875, 2.05517578125, 2.148681640625, 2.2421875, 2.335693359375, 2.42919921875, 2.522705078125, 2.6162109375, 2.709716796875, 2.80322265625, 2.896728515625, 2.990234375]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 5.0, 5.0, 6.0, 12.0, 20.0, 23.0, 46.0, 62.0, 67.0, 132.0, 192.0, 273.0, 490.0, 724.0, 1038.0, 1684.0, 2431.0, 3821.0, 5890.0, 8892.0, 13544.0, 20294.0, 30690.0, 45944.0, 67977.0, 96976.0, 129616.0, 150398.0, 136996.0, 104977.0, 74427.0, 50746.0, 33797.0, 22628.0, 14952.0, 9888.0, 6414.0, 4332.0, 2826.0, 1837.0, 1248.0, 789.0, 468.0, 339.0, 208.0, 149.0, 92.0, 59.0, 61.0, 21.0, 26.0, 12.0, 10.0, 5.0, 6.0, 1.0, 2.0, 0.0, 3.0], "bins": [-0.3056640625, -0.296295166015625, -0.28692626953125, -0.277557373046875, -0.2681884765625, -0.258819580078125, -0.24945068359375, -0.240081787109375, -0.230712890625, -0.221343994140625, -0.21197509765625, -0.202606201171875, -0.1932373046875, -0.183868408203125, -0.17449951171875, -0.165130615234375, -0.15576171875, -0.146392822265625, -0.13702392578125, -0.127655029296875, -0.1182861328125, -0.108917236328125, -0.09954833984375, -0.090179443359375, -0.080810546875, -0.071441650390625, -0.06207275390625, -0.052703857421875, -0.0433349609375, -0.033966064453125, -0.02459716796875, -0.015228271484375, -0.005859375, 0.003509521484375, 0.01287841796875, 0.022247314453125, 0.0316162109375, 0.040985107421875, 0.05035400390625, 0.059722900390625, 0.069091796875, 0.078460693359375, 0.08782958984375, 0.097198486328125, 0.1065673828125, 0.115936279296875, 0.12530517578125, 0.134674072265625, 0.14404296875, 0.153411865234375, 0.16278076171875, 0.172149658203125, 0.1815185546875, 0.190887451171875, 0.20025634765625, 0.209625244140625, 0.218994140625, 0.228363037109375, 0.23773193359375, 0.247100830078125, 0.2564697265625, 0.265838623046875, 0.27520751953125, 0.284576416015625, 0.2939453125]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 11.0, 8.0, 11.0, 14.0, 17.0, 21.0, 18.0, 21.0, 28.0, 38.0, 24.0, 24.0, 30.0, 46.0, 36.0, 37.0, 46.0, 1059.0, 49.0, 45.0, 50.0, 36.0, 38.0, 39.0, 44.0, 30.0, 31.0, 25.0, 32.0, 24.0, 16.0, 14.0, 11.0, 12.0, 13.0, 10.0, 7.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.259765625, -2.1890869140625, -2.118408203125, -2.0477294921875, -1.97705078125, -1.9063720703125, -1.835693359375, -1.7650146484375, -1.6943359375, -1.6236572265625, -1.552978515625, -1.4822998046875, -1.41162109375, -1.3409423828125, -1.270263671875, -1.1995849609375, -1.12890625, -1.0582275390625, -0.987548828125, -0.9168701171875, -0.84619140625, -0.7755126953125, -0.704833984375, -0.6341552734375, -0.5634765625, -0.4927978515625, -0.422119140625, -0.3514404296875, -0.28076171875, -0.2100830078125, -0.139404296875, -0.0687255859375, 0.001953125, 0.0726318359375, 0.143310546875, 0.2139892578125, 0.28466796875, 0.3553466796875, 0.426025390625, 0.4967041015625, 0.5673828125, 0.6380615234375, 0.708740234375, 0.7794189453125, 0.85009765625, 0.9207763671875, 0.991455078125, 1.0621337890625, 1.1328125, 1.2034912109375, 1.274169921875, 1.3448486328125, 1.41552734375, 1.4862060546875, 1.556884765625, 1.6275634765625, 1.6982421875, 1.7689208984375, 1.839599609375, 1.9102783203125, 1.98095703125, 2.0516357421875, 2.122314453125, 2.1929931640625, 2.263671875]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 7.0, 9.0, 15.0, 23.0, 30.0, 49.0, 72.0, 112.0, 156.0, 271.0, 390.0, 508.0, 805.0, 1242.0, 1829.0, 2831.0, 4028.0, 6219.0, 9593.0, 14400.0, 21357.0, 32800.0, 48040.0, 69927.0, 98017.0, 144973.0, 1047124.0, 228669.0, 112078.0, 80563.0, 56572.0, 38609.0, 25465.0, 17156.0, 11234.0, 7413.0, 4910.0, 3303.0, 2157.0, 1381.0, 917.0, 594.0, 424.0, 301.0, 201.0, 112.0, 85.0, 65.0, 36.0, 21.0, 27.0, 8.0, 7.0, 7.0, 1.0, 2.0], "bins": [-0.1837158203125, -0.1784229278564453, -0.17313003540039062, -0.16783714294433594, -0.16254425048828125, -0.15725135803222656, -0.15195846557617188, -0.1466655731201172, -0.1413726806640625, -0.1360797882080078, -0.13078689575195312, -0.12549400329589844, -0.12020111083984375, -0.11490821838378906, -0.10961532592773438, -0.10432243347167969, -0.099029541015625, -0.09373664855957031, -0.08844375610351562, -0.08315086364746094, -0.07785797119140625, -0.07256507873535156, -0.06727218627929688, -0.06197929382324219, -0.0566864013671875, -0.05139350891113281, -0.046100616455078125, -0.04080772399902344, -0.03551483154296875, -0.030221939086914062, -0.024929046630859375, -0.019636154174804688, -0.01434326171875, -0.009050369262695312, -0.003757476806640625, 0.0015354156494140625, 0.00682830810546875, 0.012121200561523438, 0.017414093017578125, 0.022706985473632812, 0.0279998779296875, 0.03329277038574219, 0.038585662841796875, 0.04387855529785156, 0.04917144775390625, 0.05446434020996094, 0.059757232666015625, 0.06505012512207031, 0.070343017578125, 0.07563591003417969, 0.08092880249023438, 0.08622169494628906, 0.09151458740234375, 0.09680747985839844, 0.10210037231445312, 0.10739326477050781, 0.1126861572265625, 0.11797904968261719, 0.12327194213867188, 0.12856483459472656, 0.13385772705078125, 0.13915061950683594, 0.14444351196289062, 0.1497364044189453, 0.155029296875]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 4.0, 1.0, 5.0, 3.0, 3.0, 4.0, 4.0, 4.0, 10.0, 7.0, 18.0, 18.0, 16.0, 19.0, 39.0, 46.0, 46.0, 71.0, 105.0, 184.0, 101.0, 63.0, 51.0, 42.0, 26.0, 26.0, 15.0, 14.0, 19.0, 8.0, 1.0, 7.0, 3.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.058624267578125, -0.057106971740722656, -0.05558967590332031, -0.05407238006591797, -0.052555084228515625, -0.05103778839111328, -0.04952049255371094, -0.048003196716308594, -0.04648590087890625, -0.044968605041503906, -0.04345130920410156, -0.04193401336669922, -0.040416717529296875, -0.03889942169189453, -0.03738212585449219, -0.035864830017089844, -0.0343475341796875, -0.032830238342285156, -0.03131294250488281, -0.02979564666748047, -0.028278350830078125, -0.02676105499267578, -0.025243759155273438, -0.023726463317871094, -0.02220916748046875, -0.020691871643066406, -0.019174575805664062, -0.01765727996826172, -0.016139984130859375, -0.014622688293457031, -0.013105392456054688, -0.011588096618652344, -0.01007080078125, -0.008553504943847656, -0.0070362091064453125, -0.005518913269042969, -0.004001617431640625, -0.0024843215942382812, -0.0009670257568359375, 0.0005502700805664062, 0.00206756591796875, 0.0035848617553710938, 0.0051021575927734375, 0.006619453430175781, 0.008136749267578125, 0.009654045104980469, 0.011171340942382812, 0.012688636779785156, 0.0142059326171875, 0.015723228454589844, 0.017240524291992188, 0.01875782012939453, 0.020275115966796875, 0.02179241180419922, 0.023309707641601562, 0.024827003479003906, 0.02634429931640625, 0.027861595153808594, 0.029378890991210938, 0.03089618682861328, 0.032413482666015625, 0.03393077850341797, 0.03544807434082031, 0.036965370178222656, 0.038482666015625]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 5.0, 7.0, 4.0, 5.0, 16.0, 27.0, 24.0, 51.0, 66.0, 120.0, 246.0, 922.0, 17385.0, 1017380.0, 11001.0, 731.0, 212.0, 111.0, 62.0, 46.0, 32.0, 26.0, 14.0, 12.0, 12.0, 3.0, 6.0, 6.0, 1.0, 4.0, 4.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.79345703125, -0.7622756958007812, -0.7310943603515625, -0.6999130249023438, -0.668731689453125, -0.6375503540039062, -0.6063690185546875, -0.5751876831054688, -0.54400634765625, -0.5128250122070312, -0.4816436767578125, -0.45046234130859375, -0.419281005859375, -0.38809967041015625, -0.3569183349609375, -0.32573699951171875, -0.2945556640625, -0.26337432861328125, -0.2321929931640625, -0.20101165771484375, -0.169830322265625, -0.13864898681640625, -0.1074676513671875, -0.07628631591796875, -0.04510498046875, -0.01392364501953125, 0.0172576904296875, 0.04843902587890625, 0.079620361328125, 0.11080169677734375, 0.1419830322265625, 0.17316436767578125, 0.204345703125, 0.23552703857421875, 0.2667083740234375, 0.29788970947265625, 0.329071044921875, 0.36025238037109375, 0.3914337158203125, 0.42261505126953125, 0.45379638671875, 0.48497772216796875, 0.5161590576171875, 0.5473403930664062, 0.578521728515625, 0.6097030639648438, 0.6408843994140625, 0.6720657348632812, 0.7032470703125, 0.7344284057617188, 0.7656097412109375, 0.7967910766601562, 0.827972412109375, 0.8591537475585938, 0.8903350830078125, 0.9215164184570312, 0.95269775390625, 0.9838790893554688, 1.0150604248046875, 1.0462417602539062, 1.077423095703125, 1.1086044311523438, 1.1397857666015625, 1.1709671020507812, 1.2021484375]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 8.0, 18.0, 25.0, 91.0, 276.0, 455.0, 104.0, 20.0, 8.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5164682865142822, -0.5065786838531494, -0.4966890811920166, -0.4867994785308838, -0.476909875869751, -0.46702027320861816, -0.45713067054748535, -0.44724106788635254, -0.4373514652252197, -0.4274618625640869, -0.4175722599029541, -0.4076826572418213, -0.3977930545806885, -0.38790345191955566, -0.37801384925842285, -0.36812424659729004, -0.3582346439361572, -0.3483450412750244, -0.3384554386138916, -0.3285658359527588, -0.318676233291626, -0.30878663063049316, -0.29889702796936035, -0.28900742530822754, -0.2791178226470947, -0.2692282199859619, -0.2593386173248291, -0.2494490146636963, -0.23955941200256348, -0.22966980934143066, -0.21978020668029785, -0.20989060401916504, -0.20000098645687103, -0.19011138379573822, -0.1802217811346054, -0.1703321784734726, -0.16044257581233978, -0.15055297315120697, -0.14066337049007416, -0.13077376782894135, -0.12088416516780853, -0.11099456250667572, -0.10110495984554291, -0.0912153571844101, -0.08132575452327728, -0.07143615186214447, -0.06154654920101166, -0.051656946539878845, -0.04176734387874603, -0.03187774121761322, -0.021988138556480408, -0.012098535895347595, -0.0022089332342147827, 0.00768066942691803, 0.017570272088050842, 0.027459874749183655, 0.03734947741031647, 0.04723908007144928, 0.05712868273258209, 0.0670182853937149, 0.07690788805484772, 0.08679749071598053, 0.09668709337711334, 0.10657669603824615, 0.11646629869937897]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 3.0, 4.0, 7.0, 4.0, 6.0, 6.0, 7.0, 7.0, 12.0, 10.0, 20.0, 26.0, 20.0, 23.0, 27.0, 30.0, 31.0, 17.0, 22.0, 34.0, 36.0, 41.0, 43.0, 28.0, 47.0, 33.0, 21.0, 40.0, 44.0, 24.0, 31.0, 31.0, 31.0, 28.0, 27.0, 21.0, 24.0, 18.0, 19.0, 28.0, 13.0, 15.0, 11.0, 4.0, 10.0, 5.0, 6.0, 3.0, 3.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.06097853183746338, -0.058819644153118134, -0.05666075646877289, -0.054501865059137344, -0.0523429773747921, -0.050184089690446854, -0.04802519828081131, -0.045866310596466064, -0.04370742291212082, -0.041548535227775574, -0.03938964754343033, -0.037230756133794785, -0.03507186844944954, -0.032912980765104294, -0.0307540912181139, -0.028595201671123505, -0.02643631398677826, -0.024277426302433014, -0.02211853675544262, -0.019959647208452225, -0.01780075952410698, -0.015641871839761734, -0.01348298229277134, -0.01132409367710352, -0.0091652050614357, -0.0070063164457678795, -0.0048474278301000595, -0.0026885392144322395, -0.0005296505987644196, 0.0016292380169034004, 0.0037881266325712204, 0.00594701524823904, 0.00810590386390686, 0.01026479247957468, 0.0124236810952425, 0.01458256971091032, 0.01674145832657814, 0.018900346010923386, 0.02105923555791378, 0.023218125104904175, 0.02537701278924942, 0.027535900473594666, 0.02969479002058506, 0.031853679567575455, 0.0340125672519207, 0.036171454936265945, 0.03833034634590149, 0.040489234030246735, 0.04264812171459198, 0.044807009398937225, 0.04696589708328247, 0.049124788492918015, 0.05128367617726326, 0.053442563861608505, 0.05560145527124405, 0.057760342955589294, 0.05991923063993454, 0.062078118324279785, 0.06423700600862503, 0.06639589369297028, 0.06855478882789612, 0.07071367651224136, 0.07287256419658661, 0.07503145188093185, 0.0771903395652771]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 4.0, 6.0, 9.0, 7.0, 10.0, 6.0, 13.0, 10.0, 24.0, 28.0, 14.0, 23.0, 28.0, 30.0, 22.0, 30.0, 32.0, 31.0, 33.0, 44.0, 33.0, 35.0, 50.0, 31.0, 42.0, 42.0, 38.0, 46.0, 31.0, 27.0, 21.0, 33.0, 28.0, 15.0, 29.0, 19.0, 16.0, 8.0, 4.0, 9.0, 5.0, 9.0, 4.0, 6.0, 2.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-2.998046875, -2.904510498046875, -2.81097412109375, -2.717437744140625, -2.6239013671875, -2.530364990234375, -2.43682861328125, -2.343292236328125, -2.249755859375, -2.156219482421875, -2.06268310546875, -1.969146728515625, -1.8756103515625, -1.782073974609375, -1.68853759765625, -1.595001220703125, -1.50146484375, -1.407928466796875, -1.31439208984375, -1.220855712890625, -1.1273193359375, -1.033782958984375, -0.94024658203125, -0.846710205078125, -0.753173828125, -0.659637451171875, -0.56610107421875, -0.472564697265625, -0.3790283203125, -0.285491943359375, -0.19195556640625, -0.098419189453125, -0.0048828125, 0.088653564453125, 0.18218994140625, 0.275726318359375, 0.3692626953125, 0.462799072265625, 0.55633544921875, 0.649871826171875, 0.743408203125, 0.836944580078125, 0.93048095703125, 1.024017333984375, 1.1175537109375, 1.211090087890625, 1.30462646484375, 1.398162841796875, 1.49169921875, 1.585235595703125, 1.67877197265625, 1.772308349609375, 1.8658447265625, 1.959381103515625, 2.05291748046875, 2.146453857421875, 2.239990234375, 2.333526611328125, 2.42706298828125, 2.520599365234375, 2.6141357421875, 2.707672119140625, 2.80120849609375, 2.894744873046875, 2.98828125]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 7.0, 13.0, 20.0, 15.0, 36.0, 50.0, 62.0, 77.0, 130.0, 184.0, 268.0, 405.0, 613.0, 1002.0, 1519.0, 2400.0, 3807.0, 6093.0, 9702.0, 15754.0, 26589.0, 47522.0, 89679.0, 185123.0, 311018.0, 161502.0, 79088.0, 42665.0, 24316.0, 14463.0, 8927.0, 5644.0, 3537.0, 2223.0, 1397.0, 918.0, 572.0, 379.0, 271.0, 177.0, 129.0, 95.0, 63.0, 32.0, 24.0, 13.0, 16.0, 7.0, 10.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-2.171875, -2.10687255859375, -2.0418701171875, -1.97686767578125, -1.911865234375, -1.84686279296875, -1.7818603515625, -1.71685791015625, -1.65185546875, -1.58685302734375, -1.5218505859375, -1.45684814453125, -1.391845703125, -1.32684326171875, -1.2618408203125, -1.19683837890625, -1.1318359375, -1.06683349609375, -1.0018310546875, -0.93682861328125, -0.871826171875, -0.80682373046875, -0.7418212890625, -0.67681884765625, -0.61181640625, -0.54681396484375, -0.4818115234375, -0.41680908203125, -0.351806640625, -0.28680419921875, -0.2218017578125, -0.15679931640625, -0.091796875, -0.02679443359375, 0.0382080078125, 0.10321044921875, 0.168212890625, 0.23321533203125, 0.2982177734375, 0.36322021484375, 0.42822265625, 0.49322509765625, 0.5582275390625, 0.62322998046875, 0.688232421875, 0.75323486328125, 0.8182373046875, 0.88323974609375, 0.9482421875, 1.01324462890625, 1.0782470703125, 1.14324951171875, 1.208251953125, 1.27325439453125, 1.3382568359375, 1.40325927734375, 1.46826171875, 1.53326416015625, 1.5982666015625, 1.66326904296875, 1.728271484375, 1.79327392578125, 1.8582763671875, 1.92327880859375, 1.98828125]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 0.0, 2.0, 2.0, 8.0, 7.0, 8.0, 10.0, 6.0, 15.0, 15.0, 16.0, 21.0, 22.0, 32.0, 26.0, 41.0, 30.0, 30.0, 56.0, 56.0, 68.0, 149.0, 1447.0, 351.0, 132.0, 81.0, 61.0, 56.0, 32.0, 36.0, 25.0, 35.0, 27.0, 19.0, 28.0, 15.0, 16.0, 12.0, 17.0, 12.0, 4.0, 9.0, 4.0, 6.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-12.1015625, -11.7342529296875, -11.366943359375, -10.9996337890625, -10.63232421875, -10.2650146484375, -9.897705078125, -9.5303955078125, -9.1630859375, -8.7957763671875, -8.428466796875, -8.0611572265625, -7.69384765625, -7.3265380859375, -6.959228515625, -6.5919189453125, -6.224609375, -5.8572998046875, -5.489990234375, -5.1226806640625, -4.75537109375, -4.3880615234375, -4.020751953125, -3.6534423828125, -3.2861328125, -2.9188232421875, -2.551513671875, -2.1842041015625, -1.81689453125, -1.4495849609375, -1.082275390625, -0.7149658203125, -0.34765625, 0.0196533203125, 0.386962890625, 0.7542724609375, 1.12158203125, 1.4888916015625, 1.856201171875, 2.2235107421875, 2.5908203125, 2.9581298828125, 3.325439453125, 3.6927490234375, 4.06005859375, 4.4273681640625, 4.794677734375, 5.1619873046875, 5.529296875, 5.8966064453125, 6.263916015625, 6.6312255859375, 6.99853515625, 7.3658447265625, 7.733154296875, 8.1004638671875, 8.4677734375, 8.8350830078125, 9.202392578125, 9.5697021484375, 9.93701171875, 10.3043212890625, 10.671630859375, 11.0389404296875, 11.40625]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 7.0, 6.0, 15.0, 18.0, 24.0, 40.0, 67.0, 82.0, 155.0, 240.0, 490.0, 1435.0, 39446.0, 3091013.0, 10754.0, 983.0, 399.0, 169.0, 131.0, 77.0, 48.0, 32.0, 31.0, 11.0, 13.0, 11.0, 3.0, 1.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-49.84375, -48.577880859375, -47.31201171875, -46.046142578125, -44.7802734375, -43.514404296875, -42.24853515625, -40.982666015625, -39.716796875, -38.450927734375, -37.18505859375, -35.919189453125, -34.6533203125, -33.387451171875, -32.12158203125, -30.855712890625, -29.58984375, -28.323974609375, -27.05810546875, -25.792236328125, -24.5263671875, -23.260498046875, -21.99462890625, -20.728759765625, -19.462890625, -18.197021484375, -16.93115234375, -15.665283203125, -14.3994140625, -13.133544921875, -11.86767578125, -10.601806640625, -9.3359375, -8.070068359375, -6.80419921875, -5.538330078125, -4.2724609375, -3.006591796875, -1.74072265625, -0.474853515625, 0.791015625, 2.056884765625, 3.32275390625, 4.588623046875, 5.8544921875, 7.120361328125, 8.38623046875, 9.652099609375, 10.91796875, 12.183837890625, 13.44970703125, 14.715576171875, 15.9814453125, 17.247314453125, 18.51318359375, 19.779052734375, 21.044921875, 22.310791015625, 23.57666015625, 24.842529296875, 26.1083984375, 27.374267578125, 28.64013671875, 29.906005859375, 31.171875]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [21.0, 233.0, 549.0, 192.0, 20.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.597906112670898, -4.626360893249512, -1.6548161506652832, 1.3167285919189453, 4.288273811340332, 7.259819030761719, 10.231363296508789, 13.202909469604492, 16.174453735351562, 19.145998001098633, 22.117544174194336, 25.089088439941406, 28.06063461303711, 31.03217887878418, 34.00372314453125, 36.97526931762695, 39.946815490722656, 42.91836166381836, 45.8899040222168, 48.8614501953125, 51.8329963684082, 54.804542541503906, 57.776084899902344, 60.74763107299805, 63.719173431396484, 66.69071960449219, 69.66226196289062, 72.63380432128906, 75.60535430908203, 78.57689666748047, 81.54844665527344, 84.51998901367188, 87.49153900146484, 90.46308135986328, 93.43463134765625, 96.40617370605469, 99.37771606445312, 102.3492660522461, 105.32080841064453, 108.2923583984375, 111.26390075683594, 114.23544311523438, 117.20699310302734, 120.17853546142578, 123.15007781982422, 126.12162780761719, 129.09317016601562, 132.06471252441406, 135.0362548828125, 138.00779724121094, 140.97933959960938, 143.95089721679688, 146.9224395751953, 149.89398193359375, 152.8655242919922, 155.83706665039062, 158.80862426757812, 161.78016662597656, 164.751708984375, 167.7232666015625, 170.69480895996094, 173.66635131835938, 176.6378936767578, 179.60943603515625, 182.5809783935547]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 6.0, 1.0, 1.0, 4.0, 7.0, 12.0, 13.0, 20.0, 17.0, 19.0, 31.0, 23.0, 36.0, 41.0, 30.0, 51.0, 49.0, 46.0, 45.0, 36.0, 42.0, 39.0, 28.0, 35.0, 44.0, 46.0, 40.0, 30.0, 39.0, 28.0, 27.0, 23.0, 11.0, 18.0, 12.0, 19.0, 9.0, 9.0, 3.0, 4.0, 4.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-34.29036331176758, -33.1875114440918, -32.08466339111328, -30.9818115234375, -29.87895965576172, -28.77610969543457, -27.673259735107422, -26.57040786743164, -25.467557907104492, -24.364707946777344, -23.261856079101562, -22.159006118774414, -21.056156158447266, -19.953304290771484, -18.850454330444336, -17.747604370117188, -16.644752502441406, -15.541901588439941, -14.439050674438477, -13.336200714111328, -12.233349800109863, -11.130498886108398, -10.02764892578125, -8.924798011779785, -7.82194709777832, -6.7190961837768555, -5.616245746612549, -4.513395309448242, -3.4105443954467773, -2.3076934814453125, -1.2048430442810059, -0.10199260711669922, 1.0008621215820312, 2.103712797164917, 3.2065634727478027, 4.309413909912109, 5.412264823913574, 6.515115737915039, 7.617966175079346, 8.720816612243652, 9.823667526245117, 10.926518440246582, 12.029369354248047, 13.132219314575195, 14.23507022857666, 15.337921142578125, 16.440771102905273, 17.543621063232422, 18.646472930908203, 19.74932289123535, 20.852174758911133, 21.95502471923828, 23.057876586914062, 24.16072654724121, 25.26357650756836, 26.36642837524414, 27.46927833557129, 28.572128295898438, 29.67498016357422, 30.777830123901367, 31.880680084228516, 32.9835319519043, 34.08638381958008, 35.189231872558594, 36.292083740234375]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 3.0, 1.0, 9.0, 10.0, 6.0, 5.0, 9.0, 13.0, 13.0, 15.0, 25.0, 16.0, 21.0, 23.0, 38.0, 29.0, 20.0, 34.0, 27.0, 31.0, 36.0, 42.0, 39.0, 43.0, 46.0, 31.0, 34.0, 43.0, 32.0, 45.0, 30.0, 26.0, 25.0, 30.0, 29.0, 21.0, 19.0, 15.0, 14.0, 10.0, 7.0, 12.0, 6.0, 6.0, 3.0, 4.0, 2.0, 1.0, 2.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.1484375, -3.04852294921875, -2.9486083984375, -2.84869384765625, -2.748779296875, -2.64886474609375, -2.5489501953125, -2.44903564453125, -2.34912109375, -2.24920654296875, -2.1492919921875, -2.04937744140625, -1.949462890625, -1.84954833984375, -1.7496337890625, -1.64971923828125, -1.5498046875, -1.44989013671875, -1.3499755859375, -1.25006103515625, -1.150146484375, -1.05023193359375, -0.9503173828125, -0.85040283203125, -0.75048828125, -0.65057373046875, -0.5506591796875, -0.45074462890625, -0.350830078125, -0.25091552734375, -0.1510009765625, -0.05108642578125, 0.048828125, 0.14874267578125, 0.2486572265625, 0.34857177734375, 0.448486328125, 0.54840087890625, 0.6483154296875, 0.74822998046875, 0.84814453125, 0.94805908203125, 1.0479736328125, 1.14788818359375, 1.247802734375, 1.34771728515625, 1.4476318359375, 1.54754638671875, 1.6474609375, 1.74737548828125, 1.8472900390625, 1.94720458984375, 2.047119140625, 2.14703369140625, 2.2469482421875, 2.34686279296875, 2.44677734375, 2.54669189453125, 2.6466064453125, 2.74652099609375, 2.846435546875, 2.94635009765625, 3.0462646484375, 3.14617919921875, 3.24609375]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 8.0, 10.0, 14.0, 16.0, 31.0, 29.0, 45.0, 58.0, 57.0, 120.0, 148.0, 233.0, 419.0, 744.0, 1485.0, 3325.0, 7742.0, 19499.0, 52308.0, 160501.0, 576022.0, 1539903.0, 1256852.0, 396082.0, 113834.0, 38895.0, 14603.0, 6027.0, 2473.0, 1196.0, 591.0, 356.0, 227.0, 115.0, 73.0, 62.0, 53.0, 34.0, 27.0, 14.0, 12.0, 8.0, 11.0, 6.0, 3.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0], "bins": [-5.09375, -4.933837890625, -4.77392578125, -4.614013671875, -4.4541015625, -4.294189453125, -4.13427734375, -3.974365234375, -3.814453125, -3.654541015625, -3.49462890625, -3.334716796875, -3.1748046875, -3.014892578125, -2.85498046875, -2.695068359375, -2.53515625, -2.375244140625, -2.21533203125, -2.055419921875, -1.8955078125, -1.735595703125, -1.57568359375, -1.415771484375, -1.255859375, -1.095947265625, -0.93603515625, -0.776123046875, -0.6162109375, -0.456298828125, -0.29638671875, -0.136474609375, 0.0234375, 0.183349609375, 0.34326171875, 0.503173828125, 0.6630859375, 0.822998046875, 0.98291015625, 1.142822265625, 1.302734375, 1.462646484375, 1.62255859375, 1.782470703125, 1.9423828125, 2.102294921875, 2.26220703125, 2.422119140625, 2.58203125, 2.741943359375, 2.90185546875, 3.061767578125, 3.2216796875, 3.381591796875, 3.54150390625, 3.701416015625, 3.861328125, 4.021240234375, 4.18115234375, 4.341064453125, 4.5009765625, 4.660888671875, 4.82080078125, 4.980712890625, 5.140625]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 7.0, 8.0, 9.0, 17.0, 18.0, 22.0, 30.0, 41.0, 51.0, 57.0, 85.0, 114.0, 138.0, 166.0, 250.0, 364.0, 364.0, 383.0, 364.0, 320.0, 291.0, 251.0, 170.0, 127.0, 98.0, 87.0, 72.0, 41.0, 34.0, 23.0, 16.0, 16.0, 10.0, 7.0, 6.0, 8.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.4140625, -7.173583984375, -6.93310546875, -6.692626953125, -6.4521484375, -6.211669921875, -5.97119140625, -5.730712890625, -5.490234375, -5.249755859375, -5.00927734375, -4.768798828125, -4.5283203125, -4.287841796875, -4.04736328125, -3.806884765625, -3.56640625, -3.325927734375, -3.08544921875, -2.844970703125, -2.6044921875, -2.364013671875, -2.12353515625, -1.883056640625, -1.642578125, -1.402099609375, -1.16162109375, -0.921142578125, -0.6806640625, -0.440185546875, -0.19970703125, 0.040771484375, 0.28125, 0.521728515625, 0.76220703125, 1.002685546875, 1.2431640625, 1.483642578125, 1.72412109375, 1.964599609375, 2.205078125, 2.445556640625, 2.68603515625, 2.926513671875, 3.1669921875, 3.407470703125, 3.64794921875, 3.888427734375, 4.12890625, 4.369384765625, 4.60986328125, 4.850341796875, 5.0908203125, 5.331298828125, 5.57177734375, 5.812255859375, 6.052734375, 6.293212890625, 6.53369140625, 6.774169921875, 7.0146484375, 7.255126953125, 7.49560546875, 7.736083984375, 7.9765625]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 5.0, 0.0, 0.0, 6.0, 2.0, 5.0, 10.0, 11.0, 16.0, 18.0, 16.0, 27.0, 38.0, 59.0, 32.0, 65.0, 99.0, 142.0, 218.0, 338.0, 722.0, 2426.0, 13896.0, 138137.0, 2009092.0, 1882960.0, 128962.0, 12811.0, 2309.0, 737.0, 345.0, 209.0, 139.0, 110.0, 81.0, 63.0, 38.0, 42.0, 26.0, 20.0, 16.0, 12.0, 7.0, 4.0, 4.0, 3.0, 1.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.328125, -16.786376953125, -16.24462890625, -15.702880859375, -15.1611328125, -14.619384765625, -14.07763671875, -13.535888671875, -12.994140625, -12.452392578125, -11.91064453125, -11.368896484375, -10.8271484375, -10.285400390625, -9.74365234375, -9.201904296875, -8.66015625, -8.118408203125, -7.57666015625, -7.034912109375, -6.4931640625, -5.951416015625, -5.40966796875, -4.867919921875, -4.326171875, -3.784423828125, -3.24267578125, -2.700927734375, -2.1591796875, -1.617431640625, -1.07568359375, -0.533935546875, 0.0078125, 0.549560546875, 1.09130859375, 1.633056640625, 2.1748046875, 2.716552734375, 3.25830078125, 3.800048828125, 4.341796875, 4.883544921875, 5.42529296875, 5.967041015625, 6.5087890625, 7.050537109375, 7.59228515625, 8.134033203125, 8.67578125, 9.217529296875, 9.75927734375, 10.301025390625, 10.8427734375, 11.384521484375, 11.92626953125, 12.468017578125, 13.009765625, 13.551513671875, 14.09326171875, 14.635009765625, 15.1767578125, 15.718505859375, 16.26025390625, 16.802001953125, 17.34375]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 5.0, 15.0, 39.0, 82.0, 128.0, 188.0, 198.0, 154.0, 119.0, 48.0, 26.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-106.10188293457031, -103.64897155761719, -101.1960678100586, -98.74315643310547, -96.29024505615234, -93.83733367919922, -91.38442993164062, -88.9315185546875, -86.47860717773438, -84.02569580078125, -81.57279205322266, -79.11988067626953, -76.6669692993164, -74.21405792236328, -71.76115417480469, -69.30824279785156, -66.85533142089844, -64.40242004394531, -61.94951248168945, -59.496604919433594, -57.04369354248047, -54.59078598022461, -52.13787841796875, -49.684967041015625, -47.23206329345703, -44.77915573120117, -42.32624435424805, -39.87333679199219, -37.42042541503906, -34.9675178527832, -32.514610290527344, -30.06169891357422, -27.608787536621094, -25.1558780670166, -22.70296859741211, -20.25006103515625, -17.797149658203125, -15.34424114227295, -12.891332626342773, -10.438423156738281, -7.985513687133789, -5.532604217529297, -3.079695224761963, -0.6267862319946289, 1.8261232376098633, 4.2790327072143555, 6.731941223144531, 9.184850692749023, 11.637760162353516, 14.090669631958008, 16.5435791015625, 18.99648666381836, 21.449398040771484, 23.902305603027344, 26.355215072631836, 28.808124542236328, 31.26103401184082, 33.71394348144531, 36.16685104370117, 38.6197624206543, 41.072669982910156, 43.52558135986328, 45.97848892211914, 48.431396484375, 50.884307861328125]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 7.0, 3.0, 2.0, 2.0, 9.0, 15.0, 10.0, 9.0, 13.0, 13.0, 14.0, 19.0, 24.0, 29.0, 29.0, 26.0, 31.0, 35.0, 31.0, 34.0, 35.0, 34.0, 42.0, 48.0, 40.0, 46.0, 41.0, 34.0, 40.0, 26.0, 27.0, 31.0, 25.0, 26.0, 19.0, 24.0, 24.0, 19.0, 11.0, 8.0, 9.0, 11.0, 4.0, 8.0, 6.0, 7.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-24.620132446289062, -23.839879989624023, -23.059629440307617, -22.279376983642578, -21.499126434326172, -20.718873977661133, -19.938621520996094, -19.158370971679688, -18.37811851501465, -17.59786605834961, -16.817615509033203, -16.037363052368164, -15.257111549377441, -14.476860046386719, -13.69660758972168, -12.916356086730957, -12.136104583740234, -11.355853080749512, -10.575601577758789, -9.79534912109375, -9.015097618103027, -8.234846115112305, -7.454594135284424, -6.674342155456543, -5.89409065246582, -5.113839149475098, -4.333587169647217, -3.553335428237915, -2.7730836868286133, -1.9928319454193115, -1.2125802040100098, -0.4323282241821289, 0.34792327880859375, 1.1281750202178955, 1.9084267616271973, 2.688678503036499, 3.468930244445801, 4.249181747436523, 5.029433727264404, 5.809685707092285, 6.589937210083008, 7.3701887130737305, 8.150440216064453, 8.930692672729492, 9.710944175720215, 10.491195678710938, 11.271448135375977, 12.0516996383667, 12.831951141357422, 13.612202644348145, 14.392454147338867, 15.172706604003906, 15.952958106994629, 16.73320960998535, 17.51346206665039, 18.293712615966797, 19.073965072631836, 19.854217529296875, 20.63446807861328, 21.41472053527832, 22.19497299194336, 22.975223541259766, 23.755475997924805, 24.535728454589844, 25.31597900390625]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 5.0, 7.0, 6.0, 6.0, 6.0, 11.0, 9.0, 9.0, 20.0, 17.0, 23.0, 26.0, 24.0, 23.0, 30.0, 28.0, 27.0, 34.0, 36.0, 34.0, 38.0, 30.0, 43.0, 38.0, 47.0, 52.0, 43.0, 36.0, 28.0, 29.0, 25.0, 26.0, 20.0, 31.0, 17.0, 27.0, 15.0, 16.0, 8.0, 10.0, 11.0, 11.0, 6.0, 4.0, 1.0, 4.0, 0.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.158203125, -3.0555419921875, -2.952880859375, -2.8502197265625, -2.74755859375, -2.6448974609375, -2.542236328125, -2.4395751953125, -2.3369140625, -2.2342529296875, -2.131591796875, -2.0289306640625, -1.92626953125, -1.8236083984375, -1.720947265625, -1.6182861328125, -1.515625, -1.4129638671875, -1.310302734375, -1.2076416015625, -1.10498046875, -1.0023193359375, -0.899658203125, -0.7969970703125, -0.6943359375, -0.5916748046875, -0.489013671875, -0.3863525390625, -0.28369140625, -0.1810302734375, -0.078369140625, 0.0242919921875, 0.126953125, 0.2296142578125, 0.332275390625, 0.4349365234375, 0.53759765625, 0.6402587890625, 0.742919921875, 0.8455810546875, 0.9482421875, 1.0509033203125, 1.153564453125, 1.2562255859375, 1.35888671875, 1.4615478515625, 1.564208984375, 1.6668701171875, 1.76953125, 1.8721923828125, 1.974853515625, 2.0775146484375, 2.18017578125, 2.2828369140625, 2.385498046875, 2.4881591796875, 2.5908203125, 2.6934814453125, 2.796142578125, 2.8988037109375, 3.00146484375, 3.1041259765625, 3.206787109375, 3.3094482421875, 3.412109375]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 4.0, 4.0, 13.0, 16.0, 19.0, 39.0, 40.0, 78.0, 135.0, 229.0, 426.0, 700.0, 1237.0, 2271.0, 4773.0, 9334.0, 19906.0, 40820.0, 84250.0, 164669.0, 254446.0, 221316.0, 123874.0, 61522.0, 29835.0, 14226.0, 6863.0, 3541.0, 1687.0, 969.0, 514.0, 282.0, 191.0, 113.0, 75.0, 46.0, 31.0, 24.0, 19.0, 10.0, 6.0, 1.0, 4.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5009765625, -0.482269287109375, -0.46356201171875, -0.444854736328125, -0.4261474609375, -0.407440185546875, -0.38873291015625, -0.370025634765625, -0.351318359375, -0.332611083984375, -0.31390380859375, -0.295196533203125, -0.2764892578125, -0.257781982421875, -0.23907470703125, -0.220367431640625, -0.20166015625, -0.182952880859375, -0.16424560546875, -0.145538330078125, -0.1268310546875, -0.108123779296875, -0.08941650390625, -0.070709228515625, -0.052001953125, -0.033294677734375, -0.01458740234375, 0.004119873046875, 0.0228271484375, 0.041534423828125, 0.06024169921875, 0.078948974609375, 0.09765625, 0.116363525390625, 0.13507080078125, 0.153778076171875, 0.1724853515625, 0.191192626953125, 0.20989990234375, 0.228607177734375, 0.247314453125, 0.266021728515625, 0.28472900390625, 0.303436279296875, 0.3221435546875, 0.340850830078125, 0.35955810546875, 0.378265380859375, 0.39697265625, 0.415679931640625, 0.43438720703125, 0.453094482421875, 0.4718017578125, 0.490509033203125, 0.50921630859375, 0.527923583984375, 0.546630859375, 0.565338134765625, 0.58404541015625, 0.602752685546875, 0.6214599609375, 0.640167236328125, 0.65887451171875, 0.677581787109375, 0.6962890625]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 8.0, 7.0, 7.0, 11.0, 16.0, 15.0, 19.0, 18.0, 17.0, 27.0, 22.0, 27.0, 25.0, 34.0, 50.0, 30.0, 30.0, 53.0, 43.0, 1074.0, 37.0, 48.0, 40.0, 40.0, 36.0, 46.0, 23.0, 33.0, 28.0, 28.0, 29.0, 12.0, 12.0, 15.0, 20.0, 9.0, 8.0, 8.0, 4.0, 4.0, 7.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.45703125, -2.38250732421875, -2.3079833984375, -2.23345947265625, -2.158935546875, -2.08441162109375, -2.0098876953125, -1.93536376953125, -1.86083984375, -1.78631591796875, -1.7117919921875, -1.63726806640625, -1.562744140625, -1.48822021484375, -1.4136962890625, -1.33917236328125, -1.2646484375, -1.19012451171875, -1.1156005859375, -1.04107666015625, -0.966552734375, -0.89202880859375, -0.8175048828125, -0.74298095703125, -0.66845703125, -0.59393310546875, -0.5194091796875, -0.44488525390625, -0.370361328125, -0.29583740234375, -0.2213134765625, -0.14678955078125, -0.072265625, 0.00225830078125, 0.0767822265625, 0.15130615234375, 0.225830078125, 0.30035400390625, 0.3748779296875, 0.44940185546875, 0.52392578125, 0.59844970703125, 0.6729736328125, 0.74749755859375, 0.822021484375, 0.89654541015625, 0.9710693359375, 1.04559326171875, 1.1201171875, 1.19464111328125, 1.2691650390625, 1.34368896484375, 1.418212890625, 1.49273681640625, 1.5672607421875, 1.64178466796875, 1.71630859375, 1.79083251953125, 1.8653564453125, 1.93988037109375, 2.014404296875, 2.08892822265625, 2.1634521484375, 2.23797607421875, 2.3125]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 7.0, 6.0, 9.0, 14.0, 14.0, 24.0, 33.0, 69.0, 67.0, 111.0, 166.0, 242.0, 339.0, 508.0, 765.0, 1121.0, 1662.0, 2587.0, 3800.0, 6040.0, 9266.0, 14590.0, 22394.0, 34517.0, 52204.0, 77268.0, 108359.0, 188398.0, 1108713.0, 153778.0, 100699.0, 71538.0, 48216.0, 31375.0, 20406.0, 13217.0, 8737.0, 5534.0, 3414.0, 2269.0, 1525.0, 1024.0, 658.0, 479.0, 319.0, 227.0, 133.0, 94.0, 66.0, 44.0, 33.0, 22.0, 7.0, 12.0, 9.0, 7.0, 2.0, 5.0, 4.0, 1.0, 1.0], "bins": [-0.194091796875, -0.1879100799560547, -0.18172836303710938, -0.17554664611816406, -0.16936492919921875, -0.16318321228027344, -0.15700149536132812, -0.1508197784423828, -0.1446380615234375, -0.1384563446044922, -0.13227462768554688, -0.12609291076660156, -0.11991119384765625, -0.11372947692871094, -0.10754776000976562, -0.10136604309082031, -0.095184326171875, -0.08900260925292969, -0.08282089233398438, -0.07663917541503906, -0.07045745849609375, -0.06427574157714844, -0.058094024658203125, -0.05191230773925781, -0.0457305908203125, -0.03954887390136719, -0.033367156982421875, -0.027185440063476562, -0.02100372314453125, -0.014822006225585938, -0.008640289306640625, -0.0024585723876953125, 0.00372314453125, 0.009904861450195312, 0.016086578369140625, 0.022268295288085938, 0.02845001220703125, 0.03463172912597656, 0.040813446044921875, 0.04699516296386719, 0.0531768798828125, 0.05935859680175781, 0.06554031372070312, 0.07172203063964844, 0.07790374755859375, 0.08408546447753906, 0.09026718139648438, 0.09644889831542969, 0.102630615234375, 0.10881233215332031, 0.11499404907226562, 0.12117576599121094, 0.12735748291015625, 0.13353919982910156, 0.13972091674804688, 0.1459026336669922, 0.1520843505859375, 0.1582660675048828, 0.16444778442382812, 0.17062950134277344, 0.17681121826171875, 0.18299293518066406, 0.18917465209960938, 0.1953563690185547, 0.2015380859375]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 4.0, 3.0, 2.0, 3.0, 3.0, 1.0, 7.0, 11.0, 7.0, 16.0, 19.0, 33.0, 28.0, 40.0, 42.0, 56.0, 51.0, 45.0, 83.0, 95.0, 90.0, 50.0, 43.0, 49.0, 40.0, 37.0, 24.0, 30.0, 19.0, 14.0, 11.0, 9.0, 8.0, 2.0, 6.0, 4.0, 3.0, 2.0, 1.0, 5.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.045745849609375, -0.04437875747680664, -0.04301166534423828, -0.04164457321166992, -0.04027748107910156, -0.0389103889465332, -0.037543296813964844, -0.036176204681396484, -0.034809112548828125, -0.033442020416259766, -0.032074928283691406, -0.030707836151123047, -0.029340744018554688, -0.027973651885986328, -0.02660655975341797, -0.02523946762084961, -0.02387237548828125, -0.02250528335571289, -0.02113819122314453, -0.019771099090576172, -0.018404006958007812, -0.017036914825439453, -0.015669822692871094, -0.014302730560302734, -0.012935638427734375, -0.011568546295166016, -0.010201454162597656, -0.008834362030029297, -0.0074672698974609375, -0.006100177764892578, -0.004733085632324219, -0.0033659934997558594, -0.0019989013671875, -0.0006318092346191406, 0.0007352828979492188, 0.002102375030517578, 0.0034694671630859375, 0.004836559295654297, 0.006203651428222656, 0.007570743560791016, 0.008937835693359375, 0.010304927825927734, 0.011672019958496094, 0.013039112091064453, 0.014406204223632812, 0.015773296356201172, 0.01714038848876953, 0.01850748062133789, 0.01987457275390625, 0.02124166488647461, 0.02260875701904297, 0.023975849151611328, 0.025342941284179688, 0.026710033416748047, 0.028077125549316406, 0.029444217681884766, 0.030811309814453125, 0.032178401947021484, 0.033545494079589844, 0.0349125862121582, 0.03627967834472656, 0.03764677047729492, 0.03901386260986328, 0.04038095474243164, 0.041748046875]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 4.0, 1.0, 4.0, 6.0, 3.0, 3.0, 9.0, 5.0, 12.0, 18.0, 19.0, 31.0, 39.0, 51.0, 72.0, 104.0, 218.0, 730.0, 13905.0, 1020531.0, 11473.0, 690.0, 241.0, 105.0, 62.0, 56.0, 42.0, 34.0, 22.0, 16.0, 9.0, 8.0, 6.0, 2.0, 3.0, 3.0, 2.0, 2.0, 4.0, 7.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.89599609375, -0.8666000366210938, -0.8372039794921875, -0.8078079223632812, -0.778411865234375, -0.7490158081054688, -0.7196197509765625, -0.6902236938476562, -0.66082763671875, -0.6314315795898438, -0.6020355224609375, -0.5726394653320312, -0.543243408203125, -0.5138473510742188, -0.4844512939453125, -0.45505523681640625, -0.4256591796875, -0.39626312255859375, -0.3668670654296875, -0.33747100830078125, -0.308074951171875, -0.27867889404296875, -0.2492828369140625, -0.21988677978515625, -0.19049072265625, -0.16109466552734375, -0.1316986083984375, -0.10230255126953125, -0.072906494140625, -0.04351043701171875, -0.0141143798828125, 0.01528167724609375, 0.044677734375, 0.07407379150390625, 0.1034698486328125, 0.13286590576171875, 0.162261962890625, 0.19165802001953125, 0.2210540771484375, 0.25045013427734375, 0.27984619140625, 0.30924224853515625, 0.3386383056640625, 0.36803436279296875, 0.397430419921875, 0.42682647705078125, 0.4562225341796875, 0.48561859130859375, 0.5150146484375, 0.5444107055664062, 0.5738067626953125, 0.6032028198242188, 0.632598876953125, 0.6619949340820312, 0.6913909912109375, 0.7207870483398438, 0.75018310546875, 0.7795791625976562, 0.8089752197265625, 0.8383712768554688, 0.867767333984375, 0.8971633911132812, 0.9265594482421875, 0.9559555053710938, 0.9853515625]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 9.0, 12.0, 44.0, 110.0, 408.0, 345.0, 56.0, 17.0, 6.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47800084948539734, -0.4684353768825531, -0.45886990427970886, -0.4493044316768646, -0.4397389888763428, -0.43017351627349854, -0.4206080436706543, -0.41104257106781006, -0.4014770984649658, -0.3919116258621216, -0.38234615325927734, -0.3727806806564331, -0.36321520805358887, -0.353649765253067, -0.3440842926502228, -0.33451882004737854, -0.3249533474445343, -0.31538787484169006, -0.3058224022388458, -0.2962569296360016, -0.28669148683547974, -0.2771260142326355, -0.26756054162979126, -0.257995069026947, -0.24842959642410278, -0.23886412382125854, -0.2292986512184143, -0.21973319351673126, -0.21016772091388702, -0.20060224831104279, -0.19103679060935974, -0.1814713180065155, -0.17190583050251007, -0.16234035789966583, -0.1527749001979828, -0.14320942759513855, -0.1336439549922943, -0.12407848238945007, -0.11451301723718643, -0.10494755208492279, -0.09538207948207855, -0.08581660687923431, -0.07625114172697067, -0.06668567657470703, -0.05712020397186279, -0.04755473509430885, -0.03798926621675491, -0.028423801064491272, -0.018858328461647034, -0.009292859584093094, 0.00027260929346084595, 0.009838078171014786, 0.019403547048568726, 0.028969015926122665, 0.038534484803676605, 0.04809994995594025, 0.057665422558784485, 0.06723089516162872, 0.07679636031389236, 0.086361825466156, 0.09592729806900024, 0.10549277067184448, 0.11505823582410812, 0.12462370097637177, 0.134189173579216]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 0.0, 1.0, 6.0, 5.0, 4.0, 5.0, 12.0, 7.0, 11.0, 18.0, 16.0, 18.0, 27.0, 32.0, 26.0, 36.0, 39.0, 22.0, 34.0, 31.0, 33.0, 40.0, 62.0, 48.0, 38.0, 38.0, 42.0, 27.0, 26.0, 41.0, 24.0, 29.0, 29.0, 23.0, 29.0, 25.0, 20.0, 12.0, 18.0, 7.0, 13.0, 8.0, 8.0, 6.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.08212399482727051, -0.07944123446941376, -0.07675846666097641, -0.07407570630311966, -0.07139293849468231, -0.06871017813682556, -0.06602741777896881, -0.06334465742111206, -0.06066188961267471, -0.057979125529527664, -0.055296361446380615, -0.052613601088523865, -0.049930837005376816, -0.04724807292222977, -0.044565312564373016, -0.04188254848122597, -0.03919978439807892, -0.03651702031493187, -0.03383425623178482, -0.03115149587392807, -0.02846873179078102, -0.025785967707633972, -0.023103205487132072, -0.020420443266630173, -0.017737679183483124, -0.01505491603165865, -0.012372152879834175, -0.0096893897280097, -0.0070066265761852264, -0.004323863424360752, -0.0016411002725362778, 0.001041661947965622, 0.003724426031112671, 0.006407189182937145, 0.00908995233476162, 0.011772715486586094, 0.014455478638410568, 0.017138242721557617, 0.019821004942059517, 0.022503767162561417, 0.025186531245708466, 0.027869295328855515, 0.030552057549357414, 0.033234819769859314, 0.03591758385300636, 0.03860034793615341, 0.04128310829401016, 0.04396587237715721, 0.04664863646030426, 0.04933140054345131, 0.05201416462659836, 0.05469692498445511, 0.05737968906760216, 0.06006245315074921, 0.06274521350860596, 0.06542797386646271, 0.06811074167490005, 0.0707935020327568, 0.07347626984119415, 0.0761590301990509, 0.07884179055690765, 0.081524558365345, 0.08420731872320175, 0.0868900865316391, 0.08957284688949585]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 5.0, 7.0, 7.0, 5.0, 6.0, 11.0, 8.0, 10.0, 19.0, 18.0, 23.0, 25.0, 23.0, 24.0, 30.0, 28.0, 27.0, 35.0, 33.0, 36.0, 38.0, 29.0, 45.0, 36.0, 49.0, 51.0, 40.0, 41.0, 26.0, 30.0, 25.0, 26.0, 20.0, 30.0, 16.0, 27.0, 17.0, 15.0, 9.0, 10.0, 11.0, 10.0, 7.0, 4.0, 1.0, 4.0, 0.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.16015625, -3.057525634765625, -2.95489501953125, -2.852264404296875, -2.7496337890625, -2.647003173828125, -2.54437255859375, -2.441741943359375, -2.339111328125, -2.236480712890625, -2.13385009765625, -2.031219482421875, -1.9285888671875, -1.825958251953125, -1.72332763671875, -1.620697021484375, -1.51806640625, -1.415435791015625, -1.31280517578125, -1.210174560546875, -1.1075439453125, -1.004913330078125, -0.90228271484375, -0.799652099609375, -0.697021484375, -0.594390869140625, -0.49176025390625, -0.389129638671875, -0.2864990234375, -0.183868408203125, -0.08123779296875, 0.021392822265625, 0.1240234375, 0.226654052734375, 0.32928466796875, 0.431915283203125, 0.5345458984375, 0.637176513671875, 0.73980712890625, 0.842437744140625, 0.945068359375, 1.047698974609375, 1.15032958984375, 1.252960205078125, 1.3555908203125, 1.458221435546875, 1.56085205078125, 1.663482666015625, 1.76611328125, 1.868743896484375, 1.97137451171875, 2.074005126953125, 2.1766357421875, 2.279266357421875, 2.38189697265625, 2.484527587890625, 2.587158203125, 2.689788818359375, 2.79241943359375, 2.895050048828125, 2.9976806640625, 3.100311279296875, 3.20294189453125, 3.305572509765625, 3.408203125]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 10.0, 11.0, 21.0, 20.0, 35.0, 43.0, 67.0, 96.0, 126.0, 280.0, 444.0, 736.0, 1415.0, 2559.0, 5121.0, 10948.0, 23627.0, 52903.0, 129158.0, 346402.0, 288329.0, 103623.0, 43963.0, 19869.0, 9227.0, 4354.0, 2284.0, 1149.0, 682.0, 407.0, 236.0, 154.0, 85.0, 62.0, 33.0, 24.0, 14.0, 15.0, 4.0, 6.0, 8.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.328125, -4.20751953125, -4.0869140625, -3.96630859375, -3.845703125, -3.72509765625, -3.6044921875, -3.48388671875, -3.36328125, -3.24267578125, -3.1220703125, -3.00146484375, -2.880859375, -2.76025390625, -2.6396484375, -2.51904296875, -2.3984375, -2.27783203125, -2.1572265625, -2.03662109375, -1.916015625, -1.79541015625, -1.6748046875, -1.55419921875, -1.43359375, -1.31298828125, -1.1923828125, -1.07177734375, -0.951171875, -0.83056640625, -0.7099609375, -0.58935546875, -0.46875, -0.34814453125, -0.2275390625, -0.10693359375, 0.013671875, 0.13427734375, 0.2548828125, 0.37548828125, 0.49609375, 0.61669921875, 0.7373046875, 0.85791015625, 0.978515625, 1.09912109375, 1.2197265625, 1.34033203125, 1.4609375, 1.58154296875, 1.7021484375, 1.82275390625, 1.943359375, 2.06396484375, 2.1845703125, 2.30517578125, 2.42578125, 2.54638671875, 2.6669921875, 2.78759765625, 2.908203125, 3.02880859375, 3.1494140625, 3.27001953125, 3.390625]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 5.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 3.0, 4.0, 9.0, 15.0, 10.0, 13.0, 13.0, 18.0, 19.0, 30.0, 29.0, 33.0, 35.0, 38.0, 43.0, 69.0, 75.0, 133.0, 316.0, 1502.0, 140.0, 97.0, 67.0, 43.0, 43.0, 43.0, 29.0, 21.0, 27.0, 33.0, 18.0, 17.0, 16.0, 10.0, 10.0, 5.0, 2.0, 7.0, 7.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-13.8671875, -13.4085693359375, -12.949951171875, -12.4913330078125, -12.03271484375, -11.5740966796875, -11.115478515625, -10.6568603515625, -10.1982421875, -9.7396240234375, -9.281005859375, -8.8223876953125, -8.36376953125, -7.9051513671875, -7.446533203125, -6.9879150390625, -6.529296875, -6.0706787109375, -5.612060546875, -5.1534423828125, -4.69482421875, -4.2362060546875, -3.777587890625, -3.3189697265625, -2.8603515625, -2.4017333984375, -1.943115234375, -1.4844970703125, -1.02587890625, -0.5672607421875, -0.108642578125, 0.3499755859375, 0.80859375, 1.2672119140625, 1.725830078125, 2.1844482421875, 2.64306640625, 3.1016845703125, 3.560302734375, 4.0189208984375, 4.4775390625, 4.9361572265625, 5.394775390625, 5.8533935546875, 6.31201171875, 6.7706298828125, 7.229248046875, 7.6878662109375, 8.146484375, 8.6051025390625, 9.063720703125, 9.5223388671875, 9.98095703125, 10.4395751953125, 10.898193359375, 11.3568115234375, 11.8154296875, 12.2740478515625, 12.732666015625, 13.1912841796875, 13.64990234375, 14.1085205078125, 14.567138671875, 15.0257568359375, 15.484375]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 3.0, 5.0, 2.0, 3.0, 1.0, 4.0, 13.0, 9.0, 21.0, 16.0, 35.0, 42.0, 65.0, 86.0, 118.0, 221.0, 304.0, 616.0, 2973.0, 435861.0, 2698593.0, 4833.0, 797.0, 370.0, 216.0, 177.0, 93.0, 62.0, 41.0, 40.0, 24.0, 24.0, 20.0, 4.0, 5.0, 6.0, 2.0, 1.0, 1.0, 5.0, 3.0, 0.0, 1.0, 1.0], "bins": [-52.71875, -51.404052734375, -50.08935546875, -48.774658203125, -47.4599609375, -46.145263671875, -44.83056640625, -43.515869140625, -42.201171875, -40.886474609375, -39.57177734375, -38.257080078125, -36.9423828125, -35.627685546875, -34.31298828125, -32.998291015625, -31.68359375, -30.368896484375, -29.05419921875, -27.739501953125, -26.4248046875, -25.110107421875, -23.79541015625, -22.480712890625, -21.166015625, -19.851318359375, -18.53662109375, -17.221923828125, -15.9072265625, -14.592529296875, -13.27783203125, -11.963134765625, -10.6484375, -9.333740234375, -8.01904296875, -6.704345703125, -5.3896484375, -4.074951171875, -2.76025390625, -1.445556640625, -0.130859375, 1.183837890625, 2.49853515625, 3.813232421875, 5.1279296875, 6.442626953125, 7.75732421875, 9.072021484375, 10.38671875, 11.701416015625, 13.01611328125, 14.330810546875, 15.6455078125, 16.960205078125, 18.27490234375, 19.589599609375, 20.904296875, 22.218994140625, 23.53369140625, 24.848388671875, 26.1630859375, 27.477783203125, 28.79248046875, 30.107177734375, 31.421875]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 11.0, 70.0, 464.0, 410.0, 58.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.39975357055664, -19.182167053222656, -15.964580535888672, -12.746994018554688, -9.529407501220703, -6.311820983886719, -3.0942344665527344, 0.12335205078125, 3.3409385681152344, 6.558525085449219, 9.776111602783203, 12.993698120117188, 16.211284637451172, 19.428871154785156, 22.64645767211914, 25.864044189453125, 29.08163070678711, 32.299217224121094, 35.51680374145508, 38.73439025878906, 41.95197677612305, 45.16956329345703, 48.387149810791016, 51.604736328125, 54.822322845458984, 58.03990936279297, 61.25749588012695, 64.47508239746094, 67.69267272949219, 70.9102554321289, 74.12783813476562, 77.34542846679688, 80.56301879882812, 83.78060913085938, 86.9981918334961, 90.21577453613281, 93.43336486816406, 96.65095520019531, 99.86853790283203, 103.08612060546875, 106.3037109375, 109.52130126953125, 112.73888397216797, 115.95646667480469, 119.17405700683594, 122.39164733886719, 125.6092300415039, 128.82681274414062, 132.04440307617188, 135.26199340820312, 138.47958374023438, 141.69715881347656, 144.9147491455078, 148.13233947753906, 151.34991455078125, 154.5675048828125, 157.78509521484375, 161.002685546875, 164.22027587890625, 167.43785095214844, 170.6554412841797, 173.87303161621094, 177.09060668945312, 180.30819702148438, 183.52578735351562]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 7.0, 5.0, 11.0, 8.0, 16.0, 8.0, 19.0, 13.0, 23.0, 27.0, 32.0, 24.0, 31.0, 30.0, 44.0, 31.0, 35.0, 42.0, 39.0, 50.0, 37.0, 44.0, 43.0, 30.0, 43.0, 43.0, 28.0, 27.0, 21.0, 24.0, 34.0, 21.0, 19.0, 20.0, 14.0, 14.0, 11.0, 6.0, 9.0, 4.0, 5.0, 5.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-28.0926456451416, -27.120649337768555, -26.14865493774414, -25.176658630371094, -24.204662322998047, -23.232666015625, -22.260669708251953, -21.28867530822754, -20.316679000854492, -19.344682693481445, -18.37268829345703, -17.400691986083984, -16.428695678710938, -15.45669937133789, -14.48470401763916, -13.51270866394043, -12.540712356567383, -11.568716049194336, -10.596720695495605, -9.624725341796875, -8.652729034423828, -7.6807332038879395, -6.708737373352051, -5.736741542816162, -4.764745712280273, -3.7927498817443848, -2.820754051208496, -1.8487582206726074, -0.8767623901367188, 0.09523344039916992, 1.0672292709350586, 2.0392251014709473, 3.0112228393554688, 3.9832186698913574, 4.955214500427246, 5.927210330963135, 6.899206161499023, 7.871201992034912, 8.8431978225708, 9.815193176269531, 10.787189483642578, 11.759185791015625, 12.731181144714355, 13.703176498413086, 14.675172805786133, 15.64716911315918, 16.619163513183594, 17.59115982055664, 18.563156127929688, 19.535152435302734, 20.50714874267578, 21.479143142700195, 22.451139450073242, 23.42313575744629, 24.395130157470703, 25.36712646484375, 26.339122772216797, 27.311119079589844, 28.28311538696289, 29.255109786987305, 30.22710609436035, 31.1991024017334, 32.17109680175781, 33.14309310913086, 34.115089416503906]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 0.0, 3.0, 3.0, 4.0, 4.0, 3.0, 5.0, 6.0, 9.0, 14.0, 12.0, 10.0, 11.0, 18.0, 13.0, 24.0, 22.0, 30.0, 34.0, 31.0, 34.0, 43.0, 34.0, 28.0, 31.0, 26.0, 43.0, 51.0, 37.0, 52.0, 34.0, 30.0, 34.0, 40.0, 27.0, 23.0, 18.0, 24.0, 18.0, 25.0, 16.0, 17.0, 12.0, 13.0, 7.0, 8.0, 9.0, 9.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-3.28515625, -3.178497314453125, -3.07183837890625, -2.965179443359375, -2.8585205078125, -2.751861572265625, -2.64520263671875, -2.538543701171875, -2.431884765625, -2.325225830078125, -2.21856689453125, -2.111907958984375, -2.0052490234375, -1.898590087890625, -1.79193115234375, -1.685272216796875, -1.57861328125, -1.471954345703125, -1.36529541015625, -1.258636474609375, -1.1519775390625, -1.045318603515625, -0.93865966796875, -0.832000732421875, -0.725341796875, -0.618682861328125, -0.51202392578125, -0.405364990234375, -0.2987060546875, -0.192047119140625, -0.08538818359375, 0.021270751953125, 0.1279296875, 0.234588623046875, 0.34124755859375, 0.447906494140625, 0.5545654296875, 0.661224365234375, 0.76788330078125, 0.874542236328125, 0.981201171875, 1.087860107421875, 1.19451904296875, 1.301177978515625, 1.4078369140625, 1.514495849609375, 1.62115478515625, 1.727813720703125, 1.83447265625, 1.941131591796875, 2.04779052734375, 2.154449462890625, 2.2611083984375, 2.367767333984375, 2.47442626953125, 2.581085205078125, 2.687744140625, 2.794403076171875, 2.90106201171875, 3.007720947265625, 3.1143798828125, 3.221038818359375, 3.32769775390625, 3.434356689453125, 3.541015625]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 6.0, 4.0, 10.0, 3.0, 12.0, 10.0, 13.0, 20.0, 13.0, 13.0, 26.0, 28.0, 33.0, 36.0, 58.0, 108.0, 227.0, 810.0, 3777.0, 28203.0, 343624.0, 2891862.0, 858717.0, 58117.0, 6624.0, 1195.0, 303.0, 130.0, 58.0, 42.0, 29.0, 30.0, 19.0, 16.0, 19.0, 13.0, 17.0, 11.0, 9.0, 5.0, 14.0, 7.0, 2.0, 5.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.9765625, -11.5982666015625, -11.219970703125, -10.8416748046875, -10.46337890625, -10.0850830078125, -9.706787109375, -9.3284912109375, -8.9501953125, -8.5718994140625, -8.193603515625, -7.8153076171875, -7.43701171875, -7.0587158203125, -6.680419921875, -6.3021240234375, -5.923828125, -5.5455322265625, -5.167236328125, -4.7889404296875, -4.41064453125, -4.0323486328125, -3.654052734375, -3.2757568359375, -2.8974609375, -2.5191650390625, -2.140869140625, -1.7625732421875, -1.38427734375, -1.0059814453125, -0.627685546875, -0.2493896484375, 0.12890625, 0.5072021484375, 0.885498046875, 1.2637939453125, 1.64208984375, 2.0203857421875, 2.398681640625, 2.7769775390625, 3.1552734375, 3.5335693359375, 3.911865234375, 4.2901611328125, 4.66845703125, 5.0467529296875, 5.425048828125, 5.8033447265625, 6.181640625, 6.5599365234375, 6.938232421875, 7.3165283203125, 7.69482421875, 8.0731201171875, 8.451416015625, 8.8297119140625, 9.2080078125, 9.5863037109375, 9.964599609375, 10.3428955078125, 10.72119140625, 11.0994873046875, 11.477783203125, 11.8560791015625, 12.234375]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 7.0, 11.0, 17.0, 18.0, 33.0, 29.0, 48.0, 96.0, 114.0, 133.0, 193.0, 281.0, 361.0, 452.0, 469.0, 477.0, 381.0, 281.0, 188.0, 133.0, 111.0, 77.0, 45.0, 41.0, 26.0, 17.0, 14.0, 11.0, 5.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5703125, -9.275634765625, -8.98095703125, -8.686279296875, -8.3916015625, -8.096923828125, -7.80224609375, -7.507568359375, -7.212890625, -6.918212890625, -6.62353515625, -6.328857421875, -6.0341796875, -5.739501953125, -5.44482421875, -5.150146484375, -4.85546875, -4.560791015625, -4.26611328125, -3.971435546875, -3.6767578125, -3.382080078125, -3.08740234375, -2.792724609375, -2.498046875, -2.203369140625, -1.90869140625, -1.614013671875, -1.3193359375, -1.024658203125, -0.72998046875, -0.435302734375, -0.140625, 0.154052734375, 0.44873046875, 0.743408203125, 1.0380859375, 1.332763671875, 1.62744140625, 1.922119140625, 2.216796875, 2.511474609375, 2.80615234375, 3.100830078125, 3.3955078125, 3.690185546875, 3.98486328125, 4.279541015625, 4.57421875, 4.868896484375, 5.16357421875, 5.458251953125, 5.7529296875, 6.047607421875, 6.34228515625, 6.636962890625, 6.931640625, 7.226318359375, 7.52099609375, 7.815673828125, 8.1103515625, 8.405029296875, 8.69970703125, 8.994384765625, 9.2890625]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 2.0, 2.0, 3.0, 7.0, 8.0, 18.0, 14.0, 25.0, 26.0, 43.0, 58.0, 60.0, 91.0, 124.0, 176.0, 273.0, 533.0, 1583.0, 8882.0, 127176.0, 2706783.0, 1287052.0, 54196.0, 4783.0, 1033.0, 447.0, 240.0, 174.0, 105.0, 101.0, 49.0, 52.0, 45.0, 42.0, 24.0, 17.0, 9.0, 7.0, 11.0, 3.0, 0.0, 0.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.8125, -19.17041015625, -18.5283203125, -17.88623046875, -17.244140625, -16.60205078125, -15.9599609375, -15.31787109375, -14.67578125, -14.03369140625, -13.3916015625, -12.74951171875, -12.107421875, -11.46533203125, -10.8232421875, -10.18115234375, -9.5390625, -8.89697265625, -8.2548828125, -7.61279296875, -6.970703125, -6.32861328125, -5.6865234375, -5.04443359375, -4.40234375, -3.76025390625, -3.1181640625, -2.47607421875, -1.833984375, -1.19189453125, -0.5498046875, 0.09228515625, 0.734375, 1.37646484375, 2.0185546875, 2.66064453125, 3.302734375, 3.94482421875, 4.5869140625, 5.22900390625, 5.87109375, 6.51318359375, 7.1552734375, 7.79736328125, 8.439453125, 9.08154296875, 9.7236328125, 10.36572265625, 11.0078125, 11.64990234375, 12.2919921875, 12.93408203125, 13.576171875, 14.21826171875, 14.8603515625, 15.50244140625, 16.14453125, 16.78662109375, 17.4287109375, 18.07080078125, 18.712890625, 19.35498046875, 19.9970703125, 20.63916015625, 21.28125]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 14.0, 156.0, 459.0, 323.0, 63.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-108.87850189208984, -102.39380645751953, -95.90910339355469, -89.42440795898438, -82.93970489501953, -76.45500946044922, -69.97030639648438, -63.48561096191406, -57.000911712646484, -50.516212463378906, -44.03151321411133, -37.54681396484375, -31.062116622924805, -24.57741928100586, -18.09272003173828, -11.608020782470703, -5.123321533203125, 1.361377239227295, 7.846076011657715, 14.330774307250977, 20.815473556518555, 27.3001708984375, 33.78487014770508, 40.269569396972656, 46.754268646240234, 53.23896789550781, 59.72366714477539, 66.20836639404297, 72.69306182861328, 79.17776489257812, 85.66246032714844, 92.14715576171875, 98.63185119628906, 105.11654663085938, 111.60124969482422, 118.08594512939453, 124.57064819335938, 131.0553436279297, 137.5400390625, 144.02474975585938, 150.5094451904297, 156.994140625, 163.4788360595703, 169.9635467529297, 176.4482421875, 182.9329376220703, 189.41763305664062, 195.90234375, 202.38702392578125, 208.87171936035156, 215.35641479492188, 221.84112548828125, 228.32582092285156, 234.81051635742188, 241.2952117919922, 247.7799072265625, 254.26461791992188, 260.74932861328125, 267.2340087890625, 273.7187194824219, 280.2033996582031, 286.6881103515625, 293.1728210449219, 299.6575012207031, 306.1422119140625]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 3.0, 1.0, 3.0, 1.0, 8.0, 5.0, 11.0, 9.0, 9.0, 16.0, 14.0, 18.0, 19.0, 27.0, 19.0, 28.0, 36.0, 33.0, 42.0, 36.0, 45.0, 34.0, 43.0, 46.0, 33.0, 45.0, 32.0, 34.0, 36.0, 31.0, 31.0, 34.0, 22.0, 33.0, 26.0, 23.0, 16.0, 22.0, 14.0, 11.0, 9.0, 8.0, 9.0, 8.0, 9.0, 3.0, 8.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.666175842285156, -24.8515567779541, -24.036937713623047, -23.22231674194336, -22.407697677612305, -21.59307861328125, -20.778459548950195, -19.96384048461914, -19.149219512939453, -18.3346004486084, -17.519981384277344, -16.705360412597656, -15.890741348266602, -15.076122283935547, -14.261503219604492, -13.446884155273438, -12.632265090942383, -11.817646026611328, -11.003026008605957, -10.188406944274902, -9.373786926269531, -8.559167861938477, -7.744548797607422, -6.929929256439209, -6.115309715270996, -5.300690174102783, -4.48607063293457, -3.6714515686035156, -2.8568320274353027, -2.04221248626709, -1.2275934219360352, -0.41297388076782227, 0.4016456604003906, 1.216265082359314, 2.0308845043182373, 2.845503807067871, 3.660123348236084, 4.474742889404297, 5.289361953735352, 6.1039814949035645, 6.918601036071777, 7.73322057723999, 8.547840118408203, 9.362459182739258, 10.177078247070312, 10.991698265075684, 11.806317329406738, 12.62093734741211, 13.435556411743164, 14.250175476074219, 15.06479549407959, 15.879414558410645, 16.694034576416016, 17.50865364074707, 18.323272705078125, 19.13789176940918, 19.952510833740234, 20.76712989807129, 21.581748962402344, 22.39636993408203, 23.210988998413086, 24.02560806274414, 24.840227127075195, 25.65484619140625, 26.469467163085938]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 4.0, 5.0, 6.0, 9.0, 4.0, 16.0, 14.0, 12.0, 10.0, 14.0, 13.0, 17.0, 20.0, 34.0, 32.0, 32.0, 27.0, 29.0, 47.0, 38.0, 40.0, 32.0, 48.0, 39.0, 43.0, 41.0, 36.0, 32.0, 37.0, 31.0, 28.0, 15.0, 33.0, 24.0, 21.0, 20.0, 17.0, 18.0, 12.0, 7.0, 10.0, 12.0, 4.0, 7.0, 7.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.330078125, -3.22265625, -3.115234375, -3.0078125, -2.900390625, -2.79296875, -2.685546875, -2.578125, -2.470703125, -2.36328125, -2.255859375, -2.1484375, -2.041015625, -1.93359375, -1.826171875, -1.71875, -1.611328125, -1.50390625, -1.396484375, -1.2890625, -1.181640625, -1.07421875, -0.966796875, -0.859375, -0.751953125, -0.64453125, -0.537109375, -0.4296875, -0.322265625, -0.21484375, -0.107421875, 0.0, 0.107421875, 0.21484375, 0.322265625, 0.4296875, 0.537109375, 0.64453125, 0.751953125, 0.859375, 0.966796875, 1.07421875, 1.181640625, 1.2890625, 1.396484375, 1.50390625, 1.611328125, 1.71875, 1.826171875, 1.93359375, 2.041015625, 2.1484375, 2.255859375, 2.36328125, 2.470703125, 2.578125, 2.685546875, 2.79296875, 2.900390625, 3.0078125, 3.115234375, 3.22265625, 3.330078125, 3.4375, 3.544921875]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 7.0, 18.0, 21.0, 47.0, 72.0, 120.0, 193.0, 353.0, 549.0, 844.0, 1424.0, 2330.0, 3800.0, 5967.0, 9498.0, 14901.0, 23871.0, 37762.0, 58503.0, 89455.0, 129899.0, 166737.0, 159267.0, 119556.0, 80355.0, 52449.0, 33432.0, 21359.0, 13429.0, 8448.0, 5297.0, 3260.0, 2128.0, 1267.0, 780.0, 463.0, 273.0, 169.0, 111.0, 64.0, 39.0, 19.0, 14.0, 5.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.399169921875, -0.3866462707519531, -0.37412261962890625, -0.3615989685058594, -0.3490753173828125, -0.3365516662597656, -0.32402801513671875, -0.3115043640136719, -0.298980712890625, -0.2864570617675781, -0.27393341064453125, -0.2614097595214844, -0.2488861083984375, -0.23636245727539062, -0.22383880615234375, -0.21131515502929688, -0.19879150390625, -0.18626785278320312, -0.17374420166015625, -0.16122055053710938, -0.1486968994140625, -0.13617324829101562, -0.12364959716796875, -0.11112594604492188, -0.098602294921875, -0.08607864379882812, -0.07355499267578125, -0.061031341552734375, -0.0485076904296875, -0.035984039306640625, -0.02346038818359375, -0.010936737060546875, 0.0015869140625, 0.014110565185546875, 0.02663421630859375, 0.039157867431640625, 0.0516815185546875, 0.06420516967773438, 0.07672882080078125, 0.08925247192382812, 0.101776123046875, 0.11429977416992188, 0.12682342529296875, 0.13934707641601562, 0.1518707275390625, 0.16439437866210938, 0.17691802978515625, 0.18944168090820312, 0.20196533203125, 0.21448898315429688, 0.22701263427734375, 0.23953628540039062, 0.2520599365234375, 0.2645835876464844, 0.27710723876953125, 0.2896308898925781, 0.302154541015625, 0.3146781921386719, 0.32720184326171875, 0.3397254943847656, 0.3522491455078125, 0.3647727966308594, 0.37729644775390625, 0.3898200988769531, 0.40234375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 9.0, 4.0, 6.0, 13.0, 11.0, 13.0, 13.0, 11.0, 24.0, 23.0, 18.0, 33.0, 31.0, 29.0, 41.0, 39.0, 49.0, 33.0, 42.0, 41.0, 1073.0, 38.0, 42.0, 45.0, 35.0, 30.0, 39.0, 38.0, 33.0, 23.0, 31.0, 19.0, 20.0, 11.0, 17.0, 13.0, 7.0, 13.0, 9.0, 7.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.361328125, -2.284759521484375, -2.20819091796875, -2.131622314453125, -2.0550537109375, -1.978485107421875, -1.90191650390625, -1.825347900390625, -1.748779296875, -1.672210693359375, -1.59564208984375, -1.519073486328125, -1.4425048828125, -1.365936279296875, -1.28936767578125, -1.212799072265625, -1.13623046875, -1.059661865234375, -0.98309326171875, -0.906524658203125, -0.8299560546875, -0.753387451171875, -0.67681884765625, -0.600250244140625, -0.523681640625, -0.447113037109375, -0.37054443359375, -0.293975830078125, -0.2174072265625, -0.140838623046875, -0.06427001953125, 0.012298583984375, 0.0888671875, 0.165435791015625, 0.24200439453125, 0.318572998046875, 0.3951416015625, 0.471710205078125, 0.54827880859375, 0.624847412109375, 0.701416015625, 0.777984619140625, 0.85455322265625, 0.931121826171875, 1.0076904296875, 1.084259033203125, 1.16082763671875, 1.237396240234375, 1.31396484375, 1.390533447265625, 1.46710205078125, 1.543670654296875, 1.6202392578125, 1.696807861328125, 1.77337646484375, 1.849945068359375, 1.926513671875, 2.003082275390625, 2.07965087890625, 2.156219482421875, 2.2327880859375, 2.309356689453125, 2.38592529296875, 2.462493896484375, 2.5390625]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 7.0, 15.0, 12.0, 39.0, 47.0, 56.0, 98.0, 148.0, 244.0, 381.0, 598.0, 930.0, 1467.0, 2290.0, 3377.0, 5472.0, 8153.0, 12880.0, 19880.0, 30100.0, 46013.0, 67563.0, 95466.0, 127210.0, 1137733.0, 181939.0, 111159.0, 80438.0, 56135.0, 37328.0, 24784.0, 16076.0, 10238.0, 6554.0, 4475.0, 2778.0, 1803.0, 1208.0, 727.0, 481.0, 327.0, 181.0, 126.0, 80.0, 49.0, 27.0, 18.0, 12.0, 10.0, 3.0, 4.0, 0.0, 1.0], "bins": [-0.2313232421875, -0.224853515625, -0.2183837890625, -0.2119140625, -0.2054443359375, -0.198974609375, -0.1925048828125, -0.18603515625, -0.1795654296875, -0.173095703125, -0.1666259765625, -0.16015625, -0.1536865234375, -0.147216796875, -0.1407470703125, -0.13427734375, -0.1278076171875, -0.121337890625, -0.1148681640625, -0.1083984375, -0.1019287109375, -0.095458984375, -0.0889892578125, -0.08251953125, -0.0760498046875, -0.069580078125, -0.0631103515625, -0.056640625, -0.0501708984375, -0.043701171875, -0.0372314453125, -0.03076171875, -0.0242919921875, -0.017822265625, -0.0113525390625, -0.0048828125, 0.0015869140625, 0.008056640625, 0.0145263671875, 0.02099609375, 0.0274658203125, 0.033935546875, 0.0404052734375, 0.046875, 0.0533447265625, 0.059814453125, 0.0662841796875, 0.07275390625, 0.0792236328125, 0.085693359375, 0.0921630859375, 0.0986328125, 0.1051025390625, 0.111572265625, 0.1180419921875, 0.12451171875, 0.1309814453125, 0.137451171875, 0.1439208984375, 0.150390625, 0.1568603515625, 0.163330078125, 0.1697998046875, 0.17626953125, 0.1827392578125]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 4.0, 0.0, 4.0, 3.0, 3.0, 7.0, 7.0, 7.0, 10.0, 11.0, 8.0, 9.0, 21.0, 30.0, 38.0, 72.0, 96.0, 78.0, 150.0, 86.0, 101.0, 64.0, 43.0, 29.0, 29.0, 16.0, 9.0, 9.0, 7.0, 16.0, 11.0, 4.0, 2.0, 4.0, 4.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0303497314453125, -0.02944183349609375, -0.028533935546875, -0.02762603759765625, -0.0267181396484375, -0.02581024169921875, -0.02490234375, -0.02399444580078125, -0.0230865478515625, -0.02217864990234375, -0.021270751953125, -0.02036285400390625, -0.0194549560546875, -0.01854705810546875, -0.01763916015625, -0.01673126220703125, -0.0158233642578125, -0.01491546630859375, -0.014007568359375, -0.01309967041015625, -0.0121917724609375, -0.01128387451171875, -0.0103759765625, -0.00946807861328125, -0.0085601806640625, -0.00765228271484375, -0.006744384765625, -0.00583648681640625, -0.0049285888671875, -0.00402069091796875, -0.00311279296875, -0.00220489501953125, -0.0012969970703125, -0.00038909912109375, 0.000518798828125, 0.00142669677734375, 0.0023345947265625, 0.00324249267578125, 0.004150390625, 0.00505828857421875, 0.0059661865234375, 0.00687408447265625, 0.007781982421875, 0.00868988037109375, 0.0095977783203125, 0.01050567626953125, 0.01141357421875, 0.01232147216796875, 0.0132293701171875, 0.01413726806640625, 0.015045166015625, 0.01595306396484375, 0.0168609619140625, 0.01776885986328125, 0.0186767578125, 0.01958465576171875, 0.0204925537109375, 0.02140045166015625, 0.022308349609375, 0.02321624755859375, 0.0241241455078125, 0.02503204345703125, 0.02593994140625, 0.02684783935546875, 0.0277557373046875]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 6.0, 4.0, 6.0, 11.0, 14.0, 11.0, 4.0, 16.0, 15.0, 27.0, 28.0, 47.0, 77.0, 185.0, 667.0, 36556.0, 1006964.0, 3293.0, 313.0, 102.0, 56.0, 27.0, 27.0, 14.0, 12.0, 11.0, 8.0, 6.0, 12.0, 7.0, 5.0, 3.0, 2.0, 6.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.6337890625, -0.6135177612304688, -0.5932464599609375, -0.5729751586914062, -0.552703857421875, -0.5324325561523438, -0.5121612548828125, -0.49188995361328125, -0.47161865234375, -0.45134735107421875, -0.4310760498046875, -0.41080474853515625, -0.390533447265625, -0.37026214599609375, -0.3499908447265625, -0.32971954345703125, -0.3094482421875, -0.28917694091796875, -0.2689056396484375, -0.24863433837890625, -0.228363037109375, -0.20809173583984375, -0.1878204345703125, -0.16754913330078125, -0.14727783203125, -0.12700653076171875, -0.1067352294921875, -0.08646392822265625, -0.066192626953125, -0.04592132568359375, -0.0256500244140625, -0.00537872314453125, 0.014892578125, 0.03516387939453125, 0.0554351806640625, 0.07570648193359375, 0.095977783203125, 0.11624908447265625, 0.1365203857421875, 0.15679168701171875, 0.17706298828125, 0.19733428955078125, 0.2176055908203125, 0.23787689208984375, 0.258148193359375, 0.27841949462890625, 0.2986907958984375, 0.31896209716796875, 0.3392333984375, 0.35950469970703125, 0.3797760009765625, 0.40004730224609375, 0.420318603515625, 0.44058990478515625, 0.4608612060546875, 0.48113250732421875, 0.50140380859375, 0.5216751098632812, 0.5419464111328125, 0.5622177124023438, 0.582489013671875, 0.6027603149414062, 0.6230316162109375, 0.6433029174804688, 0.66357421875]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 17.0, 25.0, 38.0, 62.0, 176.0, 412.0, 164.0, 67.0, 24.0, 8.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18517185747623444, -0.18128155171871185, -0.17739124596118927, -0.1735009402036667, -0.1696106344461441, -0.16572032868862152, -0.16183002293109894, -0.15793973207473755, -0.15404942631721497, -0.15015912055969238, -0.1462688148021698, -0.14237850904464722, -0.13848820328712463, -0.13459789752960205, -0.13070759177207947, -0.12681728601455688, -0.1229269802570343, -0.11903667449951172, -0.11514636874198914, -0.11125606298446655, -0.10736575722694397, -0.10347545146942139, -0.0995851531624794, -0.09569484740495682, -0.09180454164743423, -0.08791423588991165, -0.08402393013238907, -0.08013362437486649, -0.0762433260679245, -0.07235302031040192, -0.06846271455287933, -0.06457240879535675, -0.06068210303783417, -0.056791797280311584, -0.052901491522789, -0.04901118949055672, -0.045120883733034134, -0.04123057797551155, -0.037340275943279266, -0.03344997018575668, -0.0295596644282341, -0.025669358670711517, -0.021779054775834084, -0.01788875088095665, -0.013998445123434067, -0.010108139365911484, -0.00621783547103405, -0.002327531576156616, 0.0015627741813659668, 0.005453079007565975, 0.009343383833765984, 0.013233688659965992, 0.017123993486166, 0.021014299243688583, 0.024904603138566017, 0.02879490703344345, 0.032685212790966034, 0.03657551854848862, 0.0404658243060112, 0.044356126338243484, 0.04824643209576607, 0.05213673785328865, 0.056027039885520935, 0.05991734564304352, 0.0638076514005661]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 9.0, 4.0, 2.0, 9.0, 7.0, 16.0, 12.0, 16.0, 19.0, 15.0, 26.0, 23.0, 32.0, 30.0, 35.0, 27.0, 39.0, 41.0, 33.0, 44.0, 38.0, 39.0, 31.0, 44.0, 38.0, 37.0, 41.0, 34.0, 20.0, 19.0, 32.0, 25.0, 23.0, 16.0, 27.0, 17.0, 18.0, 15.0, 12.0, 8.0, 6.0, 4.0, 5.0, 4.0, 4.0, 5.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.036732017993927, -0.035495974123477936, -0.03425993025302887, -0.0330238901078701, -0.031787846237421036, -0.03055180236697197, -0.029315760359168053, -0.028079718351364136, -0.02684367448091507, -0.025607630610466003, -0.024371588602662086, -0.02313554659485817, -0.021899502724409103, -0.020663458853960037, -0.01942741684615612, -0.018191374838352203, -0.016955330967903137, -0.01571928709745407, -0.014483245089650154, -0.013247202150523663, -0.012011159211397171, -0.01077511627227068, -0.009539073333144188, -0.008303030394017696, -0.007066987454891205, -0.005830944515764713, -0.004594901576638222, -0.00335885863751173, -0.0021228156983852386, -0.0008867727592587471, 0.00034927017986774445, 0.001585313118994236, 0.0028213560581207275, 0.004057398997247219, 0.005293441936373711, 0.006529484875500202, 0.007765527814626694, 0.009001570753753185, 0.010237613692879677, 0.011473656632006168, 0.01270969957113266, 0.013945742510259151, 0.015181785449385643, 0.01641782745718956, 0.017653871327638626, 0.018889915198087692, 0.02012595720589161, 0.021361999213695526, 0.022598043084144592, 0.02383408695459366, 0.025070128962397575, 0.026306170970201492, 0.02754221484065056, 0.028778258711099625, 0.03001430071890354, 0.03125034272670746, 0.032486386597156525, 0.03372243046760559, 0.03495847433805466, 0.036194514483213425, 0.03743055835366249, 0.03866660222411156, 0.039902642369270325, 0.04113868623971939, 0.04237473011016846]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 2.0, 4.0, 5.0, 6.0, 9.0, 4.0, 16.0, 14.0, 11.0, 11.0, 15.0, 11.0, 18.0, 20.0, 34.0, 31.0, 33.0, 27.0, 29.0, 47.0, 38.0, 40.0, 31.0, 49.0, 39.0, 41.0, 43.0, 36.0, 32.0, 37.0, 31.0, 28.0, 15.0, 33.0, 24.0, 21.0, 19.0, 18.0, 18.0, 12.0, 7.0, 10.0, 12.0, 4.0, 7.0, 7.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.330078125, -3.222686767578125, -3.11529541015625, -3.007904052734375, -2.9005126953125, -2.793121337890625, -2.68572998046875, -2.578338623046875, -2.470947265625, -2.363555908203125, -2.25616455078125, -2.148773193359375, -2.0413818359375, -1.933990478515625, -1.82659912109375, -1.719207763671875, -1.61181640625, -1.504425048828125, -1.39703369140625, -1.289642333984375, -1.1822509765625, -1.074859619140625, -0.96746826171875, -0.860076904296875, -0.752685546875, -0.645294189453125, -0.53790283203125, -0.430511474609375, -0.3231201171875, -0.215728759765625, -0.10833740234375, -0.000946044921875, 0.1064453125, 0.213836669921875, 0.32122802734375, 0.428619384765625, 0.5360107421875, 0.643402099609375, 0.75079345703125, 0.858184814453125, 0.965576171875, 1.072967529296875, 1.18035888671875, 1.287750244140625, 1.3951416015625, 1.502532958984375, 1.60992431640625, 1.717315673828125, 1.82470703125, 1.932098388671875, 2.03948974609375, 2.146881103515625, 2.2542724609375, 2.361663818359375, 2.46905517578125, 2.576446533203125, 2.683837890625, 2.791229248046875, 2.89862060546875, 3.006011962890625, 3.1134033203125, 3.220794677734375, 3.32818603515625, 3.435577392578125, 3.54296875]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 5.0, 13.0, 9.0, 11.0, 20.0, 33.0, 34.0, 71.0, 123.0, 200.0, 267.0, 457.0, 677.0, 1165.0, 2017.0, 3458.0, 6011.0, 11057.0, 21813.0, 45184.0, 100755.0, 252317.0, 349702.0, 135417.0, 58506.0, 27540.0, 14101.0, 7415.0, 4133.0, 2361.0, 1415.0, 850.0, 534.0, 312.0, 217.0, 108.0, 95.0, 58.0, 35.0, 25.0, 13.0, 11.0, 6.0, 8.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.98046875, -2.8665771484375, -2.752685546875, -2.6387939453125, -2.52490234375, -2.4110107421875, -2.297119140625, -2.1832275390625, -2.0693359375, -1.9554443359375, -1.841552734375, -1.7276611328125, -1.61376953125, -1.4998779296875, -1.385986328125, -1.2720947265625, -1.158203125, -1.0443115234375, -0.930419921875, -0.8165283203125, -0.70263671875, -0.5887451171875, -0.474853515625, -0.3609619140625, -0.2470703125, -0.1331787109375, -0.019287109375, 0.0946044921875, 0.20849609375, 0.3223876953125, 0.436279296875, 0.5501708984375, 0.6640625, 0.7779541015625, 0.891845703125, 1.0057373046875, 1.11962890625, 1.2335205078125, 1.347412109375, 1.4613037109375, 1.5751953125, 1.6890869140625, 1.802978515625, 1.9168701171875, 2.03076171875, 2.1446533203125, 2.258544921875, 2.3724365234375, 2.486328125, 2.6002197265625, 2.714111328125, 2.8280029296875, 2.94189453125, 3.0557861328125, 3.169677734375, 3.2835693359375, 3.3974609375, 3.5113525390625, 3.625244140625, 3.7391357421875, 3.85302734375, 3.9669189453125, 4.080810546875, 4.1947021484375, 4.30859375]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 3.0, 3.0, 2.0, 3.0, 7.0, 8.0, 6.0, 8.0, 13.0, 21.0, 11.0, 17.0, 24.0, 30.0, 22.0, 33.0, 37.0, 38.0, 36.0, 51.0, 45.0, 63.0, 110.0, 274.0, 1461.0, 191.0, 103.0, 55.0, 50.0, 32.0, 35.0, 43.0, 25.0, 23.0, 23.0, 28.0, 19.0, 17.0, 25.0, 13.0, 17.0, 7.0, 9.0, 2.0, 5.0, 5.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-12.28125, -11.9129638671875, -11.544677734375, -11.1763916015625, -10.80810546875, -10.4398193359375, -10.071533203125, -9.7032470703125, -9.3349609375, -8.9666748046875, -8.598388671875, -8.2301025390625, -7.86181640625, -7.4935302734375, -7.125244140625, -6.7569580078125, -6.388671875, -6.0203857421875, -5.652099609375, -5.2838134765625, -4.91552734375, -4.5472412109375, -4.178955078125, -3.8106689453125, -3.4423828125, -3.0740966796875, -2.705810546875, -2.3375244140625, -1.96923828125, -1.6009521484375, -1.232666015625, -0.8643798828125, -0.49609375, -0.1278076171875, 0.240478515625, 0.6087646484375, 0.97705078125, 1.3453369140625, 1.713623046875, 2.0819091796875, 2.4501953125, 2.8184814453125, 3.186767578125, 3.5550537109375, 3.92333984375, 4.2916259765625, 4.659912109375, 5.0281982421875, 5.396484375, 5.7647705078125, 6.133056640625, 6.5013427734375, 6.86962890625, 7.2379150390625, 7.606201171875, 7.9744873046875, 8.3427734375, 8.7110595703125, 9.079345703125, 9.4476318359375, 9.81591796875, 10.1842041015625, 10.552490234375, 10.9207763671875, 11.2890625]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 8.0, 8.0, 17.0, 23.0, 38.0, 67.0, 60.0, 114.0, 164.0, 340.0, 670.0, 4433.0, 2979933.0, 156866.0, 1784.0, 487.0, 254.0, 156.0, 99.0, 57.0, 50.0, 23.0, 20.0, 15.0, 5.0, 6.0, 8.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.875, -43.4189453125, -41.962890625, -40.5068359375, -39.05078125, -37.5947265625, -36.138671875, -34.6826171875, -33.2265625, -31.7705078125, -30.314453125, -28.8583984375, -27.40234375, -25.9462890625, -24.490234375, -23.0341796875, -21.578125, -20.1220703125, -18.666015625, -17.2099609375, -15.75390625, -14.2978515625, -12.841796875, -11.3857421875, -9.9296875, -8.4736328125, -7.017578125, -5.5615234375, -4.10546875, -2.6494140625, -1.193359375, 0.2626953125, 1.71875, 3.1748046875, 4.630859375, 6.0869140625, 7.54296875, 8.9990234375, 10.455078125, 11.9111328125, 13.3671875, 14.8232421875, 16.279296875, 17.7353515625, 19.19140625, 20.6474609375, 22.103515625, 23.5595703125, 25.015625, 26.4716796875, 27.927734375, 29.3837890625, 30.83984375, 32.2958984375, 33.751953125, 35.2080078125, 36.6640625, 38.1201171875, 39.576171875, 41.0322265625, 42.48828125, 43.9443359375, 45.400390625, 46.8564453125, 48.3125]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 141.0, 653.0, 213.0, 6.0, 0.0, 2.0, 1.0, 1.0], "bins": [-216.15609741210938, -212.39772033691406, -208.63934326171875, -204.88096618652344, -201.12258911132812, -197.36422729492188, -193.60585021972656, -189.84747314453125, -186.08909606933594, -182.33071899414062, -178.5723419189453, -174.81396484375, -171.05560302734375, -167.29722595214844, -163.53884887695312, -159.7804718017578, -156.0220947265625, -152.2637176513672, -148.50534057617188, -144.74696350097656, -140.98858642578125, -137.230224609375, -133.4718475341797, -129.71347045898438, -125.95509338378906, -122.19671630859375, -118.43833923339844, -114.67996978759766, -110.92159271240234, -107.16321563720703, -103.40484619140625, -99.64646911621094, -95.8880844116211, -92.12970733642578, -88.371337890625, -84.61296081542969, -80.85458374023438, -77.09620666503906, -73.33782958984375, -69.57946014404297, -65.82108306884766, -62.062705993652344, -58.3043327331543, -54.54595947265625, -50.78758239746094, -47.029205322265625, -43.27083206176758, -39.51245880126953, -35.75408172607422, -31.99570655822754, -28.23733139038086, -24.47895622253418, -20.7205810546875, -16.96220588684082, -13.20383071899414, -9.445455551147461, -5.687082290649414, -1.9287071228027344, 1.8296680450439453, 5.588043212890625, 9.346418380737305, 13.104793548583984, 16.863168716430664, 20.621543884277344, 24.379919052124023]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 3.0, 3.0, 10.0, 11.0, 12.0, 7.0, 18.0, 13.0, 18.0, 29.0, 19.0, 35.0, 37.0, 33.0, 34.0, 54.0, 45.0, 37.0, 35.0, 46.0, 49.0, 38.0, 48.0, 46.0, 40.0, 39.0, 30.0, 35.0, 33.0, 30.0, 15.0, 24.0, 24.0, 11.0, 10.0, 5.0, 6.0, 7.0, 7.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-46.052860260009766, -44.86296463012695, -43.673072814941406, -42.483177185058594, -41.29328155517578, -40.10338592529297, -38.91349411010742, -37.72359848022461, -36.53370666503906, -35.34381103515625, -34.1539192199707, -32.96402359008789, -31.774127960205078, -30.5842342376709, -29.39434051513672, -28.204444885253906, -27.014549255371094, -25.824655532836914, -24.6347599029541, -23.444866180419922, -22.25497055053711, -21.06507682800293, -19.87518310546875, -18.685287475585938, -17.495393753051758, -16.305500030517578, -15.115604400634766, -13.925710678100586, -12.73581600189209, -11.545921325683594, -10.356027603149414, -9.166132926940918, -7.9762420654296875, -6.786347389221191, -5.5964531898498535, -4.406558990478516, -3.2166643142700195, -2.0267696380615234, -0.8368754386901855, 0.35301876068115234, 1.5429134368896484, 2.7328078746795654, 3.9227023124694824, 5.11259651184082, 6.302491188049316, 7.4923858642578125, 8.682279586791992, 9.872174263000488, 11.062068939208984, 12.25196361541748, 13.441858291625977, 14.631752014160156, 15.821646690368652, 17.01154136657715, 18.201435089111328, 19.39133071899414, 20.58122444152832, 21.7711181640625, 22.961013793945312, 24.150907516479492, 25.340801239013672, 26.530696868896484, 27.720590591430664, 28.910484313964844, 30.100379943847656]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 5.0, 1.0, 7.0, 6.0, 2.0, 7.0, 8.0, 8.0, 5.0, 11.0, 14.0, 17.0, 11.0, 27.0, 12.0, 24.0, 29.0, 26.0, 29.0, 21.0, 45.0, 34.0, 39.0, 39.0, 47.0, 35.0, 40.0, 38.0, 35.0, 38.0, 38.0, 36.0, 22.0, 28.0, 28.0, 24.0, 28.0, 20.0, 27.0, 14.0, 17.0, 8.0, 12.0, 7.0, 8.0, 3.0, 10.0, 8.0, 6.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.373046875, -3.260955810546875, -3.14886474609375, -3.036773681640625, -2.9246826171875, -2.812591552734375, -2.70050048828125, -2.588409423828125, -2.476318359375, -2.364227294921875, -2.25213623046875, -2.140045166015625, -2.0279541015625, -1.915863037109375, -1.80377197265625, -1.691680908203125, -1.57958984375, -1.467498779296875, -1.35540771484375, -1.243316650390625, -1.1312255859375, -1.019134521484375, -0.90704345703125, -0.794952392578125, -0.682861328125, -0.570770263671875, -0.45867919921875, -0.346588134765625, -0.2344970703125, -0.122406005859375, -0.01031494140625, 0.101776123046875, 0.2138671875, 0.325958251953125, 0.43804931640625, 0.550140380859375, 0.6622314453125, 0.774322509765625, 0.88641357421875, 0.998504638671875, 1.110595703125, 1.222686767578125, 1.33477783203125, 1.446868896484375, 1.5589599609375, 1.671051025390625, 1.78314208984375, 1.895233154296875, 2.00732421875, 2.119415283203125, 2.23150634765625, 2.343597412109375, 2.4556884765625, 2.567779541015625, 2.67987060546875, 2.791961669921875, 2.904052734375, 3.016143798828125, 3.12823486328125, 3.240325927734375, 3.3524169921875, 3.464508056640625, 3.57659912109375, 3.688690185546875, 3.80078125]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 6.0, 1.0, 2.0, 6.0, 4.0, 9.0, 8.0, 4.0, 7.0, 12.0, 11.0, 15.0, 11.0, 10.0, 23.0, 31.0, 38.0, 60.0, 73.0, 119.0, 254.0, 619.0, 1830.0, 6659.0, 32857.0, 224283.0, 1662160.0, 1930900.0, 282880.0, 39969.0, 7964.0, 2052.0, 683.0, 279.0, 123.0, 79.0, 59.0, 35.0, 26.0, 21.0, 26.0, 16.0, 6.0, 11.0, 7.0, 14.0, 8.0, 7.0, 3.0, 7.0, 2.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.0546875, -8.75341796875, -8.4521484375, -8.15087890625, -7.849609375, -7.54833984375, -7.2470703125, -6.94580078125, -6.64453125, -6.34326171875, -6.0419921875, -5.74072265625, -5.439453125, -5.13818359375, -4.8369140625, -4.53564453125, -4.234375, -3.93310546875, -3.6318359375, -3.33056640625, -3.029296875, -2.72802734375, -2.4267578125, -2.12548828125, -1.82421875, -1.52294921875, -1.2216796875, -0.92041015625, -0.619140625, -0.31787109375, -0.0166015625, 0.28466796875, 0.5859375, 0.88720703125, 1.1884765625, 1.48974609375, 1.791015625, 2.09228515625, 2.3935546875, 2.69482421875, 2.99609375, 3.29736328125, 3.5986328125, 3.89990234375, 4.201171875, 4.50244140625, 4.8037109375, 5.10498046875, 5.40625, 5.70751953125, 6.0087890625, 6.31005859375, 6.611328125, 6.91259765625, 7.2138671875, 7.51513671875, 7.81640625, 8.11767578125, 8.4189453125, 8.72021484375, 9.021484375, 9.32275390625, 9.6240234375, 9.92529296875, 10.2265625]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 4.0, 2.0, 3.0, 10.0, 11.0, 14.0, 5.0, 16.0, 29.0, 36.0, 39.0, 47.0, 50.0, 84.0, 102.0, 111.0, 137.0, 180.0, 236.0, 269.0, 309.0, 310.0, 341.0, 329.0, 289.0, 235.0, 175.0, 139.0, 112.0, 93.0, 73.0, 56.0, 43.0, 42.0, 24.0, 27.0, 28.0, 12.0, 15.0, 12.0, 9.0, 6.0, 5.0, 3.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.359375, -6.14764404296875, -5.9359130859375, -5.72418212890625, -5.512451171875, -5.30072021484375, -5.0889892578125, -4.87725830078125, -4.66552734375, -4.45379638671875, -4.2420654296875, -4.03033447265625, -3.818603515625, -3.60687255859375, -3.3951416015625, -3.18341064453125, -2.9716796875, -2.75994873046875, -2.5482177734375, -2.33648681640625, -2.124755859375, -1.91302490234375, -1.7012939453125, -1.48956298828125, -1.27783203125, -1.06610107421875, -0.8543701171875, -0.64263916015625, -0.430908203125, -0.21917724609375, -0.0074462890625, 0.20428466796875, 0.416015625, 0.62774658203125, 0.8394775390625, 1.05120849609375, 1.262939453125, 1.47467041015625, 1.6864013671875, 1.89813232421875, 2.10986328125, 2.32159423828125, 2.5333251953125, 2.74505615234375, 2.956787109375, 3.16851806640625, 3.3802490234375, 3.59197998046875, 3.8037109375, 4.01544189453125, 4.2271728515625, 4.43890380859375, 4.650634765625, 4.86236572265625, 5.0740966796875, 5.28582763671875, 5.49755859375, 5.70928955078125, 5.9210205078125, 6.13275146484375, 6.344482421875, 6.55621337890625, 6.7679443359375, 6.97967529296875, 7.19140625]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 8.0, 5.0, 6.0, 14.0, 22.0, 22.0, 24.0, 31.0, 37.0, 39.0, 61.0, 60.0, 100.0, 97.0, 135.0, 163.0, 235.0, 332.0, 680.0, 3216.0, 42064.0, 1114182.0, 2894901.0, 127881.0, 7311.0, 1067.0, 398.0, 223.0, 188.0, 158.0, 137.0, 102.0, 77.0, 73.0, 44.0, 37.0, 37.0, 22.0, 21.0, 20.0, 16.0, 11.0, 8.0, 1.0, 5.0, 3.0, 2.0, 2.0, 1.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.375, -20.689453125, -20.00390625, -19.318359375, -18.6328125, -17.947265625, -17.26171875, -16.576171875, -15.890625, -15.205078125, -14.51953125, -13.833984375, -13.1484375, -12.462890625, -11.77734375, -11.091796875, -10.40625, -9.720703125, -9.03515625, -8.349609375, -7.6640625, -6.978515625, -6.29296875, -5.607421875, -4.921875, -4.236328125, -3.55078125, -2.865234375, -2.1796875, -1.494140625, -0.80859375, -0.123046875, 0.5625, 1.248046875, 1.93359375, 2.619140625, 3.3046875, 3.990234375, 4.67578125, 5.361328125, 6.046875, 6.732421875, 7.41796875, 8.103515625, 8.7890625, 9.474609375, 10.16015625, 10.845703125, 11.53125, 12.216796875, 12.90234375, 13.587890625, 14.2734375, 14.958984375, 15.64453125, 16.330078125, 17.015625, 17.701171875, 18.38671875, 19.072265625, 19.7578125, 20.443359375, 21.12890625, 21.814453125, 22.5]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 8.0, 77.0, 255.0, 360.0, 237.0, 65.0, 15.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-169.81350708007812, -165.16014099121094, -160.50677490234375, -155.8533935546875, -151.2000274658203, -146.54666137695312, -141.89329528808594, -137.23992919921875, -132.5865478515625, -127.93318176269531, -123.2798080444336, -118.6264419555664, -113.97306823730469, -109.3197021484375, -104.66633605957031, -100.01296997070312, -95.35960388183594, -90.70623779296875, -86.05286407470703, -81.39949798583984, -76.74612426757812, -72.09275817871094, -67.43939208984375, -62.7860221862793, -58.132652282714844, -53.47928237915039, -48.82591247558594, -44.17254638671875, -39.5191764831543, -34.865806579589844, -30.212438583374023, -25.559070587158203, -20.905715942382812, -16.25234603881836, -11.598978042602539, -6.945609092712402, -2.2922401428222656, 2.3611297607421875, 7.014497756958008, 11.667865753173828, 16.32123565673828, 20.974605560302734, 25.627973556518555, 30.281341552734375, 34.93471145629883, 39.58808135986328, 44.24144744873047, 48.89481735229492, 53.548187255859375, 58.20155715942383, 62.85492706298828, 67.50829315185547, 72.16166687011719, 76.81503295898438, 81.46839904785156, 86.12176513671875, 90.77513885498047, 95.42850494384766, 100.08187866210938, 104.73524475097656, 109.38861083984375, 114.04198455810547, 118.69535064697266, 123.34872436523438, 128.00209045410156]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 4.0, 4.0, 4.0, 4.0, 3.0, 3.0, 9.0, 12.0, 9.0, 8.0, 15.0, 18.0, 14.0, 15.0, 16.0, 32.0, 20.0, 20.0, 19.0, 33.0, 29.0, 35.0, 38.0, 32.0, 42.0, 37.0, 32.0, 35.0, 52.0, 37.0, 23.0, 34.0, 35.0, 39.0, 23.0, 26.0, 20.0, 17.0, 24.0, 20.0, 22.0, 11.0, 11.0, 10.0, 20.0, 9.0, 6.0, 9.0, 5.0, 2.0, 5.0, 1.0, 8.0, 1.0, 4.0, 0.0, 2.0], "bins": [-26.075408935546875, -25.31734275817871, -24.559276580810547, -23.801212310791016, -23.04314613342285, -22.285079956054688, -21.527015686035156, -20.768949508666992, -20.010883331298828, -19.252817153930664, -18.4947509765625, -17.73668670654297, -16.978620529174805, -16.22055435180664, -15.462489128112793, -14.704423904418945, -13.946357727050781, -13.188291549682617, -12.43022632598877, -11.672161102294922, -10.914094924926758, -10.156028747558594, -9.397963523864746, -8.639898300170898, -7.881832122802734, -7.1237664222717285, -6.365700721740723, -5.607635021209717, -4.849569320678711, -4.091503620147705, -3.333437919616699, -2.5753722190856934, -1.8173065185546875, -1.0592408180236816, -0.3011751174926758, 0.4568905830383301, 1.214956283569336, 1.9730219841003418, 2.7310876846313477, 3.4891533851623535, 4.247219085693359, 5.005284786224365, 5.763350486755371, 6.521416187286377, 7.279481887817383, 8.037548065185547, 8.795613288879395, 9.553678512573242, 10.311744689941406, 11.06981086730957, 11.827876091003418, 12.585941314697266, 13.34400749206543, 14.102073669433594, 14.860138893127441, 15.618204116821289, 16.376270294189453, 17.134336471557617, 17.89240264892578, 18.650466918945312, 19.408533096313477, 20.16659927368164, 20.924663543701172, 21.682729721069336, 22.4407958984375]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 1.0, 5.0, 9.0, 8.0, 6.0, 7.0, 17.0, 10.0, 20.0, 17.0, 19.0, 15.0, 29.0, 27.0, 32.0, 31.0, 28.0, 37.0, 34.0, 46.0, 31.0, 36.0, 46.0, 48.0, 41.0, 41.0, 28.0, 43.0, 27.0, 31.0, 24.0, 20.0, 19.0, 24.0, 19.0, 19.0, 15.0, 19.0, 15.0, 14.0, 14.0, 7.0, 4.0, 6.0, 5.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.466796875, -3.35345458984375, -3.2401123046875, -3.12677001953125, -3.013427734375, -2.90008544921875, -2.7867431640625, -2.67340087890625, -2.56005859375, -2.44671630859375, -2.3333740234375, -2.22003173828125, -2.106689453125, -1.99334716796875, -1.8800048828125, -1.76666259765625, -1.6533203125, -1.53997802734375, -1.4266357421875, -1.31329345703125, -1.199951171875, -1.08660888671875, -0.9732666015625, -0.85992431640625, -0.74658203125, -0.63323974609375, -0.5198974609375, -0.40655517578125, -0.293212890625, -0.17987060546875, -0.0665283203125, 0.04681396484375, 0.16015625, 0.27349853515625, 0.3868408203125, 0.50018310546875, 0.613525390625, 0.72686767578125, 0.8402099609375, 0.95355224609375, 1.06689453125, 1.18023681640625, 1.2935791015625, 1.40692138671875, 1.520263671875, 1.63360595703125, 1.7469482421875, 1.86029052734375, 1.9736328125, 2.08697509765625, 2.2003173828125, 2.31365966796875, 2.427001953125, 2.54034423828125, 2.6536865234375, 2.76702880859375, 2.88037109375, 2.99371337890625, 3.1070556640625, 3.22039794921875, 3.333740234375, 3.44708251953125, 3.5604248046875, 3.67376708984375, 3.787109375]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 7.0, 4.0, 11.0, 5.0, 14.0, 18.0, 31.0, 34.0, 54.0, 80.0, 122.0, 163.0, 283.0, 460.0, 706.0, 1277.0, 2322.0, 5041.0, 10868.0, 24500.0, 57468.0, 135251.0, 273650.0, 283057.0, 143163.0, 61255.0, 26026.0, 11474.0, 5184.0, 2648.0, 1337.0, 756.0, 434.0, 294.0, 169.0, 111.0, 85.0, 59.0, 37.0, 32.0, 21.0, 15.0, 14.0, 9.0, 5.0, 3.0, 3.0, 1.0, 0.0, 3.0], "bins": [-0.9892578125, -0.9625473022460938, -0.9358367919921875, -0.9091262817382812, -0.882415771484375, -0.8557052612304688, -0.8289947509765625, -0.8022842407226562, -0.77557373046875, -0.7488632202148438, -0.7221527099609375, -0.6954421997070312, -0.668731689453125, -0.6420211791992188, -0.6153106689453125, -0.5886001586914062, -0.5618896484375, -0.5351791381835938, -0.5084686279296875, -0.48175811767578125, -0.455047607421875, -0.42833709716796875, -0.4016265869140625, -0.37491607666015625, -0.34820556640625, -0.32149505615234375, -0.2947845458984375, -0.26807403564453125, -0.241363525390625, -0.21465301513671875, -0.1879425048828125, -0.16123199462890625, -0.134521484375, -0.10781097412109375, -0.0811004638671875, -0.05438995361328125, -0.027679443359375, -0.00096893310546875, 0.0257415771484375, 0.05245208740234375, 0.07916259765625, 0.10587310791015625, 0.1325836181640625, 0.15929412841796875, 0.186004638671875, 0.21271514892578125, 0.2394256591796875, 0.26613616943359375, 0.2928466796875, 0.31955718994140625, 0.3462677001953125, 0.37297821044921875, 0.399688720703125, 0.42639923095703125, 0.4531097412109375, 0.47982025146484375, 0.50653076171875, 0.5332412719726562, 0.5599517822265625, 0.5866622924804688, 0.613372802734375, 0.6400833129882812, 0.6667938232421875, 0.6935043334960938, 0.72021484375]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 7.0, 5.0, 6.0, 8.0, 7.0, 6.0, 7.0, 13.0, 17.0, 15.0, 19.0, 21.0, 21.0, 29.0, 40.0, 35.0, 32.0, 29.0, 40.0, 39.0, 35.0, 48.0, 1064.0, 39.0, 37.0, 32.0, 38.0, 41.0, 27.0, 34.0, 32.0, 30.0, 26.0, 27.0, 15.0, 17.0, 14.0, 14.0, 9.0, 8.0, 4.0, 8.0, 8.0, 7.0, 1.0, 8.0, 1.0, 1.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.162109375, -2.089019775390625, -2.01593017578125, -1.942840576171875, -1.8697509765625, -1.796661376953125, -1.72357177734375, -1.650482177734375, -1.577392578125, -1.504302978515625, -1.43121337890625, -1.358123779296875, -1.2850341796875, -1.211944580078125, -1.13885498046875, -1.065765380859375, -0.99267578125, -0.919586181640625, -0.84649658203125, -0.773406982421875, -0.7003173828125, -0.627227783203125, -0.55413818359375, -0.481048583984375, -0.407958984375, -0.334869384765625, -0.26177978515625, -0.188690185546875, -0.1156005859375, -0.042510986328125, 0.03057861328125, 0.103668212890625, 0.1767578125, 0.249847412109375, 0.32293701171875, 0.396026611328125, 0.4691162109375, 0.542205810546875, 0.61529541015625, 0.688385009765625, 0.761474609375, 0.834564208984375, 0.90765380859375, 0.980743408203125, 1.0538330078125, 1.126922607421875, 1.20001220703125, 1.273101806640625, 1.34619140625, 1.419281005859375, 1.49237060546875, 1.565460205078125, 1.6385498046875, 1.711639404296875, 1.78472900390625, 1.857818603515625, 1.930908203125, 2.003997802734375, 2.07708740234375, 2.150177001953125, 2.2232666015625, 2.296356201171875, 2.36944580078125, 2.442535400390625, 2.515625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 1.0, 1.0, 5.0, 1.0, 7.0, 6.0, 8.0, 15.0, 15.0, 22.0, 30.0, 44.0, 72.0, 91.0, 127.0, 231.0, 356.0, 612.0, 894.0, 1457.0, 2533.0, 4399.0, 7458.0, 13545.0, 24874.0, 45570.0, 81275.0, 138725.0, 556797.0, 886278.0, 142711.0, 83801.0, 46684.0, 25442.0, 14100.0, 7727.0, 4527.0, 2575.0, 1500.0, 929.0, 598.0, 371.0, 236.0, 165.0, 92.0, 64.0, 43.0, 34.0, 21.0, 20.0, 21.0, 9.0, 6.0, 5.0, 1.0, 5.0, 5.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.339599609375, -0.3289947509765625, -0.318389892578125, -0.3077850341796875, -0.29718017578125, -0.2865753173828125, -0.275970458984375, -0.2653656005859375, -0.2547607421875, -0.2441558837890625, -0.233551025390625, -0.2229461669921875, -0.21234130859375, -0.2017364501953125, -0.191131591796875, -0.1805267333984375, -0.169921875, -0.1593170166015625, -0.148712158203125, -0.1381072998046875, -0.12750244140625, -0.1168975830078125, -0.106292724609375, -0.0956878662109375, -0.0850830078125, -0.0744781494140625, -0.063873291015625, -0.0532684326171875, -0.04266357421875, -0.0320587158203125, -0.021453857421875, -0.0108489990234375, -0.000244140625, 0.0103607177734375, 0.020965576171875, 0.0315704345703125, 0.04217529296875, 0.0527801513671875, 0.063385009765625, 0.0739898681640625, 0.0845947265625, 0.0951995849609375, 0.105804443359375, 0.1164093017578125, 0.12701416015625, 0.1376190185546875, 0.148223876953125, 0.1588287353515625, 0.16943359375, 0.1800384521484375, 0.190643310546875, 0.2012481689453125, 0.21185302734375, 0.2224578857421875, 0.233062744140625, 0.2436676025390625, 0.2542724609375, 0.2648773193359375, 0.275482177734375, 0.2860870361328125, 0.29669189453125, 0.3072967529296875, 0.317901611328125, 0.3285064697265625, 0.339111328125]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 3.0, 3.0, 5.0, 3.0, 5.0, 6.0, 7.0, 11.0, 10.0, 21.0, 26.0, 62.0, 88.0, 104.0, 209.0, 130.0, 84.0, 71.0, 37.0, 29.0, 28.0, 12.0, 6.0, 10.0, 5.0, 2.0, 4.0, 10.0, 6.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0782470703125, -0.07611370086669922, -0.07398033142089844, -0.07184696197509766, -0.06971359252929688, -0.0675802230834961, -0.06544685363769531, -0.06331348419189453, -0.06118011474609375, -0.05904674530029297, -0.05691337585449219, -0.054780006408691406, -0.052646636962890625, -0.050513267517089844, -0.04837989807128906, -0.04624652862548828, -0.0441131591796875, -0.04197978973388672, -0.03984642028808594, -0.037713050842285156, -0.035579681396484375, -0.033446311950683594, -0.03131294250488281, -0.02917957305908203, -0.02704620361328125, -0.02491283416748047, -0.022779464721679688, -0.020646095275878906, -0.018512725830078125, -0.016379356384277344, -0.014245986938476562, -0.012112617492675781, -0.009979248046875, -0.007845878601074219, -0.0057125091552734375, -0.0035791397094726562, -0.001445770263671875, 0.0006875991821289062, 0.0028209686279296875, 0.004954338073730469, 0.00708770751953125, 0.009221076965332031, 0.011354446411132812, 0.013487815856933594, 0.015621185302734375, 0.017754554748535156, 0.019887924194335938, 0.02202129364013672, 0.0241546630859375, 0.02628803253173828, 0.028421401977539062, 0.030554771423339844, 0.032688140869140625, 0.034821510314941406, 0.03695487976074219, 0.03908824920654297, 0.04122161865234375, 0.04335498809814453, 0.04548835754394531, 0.047621726989746094, 0.049755096435546875, 0.051888465881347656, 0.05402183532714844, 0.05615520477294922, 0.05828857421875]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 6.0, 6.0, 7.0, 3.0, 3.0, 10.0, 11.0, 10.0, 29.0, 42.0, 45.0, 112.0, 265.0, 1707.0, 917225.0, 127613.0, 1021.0, 209.0, 93.0, 43.0, 24.0, 20.0, 14.0, 9.0, 5.0, 5.0, 6.0, 1.0, 5.0, 1.0, 5.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3037109375, -1.25701904296875, -1.2103271484375, -1.16363525390625, -1.116943359375, -1.07025146484375, -1.0235595703125, -0.97686767578125, -0.93017578125, -0.88348388671875, -0.8367919921875, -0.79010009765625, -0.743408203125, -0.69671630859375, -0.6500244140625, -0.60333251953125, -0.556640625, -0.50994873046875, -0.4632568359375, -0.41656494140625, -0.369873046875, -0.32318115234375, -0.2764892578125, -0.22979736328125, -0.18310546875, -0.13641357421875, -0.0897216796875, -0.04302978515625, 0.003662109375, 0.05035400390625, 0.0970458984375, 0.14373779296875, 0.1904296875, 0.23712158203125, 0.2838134765625, 0.33050537109375, 0.377197265625, 0.42388916015625, 0.4705810546875, 0.51727294921875, 0.56396484375, 0.61065673828125, 0.6573486328125, 0.70404052734375, 0.750732421875, 0.79742431640625, 0.8441162109375, 0.89080810546875, 0.9375, 0.98419189453125, 1.0308837890625, 1.07757568359375, 1.124267578125, 1.17095947265625, 1.2176513671875, 1.26434326171875, 1.31103515625, 1.35772705078125, 1.4044189453125, 1.45111083984375, 1.497802734375, 1.54449462890625, 1.5911865234375, 1.63787841796875, 1.6845703125]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 11.0, 26.0, 81.0, 199.0, 540.0, 113.0, 30.0, 8.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2866206765174866, -0.27487069368362427, -0.2631206810474396, -0.25137069821357727, -0.23962070047855377, -0.22787070274353027, -0.21612071990966797, -0.20437072217464447, -0.19262072443962097, -0.18087072670459747, -0.16912074387073517, -0.15737074613571167, -0.14562074840068817, -0.13387075066566467, -0.12212076783180237, -0.11037077009677887, -0.09862078726291656, -0.08687079697847366, -0.07512079924345016, -0.06337080895900726, -0.05162081494927406, -0.03987082093954086, -0.02812083065509796, -0.016370832920074463, -0.004620842635631561, 0.007129150442779064, 0.01887914352118969, 0.03062913566827774, 0.04237912967801094, 0.05412912368774414, 0.06587911397218704, 0.07762911170721054, 0.08937910199165344, 0.10112909227609634, 0.11287909001111984, 0.12462908029556274, 0.13637907803058624, 0.14812907576560974, 0.15987905859947205, 0.17162905633449554, 0.18337905406951904, 0.19512905180454254, 0.20687903463840485, 0.21862903237342834, 0.23037903010845184, 0.24212902784347534, 0.25387901067733765, 0.26562899351119995, 0.27737897634506226, 0.28912895917892456, 0.30087897181510925, 0.31262895464897156, 0.32437893748283386, 0.33612895011901855, 0.34787893295288086, 0.35962891578674316, 0.37137892842292786, 0.38312891125679016, 0.39487892389297485, 0.40662890672683716, 0.41837888956069946, 0.43012890219688416, 0.44187888503074646, 0.45362889766693115, 0.46537888050079346]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 11.0, 5.0, 6.0, 15.0, 12.0, 11.0, 16.0, 14.0, 25.0, 26.0, 29.0, 35.0, 26.0, 30.0, 29.0, 38.0, 32.0, 41.0, 44.0, 35.0, 34.0, 46.0, 36.0, 36.0, 36.0, 39.0, 23.0, 35.0, 23.0, 30.0, 24.0, 24.0, 22.0, 17.0, 22.0, 14.0, 15.0, 7.0, 8.0, 10.0, 6.0, 1.0, 5.0, 2.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.07481110095977783, -0.07235562801361084, -0.06990016251802444, -0.06744469702243805, -0.06498922407627106, -0.06253375113010406, -0.06007828563451767, -0.057622816413640976, -0.05516734719276428, -0.05271187797188759, -0.050256408751010895, -0.0478009395301342, -0.04534547030925751, -0.042890001088380814, -0.04043453186750412, -0.037979062646627426, -0.03552359342575073, -0.03306812420487404, -0.030612654983997345, -0.02815718576312065, -0.025701716542243958, -0.023246247321367264, -0.02079077810049057, -0.018335308879613876, -0.015879839658737183, -0.013424370437860489, -0.010968901216983795, -0.008513431996107101, -0.006057962775230408, -0.003602493554353714, -0.0011470243334770203, 0.0013084448873996735, 0.003763914108276367, 0.006219383329153061, 0.008674852550029755, 0.011130321770906448, 0.013585790991783142, 0.016041260212659836, 0.01849672943353653, 0.020952198654413223, 0.023407667875289917, 0.02586313709616661, 0.028318606317043304, 0.030774075537919998, 0.03322954475879669, 0.035685013979673386, 0.03814048320055008, 0.04059595242142677, 0.04305142164230347, 0.04550689086318016, 0.047962360084056854, 0.05041782930493355, 0.05287329852581024, 0.055328767746686935, 0.05778423696756363, 0.06023970618844032, 0.06269517540931702, 0.06515064835548401, 0.0676061138510704, 0.0700615793466568, 0.07251705229282379, 0.07497252523899078, 0.07742799073457718, 0.07988345623016357, 0.08233892917633057]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 1.0, 5.0, 9.0, 7.0, 7.0, 7.0, 16.0, 11.0, 19.0, 18.0, 18.0, 16.0, 27.0, 29.0, 33.0, 30.0, 26.0, 39.0, 32.0, 45.0, 33.0, 34.0, 47.0, 50.0, 40.0, 41.0, 29.0, 43.0, 26.0, 32.0, 24.0, 20.0, 19.0, 23.0, 19.0, 20.0, 15.0, 19.0, 15.0, 13.0, 15.0, 7.0, 4.0, 6.0, 5.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.46875, -3.35540771484375, -3.2420654296875, -3.12872314453125, -3.015380859375, -2.90203857421875, -2.7886962890625, -2.67535400390625, -2.56201171875, -2.44866943359375, -2.3353271484375, -2.22198486328125, -2.108642578125, -1.99530029296875, -1.8819580078125, -1.76861572265625, -1.6552734375, -1.54193115234375, -1.4285888671875, -1.31524658203125, -1.201904296875, -1.08856201171875, -0.9752197265625, -0.86187744140625, -0.74853515625, -0.63519287109375, -0.5218505859375, -0.40850830078125, -0.295166015625, -0.18182373046875, -0.0684814453125, 0.04486083984375, 0.158203125, 0.27154541015625, 0.3848876953125, 0.49822998046875, 0.611572265625, 0.72491455078125, 0.8382568359375, 0.95159912109375, 1.06494140625, 1.17828369140625, 1.2916259765625, 1.40496826171875, 1.518310546875, 1.63165283203125, 1.7449951171875, 1.85833740234375, 1.9716796875, 2.08502197265625, 2.1983642578125, 2.31170654296875, 2.425048828125, 2.53839111328125, 2.6517333984375, 2.76507568359375, 2.87841796875, 2.99176025390625, 3.1051025390625, 3.21844482421875, 3.331787109375, 3.44512939453125, 3.5584716796875, 3.67181396484375, 3.78515625]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 5.0, 10.0, 19.0, 23.0, 38.0, 55.0, 97.0, 145.0, 240.0, 478.0, 763.0, 1253.0, 2007.0, 3681.0, 6613.0, 12153.0, 24083.0, 55508.0, 158083.0, 410607.0, 229194.0, 78130.0, 31273.0, 15371.0, 8054.0, 4532.0, 2497.0, 1511.0, 878.0, 476.0, 286.0, 182.0, 116.0, 73.0, 43.0, 38.0, 26.0, 9.0, 6.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4453125, -3.32080078125, -3.1962890625, -3.07177734375, -2.947265625, -2.82275390625, -2.6982421875, -2.57373046875, -2.44921875, -2.32470703125, -2.2001953125, -2.07568359375, -1.951171875, -1.82666015625, -1.7021484375, -1.57763671875, -1.453125, -1.32861328125, -1.2041015625, -1.07958984375, -0.955078125, -0.83056640625, -0.7060546875, -0.58154296875, -0.45703125, -0.33251953125, -0.2080078125, -0.08349609375, 0.041015625, 0.16552734375, 0.2900390625, 0.41455078125, 0.5390625, 0.66357421875, 0.7880859375, 0.91259765625, 1.037109375, 1.16162109375, 1.2861328125, 1.41064453125, 1.53515625, 1.65966796875, 1.7841796875, 1.90869140625, 2.033203125, 2.15771484375, 2.2822265625, 2.40673828125, 2.53125, 2.65576171875, 2.7802734375, 2.90478515625, 3.029296875, 3.15380859375, 3.2783203125, 3.40283203125, 3.52734375, 3.65185546875, 3.7763671875, 3.90087890625, 4.025390625, 4.14990234375, 4.2744140625, 4.39892578125, 4.5234375]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 1.0, 8.0, 5.0, 5.0, 5.0, 7.0, 13.0, 13.0, 18.0, 13.0, 22.0, 18.0, 22.0, 27.0, 34.0, 36.0, 34.0, 50.0, 35.0, 74.0, 164.0, 1467.0, 355.0, 155.0, 98.0, 50.0, 42.0, 29.0, 49.0, 35.0, 22.0, 16.0, 23.0, 19.0, 15.0, 19.0, 15.0, 6.0, 6.0, 14.0, 5.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.90625, -13.4844970703125, -13.062744140625, -12.6409912109375, -12.21923828125, -11.7974853515625, -11.375732421875, -10.9539794921875, -10.5322265625, -10.1104736328125, -9.688720703125, -9.2669677734375, -8.84521484375, -8.4234619140625, -8.001708984375, -7.5799560546875, -7.158203125, -6.7364501953125, -6.314697265625, -5.8929443359375, -5.47119140625, -5.0494384765625, -4.627685546875, -4.2059326171875, -3.7841796875, -3.3624267578125, -2.940673828125, -2.5189208984375, -2.09716796875, -1.6754150390625, -1.253662109375, -0.8319091796875, -0.41015625, 0.0115966796875, 0.433349609375, 0.8551025390625, 1.27685546875, 1.6986083984375, 2.120361328125, 2.5421142578125, 2.9638671875, 3.3856201171875, 3.807373046875, 4.2291259765625, 4.65087890625, 5.0726318359375, 5.494384765625, 5.9161376953125, 6.337890625, 6.7596435546875, 7.181396484375, 7.6031494140625, 8.02490234375, 8.4466552734375, 8.868408203125, 9.2901611328125, 9.7119140625, 10.1336669921875, 10.555419921875, 10.9771728515625, 11.39892578125, 11.8206787109375, 12.242431640625, 12.6641845703125, 13.0859375]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 7.0, 9.0, 9.0, 17.0, 36.0, 31.0, 63.0, 89.0, 136.0, 201.0, 301.0, 547.0, 3207.0, 2755444.0, 382385.0, 1909.0, 482.0, 270.0, 188.0, 115.0, 89.0, 65.0, 44.0, 12.0, 18.0, 14.0, 9.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.5, -44.99560546875, -43.4912109375, -41.98681640625, -40.482421875, -38.97802734375, -37.4736328125, -35.96923828125, -34.46484375, -32.96044921875, -31.4560546875, -29.95166015625, -28.447265625, -26.94287109375, -25.4384765625, -23.93408203125, -22.4296875, -20.92529296875, -19.4208984375, -17.91650390625, -16.412109375, -14.90771484375, -13.4033203125, -11.89892578125, -10.39453125, -8.89013671875, -7.3857421875, -5.88134765625, -4.376953125, -2.87255859375, -1.3681640625, 0.13623046875, 1.640625, 3.14501953125, 4.6494140625, 6.15380859375, 7.658203125, 9.16259765625, 10.6669921875, 12.17138671875, 13.67578125, 15.18017578125, 16.6845703125, 18.18896484375, 19.693359375, 21.19775390625, 22.7021484375, 24.20654296875, 25.7109375, 27.21533203125, 28.7197265625, 30.22412109375, 31.728515625, 33.23291015625, 34.7373046875, 36.24169921875, 37.74609375, 39.25048828125, 40.7548828125, 42.25927734375, 43.763671875, 45.26806640625, 46.7724609375, 48.27685546875, 49.78125]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 12.0, 124.0, 528.0, 307.0, 45.0, 2.0, 1.0, 1.0], "bins": [-172.621826171875, -169.68186950683594, -166.74192810058594, -163.80197143554688, -160.86203002929688, -157.9220733642578, -154.9821319580078, -152.04217529296875, -149.10223388671875, -146.1622772216797, -143.2223358154297, -140.28237915039062, -137.34243774414062, -134.40248107910156, -131.46253967285156, -128.5225830078125, -125.5826416015625, -122.64269256591797, -119.70274353027344, -116.7627944946289, -113.82284545898438, -110.88289642333984, -107.94294738769531, -105.00299835205078, -102.06304168701172, -99.12309265136719, -96.18314361572266, -93.24319458007812, -90.3032455444336, -87.36329650878906, -84.42334747314453, -81.4833984375, -78.54344940185547, -75.60350036621094, -72.6635513305664, -69.72360229492188, -66.78365325927734, -63.84370422363281, -60.90375518798828, -57.96380615234375, -55.02385711669922, -52.08390808105469, -49.143959045410156, -46.204010009765625, -43.264060974121094, -40.32411193847656, -37.38416290283203, -34.4442138671875, -31.50426483154297, -28.564315795898438, -25.624366760253906, -22.684417724609375, -19.744468688964844, -16.804519653320312, -13.864568710327148, -10.924619674682617, -7.9846696853637695, -5.044720649719238, -2.104771137237549, 0.8351783752441406, 3.775127410888672, 6.715076446533203, 9.65502643585205, 12.594975471496582, 15.534924507141113]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 5.0, 7.0, 3.0, 3.0, 8.0, 12.0, 13.0, 14.0, 12.0, 13.0, 14.0, 14.0, 19.0, 19.0, 21.0, 32.0, 34.0, 30.0, 39.0, 29.0, 34.0, 35.0, 29.0, 37.0, 40.0, 36.0, 32.0, 39.0, 27.0, 37.0, 33.0, 31.0, 29.0, 27.0, 18.0, 27.0, 26.0, 17.0, 13.0, 17.0, 13.0, 14.0, 13.0, 5.0, 4.0, 7.0, 5.0, 6.0, 5.0, 4.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.529407501220703, -30.55421257019043, -29.579015731811523, -28.60382080078125, -27.628623962402344, -26.65342903137207, -25.678234100341797, -24.70303726196289, -23.727842330932617, -22.752647399902344, -21.777450561523438, -20.802255630493164, -19.82706069946289, -18.851863861083984, -17.87666893005371, -16.901473999023438, -15.926277160644531, -14.951081275939941, -13.975885391235352, -13.000690460205078, -12.025494575500488, -11.050298690795898, -10.075103759765625, -9.099907875061035, -8.124711990356445, -7.1495161056518555, -6.174320697784424, -5.199125289916992, -4.223929405212402, -3.2487335205078125, -2.273538112640381, -1.2983427047729492, -0.3231468200683594, 0.6520488262176514, 1.627244472503662, 2.602440118789673, 3.5776357650756836, 4.552831649780273, 5.528027057647705, 6.503222465515137, 7.478418350219727, 8.453614234924316, 9.428810119628906, 10.40400505065918, 11.37920093536377, 12.35439682006836, 13.329591751098633, 14.304787635803223, 15.279983520507812, 16.255178451538086, 17.230375289916992, 18.205570220947266, 19.180767059326172, 20.155961990356445, 21.13115692138672, 22.106353759765625, 23.0815486907959, 24.056743621826172, 25.031940460205078, 26.00713539123535, 26.982330322265625, 27.95752716064453, 28.932722091674805, 29.907917022705078, 30.883113861083984]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 6.0, 4.0, 5.0, 3.0, 9.0, 8.0, 10.0, 5.0, 17.0, 14.0, 17.0, 18.0, 19.0, 13.0, 31.0, 29.0, 28.0, 34.0, 31.0, 39.0, 28.0, 48.0, 34.0, 48.0, 38.0, 31.0, 46.0, 43.0, 38.0, 36.0, 31.0, 28.0, 27.0, 16.0, 21.0, 20.0, 14.0, 13.0, 18.0, 19.0, 14.0, 10.0, 14.0, 10.0, 9.0, 3.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.7109375, -3.592010498046875, -3.47308349609375, -3.354156494140625, -3.2352294921875, -3.116302490234375, -2.99737548828125, -2.878448486328125, -2.759521484375, -2.640594482421875, -2.52166748046875, -2.402740478515625, -2.2838134765625, -2.164886474609375, -2.04595947265625, -1.927032470703125, -1.80810546875, -1.689178466796875, -1.57025146484375, -1.451324462890625, -1.3323974609375, -1.213470458984375, -1.09454345703125, -0.975616455078125, -0.856689453125, -0.737762451171875, -0.61883544921875, -0.499908447265625, -0.3809814453125, -0.262054443359375, -0.14312744140625, -0.024200439453125, 0.0947265625, 0.213653564453125, 0.33258056640625, 0.451507568359375, 0.5704345703125, 0.689361572265625, 0.80828857421875, 0.927215576171875, 1.046142578125, 1.165069580078125, 1.28399658203125, 1.402923583984375, 1.5218505859375, 1.640777587890625, 1.75970458984375, 1.878631591796875, 1.99755859375, 2.116485595703125, 2.23541259765625, 2.354339599609375, 2.4732666015625, 2.592193603515625, 2.71112060546875, 2.830047607421875, 2.948974609375, 3.067901611328125, 3.18682861328125, 3.305755615234375, 3.4246826171875, 3.543609619140625, 3.66253662109375, 3.781463623046875, 3.900390625]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 2.0, 3.0, 5.0, 5.0, 10.0, 7.0, 12.0, 25.0, 20.0, 15.0, 34.0, 32.0, 59.0, 116.0, 196.0, 321.0, 779.0, 1936.0, 5719.0, 22305.0, 103629.0, 609558.0, 2062069.0, 1134273.0, 199463.0, 38937.0, 9591.0, 2940.0, 1095.0, 455.0, 214.0, 150.0, 93.0, 43.0, 37.0, 29.0, 27.0, 13.0, 14.0, 12.0, 13.0, 7.0, 6.0, 2.0, 6.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-7.8359375, -7.58868408203125, -7.3414306640625, -7.09417724609375, -6.846923828125, -6.59967041015625, -6.3524169921875, -6.10516357421875, -5.85791015625, -5.61065673828125, -5.3634033203125, -5.11614990234375, -4.868896484375, -4.62164306640625, -4.3743896484375, -4.12713623046875, -3.8798828125, -3.63262939453125, -3.3853759765625, -3.13812255859375, -2.890869140625, -2.64361572265625, -2.3963623046875, -2.14910888671875, -1.90185546875, -1.65460205078125, -1.4073486328125, -1.16009521484375, -0.912841796875, -0.66558837890625, -0.4183349609375, -0.17108154296875, 0.076171875, 0.32342529296875, 0.5706787109375, 0.81793212890625, 1.065185546875, 1.31243896484375, 1.5596923828125, 1.80694580078125, 2.05419921875, 2.30145263671875, 2.5487060546875, 2.79595947265625, 3.043212890625, 3.29046630859375, 3.5377197265625, 3.78497314453125, 4.0322265625, 4.27947998046875, 4.5267333984375, 4.77398681640625, 5.021240234375, 5.26849365234375, 5.5157470703125, 5.76300048828125, 6.01025390625, 6.25750732421875, 6.5047607421875, 6.75201416015625, 6.999267578125, 7.24652099609375, 7.4937744140625, 7.74102783203125, 7.98828125]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 6.0, 8.0, 13.0, 9.0, 26.0, 26.0, 27.0, 55.0, 93.0, 98.0, 193.0, 222.0, 345.0, 447.0, 518.0, 466.0, 375.0, 346.0, 227.0, 165.0, 118.0, 99.0, 67.0, 42.0, 27.0, 20.0, 13.0, 12.0, 9.0, 5.0, 5.0, 0.0, 2.0, 1.0, 2.0], "bins": [-14.203125, -13.8795166015625, -13.555908203125, -13.2322998046875, -12.90869140625, -12.5850830078125, -12.261474609375, -11.9378662109375, -11.6142578125, -11.2906494140625, -10.967041015625, -10.6434326171875, -10.31982421875, -9.9962158203125, -9.672607421875, -9.3489990234375, -9.025390625, -8.7017822265625, -8.378173828125, -8.0545654296875, -7.73095703125, -7.4073486328125, -7.083740234375, -6.7601318359375, -6.4365234375, -6.1129150390625, -5.789306640625, -5.4656982421875, -5.14208984375, -4.8184814453125, -4.494873046875, -4.1712646484375, -3.84765625, -3.5240478515625, -3.200439453125, -2.8768310546875, -2.55322265625, -2.2296142578125, -1.906005859375, -1.5823974609375, -1.2587890625, -0.9351806640625, -0.611572265625, -0.2879638671875, 0.03564453125, 0.3592529296875, 0.682861328125, 1.0064697265625, 1.330078125, 1.6536865234375, 1.977294921875, 2.3009033203125, 2.62451171875, 2.9481201171875, 3.271728515625, 3.5953369140625, 3.9189453125, 4.2425537109375, 4.566162109375, 4.8897705078125, 5.21337890625, 5.5369873046875, 5.860595703125, 6.1842041015625, 6.5078125]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 5.0, 4.0, 3.0, 17.0, 23.0, 27.0, 34.0, 55.0, 87.0, 133.0, 191.0, 230.0, 357.0, 796.0, 5114.0, 583026.0, 3569030.0, 32557.0, 1233.0, 487.0, 296.0, 180.0, 139.0, 79.0, 63.0, 38.0, 28.0, 28.0, 9.0, 10.0, 8.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.046875, -20.900146484375, -19.75341796875, -18.606689453125, -17.4599609375, -16.313232421875, -15.16650390625, -14.019775390625, -12.873046875, -11.726318359375, -10.57958984375, -9.432861328125, -8.2861328125, -7.139404296875, -5.99267578125, -4.845947265625, -3.69921875, -2.552490234375, -1.40576171875, -0.259033203125, 0.8876953125, 2.034423828125, 3.18115234375, 4.327880859375, 5.474609375, 6.621337890625, 7.76806640625, 8.914794921875, 10.0615234375, 11.208251953125, 12.35498046875, 13.501708984375, 14.6484375, 15.795166015625, 16.94189453125, 18.088623046875, 19.2353515625, 20.382080078125, 21.52880859375, 22.675537109375, 23.822265625, 24.968994140625, 26.11572265625, 27.262451171875, 28.4091796875, 29.555908203125, 30.70263671875, 31.849365234375, 32.99609375, 34.142822265625, 35.28955078125, 36.436279296875, 37.5830078125, 38.729736328125, 39.87646484375, 41.023193359375, 42.169921875, 43.316650390625, 44.46337890625, 45.610107421875, 46.7568359375, 47.903564453125, 49.05029296875, 50.197021484375, 51.34375]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 7.0, 2.0, 12.0, 21.0, 28.0, 64.0, 62.0, 71.0, 105.0, 112.0, 103.0, 88.0, 93.0, 73.0, 46.0, 50.0, 29.0, 19.0, 7.0, 9.0, 7.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-49.66603469848633, -48.361122131347656, -47.05621337890625, -45.75130081176758, -44.446388244628906, -43.141475677490234, -41.83656311035156, -40.531654357910156, -39.226741790771484, -37.92182922363281, -36.616920471191406, -35.312007904052734, -34.00709533691406, -32.70218276977539, -31.39727210998535, -30.092361450195312, -28.78744888305664, -27.48253631591797, -26.17762565612793, -24.87271499633789, -23.56780242919922, -22.262889862060547, -20.957979202270508, -19.65306854248047, -18.348155975341797, -17.043243408203125, -15.738332748413086, -14.43342113494873, -13.128509521484375, -11.82359790802002, -10.518686294555664, -9.213774681091309, -7.9088592529296875, -6.603947639465332, -5.299036026000977, -3.994124412536621, -2.6892127990722656, -1.3843011856079102, -0.07938957214355469, 1.2255220413208008, 2.5304336547851562, 3.8353452682495117, 5.140256881713867, 6.445168495178223, 7.750080108642578, 9.054991722106934, 10.359903335571289, 11.664814949035645, 12.9697265625, 14.274638175964355, 15.579549789428711, 16.88446044921875, 18.189373016357422, 19.494285583496094, 20.799196243286133, 22.104106903076172, 23.409019470214844, 24.713932037353516, 26.018842697143555, 27.323753356933594, 28.628665924072266, 29.933578491210938, 31.238489151000977, 32.543399810791016, 33.84831237792969]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 0.0, 0.0, 4.0, 4.0, 5.0, 3.0, 5.0, 8.0, 9.0, 8.0, 6.0, 15.0, 14.0, 23.0, 22.0, 19.0, 19.0, 27.0, 28.0, 23.0, 37.0, 27.0, 18.0, 31.0, 28.0, 40.0, 29.0, 33.0, 45.0, 41.0, 33.0, 38.0, 37.0, 37.0, 28.0, 27.0, 28.0, 31.0, 19.0, 28.0, 16.0, 16.0, 19.0, 9.0, 21.0, 11.0, 6.0, 8.0, 9.0, 3.0, 4.0, 2.0, 1.0, 4.0, 1.0, 3.0, 2.0], "bins": [-27.349945068359375, -26.553348541259766, -25.756750106811523, -24.96015167236328, -24.163555145263672, -23.366958618164062, -22.57036018371582, -21.773761749267578, -20.97716522216797, -20.18056869506836, -19.383970260620117, -18.587371826171875, -17.790775299072266, -16.994178771972656, -16.197580337524414, -15.400982856750488, -14.604385375976562, -13.807787895202637, -13.011190414428711, -12.214592933654785, -11.41799545288086, -10.621397972106934, -9.824800491333008, -9.028203010559082, -8.231605529785156, -7.4350080490112305, -6.638410568237305, -5.841813087463379, -5.045215606689453, -4.248618125915527, -3.4520206451416016, -2.655423164367676, -1.85882568359375, -1.0622282028198242, -0.26563072204589844, 0.5309667587280273, 1.3275642395019531, 2.124161720275879, 2.9207592010498047, 3.7173566818237305, 4.513954162597656, 5.310551643371582, 6.107149124145508, 6.903746604919434, 7.700344085693359, 8.496941566467285, 9.293539047241211, 10.090136528015137, 10.886734008789062, 11.683331489562988, 12.479928970336914, 13.27652645111084, 14.073123931884766, 14.869721412658691, 15.666318893432617, 16.46291732788086, 17.25951385498047, 18.056110382080078, 18.85270881652832, 19.649307250976562, 20.445903778076172, 21.24250030517578, 22.039098739624023, 22.835697174072266, 23.632293701171875]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 0.0, 4.0, 5.0, 7.0, 10.0, 7.0, 11.0, 11.0, 13.0, 15.0, 18.0, 20.0, 25.0, 23.0, 30.0, 23.0, 25.0, 29.0, 38.0, 35.0, 40.0, 38.0, 37.0, 48.0, 37.0, 42.0, 32.0, 38.0, 30.0, 33.0, 32.0, 30.0, 20.0, 32.0, 21.0, 24.0, 20.0, 13.0, 11.0, 15.0, 17.0, 11.0, 11.0, 5.0, 8.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.88671875, -3.768463134765625, -3.65020751953125, -3.531951904296875, -3.4136962890625, -3.295440673828125, -3.17718505859375, -3.058929443359375, -2.940673828125, -2.822418212890625, -2.70416259765625, -2.585906982421875, -2.4676513671875, -2.349395751953125, -2.23114013671875, -2.112884521484375, -1.99462890625, -1.876373291015625, -1.75811767578125, -1.639862060546875, -1.5216064453125, -1.403350830078125, -1.28509521484375, -1.166839599609375, -1.048583984375, -0.930328369140625, -0.81207275390625, -0.693817138671875, -0.5755615234375, -0.457305908203125, -0.33905029296875, -0.220794677734375, -0.1025390625, 0.015716552734375, 0.13397216796875, 0.252227783203125, 0.3704833984375, 0.488739013671875, 0.60699462890625, 0.725250244140625, 0.843505859375, 0.961761474609375, 1.08001708984375, 1.198272705078125, 1.3165283203125, 1.434783935546875, 1.55303955078125, 1.671295166015625, 1.78955078125, 1.907806396484375, 2.02606201171875, 2.144317626953125, 2.2625732421875, 2.380828857421875, 2.49908447265625, 2.617340087890625, 2.735595703125, 2.853851318359375, 2.97210693359375, 3.090362548828125, 3.2086181640625, 3.326873779296875, 3.44512939453125, 3.563385009765625, 3.681640625]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 10.0, 10.0, 19.0, 40.0, 45.0, 65.0, 97.0, 140.0, 192.0, 367.0, 485.0, 768.0, 1203.0, 1794.0, 2823.0, 4083.0, 6315.0, 9682.0, 14664.0, 22242.0, 33031.0, 50234.0, 74023.0, 106027.0, 139079.0, 152028.0, 131356.0, 97311.0, 67122.0, 45333.0, 29853.0, 19716.0, 13168.0, 8658.0, 5657.0, 3688.0, 2506.0, 1601.0, 1158.0, 632.0, 475.0, 296.0, 173.0, 134.0, 90.0, 56.0, 39.0, 29.0, 15.0, 13.0, 6.0, 3.0, 4.0, 4.0, 0.0, 2.0], "bins": [-0.425048828125, -0.4123115539550781, -0.39957427978515625, -0.3868370056152344, -0.3740997314453125, -0.3613624572753906, -0.34862518310546875, -0.3358879089355469, -0.323150634765625, -0.3104133605957031, -0.29767608642578125, -0.2849388122558594, -0.2722015380859375, -0.2594642639160156, -0.24672698974609375, -0.23398971557617188, -0.22125244140625, -0.20851516723632812, -0.19577789306640625, -0.18304061889648438, -0.1703033447265625, -0.15756607055664062, -0.14482879638671875, -0.13209152221679688, -0.119354248046875, -0.10661697387695312, -0.09387969970703125, -0.08114242553710938, -0.0684051513671875, -0.055667877197265625, -0.04293060302734375, -0.030193328857421875, -0.0174560546875, -0.004718780517578125, 0.00801849365234375, 0.020755767822265625, 0.0334930419921875, 0.046230316162109375, 0.05896759033203125, 0.07170486450195312, 0.084442138671875, 0.09717941284179688, 0.10991668701171875, 0.12265396118164062, 0.1353912353515625, 0.14812850952148438, 0.16086578369140625, 0.17360305786132812, 0.18634033203125, 0.19907760620117188, 0.21181488037109375, 0.22455215454101562, 0.2372894287109375, 0.2500267028808594, 0.26276397705078125, 0.2755012512207031, 0.288238525390625, 0.3009757995605469, 0.31371307373046875, 0.3264503479003906, 0.3391876220703125, 0.3519248962402344, 0.36466217041015625, 0.3773994445800781, 0.39013671875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 4.0, 1.0, 4.0, 6.0, 3.0, 3.0, 11.0, 12.0, 8.0, 11.0, 22.0, 25.0, 26.0, 35.0, 38.0, 37.0, 41.0, 47.0, 38.0, 44.0, 46.0, 1078.0, 45.0, 52.0, 45.0, 41.0, 34.0, 33.0, 34.0, 30.0, 32.0, 23.0, 24.0, 17.0, 23.0, 10.0, 11.0, 7.0, 8.0, 5.0, 7.0, 2.0, 5.0, 3.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-3.12109375, -3.0302734375, -2.939453125, -2.8486328125, -2.7578125, -2.6669921875, -2.576171875, -2.4853515625, -2.39453125, -2.3037109375, -2.212890625, -2.1220703125, -2.03125, -1.9404296875, -1.849609375, -1.7587890625, -1.66796875, -1.5771484375, -1.486328125, -1.3955078125, -1.3046875, -1.2138671875, -1.123046875, -1.0322265625, -0.94140625, -0.8505859375, -0.759765625, -0.6689453125, -0.578125, -0.4873046875, -0.396484375, -0.3056640625, -0.21484375, -0.1240234375, -0.033203125, 0.0576171875, 0.1484375, 0.2392578125, 0.330078125, 0.4208984375, 0.51171875, 0.6025390625, 0.693359375, 0.7841796875, 0.875, 0.9658203125, 1.056640625, 1.1474609375, 1.23828125, 1.3291015625, 1.419921875, 1.5107421875, 1.6015625, 1.6923828125, 1.783203125, 1.8740234375, 1.96484375, 2.0556640625, 2.146484375, 2.2373046875, 2.328125, 2.4189453125, 2.509765625, 2.6005859375, 2.69140625]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 5.0, 8.0, 7.0, 20.0, 36.0, 40.0, 74.0, 99.0, 153.0, 181.0, 370.0, 521.0, 825.0, 1233.0, 1935.0, 3094.0, 4720.0, 7783.0, 12343.0, 19309.0, 30220.0, 46341.0, 70294.0, 101726.0, 138104.0, 1176343.0, 154753.0, 108630.0, 76011.0, 50930.0, 33179.0, 21160.0, 13289.0, 8527.0, 5337.0, 3397.0, 2216.0, 1320.0, 904.0, 626.0, 372.0, 220.0, 157.0, 116.0, 74.0, 44.0, 36.0, 24.0, 11.0, 12.0, 3.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2266845703125, -0.21875953674316406, -0.21083450317382812, -0.2029094696044922, -0.19498443603515625, -0.1870594024658203, -0.17913436889648438, -0.17120933532714844, -0.1632843017578125, -0.15535926818847656, -0.14743423461914062, -0.1395092010498047, -0.13158416748046875, -0.12365913391113281, -0.11573410034179688, -0.10780906677246094, -0.099884033203125, -0.09195899963378906, -0.08403396606445312, -0.07610893249511719, -0.06818389892578125, -0.06025886535644531, -0.052333831787109375, -0.04440879821777344, -0.0364837646484375, -0.028558731079101562, -0.020633697509765625, -0.012708663940429688, -0.00478363037109375, 0.0031414031982421875, 0.011066436767578125, 0.018991470336914062, 0.02691650390625, 0.03484153747558594, 0.042766571044921875, 0.05069160461425781, 0.05861663818359375, 0.06654167175292969, 0.07446670532226562, 0.08239173889160156, 0.0903167724609375, 0.09824180603027344, 0.10616683959960938, 0.11409187316894531, 0.12201690673828125, 0.1299419403076172, 0.13786697387695312, 0.14579200744628906, 0.153717041015625, 0.16164207458496094, 0.16956710815429688, 0.1774921417236328, 0.18541717529296875, 0.1933422088623047, 0.20126724243164062, 0.20919227600097656, 0.2171173095703125, 0.22504234313964844, 0.23296737670898438, 0.2408924102783203, 0.24881744384765625, 0.2567424774169922, 0.2646675109863281, 0.27259254455566406, 0.280517578125]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 2.0, 1.0, 1.0, 4.0, 4.0, 2.0, 4.0, 2.0, 5.0, 5.0, 3.0, 8.0, 8.0, 17.0, 17.0, 32.0, 42.0, 62.0, 90.0, 131.0, 177.0, 109.0, 61.0, 48.0, 45.0, 26.0, 29.0, 8.0, 18.0, 5.0, 8.0, 1.0, 9.0, 3.0, 6.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.035064697265625, -0.034044504165649414, -0.03302431106567383, -0.03200411796569824, -0.030983924865722656, -0.02996373176574707, -0.028943538665771484, -0.0279233455657959, -0.026903152465820312, -0.025882959365844727, -0.02486276626586914, -0.023842573165893555, -0.02282238006591797, -0.021802186965942383, -0.020781993865966797, -0.01976180076599121, -0.018741607666015625, -0.01772141456604004, -0.016701221466064453, -0.015681028366088867, -0.014660835266113281, -0.013640642166137695, -0.01262044906616211, -0.011600255966186523, -0.010580062866210938, -0.009559869766235352, -0.008539676666259766, -0.00751948356628418, -0.006499290466308594, -0.005479097366333008, -0.004458904266357422, -0.003438711166381836, -0.00241851806640625, -0.001398324966430664, -0.0003781318664550781, 0.0006420612335205078, 0.0016622543334960938, 0.0026824474334716797, 0.0037026405334472656, 0.0047228336334228516, 0.0057430267333984375, 0.0067632198333740234, 0.007783412933349609, 0.008803606033325195, 0.009823799133300781, 0.010843992233276367, 0.011864185333251953, 0.012884378433227539, 0.013904571533203125, 0.014924764633178711, 0.015944957733154297, 0.016965150833129883, 0.01798534393310547, 0.019005537033081055, 0.02002573013305664, 0.021045923233032227, 0.022066116333007812, 0.0230863094329834, 0.024106502532958984, 0.02512669563293457, 0.026146888732910156, 0.027167081832885742, 0.028187274932861328, 0.029207468032836914, 0.0302276611328125]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 3.0, 6.0, 10.0, 10.0, 6.0, 5.0, 16.0, 20.0, 33.0, 38.0, 72.0, 80.0, 142.0, 477.0, 9327.0, 1019694.0, 17567.0, 550.0, 170.0, 100.0, 57.0, 43.0, 33.0, 18.0, 15.0, 11.0, 11.0, 3.0, 4.0, 5.0, 7.0, 3.0, 6.0, 2.0, 1.0, 1.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.642578125, -0.620849609375, -0.59912109375, -0.577392578125, -0.5556640625, -0.533935546875, -0.51220703125, -0.490478515625, -0.46875, -0.447021484375, -0.42529296875, -0.403564453125, -0.3818359375, -0.360107421875, -0.33837890625, -0.316650390625, -0.294921875, -0.273193359375, -0.25146484375, -0.229736328125, -0.2080078125, -0.186279296875, -0.16455078125, -0.142822265625, -0.12109375, -0.099365234375, -0.07763671875, -0.055908203125, -0.0341796875, -0.012451171875, 0.00927734375, 0.031005859375, 0.052734375, 0.074462890625, 0.09619140625, 0.117919921875, 0.1396484375, 0.161376953125, 0.18310546875, 0.204833984375, 0.2265625, 0.248291015625, 0.27001953125, 0.291748046875, 0.3134765625, 0.335205078125, 0.35693359375, 0.378662109375, 0.400390625, 0.422119140625, 0.44384765625, 0.465576171875, 0.4873046875, 0.509033203125, 0.53076171875, 0.552490234375, 0.57421875, 0.595947265625, 0.61767578125, 0.639404296875, 0.6611328125, 0.682861328125, 0.70458984375, 0.726318359375, 0.748046875]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 6.0, 11.0, 20.0, 28.0, 54.0, 83.0, 139.0, 315.0, 195.0, 73.0, 34.0, 21.0, 14.0, 6.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17712287604808807, -0.17362652719020844, -0.1701301783323288, -0.16663382947444916, -0.16313748061656952, -0.15964113175868988, -0.15614478290081024, -0.1526484191417694, -0.14915207028388977, -0.14565572142601013, -0.1421593725681305, -0.13866302371025085, -0.13516667485237122, -0.13167032599449158, -0.12817397713661194, -0.1246776208281517, -0.12118127942085266, -0.11768493056297302, -0.11418858170509338, -0.11069223284721375, -0.1071958839893341, -0.10369953513145447, -0.10020317882299423, -0.0967068299651146, -0.09321048110723495, -0.08971413224935532, -0.08621778339147568, -0.08272143453359604, -0.0792250782251358, -0.07572872936725616, -0.07223238050937653, -0.06873603165149689, -0.06523968279361725, -0.06174333393573761, -0.05824698507785797, -0.054750632494688034, -0.051254283636808395, -0.04775793477892876, -0.04426158219575882, -0.04076523333787918, -0.037268880754709244, -0.033772531896829605, -0.030276181176304817, -0.02677983045578003, -0.02328348159790039, -0.019787132740020752, -0.016290782019495964, -0.012794431298971176, -0.009298082441091537, -0.005801732651889324, -0.002305382862687111, 0.0011909669265151024, 0.004687316715717316, 0.008183665573596954, 0.011680016294121742, 0.01517636701464653, 0.01867271587252617, 0.022169064730405807, 0.025665415450930595, 0.029161766171455383, 0.03265811502933502, 0.03615446388721466, 0.0396508127450943, 0.043147165328264236, 0.046643514186143875]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 7.0, 6.0, 10.0, 8.0, 12.0, 18.0, 20.0, 15.0, 19.0, 19.0, 30.0, 32.0, 34.0, 26.0, 33.0, 47.0, 32.0, 36.0, 47.0, 29.0, 50.0, 41.0, 43.0, 28.0, 29.0, 30.0, 35.0, 29.0, 37.0, 24.0, 26.0, 20.0, 19.0, 15.0, 18.0, 8.0, 16.0, 18.0, 8.0, 8.0, 8.0, 4.0, 4.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 4.0], "bins": [-0.04727530479431152, -0.045874178409576416, -0.04447305202484131, -0.0430719256401062, -0.041670799255371094, -0.040269672870635986, -0.03886854648590088, -0.03746742010116577, -0.036066293716430664, -0.03466516733169556, -0.03326404094696045, -0.03186291456222534, -0.030461788177490234, -0.029060661792755127, -0.02765953540802002, -0.026258409023284912, -0.024857282638549805, -0.023456156253814697, -0.02205502986907959, -0.020653903484344482, -0.019252777099609375, -0.017851650714874268, -0.01645052433013916, -0.015049397945404053, -0.013648271560668945, -0.012247145175933838, -0.01084601879119873, -0.009444892406463623, -0.008043766021728516, -0.006642639636993408, -0.005241513252258301, -0.0038403868675231934, -0.002439260482788086, -0.0010381340980529785, 0.0003629922866821289, 0.0017641186714172363, 0.0031652450561523438, 0.004566371440887451, 0.005967497825622559, 0.007368624210357666, 0.008769750595092773, 0.01017087697982788, 0.011572003364562988, 0.012973129749298096, 0.014374256134033203, 0.01577538251876831, 0.017176508903503418, 0.018577635288238525, 0.019978761672973633, 0.02137988805770874, 0.022781014442443848, 0.024182140827178955, 0.025583267211914062, 0.02698439359664917, 0.028385519981384277, 0.029786646366119385, 0.031187772750854492, 0.0325888991355896, 0.03399002552032471, 0.035391151905059814, 0.03679227828979492, 0.03819340467453003, 0.03959453105926514, 0.040995657444000244, 0.04239678382873535]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 0.0, 4.0, 5.0, 8.0, 9.0, 6.0, 13.0, 10.0, 13.0, 16.0, 17.0, 20.0, 25.0, 23.0, 29.0, 24.0, 26.0, 28.0, 38.0, 35.0, 40.0, 38.0, 38.0, 46.0, 38.0, 43.0, 31.0, 37.0, 31.0, 33.0, 32.0, 31.0, 19.0, 32.0, 21.0, 24.0, 20.0, 14.0, 10.0, 15.0, 17.0, 11.0, 11.0, 5.0, 8.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.884765625, -3.76654052734375, -3.6483154296875, -3.53009033203125, -3.411865234375, -3.29364013671875, -3.1754150390625, -3.05718994140625, -2.93896484375, -2.82073974609375, -2.7025146484375, -2.58428955078125, -2.466064453125, -2.34783935546875, -2.2296142578125, -2.11138916015625, -1.9931640625, -1.87493896484375, -1.7567138671875, -1.63848876953125, -1.520263671875, -1.40203857421875, -1.2838134765625, -1.16558837890625, -1.04736328125, -0.92913818359375, -0.8109130859375, -0.69268798828125, -0.574462890625, -0.45623779296875, -0.3380126953125, -0.21978759765625, -0.1015625, 0.01666259765625, 0.1348876953125, 0.25311279296875, 0.371337890625, 0.48956298828125, 0.6077880859375, 0.72601318359375, 0.84423828125, 0.96246337890625, 1.0806884765625, 1.19891357421875, 1.317138671875, 1.43536376953125, 1.5535888671875, 1.67181396484375, 1.7900390625, 1.90826416015625, 2.0264892578125, 2.14471435546875, 2.262939453125, 2.38116455078125, 2.4993896484375, 2.61761474609375, 2.73583984375, 2.85406494140625, 2.9722900390625, 3.09051513671875, 3.208740234375, 3.32696533203125, 3.4451904296875, 3.56341552734375, 3.681640625]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 2.0, 2.0, 6.0, 8.0, 12.0, 14.0, 19.0, 26.0, 36.0, 48.0, 69.0, 119.0, 154.0, 253.0, 446.0, 743.0, 1150.0, 1855.0, 3204.0, 5452.0, 10461.0, 21831.0, 50512.0, 134559.0, 368861.0, 275447.0, 97842.0, 38507.0, 17099.0, 8409.0, 4460.0, 2565.0, 1658.0, 976.0, 615.0, 390.0, 249.0, 169.0, 98.0, 54.0, 53.0, 39.0, 23.0, 23.0, 11.0, 9.0, 9.0, 3.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.65234375, -3.5411376953125, -3.429931640625, -3.3187255859375, -3.20751953125, -3.0963134765625, -2.985107421875, -2.8739013671875, -2.7626953125, -2.6514892578125, -2.540283203125, -2.4290771484375, -2.31787109375, -2.2066650390625, -2.095458984375, -1.9842529296875, -1.873046875, -1.7618408203125, -1.650634765625, -1.5394287109375, -1.42822265625, -1.3170166015625, -1.205810546875, -1.0946044921875, -0.9833984375, -0.8721923828125, -0.760986328125, -0.6497802734375, -0.53857421875, -0.4273681640625, -0.316162109375, -0.2049560546875, -0.09375, 0.0174560546875, 0.128662109375, 0.2398681640625, 0.35107421875, 0.4622802734375, 0.573486328125, 0.6846923828125, 0.7958984375, 0.9071044921875, 1.018310546875, 1.1295166015625, 1.24072265625, 1.3519287109375, 1.463134765625, 1.5743408203125, 1.685546875, 1.7967529296875, 1.907958984375, 2.0191650390625, 2.13037109375, 2.2415771484375, 2.352783203125, 2.4639892578125, 2.5751953125, 2.6864013671875, 2.797607421875, 2.9088134765625, 3.02001953125, 3.1312255859375, 3.242431640625, 3.3536376953125, 3.46484375]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 4.0, 5.0, 9.0, 12.0, 13.0, 9.0, 9.0, 18.0, 13.0, 35.0, 34.0, 37.0, 33.0, 44.0, 37.0, 59.0, 83.0, 199.0, 1589.0, 278.0, 93.0, 59.0, 46.0, 38.0, 45.0, 32.0, 43.0, 34.0, 21.0, 18.0, 10.0, 20.0, 12.0, 10.0, 13.0, 10.0, 3.0, 5.0, 3.0, 5.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-15.5234375, -15.0616455078125, -14.599853515625, -14.1380615234375, -13.67626953125, -13.2144775390625, -12.752685546875, -12.2908935546875, -11.8291015625, -11.3673095703125, -10.905517578125, -10.4437255859375, -9.98193359375, -9.5201416015625, -9.058349609375, -8.5965576171875, -8.134765625, -7.6729736328125, -7.211181640625, -6.7493896484375, -6.28759765625, -5.8258056640625, -5.364013671875, -4.9022216796875, -4.4404296875, -3.9786376953125, -3.516845703125, -3.0550537109375, -2.59326171875, -2.1314697265625, -1.669677734375, -1.2078857421875, -0.74609375, -0.2843017578125, 0.177490234375, 0.6392822265625, 1.10107421875, 1.5628662109375, 2.024658203125, 2.4864501953125, 2.9482421875, 3.4100341796875, 3.871826171875, 4.3336181640625, 4.79541015625, 5.2572021484375, 5.718994140625, 6.1807861328125, 6.642578125, 7.1043701171875, 7.566162109375, 8.0279541015625, 8.48974609375, 8.9515380859375, 9.413330078125, 9.8751220703125, 10.3369140625, 10.7987060546875, 11.260498046875, 11.7222900390625, 12.18408203125, 12.6458740234375, 13.107666015625, 13.5694580078125, 14.03125]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 3.0, 5.0, 6.0, 6.0, 4.0, 12.0, 18.0, 19.0, 24.0, 28.0, 33.0, 59.0, 90.0, 136.0, 158.0, 248.0, 358.0, 956.0, 6847.0, 2628893.0, 501566.0, 4418.0, 732.0, 311.0, 214.0, 166.0, 102.0, 82.0, 49.0, 39.0, 22.0, 21.0, 21.0, 14.0, 7.0, 10.0, 5.0, 7.0, 6.0, 3.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-39.125, -38.00439453125, -36.8837890625, -35.76318359375, -34.642578125, -33.52197265625, -32.4013671875, -31.28076171875, -30.16015625, -29.03955078125, -27.9189453125, -26.79833984375, -25.677734375, -24.55712890625, -23.4365234375, -22.31591796875, -21.1953125, -20.07470703125, -18.9541015625, -17.83349609375, -16.712890625, -15.59228515625, -14.4716796875, -13.35107421875, -12.23046875, -11.10986328125, -9.9892578125, -8.86865234375, -7.748046875, -6.62744140625, -5.5068359375, -4.38623046875, -3.265625, -2.14501953125, -1.0244140625, 0.09619140625, 1.216796875, 2.33740234375, 3.4580078125, 4.57861328125, 5.69921875, 6.81982421875, 7.9404296875, 9.06103515625, 10.181640625, 11.30224609375, 12.4228515625, 13.54345703125, 14.6640625, 15.78466796875, 16.9052734375, 18.02587890625, 19.146484375, 20.26708984375, 21.3876953125, 22.50830078125, 23.62890625, 24.74951171875, 25.8701171875, 26.99072265625, 28.111328125, 29.23193359375, 30.3525390625, 31.47314453125, 32.59375]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 74.0, 885.0, 61.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-281.42095947265625, -276.25244140625, -271.08392333984375, -265.9154052734375, -260.7468566894531, -255.57833862304688, -250.40982055664062, -245.24130249023438, -240.07278442382812, -234.90426635742188, -229.73573303222656, -224.5672149658203, -219.39869689941406, -214.23016357421875, -209.0616455078125, -203.89312744140625, -198.72459411621094, -193.5560760498047, -188.38754272460938, -183.21902465820312, -178.05050659179688, -172.88198852539062, -167.7134552001953, -162.54493713378906, -157.37640380859375, -152.2078857421875, -147.0393524169922, -141.87083435058594, -136.7023162841797, -131.53378295898438, -126.36526489257812, -121.19674682617188, -116.02821350097656, -110.85968780517578, -105.69116973876953, -100.52264404296875, -95.3541259765625, -90.18560028076172, -85.01707458496094, -79.84855651855469, -74.68003845214844, -69.51151275634766, -64.3429946899414, -59.174468994140625, -54.00594711303711, -48.837425231933594, -43.66889953613281, -38.5003776550293, -33.331851959228516, -28.163330078125, -22.99480628967285, -17.826282501220703, -12.657760620117188, -7.489238739013672, -2.3207149505615234, 2.847808837890625, 8.01633071899414, 13.184853553771973, 18.353376388549805, 23.521900177001953, 28.69042205810547, 33.858943939208984, 39.0274658203125, 44.19599151611328, 49.3645133972168]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 7.0, 4.0, 9.0, 12.0, 12.0, 7.0, 9.0, 19.0, 15.0, 17.0, 19.0, 20.0, 33.0, 26.0, 40.0, 24.0, 25.0, 35.0, 31.0, 43.0, 44.0, 54.0, 37.0, 52.0, 51.0, 40.0, 39.0, 38.0, 28.0, 28.0, 28.0, 19.0, 26.0, 20.0, 17.0, 15.0, 15.0, 9.0, 14.0, 6.0, 8.0, 6.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 0.0, 3.0], "bins": [-40.91716766357422, -39.75961685180664, -38.6020622253418, -37.44451141357422, -36.28696060180664, -35.12940979003906, -33.97185516357422, -32.81430435180664, -31.656753540039062, -30.49920082092285, -29.341650009155273, -28.184097290039062, -27.026546478271484, -25.868993759155273, -24.711441040039062, -23.553890228271484, -22.396337509155273, -21.238784790039062, -20.081233978271484, -18.923681259155273, -17.766130447387695, -16.608577728271484, -15.45102596282959, -14.293474197387695, -13.1359224319458, -11.978370666503906, -10.820818901062012, -9.663267135620117, -8.505714416503906, -7.34816312789917, -6.190610885620117, -5.033059120178223, -3.875507354736328, -2.7179555892944336, -1.56040358543396, -0.40285158157348633, 0.7547001838684082, 1.9122519493103027, 3.0698041915893555, 4.22735595703125, 5.3849077224731445, 6.542459487915039, 7.700011253356934, 8.857563018798828, 10.015115737915039, 11.172666549682617, 12.330219268798828, 13.487771034240723, 14.645322799682617, 15.802874565124512, 16.960426330566406, 18.117979049682617, 19.275529861450195, 20.433082580566406, 21.590633392333984, 22.748186111450195, 23.905738830566406, 25.063291549682617, 26.220842361450195, 27.378395080566406, 28.535945892333984, 29.693498611450195, 30.851051330566406, 32.008602142333984, 33.16615295410156]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 3.0, 4.0, 4.0, 7.0, 6.0, 12.0, 8.0, 8.0, 7.0, 17.0, 16.0, 17.0, 20.0, 25.0, 21.0, 27.0, 24.0, 31.0, 29.0, 33.0, 34.0, 38.0, 51.0, 40.0, 45.0, 27.0, 34.0, 43.0, 22.0, 31.0, 27.0, 28.0, 29.0, 32.0, 27.0, 22.0, 23.0, 21.0, 19.0, 13.0, 23.0, 10.0, 6.0, 14.0, 11.0, 2.0, 6.0, 6.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-3.9453125, -3.82550048828125, -3.7056884765625, -3.58587646484375, -3.466064453125, -3.34625244140625, -3.2264404296875, -3.10662841796875, -2.98681640625, -2.86700439453125, -2.7471923828125, -2.62738037109375, -2.507568359375, -2.38775634765625, -2.2679443359375, -2.14813232421875, -2.0283203125, -1.90850830078125, -1.7886962890625, -1.66888427734375, -1.549072265625, -1.42926025390625, -1.3094482421875, -1.18963623046875, -1.06982421875, -0.95001220703125, -0.8302001953125, -0.71038818359375, -0.590576171875, -0.47076416015625, -0.3509521484375, -0.23114013671875, -0.111328125, 0.00848388671875, 0.1282958984375, 0.24810791015625, 0.367919921875, 0.48773193359375, 0.6075439453125, 0.72735595703125, 0.84716796875, 0.96697998046875, 1.0867919921875, 1.20660400390625, 1.326416015625, 1.44622802734375, 1.5660400390625, 1.68585205078125, 1.8056640625, 1.92547607421875, 2.0452880859375, 2.16510009765625, 2.284912109375, 2.40472412109375, 2.5245361328125, 2.64434814453125, 2.76416015625, 2.88397216796875, 3.0037841796875, 3.12359619140625, 3.243408203125, 3.36322021484375, 3.4830322265625, 3.60284423828125, 3.72265625]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 7.0, 5.0, 6.0, 7.0, 11.0, 9.0, 13.0, 21.0, 27.0, 23.0, 27.0, 37.0, 62.0, 49.0, 68.0, 114.0, 196.0, 338.0, 587.0, 1374.0, 3702.0, 11860.0, 43570.0, 200335.0, 1015223.0, 1993985.0, 735719.0, 140008.0, 32167.0, 9077.0, 2992.0, 1197.0, 553.0, 286.0, 156.0, 94.0, 73.0, 52.0, 42.0, 57.0, 35.0, 23.0, 22.0, 12.0, 21.0, 16.0, 6.0, 7.0, 6.0, 3.0, 6.0, 5.0, 1.0, 0.0, 0.0, 2.0], "bins": [-7.921875, -7.68463134765625, -7.4473876953125, -7.21014404296875, -6.972900390625, -6.73565673828125, -6.4984130859375, -6.26116943359375, -6.02392578125, -5.78668212890625, -5.5494384765625, -5.31219482421875, -5.074951171875, -4.83770751953125, -4.6004638671875, -4.36322021484375, -4.1259765625, -3.88873291015625, -3.6514892578125, -3.41424560546875, -3.177001953125, -2.93975830078125, -2.7025146484375, -2.46527099609375, -2.22802734375, -1.99078369140625, -1.7535400390625, -1.51629638671875, -1.279052734375, -1.04180908203125, -0.8045654296875, -0.56732177734375, -0.330078125, -0.09283447265625, 0.1444091796875, 0.38165283203125, 0.618896484375, 0.85614013671875, 1.0933837890625, 1.33062744140625, 1.56787109375, 1.80511474609375, 2.0423583984375, 2.27960205078125, 2.516845703125, 2.75408935546875, 2.9913330078125, 3.22857666015625, 3.4658203125, 3.70306396484375, 3.9403076171875, 4.17755126953125, 4.414794921875, 4.65203857421875, 4.8892822265625, 5.12652587890625, 5.36376953125, 5.60101318359375, 5.8382568359375, 6.07550048828125, 6.312744140625, 6.54998779296875, 6.7872314453125, 7.02447509765625, 7.26171875]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 2.0, 6.0, 9.0, 10.0, 7.0, 12.0, 15.0, 26.0, 37.0, 49.0, 59.0, 72.0, 110.0, 173.0, 219.0, 275.0, 369.0, 465.0, 448.0, 403.0, 346.0, 280.0, 191.0, 152.0, 96.0, 63.0, 56.0, 42.0, 19.0, 17.0, 16.0, 8.0, 8.0, 10.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.015625, -10.72039794921875, -10.4251708984375, -10.12994384765625, -9.834716796875, -9.53948974609375, -9.2442626953125, -8.94903564453125, -8.65380859375, -8.35858154296875, -8.0633544921875, -7.76812744140625, -7.472900390625, -7.17767333984375, -6.8824462890625, -6.58721923828125, -6.2919921875, -5.99676513671875, -5.7015380859375, -5.40631103515625, -5.111083984375, -4.81585693359375, -4.5206298828125, -4.22540283203125, -3.93017578125, -3.63494873046875, -3.3397216796875, -3.04449462890625, -2.749267578125, -2.45404052734375, -2.1588134765625, -1.86358642578125, -1.568359375, -1.27313232421875, -0.9779052734375, -0.68267822265625, -0.387451171875, -0.09222412109375, 0.2030029296875, 0.49822998046875, 0.79345703125, 1.08868408203125, 1.3839111328125, 1.67913818359375, 1.974365234375, 2.26959228515625, 2.5648193359375, 2.86004638671875, 3.1552734375, 3.45050048828125, 3.7457275390625, 4.04095458984375, 4.336181640625, 4.63140869140625, 4.9266357421875, 5.22186279296875, 5.51708984375, 5.81231689453125, 6.1075439453125, 6.40277099609375, 6.697998046875, 6.99322509765625, 7.2884521484375, 7.58367919921875, 7.87890625]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 9.0, 8.0, 12.0, 8.0, 18.0, 27.0, 46.0, 55.0, 73.0, 137.0, 213.0, 290.0, 538.0, 1459.0, 29366.0, 3906022.0, 251286.0, 2908.0, 709.0, 354.0, 256.0, 149.0, 94.0, 80.0, 48.0, 34.0, 21.0, 16.0, 10.0, 17.0, 4.0, 10.0, 6.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.6875, -40.283203125, -38.87890625, -37.474609375, -36.0703125, -34.666015625, -33.26171875, -31.857421875, -30.453125, -29.048828125, -27.64453125, -26.240234375, -24.8359375, -23.431640625, -22.02734375, -20.623046875, -19.21875, -17.814453125, -16.41015625, -15.005859375, -13.6015625, -12.197265625, -10.79296875, -9.388671875, -7.984375, -6.580078125, -5.17578125, -3.771484375, -2.3671875, -0.962890625, 0.44140625, 1.845703125, 3.25, 4.654296875, 6.05859375, 7.462890625, 8.8671875, 10.271484375, 11.67578125, 13.080078125, 14.484375, 15.888671875, 17.29296875, 18.697265625, 20.1015625, 21.505859375, 22.91015625, 24.314453125, 25.71875, 27.123046875, 28.52734375, 29.931640625, 31.3359375, 32.740234375, 34.14453125, 35.548828125, 36.953125, 38.357421875, 39.76171875, 41.166015625, 42.5703125, 43.974609375, 45.37890625, 46.783203125, 48.1875]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 22.0, 117.0, 375.0, 354.0, 130.0, 18.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-277.0457763671875, -271.2831115722656, -265.5204772949219, -259.7578125, -253.9951629638672, -248.23251342773438, -242.4698486328125, -236.7071990966797, -230.94454956054688, -225.18190002441406, -219.4192352294922, -213.65658569335938, -207.89393615722656, -202.13128662109375, -196.36862182617188, -190.60597229003906, -184.8433074951172, -179.08065795898438, -173.3179931640625, -167.5553436279297, -161.79269409179688, -156.030029296875, -150.2673797607422, -144.50473022460938, -138.7420654296875, -132.9794158935547, -127.21675872802734, -121.4541015625, -115.69145202636719, -109.92879486083984, -104.1661376953125, -98.40348815917969, -92.64083862304688, -86.87818145751953, -81.11553192138672, -75.35287475585938, -69.59022521972656, -63.82756805419922, -58.064910888671875, -52.3022575378418, -46.53960418701172, -40.77695083618164, -35.01429748535156, -29.25164031982422, -23.48898696899414, -17.726333618164062, -11.963676452636719, -6.201023101806641, -0.4383697509765625, 5.324284553527832, 11.086938858032227, 16.849594116210938, 22.612247467041016, 28.374900817871094, 34.13755798339844, 39.900211334228516, 45.662864685058594, 51.42551803588867, 57.18817138671875, 62.950828552246094, 68.71348571777344, 74.47613525390625, 80.2387924194336, 86.00144958496094, 91.76409912109375]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 8.0, 3.0, 3.0, 7.0, 10.0, 10.0, 14.0, 8.0, 10.0, 28.0, 8.0, 15.0, 29.0, 19.0, 38.0, 19.0, 38.0, 47.0, 38.0, 37.0, 48.0, 41.0, 38.0, 35.0, 46.0, 34.0, 49.0, 38.0, 43.0, 26.0, 42.0, 35.0, 30.0, 20.0, 14.0, 12.0, 16.0, 10.0, 10.0, 6.0, 5.0, 5.0, 3.0, 5.0, 2.0, 0.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-31.287445068359375, -30.28133773803711, -29.275232315063477, -28.26912498474121, -27.263019561767578, -26.256912231445312, -25.250804901123047, -24.24469757080078, -23.23859214782715, -22.232484817504883, -21.22637939453125, -20.220272064208984, -19.21416473388672, -18.208059310913086, -17.20195198059082, -16.195846557617188, -15.189739227294922, -14.183632850646973, -13.177526473999023, -12.171419143676758, -11.165312767028809, -10.15920639038086, -9.153099060058594, -8.146992683410645, -7.140886306762695, -6.134779930114746, -5.128673076629639, -4.122566223144531, -3.116459846496582, -2.110353469848633, -1.1042466163635254, -0.09813976287841797, 0.9079666137695312, 1.9140732288360596, 2.920179843902588, 3.926286458969116, 4.9323930740356445, 5.938499450683594, 6.944606304168701, 7.950713157653809, 8.956819534301758, 9.962925910949707, 10.969032287597656, 11.975139617919922, 12.981245994567871, 13.98735237121582, 14.993459701538086, 15.999566078186035, 17.005672454833984, 18.01177978515625, 19.017885208129883, 20.02399253845215, 21.03009796142578, 22.036205291748047, 23.042312622070312, 24.048419952392578, 25.05452537536621, 26.060632705688477, 27.06673812866211, 28.072845458984375, 29.07895278930664, 30.085058212280273, 31.09116554260254, 32.09727096557617, 33.10337829589844]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 6.0, 2.0, 1.0, 0.0, 2.0, 7.0, 1.0, 3.0, 10.0, 8.0, 12.0, 10.0, 14.0, 20.0, 20.0, 18.0, 17.0, 24.0, 21.0, 22.0, 20.0, 26.0, 32.0, 37.0, 25.0, 38.0, 31.0, 30.0, 34.0, 37.0, 39.0, 30.0, 29.0, 38.0, 28.0, 33.0, 28.0, 40.0, 27.0, 24.0, 28.0, 20.0, 14.0, 13.0, 11.0, 10.0, 13.0, 8.0, 5.0, 12.0, 4.0, 5.0, 6.0, 4.0, 6.0, 3.0, 1.0, 3.0, 3.0, 4.0, 2.0], "bins": [-3.60546875, -3.493804931640625, -3.38214111328125, -3.270477294921875, -3.1588134765625, -3.047149658203125, -2.93548583984375, -2.823822021484375, -2.712158203125, -2.600494384765625, -2.48883056640625, -2.377166748046875, -2.2655029296875, -2.153839111328125, -2.04217529296875, -1.930511474609375, -1.81884765625, -1.707183837890625, -1.59552001953125, -1.483856201171875, -1.3721923828125, -1.260528564453125, -1.14886474609375, -1.037200927734375, -0.925537109375, -0.813873291015625, -0.70220947265625, -0.590545654296875, -0.4788818359375, -0.367218017578125, -0.25555419921875, -0.143890380859375, -0.0322265625, 0.079437255859375, 0.19110107421875, 0.302764892578125, 0.4144287109375, 0.526092529296875, 0.63775634765625, 0.749420166015625, 0.861083984375, 0.972747802734375, 1.08441162109375, 1.196075439453125, 1.3077392578125, 1.419403076171875, 1.53106689453125, 1.642730712890625, 1.75439453125, 1.866058349609375, 1.97772216796875, 2.089385986328125, 2.2010498046875, 2.312713623046875, 2.42437744140625, 2.536041259765625, 2.647705078125, 2.759368896484375, 2.87103271484375, 2.982696533203125, 3.0943603515625, 3.206024169921875, 3.31768798828125, 3.429351806640625, 3.541015625]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 4.0, 7.0, 8.0, 11.0, 26.0, 33.0, 61.0, 98.0, 135.0, 209.0, 308.0, 444.0, 730.0, 1125.0, 1616.0, 2604.0, 4050.0, 6291.0, 9553.0, 14970.0, 23554.0, 36533.0, 55399.0, 82775.0, 117549.0, 151257.0, 154780.0, 124122.0, 88668.0, 60674.0, 39521.0, 25257.0, 16396.0, 10657.0, 6784.0, 4326.0, 2800.0, 1806.0, 1169.0, 810.0, 478.0, 344.0, 220.0, 132.0, 108.0, 55.0, 44.0, 21.0, 13.0, 12.0, 8.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.415771484375, -0.4028167724609375, -0.389862060546875, -0.3769073486328125, -0.36395263671875, -0.3509979248046875, -0.338043212890625, -0.3250885009765625, -0.3121337890625, -0.2991790771484375, -0.286224365234375, -0.2732696533203125, -0.26031494140625, -0.2473602294921875, -0.234405517578125, -0.2214508056640625, -0.20849609375, -0.1955413818359375, -0.182586669921875, -0.1696319580078125, -0.15667724609375, -0.1437225341796875, -0.130767822265625, -0.1178131103515625, -0.1048583984375, -0.0919036865234375, -0.078948974609375, -0.0659942626953125, -0.05303955078125, -0.0400848388671875, -0.027130126953125, -0.0141754150390625, -0.001220703125, 0.0117340087890625, 0.024688720703125, 0.0376434326171875, 0.05059814453125, 0.0635528564453125, 0.076507568359375, 0.0894622802734375, 0.1024169921875, 0.1153717041015625, 0.128326416015625, 0.1412811279296875, 0.15423583984375, 0.1671905517578125, 0.180145263671875, 0.1930999755859375, 0.2060546875, 0.2190093994140625, 0.231964111328125, 0.2449188232421875, 0.25787353515625, 0.2708282470703125, 0.283782958984375, 0.2967376708984375, 0.3096923828125, 0.3226470947265625, 0.335601806640625, 0.3485565185546875, 0.36151123046875, 0.3744659423828125, 0.387420654296875, 0.4003753662109375, 0.413330078125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 7.0, 8.0, 8.0, 6.0, 8.0, 9.0, 14.0, 19.0, 14.0, 23.0, 27.0, 15.0, 25.0, 27.0, 34.0, 38.0, 31.0, 29.0, 47.0, 41.0, 50.0, 1054.0, 41.0, 40.0, 45.0, 38.0, 36.0, 28.0, 39.0, 36.0, 21.0, 26.0, 22.0, 15.0, 18.0, 15.0, 20.0, 12.0, 8.0, 6.0, 9.0, 5.0, 5.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.796875, -2.71136474609375, -2.6258544921875, -2.54034423828125, -2.454833984375, -2.36932373046875, -2.2838134765625, -2.19830322265625, -2.11279296875, -2.02728271484375, -1.9417724609375, -1.85626220703125, -1.770751953125, -1.68524169921875, -1.5997314453125, -1.51422119140625, -1.4287109375, -1.34320068359375, -1.2576904296875, -1.17218017578125, -1.086669921875, -1.00115966796875, -0.9156494140625, -0.83013916015625, -0.74462890625, -0.65911865234375, -0.5736083984375, -0.48809814453125, -0.402587890625, -0.31707763671875, -0.2315673828125, -0.14605712890625, -0.060546875, 0.02496337890625, 0.1104736328125, 0.19598388671875, 0.281494140625, 0.36700439453125, 0.4525146484375, 0.53802490234375, 0.62353515625, 0.70904541015625, 0.7945556640625, 0.88006591796875, 0.965576171875, 1.05108642578125, 1.1365966796875, 1.22210693359375, 1.3076171875, 1.39312744140625, 1.4786376953125, 1.56414794921875, 1.649658203125, 1.73516845703125, 1.8206787109375, 1.90618896484375, 1.99169921875, 2.07720947265625, 2.1627197265625, 2.24822998046875, 2.333740234375, 2.41925048828125, 2.5047607421875, 2.59027099609375, 2.67578125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 4.0, 9.0, 6.0, 13.0, 10.0, 18.0, 25.0, 47.0, 73.0, 93.0, 175.0, 246.0, 390.0, 622.0, 959.0, 1587.0, 2425.0, 3929.0, 6503.0, 10343.0, 16933.0, 27612.0, 44191.0, 69523.0, 103879.0, 144191.0, 1200756.0, 152990.0, 110451.0, 74342.0, 47366.0, 29425.0, 18573.0, 11152.0, 6900.0, 4332.0, 2650.0, 1567.0, 1045.0, 597.0, 413.0, 250.0, 165.0, 121.0, 87.0, 56.0, 35.0, 17.0, 11.0, 16.0, 9.0, 6.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.265625, -0.2569389343261719, -0.24825286865234375, -0.23956680297851562, -0.2308807373046875, -0.22219467163085938, -0.21350860595703125, -0.20482254028320312, -0.196136474609375, -0.18745040893554688, -0.17876434326171875, -0.17007827758789062, -0.1613922119140625, -0.15270614624023438, -0.14402008056640625, -0.13533401489257812, -0.12664794921875, -0.11796188354492188, -0.10927581787109375, -0.10058975219726562, -0.0919036865234375, -0.08321762084960938, -0.07453155517578125, -0.06584548950195312, -0.057159423828125, -0.048473358154296875, -0.03978729248046875, -0.031101226806640625, -0.0224151611328125, -0.013729095458984375, -0.00504302978515625, 0.003643035888671875, 0.0123291015625, 0.021015167236328125, 0.02970123291015625, 0.038387298583984375, 0.0470733642578125, 0.055759429931640625, 0.06444549560546875, 0.07313156127929688, 0.081817626953125, 0.09050369262695312, 0.09918975830078125, 0.10787582397460938, 0.1165618896484375, 0.12524795532226562, 0.13393402099609375, 0.14262008666992188, 0.15130615234375, 0.15999221801757812, 0.16867828369140625, 0.17736434936523438, 0.1860504150390625, 0.19473648071289062, 0.20342254638671875, 0.21210861206054688, 0.220794677734375, 0.22948074340820312, 0.23816680908203125, 0.24685287475585938, 0.2555389404296875, 0.2642250061035156, 0.27291107177734375, 0.2815971374511719, 0.290283203125]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 5.0, 2.0, 2.0, 2.0, 3.0, 8.0, 4.0, 4.0, 10.0, 10.0, 8.0, 17.0, 11.0, 13.0, 20.0, 22.0, 36.0, 31.0, 48.0, 64.0, 63.0, 89.0, 112.0, 85.0, 54.0, 45.0, 50.0, 31.0, 23.0, 18.0, 13.0, 12.0, 8.0, 10.0, 10.0, 10.0, 6.0, 10.0, 5.0, 4.0, 7.0, 5.0, 4.0, 5.0, 1.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0175933837890625, -0.017015457153320312, -0.016437530517578125, -0.015859603881835938, -0.01528167724609375, -0.014703750610351562, -0.014125823974609375, -0.013547897338867188, -0.012969970703125, -0.012392044067382812, -0.011814117431640625, -0.011236190795898438, -0.01065826416015625, -0.010080337524414062, -0.009502410888671875, -0.008924484252929688, -0.0083465576171875, -0.0077686309814453125, -0.007190704345703125, -0.0066127777099609375, -0.00603485107421875, -0.0054569244384765625, -0.004878997802734375, -0.0043010711669921875, -0.00372314453125, -0.0031452178955078125, -0.002567291259765625, -0.0019893646240234375, -0.00141143798828125, -0.0008335113525390625, -0.000255584716796875, 0.0003223419189453125, 0.0009002685546875, 0.0014781951904296875, 0.002056121826171875, 0.0026340484619140625, 0.00321197509765625, 0.0037899017333984375, 0.004367828369140625, 0.0049457550048828125, 0.005523681640625, 0.0061016082763671875, 0.006679534912109375, 0.0072574615478515625, 0.00783538818359375, 0.008413314819335938, 0.008991241455078125, 0.009569168090820312, 0.0101470947265625, 0.010725021362304688, 0.011302947998046875, 0.011880874633789062, 0.01245880126953125, 0.013036727905273438, 0.013614654541015625, 0.014192581176757812, 0.0147705078125, 0.015348434448242188, 0.015926361083984375, 0.016504287719726562, 0.01708221435546875, 0.017660140991210938, 0.018238067626953125, 0.018815994262695312, 0.0193939208984375]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 5.0, 4.0, 6.0, 3.0, 6.0, 9.0, 7.0, 7.0, 9.0, 9.0, 17.0, 13.0, 16.0, 13.0, 39.0, 30.0, 60.0, 93.0, 121.0, 438.0, 5005.0, 1021423.0, 20005.0, 624.0, 194.0, 105.0, 62.0, 39.0, 31.0, 33.0, 19.0, 23.0, 13.0, 12.0, 12.0, 8.0, 7.0, 5.0, 7.0, 4.0, 4.0, 1.0, 4.0, 4.0, 1.0, 3.0, 0.0, 4.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.4560546875, -0.4424934387207031, -0.42893218994140625, -0.4153709411621094, -0.4018096923828125, -0.3882484436035156, -0.37468719482421875, -0.3611259460449219, -0.347564697265625, -0.3340034484863281, -0.32044219970703125, -0.3068809509277344, -0.2933197021484375, -0.2797584533691406, -0.26619720458984375, -0.2526359558105469, -0.23907470703125, -0.22551345825195312, -0.21195220947265625, -0.19839096069335938, -0.1848297119140625, -0.17126846313476562, -0.15770721435546875, -0.14414596557617188, -0.130584716796875, -0.11702346801757812, -0.10346221923828125, -0.08990097045898438, -0.0763397216796875, -0.06277847290039062, -0.04921722412109375, -0.035655975341796875, -0.0220947265625, -0.008533477783203125, 0.00502777099609375, 0.018589019775390625, 0.0321502685546875, 0.045711517333984375, 0.05927276611328125, 0.07283401489257812, 0.086395263671875, 0.09995651245117188, 0.11351776123046875, 0.12707901000976562, 0.1406402587890625, 0.15420150756835938, 0.16776275634765625, 0.18132400512695312, 0.19488525390625, 0.20844650268554688, 0.22200775146484375, 0.23556900024414062, 0.2491302490234375, 0.2626914978027344, 0.27625274658203125, 0.2898139953613281, 0.303375244140625, 0.3169364929199219, 0.33049774169921875, 0.3440589904785156, 0.3576202392578125, 0.3711814880371094, 0.38474273681640625, 0.3983039855957031, 0.411865234375]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 12.0, 19.0, 78.0, 332.0, 475.0, 79.0, 18.0, 3.0, 3.0], "bins": [-0.25232696533203125, -0.2480594515800476, -0.24379193782806396, -0.23952442407608032, -0.23525691032409668, -0.23098939657211304, -0.2267218828201294, -0.22245436906814575, -0.2181868553161621, -0.21391934156417847, -0.20965182781219482, -0.20538431406021118, -0.20111680030822754, -0.1968492865562439, -0.19258177280426025, -0.1883142590522766, -0.18404674530029297, -0.17977923154830933, -0.17551171779632568, -0.17124420404434204, -0.1669766902923584, -0.16270917654037476, -0.1584416627883911, -0.15417414903640747, -0.14990663528442383, -0.14563912153244019, -0.14137160778045654, -0.1371040940284729, -0.13283658027648926, -0.12856906652450562, -0.12430155277252197, -0.12003403902053833, -0.11576651781797409, -0.11149900406599045, -0.1072314903140068, -0.10296397656202316, -0.09869646281003952, -0.09442894905805588, -0.09016143530607224, -0.08589392155408859, -0.08162640780210495, -0.07735889405012131, -0.07309138029813766, -0.06882386654615402, -0.06455635279417038, -0.06028883904218674, -0.056021325290203094, -0.05175381153821945, -0.04748629778623581, -0.04321878403425217, -0.038951270282268524, -0.03468375653028488, -0.03041624277830124, -0.026148729026317596, -0.021881215274333954, -0.01761370152235031, -0.01334618590772152, -0.009078672155737877, -0.004811158403754234, -0.0005436446517705917, 0.003723869100213051, 0.007991382852196693, 0.012258896604180336, 0.01652641035616398, 0.02079392410814762]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 6.0, 4.0, 4.0, 10.0, 6.0, 13.0, 17.0, 15.0, 11.0, 24.0, 21.0, 26.0, 36.0, 38.0, 35.0, 38.0, 39.0, 52.0, 50.0, 39.0, 44.0, 29.0, 45.0, 51.0, 28.0, 35.0, 24.0, 21.0, 31.0, 38.0, 27.0, 28.0, 24.0, 16.0, 13.0, 16.0, 14.0, 8.0, 10.0, 6.0, 6.0, 5.0, 2.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.03228342533111572, -0.03128441423177719, -0.03028540126979351, -0.02928638830780983, -0.028287377208471298, -0.027288366109132767, -0.026289353147149086, -0.025290340185165405, -0.024291329085826874, -0.023292317986488342, -0.02229330502450466, -0.02129429206252098, -0.02029528096318245, -0.019296269863843918, -0.018297256901860237, -0.017298243939876556, -0.016299232840538025, -0.015300220809876919, -0.014301208779215813, -0.013302196748554707, -0.0123031847178936, -0.011304172687232494, -0.010305160656571388, -0.009306148625910282, -0.008307136595249176, -0.00730812456458807, -0.006309112533926964, -0.005310100503265858, -0.004311088472604752, -0.0033120764419436455, -0.0023130644112825394, -0.0013140523806214333, -0.00031504034996032715, 0.000683971680700779, 0.001682983711361885, 0.002681995742022991, 0.0036810077726840973, 0.004680019803345203, 0.0056790318340063095, 0.006678043864667416, 0.007677055895328522, 0.008676067925989628, 0.009675079956650734, 0.01067409198731184, 0.011673104017972946, 0.012672116048634052, 0.013671128079295158, 0.014670140109956264, 0.01566915214061737, 0.016668163239955902, 0.017667176201939583, 0.018666189163923264, 0.019665200263261795, 0.020664211362600327, 0.021663224324584007, 0.022662237286567688, 0.02366124838590622, 0.02466025948524475, 0.02565927244722843, 0.026658285409212112, 0.027657296508550644, 0.028656307607889175, 0.029655320569872856, 0.030654333531856537, 0.03165334463119507]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 6.0, 2.0, 1.0, 0.0, 2.0, 7.0, 1.0, 3.0, 10.0, 8.0, 12.0, 9.0, 15.0, 21.0, 19.0, 18.0, 18.0, 23.0, 21.0, 22.0, 19.0, 28.0, 31.0, 38.0, 24.0, 38.0, 31.0, 30.0, 34.0, 37.0, 39.0, 30.0, 29.0, 38.0, 28.0, 33.0, 28.0, 41.0, 26.0, 24.0, 28.0, 21.0, 13.0, 13.0, 10.0, 12.0, 12.0, 7.0, 6.0, 12.0, 4.0, 5.0, 6.0, 4.0, 6.0, 3.0, 1.0, 3.0, 3.0, 4.0, 2.0], "bins": [-3.60546875, -3.493804931640625, -3.38214111328125, -3.270477294921875, -3.1588134765625, -3.047149658203125, -2.93548583984375, -2.823822021484375, -2.712158203125, -2.600494384765625, -2.48883056640625, -2.377166748046875, -2.2655029296875, -2.153839111328125, -2.04217529296875, -1.930511474609375, -1.81884765625, -1.707183837890625, -1.59552001953125, -1.483856201171875, -1.3721923828125, -1.260528564453125, -1.14886474609375, -1.037200927734375, -0.925537109375, -0.813873291015625, -0.70220947265625, -0.590545654296875, -0.4788818359375, -0.367218017578125, -0.25555419921875, -0.143890380859375, -0.0322265625, 0.079437255859375, 0.19110107421875, 0.302764892578125, 0.4144287109375, 0.526092529296875, 0.63775634765625, 0.749420166015625, 0.861083984375, 0.972747802734375, 1.08441162109375, 1.196075439453125, 1.3077392578125, 1.419403076171875, 1.53106689453125, 1.642730712890625, 1.75439453125, 1.866058349609375, 1.97772216796875, 2.089385986328125, 2.2010498046875, 2.312713623046875, 2.42437744140625, 2.536041259765625, 2.647705078125, 2.759368896484375, 2.87103271484375, 2.982696533203125, 3.0943603515625, 3.206024169921875, 3.31768798828125, 3.429351806640625, 3.541015625]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 1.0, 8.0, 3.0, 5.0, 9.0, 20.0, 33.0, 52.0, 60.0, 85.0, 152.0, 206.0, 344.0, 540.0, 865.0, 1450.0, 2388.0, 4049.0, 7111.0, 12714.0, 23298.0, 45056.0, 94157.0, 203462.0, 334792.0, 161170.0, 75149.0, 36511.0, 19469.0, 10451.0, 6107.0, 3450.0, 2012.0, 1306.0, 757.0, 468.0, 305.0, 189.0, 114.0, 62.0, 57.0, 39.0, 21.0, 10.0, 13.0, 16.0, 6.0, 7.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-3.826171875, -3.71478271484375, -3.6033935546875, -3.49200439453125, -3.380615234375, -3.26922607421875, -3.1578369140625, -3.04644775390625, -2.93505859375, -2.82366943359375, -2.7122802734375, -2.60089111328125, -2.489501953125, -2.37811279296875, -2.2667236328125, -2.15533447265625, -2.0439453125, -1.93255615234375, -1.8211669921875, -1.70977783203125, -1.598388671875, -1.48699951171875, -1.3756103515625, -1.26422119140625, -1.15283203125, -1.04144287109375, -0.9300537109375, -0.81866455078125, -0.707275390625, -0.59588623046875, -0.4844970703125, -0.37310791015625, -0.26171875, -0.15032958984375, -0.0389404296875, 0.07244873046875, 0.183837890625, 0.29522705078125, 0.4066162109375, 0.51800537109375, 0.62939453125, 0.74078369140625, 0.8521728515625, 0.96356201171875, 1.074951171875, 1.18634033203125, 1.2977294921875, 1.40911865234375, 1.5205078125, 1.63189697265625, 1.7432861328125, 1.85467529296875, 1.966064453125, 2.07745361328125, 2.1888427734375, 2.30023193359375, 2.41162109375, 2.52301025390625, 2.6343994140625, 2.74578857421875, 2.857177734375, 2.96856689453125, 3.0799560546875, 3.19134521484375, 3.302734375]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 7.0, 9.0, 9.0, 15.0, 15.0, 11.0, 26.0, 23.0, 24.0, 22.0, 37.0, 32.0, 27.0, 40.0, 50.0, 84.0, 103.0, 255.0, 1503.0, 243.0, 99.0, 55.0, 54.0, 41.0, 27.0, 41.0, 23.0, 32.0, 20.0, 17.0, 21.0, 18.0, 21.0, 7.0, 13.0, 8.0, 5.0, 4.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-16.875, -16.41259765625, -15.9501953125, -15.48779296875, -15.025390625, -14.56298828125, -14.1005859375, -13.63818359375, -13.17578125, -12.71337890625, -12.2509765625, -11.78857421875, -11.326171875, -10.86376953125, -10.4013671875, -9.93896484375, -9.4765625, -9.01416015625, -8.5517578125, -8.08935546875, -7.626953125, -7.16455078125, -6.7021484375, -6.23974609375, -5.77734375, -5.31494140625, -4.8525390625, -4.39013671875, -3.927734375, -3.46533203125, -3.0029296875, -2.54052734375, -2.078125, -1.61572265625, -1.1533203125, -0.69091796875, -0.228515625, 0.23388671875, 0.6962890625, 1.15869140625, 1.62109375, 2.08349609375, 2.5458984375, 3.00830078125, 3.470703125, 3.93310546875, 4.3955078125, 4.85791015625, 5.3203125, 5.78271484375, 6.2451171875, 6.70751953125, 7.169921875, 7.63232421875, 8.0947265625, 8.55712890625, 9.01953125, 9.48193359375, 9.9443359375, 10.40673828125, 10.869140625, 11.33154296875, 11.7939453125, 12.25634765625, 12.71875]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 7.0, 7.0, 15.0, 10.0, 10.0, 35.0, 36.0, 35.0, 49.0, 63.0, 91.0, 115.0, 183.0, 214.0, 386.0, 1152.0, 14282.0, 2950225.0, 173896.0, 3152.0, 671.0, 299.0, 199.0, 143.0, 124.0, 82.0, 50.0, 36.0, 32.0, 21.0, 24.0, 16.0, 19.0, 10.0, 3.0, 2.0, 4.0, 3.0, 0.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.40625, -36.22802734375, -35.0498046875, -33.87158203125, -32.693359375, -31.51513671875, -30.3369140625, -29.15869140625, -27.98046875, -26.80224609375, -25.6240234375, -24.44580078125, -23.267578125, -22.08935546875, -20.9111328125, -19.73291015625, -18.5546875, -17.37646484375, -16.1982421875, -15.02001953125, -13.841796875, -12.66357421875, -11.4853515625, -10.30712890625, -9.12890625, -7.95068359375, -6.7724609375, -5.59423828125, -4.416015625, -3.23779296875, -2.0595703125, -0.88134765625, 0.296875, 1.47509765625, 2.6533203125, 3.83154296875, 5.009765625, 6.18798828125, 7.3662109375, 8.54443359375, 9.72265625, 10.90087890625, 12.0791015625, 13.25732421875, 14.435546875, 15.61376953125, 16.7919921875, 17.97021484375, 19.1484375, 20.32666015625, 21.5048828125, 22.68310546875, 23.861328125, 25.03955078125, 26.2177734375, 27.39599609375, 28.57421875, 29.75244140625, 30.9306640625, 32.10888671875, 33.287109375, 34.46533203125, 35.6435546875, 36.82177734375, 38.0]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [71.0, 606.0, 318.0, 24.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.739951133728027, -2.998826742172241, 0.7422976493835449, 4.48342227935791, 8.224546432495117, 11.965670585632324, 15.706795692443848, 19.447917938232422, 23.189044952392578, 26.9301700592041, 30.671293258666992, 34.412418365478516, 38.153541564941406, 41.89466857910156, 45.63579177856445, 49.376914978027344, 53.118038177490234, 56.859161376953125, 60.60028839111328, 64.34141540527344, 68.08253479003906, 71.82366180419922, 75.56478881835938, 79.305908203125, 83.04703521728516, 86.78816223144531, 90.52928161621094, 94.2704086303711, 98.01153564453125, 101.75265502929688, 105.49378204345703, 109.23490905761719, 112.97603607177734, 116.7171630859375, 120.45828247070312, 124.19940948486328, 127.94053649902344, 131.68165588378906, 135.42279052734375, 139.16390991210938, 142.905029296875, 146.64614868164062, 150.3872833251953, 154.12840270996094, 157.86952209472656, 161.61065673828125, 165.35177612304688, 169.0928955078125, 172.8340301513672, 176.5751495361328, 180.3162841796875, 184.05740356445312, 187.79852294921875, 191.53965759277344, 195.28077697753906, 199.0218963623047, 202.7630157470703, 206.50413513183594, 210.24526977539062, 213.98638916015625, 217.72750854492188, 221.46864318847656, 225.2097625732422, 228.9508819580078, 232.6920166015625]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 9.0, 7.0, 5.0, 11.0, 5.0, 11.0, 19.0, 17.0, 15.0, 22.0, 15.0, 30.0, 29.0, 18.0, 25.0, 32.0, 42.0, 27.0, 26.0, 37.0, 51.0, 45.0, 38.0, 29.0, 31.0, 35.0, 35.0, 38.0, 44.0, 29.0, 25.0, 20.0, 22.0, 20.0, 31.0, 20.0, 22.0, 7.0, 8.0, 13.0, 3.0, 15.0, 12.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.540550231933594, -32.49601364135742, -31.45147705078125, -30.406940460205078, -29.362403869628906, -28.317867279052734, -27.27332878112793, -26.228792190551758, -25.184255599975586, -24.139719009399414, -23.095182418823242, -22.05064582824707, -21.006107330322266, -19.961570739746094, -18.917034149169922, -17.87249755859375, -16.827960968017578, -15.783424377441406, -14.738887786865234, -13.694350242614746, -12.649813652038574, -11.605277061462402, -10.560739517211914, -9.516202926635742, -8.47166633605957, -7.427129745483398, -6.382592678070068, -5.338055610656738, -4.293519020080566, -3.2489824295043945, -2.2044453620910645, -1.1599082946777344, -0.1153717041015625, 0.9291651248931885, 1.9737019538879395, 3.0182387828826904, 4.062775611877441, 5.107312202453613, 6.151849269866943, 7.196386337280273, 8.240922927856445, 9.285459518432617, 10.329996109008789, 11.374533653259277, 12.41907024383545, 13.463606834411621, 14.50814437866211, 15.552680969238281, 16.597217559814453, 17.641754150390625, 18.686290740966797, 19.73082733154297, 20.77536392211914, 21.819900512695312, 22.864439010620117, 23.90897560119629, 24.95351219177246, 25.998048782348633, 27.042585372924805, 28.087121963500977, 29.13166046142578, 30.176197052001953, 31.220733642578125, 32.2652702331543, 33.30980682373047]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 5.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 2.0, 9.0, 5.0, 9.0, 14.0, 17.0, 14.0, 17.0, 21.0, 21.0, 28.0, 20.0, 20.0, 25.0, 35.0, 35.0, 37.0, 33.0, 22.0, 35.0, 31.0, 33.0, 33.0, 39.0, 48.0, 35.0, 32.0, 32.0, 32.0, 36.0, 29.0, 21.0, 22.0, 19.0, 18.0, 21.0, 9.0, 13.0, 6.0, 12.0, 11.0, 5.0, 3.0, 14.0, 3.0, 2.0, 6.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-3.767578125, -3.645355224609375, -3.52313232421875, -3.400909423828125, -3.2786865234375, -3.156463623046875, -3.03424072265625, -2.912017822265625, -2.789794921875, -2.667572021484375, -2.54534912109375, -2.423126220703125, -2.3009033203125, -2.178680419921875, -2.05645751953125, -1.934234619140625, -1.81201171875, -1.689788818359375, -1.56756591796875, -1.445343017578125, -1.3231201171875, -1.200897216796875, -1.07867431640625, -0.956451416015625, -0.834228515625, -0.712005615234375, -0.58978271484375, -0.467559814453125, -0.3453369140625, -0.223114013671875, -0.10089111328125, 0.021331787109375, 0.1435546875, 0.265777587890625, 0.38800048828125, 0.510223388671875, 0.6324462890625, 0.754669189453125, 0.87689208984375, 0.999114990234375, 1.121337890625, 1.243560791015625, 1.36578369140625, 1.488006591796875, 1.6102294921875, 1.732452392578125, 1.85467529296875, 1.976898193359375, 2.09912109375, 2.221343994140625, 2.34356689453125, 2.465789794921875, 2.5880126953125, 2.710235595703125, 2.83245849609375, 2.954681396484375, 3.076904296875, 3.199127197265625, 3.32135009765625, 3.443572998046875, 3.5657958984375, 3.688018798828125, 3.81024169921875, 3.932464599609375, 4.0546875]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 6.0, 5.0, 4.0, 4.0, 6.0, 14.0, 13.0, 11.0, 17.0, 19.0, 28.0, 35.0, 23.0, 50.0, 61.0, 104.0, 214.0, 444.0, 1047.0, 3093.0, 11055.0, 51726.0, 367535.0, 2206545.0, 1346560.0, 166870.0, 28174.0, 6825.0, 2058.0, 831.0, 363.0, 166.0, 99.0, 66.0, 36.0, 27.0, 28.0, 29.0, 17.0, 14.0, 12.0, 4.0, 8.0, 6.0, 6.0, 5.0, 4.0, 6.0, 5.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0], "bins": [-11.0078125, -10.67236328125, -10.3369140625, -10.00146484375, -9.666015625, -9.33056640625, -8.9951171875, -8.65966796875, -8.32421875, -7.98876953125, -7.6533203125, -7.31787109375, -6.982421875, -6.64697265625, -6.3115234375, -5.97607421875, -5.640625, -5.30517578125, -4.9697265625, -4.63427734375, -4.298828125, -3.96337890625, -3.6279296875, -3.29248046875, -2.95703125, -2.62158203125, -2.2861328125, -1.95068359375, -1.615234375, -1.27978515625, -0.9443359375, -0.60888671875, -0.2734375, 0.06201171875, 0.3974609375, 0.73291015625, 1.068359375, 1.40380859375, 1.7392578125, 2.07470703125, 2.41015625, 2.74560546875, 3.0810546875, 3.41650390625, 3.751953125, 4.08740234375, 4.4228515625, 4.75830078125, 5.09375, 5.42919921875, 5.7646484375, 6.10009765625, 6.435546875, 6.77099609375, 7.1064453125, 7.44189453125, 7.77734375, 8.11279296875, 8.4482421875, 8.78369140625, 9.119140625, 9.45458984375, 9.7900390625, 10.12548828125, 10.4609375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 10.0, 5.0, 6.0, 7.0, 12.0, 15.0, 11.0, 17.0, 28.0, 43.0, 54.0, 50.0, 74.0, 87.0, 130.0, 189.0, 242.0, 258.0, 343.0, 418.0, 401.0, 391.0, 285.0, 215.0, 190.0, 142.0, 108.0, 86.0, 46.0, 48.0, 45.0, 30.0, 20.0, 16.0, 17.0, 6.0, 4.0, 6.0, 9.0, 4.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.2421875, -8.9713134765625, -8.700439453125, -8.4295654296875, -8.15869140625, -7.8878173828125, -7.616943359375, -7.3460693359375, -7.0751953125, -6.8043212890625, -6.533447265625, -6.2625732421875, -5.99169921875, -5.7208251953125, -5.449951171875, -5.1790771484375, -4.908203125, -4.6373291015625, -4.366455078125, -4.0955810546875, -3.82470703125, -3.5538330078125, -3.282958984375, -3.0120849609375, -2.7412109375, -2.4703369140625, -2.199462890625, -1.9285888671875, -1.65771484375, -1.3868408203125, -1.115966796875, -0.8450927734375, -0.57421875, -0.3033447265625, -0.032470703125, 0.2384033203125, 0.50927734375, 0.7801513671875, 1.051025390625, 1.3218994140625, 1.5927734375, 1.8636474609375, 2.134521484375, 2.4053955078125, 2.67626953125, 2.9471435546875, 3.218017578125, 3.4888916015625, 3.759765625, 4.0306396484375, 4.301513671875, 4.5723876953125, 4.84326171875, 5.1141357421875, 5.385009765625, 5.6558837890625, 5.9267578125, 6.1976318359375, 6.468505859375, 6.7393798828125, 7.01025390625, 7.2811279296875, 7.552001953125, 7.8228759765625, 8.09375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 8.0, 7.0, 8.0, 14.0, 15.0, 25.0, 31.0, 47.0, 59.0, 66.0, 111.0, 152.0, 207.0, 279.0, 542.0, 2091.0, 37821.0, 3471548.0, 669269.0, 9582.0, 1037.0, 414.0, 255.0, 168.0, 133.0, 95.0, 68.0, 62.0, 49.0, 23.0, 17.0, 19.0, 12.0, 12.0, 4.0, 7.0, 9.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-40.1875, -38.923828125, -37.66015625, -36.396484375, -35.1328125, -33.869140625, -32.60546875, -31.341796875, -30.078125, -28.814453125, -27.55078125, -26.287109375, -25.0234375, -23.759765625, -22.49609375, -21.232421875, -19.96875, -18.705078125, -17.44140625, -16.177734375, -14.9140625, -13.650390625, -12.38671875, -11.123046875, -9.859375, -8.595703125, -7.33203125, -6.068359375, -4.8046875, -3.541015625, -2.27734375, -1.013671875, 0.25, 1.513671875, 2.77734375, 4.041015625, 5.3046875, 6.568359375, 7.83203125, 9.095703125, 10.359375, 11.623046875, 12.88671875, 14.150390625, 15.4140625, 16.677734375, 17.94140625, 19.205078125, 20.46875, 21.732421875, 22.99609375, 24.259765625, 25.5234375, 26.787109375, 28.05078125, 29.314453125, 30.578125, 31.841796875, 33.10546875, 34.369140625, 35.6328125, 36.896484375, 38.16015625, 39.423828125, 40.6875]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 7.0, 31.0, 148.0, 377.0, 323.0, 109.0, 20.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-95.74324798583984, -90.66070556640625, -85.57817077636719, -80.4956283569336, -75.4130859375, -70.33055114746094, -65.24800872802734, -60.165470123291016, -55.08293151855469, -50.00039291381836, -44.91785430908203, -39.83531188964844, -34.75277328491211, -29.67023468017578, -24.58769416809082, -19.50515365600586, -14.422615051269531, -9.340075492858887, -4.257535934448242, 0.8250036239624023, 5.907543182373047, 10.990081787109375, 16.072622299194336, 21.155162811279297, 26.237701416015625, 31.320240020751953, 36.40277862548828, 41.485321044921875, 46.5678596496582, 51.65039825439453, 56.732940673828125, 61.81547927856445, 66.89801025390625, 71.98055267333984, 77.0630874633789, 82.1456298828125, 87.22816467285156, 92.31070709228516, 97.39324951171875, 102.47578430175781, 107.5583267211914, 112.640869140625, 117.72340393066406, 122.80594635009766, 127.88848876953125, 132.9710235595703, 138.05355834960938, 143.1361083984375, 148.21864318847656, 153.30117797851562, 158.38372802734375, 163.4662628173828, 168.54879760742188, 173.63134765625, 178.71388244628906, 183.79641723632812, 188.87896728515625, 193.9615020751953, 199.04405212402344, 204.1265869140625, 209.20912170410156, 214.29165649414062, 219.37420654296875, 224.4567413330078, 229.53927612304688]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 5.0, 7.0, 3.0, 6.0, 5.0, 8.0, 13.0, 16.0, 10.0, 15.0, 26.0, 30.0, 22.0, 32.0, 30.0, 31.0, 33.0, 38.0, 37.0, 27.0, 44.0, 44.0, 50.0, 46.0, 42.0, 36.0, 36.0, 31.0, 38.0, 22.0, 28.0, 27.0, 22.0, 31.0, 17.0, 20.0, 15.0, 17.0, 9.0, 9.0, 4.0, 9.0, 1.0, 0.0, 4.0, 7.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-32.20622253417969, -31.215606689453125, -30.22498893737793, -29.234373092651367, -28.243755340576172, -27.25313949584961, -26.262521743774414, -25.27190589904785, -24.281288146972656, -23.290672302246094, -22.3000545501709, -21.309438705444336, -20.31882095336914, -19.328205108642578, -18.337587356567383, -17.34697151184082, -16.356353759765625, -15.365736961364746, -14.375120162963867, -13.384503364562988, -12.39388656616211, -11.403270721435547, -10.412652969360352, -9.422037124633789, -8.431421279907227, -7.440804481506348, -6.450187683105469, -5.45957088470459, -4.468954086303711, -3.4783377647399902, -2.4877209663391113, -1.4971041679382324, -0.5064868927001953, 0.4841298460960388, 1.474746584892273, 2.4653632640838623, 3.455980062484741, 4.446596622467041, 5.43721342086792, 6.427830219268799, 7.418447017669678, 8.409063339233398, 9.399680137634277, 10.390296936035156, 11.380913734436035, 12.371530532836914, 13.362147331237793, 14.352764129638672, 15.34338092803955, 16.33399772644043, 17.324613571166992, 18.315231323242188, 19.30584716796875, 20.296464920043945, 21.287080764770508, 22.277698516845703, 23.268314361572266, 24.258930206298828, 25.249547958374023, 26.240163803100586, 27.23078155517578, 28.221397399902344, 29.21201515197754, 30.2026309967041, 31.193248748779297]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 6.0, 6.0, 2.0, 4.0, 6.0, 7.0, 11.0, 17.0, 15.0, 17.0, 18.0, 26.0, 29.0, 25.0, 36.0, 34.0, 35.0, 29.0, 55.0, 40.0, 47.0, 29.0, 35.0, 44.0, 42.0, 40.0, 42.0, 48.0, 39.0, 33.0, 16.0, 23.0, 17.0, 27.0, 14.0, 20.0, 14.0, 12.0, 6.0, 10.0, 7.0, 3.0, 4.0, 8.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.8046875, -4.65557861328125, -4.5064697265625, -4.35736083984375, -4.208251953125, -4.05914306640625, -3.9100341796875, -3.76092529296875, -3.61181640625, -3.46270751953125, -3.3135986328125, -3.16448974609375, -3.015380859375, -2.86627197265625, -2.7171630859375, -2.56805419921875, -2.4189453125, -2.26983642578125, -2.1207275390625, -1.97161865234375, -1.822509765625, -1.67340087890625, -1.5242919921875, -1.37518310546875, -1.22607421875, -1.07696533203125, -0.9278564453125, -0.77874755859375, -0.629638671875, -0.48052978515625, -0.3314208984375, -0.18231201171875, -0.033203125, 0.11590576171875, 0.2650146484375, 0.41412353515625, 0.563232421875, 0.71234130859375, 0.8614501953125, 1.01055908203125, 1.15966796875, 1.30877685546875, 1.4578857421875, 1.60699462890625, 1.756103515625, 1.90521240234375, 2.0543212890625, 2.20343017578125, 2.3525390625, 2.50164794921875, 2.6507568359375, 2.79986572265625, 2.948974609375, 3.09808349609375, 3.2471923828125, 3.39630126953125, 3.54541015625, 3.69451904296875, 3.8436279296875, 3.99273681640625, 4.141845703125, 4.29095458984375, 4.4400634765625, 4.58917236328125, 4.73828125]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 7.0, 7.0, 13.0, 17.0, 18.0, 26.0, 41.0, 78.0, 105.0, 120.0, 228.0, 326.0, 566.0, 775.0, 1160.0, 1844.0, 2862.0, 4506.0, 6840.0, 10600.0, 16438.0, 24978.0, 37814.0, 56726.0, 82466.0, 115334.0, 146051.0, 149464.0, 121888.0, 88956.0, 60569.0, 40401.0, 27256.0, 17501.0, 11579.0, 7459.0, 4801.0, 3019.0, 2003.0, 1257.0, 840.0, 535.0, 352.0, 238.0, 182.0, 102.0, 58.0, 46.0, 42.0, 20.0, 24.0, 3.0, 7.0, 11.0, 1.0, 1.0, 1.0, 4.0], "bins": [-0.463134765625, -0.4491386413574219, -0.43514251708984375, -0.4211463928222656, -0.4071502685546875, -0.3931541442871094, -0.37915802001953125, -0.3651618957519531, -0.351165771484375, -0.3371696472167969, -0.32317352294921875, -0.3091773986816406, -0.2951812744140625, -0.2811851501464844, -0.26718902587890625, -0.2531929016113281, -0.23919677734375, -0.22520065307617188, -0.21120452880859375, -0.19720840454101562, -0.1832122802734375, -0.16921615600585938, -0.15522003173828125, -0.14122390747070312, -0.127227783203125, -0.11323165893554688, -0.09923553466796875, -0.08523941040039062, -0.0712432861328125, -0.057247161865234375, -0.04325103759765625, -0.029254913330078125, -0.0152587890625, -0.001262664794921875, 0.01273345947265625, 0.026729583740234375, 0.0407257080078125, 0.054721832275390625, 0.06871795654296875, 0.08271408081054688, 0.096710205078125, 0.11070632934570312, 0.12470245361328125, 0.13869857788085938, 0.1526947021484375, 0.16669082641601562, 0.18068695068359375, 0.19468307495117188, 0.20867919921875, 0.22267532348632812, 0.23667144775390625, 0.2506675720214844, 0.2646636962890625, 0.2786598205566406, 0.29265594482421875, 0.3066520690917969, 0.320648193359375, 0.3346443176269531, 0.34864044189453125, 0.3626365661621094, 0.3766326904296875, 0.3906288146972656, 0.40462493896484375, 0.4186210632324219, 0.4326171875]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 0.0, 3.0, 5.0, 3.0, 4.0, 5.0, 6.0, 12.0, 8.0, 14.0, 13.0, 18.0, 24.0, 18.0, 31.0, 24.0, 35.0, 37.0, 39.0, 45.0, 41.0, 40.0, 46.0, 1076.0, 50.0, 42.0, 45.0, 32.0, 51.0, 32.0, 24.0, 34.0, 37.0, 24.0, 14.0, 17.0, 18.0, 12.0, 13.0, 9.0, 10.0, 5.0, 4.0, 5.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.54296875, -3.4346923828125, -3.326416015625, -3.2181396484375, -3.10986328125, -3.0015869140625, -2.893310546875, -2.7850341796875, -2.6767578125, -2.5684814453125, -2.460205078125, -2.3519287109375, -2.24365234375, -2.1353759765625, -2.027099609375, -1.9188232421875, -1.810546875, -1.7022705078125, -1.593994140625, -1.4857177734375, -1.37744140625, -1.2691650390625, -1.160888671875, -1.0526123046875, -0.9443359375, -0.8360595703125, -0.727783203125, -0.6195068359375, -0.51123046875, -0.4029541015625, -0.294677734375, -0.1864013671875, -0.078125, 0.0301513671875, 0.138427734375, 0.2467041015625, 0.35498046875, 0.4632568359375, 0.571533203125, 0.6798095703125, 0.7880859375, 0.8963623046875, 1.004638671875, 1.1129150390625, 1.22119140625, 1.3294677734375, 1.437744140625, 1.5460205078125, 1.654296875, 1.7625732421875, 1.870849609375, 1.9791259765625, 2.08740234375, 2.1956787109375, 2.303955078125, 2.4122314453125, 2.5205078125, 2.6287841796875, 2.737060546875, 2.8453369140625, 2.95361328125, 3.0618896484375, 3.170166015625, 3.2784423828125, 3.38671875]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 3.0, 5.0, 9.0, 17.0, 22.0, 46.0, 40.0, 67.0, 124.0, 185.0, 301.0, 464.0, 743.0, 1136.0, 1825.0, 2665.0, 4127.0, 6601.0, 10426.0, 16934.0, 26664.0, 42985.0, 66797.0, 101186.0, 139062.0, 1205328.0, 152171.0, 111537.0, 75494.0, 48274.0, 30493.0, 18925.0, 11820.0, 7413.0, 4782.0, 2922.0, 1978.0, 1244.0, 835.0, 533.0, 351.0, 210.0, 131.0, 88.0, 54.0, 45.0, 23.0, 22.0, 11.0, 5.0, 7.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.319091796875, -0.3093147277832031, -0.29953765869140625, -0.2897605895996094, -0.2799835205078125, -0.2702064514160156, -0.26042938232421875, -0.2506523132324219, -0.240875244140625, -0.23109817504882812, -0.22132110595703125, -0.21154403686523438, -0.2017669677734375, -0.19198989868164062, -0.18221282958984375, -0.17243576049804688, -0.16265869140625, -0.15288162231445312, -0.14310455322265625, -0.13332748413085938, -0.1235504150390625, -0.11377334594726562, -0.10399627685546875, -0.09421920776367188, -0.084442138671875, -0.07466506958007812, -0.06488800048828125, -0.055110931396484375, -0.0453338623046875, -0.035556793212890625, -0.02577972412109375, -0.016002655029296875, -0.0062255859375, 0.003551483154296875, 0.01332855224609375, 0.023105621337890625, 0.0328826904296875, 0.042659759521484375, 0.05243682861328125, 0.062213897705078125, 0.071990966796875, 0.08176803588867188, 0.09154510498046875, 0.10132217407226562, 0.1110992431640625, 0.12087631225585938, 0.13065338134765625, 0.14043045043945312, 0.15020751953125, 0.15998458862304688, 0.16976165771484375, 0.17953872680664062, 0.1893157958984375, 0.19909286499023438, 0.20886993408203125, 0.21864700317382812, 0.228424072265625, 0.23820114135742188, 0.24797821044921875, 0.2577552795410156, 0.2675323486328125, 0.2773094177246094, 0.28708648681640625, 0.2968635559082031, 0.306640625]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 5.0, 2.0, 2.0, 8.0, 11.0, 10.0, 21.0, 14.0, 37.0, 44.0, 78.0, 125.0, 172.0, 157.0, 108.0, 71.0, 35.0, 29.0, 15.0, 14.0, 7.0, 11.0, 5.0, 2.0, 5.0, 3.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0261688232421875, -0.025418758392333984, -0.02466869354248047, -0.023918628692626953, -0.023168563842773438, -0.022418498992919922, -0.021668434143066406, -0.02091836929321289, -0.020168304443359375, -0.01941823959350586, -0.018668174743652344, -0.017918109893798828, -0.017168045043945312, -0.016417980194091797, -0.01566791534423828, -0.014917850494384766, -0.01416778564453125, -0.013417720794677734, -0.012667655944824219, -0.011917591094970703, -0.011167526245117188, -0.010417461395263672, -0.009667396545410156, -0.00891733169555664, -0.008167266845703125, -0.007417201995849609, -0.006667137145996094, -0.005917072296142578, -0.0051670074462890625, -0.004416942596435547, -0.0036668777465820312, -0.0029168128967285156, -0.002166748046875, -0.0014166831970214844, -0.0006666183471679688, 8.344650268554688e-05, 0.0008335113525390625, 0.0015835762023925781, 0.0023336410522460938, 0.0030837059020996094, 0.003833770751953125, 0.004583835601806641, 0.005333900451660156, 0.006083965301513672, 0.0068340301513671875, 0.007584095001220703, 0.008334159851074219, 0.009084224700927734, 0.00983428955078125, 0.010584354400634766, 0.011334419250488281, 0.012084484100341797, 0.012834548950195312, 0.013584613800048828, 0.014334678649902344, 0.01508474349975586, 0.015834808349609375, 0.01658487319946289, 0.017334938049316406, 0.018085002899169922, 0.018835067749023438, 0.019585132598876953, 0.02033519744873047, 0.021085262298583984, 0.0218353271484375]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 7.0, 2.0, 5.0, 7.0, 12.0, 7.0, 8.0, 27.0, 29.0, 43.0, 76.0, 143.0, 469.0, 47885.0, 998290.0, 1070.0, 192.0, 86.0, 66.0, 34.0, 26.0, 20.0, 12.0, 10.0, 6.0, 5.0, 1.0, 5.0, 6.0, 5.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.4921875, -0.475311279296875, -0.45843505859375, -0.441558837890625, -0.4246826171875, -0.407806396484375, -0.39093017578125, -0.374053955078125, -0.357177734375, -0.340301513671875, -0.32342529296875, -0.306549072265625, -0.2896728515625, -0.272796630859375, -0.25592041015625, -0.239044189453125, -0.22216796875, -0.205291748046875, -0.18841552734375, -0.171539306640625, -0.1546630859375, -0.137786865234375, -0.12091064453125, -0.104034423828125, -0.087158203125, -0.070281982421875, -0.05340576171875, -0.036529541015625, -0.0196533203125, -0.002777099609375, 0.01409912109375, 0.030975341796875, 0.0478515625, 0.064727783203125, 0.08160400390625, 0.098480224609375, 0.1153564453125, 0.132232666015625, 0.14910888671875, 0.165985107421875, 0.182861328125, 0.199737548828125, 0.21661376953125, 0.233489990234375, 0.2503662109375, 0.267242431640625, 0.28411865234375, 0.300994873046875, 0.31787109375, 0.334747314453125, 0.35162353515625, 0.368499755859375, 0.3853759765625, 0.402252197265625, 0.41912841796875, 0.436004638671875, 0.452880859375, 0.469757080078125, 0.48663330078125, 0.503509521484375, 0.5203857421875, 0.537261962890625, 0.55413818359375, 0.571014404296875, 0.587890625]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 9.0, 25.0, 84.0, 568.0, 297.0, 25.0, 10.0, 3.0], "bins": [-0.2608456015586853, -0.256485253572464, -0.2521249055862427, -0.24776457250118256, -0.24340422451496124, -0.23904389142990112, -0.2346835434436798, -0.2303231954574585, -0.22596284747123718, -0.22160249948501587, -0.21724216639995575, -0.21288181841373444, -0.20852147042751312, -0.204161137342453, -0.1998007893562317, -0.19544044137001038, -0.19108010828495026, -0.18671976029872894, -0.18235942721366882, -0.1779990792274475, -0.1736387312412262, -0.16927838325500488, -0.16491805016994476, -0.16055770218372345, -0.15619736909866333, -0.15183702111244202, -0.1474766880273819, -0.14311634004116058, -0.13875599205493927, -0.13439565896987915, -0.13003531098365784, -0.12567496299743652, -0.1213146224617958, -0.11695428192615509, -0.11259393393993378, -0.10823359340429306, -0.10387325286865234, -0.09951290488243103, -0.09515256434679031, -0.0907922238111496, -0.08643187582492828, -0.08207153528928757, -0.07771118730306625, -0.07335084676742554, -0.06899049878120422, -0.06463015824556351, -0.06026981770992279, -0.055909473448991776, -0.05154912918806076, -0.047188784927129745, -0.04282844066619873, -0.038468100130558014, -0.034107755869627, -0.029747411608695984, -0.025387069210410118, -0.021026726812124252, -0.016666382551193237, -0.012306039221584797, -0.007945695891976357, -0.003585352562367916, 0.0007749907672405243, 0.005135335028171539, 0.009495677426457405, 0.013856019824743271, 0.018216364085674286]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 6.0, 7.0, 7.0, 9.0, 12.0, 11.0, 24.0, 25.0, 23.0, 29.0, 28.0, 38.0, 26.0, 39.0, 47.0, 42.0, 36.0, 45.0, 45.0, 37.0, 50.0, 34.0, 43.0, 37.0, 24.0, 35.0, 27.0, 32.0, 28.0, 36.0, 20.0, 13.0, 17.0, 13.0, 9.0, 9.0, 8.0, 8.0, 4.0, 6.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.02130967378616333, -0.020653054118156433, -0.019996436312794685, -0.019339818507432938, -0.01868319883942604, -0.018026579171419144, -0.017369961366057396, -0.016713343560695648, -0.01605672389268875, -0.015400105156004429, -0.014743486419320107, -0.014086867682635784, -0.013430248945951462, -0.01277363020926714, -0.012117011472582817, -0.011460392735898495, -0.010803773999214172, -0.01014715526252985, -0.009490536525845528, -0.008833917789161205, -0.008177299052476883, -0.007520680315792561, -0.006864061579108238, -0.006207442842423916, -0.0055508241057395935, -0.004894205369055271, -0.004237586632370949, -0.0035809678956866264, -0.002924349159002304, -0.0022677304223179817, -0.0016111116856336594, -0.000954492948949337, -0.00029787421226501465, 0.0003587445244193077, 0.00101536326110363, 0.0016719819977879524, 0.0023286007344722748, 0.002985219471156597, 0.0036418382078409195, 0.004298456944525242, 0.004955075681209564, 0.0056116944178938866, 0.006268313154578209, 0.006924931891262531, 0.007581550627946854, 0.008238169364631176, 0.008894788101315498, 0.00955140683799982, 0.010208025574684143, 0.010864644311368465, 0.011521263048052788, 0.01217788178473711, 0.012834500521421432, 0.013491119258105755, 0.014147737994790077, 0.0148043567314744, 0.015460975468158722, 0.01611759513616562, 0.016774212941527367, 0.017430830746889114, 0.01808745041489601, 0.01874407008290291, 0.019400687888264656, 0.020057305693626404, 0.0207139253616333]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 6.0, 6.0, 2.0, 3.0, 7.0, 7.0, 11.0, 17.0, 15.0, 17.0, 18.0, 26.0, 29.0, 25.0, 36.0, 34.0, 35.0, 29.0, 54.0, 41.0, 46.0, 30.0, 35.0, 44.0, 43.0, 39.0, 42.0, 48.0, 39.0, 33.0, 16.0, 23.0, 17.0, 27.0, 14.0, 20.0, 14.0, 12.0, 6.0, 10.0, 7.0, 3.0, 4.0, 8.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.8046875, -4.65557861328125, -4.5064697265625, -4.35736083984375, -4.208251953125, -4.05914306640625, -3.9100341796875, -3.76092529296875, -3.61181640625, -3.46270751953125, -3.3135986328125, -3.16448974609375, -3.015380859375, -2.86627197265625, -2.7171630859375, -2.56805419921875, -2.4189453125, -2.26983642578125, -2.1207275390625, -1.97161865234375, -1.822509765625, -1.67340087890625, -1.5242919921875, -1.37518310546875, -1.22607421875, -1.07696533203125, -0.9278564453125, -0.77874755859375, -0.629638671875, -0.48052978515625, -0.3314208984375, -0.18231201171875, -0.033203125, 0.11590576171875, 0.2650146484375, 0.41412353515625, 0.563232421875, 0.71234130859375, 0.8614501953125, 1.01055908203125, 1.15966796875, 1.30877685546875, 1.4578857421875, 1.60699462890625, 1.756103515625, 1.90521240234375, 2.0543212890625, 2.20343017578125, 2.3525390625, 2.50164794921875, 2.6507568359375, 2.79986572265625, 2.948974609375, 3.09808349609375, 3.2471923828125, 3.39630126953125, 3.54541015625, 3.69451904296875, 3.8436279296875, 3.99273681640625, 4.141845703125, 4.29095458984375, 4.4400634765625, 4.58917236328125, 4.73828125]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 9.0, 5.0, 4.0, 18.0, 13.0, 12.0, 23.0, 36.0, 49.0, 63.0, 99.0, 124.0, 197.0, 349.0, 496.0, 883.0, 1597.0, 3229.0, 6294.0, 13185.0, 28164.0, 61443.0, 145171.0, 390835.0, 229705.0, 89480.0, 40107.0, 18634.0, 8948.0, 4365.0, 2103.0, 1104.0, 605.0, 402.0, 241.0, 155.0, 115.0, 86.0, 49.0, 45.0, 26.0, 16.0, 17.0, 12.0, 16.0, 9.0, 10.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-4.765625, -4.61541748046875, -4.4652099609375, -4.31500244140625, -4.164794921875, -4.01458740234375, -3.8643798828125, -3.71417236328125, -3.56396484375, -3.41375732421875, -3.2635498046875, -3.11334228515625, -2.963134765625, -2.81292724609375, -2.6627197265625, -2.51251220703125, -2.3623046875, -2.21209716796875, -2.0618896484375, -1.91168212890625, -1.761474609375, -1.61126708984375, -1.4610595703125, -1.31085205078125, -1.16064453125, -1.01043701171875, -0.8602294921875, -0.71002197265625, -0.559814453125, -0.40960693359375, -0.2593994140625, -0.10919189453125, 0.041015625, 0.19122314453125, 0.3414306640625, 0.49163818359375, 0.641845703125, 0.79205322265625, 0.9422607421875, 1.09246826171875, 1.24267578125, 1.39288330078125, 1.5430908203125, 1.69329833984375, 1.843505859375, 1.99371337890625, 2.1439208984375, 2.29412841796875, 2.4443359375, 2.59454345703125, 2.7447509765625, 2.89495849609375, 3.045166015625, 3.19537353515625, 3.3455810546875, 3.49578857421875, 3.64599609375, 3.79620361328125, 3.9464111328125, 4.09661865234375, 4.246826171875, 4.39703369140625, 4.5472412109375, 4.69744873046875, 4.84765625]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 3.0, 6.0, 7.0, 5.0, 3.0, 13.0, 9.0, 13.0, 18.0, 29.0, 33.0, 33.0, 32.0, 45.0, 62.0, 60.0, 77.0, 85.0, 317.0, 1581.0, 174.0, 77.0, 58.0, 43.0, 42.0, 32.0, 35.0, 26.0, 27.0, 27.0, 23.0, 10.0, 6.0, 10.0, 10.0, 7.0, 4.0, 6.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.03125, -17.488525390625, -16.94580078125, -16.403076171875, -15.8603515625, -15.317626953125, -14.77490234375, -14.232177734375, -13.689453125, -13.146728515625, -12.60400390625, -12.061279296875, -11.5185546875, -10.975830078125, -10.43310546875, -9.890380859375, -9.34765625, -8.804931640625, -8.26220703125, -7.719482421875, -7.1767578125, -6.634033203125, -6.09130859375, -5.548583984375, -5.005859375, -4.463134765625, -3.92041015625, -3.377685546875, -2.8349609375, -2.292236328125, -1.74951171875, -1.206787109375, -0.6640625, -0.121337890625, 0.42138671875, 0.964111328125, 1.5068359375, 2.049560546875, 2.59228515625, 3.135009765625, 3.677734375, 4.220458984375, 4.76318359375, 5.305908203125, 5.8486328125, 6.391357421875, 6.93408203125, 7.476806640625, 8.01953125, 8.562255859375, 9.10498046875, 9.647705078125, 10.1904296875, 10.733154296875, 11.27587890625, 11.818603515625, 12.361328125, 12.904052734375, 13.44677734375, 13.989501953125, 14.5322265625, 15.074951171875, 15.61767578125, 16.160400390625, 16.703125]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 11.0, 19.0, 15.0, 19.0, 25.0, 28.0, 41.0, 57.0, 65.0, 80.0, 147.0, 176.0, 308.0, 554.0, 1866.0, 44160.0, 3057612.0, 37135.0, 1840.0, 570.0, 287.0, 192.0, 112.0, 87.0, 75.0, 53.0, 44.0, 28.0, 23.0, 19.0, 19.0, 6.0, 9.0, 10.0, 7.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-44.4375, -43.18505859375, -41.9326171875, -40.68017578125, -39.427734375, -38.17529296875, -36.9228515625, -35.67041015625, -34.41796875, -33.16552734375, -31.9130859375, -30.66064453125, -29.408203125, -28.15576171875, -26.9033203125, -25.65087890625, -24.3984375, -23.14599609375, -21.8935546875, -20.64111328125, -19.388671875, -18.13623046875, -16.8837890625, -15.63134765625, -14.37890625, -13.12646484375, -11.8740234375, -10.62158203125, -9.369140625, -8.11669921875, -6.8642578125, -5.61181640625, -4.359375, -3.10693359375, -1.8544921875, -0.60205078125, 0.650390625, 1.90283203125, 3.1552734375, 4.40771484375, 5.66015625, 6.91259765625, 8.1650390625, 9.41748046875, 10.669921875, 11.92236328125, 13.1748046875, 14.42724609375, 15.6796875, 16.93212890625, 18.1845703125, 19.43701171875, 20.689453125, 21.94189453125, 23.1943359375, 24.44677734375, 25.69921875, 26.95166015625, 28.2041015625, 29.45654296875, 30.708984375, 31.96142578125, 33.2138671875, 34.46630859375, 35.71875]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 38.0, 120.0, 250.0, 328.0, 199.0, 60.0, 11.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.499195098876953, -20.797929763793945, -19.09666633605957, -17.395401000976562, -15.694136619567871, -13.99287223815918, -12.291606903076172, -10.59034252166748, -8.889078140258789, -7.187813758850098, -5.486548900604248, -3.7852840423583984, -2.084019660949707, -0.3827552795410156, 1.3185100555419922, 3.0197744369506836, 4.721038818359375, 6.422303199768066, 8.123567581176758, 9.824832916259766, 11.526097297668457, 13.227361679077148, 14.928627014160156, 16.62989044189453, 18.33115577697754, 20.032421112060547, 21.733684539794922, 23.43494987487793, 25.136215209960938, 26.837478637695312, 28.53874397277832, 30.240009307861328, 31.941268920898438, 33.64253234863281, 35.34379959106445, 37.04506301879883, 38.7463264465332, 40.447593688964844, 42.14885711669922, 43.850120544433594, 45.55138397216797, 47.252647399902344, 48.953914642333984, 50.65517807006836, 52.356441497802734, 54.057708740234375, 55.75897216796875, 57.460235595703125, 59.161502838134766, 60.86276626586914, 62.56403350830078, 64.26529693603516, 65.96656036376953, 67.6678237915039, 69.36909484863281, 71.07035827636719, 72.77162170410156, 74.47288513183594, 76.17414855957031, 77.87541198730469, 79.5766830444336, 81.27794647216797, 82.97920989990234, 84.68047332763672, 86.3817367553711]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 3.0, 0.0, 4.0, 3.0, 12.0, 5.0, 11.0, 10.0, 10.0, 11.0, 12.0, 26.0, 18.0, 28.0, 23.0, 36.0, 33.0, 26.0, 41.0, 33.0, 39.0, 35.0, 28.0, 38.0, 28.0, 48.0, 46.0, 37.0, 37.0, 40.0, 32.0, 30.0, 36.0, 23.0, 31.0, 17.0, 24.0, 15.0, 17.0, 13.0, 10.0, 12.0, 6.0, 2.0, 6.0, 7.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.065216064453125, -33.90144729614258, -32.73767852783203, -31.57390785217285, -30.410139083862305, -29.246370315551758, -28.082599639892578, -26.91883087158203, -25.755062103271484, -24.591293334960938, -23.42752456665039, -22.26375389099121, -21.099985122680664, -19.936216354370117, -18.772445678710938, -17.60867691040039, -16.444908142089844, -15.281139373779297, -14.117369651794434, -12.95359992980957, -11.789831161499023, -10.626062393188477, -9.462292671203613, -8.29852294921875, -7.134754180908203, -5.970984935760498, -4.807215690612793, -3.643446445465088, -2.479677200317383, -1.3159079551696777, -0.15213871002197266, 1.0116310119628906, 2.1753997802734375, 3.3391690254211426, 4.502938270568848, 5.666707515716553, 6.830476760864258, 7.994246006011963, 9.158015251159668, 10.321784973144531, 11.485553741455078, 12.649322509765625, 13.813092231750488, 14.976861953735352, 16.1406307220459, 17.304399490356445, 18.468170166015625, 19.631938934326172, 20.79570770263672, 21.959476470947266, 23.123245239257812, 24.287015914916992, 25.45078468322754, 26.614553451538086, 27.778324127197266, 28.942092895507812, 30.10586166381836, 31.269630432128906, 32.43339920043945, 33.59716796875, 34.76094055175781, 35.92470932006836, 37.088478088378906, 38.25224685668945, 39.416015625]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 3.0, 4.0, 7.0, 4.0, 3.0, 5.0, 10.0, 14.0, 13.0, 17.0, 12.0, 22.0, 19.0, 25.0, 32.0, 31.0, 35.0, 34.0, 39.0, 57.0, 35.0, 38.0, 40.0, 38.0, 39.0, 36.0, 40.0, 41.0, 41.0, 31.0, 30.0, 33.0, 21.0, 25.0, 16.0, 19.0, 20.0, 18.0, 13.0, 7.0, 9.0, 5.0, 9.0, 6.0, 5.0, 4.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-5.01953125, -4.86456298828125, -4.7095947265625, -4.55462646484375, -4.399658203125, -4.24468994140625, -4.0897216796875, -3.93475341796875, -3.77978515625, -3.62481689453125, -3.4698486328125, -3.31488037109375, -3.159912109375, -3.00494384765625, -2.8499755859375, -2.69500732421875, -2.5400390625, -2.38507080078125, -2.2301025390625, -2.07513427734375, -1.920166015625, -1.76519775390625, -1.6102294921875, -1.45526123046875, -1.30029296875, -1.14532470703125, -0.9903564453125, -0.83538818359375, -0.680419921875, -0.52545166015625, -0.3704833984375, -0.21551513671875, -0.060546875, 0.09442138671875, 0.2493896484375, 0.40435791015625, 0.559326171875, 0.71429443359375, 0.8692626953125, 1.02423095703125, 1.17919921875, 1.33416748046875, 1.4891357421875, 1.64410400390625, 1.799072265625, 1.95404052734375, 2.1090087890625, 2.26397705078125, 2.4189453125, 2.57391357421875, 2.7288818359375, 2.88385009765625, 3.038818359375, 3.19378662109375, 3.3487548828125, 3.50372314453125, 3.65869140625, 3.81365966796875, 3.9686279296875, 4.12359619140625, 4.278564453125, 4.43353271484375, 4.5885009765625, 4.74346923828125, 4.8984375]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 3.0, 8.0, 6.0, 11.0, 4.0, 10.0, 14.0, 10.0, 20.0, 21.0, 22.0, 36.0, 63.0, 119.0, 149.0, 385.0, 947.0, 2463.0, 8043.0, 34865.0, 267495.0, 2316237.0, 1404010.0, 130073.0, 20653.0, 5366.0, 1747.0, 731.0, 303.0, 152.0, 77.0, 51.0, 32.0, 25.0, 25.0, 21.0, 18.0, 12.0, 8.0, 10.0, 7.0, 4.0, 2.0, 6.0, 5.0, 4.0, 6.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-13.078125, -12.679931640625, -12.28173828125, -11.883544921875, -11.4853515625, -11.087158203125, -10.68896484375, -10.290771484375, -9.892578125, -9.494384765625, -9.09619140625, -8.697998046875, -8.2998046875, -7.901611328125, -7.50341796875, -7.105224609375, -6.70703125, -6.308837890625, -5.91064453125, -5.512451171875, -5.1142578125, -4.716064453125, -4.31787109375, -3.919677734375, -3.521484375, -3.123291015625, -2.72509765625, -2.326904296875, -1.9287109375, -1.530517578125, -1.13232421875, -0.734130859375, -0.3359375, 0.062255859375, 0.46044921875, 0.858642578125, 1.2568359375, 1.655029296875, 2.05322265625, 2.451416015625, 2.849609375, 3.247802734375, 3.64599609375, 4.044189453125, 4.4423828125, 4.840576171875, 5.23876953125, 5.636962890625, 6.03515625, 6.433349609375, 6.83154296875, 7.229736328125, 7.6279296875, 8.026123046875, 8.42431640625, 8.822509765625, 9.220703125, 9.618896484375, 10.01708984375, 10.415283203125, 10.8134765625, 11.211669921875, 11.60986328125, 12.008056640625, 12.40625]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 7.0, 2.0, 2.0, 10.0, 8.0, 15.0, 24.0, 23.0, 49.0, 63.0, 119.0, 179.0, 285.0, 455.0, 696.0, 710.0, 517.0, 341.0, 212.0, 121.0, 69.0, 58.0, 37.0, 14.0, 14.0, 22.0, 9.0, 8.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-20.234375, -19.7427978515625, -19.251220703125, -18.7596435546875, -18.26806640625, -17.7764892578125, -17.284912109375, -16.7933349609375, -16.3017578125, -15.8101806640625, -15.318603515625, -14.8270263671875, -14.33544921875, -13.8438720703125, -13.352294921875, -12.8607177734375, -12.369140625, -11.8775634765625, -11.385986328125, -10.8944091796875, -10.40283203125, -9.9112548828125, -9.419677734375, -8.9281005859375, -8.4365234375, -7.9449462890625, -7.453369140625, -6.9617919921875, -6.47021484375, -5.9786376953125, -5.487060546875, -4.9954833984375, -4.50390625, -4.0123291015625, -3.520751953125, -3.0291748046875, -2.53759765625, -2.0460205078125, -1.554443359375, -1.0628662109375, -0.5712890625, -0.0797119140625, 0.411865234375, 0.9034423828125, 1.39501953125, 1.8865966796875, 2.378173828125, 2.8697509765625, 3.361328125, 3.8529052734375, 4.344482421875, 4.8360595703125, 5.32763671875, 5.8192138671875, 6.310791015625, 6.8023681640625, 7.2939453125, 7.7855224609375, 8.277099609375, 8.7686767578125, 9.26025390625, 9.7518310546875, 10.243408203125, 10.7349853515625, 11.2265625]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 8.0, 7.0, 24.0, 15.0, 18.0, 33.0, 67.0, 87.0, 168.0, 360.0, 957.0, 5226.0, 1166267.0, 3012191.0, 6857.0, 1081.0, 406.0, 212.0, 113.0, 67.0, 32.0, 22.0, 25.0, 10.0, 8.0, 4.0, 2.0, 8.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-58.03125, -55.51416015625, -52.9970703125, -50.47998046875, -47.962890625, -45.44580078125, -42.9287109375, -40.41162109375, -37.89453125, -35.37744140625, -32.8603515625, -30.34326171875, -27.826171875, -25.30908203125, -22.7919921875, -20.27490234375, -17.7578125, -15.24072265625, -12.7236328125, -10.20654296875, -7.689453125, -5.17236328125, -2.6552734375, -0.13818359375, 2.37890625, 4.89599609375, 7.4130859375, 9.93017578125, 12.447265625, 14.96435546875, 17.4814453125, 19.99853515625, 22.515625, 25.03271484375, 27.5498046875, 30.06689453125, 32.583984375, 35.10107421875, 37.6181640625, 40.13525390625, 42.65234375, 45.16943359375, 47.6865234375, 50.20361328125, 52.720703125, 55.23779296875, 57.7548828125, 60.27197265625, 62.7890625, 65.30615234375, 67.8232421875, 70.34033203125, 72.857421875, 75.37451171875, 77.8916015625, 80.40869140625, 82.92578125, 85.44287109375, 87.9599609375, 90.47705078125, 92.994140625, 95.51123046875, 98.0283203125, 100.54541015625, 103.0625]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 11.0, 27.0, 54.0, 100.0, 138.0, 164.0, 207.0, 139.0, 86.0, 34.0, 25.0, 15.0, 4.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.94692611694336, -41.362361907958984, -38.77779769897461, -36.193233489990234, -33.60866928100586, -31.024105072021484, -28.439542770385742, -25.854978561401367, -23.270414352416992, -20.685850143432617, -18.101285934448242, -15.516722679138184, -12.932158470153809, -10.347594261169434, -7.763031005859375, -5.178466796875, -2.593902587890625, -0.009338617324829102, 2.575225353240967, 5.159789085388184, 7.744353294372559, 10.328917503356934, 12.913480758666992, 15.498044967651367, 18.082609176635742, 20.667173385620117, 23.251737594604492, 25.836299896240234, 28.42086410522461, 31.005428314208984, 33.58999252319336, 36.174556732177734, 38.759117126464844, 41.34368133544922, 43.928245544433594, 46.51280975341797, 49.097373962402344, 51.68193817138672, 54.266502380371094, 56.85106658935547, 59.435630798339844, 62.02019500732422, 64.6047592163086, 67.18932342529297, 69.77388763427734, 72.35845184326172, 74.9430160522461, 77.52758026123047, 80.11213684082031, 82.69670104980469, 85.28126525878906, 87.86582946777344, 90.45039367675781, 93.03495788574219, 95.61952209472656, 98.20408630371094, 100.78865051269531, 103.37321472167969, 105.95777893066406, 108.54234313964844, 111.12690734863281, 113.71147155761719, 116.29603576660156, 118.88059997558594, 121.46516418457031]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 4.0, 3.0, 3.0, 3.0, 4.0, 7.0, 9.0, 12.0, 14.0, 13.0, 22.0, 21.0, 16.0, 34.0, 26.0, 33.0, 33.0, 41.0, 34.0, 44.0, 45.0, 37.0, 35.0, 57.0, 46.0, 45.0, 44.0, 23.0, 46.0, 30.0, 18.0, 38.0, 24.0, 19.0, 27.0, 16.0, 13.0, 10.0, 8.0, 10.0, 11.0, 8.0, 5.0, 9.0, 3.0, 4.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-35.99497985839844, -34.83114242553711, -33.667301177978516, -32.50346374511719, -31.33962631225586, -30.1757869720459, -29.011947631835938, -27.84811019897461, -26.68427085876465, -25.520431518554688, -24.35659408569336, -23.1927547454834, -22.028915405273438, -20.86507797241211, -19.70123863220215, -18.537399291992188, -17.37356185913086, -16.2097225189209, -15.04588508605957, -13.88204574584961, -12.718207359313965, -11.55436897277832, -10.39052963256836, -9.226691246032715, -8.06285285949707, -6.899014472961426, -5.735175609588623, -4.57133674621582, -3.407498359680176, -2.2436599731445312, -1.0798211097717285, 0.08401775360107422, 1.2478561401367188, 2.4116947650909424, 3.575533390045166, 4.739372253417969, 5.903210639953613, 7.067049026489258, 8.230888366699219, 9.394726753234863, 10.558565139770508, 11.722403526306152, 12.886241912841797, 14.050081253051758, 15.213919639587402, 16.377758026123047, 17.541597366333008, 18.70543670654297, 19.869274139404297, 21.033113479614258, 22.196950912475586, 23.360790252685547, 24.524627685546875, 25.688467025756836, 26.852306365966797, 28.016143798828125, 29.179983139038086, 30.343822479248047, 31.507659912109375, 32.6714973449707, 33.8353385925293, 34.999176025390625, 36.16301345825195, 37.32685470581055, 38.490692138671875]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 3.0, 5.0, 2.0, 6.0, 17.0, 11.0, 13.0, 12.0, 14.0, 22.0, 20.0, 20.0, 37.0, 38.0, 38.0, 30.0, 40.0, 47.0, 40.0, 42.0, 41.0, 46.0, 50.0, 35.0, 47.0, 45.0, 26.0, 18.0, 36.0, 31.0, 24.0, 24.0, 17.0, 17.0, 21.0, 11.0, 11.0, 5.0, 6.0, 4.0, 10.0, 8.0, 1.0, 2.0, 8.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.3203125, -5.1534423828125, -4.986572265625, -4.8197021484375, -4.65283203125, -4.4859619140625, -4.319091796875, -4.1522216796875, -3.9853515625, -3.8184814453125, -3.651611328125, -3.4847412109375, -3.31787109375, -3.1510009765625, -2.984130859375, -2.8172607421875, -2.650390625, -2.4835205078125, -2.316650390625, -2.1497802734375, -1.98291015625, -1.8160400390625, -1.649169921875, -1.4822998046875, -1.3154296875, -1.1485595703125, -0.981689453125, -0.8148193359375, -0.64794921875, -0.4810791015625, -0.314208984375, -0.1473388671875, 0.01953125, 0.1864013671875, 0.353271484375, 0.5201416015625, 0.68701171875, 0.8538818359375, 1.020751953125, 1.1876220703125, 1.3544921875, 1.5213623046875, 1.688232421875, 1.8551025390625, 2.02197265625, 2.1888427734375, 2.355712890625, 2.5225830078125, 2.689453125, 2.8563232421875, 3.023193359375, 3.1900634765625, 3.35693359375, 3.5238037109375, 3.690673828125, 3.8575439453125, 4.0244140625, 4.1912841796875, 4.358154296875, 4.5250244140625, 4.69189453125, 4.8587646484375, 5.025634765625, 5.1925048828125, 5.359375]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 11.0, 13.0, 18.0, 20.0, 27.0, 50.0, 79.0, 132.0, 232.0, 381.0, 671.0, 1185.0, 2235.0, 3826.0, 7362.0, 14598.0, 28475.0, 57530.0, 113116.0, 209025.0, 257939.0, 170932.0, 89826.0, 44623.0, 21948.0, 11223.0, 5916.0, 3204.0, 1694.0, 926.0, 518.0, 326.0, 174.0, 105.0, 75.0, 61.0, 30.0, 15.0, 10.0, 8.0, 4.0, 1.0, 3.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.125, -1.0931472778320312, -1.0612945556640625, -1.0294418334960938, -0.997589111328125, -0.9657363891601562, -0.9338836669921875, -0.9020309448242188, -0.87017822265625, -0.8383255004882812, -0.8064727783203125, -0.7746200561523438, -0.742767333984375, -0.7109146118164062, -0.6790618896484375, -0.6472091674804688, -0.6153564453125, -0.5835037231445312, -0.5516510009765625, -0.5197982788085938, -0.487945556640625, -0.45609283447265625, -0.4242401123046875, -0.39238739013671875, -0.36053466796875, -0.32868194580078125, -0.2968292236328125, -0.26497650146484375, -0.233123779296875, -0.20127105712890625, -0.1694183349609375, -0.13756561279296875, -0.105712890625, -0.07386016845703125, -0.0420074462890625, -0.01015472412109375, 0.021697998046875, 0.05355072021484375, 0.0854034423828125, 0.11725616455078125, 0.14910888671875, 0.18096160888671875, 0.2128143310546875, 0.24466705322265625, 0.276519775390625, 0.30837249755859375, 0.3402252197265625, 0.37207794189453125, 0.4039306640625, 0.43578338623046875, 0.4676361083984375, 0.49948883056640625, 0.531341552734375, 0.5631942749023438, 0.5950469970703125, 0.6268997192382812, 0.65875244140625, 0.6906051635742188, 0.7224578857421875, 0.7543106079101562, 0.786163330078125, 0.8180160522460938, 0.8498687744140625, 0.8817214965820312, 0.91357421875]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 6.0, 2.0, 1.0, 3.0, 3.0, 7.0, 4.0, 11.0, 14.0, 15.0, 14.0, 27.0, 16.0, 17.0, 17.0, 34.0, 32.0, 36.0, 43.0, 30.0, 29.0, 42.0, 37.0, 39.0, 1057.0, 58.0, 28.0, 47.0, 54.0, 41.0, 27.0, 28.0, 22.0, 37.0, 25.0, 20.0, 10.0, 18.0, 21.0, 11.0, 14.0, 10.0, 7.0, 7.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 3.0], "bins": [-4.06640625, -3.951995849609375, -3.83758544921875, -3.723175048828125, -3.6087646484375, -3.494354248046875, -3.37994384765625, -3.265533447265625, -3.151123046875, -3.036712646484375, -2.92230224609375, -2.807891845703125, -2.6934814453125, -2.579071044921875, -2.46466064453125, -2.350250244140625, -2.23583984375, -2.121429443359375, -2.00701904296875, -1.892608642578125, -1.7781982421875, -1.663787841796875, -1.54937744140625, -1.434967041015625, -1.320556640625, -1.206146240234375, -1.09173583984375, -0.977325439453125, -0.8629150390625, -0.748504638671875, -0.63409423828125, -0.519683837890625, -0.4052734375, -0.290863037109375, -0.17645263671875, -0.062042236328125, 0.0523681640625, 0.166778564453125, 0.28118896484375, 0.395599365234375, 0.510009765625, 0.624420166015625, 0.73883056640625, 0.853240966796875, 0.9676513671875, 1.082061767578125, 1.19647216796875, 1.310882568359375, 1.42529296875, 1.539703369140625, 1.65411376953125, 1.768524169921875, 1.8829345703125, 1.997344970703125, 2.11175537109375, 2.226165771484375, 2.340576171875, 2.454986572265625, 2.56939697265625, 2.683807373046875, 2.7982177734375, 2.912628173828125, 3.02703857421875, 3.141448974609375, 3.255859375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 4.0, 8.0, 12.0, 14.0, 25.0, 27.0, 65.0, 68.0, 105.0, 150.0, 253.0, 325.0, 560.0, 896.0, 1315.0, 2043.0, 3131.0, 4704.0, 7517.0, 11993.0, 19306.0, 31047.0, 50130.0, 78822.0, 116735.0, 183867.0, 1179256.0, 138568.0, 97062.0, 63027.0, 39509.0, 24592.0, 15246.0, 9664.0, 6108.0, 3799.0, 2541.0, 1601.0, 1003.0, 675.0, 443.0, 285.0, 213.0, 132.0, 110.0, 68.0, 36.0, 32.0, 16.0, 10.0, 12.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.380615234375, -0.36803436279296875, -0.3554534912109375, -0.34287261962890625, -0.330291748046875, -0.31771087646484375, -0.3051300048828125, -0.29254913330078125, -0.27996826171875, -0.26738739013671875, -0.2548065185546875, -0.24222564697265625, -0.229644775390625, -0.21706390380859375, -0.2044830322265625, -0.19190216064453125, -0.1793212890625, -0.16674041748046875, -0.1541595458984375, -0.14157867431640625, -0.128997802734375, -0.11641693115234375, -0.1038360595703125, -0.09125518798828125, -0.07867431640625, -0.06609344482421875, -0.0535125732421875, -0.04093170166015625, -0.028350830078125, -0.01576995849609375, -0.0031890869140625, 0.00939178466796875, 0.02197265625, 0.03455352783203125, 0.0471343994140625, 0.05971527099609375, 0.072296142578125, 0.08487701416015625, 0.0974578857421875, 0.11003875732421875, 0.12261962890625, 0.13520050048828125, 0.1477813720703125, 0.16036224365234375, 0.172943115234375, 0.18552398681640625, 0.1981048583984375, 0.21068572998046875, 0.2232666015625, 0.23584747314453125, 0.2484283447265625, 0.26100921630859375, 0.273590087890625, 0.28617095947265625, 0.2987518310546875, 0.31133270263671875, 0.32391357421875, 0.33649444580078125, 0.3490753173828125, 0.36165618896484375, 0.374237060546875, 0.38681793212890625, 0.3993988037109375, 0.41197967529296875, 0.424560546875]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 3.0, 0.0, 4.0, 4.0, 3.0, 3.0, 11.0, 1.0, 9.0, 6.0, 15.0, 15.0, 24.0, 27.0, 42.0, 65.0, 82.0, 114.0, 139.0, 115.0, 90.0, 68.0, 37.0, 26.0, 25.0, 18.0, 12.0, 4.0, 5.0, 7.0, 2.0, 4.0, 4.0, 4.0, 4.0, 2.0, 2.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.029541015625, -0.02854633331298828, -0.027551651000976562, -0.026556968688964844, -0.025562286376953125, -0.024567604064941406, -0.023572921752929688, -0.02257823944091797, -0.02158355712890625, -0.02058887481689453, -0.019594192504882812, -0.018599510192871094, -0.017604827880859375, -0.016610145568847656, -0.015615463256835938, -0.014620780944824219, -0.0136260986328125, -0.012631416320800781, -0.011636734008789062, -0.010642051696777344, -0.009647369384765625, -0.008652687072753906, -0.0076580047607421875, -0.006663322448730469, -0.00566864013671875, -0.004673957824707031, -0.0036792755126953125, -0.0026845932006835938, -0.001689910888671875, -0.0006952285766601562, 0.0002994537353515625, 0.0012941360473632812, 0.002288818359375, 0.0032835006713867188, 0.0042781829833984375, 0.005272865295410156, 0.006267547607421875, 0.007262229919433594, 0.008256912231445312, 0.009251594543457031, 0.01024627685546875, 0.011240959167480469, 0.012235641479492188, 0.013230323791503906, 0.014225006103515625, 0.015219688415527344, 0.016214370727539062, 0.01720905303955078, 0.0182037353515625, 0.01919841766357422, 0.020193099975585938, 0.021187782287597656, 0.022182464599609375, 0.023177146911621094, 0.024171829223632812, 0.02516651153564453, 0.02616119384765625, 0.02715587615966797, 0.028150558471679688, 0.029145240783691406, 0.030139923095703125, 0.031134605407714844, 0.03212928771972656, 0.03312397003173828, 0.03411865234375]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 4.0, 1.0, 4.0, 4.0, 6.0, 6.0, 7.0, 8.0, 12.0, 16.0, 18.0, 30.0, 45.0, 95.0, 186.0, 693.0, 4123.0, 96264.0, 931797.0, 13005.0, 1518.0, 351.0, 137.0, 65.0, 43.0, 33.0, 20.0, 12.0, 8.0, 8.0, 7.0, 7.0, 7.0, 3.0, 0.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.73486328125, -0.7127532958984375, -0.690643310546875, -0.6685333251953125, -0.64642333984375, -0.6243133544921875, -0.602203369140625, -0.5800933837890625, -0.5579833984375, -0.5358734130859375, -0.513763427734375, -0.4916534423828125, -0.46954345703125, -0.4474334716796875, -0.425323486328125, -0.4032135009765625, -0.381103515625, -0.3589935302734375, -0.336883544921875, -0.3147735595703125, -0.29266357421875, -0.2705535888671875, -0.248443603515625, -0.2263336181640625, -0.2042236328125, -0.1821136474609375, -0.160003662109375, -0.1378936767578125, -0.11578369140625, -0.0936737060546875, -0.071563720703125, -0.0494537353515625, -0.02734375, -0.0052337646484375, 0.016876220703125, 0.0389862060546875, 0.06109619140625, 0.0832061767578125, 0.105316162109375, 0.1274261474609375, 0.1495361328125, 0.1716461181640625, 0.193756103515625, 0.2158660888671875, 0.23797607421875, 0.2600860595703125, 0.282196044921875, 0.3043060302734375, 0.326416015625, 0.3485260009765625, 0.370635986328125, 0.3927459716796875, 0.41485595703125, 0.4369659423828125, 0.459075927734375, 0.4811859130859375, 0.5032958984375, 0.5254058837890625, 0.547515869140625, 0.5696258544921875, 0.59173583984375, 0.6138458251953125, 0.635955810546875, 0.6580657958984375, 0.68017578125]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 3.0, 3.0, 3.0, 11.0, 13.0, 9.0, 10.0, 19.0, 20.0, 32.0, 47.0, 49.0, 65.0, 105.0, 189.0, 159.0, 77.0, 67.0, 53.0, 22.0, 12.0, 9.0, 9.0, 5.0, 2.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09589116275310516, -0.09267681837081909, -0.08946247398853302, -0.08624812960624695, -0.08303378522396088, -0.0798194408416748, -0.07660509645938873, -0.07339075207710266, -0.07017640769481659, -0.06696206331253052, -0.06374771893024445, -0.060533374547958374, -0.0573190301656723, -0.05410468578338623, -0.05089034140110016, -0.04767599701881409, -0.04446164891123772, -0.041247304528951645, -0.03803296014666557, -0.0348186157643795, -0.03160427138209343, -0.02838992513716221, -0.025175580754876137, -0.021961236372590065, -0.018746891990303993, -0.015532547608017921, -0.01231820322573185, -0.009103857912123203, -0.0058895135298371315, -0.002675168216228485, 0.0005391761660575867, 0.0037535205483436584, 0.00696786493062973, 0.010182209312915802, 0.013396553695201874, 0.016610898077487946, 0.019825242459774017, 0.02303958870470524, 0.02625393308699131, 0.029468277469277382, 0.032682619988918304, 0.035896964371204376, 0.03911130875349045, 0.04232565313577652, 0.04553999751806259, 0.04875434190034866, 0.051968686282634735, 0.05518303066492081, 0.05839737877249718, 0.06161172315478325, 0.06482607126235962, 0.06804041564464569, 0.07125476002693176, 0.07446910440921783, 0.0776834487915039, 0.08089779317378998, 0.08411213755607605, 0.08732648193836212, 0.0905408263206482, 0.09375517070293427, 0.09696951508522034, 0.10018385946750641, 0.10339820384979248, 0.10661254823207855, 0.10982689261436462]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 1.0, 6.0, 6.0, 8.0, 10.0, 10.0, 20.0, 19.0, 24.0, 29.0, 28.0, 35.0, 44.0, 27.0, 49.0, 40.0, 41.0, 40.0, 34.0, 49.0, 39.0, 46.0, 48.0, 60.0, 41.0, 36.0, 41.0, 29.0, 18.0, 27.0, 20.0, 15.0, 10.0, 20.0, 12.0, 4.0, 5.0, 1.0, 4.0, 5.0, 0.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.018271148204803467, -0.01762533187866211, -0.016979515552520752, -0.016333699226379395, -0.015687882900238037, -0.01504206657409668, -0.014396250247955322, -0.013750433921813965, -0.013104617595672607, -0.01245880126953125, -0.011812984943389893, -0.011167168617248535, -0.010521352291107178, -0.00987553596496582, -0.009229719638824463, -0.008583903312683105, -0.007938086986541748, -0.007292270660400391, -0.006646454334259033, -0.006000638008117676, -0.005354821681976318, -0.004709005355834961, -0.0040631890296936035, -0.003417372703552246, -0.0027715563774108887, -0.0021257400512695312, -0.0014799237251281738, -0.0008341073989868164, -0.00018829107284545898, 0.00045752525329589844, 0.0011033415794372559, 0.0017491579055786133, 0.0023949742317199707, 0.003040790557861328, 0.0036866068840026855, 0.004332423210144043, 0.0049782395362854, 0.005624055862426758, 0.006269872188568115, 0.006915688514709473, 0.00756150484085083, 0.008207321166992188, 0.008853137493133545, 0.009498953819274902, 0.01014477014541626, 0.010790586471557617, 0.011436402797698975, 0.012082219123840332, 0.01272803544998169, 0.013373851776123047, 0.014019668102264404, 0.014665484428405762, 0.01531130075454712, 0.015957117080688477, 0.016602933406829834, 0.01724874973297119, 0.01789456605911255, 0.018540382385253906, 0.019186198711395264, 0.01983201503753662, 0.02047783136367798, 0.021123647689819336, 0.021769464015960693, 0.02241528034210205, 0.023061096668243408]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 2.0, 5.0, 2.0, 6.0, 17.0, 11.0, 13.0, 12.0, 14.0, 22.0, 20.0, 20.0, 40.0, 35.0, 38.0, 30.0, 41.0, 46.0, 40.0, 44.0, 39.0, 46.0, 50.0, 35.0, 49.0, 44.0, 25.0, 18.0, 36.0, 32.0, 23.0, 24.0, 17.0, 17.0, 21.0, 11.0, 11.0, 5.0, 6.0, 4.0, 10.0, 8.0, 1.0, 2.0, 8.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.31640625, -5.14959716796875, -4.9827880859375, -4.81597900390625, -4.649169921875, -4.48236083984375, -4.3155517578125, -4.14874267578125, -3.98193359375, -3.81512451171875, -3.6483154296875, -3.48150634765625, -3.314697265625, -3.14788818359375, -2.9810791015625, -2.81427001953125, -2.6474609375, -2.48065185546875, -2.3138427734375, -2.14703369140625, -1.980224609375, -1.81341552734375, -1.6466064453125, -1.47979736328125, -1.31298828125, -1.14617919921875, -0.9793701171875, -0.81256103515625, -0.645751953125, -0.47894287109375, -0.3121337890625, -0.14532470703125, 0.021484375, 0.18829345703125, 0.3551025390625, 0.52191162109375, 0.688720703125, 0.85552978515625, 1.0223388671875, 1.18914794921875, 1.35595703125, 1.52276611328125, 1.6895751953125, 1.85638427734375, 2.023193359375, 2.19000244140625, 2.3568115234375, 2.52362060546875, 2.6904296875, 2.85723876953125, 3.0240478515625, 3.19085693359375, 3.357666015625, 3.52447509765625, 3.6912841796875, 3.85809326171875, 4.02490234375, 4.19171142578125, 4.3585205078125, 4.52532958984375, 4.692138671875, 4.85894775390625, 5.0257568359375, 5.19256591796875, 5.359375]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 3.0, 6.0, 6.0, 5.0, 11.0, 17.0, 24.0, 25.0, 27.0, 42.0, 62.0, 84.0, 119.0, 256.0, 348.0, 758.0, 1511.0, 3337.0, 8125.0, 23536.0, 96636.0, 622221.0, 226486.0, 42505.0, 12862.0, 4918.0, 2209.0, 1076.0, 513.0, 273.0, 169.0, 109.0, 72.0, 38.0, 34.0, 36.0, 20.0, 23.0, 9.0, 6.0, 10.0, 8.0, 8.0, 1.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.21875, -8.92822265625, -8.6376953125, -8.34716796875, -8.056640625, -7.76611328125, -7.4755859375, -7.18505859375, -6.89453125, -6.60400390625, -6.3134765625, -6.02294921875, -5.732421875, -5.44189453125, -5.1513671875, -4.86083984375, -4.5703125, -4.27978515625, -3.9892578125, -3.69873046875, -3.408203125, -3.11767578125, -2.8271484375, -2.53662109375, -2.24609375, -1.95556640625, -1.6650390625, -1.37451171875, -1.083984375, -0.79345703125, -0.5029296875, -0.21240234375, 0.078125, 0.36865234375, 0.6591796875, 0.94970703125, 1.240234375, 1.53076171875, 1.8212890625, 2.11181640625, 2.40234375, 2.69287109375, 2.9833984375, 3.27392578125, 3.564453125, 3.85498046875, 4.1455078125, 4.43603515625, 4.7265625, 5.01708984375, 5.3076171875, 5.59814453125, 5.888671875, 6.17919921875, 6.4697265625, 6.76025390625, 7.05078125, 7.34130859375, 7.6318359375, 7.92236328125, 8.212890625, 8.50341796875, 8.7939453125, 9.08447265625, 9.375]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 4.0, 3.0, 5.0, 12.0, 11.0, 18.0, 11.0, 10.0, 18.0, 13.0, 23.0, 30.0, 28.0, 30.0, 33.0, 33.0, 36.0, 43.0, 64.0, 93.0, 281.0, 1597.0, 147.0, 85.0, 57.0, 46.0, 34.0, 42.0, 36.0, 23.0, 26.0, 30.0, 27.0, 15.0, 17.0, 14.0, 9.0, 12.0, 11.0, 6.0, 5.0, 5.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-16.125, -15.59228515625, -15.0595703125, -14.52685546875, -13.994140625, -13.46142578125, -12.9287109375, -12.39599609375, -11.86328125, -11.33056640625, -10.7978515625, -10.26513671875, -9.732421875, -9.19970703125, -8.6669921875, -8.13427734375, -7.6015625, -7.06884765625, -6.5361328125, -6.00341796875, -5.470703125, -4.93798828125, -4.4052734375, -3.87255859375, -3.33984375, -2.80712890625, -2.2744140625, -1.74169921875, -1.208984375, -0.67626953125, -0.1435546875, 0.38916015625, 0.921875, 1.45458984375, 1.9873046875, 2.52001953125, 3.052734375, 3.58544921875, 4.1181640625, 4.65087890625, 5.18359375, 5.71630859375, 6.2490234375, 6.78173828125, 7.314453125, 7.84716796875, 8.3798828125, 8.91259765625, 9.4453125, 9.97802734375, 10.5107421875, 11.04345703125, 11.576171875, 12.10888671875, 12.6416015625, 13.17431640625, 13.70703125, 14.23974609375, 14.7724609375, 15.30517578125, 15.837890625, 16.37060546875, 16.9033203125, 17.43603515625, 17.96875]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 6.0, 5.0, 4.0, 13.0, 16.0, 12.0, 13.0, 19.0, 28.0, 34.0, 35.0, 48.0, 51.0, 70.0, 120.0, 170.0, 319.0, 756.0, 5315.0, 2803224.0, 331362.0, 2712.0, 503.0, 293.0, 137.0, 98.0, 62.0, 53.0, 38.0, 31.0, 27.0, 23.0, 17.0, 16.0, 20.0, 16.0, 10.0, 10.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-55.0625, -53.48388671875, -51.9052734375, -50.32666015625, -48.748046875, -47.16943359375, -45.5908203125, -44.01220703125, -42.43359375, -40.85498046875, -39.2763671875, -37.69775390625, -36.119140625, -34.54052734375, -32.9619140625, -31.38330078125, -29.8046875, -28.22607421875, -26.6474609375, -25.06884765625, -23.490234375, -21.91162109375, -20.3330078125, -18.75439453125, -17.17578125, -15.59716796875, -14.0185546875, -12.43994140625, -10.861328125, -9.28271484375, -7.7041015625, -6.12548828125, -4.546875, -2.96826171875, -1.3896484375, 0.18896484375, 1.767578125, 3.34619140625, 4.9248046875, 6.50341796875, 8.08203125, 9.66064453125, 11.2392578125, 12.81787109375, 14.396484375, 15.97509765625, 17.5537109375, 19.13232421875, 20.7109375, 22.28955078125, 23.8681640625, 25.44677734375, 27.025390625, 28.60400390625, 30.1826171875, 31.76123046875, 33.33984375, 34.91845703125, 36.4970703125, 38.07568359375, 39.654296875, 41.23291015625, 42.8115234375, 44.39013671875, 45.96875]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 120.0, 526.0, 332.0, 33.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.603519439697266, -39.50398254394531, -36.40444564819336, -33.304908752441406, -30.205373764038086, -27.105836868286133, -24.006301879882812, -20.90676498413086, -17.807228088378906, -14.707691192626953, -11.608155250549316, -8.50861930847168, -5.409082412719727, -2.3095455169677734, 0.7899894714355469, 3.8895263671875, 6.989063262939453, 10.088600158691406, 13.188136100769043, 16.28767204284668, 19.387208938598633, 22.486745834350586, 25.586280822753906, 28.68581771850586, 31.785354614257812, 34.884891510009766, 37.98442840576172, 41.083961486816406, 44.183502197265625, 47.28303527832031, 50.382572174072266, 53.48210906982422, 56.58164978027344, 59.68118667602539, 62.780723571777344, 65.88025665283203, 68.97979736328125, 72.07933044433594, 75.17886352539062, 78.27840423583984, 81.37794494628906, 84.47747802734375, 87.57701873779297, 90.67655181884766, 93.77609252929688, 96.87562561035156, 99.97515869140625, 103.07469940185547, 106.17423248291016, 109.27376556396484, 112.37330627441406, 115.47283935546875, 118.57238006591797, 121.67191314697266, 124.77145385742188, 127.87098693847656, 130.97052001953125, 134.07005310058594, 137.16958618164062, 140.26913452148438, 143.36866760253906, 146.46820068359375, 149.56773376464844, 152.66726684570312, 155.76681518554688]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 7.0, 6.0, 10.0, 12.0, 9.0, 10.0, 22.0, 21.0, 16.0, 21.0, 24.0, 28.0, 42.0, 33.0, 33.0, 36.0, 59.0, 44.0, 50.0, 43.0, 41.0, 56.0, 39.0, 45.0, 41.0, 36.0, 30.0, 29.0, 31.0, 33.0, 19.0, 14.0, 17.0, 10.0, 12.0, 4.0, 4.0, 8.0, 3.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-63.52619934082031, -61.83320999145508, -60.140220642089844, -58.44723129272461, -56.754241943359375, -55.061248779296875, -53.368263244628906, -51.675270080566406, -49.98228073120117, -48.28929138183594, -46.5963020324707, -44.90331268310547, -43.210323333740234, -41.517333984375, -39.8243408203125, -38.131351470947266, -36.43836212158203, -34.7453727722168, -33.05238342285156, -31.359394073486328, -29.66640281677246, -27.973413467407227, -26.280424118041992, -24.587432861328125, -22.894447326660156, -21.201457977294922, -19.508468627929688, -17.815479278564453, -16.122488021850586, -14.429498672485352, -12.736509323120117, -11.043519020080566, -9.350528717041016, -7.657538890838623, -5.9645490646362305, -4.271559715270996, -2.5785698890686035, -0.8855800628662109, 0.8074092864990234, 2.500399589538574, 4.193388938903809, 5.886378765106201, 7.579368591308594, 9.272357940673828, 10.965347290039062, 12.658337593078613, 14.351326942443848, 16.0443172454834, 17.737306594848633, 19.430295944213867, 21.1232852935791, 22.81627655029297, 24.509265899658203, 26.202255249023438, 27.895244598388672, 29.588233947753906, 31.28122329711914, 32.974212646484375, 34.66720199584961, 36.360191345214844, 38.05318069458008, 39.74617004394531, 41.43916320800781, 43.13215255737305, 44.82514190673828]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 2.0, 5.0, 4.0, 7.0, 6.0, 12.0, 8.0, 12.0, 16.0, 19.0, 21.0, 27.0, 26.0, 36.0, 32.0, 28.0, 30.0, 38.0, 50.0, 37.0, 50.0, 48.0, 42.0, 38.0, 33.0, 38.0, 41.0, 41.0, 25.0, 25.0, 22.0, 29.0, 21.0, 23.0, 14.0, 14.0, 17.0, 14.0, 6.0, 9.0, 8.0, 7.0, 6.0, 5.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.1875, -5.01373291015625, -4.8399658203125, -4.66619873046875, -4.492431640625, -4.31866455078125, -4.1448974609375, -3.97113037109375, -3.79736328125, -3.62359619140625, -3.4498291015625, -3.27606201171875, -3.102294921875, -2.92852783203125, -2.7547607421875, -2.58099365234375, -2.4072265625, -2.23345947265625, -2.0596923828125, -1.88592529296875, -1.712158203125, -1.53839111328125, -1.3646240234375, -1.19085693359375, -1.01708984375, -0.84332275390625, -0.6695556640625, -0.49578857421875, -0.322021484375, -0.14825439453125, 0.0255126953125, 0.19927978515625, 0.373046875, 0.54681396484375, 0.7205810546875, 0.89434814453125, 1.068115234375, 1.24188232421875, 1.4156494140625, 1.58941650390625, 1.76318359375, 1.93695068359375, 2.1107177734375, 2.28448486328125, 2.458251953125, 2.63201904296875, 2.8057861328125, 2.97955322265625, 3.1533203125, 3.32708740234375, 3.5008544921875, 3.67462158203125, 3.848388671875, 4.02215576171875, 4.1959228515625, 4.36968994140625, 4.54345703125, 4.71722412109375, 4.8909912109375, 5.06475830078125, 5.238525390625, 5.41229248046875, 5.5860595703125, 5.75982666015625, 5.93359375]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 7.0, 10.0, 9.0, 15.0, 18.0, 25.0, 38.0, 47.0, 104.0, 126.0, 183.0, 288.0, 415.0, 713.0, 1067.0, 1657.0, 2893.0, 5194.0, 10179.0, 24013.0, 66877.0, 227836.0, 767043.0, 1557455.0, 1037866.0, 334213.0, 96681.0, 31892.0, 12711.0, 6239.0, 3280.0, 1877.0, 1169.0, 703.0, 435.0, 326.0, 225.0, 121.0, 99.0, 65.0, 55.0, 34.0, 18.0, 18.0, 19.0, 7.0, 5.0, 3.0, 6.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-7.26171875, -7.03228759765625, -6.8028564453125, -6.57342529296875, -6.343994140625, -6.11456298828125, -5.8851318359375, -5.65570068359375, -5.42626953125, -5.19683837890625, -4.9674072265625, -4.73797607421875, -4.508544921875, -4.27911376953125, -4.0496826171875, -3.82025146484375, -3.5908203125, -3.36138916015625, -3.1319580078125, -2.90252685546875, -2.673095703125, -2.44366455078125, -2.2142333984375, -1.98480224609375, -1.75537109375, -1.52593994140625, -1.2965087890625, -1.06707763671875, -0.837646484375, -0.60821533203125, -0.3787841796875, -0.14935302734375, 0.080078125, 0.30950927734375, 0.5389404296875, 0.76837158203125, 0.997802734375, 1.22723388671875, 1.4566650390625, 1.68609619140625, 1.91552734375, 2.14495849609375, 2.3743896484375, 2.60382080078125, 2.833251953125, 3.06268310546875, 3.2921142578125, 3.52154541015625, 3.7509765625, 3.98040771484375, 4.2098388671875, 4.43927001953125, 4.668701171875, 4.89813232421875, 5.1275634765625, 5.35699462890625, 5.58642578125, 5.81585693359375, 6.0452880859375, 6.27471923828125, 6.504150390625, 6.73358154296875, 6.9630126953125, 7.19244384765625, 7.421875]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 5.0, 5.0, 8.0, 11.0, 17.0, 14.0, 20.0, 34.0, 56.0, 62.0, 99.0, 139.0, 219.0, 263.0, 408.0, 489.0, 530.0, 466.0, 344.0, 248.0, 200.0, 123.0, 78.0, 73.0, 47.0, 31.0, 27.0, 20.0, 15.0, 10.0, 5.0, 3.0, 0.0, 5.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-14.015625, -13.5958251953125, -13.176025390625, -12.7562255859375, -12.33642578125, -11.9166259765625, -11.496826171875, -11.0770263671875, -10.6572265625, -10.2374267578125, -9.817626953125, -9.3978271484375, -8.97802734375, -8.5582275390625, -8.138427734375, -7.7186279296875, -7.298828125, -6.8790283203125, -6.459228515625, -6.0394287109375, -5.61962890625, -5.1998291015625, -4.780029296875, -4.3602294921875, -3.9404296875, -3.5206298828125, -3.100830078125, -2.6810302734375, -2.26123046875, -1.8414306640625, -1.421630859375, -1.0018310546875, -0.58203125, -0.1622314453125, 0.257568359375, 0.6773681640625, 1.09716796875, 1.5169677734375, 1.936767578125, 2.3565673828125, 2.7763671875, 3.1961669921875, 3.615966796875, 4.0357666015625, 4.45556640625, 4.8753662109375, 5.295166015625, 5.7149658203125, 6.134765625, 6.5545654296875, 6.974365234375, 7.3941650390625, 7.81396484375, 8.2337646484375, 8.653564453125, 9.0733642578125, 9.4931640625, 9.9129638671875, 10.332763671875, 10.7525634765625, 11.17236328125, 11.5921630859375, 12.011962890625, 12.4317626953125, 12.8515625]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 2.0, 2.0, 14.0, 14.0, 22.0, 26.0, 30.0, 48.0, 78.0, 127.0, 189.0, 379.0, 691.0, 1932.0, 8918.0, 150747.0, 3874168.0, 144520.0, 8885.0, 1851.0, 722.0, 381.0, 183.0, 110.0, 75.0, 55.0, 39.0, 17.0, 15.0, 14.0, 9.0, 7.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-43.0625, -41.650390625, -40.23828125, -38.826171875, -37.4140625, -36.001953125, -34.58984375, -33.177734375, -31.765625, -30.353515625, -28.94140625, -27.529296875, -26.1171875, -24.705078125, -23.29296875, -21.880859375, -20.46875, -19.056640625, -17.64453125, -16.232421875, -14.8203125, -13.408203125, -11.99609375, -10.583984375, -9.171875, -7.759765625, -6.34765625, -4.935546875, -3.5234375, -2.111328125, -0.69921875, 0.712890625, 2.125, 3.537109375, 4.94921875, 6.361328125, 7.7734375, 9.185546875, 10.59765625, 12.009765625, 13.421875, 14.833984375, 16.24609375, 17.658203125, 19.0703125, 20.482421875, 21.89453125, 23.306640625, 24.71875, 26.130859375, 27.54296875, 28.955078125, 30.3671875, 31.779296875, 33.19140625, 34.603515625, 36.015625, 37.427734375, 38.83984375, 40.251953125, 41.6640625, 43.076171875, 44.48828125, 45.900390625, 47.3125]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 38.0, 310.0, 547.0, 117.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.59405517578125, -96.21231079101562, -86.83056640625, -77.4488296508789, -68.06708526611328, -58.685340881347656, -49.3036003112793, -39.92185974121094, -30.540115356445312, -21.15837287902832, -11.776630401611328, -2.394887924194336, 6.986854553222656, 16.36859893798828, 25.75033950805664, 35.132080078125, 44.513824462890625, 53.89556884765625, 63.27730941772461, 72.65904998779297, 82.0407943725586, 91.42253875732422, 100.80427551269531, 110.18601989746094, 119.56776428222656, 128.9495086669922, 138.3312530517578, 147.71299743652344, 157.0947265625, 166.47647094726562, 175.85821533203125, 185.23995971679688, 194.6217041015625, 204.00344848632812, 213.38519287109375, 222.76693725585938, 232.148681640625, 241.53042602539062, 250.9121551513672, 260.29388427734375, 269.6756591796875, 279.0574035644531, 288.43914794921875, 297.8208923339844, 307.20263671875, 316.5843811035156, 325.96612548828125, 335.34783935546875, 344.7295837402344, 354.111328125, 363.4930725097656, 372.87481689453125, 382.2565612792969, 391.6383056640625, 401.0200500488281, 410.40179443359375, 419.78350830078125, 429.1652526855469, 438.5469970703125, 447.9287414550781, 457.31048583984375, 466.6922302246094, 476.073974609375, 485.4556884765625, 494.83746337890625]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 8.0, 1.0, 1.0, 3.0, 1.0, 3.0, 7.0, 7.0, 9.0, 13.0, 10.0, 19.0, 16.0, 25.0, 24.0, 22.0, 27.0, 37.0, 31.0, 34.0, 40.0, 33.0, 41.0, 46.0, 47.0, 47.0, 43.0, 38.0, 38.0, 44.0, 41.0, 22.0, 37.0, 27.0, 29.0, 25.0, 22.0, 22.0, 18.0, 16.0, 14.0, 9.0, 3.0, 4.0, 3.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.166351318359375, -39.82866287231445, -38.4909782409668, -37.153289794921875, -35.81560134887695, -34.4779167175293, -33.140228271484375, -31.802541732788086, -30.464855194091797, -29.127168655395508, -27.789480209350586, -26.451793670654297, -25.114107131958008, -23.77642059326172, -22.438732147216797, -21.101045608520508, -19.763357162475586, -18.425670623779297, -17.087982177734375, -15.750295639038086, -14.412609100341797, -13.074921607971191, -11.737234115600586, -10.399547576904297, -9.061860084533691, -7.724173069000244, -6.386486053466797, -5.048798561096191, -3.711111545562744, -2.373424530029297, -1.0357370376586914, 0.30194950103759766, 1.6396369934082031, 2.9773240089416504, 4.315011024475098, 5.652698516845703, 6.99038553237915, 8.328072547912598, 9.665760040283203, 11.003446578979492, 12.341134071350098, 13.678821563720703, 15.016508102416992, 16.35419464111328, 17.691883087158203, 19.029569625854492, 20.36725616455078, 21.704944610595703, 23.042631149291992, 24.38031768798828, 25.718006134033203, 27.055692672729492, 28.39337921142578, 29.731067657470703, 31.068754196166992, 32.40644073486328, 33.7441291809082, 35.081817626953125, 36.41950225830078, 37.7571907043457, 39.094879150390625, 40.43256378173828, 41.7702522277832, 43.107940673828125, 44.44562530517578]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 6.0, 3.0, 6.0, 5.0, 12.0, 10.0, 23.0, 21.0, 14.0, 18.0, 22.0, 26.0, 38.0, 31.0, 32.0, 43.0, 46.0, 38.0, 44.0, 50.0, 45.0, 49.0, 38.0, 38.0, 48.0, 42.0, 26.0, 34.0, 28.0, 19.0, 23.0, 22.0, 15.0, 19.0, 14.0, 17.0, 9.0, 6.0, 7.0, 6.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0], "bins": [-6.734375, -6.54443359375, -6.3544921875, -6.16455078125, -5.974609375, -5.78466796875, -5.5947265625, -5.40478515625, -5.21484375, -5.02490234375, -4.8349609375, -4.64501953125, -4.455078125, -4.26513671875, -4.0751953125, -3.88525390625, -3.6953125, -3.50537109375, -3.3154296875, -3.12548828125, -2.935546875, -2.74560546875, -2.5556640625, -2.36572265625, -2.17578125, -1.98583984375, -1.7958984375, -1.60595703125, -1.416015625, -1.22607421875, -1.0361328125, -0.84619140625, -0.65625, -0.46630859375, -0.2763671875, -0.08642578125, 0.103515625, 0.29345703125, 0.4833984375, 0.67333984375, 0.86328125, 1.05322265625, 1.2431640625, 1.43310546875, 1.623046875, 1.81298828125, 2.0029296875, 2.19287109375, 2.3828125, 2.57275390625, 2.7626953125, 2.95263671875, 3.142578125, 3.33251953125, 3.5224609375, 3.71240234375, 3.90234375, 4.09228515625, 4.2822265625, 4.47216796875, 4.662109375, 4.85205078125, 5.0419921875, 5.23193359375, 5.421875]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 4.0, 10.0, 7.0, 6.0, 18.0, 21.0, 34.0, 45.0, 50.0, 79.0, 130.0, 174.0, 277.0, 435.0, 621.0, 981.0, 1460.0, 2142.0, 3474.0, 5599.0, 8698.0, 13577.0, 21176.0, 33140.0, 52077.0, 81856.0, 125067.0, 173279.0, 173211.0, 124606.0, 81700.0, 52261.0, 33300.0, 21141.0, 13684.0, 8595.0, 5456.0, 3493.0, 2337.0, 1544.0, 921.0, 615.0, 402.0, 279.0, 183.0, 140.0, 91.0, 51.0, 28.0, 34.0, 23.0, 12.0, 8.0, 12.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.64453125, -0.6243896484375, -0.604248046875, -0.5841064453125, -0.56396484375, -0.5438232421875, -0.523681640625, -0.5035400390625, -0.4833984375, -0.4632568359375, -0.443115234375, -0.4229736328125, -0.40283203125, -0.3826904296875, -0.362548828125, -0.3424072265625, -0.322265625, -0.3021240234375, -0.281982421875, -0.2618408203125, -0.24169921875, -0.2215576171875, -0.201416015625, -0.1812744140625, -0.1611328125, -0.1409912109375, -0.120849609375, -0.1007080078125, -0.08056640625, -0.0604248046875, -0.040283203125, -0.0201416015625, 0.0, 0.0201416015625, 0.040283203125, 0.0604248046875, 0.08056640625, 0.1007080078125, 0.120849609375, 0.1409912109375, 0.1611328125, 0.1812744140625, 0.201416015625, 0.2215576171875, 0.24169921875, 0.2618408203125, 0.281982421875, 0.3021240234375, 0.322265625, 0.3424072265625, 0.362548828125, 0.3826904296875, 0.40283203125, 0.4229736328125, 0.443115234375, 0.4632568359375, 0.4833984375, 0.5035400390625, 0.523681640625, 0.5438232421875, 0.56396484375, 0.5841064453125, 0.604248046875, 0.6243896484375, 0.64453125]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 0.0, 3.0, 6.0, 6.0, 5.0, 12.0, 12.0, 13.0, 9.0, 7.0, 18.0, 24.0, 18.0, 21.0, 22.0, 27.0, 28.0, 37.0, 34.0, 39.0, 44.0, 30.0, 33.0, 41.0, 1064.0, 42.0, 40.0, 43.0, 33.0, 25.0, 31.0, 25.0, 34.0, 29.0, 25.0, 26.0, 21.0, 14.0, 16.0, 7.0, 9.0, 22.0, 6.0, 11.0, 6.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.390625, -3.28131103515625, -3.1719970703125, -3.06268310546875, -2.953369140625, -2.84405517578125, -2.7347412109375, -2.62542724609375, -2.51611328125, -2.40679931640625, -2.2974853515625, -2.18817138671875, -2.078857421875, -1.96954345703125, -1.8602294921875, -1.75091552734375, -1.6416015625, -1.53228759765625, -1.4229736328125, -1.31365966796875, -1.204345703125, -1.09503173828125, -0.9857177734375, -0.87640380859375, -0.76708984375, -0.65777587890625, -0.5484619140625, -0.43914794921875, -0.329833984375, -0.22052001953125, -0.1112060546875, -0.00189208984375, 0.107421875, 0.21673583984375, 0.3260498046875, 0.43536376953125, 0.544677734375, 0.65399169921875, 0.7633056640625, 0.87261962890625, 0.98193359375, 1.09124755859375, 1.2005615234375, 1.30987548828125, 1.419189453125, 1.52850341796875, 1.6378173828125, 1.74713134765625, 1.8564453125, 1.96575927734375, 2.0750732421875, 2.18438720703125, 2.293701171875, 2.40301513671875, 2.5123291015625, 2.62164306640625, 2.73095703125, 2.84027099609375, 2.9495849609375, 3.05889892578125, 3.168212890625, 3.27752685546875, 3.3868408203125, 3.49615478515625, 3.60546875]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 7.0, 6.0, 8.0, 17.0, 30.0, 32.0, 57.0, 76.0, 115.0, 137.0, 235.0, 303.0, 432.0, 651.0, 923.0, 1408.0, 1984.0, 2822.0, 3994.0, 5783.0, 8443.0, 12044.0, 17219.0, 24957.0, 35766.0, 51274.0, 72816.0, 100057.0, 128898.0, 1179376.0, 122491.0, 95698.0, 69544.0, 48684.0, 34068.0, 23312.0, 16105.0, 11439.0, 7942.0, 5561.0, 3669.0, 2685.0, 1913.0, 1268.0, 924.0, 617.0, 457.0, 300.0, 200.0, 129.0, 93.0, 65.0, 31.0, 28.0, 26.0, 13.0, 9.0, 5.0, 2.0, 0.0, 1.0], "bins": [-0.326904296875, -0.3168220520019531, -0.30673980712890625, -0.2966575622558594, -0.2865753173828125, -0.2764930725097656, -0.26641082763671875, -0.2563285827636719, -0.246246337890625, -0.23616409301757812, -0.22608184814453125, -0.21599960327148438, -0.2059173583984375, -0.19583511352539062, -0.18575286865234375, -0.17567062377929688, -0.16558837890625, -0.15550613403320312, -0.14542388916015625, -0.13534164428710938, -0.1252593994140625, -0.11517715454101562, -0.10509490966796875, -0.09501266479492188, -0.084930419921875, -0.07484817504882812, -0.06476593017578125, -0.054683685302734375, -0.0446014404296875, -0.034519195556640625, -0.02443695068359375, -0.014354705810546875, -0.0042724609375, 0.005809783935546875, 0.01589202880859375, 0.025974273681640625, 0.0360565185546875, 0.046138763427734375, 0.05622100830078125, 0.06630325317382812, 0.076385498046875, 0.08646774291992188, 0.09654998779296875, 0.10663223266601562, 0.1167144775390625, 0.12679672241210938, 0.13687896728515625, 0.14696121215820312, 0.15704345703125, 0.16712570190429688, 0.17720794677734375, 0.18729019165039062, 0.1973724365234375, 0.20745468139648438, 0.21753692626953125, 0.22761917114257812, 0.237701416015625, 0.24778366088867188, 0.25786590576171875, 0.2679481506347656, 0.2780303955078125, 0.2881126403808594, 0.29819488525390625, 0.3082771301269531, 0.318359375]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 5.0, 11.0, 5.0, 5.0, 8.0, 11.0, 16.0, 13.0, 19.0, 24.0, 19.0, 22.0, 35.0, 45.0, 35.0, 41.0, 47.0, 52.0, 41.0, 50.0, 62.0, 59.0, 41.0, 36.0, 36.0, 34.0, 32.0, 30.0, 23.0, 28.0, 19.0, 15.0, 14.0, 16.0, 6.0, 6.0, 9.0, 4.0, 6.0, 3.0, 6.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.016754150390625, -0.0162808895111084, -0.015807628631591797, -0.015334367752075195, -0.014861106872558594, -0.014387845993041992, -0.01391458511352539, -0.013441324234008789, -0.012968063354492188, -0.012494802474975586, -0.012021541595458984, -0.011548280715942383, -0.011075019836425781, -0.01060175895690918, -0.010128498077392578, -0.009655237197875977, -0.009181976318359375, -0.008708715438842773, -0.008235454559326172, -0.00776219367980957, -0.007288932800292969, -0.006815671920776367, -0.006342411041259766, -0.005869150161743164, -0.0053958892822265625, -0.004922628402709961, -0.004449367523193359, -0.003976106643676758, -0.0035028457641601562, -0.0030295848846435547, -0.002556324005126953, -0.0020830631256103516, -0.00160980224609375, -0.0011365413665771484, -0.0006632804870605469, -0.0001900196075439453, 0.00028324127197265625, 0.0007565021514892578, 0.0012297630310058594, 0.001703023910522461, 0.0021762847900390625, 0.002649545669555664, 0.0031228065490722656, 0.003596067428588867, 0.004069328308105469, 0.00454258918762207, 0.005015850067138672, 0.0054891109466552734, 0.005962371826171875, 0.0064356327056884766, 0.006908893585205078, 0.00738215446472168, 0.007855415344238281, 0.008328676223754883, 0.008801937103271484, 0.009275197982788086, 0.009748458862304688, 0.010221719741821289, 0.01069498062133789, 0.011168241500854492, 0.011641502380371094, 0.012114763259887695, 0.012588024139404297, 0.013061285018920898, 0.0135345458984375]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 3.0, 7.0, 6.0, 15.0, 17.0, 11.0, 26.0, 21.0, 25.0, 30.0, 27.0, 41.0, 63.0, 91.0, 134.0, 278.0, 925.0, 5817.0, 102645.0, 917552.0, 17579.0, 2071.0, 517.0, 186.0, 108.0, 81.0, 53.0, 40.0, 30.0, 34.0, 22.0, 17.0, 17.0, 9.0, 10.0, 7.0, 6.0, 2.0, 2.0, 6.0, 7.0, 3.0, 4.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.334228515625, -0.3227996826171875, -0.311370849609375, -0.2999420166015625, -0.28851318359375, -0.2770843505859375, -0.265655517578125, -0.2542266845703125, -0.2427978515625, -0.2313690185546875, -0.219940185546875, -0.2085113525390625, -0.19708251953125, -0.1856536865234375, -0.174224853515625, -0.1627960205078125, -0.1513671875, -0.1399383544921875, -0.128509521484375, -0.1170806884765625, -0.10565185546875, -0.0942230224609375, -0.082794189453125, -0.0713653564453125, -0.0599365234375, -0.0485076904296875, -0.037078857421875, -0.0256500244140625, -0.01422119140625, -0.0027923583984375, 0.008636474609375, 0.0200653076171875, 0.031494140625, 0.0429229736328125, 0.054351806640625, 0.0657806396484375, 0.07720947265625, 0.0886383056640625, 0.100067138671875, 0.1114959716796875, 0.1229248046875, 0.1343536376953125, 0.145782470703125, 0.1572113037109375, 0.16864013671875, 0.1800689697265625, 0.191497802734375, 0.2029266357421875, 0.21435546875, 0.2257843017578125, 0.237213134765625, 0.2486419677734375, 0.26007080078125, 0.2714996337890625, 0.282928466796875, 0.2943572998046875, 0.3057861328125, 0.3172149658203125, 0.328643798828125, 0.3400726318359375, 0.35150146484375, 0.3629302978515625, 0.374359130859375, 0.3857879638671875, 0.397216796875]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 5.0, 10.0, 10.0, 19.0, 14.0, 16.0, 31.0, 29.0, 40.0, 66.0, 111.0, 155.0, 154.0, 111.0, 72.0, 47.0, 30.0, 17.0, 17.0, 12.0, 11.0, 8.0, 7.0, 5.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.03648126870393753, -0.034911785274744034, -0.03334230184555054, -0.03177281841635704, -0.030203333124518394, -0.028633849695324898, -0.027064364403486252, -0.025494880974292755, -0.02392539754509926, -0.02235591411590576, -0.020786430686712265, -0.01921694539487362, -0.017647461965680122, -0.016077978536486626, -0.014508494175970554, -0.012939009815454483, -0.011369526386260986, -0.00980004295706749, -0.008230558596551418, -0.006661074701696634, -0.00509159080684185, -0.0035221073776483536, -0.0019526230171322823, -0.00038313865661621094, 0.0011863447725772858, 0.0027558286674320698, 0.004325312562286854, 0.005894796457141638, 0.007464280351996422, 0.009033763781189919, 0.01060324814170599, 0.012172732502222061, 0.013742215931415558, 0.015311699360609055, 0.01688118278980255, 0.018450668081641197, 0.020020151510834694, 0.02158963494002819, 0.023159120231866837, 0.024728603661060333, 0.02629808709025383, 0.027867570519447327, 0.029437053948640823, 0.03100653924047947, 0.032576024532318115, 0.034145504236221313, 0.03571499139070511, 0.037284474819898605, 0.0388539582490921, 0.0404234416782856, 0.041992925107479095, 0.04356240853667259, 0.04513189196586609, 0.046701379120349884, 0.04827086254954338, 0.04984034597873688, 0.051409829407930374, 0.05297931283712387, 0.05454879626631737, 0.056118279695510864, 0.05768776684999466, 0.05925724655389786, 0.06082673370838165, 0.06239621713757515, 0.06396570056676865]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 6.0, 8.0, 3.0, 5.0, 5.0, 10.0, 18.0, 16.0, 16.0, 15.0, 16.0, 23.0, 26.0, 28.0, 30.0, 34.0, 29.0, 42.0, 42.0, 34.0, 43.0, 42.0, 38.0, 44.0, 46.0, 41.0, 34.0, 34.0, 35.0, 31.0, 27.0, 25.0, 30.0, 19.0, 18.0, 18.0, 11.0, 11.0, 18.0, 7.0, 4.0, 4.0, 7.0, 2.0, 4.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.010998070240020752, -0.010667339898645878, -0.010336609557271004, -0.01000587921589613, -0.009675148874521255, -0.009344418533146381, -0.009013688191771507, -0.008682957850396633, -0.008352227509021759, -0.008021497167646885, -0.007690766826272011, -0.007360036484897137, -0.007029306143522263, -0.0066985758021473885, -0.006367845460772514, -0.00603711511939764, -0.005706384778022766, -0.005375654436647892, -0.005044924095273018, -0.004714193753898144, -0.00438346341252327, -0.0040527330711483955, -0.0037220027297735214, -0.0033912723883986473, -0.003060542047023773, -0.002729811705648899, -0.002399081364274025, -0.002068351022899151, -0.0017376206815242767, -0.0014068903401494026, -0.0010761599987745285, -0.0007454296573996544, -0.0004146993160247803, -8.396897464990616e-05, 0.00024676136672496796, 0.0005774917080998421, 0.0009082220494747162, 0.0012389523908495903, 0.0015696827322244644, 0.0019004130735993385, 0.0022311434149742126, 0.0025618737563490868, 0.002892604097723961, 0.003223334439098835, 0.003554064780473709, 0.0038847951218485832, 0.004215525463223457, 0.0045462558045983315, 0.004876986145973206, 0.00520771648734808, 0.005538446828722954, 0.005869177170097828, 0.006199907511472702, 0.006530637852847576, 0.00686136819422245, 0.007192098535597324, 0.0075228288769721985, 0.007853559218347073, 0.008184289559721947, 0.00851501990109682, 0.008845750242471695, 0.009176480583846569, 0.009507210925221443, 0.009837941266596317, 0.010168671607971191]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 6.0, 3.0, 6.0, 5.0, 12.0, 10.0, 23.0, 21.0, 14.0, 19.0, 21.0, 26.0, 38.0, 31.0, 32.0, 43.0, 46.0, 38.0, 43.0, 51.0, 45.0, 49.0, 38.0, 38.0, 48.0, 42.0, 26.0, 34.0, 27.0, 20.0, 23.0, 22.0, 15.0, 19.0, 14.0, 17.0, 9.0, 6.0, 7.0, 6.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0], "bins": [-6.734375, -6.54443359375, -6.3544921875, -6.16455078125, -5.974609375, -5.78466796875, -5.5947265625, -5.40478515625, -5.21484375, -5.02490234375, -4.8349609375, -4.64501953125, -4.455078125, -4.26513671875, -4.0751953125, -3.88525390625, -3.6953125, -3.50537109375, -3.3154296875, -3.12548828125, -2.935546875, -2.74560546875, -2.5556640625, -2.36572265625, -2.17578125, -1.98583984375, -1.7958984375, -1.60595703125, -1.416015625, -1.22607421875, -1.0361328125, -0.84619140625, -0.65625, -0.46630859375, -0.2763671875, -0.08642578125, 0.103515625, 0.29345703125, 0.4833984375, 0.67333984375, 0.86328125, 1.05322265625, 1.2431640625, 1.43310546875, 1.623046875, 1.81298828125, 2.0029296875, 2.19287109375, 2.3828125, 2.57275390625, 2.7626953125, 2.95263671875, 3.142578125, 3.33251953125, 3.5224609375, 3.71240234375, 3.90234375, 4.09228515625, 4.2822265625, 4.47216796875, 4.662109375, 4.85205078125, 5.0419921875, 5.23193359375, 5.421875]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 4.0, 3.0, 14.0, 9.0, 20.0, 26.0, 49.0, 56.0, 77.0, 129.0, 180.0, 322.0, 478.0, 724.0, 1225.0, 2102.0, 3737.0, 7003.0, 13446.0, 28163.0, 64271.0, 175537.0, 405369.0, 208446.0, 72995.0, 31441.0, 15135.0, 7766.0, 4103.0, 2198.0, 1274.0, 858.0, 455.0, 301.0, 210.0, 139.0, 104.0, 55.0, 45.0, 34.0, 14.0, 17.0, 9.0, 7.0, 6.0, 2.0, 0.0, 4.0, 0.0, 2.0, 3.0], "bins": [-6.62890625, -6.44256591796875, -6.2562255859375, -6.06988525390625, -5.883544921875, -5.69720458984375, -5.5108642578125, -5.32452392578125, -5.13818359375, -4.95184326171875, -4.7655029296875, -4.57916259765625, -4.392822265625, -4.20648193359375, -4.0201416015625, -3.83380126953125, -3.6474609375, -3.46112060546875, -3.2747802734375, -3.08843994140625, -2.902099609375, -2.71575927734375, -2.5294189453125, -2.34307861328125, -2.15673828125, -1.97039794921875, -1.7840576171875, -1.59771728515625, -1.411376953125, -1.22503662109375, -1.0386962890625, -0.85235595703125, -0.666015625, -0.47967529296875, -0.2933349609375, -0.10699462890625, 0.079345703125, 0.26568603515625, 0.4520263671875, 0.63836669921875, 0.82470703125, 1.01104736328125, 1.1973876953125, 1.38372802734375, 1.570068359375, 1.75640869140625, 1.9427490234375, 2.12908935546875, 2.3154296875, 2.50177001953125, 2.6881103515625, 2.87445068359375, 3.060791015625, 3.24713134765625, 3.4334716796875, 3.61981201171875, 3.80615234375, 3.99249267578125, 4.1788330078125, 4.36517333984375, 4.551513671875, 4.73785400390625, 4.9241943359375, 5.11053466796875, 5.296875]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 6.0, 4.0, 4.0, 7.0, 4.0, 7.0, 11.0, 13.0, 16.0, 17.0, 21.0, 25.0, 24.0, 30.0, 28.0, 27.0, 34.0, 35.0, 55.0, 58.0, 85.0, 153.0, 1401.0, 381.0, 121.0, 86.0, 52.0, 47.0, 49.0, 25.0, 39.0, 24.0, 23.0, 19.0, 17.0, 22.0, 14.0, 15.0, 9.0, 8.0, 11.0, 8.0, 8.0, 3.0, 3.0, 1.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.875, -17.29833984375, -16.7216796875, -16.14501953125, -15.568359375, -14.99169921875, -14.4150390625, -13.83837890625, -13.26171875, -12.68505859375, -12.1083984375, -11.53173828125, -10.955078125, -10.37841796875, -9.8017578125, -9.22509765625, -8.6484375, -8.07177734375, -7.4951171875, -6.91845703125, -6.341796875, -5.76513671875, -5.1884765625, -4.61181640625, -4.03515625, -3.45849609375, -2.8818359375, -2.30517578125, -1.728515625, -1.15185546875, -0.5751953125, 0.00146484375, 0.578125, 1.15478515625, 1.7314453125, 2.30810546875, 2.884765625, 3.46142578125, 4.0380859375, 4.61474609375, 5.19140625, 5.76806640625, 6.3447265625, 6.92138671875, 7.498046875, 8.07470703125, 8.6513671875, 9.22802734375, 9.8046875, 10.38134765625, 10.9580078125, 11.53466796875, 12.111328125, 12.68798828125, 13.2646484375, 13.84130859375, 14.41796875, 14.99462890625, 15.5712890625, 16.14794921875, 16.724609375, 17.30126953125, 17.8779296875, 18.45458984375, 19.03125]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 6.0, 4.0, 8.0, 7.0, 13.0, 23.0, 18.0, 25.0, 43.0, 69.0, 76.0, 150.0, 213.0, 349.0, 725.0, 3456.0, 123108.0, 2992328.0, 21913.0, 1747.0, 534.0, 298.0, 204.0, 140.0, 78.0, 49.0, 38.0, 28.0, 20.0, 13.0, 11.0, 8.0, 5.0, 2.0, 4.0, 0.0, 1.0, 4.0], "bins": [-63.46875, -62.00341796875, -60.5380859375, -59.07275390625, -57.607421875, -56.14208984375, -54.6767578125, -53.21142578125, -51.74609375, -50.28076171875, -48.8154296875, -47.35009765625, -45.884765625, -44.41943359375, -42.9541015625, -41.48876953125, -40.0234375, -38.55810546875, -37.0927734375, -35.62744140625, -34.162109375, -32.69677734375, -31.2314453125, -29.76611328125, -28.30078125, -26.83544921875, -25.3701171875, -23.90478515625, -22.439453125, -20.97412109375, -19.5087890625, -18.04345703125, -16.578125, -15.11279296875, -13.6474609375, -12.18212890625, -10.716796875, -9.25146484375, -7.7861328125, -6.32080078125, -4.85546875, -3.39013671875, -1.9248046875, -0.45947265625, 1.005859375, 2.47119140625, 3.9365234375, 5.40185546875, 6.8671875, 8.33251953125, 9.7978515625, 11.26318359375, 12.728515625, 14.19384765625, 15.6591796875, 17.12451171875, 18.58984375, 20.05517578125, 21.5205078125, 22.98583984375, 24.451171875, 25.91650390625, 27.3818359375, 28.84716796875, 30.3125]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 48.0, 841.0, 127.0], "bins": [-551.3821411132812, -542.5691528320312, -533.7561645507812, -524.9431762695312, -516.1301879882812, -507.31719970703125, -498.50421142578125, -489.69122314453125, -480.87823486328125, -472.06524658203125, -463.25225830078125, -454.43927001953125, -445.62628173828125, -436.81329345703125, -428.00030517578125, -419.18731689453125, -410.37432861328125, -401.56134033203125, -392.74835205078125, -383.93536376953125, -375.12237548828125, -366.30938720703125, -357.49639892578125, -348.68341064453125, -339.8704528808594, -331.0574645996094, -322.2444763183594, -313.4314880371094, -304.6184997558594, -295.8055114746094, -286.9925231933594, -278.1795349121094, -269.3665771484375, -260.5535888671875, -251.7406005859375, -242.9276123046875, -234.1146240234375, -225.3016357421875, -216.4886474609375, -207.6756591796875, -198.8626708984375, -190.0496826171875, -181.2366943359375, -172.4237060546875, -163.6107177734375, -154.7977294921875, -145.9847412109375, -137.1717529296875, -128.35877990722656, -119.54579162597656, -110.73280334472656, -101.91981506347656, -93.10682678222656, -84.29383850097656, -75.4808578491211, -66.6678695678711, -57.85487747192383, -49.04188919067383, -40.228904724121094, -31.415916442871094, -22.602928161621094, -13.789939880371094, -4.976955413818359, 3.8360328674316406, 12.64902114868164]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 4.0, 5.0, 6.0, 8.0, 7.0, 9.0, 9.0, 13.0, 16.0, 21.0, 22.0, 20.0, 15.0, 28.0, 18.0, 32.0, 34.0, 37.0, 35.0, 40.0, 46.0, 36.0, 37.0, 47.0, 34.0, 32.0, 43.0, 34.0, 34.0, 29.0, 27.0, 34.0, 21.0, 30.0, 20.0, 20.0, 20.0, 13.0, 11.0, 12.0, 12.0, 7.0, 6.0, 12.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-48.853546142578125, -47.29233932495117, -45.73113250732422, -44.169921875, -42.60871505737305, -41.047508239746094, -39.48630142211914, -37.92509460449219, -36.36388397216797, -34.802677154541016, -33.24147033691406, -31.680261611938477, -30.11905288696289, -28.557846069335938, -26.996639251708984, -25.4354305267334, -23.874223709106445, -22.313016891479492, -20.751808166503906, -19.190601348876953, -17.629392623901367, -16.068185806274414, -14.506978034973145, -12.945770263671875, -11.384562492370605, -9.823354721069336, -8.262146949768066, -6.700939655303955, -5.1397318840026855, -3.578524112701416, -2.0173168182373047, -0.45610904693603516, 1.1050987243652344, 2.666306495666504, 4.227514266967773, 5.788721561431885, 7.349929332733154, 8.911136627197266, 10.472344398498535, 12.033552169799805, 13.594759941101074, 15.155967712402344, 16.717174530029297, 18.278383255004883, 19.839590072631836, 21.400798797607422, 22.962005615234375, 24.523212432861328, 26.084421157836914, 27.645627975463867, 29.206836700439453, 30.768043518066406, 32.32925033569336, 33.89046096801758, 35.45166778564453, 37.012874603271484, 38.57408142089844, 40.13528823852539, 41.696495056152344, 43.25770568847656, 44.818912506103516, 46.38011932373047, 47.94132614135742, 49.502532958984375, 51.063743591308594]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 5.0, 0.0, 2.0, 5.0, 3.0, 9.0, 14.0, 14.0, 18.0, 17.0, 22.0, 26.0, 23.0, 27.0, 42.0, 32.0, 37.0, 39.0, 44.0, 43.0, 46.0, 50.0, 49.0, 39.0, 52.0, 34.0, 47.0, 33.0, 27.0, 37.0, 21.0, 24.0, 24.0, 23.0, 18.0, 10.0, 11.0, 5.0, 9.0, 4.0, 6.0, 4.0, 4.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-7.07421875, -6.8712158203125, -6.668212890625, -6.4652099609375, -6.26220703125, -6.0592041015625, -5.856201171875, -5.6531982421875, -5.4501953125, -5.2471923828125, -5.044189453125, -4.8411865234375, -4.63818359375, -4.4351806640625, -4.232177734375, -4.0291748046875, -3.826171875, -3.6231689453125, -3.420166015625, -3.2171630859375, -3.01416015625, -2.8111572265625, -2.608154296875, -2.4051513671875, -2.2021484375, -1.9991455078125, -1.796142578125, -1.5931396484375, -1.39013671875, -1.1871337890625, -0.984130859375, -0.7811279296875, -0.578125, -0.3751220703125, -0.172119140625, 0.0308837890625, 0.23388671875, 0.4368896484375, 0.639892578125, 0.8428955078125, 1.0458984375, 1.2489013671875, 1.451904296875, 1.6549072265625, 1.85791015625, 2.0609130859375, 2.263916015625, 2.4669189453125, 2.669921875, 2.8729248046875, 3.075927734375, 3.2789306640625, 3.48193359375, 3.6849365234375, 3.887939453125, 4.0909423828125, 4.2939453125, 4.4969482421875, 4.699951171875, 4.9029541015625, 5.10595703125, 5.3089599609375, 5.511962890625, 5.7149658203125, 5.91796875]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 7.0, 10.0, 9.0, 19.0, 23.0, 38.0, 58.0, 91.0, 117.0, 222.0, 327.0, 567.0, 929.0, 1626.0, 3043.0, 6836.0, 20956.0, 105475.0, 902560.0, 2570780.0, 491274.0, 62719.0, 14800.0, 5481.0, 2671.0, 1420.0, 836.0, 492.0, 309.0, 200.0, 118.0, 86.0, 52.0, 34.0, 20.0, 24.0, 9.0, 12.0, 10.0, 7.0, 1.0, 9.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-12.3984375, -11.9761962890625, -11.553955078125, -11.1317138671875, -10.70947265625, -10.2872314453125, -9.864990234375, -9.4427490234375, -9.0205078125, -8.5982666015625, -8.176025390625, -7.7537841796875, -7.33154296875, -6.9093017578125, -6.487060546875, -6.0648193359375, -5.642578125, -5.2203369140625, -4.798095703125, -4.3758544921875, -3.95361328125, -3.5313720703125, -3.109130859375, -2.6868896484375, -2.2646484375, -1.8424072265625, -1.420166015625, -0.9979248046875, -0.57568359375, -0.1534423828125, 0.268798828125, 0.6910400390625, 1.11328125, 1.5355224609375, 1.957763671875, 2.3800048828125, 2.80224609375, 3.2244873046875, 3.646728515625, 4.0689697265625, 4.4912109375, 4.9134521484375, 5.335693359375, 5.7579345703125, 6.18017578125, 6.6024169921875, 7.024658203125, 7.4468994140625, 7.869140625, 8.2913818359375, 8.713623046875, 9.1358642578125, 9.55810546875, 9.9803466796875, 10.402587890625, 10.8248291015625, 11.2470703125, 11.6693115234375, 12.091552734375, 12.5137939453125, 12.93603515625, 13.3582763671875, 13.780517578125, 14.2027587890625, 14.625]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 3.0, 6.0, 5.0, 6.0, 6.0, 15.0, 16.0, 25.0, 24.0, 52.0, 67.0, 125.0, 167.0, 280.0, 451.0, 669.0, 699.0, 548.0, 328.0, 204.0, 143.0, 77.0, 41.0, 27.0, 18.0, 18.0, 15.0, 10.0, 6.0, 6.0, 5.0, 2.0, 3.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.5625, -18.02001953125, -17.4775390625, -16.93505859375, -16.392578125, -15.85009765625, -15.3076171875, -14.76513671875, -14.22265625, -13.68017578125, -13.1376953125, -12.59521484375, -12.052734375, -11.51025390625, -10.9677734375, -10.42529296875, -9.8828125, -9.34033203125, -8.7978515625, -8.25537109375, -7.712890625, -7.17041015625, -6.6279296875, -6.08544921875, -5.54296875, -5.00048828125, -4.4580078125, -3.91552734375, -3.373046875, -2.83056640625, -2.2880859375, -1.74560546875, -1.203125, -0.66064453125, -0.1181640625, 0.42431640625, 0.966796875, 1.50927734375, 2.0517578125, 2.59423828125, 3.13671875, 3.67919921875, 4.2216796875, 4.76416015625, 5.306640625, 5.84912109375, 6.3916015625, 6.93408203125, 7.4765625, 8.01904296875, 8.5615234375, 9.10400390625, 9.646484375, 10.18896484375, 10.7314453125, 11.27392578125, 11.81640625, 12.35888671875, 12.9013671875, 13.44384765625, 13.986328125, 14.52880859375, 15.0712890625, 15.61376953125, 16.15625]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 5.0, 3.0, 4.0, 5.0, 8.0, 5.0, 5.0, 19.0, 37.0, 41.0, 75.0, 151.0, 321.0, 754.0, 2014.0, 7354.0, 53530.0, 3747822.0, 360809.0, 15579.0, 3571.0, 1181.0, 496.0, 224.0, 104.0, 70.0, 33.0, 23.0, 14.0, 7.0, 6.0, 5.0, 2.0, 6.0, 5.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.46875, -48.64892578125, -46.8291015625, -45.00927734375, -43.189453125, -41.36962890625, -39.5498046875, -37.72998046875, -35.91015625, -34.09033203125, -32.2705078125, -30.45068359375, -28.630859375, -26.81103515625, -24.9912109375, -23.17138671875, -21.3515625, -19.53173828125, -17.7119140625, -15.89208984375, -14.072265625, -12.25244140625, -10.4326171875, -8.61279296875, -6.79296875, -4.97314453125, -3.1533203125, -1.33349609375, 0.486328125, 2.30615234375, 4.1259765625, 5.94580078125, 7.765625, 9.58544921875, 11.4052734375, 13.22509765625, 15.044921875, 16.86474609375, 18.6845703125, 20.50439453125, 22.32421875, 24.14404296875, 25.9638671875, 27.78369140625, 29.603515625, 31.42333984375, 33.2431640625, 35.06298828125, 36.8828125, 38.70263671875, 40.5224609375, 42.34228515625, 44.162109375, 45.98193359375, 47.8017578125, 49.62158203125, 51.44140625, 53.26123046875, 55.0810546875, 56.90087890625, 58.720703125, 60.54052734375, 62.3603515625, 64.18017578125, 66.0]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 7.0, 10.0, 20.0, 62.0, 182.0, 336.0, 248.0, 100.0, 33.0, 9.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-82.34639739990234, -77.09847259521484, -71.85054779052734, -66.60263061523438, -61.354705810546875, -56.106781005859375, -50.858856201171875, -45.61093521118164, -40.36301040649414, -35.11508560180664, -29.867164611816406, -24.619239807128906, -19.37131690979004, -14.123394012451172, -8.875469207763672, -3.6275482177734375, 1.6203765869140625, 6.868299961090088, 12.116223335266113, 17.364147186279297, 22.612070083618164, 27.85999298095703, 33.10791778564453, 38.355838775634766, 43.603763580322266, 48.851688385009766, 54.099609375, 59.3475341796875, 64.595458984375, 69.8433837890625, 75.09130859375, 80.33922576904297, 85.587158203125, 90.8350830078125, 96.0830078125, 101.3309326171875, 106.57884979248047, 111.82677459716797, 117.07469940185547, 122.32261657714844, 127.57054138183594, 132.81846618652344, 138.06639099121094, 143.31431579589844, 148.56224060058594, 153.81015014648438, 159.05807495117188, 164.30599975585938, 169.55392456054688, 174.80184936523438, 180.04977416992188, 185.29769897460938, 190.54562377929688, 195.79354858398438, 201.04147338867188, 206.2893829345703, 211.53732299804688, 216.78524780273438, 222.03317260742188, 227.28109741210938, 232.52902221679688, 237.77694702148438, 243.02487182617188, 248.2727813720703, 253.5207061767578]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 6.0, 3.0, 4.0, 3.0, 7.0, 2.0, 8.0, 9.0, 5.0, 10.0, 12.0, 11.0, 10.0, 23.0, 20.0, 16.0, 19.0, 22.0, 24.0, 32.0, 33.0, 28.0, 36.0, 30.0, 35.0, 43.0, 33.0, 30.0, 40.0, 34.0, 26.0, 30.0, 23.0, 36.0, 31.0, 35.0, 34.0, 24.0, 19.0, 19.0, 15.0, 9.0, 13.0, 19.0, 17.0, 18.0, 8.0, 11.0, 9.0, 6.0, 5.0, 4.0, 3.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 3.0], "bins": [-37.57875061035156, -36.38471984863281, -35.19068908691406, -33.99665832519531, -32.80262756347656, -31.608596801757812, -30.41456413269043, -29.22053337097168, -28.02650260925293, -26.83247184753418, -25.63844108581543, -24.44441032409668, -23.250377655029297, -22.056346893310547, -20.862316131591797, -19.668285369873047, -18.474254608154297, -17.280223846435547, -16.086193084716797, -14.89216136932373, -13.69813060760498, -12.50409984588623, -11.310068130493164, -10.116037368774414, -8.922006607055664, -7.727975845336914, -6.533944606781006, -5.339913368225098, -4.145882606506348, -2.9518518447875977, -1.7578206062316895, -0.5637893676757812, 0.6302413940429688, 1.8242723941802979, 3.018303394317627, 4.212334632873535, 5.406365394592285, 6.600396156311035, 7.794427394866943, 8.988458633422852, 10.182489395141602, 11.376520156860352, 12.570550918579102, 13.764582633972168, 14.958613395690918, 16.152645111083984, 17.346675872802734, 18.540706634521484, 19.734737396240234, 20.928768157958984, 22.122798919677734, 23.316829681396484, 24.510860443115234, 25.704891204833984, 26.898923873901367, 28.092954635620117, 29.286985397338867, 30.481016159057617, 31.675046920776367, 32.86907958984375, 34.0631103515625, 35.25714111328125, 36.451171875, 37.64520263671875, 38.8392333984375]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 0.0, 5.0, 4.0, 3.0, 4.0, 10.0, 10.0, 8.0, 8.0, 13.0, 24.0, 10.0, 27.0, 26.0, 35.0, 36.0, 32.0, 40.0, 47.0, 55.0, 34.0, 40.0, 50.0, 42.0, 36.0, 52.0, 36.0, 39.0, 27.0, 35.0, 32.0, 27.0, 21.0, 19.0, 23.0, 14.0, 13.0, 16.0, 16.0, 4.0, 7.0, 7.0, 3.0, 7.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.375, -6.1685791015625, -5.962158203125, -5.7557373046875, -5.54931640625, -5.3428955078125, -5.136474609375, -4.9300537109375, -4.7236328125, -4.5172119140625, -4.310791015625, -4.1043701171875, -3.89794921875, -3.6915283203125, -3.485107421875, -3.2786865234375, -3.072265625, -2.8658447265625, -2.659423828125, -2.4530029296875, -2.24658203125, -2.0401611328125, -1.833740234375, -1.6273193359375, -1.4208984375, -1.2144775390625, -1.008056640625, -0.8016357421875, -0.59521484375, -0.3887939453125, -0.182373046875, 0.0240478515625, 0.23046875, 0.4368896484375, 0.643310546875, 0.8497314453125, 1.05615234375, 1.2625732421875, 1.468994140625, 1.6754150390625, 1.8818359375, 2.0882568359375, 2.294677734375, 2.5010986328125, 2.70751953125, 2.9139404296875, 3.120361328125, 3.3267822265625, 3.533203125, 3.7396240234375, 3.946044921875, 4.1524658203125, 4.35888671875, 4.5653076171875, 4.771728515625, 4.9781494140625, 5.1845703125, 5.3909912109375, 5.597412109375, 5.8038330078125, 6.01025390625, 6.2166748046875, 6.423095703125, 6.6295166015625, 6.8359375]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 9.0, 9.0, 16.0, 25.0, 31.0, 39.0, 62.0, 98.0, 148.0, 219.0, 341.0, 515.0, 839.0, 1332.0, 2235.0, 3481.0, 5843.0, 9987.0, 16518.0, 28248.0, 48116.0, 80827.0, 131476.0, 191619.0, 192569.0, 133090.0, 81553.0, 48358.0, 28493.0, 16923.0, 9944.0, 5975.0, 3592.0, 2282.0, 1384.0, 858.0, 518.0, 335.0, 229.0, 135.0, 83.0, 66.0, 51.0, 34.0, 22.0, 11.0, 5.0, 11.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7578125, -0.7333755493164062, -0.7089385986328125, -0.6845016479492188, -0.660064697265625, -0.6356277465820312, -0.6111907958984375, -0.5867538452148438, -0.56231689453125, -0.5378799438476562, -0.5134429931640625, -0.48900604248046875, -0.464569091796875, -0.44013214111328125, -0.4156951904296875, -0.39125823974609375, -0.3668212890625, -0.34238433837890625, -0.3179473876953125, -0.29351043701171875, -0.269073486328125, -0.24463653564453125, -0.2201995849609375, -0.19576263427734375, -0.17132568359375, -0.14688873291015625, -0.1224517822265625, -0.09801483154296875, -0.073577880859375, -0.04914093017578125, -0.0247039794921875, -0.00026702880859375, 0.024169921875, 0.04860687255859375, 0.0730438232421875, 0.09748077392578125, 0.121917724609375, 0.14635467529296875, 0.1707916259765625, 0.19522857666015625, 0.21966552734375, 0.24410247802734375, 0.2685394287109375, 0.29297637939453125, 0.317413330078125, 0.34185028076171875, 0.3662872314453125, 0.39072418212890625, 0.4151611328125, 0.43959808349609375, 0.4640350341796875, 0.48847198486328125, 0.512908935546875, 0.5373458862304688, 0.5617828369140625, 0.5862197875976562, 0.61065673828125, 0.6350936889648438, 0.6595306396484375, 0.6839675903320312, 0.708404541015625, 0.7328414916992188, 0.7572784423828125, 0.7817153930664062, 0.80615234375]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 6.0, 6.0, 7.0, 11.0, 10.0, 16.0, 18.0, 19.0, 15.0, 24.0, 24.0, 36.0, 35.0, 43.0, 42.0, 28.0, 48.0, 45.0, 55.0, 1055.0, 43.0, 36.0, 43.0, 37.0, 44.0, 36.0, 27.0, 39.0, 28.0, 27.0, 21.0, 13.0, 15.0, 8.0, 13.0, 11.0, 13.0, 10.0, 6.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.29296875, -4.15185546875, -4.0107421875, -3.86962890625, -3.728515625, -3.58740234375, -3.4462890625, -3.30517578125, -3.1640625, -3.02294921875, -2.8818359375, -2.74072265625, -2.599609375, -2.45849609375, -2.3173828125, -2.17626953125, -2.03515625, -1.89404296875, -1.7529296875, -1.61181640625, -1.470703125, -1.32958984375, -1.1884765625, -1.04736328125, -0.90625, -0.76513671875, -0.6240234375, -0.48291015625, -0.341796875, -0.20068359375, -0.0595703125, 0.08154296875, 0.22265625, 0.36376953125, 0.5048828125, 0.64599609375, 0.787109375, 0.92822265625, 1.0693359375, 1.21044921875, 1.3515625, 1.49267578125, 1.6337890625, 1.77490234375, 1.916015625, 2.05712890625, 2.1982421875, 2.33935546875, 2.48046875, 2.62158203125, 2.7626953125, 2.90380859375, 3.044921875, 3.18603515625, 3.3271484375, 3.46826171875, 3.609375, 3.75048828125, 3.8916015625, 4.03271484375, 4.173828125, 4.31494140625, 4.4560546875, 4.59716796875, 4.73828125]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 2.0, 6.0, 4.0, 8.0, 15.0, 18.0, 39.0, 43.0, 81.0, 114.0, 161.0, 284.0, 397.0, 628.0, 937.0, 1477.0, 2131.0, 3487.0, 5251.0, 8044.0, 12445.0, 19322.0, 30527.0, 48548.0, 76974.0, 118374.0, 176523.0, 1203420.0, 136713.0, 91460.0, 57972.0, 36571.0, 22926.0, 14870.0, 9521.0, 6249.0, 3984.0, 2717.0, 1665.0, 1128.0, 731.0, 455.0, 307.0, 192.0, 145.0, 90.0, 64.0, 37.0, 28.0, 16.0, 16.0, 10.0, 4.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.453125, -0.4385986328125, -0.424072265625, -0.4095458984375, -0.39501953125, -0.3804931640625, -0.365966796875, -0.3514404296875, -0.3369140625, -0.3223876953125, -0.307861328125, -0.2933349609375, -0.27880859375, -0.2642822265625, -0.249755859375, -0.2352294921875, -0.220703125, -0.2061767578125, -0.191650390625, -0.1771240234375, -0.16259765625, -0.1480712890625, -0.133544921875, -0.1190185546875, -0.1044921875, -0.0899658203125, -0.075439453125, -0.0609130859375, -0.04638671875, -0.0318603515625, -0.017333984375, -0.0028076171875, 0.01171875, 0.0262451171875, 0.040771484375, 0.0552978515625, 0.06982421875, 0.0843505859375, 0.098876953125, 0.1134033203125, 0.1279296875, 0.1424560546875, 0.156982421875, 0.1715087890625, 0.18603515625, 0.2005615234375, 0.215087890625, 0.2296142578125, 0.244140625, 0.2586669921875, 0.273193359375, 0.2877197265625, 0.30224609375, 0.3167724609375, 0.331298828125, 0.3458251953125, 0.3603515625, 0.3748779296875, 0.389404296875, 0.4039306640625, 0.41845703125, 0.4329833984375, 0.447509765625, 0.4620361328125, 0.4765625]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 5.0, 13.0, 15.0, 16.0, 48.0, 139.0, 441.0, 188.0, 60.0, 27.0, 14.0, 4.0, 3.0, 0.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.07061767578125, -0.06857967376708984, -0.06654167175292969, -0.06450366973876953, -0.062465667724609375, -0.06042766571044922, -0.05838966369628906, -0.056351661682128906, -0.05431365966796875, -0.052275657653808594, -0.05023765563964844, -0.04819965362548828, -0.046161651611328125, -0.04412364959716797, -0.04208564758300781, -0.040047645568847656, -0.0380096435546875, -0.035971641540527344, -0.03393363952636719, -0.03189563751220703, -0.029857635498046875, -0.02781963348388672, -0.025781631469726562, -0.023743629455566406, -0.02170562744140625, -0.019667625427246094, -0.017629623413085938, -0.015591621398925781, -0.013553619384765625, -0.011515617370605469, -0.009477615356445312, -0.007439613342285156, -0.005401611328125, -0.0033636093139648438, -0.0013256072998046875, 0.0007123947143554688, 0.002750396728515625, 0.004788398742675781, 0.0068264007568359375, 0.008864402770996094, 0.01090240478515625, 0.012940406799316406, 0.014978408813476562, 0.01701641082763672, 0.019054412841796875, 0.02109241485595703, 0.023130416870117188, 0.025168418884277344, 0.0272064208984375, 0.029244422912597656, 0.03128242492675781, 0.03332042694091797, 0.035358428955078125, 0.03739643096923828, 0.03943443298339844, 0.041472434997558594, 0.04351043701171875, 0.045548439025878906, 0.04758644104003906, 0.04962444305419922, 0.051662445068359375, 0.05370044708251953, 0.05573844909667969, 0.057776451110839844, 0.059814453125]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 6.0, 3.0, 4.0, 6.0, 11.0, 21.0, 26.0, 38.0, 83.0, 160.0, 2977.0, 1043846.0, 974.0, 173.0, 71.0, 32.0, 18.0, 20.0, 16.0, 17.0, 8.0, 5.0, 6.0, 5.0, 1.0, 2.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.1787109375, -1.1385955810546875, -1.098480224609375, -1.0583648681640625, -1.01824951171875, -0.9781341552734375, -0.938018798828125, -0.8979034423828125, -0.8577880859375, -0.8176727294921875, -0.777557373046875, -0.7374420166015625, -0.69732666015625, -0.6572113037109375, -0.617095947265625, -0.5769805908203125, -0.536865234375, -0.4967498779296875, -0.456634521484375, -0.4165191650390625, -0.37640380859375, -0.3362884521484375, -0.296173095703125, -0.2560577392578125, -0.2159423828125, -0.1758270263671875, -0.135711669921875, -0.0955963134765625, -0.05548095703125, -0.0153656005859375, 0.024749755859375, 0.0648651123046875, 0.10498046875, 0.1450958251953125, 0.185211181640625, 0.2253265380859375, 0.26544189453125, 0.3055572509765625, 0.345672607421875, 0.3857879638671875, 0.4259033203125, 0.4660186767578125, 0.506134033203125, 0.5462493896484375, 0.58636474609375, 0.6264801025390625, 0.666595458984375, 0.7067108154296875, 0.746826171875, 0.7869415283203125, 0.827056884765625, 0.8671722412109375, 0.90728759765625, 0.9474029541015625, 0.987518310546875, 1.0276336669921875, 1.0677490234375, 1.1078643798828125, 1.147979736328125, 1.1880950927734375, 1.22821044921875, 1.2683258056640625, 1.308441162109375, 1.3485565185546875, 1.388671875]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 40.0, 720.0, 240.0, 12.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4045638144016266, -0.39690497517585754, -0.3892461061477661, -0.38158726692199707, -0.37392839789390564, -0.3662695586681366, -0.35861068964004517, -0.3509518504142761, -0.3432930111885071, -0.33563417196273804, -0.3279753029346466, -0.32031646370887756, -0.31265759468078613, -0.3049987554550171, -0.29733988642692566, -0.2896810472011566, -0.2820221781730652, -0.27436333894729614, -0.2667044699192047, -0.25904563069343567, -0.25138676166534424, -0.2437279224395752, -0.23606906831264496, -0.22841021418571472, -0.22075136005878448, -0.21309250593185425, -0.205433651804924, -0.19777479767799377, -0.19011595845222473, -0.1824570894241333, -0.17479825019836426, -0.16713939607143402, -0.15948054194450378, -0.15182168781757355, -0.1441628336906433, -0.13650397956371307, -0.12884512543678284, -0.1211862787604332, -0.11352743208408356, -0.10586857795715332, -0.09820971637964249, -0.09055086225271225, -0.08289201557636261, -0.07523316144943237, -0.06757430732250214, -0.0599154531955719, -0.05225660279393196, -0.04459775239229202, -0.036938898265361786, -0.0292800460010767, -0.02162119373679161, -0.013962341472506523, -0.0063034892082214355, 0.0013553649187088013, 0.00901421532034874, 0.016673065721988678, 0.024331919848918915, 0.03199077397584915, 0.03964962437748909, 0.04730847477912903, 0.054967328906059265, 0.0626261830329895, 0.07028503715991974, 0.07794388383626938, 0.08560273796319962]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 4.0, 2.0, 3.0, 7.0, 8.0, 4.0, 16.0, 12.0, 12.0, 13.0, 15.0, 16.0, 21.0, 30.0, 29.0, 36.0, 32.0, 32.0, 46.0, 38.0, 42.0, 50.0, 34.0, 44.0, 43.0, 40.0, 34.0, 44.0, 27.0, 37.0, 30.0, 21.0, 34.0, 29.0, 24.0, 14.0, 22.0, 17.0, 5.0, 6.0, 7.0, 5.0, 7.0, 4.0, 6.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.023527026176452637, -0.022762481123209, -0.021997936069965363, -0.021233391016721725, -0.02046884596347809, -0.01970430091023445, -0.018939755856990814, -0.018175210803747177, -0.01741066575050354, -0.016646120697259903, -0.015881575644016266, -0.015117030590772629, -0.014352485537528992, -0.013587940484285355, -0.012823395431041718, -0.01205885037779808, -0.011294305324554443, -0.010529760271310806, -0.00976521521806717, -0.009000670164823532, -0.008236125111579895, -0.007471580058336258, -0.006707035005092621, -0.005942489951848984, -0.005177944898605347, -0.00441339984536171, -0.0036488547921180725, -0.0028843097388744354, -0.0021197646856307983, -0.0013552196323871613, -0.0005906745791435242, 0.00017387047410011292, 0.00093841552734375, 0.001702960580587387, 0.002467505633831024, 0.0032320506870746613, 0.003996595740318298, 0.004761140793561935, 0.0055256858468055725, 0.00629023090004921, 0.007054775953292847, 0.007819321006536484, 0.00858386605978012, 0.009348411113023758, 0.010112956166267395, 0.010877501219511032, 0.01164204627275467, 0.012406591325998306, 0.013171136379241943, 0.01393568143248558, 0.014700226485729218, 0.015464771538972855, 0.01622931659221649, 0.01699386164546013, 0.017758406698703766, 0.018522951751947403, 0.01928749680519104, 0.020052041858434677, 0.020816586911678314, 0.02158113196492195, 0.02234567701816559, 0.023110222071409225, 0.023874767124652863, 0.0246393121778965, 0.025403857231140137]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 0.0, 5.0, 4.0, 3.0, 4.0, 10.0, 10.0, 9.0, 7.0, 13.0, 24.0, 10.0, 27.0, 26.0, 35.0, 36.0, 32.0, 40.0, 47.0, 55.0, 34.0, 40.0, 49.0, 43.0, 36.0, 52.0, 36.0, 39.0, 27.0, 35.0, 32.0, 27.0, 21.0, 19.0, 23.0, 14.0, 13.0, 16.0, 16.0, 4.0, 7.0, 7.0, 3.0, 7.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.375, -6.1685791015625, -5.962158203125, -5.7557373046875, -5.54931640625, -5.3428955078125, -5.136474609375, -4.9300537109375, -4.7236328125, -4.5172119140625, -4.310791015625, -4.1043701171875, -3.89794921875, -3.6915283203125, -3.485107421875, -3.2786865234375, -3.072265625, -2.8658447265625, -2.659423828125, -2.4530029296875, -2.24658203125, -2.0401611328125, -1.833740234375, -1.6273193359375, -1.4208984375, -1.2144775390625, -1.008056640625, -0.8016357421875, -0.59521484375, -0.3887939453125, -0.182373046875, 0.0240478515625, 0.23046875, 0.4368896484375, 0.643310546875, 0.8497314453125, 1.05615234375, 1.2625732421875, 1.468994140625, 1.6754150390625, 1.8818359375, 2.0882568359375, 2.294677734375, 2.5010986328125, 2.70751953125, 2.9139404296875, 3.120361328125, 3.3267822265625, 3.533203125, 3.7396240234375, 3.946044921875, 4.1524658203125, 4.35888671875, 4.5653076171875, 4.771728515625, 4.9781494140625, 5.1845703125, 5.3909912109375, 5.597412109375, 5.8038330078125, 6.01025390625, 6.2166748046875, 6.423095703125, 6.6295166015625, 6.8359375]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 5.0, 4.0, 6.0, 6.0, 9.0, 13.0, 12.0, 13.0, 29.0, 38.0, 31.0, 59.0, 60.0, 96.0, 158.0, 195.0, 406.0, 977.0, 3426.0, 13887.0, 67762.0, 543113.0, 352774.0, 50007.0, 10936.0, 2694.0, 817.0, 313.0, 212.0, 116.0, 88.0, 71.0, 48.0, 38.0, 29.0, 21.0, 22.0, 20.0, 9.0, 8.0, 8.0, 4.0, 8.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-12.640625, -12.231689453125, -11.82275390625, -11.413818359375, -11.0048828125, -10.595947265625, -10.18701171875, -9.778076171875, -9.369140625, -8.960205078125, -8.55126953125, -8.142333984375, -7.7333984375, -7.324462890625, -6.91552734375, -6.506591796875, -6.09765625, -5.688720703125, -5.27978515625, -4.870849609375, -4.4619140625, -4.052978515625, -3.64404296875, -3.235107421875, -2.826171875, -2.417236328125, -2.00830078125, -1.599365234375, -1.1904296875, -0.781494140625, -0.37255859375, 0.036376953125, 0.4453125, 0.854248046875, 1.26318359375, 1.672119140625, 2.0810546875, 2.489990234375, 2.89892578125, 3.307861328125, 3.716796875, 4.125732421875, 4.53466796875, 4.943603515625, 5.3525390625, 5.761474609375, 6.17041015625, 6.579345703125, 6.98828125, 7.397216796875, 7.80615234375, 8.215087890625, 8.6240234375, 9.032958984375, 9.44189453125, 9.850830078125, 10.259765625, 10.668701171875, 11.07763671875, 11.486572265625, 11.8955078125, 12.304443359375, 12.71337890625, 13.122314453125, 13.53125]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 4.0, 6.0, 8.0, 10.0, 13.0, 18.0, 10.0, 19.0, 21.0, 28.0, 24.0, 29.0, 34.0, 28.0, 37.0, 42.0, 46.0, 61.0, 97.0, 345.0, 1540.0, 149.0, 57.0, 71.0, 52.0, 32.0, 30.0, 46.0, 36.0, 23.0, 16.0, 17.0, 15.0, 20.0, 9.0, 10.0, 13.0, 6.0, 6.0, 6.0, 6.0, 5.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-21.15625, -20.537109375, -19.91796875, -19.298828125, -18.6796875, -18.060546875, -17.44140625, -16.822265625, -16.203125, -15.583984375, -14.96484375, -14.345703125, -13.7265625, -13.107421875, -12.48828125, -11.869140625, -11.25, -10.630859375, -10.01171875, -9.392578125, -8.7734375, -8.154296875, -7.53515625, -6.916015625, -6.296875, -5.677734375, -5.05859375, -4.439453125, -3.8203125, -3.201171875, -2.58203125, -1.962890625, -1.34375, -0.724609375, -0.10546875, 0.513671875, 1.1328125, 1.751953125, 2.37109375, 2.990234375, 3.609375, 4.228515625, 4.84765625, 5.466796875, 6.0859375, 6.705078125, 7.32421875, 7.943359375, 8.5625, 9.181640625, 9.80078125, 10.419921875, 11.0390625, 11.658203125, 12.27734375, 12.896484375, 13.515625, 14.134765625, 14.75390625, 15.373046875, 15.9921875, 16.611328125, 17.23046875, 17.849609375, 18.46875]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 10.0, 5.0, 9.0, 6.0, 11.0, 13.0, 14.0, 14.0, 23.0, 19.0, 23.0, 39.0, 56.0, 84.0, 61.0, 139.0, 194.0, 357.0, 848.0, 6936.0, 2121656.0, 1007680.0, 5616.0, 857.0, 341.0, 165.0, 128.0, 90.0, 66.0, 64.0, 33.0, 30.0, 21.0, 21.0, 20.0, 16.0, 16.0, 7.0, 6.0, 7.0, 1.0, 1.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-42.5625, -41.14208984375, -39.7216796875, -38.30126953125, -36.880859375, -35.46044921875, -34.0400390625, -32.61962890625, -31.19921875, -29.77880859375, -28.3583984375, -26.93798828125, -25.517578125, -24.09716796875, -22.6767578125, -21.25634765625, -19.8359375, -18.41552734375, -16.9951171875, -15.57470703125, -14.154296875, -12.73388671875, -11.3134765625, -9.89306640625, -8.47265625, -7.05224609375, -5.6318359375, -4.21142578125, -2.791015625, -1.37060546875, 0.0498046875, 1.47021484375, 2.890625, 4.31103515625, 5.7314453125, 7.15185546875, 8.572265625, 9.99267578125, 11.4130859375, 12.83349609375, 14.25390625, 15.67431640625, 17.0947265625, 18.51513671875, 19.935546875, 21.35595703125, 22.7763671875, 24.19677734375, 25.6171875, 27.03759765625, 28.4580078125, 29.87841796875, 31.298828125, 32.71923828125, 34.1396484375, 35.56005859375, 36.98046875, 38.40087890625, 39.8212890625, 41.24169921875, 42.662109375, 44.08251953125, 45.5029296875, 46.92333984375, 48.34375]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 25.0, 331.0, 533.0, 117.0, 9.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-239.1573486328125, -234.90525817871094, -230.6531524658203, -226.40106201171875, -222.1489715576172, -217.89686584472656, -213.644775390625, -209.39268493652344, -205.1405792236328, -200.88848876953125, -196.63638305664062, -192.38429260253906, -188.1322021484375, -183.88009643554688, -179.6280059814453, -175.37591552734375, -171.12380981445312, -166.87171936035156, -162.61961364746094, -158.36752319335938, -154.1154327392578, -149.8633270263672, -145.61123657226562, -141.35914611816406, -137.1070556640625, -132.85496520996094, -128.6028594970703, -124.35076904296875, -120.09867095947266, -115.84657287597656, -111.594482421875, -107.3423843383789, -103.09027099609375, -98.83817291259766, -94.5860824584961, -90.333984375, -86.0818862915039, -81.82978820800781, -77.57769775390625, -73.32559967041016, -69.0735092163086, -64.8214111328125, -60.56931686401367, -56.317222595214844, -52.06512451171875, -47.81303024291992, -43.560935974121094, -39.308837890625, -35.05674362182617, -30.80464744567871, -26.55255126953125, -22.300457000732422, -18.04836082458496, -13.7962646484375, -9.544170379638672, -5.292074203491211, -1.03997802734375, 3.2121176719665527, 7.4642133712768555, 11.71630859375, 15.968404769897461, 20.220500946044922, 24.47259521484375, 28.72469139099121, 32.97678756713867]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 6.0, 4.0, 10.0, 11.0, 8.0, 9.0, 17.0, 18.0, 21.0, 28.0, 27.0, 39.0, 31.0, 41.0, 39.0, 43.0, 51.0, 41.0, 44.0, 56.0, 61.0, 53.0, 54.0, 41.0, 31.0, 37.0, 25.0, 30.0, 30.0, 15.0, 19.0, 10.0, 12.0, 13.0, 14.0, 9.0, 4.0, 6.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.69481658935547, -46.60063171386719, -44.506446838378906, -42.41226577758789, -40.31808090209961, -38.22389602661133, -36.12971496582031, -34.03553009033203, -31.94134521484375, -29.84716033935547, -27.75297737121582, -25.658794403076172, -23.56460952758789, -21.47042465209961, -19.37624168395996, -17.282058715820312, -15.187873840332031, -13.093689918518066, -10.999505996704102, -8.905322074890137, -6.811138153076172, -4.716954231262207, -2.622770309448242, -0.5285863876342773, 1.5655975341796875, 3.6597814559936523, 5.753965377807617, 7.848149299621582, 9.942333221435547, 12.036517143249512, 14.130701065063477, 16.224884033203125, 18.319076538085938, 20.41326141357422, 22.507444381713867, 24.601627349853516, 26.695812225341797, 28.789997100830078, 30.884180068969727, 32.978363037109375, 35.072547912597656, 37.16673278808594, 39.26091766357422, 41.355098724365234, 43.449283599853516, 45.5434684753418, 47.63764953613281, 49.731834411621094, 51.826019287109375, 53.920204162597656, 56.01438903808594, 58.10857009887695, 60.202754974365234, 62.296939849853516, 64.39112091064453, 66.48530578613281, 68.5794906616211, 70.67367553710938, 72.76786041259766, 74.86204528808594, 76.95622253417969, 79.05040740966797, 81.14459228515625, 83.23877716064453, 85.33296203613281]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 8.0, 1.0, 5.0, 3.0, 6.0, 6.0, 10.0, 18.0, 13.0, 13.0, 17.0, 17.0, 30.0, 18.0, 30.0, 32.0, 36.0, 36.0, 53.0, 41.0, 47.0, 41.0, 51.0, 36.0, 43.0, 35.0, 38.0, 36.0, 41.0, 35.0, 32.0, 20.0, 24.0, 19.0, 14.0, 21.0, 18.0, 13.0, 13.0, 7.0, 8.0, 7.0, 3.0, 5.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-7.13671875, -6.92486572265625, -6.7130126953125, -6.50115966796875, -6.289306640625, -6.07745361328125, -5.8656005859375, -5.65374755859375, -5.44189453125, -5.23004150390625, -5.0181884765625, -4.80633544921875, -4.594482421875, -4.38262939453125, -4.1707763671875, -3.95892333984375, -3.7470703125, -3.53521728515625, -3.3233642578125, -3.11151123046875, -2.899658203125, -2.68780517578125, -2.4759521484375, -2.26409912109375, -2.05224609375, -1.84039306640625, -1.6285400390625, -1.41668701171875, -1.204833984375, -0.99298095703125, -0.7811279296875, -0.56927490234375, -0.357421875, -0.14556884765625, 0.0662841796875, 0.27813720703125, 0.489990234375, 0.70184326171875, 0.9136962890625, 1.12554931640625, 1.33740234375, 1.54925537109375, 1.7611083984375, 1.97296142578125, 2.184814453125, 2.39666748046875, 2.6085205078125, 2.82037353515625, 3.0322265625, 3.24407958984375, 3.4559326171875, 3.66778564453125, 3.879638671875, 4.09149169921875, 4.3033447265625, 4.51519775390625, 4.72705078125, 4.93890380859375, 5.1507568359375, 5.36260986328125, 5.574462890625, 5.78631591796875, 5.9981689453125, 6.21002197265625, 6.421875]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 5.0, 4.0, 9.0, 7.0, 6.0, 17.0, 15.0, 28.0, 26.0, 29.0, 49.0, 82.0, 87.0, 108.0, 190.0, 211.0, 320.0, 382.0, 609.0, 855.0, 1372.0, 2119.0, 3556.0, 6219.0, 12506.0, 33851.0, 151680.0, 997155.0, 2302295.0, 543787.0, 89606.0, 23829.0, 9841.0, 5130.0, 2852.0, 1745.0, 1156.0, 760.0, 500.0, 330.0, 228.0, 180.0, 158.0, 94.0, 79.0, 51.0, 43.0, 39.0, 25.0, 19.0, 17.0, 8.0, 4.0, 9.0, 7.0, 1.0, 3.0, 4.0], "bins": [-13.5859375, -13.1903076171875, -12.794677734375, -12.3990478515625, -12.00341796875, -11.6077880859375, -11.212158203125, -10.8165283203125, -10.4208984375, -10.0252685546875, -9.629638671875, -9.2340087890625, -8.83837890625, -8.4427490234375, -8.047119140625, -7.6514892578125, -7.255859375, -6.8602294921875, -6.464599609375, -6.0689697265625, -5.67333984375, -5.2777099609375, -4.882080078125, -4.4864501953125, -4.0908203125, -3.6951904296875, -3.299560546875, -2.9039306640625, -2.50830078125, -2.1126708984375, -1.717041015625, -1.3214111328125, -0.92578125, -0.5301513671875, -0.134521484375, 0.2611083984375, 0.65673828125, 1.0523681640625, 1.447998046875, 1.8436279296875, 2.2392578125, 2.6348876953125, 3.030517578125, 3.4261474609375, 3.82177734375, 4.2174072265625, 4.613037109375, 5.0086669921875, 5.404296875, 5.7999267578125, 6.195556640625, 6.5911865234375, 6.98681640625, 7.3824462890625, 7.778076171875, 8.1737060546875, 8.5693359375, 8.9649658203125, 9.360595703125, 9.7562255859375, 10.15185546875, 10.5474853515625, 10.943115234375, 11.3387451171875, 11.734375]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 4.0, 0.0, 6.0, 8.0, 10.0, 11.0, 14.0, 18.0, 23.0, 52.0, 59.0, 84.0, 119.0, 218.0, 308.0, 519.0, 648.0, 703.0, 492.0, 259.0, 187.0, 98.0, 70.0, 45.0, 32.0, 24.0, 18.0, 15.0, 4.0, 7.0, 7.0, 2.0, 5.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-18.046875, -17.529296875, -17.01171875, -16.494140625, -15.9765625, -15.458984375, -14.94140625, -14.423828125, -13.90625, -13.388671875, -12.87109375, -12.353515625, -11.8359375, -11.318359375, -10.80078125, -10.283203125, -9.765625, -9.248046875, -8.73046875, -8.212890625, -7.6953125, -7.177734375, -6.66015625, -6.142578125, -5.625, -5.107421875, -4.58984375, -4.072265625, -3.5546875, -3.037109375, -2.51953125, -2.001953125, -1.484375, -0.966796875, -0.44921875, 0.068359375, 0.5859375, 1.103515625, 1.62109375, 2.138671875, 2.65625, 3.173828125, 3.69140625, 4.208984375, 4.7265625, 5.244140625, 5.76171875, 6.279296875, 6.796875, 7.314453125, 7.83203125, 8.349609375, 8.8671875, 9.384765625, 9.90234375, 10.419921875, 10.9375, 11.455078125, 11.97265625, 12.490234375, 13.0078125, 13.525390625, 14.04296875, 14.560546875, 15.078125]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 7.0, 5.0, 6.0, 6.0, 15.0, 17.0, 37.0, 49.0, 69.0, 132.0, 214.0, 355.0, 714.0, 1272.0, 3022.0, 7725.0, 28297.0, 282565.0, 3575966.0, 253451.0, 27117.0, 7482.0, 2866.0, 1334.0, 623.0, 386.0, 216.0, 122.0, 79.0, 49.0, 20.0, 28.0, 14.0, 9.0, 7.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.9375, -32.82421875, -31.7109375, -30.59765625, -29.484375, -28.37109375, -27.2578125, -26.14453125, -25.03125, -23.91796875, -22.8046875, -21.69140625, -20.578125, -19.46484375, -18.3515625, -17.23828125, -16.125, -15.01171875, -13.8984375, -12.78515625, -11.671875, -10.55859375, -9.4453125, -8.33203125, -7.21875, -6.10546875, -4.9921875, -3.87890625, -2.765625, -1.65234375, -0.5390625, 0.57421875, 1.6875, 2.80078125, 3.9140625, 5.02734375, 6.140625, 7.25390625, 8.3671875, 9.48046875, 10.59375, 11.70703125, 12.8203125, 13.93359375, 15.046875, 16.16015625, 17.2734375, 18.38671875, 19.5, 20.61328125, 21.7265625, 22.83984375, 23.953125, 25.06640625, 26.1796875, 27.29296875, 28.40625, 29.51953125, 30.6328125, 31.74609375, 32.859375, 33.97265625, 35.0859375, 36.19921875, 37.3125]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 10.0, 29.0, 59.0, 121.0, 196.0, 234.0, 165.0, 100.0, 45.0, 24.0, 13.0, 5.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-133.83023071289062, -130.26339721679688, -126.6965560913086, -123.12972259521484, -119.56288146972656, -115.99604797363281, -112.42921447753906, -108.86237335205078, -105.29553985595703, -101.72870635986328, -98.161865234375, -94.59503173828125, -91.02819061279297, -87.46135711669922, -83.89451599121094, -80.32768249511719, -76.76084899902344, -73.19401550292969, -69.6271743774414, -66.06034088134766, -62.49350357055664, -58.926666259765625, -55.35982894897461, -51.792991638183594, -48.22615051269531, -44.6593132019043, -41.09247589111328, -37.52564239501953, -33.958805084228516, -30.3919677734375, -26.825130462646484, -23.2582950592041, -19.69145965576172, -16.124622344970703, -12.55778694152832, -8.990949630737305, -5.4241132736206055, -1.8572769165039062, 1.7095603942871094, 5.276395797729492, 8.843233108520508, 12.410069465637207, 15.976905822753906, 19.543743133544922, 23.110580444335938, 26.67741584777832, 30.244253158569336, 33.81108856201172, 37.377925872802734, 40.94476318359375, 44.511600494384766, 48.07843780517578, 51.64527130126953, 55.21210861206055, 58.77894592285156, 62.34577941894531, 65.9126205444336, 69.47945404052734, 73.04629516601562, 76.61312866210938, 80.17996978759766, 83.7468032836914, 87.31364440917969, 90.88047790527344, 94.44731140136719]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 3.0, 3.0, 4.0, 10.0, 3.0, 9.0, 7.0, 14.0, 9.0, 13.0, 23.0, 19.0, 14.0, 22.0, 24.0, 20.0, 25.0, 32.0, 23.0, 41.0, 40.0, 38.0, 40.0, 46.0, 32.0, 46.0, 45.0, 38.0, 32.0, 42.0, 23.0, 30.0, 17.0, 31.0, 24.0, 24.0, 26.0, 22.0, 15.0, 10.0, 10.0, 4.0, 9.0, 13.0, 7.0, 5.0, 4.0, 4.0, 3.0, 1.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-39.722686767578125, -38.48804473876953, -37.25340270996094, -36.01875686645508, -34.784114837646484, -33.54947280883789, -32.31482696533203, -31.080184936523438, -29.845542907714844, -28.61090087890625, -27.376256942749023, -26.141613006591797, -24.906970977783203, -23.67232894897461, -22.437685012817383, -21.203041076660156, -19.968399047851562, -18.73375701904297, -17.499113082885742, -16.264469146728516, -15.029827117919922, -13.795184135437012, -12.560541152954102, -11.325898170471191, -10.091255187988281, -8.856612205505371, -7.621969223022461, -6.387326240539551, -5.152683258056641, -3.9180402755737305, -2.6833972930908203, -1.4487543106079102, -0.214111328125, 1.0205316543579102, 2.2551746368408203, 3.4898176193237305, 4.724460601806641, 5.959103584289551, 7.193746566772461, 8.428389549255371, 9.663032531738281, 10.897675514221191, 12.132318496704102, 13.366961479187012, 14.601604461669922, 15.836247444152832, 17.070890426635742, 18.30553436279297, 19.540176391601562, 20.774818420410156, 22.009462356567383, 23.24410629272461, 24.478748321533203, 25.713390350341797, 26.948034286499023, 28.18267822265625, 29.417320251464844, 30.651962280273438, 31.886606216430664, 33.12125015258789, 34.355892181396484, 35.59053421020508, 36.82518005371094, 38.05982208251953, 39.294464111328125]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 5.0, 4.0, 3.0, 3.0, 2.0, 4.0, 8.0, 4.0, 5.0, 14.0, 11.0, 7.0, 24.0, 24.0, 23.0, 17.0, 27.0, 22.0, 34.0, 32.0, 24.0, 38.0, 27.0, 39.0, 41.0, 47.0, 40.0, 46.0, 35.0, 28.0, 33.0, 42.0, 34.0, 23.0, 15.0, 23.0, 22.0, 19.0, 18.0, 21.0, 15.0, 24.0, 15.0, 14.0, 6.0, 5.0, 14.0, 5.0, 7.0, 11.0, 4.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-6.078125, -5.8751220703125, -5.672119140625, -5.4691162109375, -5.26611328125, -5.0631103515625, -4.860107421875, -4.6571044921875, -4.4541015625, -4.2510986328125, -4.048095703125, -3.8450927734375, -3.64208984375, -3.4390869140625, -3.236083984375, -3.0330810546875, -2.830078125, -2.6270751953125, -2.424072265625, -2.2210693359375, -2.01806640625, -1.8150634765625, -1.612060546875, -1.4090576171875, -1.2060546875, -1.0030517578125, -0.800048828125, -0.5970458984375, -0.39404296875, -0.1910400390625, 0.011962890625, 0.2149658203125, 0.41796875, 0.6209716796875, 0.823974609375, 1.0269775390625, 1.22998046875, 1.4329833984375, 1.635986328125, 1.8389892578125, 2.0419921875, 2.2449951171875, 2.447998046875, 2.6510009765625, 2.85400390625, 3.0570068359375, 3.260009765625, 3.4630126953125, 3.666015625, 3.8690185546875, 4.072021484375, 4.2750244140625, 4.47802734375, 4.6810302734375, 4.884033203125, 5.0870361328125, 5.2900390625, 5.4930419921875, 5.696044921875, 5.8990478515625, 6.10205078125, 6.3050537109375, 6.508056640625, 6.7110595703125, 6.9140625]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 6.0, 3.0, 2.0, 6.0, 9.0, 13.0, 25.0, 34.0, 56.0, 63.0, 101.0, 142.0, 229.0, 286.0, 476.0, 725.0, 1053.0, 1577.0, 2522.0, 3869.0, 5892.0, 9153.0, 14729.0, 24007.0, 40120.0, 68397.0, 115122.0, 182344.0, 209642.0, 146072.0, 88147.0, 51893.0, 30632.0, 18549.0, 11410.0, 7337.0, 4809.0, 3095.0, 2022.0, 1375.0, 859.0, 597.0, 384.0, 253.0, 175.0, 115.0, 76.0, 50.0, 40.0, 27.0, 16.0, 16.0, 7.0, 1.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.80859375, -0.7835159301757812, -0.7584381103515625, -0.7333602905273438, -0.708282470703125, -0.6832046508789062, -0.6581268310546875, -0.6330490112304688, -0.60797119140625, -0.5828933715820312, -0.5578155517578125, -0.5327377319335938, -0.507659912109375, -0.48258209228515625, -0.4575042724609375, -0.43242645263671875, -0.4073486328125, -0.38227081298828125, -0.3571929931640625, -0.33211517333984375, -0.307037353515625, -0.28195953369140625, -0.2568817138671875, -0.23180389404296875, -0.20672607421875, -0.18164825439453125, -0.1565704345703125, -0.13149261474609375, -0.106414794921875, -0.08133697509765625, -0.0562591552734375, -0.03118133544921875, -0.006103515625, 0.01897430419921875, 0.0440521240234375, 0.06912994384765625, 0.094207763671875, 0.11928558349609375, 0.1443634033203125, 0.16944122314453125, 0.19451904296875, 0.21959686279296875, 0.2446746826171875, 0.26975250244140625, 0.294830322265625, 0.31990814208984375, 0.3449859619140625, 0.37006378173828125, 0.3951416015625, 0.42021942138671875, 0.4452972412109375, 0.47037506103515625, 0.495452880859375, 0.5205307006835938, 0.5456085205078125, 0.5706863403320312, 0.59576416015625, 0.6208419799804688, 0.6459197998046875, 0.6709976196289062, 0.696075439453125, 0.7211532592773438, 0.7462310791015625, 0.7713088989257812, 0.79638671875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 5.0, 7.0, 3.0, 8.0, 6.0, 6.0, 10.0, 7.0, 20.0, 10.0, 19.0, 22.0, 25.0, 32.0, 29.0, 20.0, 38.0, 33.0, 40.0, 36.0, 40.0, 46.0, 1073.0, 43.0, 57.0, 46.0, 37.0, 28.0, 31.0, 27.0, 34.0, 19.0, 27.0, 18.0, 28.0, 15.0, 16.0, 13.0, 16.0, 6.0, 5.0, 7.0, 5.0, 2.0, 4.0, 4.0, 1.0, 1.0, 2.0, 4.0, 1.0, 0.0, 3.0], "bins": [-4.8203125, -4.676513671875, -4.53271484375, -4.388916015625, -4.2451171875, -4.101318359375, -3.95751953125, -3.813720703125, -3.669921875, -3.526123046875, -3.38232421875, -3.238525390625, -3.0947265625, -2.950927734375, -2.80712890625, -2.663330078125, -2.51953125, -2.375732421875, -2.23193359375, -2.088134765625, -1.9443359375, -1.800537109375, -1.65673828125, -1.512939453125, -1.369140625, -1.225341796875, -1.08154296875, -0.937744140625, -0.7939453125, -0.650146484375, -0.50634765625, -0.362548828125, -0.21875, -0.074951171875, 0.06884765625, 0.212646484375, 0.3564453125, 0.500244140625, 0.64404296875, 0.787841796875, 0.931640625, 1.075439453125, 1.21923828125, 1.363037109375, 1.5068359375, 1.650634765625, 1.79443359375, 1.938232421875, 2.08203125, 2.225830078125, 2.36962890625, 2.513427734375, 2.6572265625, 2.801025390625, 2.94482421875, 3.088623046875, 3.232421875, 3.376220703125, 3.52001953125, 3.663818359375, 3.8076171875, 3.951416015625, 4.09521484375, 4.239013671875, 4.3828125]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 5.0, 8.0, 12.0, 19.0, 32.0, 46.0, 72.0, 96.0, 139.0, 230.0, 332.0, 458.0, 680.0, 1007.0, 1634.0, 2283.0, 3452.0, 5124.0, 7802.0, 12004.0, 18593.0, 29037.0, 46586.0, 75402.0, 119507.0, 175190.0, 1220083.0, 136765.0, 88683.0, 55096.0, 34167.0, 21564.0, 13988.0, 9156.0, 5915.0, 3891.0, 2721.0, 1719.0, 1154.0, 824.0, 530.0, 362.0, 261.0, 162.0, 120.0, 71.0, 57.0, 35.0, 16.0, 19.0, 8.0, 7.0, 3.0, 3.0, 2.0, 4.0, 2.0, 1.0], "bins": [-0.501953125, -0.48635101318359375, -0.4707489013671875, -0.45514678955078125, -0.439544677734375, -0.42394256591796875, -0.4083404541015625, -0.39273834228515625, -0.37713623046875, -0.36153411865234375, -0.3459320068359375, -0.33032989501953125, -0.314727783203125, -0.29912567138671875, -0.2835235595703125, -0.26792144775390625, -0.2523193359375, -0.23671722412109375, -0.2211151123046875, -0.20551300048828125, -0.189910888671875, -0.17430877685546875, -0.1587066650390625, -0.14310455322265625, -0.12750244140625, -0.11190032958984375, -0.0962982177734375, -0.08069610595703125, -0.065093994140625, -0.04949188232421875, -0.0338897705078125, -0.01828765869140625, -0.002685546875, 0.01291656494140625, 0.0285186767578125, 0.04412078857421875, 0.059722900390625, 0.07532501220703125, 0.0909271240234375, 0.10652923583984375, 0.12213134765625, 0.13773345947265625, 0.1533355712890625, 0.16893768310546875, 0.184539794921875, 0.20014190673828125, 0.2157440185546875, 0.23134613037109375, 0.2469482421875, 0.26255035400390625, 0.2781524658203125, 0.29375457763671875, 0.309356689453125, 0.32495880126953125, 0.3405609130859375, 0.35616302490234375, 0.37176513671875, 0.38736724853515625, 0.4029693603515625, 0.41857147216796875, 0.434173583984375, 0.44977569580078125, 0.4653778076171875, 0.48097991943359375, 0.49658203125]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 3.0, 5.0, 5.0, 7.0, 10.0, 9.0, 9.0, 11.0, 14.0, 21.0, 25.0, 22.0, 33.0, 50.0, 50.0, 56.0, 45.0, 78.0, 98.0, 58.0, 61.0, 50.0, 43.0, 47.0, 41.0, 30.0, 23.0, 18.0, 14.0, 8.0, 10.0, 11.0, 6.0, 6.0, 3.0, 3.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0159912109375, -0.015482664108276367, -0.014974117279052734, -0.014465570449829102, -0.013957023620605469, -0.013448476791381836, -0.012939929962158203, -0.01243138313293457, -0.011922836303710938, -0.011414289474487305, -0.010905742645263672, -0.010397195816040039, -0.009888648986816406, -0.009380102157592773, -0.00887155532836914, -0.008363008499145508, -0.007854461669921875, -0.007345914840698242, -0.006837368011474609, -0.0063288211822509766, -0.005820274353027344, -0.005311727523803711, -0.004803180694580078, -0.004294633865356445, -0.0037860870361328125, -0.0032775402069091797, -0.002768993377685547, -0.002260446548461914, -0.0017518997192382812, -0.0012433528900146484, -0.0007348060607910156, -0.0002262592315673828, 0.00028228759765625, 0.0007908344268798828, 0.0012993812561035156, 0.0018079280853271484, 0.0023164749145507812, 0.002825021743774414, 0.003333568572998047, 0.0038421154022216797, 0.0043506622314453125, 0.004859209060668945, 0.005367755889892578, 0.005876302719116211, 0.006384849548339844, 0.0068933963775634766, 0.007401943206787109, 0.007910490036010742, 0.008419036865234375, 0.008927583694458008, 0.00943613052368164, 0.009944677352905273, 0.010453224182128906, 0.010961771011352539, 0.011470317840576172, 0.011978864669799805, 0.012487411499023438, 0.01299595832824707, 0.013504505157470703, 0.014013051986694336, 0.014521598815917969, 0.015030145645141602, 0.015538692474365234, 0.016047239303588867, 0.0165557861328125]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 2.0, 6.0, 4.0, 4.0, 7.0, 8.0, 9.0, 10.0, 22.0, 18.0, 21.0, 35.0, 37.0, 52.0, 79.0, 107.0, 187.0, 255.0, 516.0, 5494.0, 1034362.0, 5912.0, 537.0, 281.0, 176.0, 101.0, 69.0, 44.0, 42.0, 38.0, 22.0, 23.0, 11.0, 19.0, 11.0, 18.0, 8.0, 3.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.366943359375, -0.3556556701660156, -0.34436798095703125, -0.3330802917480469, -0.3217926025390625, -0.3105049133300781, -0.29921722412109375, -0.2879295349121094, -0.276641845703125, -0.2653541564941406, -0.25406646728515625, -0.24277877807617188, -0.2314910888671875, -0.22020339965820312, -0.20891571044921875, -0.19762802124023438, -0.18634033203125, -0.17505264282226562, -0.16376495361328125, -0.15247726440429688, -0.1411895751953125, -0.12990188598632812, -0.11861419677734375, -0.10732650756835938, -0.096038818359375, -0.08475112915039062, -0.07346343994140625, -0.062175750732421875, -0.0508880615234375, -0.039600372314453125, -0.02831268310546875, -0.017024993896484375, -0.0057373046875, 0.005550384521484375, 0.01683807373046875, 0.028125762939453125, 0.0394134521484375, 0.050701141357421875, 0.06198883056640625, 0.07327651977539062, 0.084564208984375, 0.09585189819335938, 0.10713958740234375, 0.11842727661132812, 0.1297149658203125, 0.14100265502929688, 0.15229034423828125, 0.16357803344726562, 0.17486572265625, 0.18615341186523438, 0.19744110107421875, 0.20872879028320312, 0.2200164794921875, 0.23130416870117188, 0.24259185791015625, 0.2538795471191406, 0.265167236328125, 0.2764549255371094, 0.28774261474609375, 0.2990303039550781, 0.3103179931640625, 0.3216056823730469, 0.33289337158203125, 0.3441810607910156, 0.35546875]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 16.0, 793.0, 203.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.034030091017484665, -0.025136243551969528, -0.01624239608645439, -0.007348548620939255, 0.001545298844575882, 0.010439146310091019, 0.019332993775606155, 0.028226841241121292, 0.03712068870663643, 0.046014536172151566, 0.0549083836376667, 0.06380222737789154, 0.07269607484340668, 0.08158992230892181, 0.09048376977443695, 0.09937761723995209, 0.10827146470546722, 0.11716531217098236, 0.1260591596364975, 0.13495300710201263, 0.14384685456752777, 0.1527407020330429, 0.16163454949855804, 0.17052839696407318, 0.17942224442958832, 0.18831609189510345, 0.1972099393606186, 0.20610378682613373, 0.21499763429164886, 0.223891481757164, 0.23278532922267914, 0.24167917668819427, 0.2505730390548706, 0.25946688652038574, 0.2683607339859009, 0.277254581451416, 0.28614842891693115, 0.2950422763824463, 0.3039361238479614, 0.31282997131347656, 0.3217238187789917, 0.33061766624450684, 0.339511513710022, 0.3484053611755371, 0.35729920864105225, 0.3661930561065674, 0.3750869035720825, 0.38398075103759766, 0.3928745985031128, 0.40176844596862793, 0.41066229343414307, 0.4195561408996582, 0.42844998836517334, 0.4373438358306885, 0.4462376832962036, 0.45513153076171875, 0.4640253782272339, 0.472919225692749, 0.48181307315826416, 0.4907069206237793, 0.49960076808929443, 0.5084946155548096, 0.5173884630203247, 0.5262823104858398, 0.535176157951355]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 5.0, 7.0, 5.0, 7.0, 7.0, 11.0, 10.0, 15.0, 29.0, 19.0, 30.0, 35.0, 40.0, 35.0, 36.0, 38.0, 62.0, 56.0, 54.0, 46.0, 52.0, 50.0, 43.0, 35.0, 52.0, 45.0, 35.0, 25.0, 16.0, 20.0, 23.0, 19.0, 20.0, 10.0, 5.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03338998556137085, -0.0324234813451767, -0.03145698085427284, -0.03049047850072384, -0.029523976147174835, -0.02855747379362583, -0.027590971440076828, -0.026624469086527824, -0.02565796673297882, -0.024691464379429817, -0.023724962025880814, -0.02275845967233181, -0.021791957318782806, -0.020825454965233803, -0.0198589526116848, -0.018892450258135796, -0.017925947904586792, -0.01695944555103779, -0.015992943197488785, -0.015026440843939781, -0.014059938490390778, -0.013093436136841774, -0.01212693378329277, -0.011160431429743767, -0.010193929076194763, -0.00922742672264576, -0.008260924369096756, -0.007294422015547752, -0.006327919661998749, -0.005361417308449745, -0.004394914954900742, -0.003428412601351738, -0.0024619102478027344, -0.0014954078942537308, -0.0005289055407047272, 0.00043759681284427643, 0.00140409916639328, 0.0023706015199422836, 0.0033371038734912872, 0.004303606227040291, 0.005270108580589294, 0.006236610934138298, 0.007203113287687302, 0.008169615641236305, 0.009136117994785309, 0.010102620348334312, 0.011069122701883316, 0.01203562505543232, 0.013002127408981323, 0.013968629762530327, 0.01493513211607933, 0.015901634469628334, 0.016868136823177338, 0.01783463917672634, 0.018801141530275345, 0.01976764388382435, 0.020734146237373352, 0.021700648590922356, 0.02266715094447136, 0.023633653298020363, 0.024600155651569366, 0.02556665800511837, 0.026533160358667374, 0.027499662712216377, 0.02846616506576538]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 5.0, 4.0, 3.0, 3.0, 2.0, 3.0, 9.0, 3.0, 6.0, 13.0, 12.0, 7.0, 24.0, 23.0, 24.0, 16.0, 28.0, 21.0, 33.0, 33.0, 25.0, 38.0, 27.0, 39.0, 41.0, 46.0, 41.0, 46.0, 35.0, 28.0, 32.0, 43.0, 34.0, 23.0, 15.0, 22.0, 23.0, 19.0, 18.0, 21.0, 15.0, 24.0, 15.0, 14.0, 6.0, 5.0, 14.0, 5.0, 7.0, 11.0, 4.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-6.08203125, -5.87896728515625, -5.6759033203125, -5.47283935546875, -5.269775390625, -5.06671142578125, -4.8636474609375, -4.66058349609375, -4.45751953125, -4.25445556640625, -4.0513916015625, -3.84832763671875, -3.645263671875, -3.44219970703125, -3.2391357421875, -3.03607177734375, -2.8330078125, -2.62994384765625, -2.4268798828125, -2.22381591796875, -2.020751953125, -1.81768798828125, -1.6146240234375, -1.41156005859375, -1.20849609375, -1.00543212890625, -0.8023681640625, -0.59930419921875, -0.396240234375, -0.19317626953125, 0.0098876953125, 0.21295166015625, 0.416015625, 0.61907958984375, 0.8221435546875, 1.02520751953125, 1.228271484375, 1.43133544921875, 1.6343994140625, 1.83746337890625, 2.04052734375, 2.24359130859375, 2.4466552734375, 2.64971923828125, 2.852783203125, 3.05584716796875, 3.2589111328125, 3.46197509765625, 3.6650390625, 3.86810302734375, 4.0711669921875, 4.27423095703125, 4.477294921875, 4.68035888671875, 4.8834228515625, 5.08648681640625, 5.28955078125, 5.49261474609375, 5.6956787109375, 5.89874267578125, 6.101806640625, 6.30487060546875, 6.5079345703125, 6.71099853515625, 6.9140625]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 5.0, 7.0, 8.0, 9.0, 7.0, 11.0, 12.0, 18.0, 28.0, 34.0, 49.0, 45.0, 75.0, 120.0, 163.0, 201.0, 293.0, 367.0, 536.0, 833.0, 1274.0, 2008.0, 3497.0, 6582.0, 14962.0, 47287.0, 523660.0, 374970.0, 42151.0, 13963.0, 6234.0, 3267.0, 2002.0, 1209.0, 798.0, 493.0, 365.0, 256.0, 167.0, 144.0, 90.0, 94.0, 64.0, 48.0, 32.0, 26.0, 28.0, 11.0, 16.0, 21.0, 6.0, 5.0, 5.0, 3.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-14.5625, -14.076416015625, -13.59033203125, -13.104248046875, -12.6181640625, -12.132080078125, -11.64599609375, -11.159912109375, -10.673828125, -10.187744140625, -9.70166015625, -9.215576171875, -8.7294921875, -8.243408203125, -7.75732421875, -7.271240234375, -6.78515625, -6.299072265625, -5.81298828125, -5.326904296875, -4.8408203125, -4.354736328125, -3.86865234375, -3.382568359375, -2.896484375, -2.410400390625, -1.92431640625, -1.438232421875, -0.9521484375, -0.466064453125, 0.02001953125, 0.506103515625, 0.9921875, 1.478271484375, 1.96435546875, 2.450439453125, 2.9365234375, 3.422607421875, 3.90869140625, 4.394775390625, 4.880859375, 5.366943359375, 5.85302734375, 6.339111328125, 6.8251953125, 7.311279296875, 7.79736328125, 8.283447265625, 8.76953125, 9.255615234375, 9.74169921875, 10.227783203125, 10.7138671875, 11.199951171875, 11.68603515625, 12.172119140625, 12.658203125, 13.144287109375, 13.63037109375, 14.116455078125, 14.6025390625, 15.088623046875, 15.57470703125, 16.060791015625, 16.546875]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 0.0, 4.0, 2.0, 0.0, 1.0, 3.0, 4.0, 5.0, 10.0, 10.0, 13.0, 6.0, 7.0, 18.0, 20.0, 23.0, 21.0, 19.0, 27.0, 26.0, 25.0, 35.0, 50.0, 53.0, 66.0, 89.0, 180.0, 1620.0, 159.0, 87.0, 53.0, 60.0, 48.0, 34.0, 37.0, 35.0, 22.0, 34.0, 25.0, 24.0, 13.0, 22.0, 12.0, 13.0, 7.0, 4.0, 8.0, 7.0, 6.0, 9.0, 0.0, 1.0, 0.0, 1.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.890625, -19.258056640625, -18.62548828125, -17.992919921875, -17.3603515625, -16.727783203125, -16.09521484375, -15.462646484375, -14.830078125, -14.197509765625, -13.56494140625, -12.932373046875, -12.2998046875, -11.667236328125, -11.03466796875, -10.402099609375, -9.76953125, -9.136962890625, -8.50439453125, -7.871826171875, -7.2392578125, -6.606689453125, -5.97412109375, -5.341552734375, -4.708984375, -4.076416015625, -3.44384765625, -2.811279296875, -2.1787109375, -1.546142578125, -0.91357421875, -0.281005859375, 0.3515625, 0.984130859375, 1.61669921875, 2.249267578125, 2.8818359375, 3.514404296875, 4.14697265625, 4.779541015625, 5.412109375, 6.044677734375, 6.67724609375, 7.309814453125, 7.9423828125, 8.574951171875, 9.20751953125, 9.840087890625, 10.47265625, 11.105224609375, 11.73779296875, 12.370361328125, 13.0029296875, 13.635498046875, 14.26806640625, 14.900634765625, 15.533203125, 16.165771484375, 16.79833984375, 17.430908203125, 18.0634765625, 18.696044921875, 19.32861328125, 19.961181640625, 20.59375]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 2.0, 7.0, 4.0, 14.0, 9.0, 10.0, 13.0, 14.0, 19.0, 29.0, 37.0, 40.0, 61.0, 59.0, 100.0, 129.0, 286.0, 700.0, 3466.0, 62026.0, 3047148.0, 28086.0, 2261.0, 518.0, 215.0, 112.0, 69.0, 72.0, 46.0, 29.0, 26.0, 22.0, 17.0, 13.0, 19.0, 12.0, 5.0, 4.0, 2.0, 2.0, 6.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-66.1875, -64.0791015625, -61.970703125, -59.8623046875, -57.75390625, -55.6455078125, -53.537109375, -51.4287109375, -49.3203125, -47.2119140625, -45.103515625, -42.9951171875, -40.88671875, -38.7783203125, -36.669921875, -34.5615234375, -32.453125, -30.3447265625, -28.236328125, -26.1279296875, -24.01953125, -21.9111328125, -19.802734375, -17.6943359375, -15.5859375, -13.4775390625, -11.369140625, -9.2607421875, -7.15234375, -5.0439453125, -2.935546875, -0.8271484375, 1.28125, 3.3896484375, 5.498046875, 7.6064453125, 9.71484375, 11.8232421875, 13.931640625, 16.0400390625, 18.1484375, 20.2568359375, 22.365234375, 24.4736328125, 26.58203125, 28.6904296875, 30.798828125, 32.9072265625, 35.015625, 37.1240234375, 39.232421875, 41.3408203125, 43.44921875, 45.5576171875, 47.666015625, 49.7744140625, 51.8828125, 53.9912109375, 56.099609375, 58.2080078125, 60.31640625, 62.4248046875, 64.533203125, 66.6416015625, 68.75]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 12.0, 52.0, 277.0, 425.0, 184.0, 49.0, 7.0, 4.0, 1.0, 0.0, 1.0], "bins": [-212.79273986816406, -209.0165557861328, -205.24038696289062, -201.46420288085938, -197.68801879882812, -193.91183471679688, -190.1356658935547, -186.35948181152344, -182.58331298828125, -178.80712890625, -175.0309600830078, -171.25477600097656, -167.4785919189453, -163.70242309570312, -159.92623901367188, -156.15005493164062, -152.37387084960938, -148.59768676757812, -144.82151794433594, -141.0453338623047, -137.26914978027344, -133.49298095703125, -129.716796875, -125.94061279296875, -122.16443634033203, -118.38825988769531, -114.61207580566406, -110.83589935302734, -107.05972290039062, -103.28353881835938, -99.50736236572266, -95.73118591308594, -91.95499420166016, -88.17881774902344, -84.40263366699219, -80.62645721435547, -76.85028076171875, -73.0740966796875, -69.29792022705078, -65.52174377441406, -61.74555969238281, -57.96937942504883, -54.193199157714844, -50.417022705078125, -46.64084243774414, -42.864662170410156, -39.08848571777344, -35.31230545043945, -31.5361270904541, -27.75994873046875, -23.983768463134766, -20.20758819580078, -16.43140983581543, -12.655229568481445, -8.879051208496094, -5.102872848510742, -1.3266925811767578, 2.44948673248291, 6.225666046142578, 10.001845359802246, 13.778024673461914, 17.5542049407959, 21.33038330078125, 25.1065616607666, 28.882741928100586]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 6.0, 10.0, 6.0, 15.0, 15.0, 15.0, 12.0, 13.0, 30.0, 35.0, 25.0, 43.0, 40.0, 34.0, 44.0, 43.0, 50.0, 51.0, 39.0, 43.0, 53.0, 36.0, 41.0, 44.0, 36.0, 25.0, 31.0, 27.0, 19.0, 20.0, 17.0, 21.0, 13.0, 8.0, 13.0, 6.0, 4.0, 7.0, 4.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-61.248661041259766, -59.386024475097656, -57.52338409423828, -55.660743713378906, -53.7981071472168, -51.93547058105469, -50.07283020019531, -48.21018981933594, -46.34755325317383, -44.48491668701172, -42.622276306152344, -40.75963592529297, -38.89699935913086, -37.03436279296875, -35.171722412109375, -33.30908203125, -31.44644546508789, -29.58380699157715, -27.721168518066406, -25.858530044555664, -23.995891571044922, -22.13325309753418, -20.270614624023438, -18.407976150512695, -16.545337677001953, -14.682699203491211, -12.820060729980469, -10.957422256469727, -9.094783782958984, -7.232145309448242, -5.3695068359375, -3.506868362426758, -1.6442298889160156, 0.21840858459472656, 2.0810470581054688, 3.943685531616211, 5.806324005126953, 7.668962478637695, 9.531600952148438, 11.39423942565918, 13.256877899169922, 15.119516372680664, 16.982154846191406, 18.84479331970215, 20.70743179321289, 22.570070266723633, 24.432708740234375, 26.295347213745117, 28.15798568725586, 30.0206241607666, 31.883262634277344, 33.74590301513672, 35.60853958129883, 37.47117614746094, 39.33381652832031, 41.19645690917969, 43.0590934753418, 44.921730041503906, 46.78437042236328, 48.647010803222656, 50.509647369384766, 52.372283935546875, 54.23492431640625, 56.097564697265625, 57.960201263427734]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 4.0, 4.0, 3.0, 0.0, 4.0, 6.0, 8.0, 4.0, 6.0, 10.0, 18.0, 13.0, 11.0, 18.0, 27.0, 23.0, 36.0, 22.0, 30.0, 31.0, 34.0, 38.0, 39.0, 42.0, 47.0, 34.0, 41.0, 39.0, 44.0, 32.0, 27.0, 36.0, 30.0, 20.0, 24.0, 17.0, 30.0, 24.0, 21.0, 13.0, 19.0, 12.0, 16.0, 11.0, 8.0, 9.0, 5.0, 5.0, 5.0, 3.0, 4.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.34765625, -6.1312255859375, -5.914794921875, -5.6983642578125, -5.48193359375, -5.2655029296875, -5.049072265625, -4.8326416015625, -4.6162109375, -4.3997802734375, -4.183349609375, -3.9669189453125, -3.75048828125, -3.5340576171875, -3.317626953125, -3.1011962890625, -2.884765625, -2.6683349609375, -2.451904296875, -2.2354736328125, -2.01904296875, -1.8026123046875, -1.586181640625, -1.3697509765625, -1.1533203125, -0.9368896484375, -0.720458984375, -0.5040283203125, -0.28759765625, -0.0711669921875, 0.145263671875, 0.3616943359375, 0.578125, 0.7945556640625, 1.010986328125, 1.2274169921875, 1.44384765625, 1.6602783203125, 1.876708984375, 2.0931396484375, 2.3095703125, 2.5260009765625, 2.742431640625, 2.9588623046875, 3.17529296875, 3.3917236328125, 3.608154296875, 3.8245849609375, 4.041015625, 4.2574462890625, 4.473876953125, 4.6903076171875, 4.90673828125, 5.1231689453125, 5.339599609375, 5.5560302734375, 5.7724609375, 5.9888916015625, 6.205322265625, 6.4217529296875, 6.63818359375, 6.8546142578125, 7.071044921875, 7.2874755859375, 7.50390625]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 6.0, 8.0, 9.0, 9.0, 10.0, 17.0, 18.0, 28.0, 41.0, 64.0, 83.0, 119.0, 201.0, 307.0, 458.0, 723.0, 1160.0, 1830.0, 3121.0, 5360.0, 10535.0, 25562.0, 146566.0, 1980356.0, 1841724.0, 127645.0, 24304.0, 10176.0, 5425.0, 3079.0, 1871.0, 1186.0, 769.0, 494.0, 334.0, 214.0, 148.0, 93.0, 59.0, 45.0, 35.0, 22.0, 21.0, 14.0, 11.0, 12.0, 8.0, 3.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-20.53125, -19.90869140625, -19.2861328125, -18.66357421875, -18.041015625, -17.41845703125, -16.7958984375, -16.17333984375, -15.55078125, -14.92822265625, -14.3056640625, -13.68310546875, -13.060546875, -12.43798828125, -11.8154296875, -11.19287109375, -10.5703125, -9.94775390625, -9.3251953125, -8.70263671875, -8.080078125, -7.45751953125, -6.8349609375, -6.21240234375, -5.58984375, -4.96728515625, -4.3447265625, -3.72216796875, -3.099609375, -2.47705078125, -1.8544921875, -1.23193359375, -0.609375, 0.01318359375, 0.6357421875, 1.25830078125, 1.880859375, 2.50341796875, 3.1259765625, 3.74853515625, 4.37109375, 4.99365234375, 5.6162109375, 6.23876953125, 6.861328125, 7.48388671875, 8.1064453125, 8.72900390625, 9.3515625, 9.97412109375, 10.5966796875, 11.21923828125, 11.841796875, 12.46435546875, 13.0869140625, 13.70947265625, 14.33203125, 14.95458984375, 15.5771484375, 16.19970703125, 16.822265625, 17.44482421875, 18.0673828125, 18.68994140625, 19.3125]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 4.0, 1.0, 4.0, 5.0, 5.0, 3.0, 9.0, 11.0, 17.0, 16.0, 19.0, 33.0, 32.0, 74.0, 79.0, 127.0, 237.0, 375.0, 560.0, 731.0, 588.0, 407.0, 229.0, 145.0, 113.0, 64.0, 47.0, 34.0, 26.0, 14.0, 17.0, 11.0, 14.0, 6.0, 7.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.359375, -14.839599609375, -14.31982421875, -13.800048828125, -13.2802734375, -12.760498046875, -12.24072265625, -11.720947265625, -11.201171875, -10.681396484375, -10.16162109375, -9.641845703125, -9.1220703125, -8.602294921875, -8.08251953125, -7.562744140625, -7.04296875, -6.523193359375, -6.00341796875, -5.483642578125, -4.9638671875, -4.444091796875, -3.92431640625, -3.404541015625, -2.884765625, -2.364990234375, -1.84521484375, -1.325439453125, -0.8056640625, -0.285888671875, 0.23388671875, 0.753662109375, 1.2734375, 1.793212890625, 2.31298828125, 2.832763671875, 3.3525390625, 3.872314453125, 4.39208984375, 4.911865234375, 5.431640625, 5.951416015625, 6.47119140625, 6.990966796875, 7.5107421875, 8.030517578125, 8.55029296875, 9.070068359375, 9.58984375, 10.109619140625, 10.62939453125, 11.149169921875, 11.6689453125, 12.188720703125, 12.70849609375, 13.228271484375, 13.748046875, 14.267822265625, 14.78759765625, 15.307373046875, 15.8271484375, 16.346923828125, 16.86669921875, 17.386474609375, 17.90625]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 3.0, 8.0, 12.0, 13.0, 25.0, 27.0, 45.0, 52.0, 91.0, 150.0, 301.0, 509.0, 856.0, 1707.0, 3482.0, 8430.0, 23887.0, 120388.0, 3075996.0, 874112.0, 57190.0, 15466.0, 5876.0, 2707.0, 1342.0, 657.0, 378.0, 209.0, 128.0, 73.0, 55.0, 33.0, 24.0, 20.0, 10.0, 5.0, 4.0, 6.0, 4.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-39.5, -38.39697265625, -37.2939453125, -36.19091796875, -35.087890625, -33.98486328125, -32.8818359375, -31.77880859375, -30.67578125, -29.57275390625, -28.4697265625, -27.36669921875, -26.263671875, -25.16064453125, -24.0576171875, -22.95458984375, -21.8515625, -20.74853515625, -19.6455078125, -18.54248046875, -17.439453125, -16.33642578125, -15.2333984375, -14.13037109375, -13.02734375, -11.92431640625, -10.8212890625, -9.71826171875, -8.615234375, -7.51220703125, -6.4091796875, -5.30615234375, -4.203125, -3.10009765625, -1.9970703125, -0.89404296875, 0.208984375, 1.31201171875, 2.4150390625, 3.51806640625, 4.62109375, 5.72412109375, 6.8271484375, 7.93017578125, 9.033203125, 10.13623046875, 11.2392578125, 12.34228515625, 13.4453125, 14.54833984375, 15.6513671875, 16.75439453125, 17.857421875, 18.96044921875, 20.0634765625, 21.16650390625, 22.26953125, 23.37255859375, 24.4755859375, 25.57861328125, 26.681640625, 27.78466796875, 28.8876953125, 29.99072265625, 31.09375]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 51.0, 601.0, 347.0, 17.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-474.36749267578125, -457.90960693359375, -441.4517517089844, -424.993896484375, -408.5360107421875, -392.078125, -375.6202697753906, -359.16241455078125, -342.70452880859375, -326.24664306640625, -309.7887878417969, -293.3309326171875, -276.873046875, -260.4151611328125, -243.95730590820312, -227.4994354248047, -211.04156494140625, -194.5836944580078, -178.12582397460938, -161.66795349121094, -145.2100830078125, -128.75221252441406, -112.29434204101562, -95.83647155761719, -79.37860107421875, -62.92073059082031, -46.462860107421875, -30.004989624023438, -13.547119140625, 2.9107513427734375, 19.368621826171875, 35.82649230957031, 52.284423828125, 68.74229431152344, 85.20016479492188, 101.65803527832031, 118.11590576171875, 134.5737762451172, 151.03164672851562, 167.48951721191406, 183.9473876953125, 200.40525817871094, 216.86312866210938, 233.3209991455078, 249.77886962890625, 266.23675537109375, 282.6946105957031, 299.1524658203125, 315.6103515625, 332.0682373046875, 348.5260925292969, 364.98394775390625, 381.44183349609375, 397.89971923828125, 414.3575744628906, 430.8154296875, 447.2733154296875, 463.731201171875, 480.1890563964844, 496.64691162109375, 513.1047973632812, 529.5626831054688, 546.0205078125, 562.4783935546875, 578.936279296875]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 9.0, 2.0, 4.0, 5.0, 7.0, 6.0, 12.0, 16.0, 21.0, 14.0, 18.0, 25.0, 26.0, 32.0, 20.0, 27.0, 32.0, 35.0, 40.0, 35.0, 33.0, 40.0, 38.0, 36.0, 36.0, 36.0, 31.0, 37.0, 29.0, 32.0, 28.0, 25.0, 22.0, 27.0, 28.0, 27.0, 22.0, 20.0, 9.0, 11.0, 10.0, 12.0, 6.0, 6.0, 2.0, 3.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0], "bins": [-44.56242370605469, -43.203861236572266, -41.845298767089844, -40.48674011230469, -39.128177642822266, -37.769615173339844, -36.41105270385742, -35.052490234375, -33.693931579589844, -32.33536911010742, -30.976808547973633, -29.61824607849121, -28.259685516357422, -26.901123046875, -25.542560577392578, -24.183998107910156, -22.825435638427734, -21.466873168945312, -20.108312606811523, -18.7497501373291, -17.391189575195312, -16.03262710571289, -14.674064636230469, -13.315503120422363, -11.956941604614258, -10.598380088806152, -9.239818572998047, -7.881256103515625, -6.5226945877075195, -5.164133071899414, -3.805570602416992, -2.4470090866088867, -1.0884513854980469, 0.2701103687286377, 1.6286721229553223, 2.987234115600586, 4.345795631408691, 5.704357147216797, 7.062919616699219, 8.421481132507324, 9.78004264831543, 11.138604164123535, 12.49716567993164, 13.855728149414062, 15.214289665222168, 16.572851181030273, 17.931413650512695, 19.289974212646484, 20.648536682128906, 22.007099151611328, 23.365659713745117, 24.72422218322754, 26.082782745361328, 27.44134521484375, 28.799907684326172, 30.158470153808594, 31.517030715942383, 32.87559127807617, 34.234153747558594, 35.592716217041016, 36.95127868652344, 38.309837341308594, 39.66840362548828, 41.02696228027344, 42.38552474975586]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 4.0, 3.0, 4.0, 7.0, 8.0, 7.0, 13.0, 12.0, 15.0, 15.0, 14.0, 22.0, 23.0, 30.0, 48.0, 27.0, 30.0, 29.0, 30.0, 38.0, 34.0, 43.0, 32.0, 44.0, 39.0, 43.0, 38.0, 42.0, 39.0, 30.0, 31.0, 29.0, 17.0, 23.0, 27.0, 17.0, 11.0, 12.0, 15.0, 14.0, 5.0, 6.0, 9.0, 5.0, 1.0, 9.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0], "bins": [-8.09375, -7.85595703125, -7.6181640625, -7.38037109375, -7.142578125, -6.90478515625, -6.6669921875, -6.42919921875, -6.19140625, -5.95361328125, -5.7158203125, -5.47802734375, -5.240234375, -5.00244140625, -4.7646484375, -4.52685546875, -4.2890625, -4.05126953125, -3.8134765625, -3.57568359375, -3.337890625, -3.10009765625, -2.8623046875, -2.62451171875, -2.38671875, -2.14892578125, -1.9111328125, -1.67333984375, -1.435546875, -1.19775390625, -0.9599609375, -0.72216796875, -0.484375, -0.24658203125, -0.0087890625, 0.22900390625, 0.466796875, 0.70458984375, 0.9423828125, 1.18017578125, 1.41796875, 1.65576171875, 1.8935546875, 2.13134765625, 2.369140625, 2.60693359375, 2.8447265625, 3.08251953125, 3.3203125, 3.55810546875, 3.7958984375, 4.03369140625, 4.271484375, 4.50927734375, 4.7470703125, 4.98486328125, 5.22265625, 5.46044921875, 5.6982421875, 5.93603515625, 6.173828125, 6.41162109375, 6.6494140625, 6.88720703125, 7.125]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 5.0, 5.0, 5.0, 18.0, 24.0, 32.0, 50.0, 83.0, 104.0, 139.0, 235.0, 273.0, 452.0, 615.0, 925.0, 1346.0, 1996.0, 2825.0, 4116.0, 5930.0, 8840.0, 13058.0, 19632.0, 30480.0, 47018.0, 72825.0, 111332.0, 160452.0, 176452.0, 132756.0, 88836.0, 57535.0, 36998.0, 24132.0, 15899.0, 10493.0, 7139.0, 4813.0, 3269.0, 2327.0, 1540.0, 1112.0, 733.0, 532.0, 377.0, 252.0, 184.0, 135.0, 77.0, 64.0, 32.0, 15.0, 18.0, 12.0, 11.0, 4.0, 4.0, 2.0, 2.0, 1.0], "bins": [-0.76171875, -0.7380828857421875, -0.714447021484375, -0.6908111572265625, -0.66717529296875, -0.6435394287109375, -0.619903564453125, -0.5962677001953125, -0.5726318359375, -0.5489959716796875, -0.525360107421875, -0.5017242431640625, -0.47808837890625, -0.4544525146484375, -0.430816650390625, -0.4071807861328125, -0.383544921875, -0.3599090576171875, -0.336273193359375, -0.3126373291015625, -0.28900146484375, -0.2653656005859375, -0.241729736328125, -0.2180938720703125, -0.1944580078125, -0.1708221435546875, -0.147186279296875, -0.1235504150390625, -0.09991455078125, -0.0762786865234375, -0.052642822265625, -0.0290069580078125, -0.00537109375, 0.0182647705078125, 0.041900634765625, 0.0655364990234375, 0.08917236328125, 0.1128082275390625, 0.136444091796875, 0.1600799560546875, 0.1837158203125, 0.2073516845703125, 0.230987548828125, 0.2546234130859375, 0.27825927734375, 0.3018951416015625, 0.325531005859375, 0.3491668701171875, 0.372802734375, 0.3964385986328125, 0.420074462890625, 0.4437103271484375, 0.46734619140625, 0.4909820556640625, 0.514617919921875, 0.5382537841796875, 0.5618896484375, 0.5855255126953125, 0.609161376953125, 0.6327972412109375, 0.65643310546875, 0.6800689697265625, 0.703704833984375, 0.7273406982421875, 0.7509765625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 1.0, 4.0, 5.0, 9.0, 11.0, 4.0, 10.0, 19.0, 27.0, 21.0, 26.0, 29.0, 29.0, 32.0, 39.0, 37.0, 24.0, 31.0, 44.0, 54.0, 1061.0, 38.0, 57.0, 40.0, 42.0, 42.0, 37.0, 29.0, 28.0, 31.0, 33.0, 26.0, 19.0, 11.0, 16.0, 10.0, 11.0, 9.0, 5.0, 11.0, 8.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.4609375, -5.2918701171875, -5.122802734375, -4.9537353515625, -4.78466796875, -4.6156005859375, -4.446533203125, -4.2774658203125, -4.1083984375, -3.9393310546875, -3.770263671875, -3.6011962890625, -3.43212890625, -3.2630615234375, -3.093994140625, -2.9249267578125, -2.755859375, -2.5867919921875, -2.417724609375, -2.2486572265625, -2.07958984375, -1.9105224609375, -1.741455078125, -1.5723876953125, -1.4033203125, -1.2342529296875, -1.065185546875, -0.8961181640625, -0.72705078125, -0.5579833984375, -0.388916015625, -0.2198486328125, -0.05078125, 0.1182861328125, 0.287353515625, 0.4564208984375, 0.62548828125, 0.7945556640625, 0.963623046875, 1.1326904296875, 1.3017578125, 1.4708251953125, 1.639892578125, 1.8089599609375, 1.97802734375, 2.1470947265625, 2.316162109375, 2.4852294921875, 2.654296875, 2.8233642578125, 2.992431640625, 3.1614990234375, 3.33056640625, 3.4996337890625, 3.668701171875, 3.8377685546875, 4.0068359375, 4.1759033203125, 4.344970703125, 4.5140380859375, 4.68310546875, 4.8521728515625, 5.021240234375, 5.1903076171875, 5.359375]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 13.0, 13.0, 27.0, 36.0, 52.0, 75.0, 117.0, 188.0, 292.0, 364.0, 554.0, 788.0, 1188.0, 1711.0, 2536.0, 3675.0, 5498.0, 8106.0, 11951.0, 17836.0, 26951.0, 40900.0, 64203.0, 97516.0, 139494.0, 1214596.0, 148370.0, 105729.0, 69951.0, 45217.0, 29492.0, 19232.0, 12999.0, 8740.0, 5855.0, 4079.0, 2743.0, 1876.0, 1314.0, 884.0, 641.0, 442.0, 302.0, 199.0, 129.0, 95.0, 65.0, 37.0, 27.0, 18.0, 8.0, 7.0, 4.0, 2.0, 1.0, 1.0], "bins": [-0.55224609375, -0.5358123779296875, -0.519378662109375, -0.5029449462890625, -0.48651123046875, -0.4700775146484375, -0.453643798828125, -0.4372100830078125, -0.4207763671875, -0.4043426513671875, -0.387908935546875, -0.3714752197265625, -0.35504150390625, -0.3386077880859375, -0.322174072265625, -0.3057403564453125, -0.289306640625, -0.2728729248046875, -0.256439208984375, -0.2400054931640625, -0.22357177734375, -0.2071380615234375, -0.190704345703125, -0.1742706298828125, -0.1578369140625, -0.1414031982421875, -0.124969482421875, -0.1085357666015625, -0.09210205078125, -0.0756683349609375, -0.059234619140625, -0.0428009033203125, -0.0263671875, -0.0099334716796875, 0.006500244140625, 0.0229339599609375, 0.03936767578125, 0.0558013916015625, 0.072235107421875, 0.0886688232421875, 0.1051025390625, 0.1215362548828125, 0.137969970703125, 0.1544036865234375, 0.17083740234375, 0.1872711181640625, 0.203704833984375, 0.2201385498046875, 0.236572265625, 0.2530059814453125, 0.269439697265625, 0.2858734130859375, 0.30230712890625, 0.3187408447265625, 0.335174560546875, 0.3516082763671875, 0.3680419921875, 0.3844757080078125, 0.400909423828125, 0.4173431396484375, 0.43377685546875, 0.4502105712890625, 0.466644287109375, 0.4830780029296875, 0.49951171875]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 9.0, 3.0, 13.0, 5.0, 11.0, 33.0, 45.0, 43.0, 51.0, 77.0, 123.0, 158.0, 120.0, 57.0, 60.0, 40.0, 34.0, 19.0, 20.0, 14.0, 5.0, 12.0, 8.0, 8.0, 8.0, 8.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.019805908203125, -0.019127368927001953, -0.018448829650878906, -0.01777029037475586, -0.017091751098632812, -0.016413211822509766, -0.01573467254638672, -0.015056133270263672, -0.014377593994140625, -0.013699054718017578, -0.013020515441894531, -0.012341976165771484, -0.011663436889648438, -0.01098489761352539, -0.010306358337402344, -0.009627819061279297, -0.00894927978515625, -0.008270740509033203, -0.007592201232910156, -0.006913661956787109, -0.0062351226806640625, -0.005556583404541016, -0.004878044128417969, -0.004199504852294922, -0.003520965576171875, -0.002842426300048828, -0.0021638870239257812, -0.0014853477478027344, -0.0008068084716796875, -0.00012826919555664062, 0.0005502700805664062, 0.0012288093566894531, 0.0019073486328125, 0.002585887908935547, 0.0032644271850585938, 0.003942966461181641, 0.0046215057373046875, 0.005300045013427734, 0.005978584289550781, 0.006657123565673828, 0.007335662841796875, 0.008014202117919922, 0.008692741394042969, 0.009371280670166016, 0.010049819946289062, 0.01072835922241211, 0.011406898498535156, 0.012085437774658203, 0.01276397705078125, 0.013442516326904297, 0.014121055603027344, 0.01479959487915039, 0.015478134155273438, 0.016156673431396484, 0.01683521270751953, 0.017513751983642578, 0.018192291259765625, 0.018870830535888672, 0.01954936981201172, 0.020227909088134766, 0.020906448364257812, 0.02158498764038086, 0.022263526916503906, 0.022942066192626953, 0.02362060546875]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 10.0, 6.0, 6.0, 12.0, 10.0, 10.0, 11.0, 25.0, 28.0, 43.0, 58.0, 113.0, 123.0, 256.0, 1261.0, 991342.0, 54168.0, 569.0, 175.0, 94.0, 86.0, 50.0, 24.0, 9.0, 14.0, 6.0, 10.0, 13.0, 7.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.5380859375, -0.52264404296875, -0.5072021484375, -0.49176025390625, -0.476318359375, -0.46087646484375, -0.4454345703125, -0.42999267578125, -0.41455078125, -0.39910888671875, -0.3836669921875, -0.36822509765625, -0.352783203125, -0.33734130859375, -0.3218994140625, -0.30645751953125, -0.291015625, -0.27557373046875, -0.2601318359375, -0.24468994140625, -0.229248046875, -0.21380615234375, -0.1983642578125, -0.18292236328125, -0.16748046875, -0.15203857421875, -0.1365966796875, -0.12115478515625, -0.105712890625, -0.09027099609375, -0.0748291015625, -0.05938720703125, -0.0439453125, -0.02850341796875, -0.0130615234375, 0.00238037109375, 0.017822265625, 0.03326416015625, 0.0487060546875, 0.06414794921875, 0.07958984375, 0.09503173828125, 0.1104736328125, 0.12591552734375, 0.141357421875, 0.15679931640625, 0.1722412109375, 0.18768310546875, 0.203125, 0.21856689453125, 0.2340087890625, 0.24945068359375, 0.264892578125, 0.28033447265625, 0.2957763671875, 0.31121826171875, 0.32666015625, 0.34210205078125, 0.3575439453125, 0.37298583984375, 0.388427734375, 0.40386962890625, 0.4193115234375, 0.43475341796875, 0.4501953125]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 8.0, 18.0, 32.0, 106.0, 285.0, 384.0, 117.0, 36.0, 20.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07168031483888626, -0.06975238770246506, -0.06782446056604385, -0.06589654088020325, -0.06396861374378204, -0.06204068660736084, -0.060112759470939636, -0.05818483605980873, -0.056256912648677826, -0.05432898551225662, -0.05240106210112572, -0.050473134964704514, -0.04854521155357361, -0.046617284417152405, -0.0446893572807312, -0.042761433869600296, -0.04083350673317909, -0.03890557959675789, -0.036977656185626984, -0.03504972904920578, -0.033121805638074875, -0.03119387850165367, -0.029265953227877617, -0.027338027954101562, -0.025410102680325508, -0.023482177406549454, -0.0215542521327734, -0.019626326858997345, -0.01769839972257614, -0.015770476311445236, -0.013842549175024033, -0.011914623901247978, -0.009986694902181625, -0.008058769628405571, -0.006130843888968229, -0.004202918149530888, -0.0022749928757548332, -0.00034706760197877884, 0.0015808586031198502, 0.0035087838768959045, 0.005436709150671959, 0.007364634424448013, 0.009292559698224068, 0.011220485903322697, 0.013148411177098751, 0.015076336450874805, 0.017004262655973434, 0.01893218792974949, 0.020860113203525543, 0.022788038477301598, 0.024715963751077652, 0.026643890887498856, 0.02857181429862976, 0.030499741435050964, 0.03242766857147217, 0.03435559198260307, 0.03628351539373398, 0.03821144253015518, 0.04013936594128609, 0.04206729307770729, 0.043995216488838196, 0.0459231436252594, 0.0478510707616806, 0.04977899417281151, 0.05170692130923271]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 7.0, 14.0, 16.0, 21.0, 21.0, 30.0, 20.0, 27.0, 31.0, 40.0, 46.0, 45.0, 49.0, 47.0, 46.0, 56.0, 55.0, 39.0, 45.0, 49.0, 47.0, 42.0, 26.0, 37.0, 24.0, 20.0, 23.0, 18.0, 10.0, 19.0, 8.0, 4.0, 4.0, 3.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.02317988872528076, -0.022519852966070175, -0.02185981720685959, -0.021199781447649002, -0.020539745688438416, -0.01987970992922783, -0.019219674170017242, -0.018559638410806656, -0.01789960265159607, -0.017239566892385483, -0.016579531133174896, -0.01591949537396431, -0.015259459614753723, -0.014599423855543137, -0.01393938809633255, -0.013279352337121964, -0.012619316577911377, -0.01195928081870079, -0.011299245059490204, -0.010639209300279617, -0.00997917354106903, -0.009319137781858444, -0.008659102022647858, -0.007999066263437271, -0.007339030504226685, -0.006678994745016098, -0.0060189589858055115, -0.005358923226594925, -0.004698887467384338, -0.004038851708173752, -0.0033788159489631653, -0.0027187801897525787, -0.002058744430541992, -0.0013987086713314056, -0.0007386729121208191, -7.863715291023254e-05, 0.000581398606300354, 0.0012414343655109406, 0.001901470124721527, 0.0025615058839321136, 0.0032215416431427, 0.0038815774023532867, 0.004541613161563873, 0.00520164892077446, 0.005861684679985046, 0.006521720439195633, 0.0071817561984062195, 0.007841791957616806, 0.008501827716827393, 0.009161863476037979, 0.009821899235248566, 0.010481934994459152, 0.011141970753669739, 0.011802006512880325, 0.012462042272090912, 0.013122078031301498, 0.013782113790512085, 0.014442149549722672, 0.015102185308933258, 0.015762221068143845, 0.01642225682735443, 0.017082292586565018, 0.017742328345775604, 0.01840236410498619, 0.019062399864196777]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 4.0, 3.0, 4.0, 7.0, 8.0, 7.0, 13.0, 12.0, 15.0, 15.0, 14.0, 22.0, 23.0, 30.0, 48.0, 27.0, 30.0, 29.0, 30.0, 38.0, 34.0, 42.0, 33.0, 44.0, 39.0, 43.0, 38.0, 42.0, 39.0, 30.0, 31.0, 29.0, 17.0, 23.0, 26.0, 18.0, 11.0, 12.0, 15.0, 14.0, 5.0, 6.0, 9.0, 5.0, 1.0, 9.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0], "bins": [-8.09375, -7.85595703125, -7.6181640625, -7.38037109375, -7.142578125, -6.90478515625, -6.6669921875, -6.42919921875, -6.19140625, -5.95361328125, -5.7158203125, -5.47802734375, -5.240234375, -5.00244140625, -4.7646484375, -4.52685546875, -4.2890625, -4.05126953125, -3.8134765625, -3.57568359375, -3.337890625, -3.10009765625, -2.8623046875, -2.62451171875, -2.38671875, -2.14892578125, -1.9111328125, -1.67333984375, -1.435546875, -1.19775390625, -0.9599609375, -0.72216796875, -0.484375, -0.24658203125, -0.0087890625, 0.22900390625, 0.466796875, 0.70458984375, 0.9423828125, 1.18017578125, 1.41796875, 1.65576171875, 1.8935546875, 2.13134765625, 2.369140625, 2.60693359375, 2.8447265625, 3.08251953125, 3.3203125, 3.55810546875, 3.7958984375, 4.03369140625, 4.271484375, 4.50927734375, 4.7470703125, 4.98486328125, 5.22265625, 5.46044921875, 5.6982421875, 5.93603515625, 6.173828125, 6.41162109375, 6.6494140625, 6.88720703125, 7.125]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 3.0, 6.0, 7.0, 9.0, 22.0, 17.0, 34.0, 34.0, 43.0, 61.0, 98.0, 130.0, 168.0, 261.0, 347.0, 528.0, 758.0, 1167.0, 1771.0, 2981.0, 5403.0, 10876.0, 26273.0, 75408.0, 301095.0, 450361.0, 105978.0, 34754.0, 13785.0, 6487.0, 3536.0, 2025.0, 1311.0, 800.0, 608.0, 398.0, 286.0, 212.0, 153.0, 100.0, 78.0, 58.0, 34.0, 30.0, 22.0, 16.0, 16.0, 8.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.390625, -10.999755859375, -10.60888671875, -10.218017578125, -9.8271484375, -9.436279296875, -9.04541015625, -8.654541015625, -8.263671875, -7.872802734375, -7.48193359375, -7.091064453125, -6.7001953125, -6.309326171875, -5.91845703125, -5.527587890625, -5.13671875, -4.745849609375, -4.35498046875, -3.964111328125, -3.5732421875, -3.182373046875, -2.79150390625, -2.400634765625, -2.009765625, -1.618896484375, -1.22802734375, -0.837158203125, -0.4462890625, -0.055419921875, 0.33544921875, 0.726318359375, 1.1171875, 1.508056640625, 1.89892578125, 2.289794921875, 2.6806640625, 3.071533203125, 3.46240234375, 3.853271484375, 4.244140625, 4.635009765625, 5.02587890625, 5.416748046875, 5.8076171875, 6.198486328125, 6.58935546875, 6.980224609375, 7.37109375, 7.761962890625, 8.15283203125, 8.543701171875, 8.9345703125, 9.325439453125, 9.71630859375, 10.107177734375, 10.498046875, 10.888916015625, 11.27978515625, 11.670654296875, 12.0615234375, 12.452392578125, 12.84326171875, 13.234130859375, 13.625]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 6.0, 4.0, 3.0, 5.0, 7.0, 4.0, 9.0, 9.0, 15.0, 14.0, 10.0, 11.0, 17.0, 19.0, 32.0, 35.0, 27.0, 40.0, 43.0, 47.0, 45.0, 85.0, 154.0, 1458.0, 322.0, 129.0, 76.0, 50.0, 51.0, 40.0, 38.0, 37.0, 29.0, 34.0, 24.0, 19.0, 19.0, 10.0, 14.0, 12.0, 8.0, 9.0, 6.0, 7.0, 5.0, 6.0, 2.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0], "bins": [-21.234375, -20.54833984375, -19.8623046875, -19.17626953125, -18.490234375, -17.80419921875, -17.1181640625, -16.43212890625, -15.74609375, -15.06005859375, -14.3740234375, -13.68798828125, -13.001953125, -12.31591796875, -11.6298828125, -10.94384765625, -10.2578125, -9.57177734375, -8.8857421875, -8.19970703125, -7.513671875, -6.82763671875, -6.1416015625, -5.45556640625, -4.76953125, -4.08349609375, -3.3974609375, -2.71142578125, -2.025390625, -1.33935546875, -0.6533203125, 0.03271484375, 0.71875, 1.40478515625, 2.0908203125, 2.77685546875, 3.462890625, 4.14892578125, 4.8349609375, 5.52099609375, 6.20703125, 6.89306640625, 7.5791015625, 8.26513671875, 8.951171875, 9.63720703125, 10.3232421875, 11.00927734375, 11.6953125, 12.38134765625, 13.0673828125, 13.75341796875, 14.439453125, 15.12548828125, 15.8115234375, 16.49755859375, 17.18359375, 17.86962890625, 18.5556640625, 19.24169921875, 19.927734375, 20.61376953125, 21.2998046875, 21.98583984375, 22.671875]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 16.0, 10.0, 15.0, 29.0, 41.0, 56.0, 93.0, 164.0, 356.0, 884.0, 3921.0, 59456.0, 3000631.0, 74052.0, 4266.0, 897.0, 371.0, 149.0, 97.0, 68.0, 43.0, 19.0, 29.0, 11.0, 10.0, 4.0, 5.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-58.9375, -57.23046875, -55.5234375, -53.81640625, -52.109375, -50.40234375, -48.6953125, -46.98828125, -45.28125, -43.57421875, -41.8671875, -40.16015625, -38.453125, -36.74609375, -35.0390625, -33.33203125, -31.625, -29.91796875, -28.2109375, -26.50390625, -24.796875, -23.08984375, -21.3828125, -19.67578125, -17.96875, -16.26171875, -14.5546875, -12.84765625, -11.140625, -9.43359375, -7.7265625, -6.01953125, -4.3125, -2.60546875, -0.8984375, 0.80859375, 2.515625, 4.22265625, 5.9296875, 7.63671875, 9.34375, 11.05078125, 12.7578125, 14.46484375, 16.171875, 17.87890625, 19.5859375, 21.29296875, 23.0, 24.70703125, 26.4140625, 28.12109375, 29.828125, 31.53515625, 33.2421875, 34.94921875, 36.65625, 38.36328125, 40.0703125, 41.77734375, 43.484375, 45.19140625, 46.8984375, 48.60546875, 50.3125]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 11.0, 249.0, 640.0, 109.0, 8.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.90864562988281, -50.050357818603516, -43.19207000732422, -36.33378219604492, -29.475494384765625, -22.617206573486328, -15.758918762207031, -8.900630950927734, -2.0423431396484375, 4.815944671630859, 11.674232482910156, 18.532520294189453, 25.39080810546875, 32.24909591674805, 39.107383728027344, 45.96567153930664, 52.82395935058594, 59.682247161865234, 66.54053497314453, 73.39881896972656, 80.25711059570312, 87.11540222167969, 93.97368621826172, 100.83197021484375, 107.69026184082031, 114.54855346679688, 121.4068374633789, 128.26512145996094, 135.1234130859375, 141.98170471191406, 148.83999633789062, 155.69827270507812, 162.55654907226562, 169.4148406982422, 176.27313232421875, 183.13140869140625, 189.9897003173828, 196.84799194335938, 203.70626831054688, 210.56455993652344, 217.4228515625, 224.28114318847656, 231.13943481445312, 237.99771118164062, 244.8560028076172, 251.71429443359375, 258.57257080078125, 265.4308776855469, 272.2891540527344, 279.1474304199219, 286.0057373046875, 292.864013671875, 299.7222900390625, 306.5805969238281, 313.4388732910156, 320.29718017578125, 327.15545654296875, 334.01373291015625, 340.8720397949219, 347.7303161621094, 354.588623046875, 361.4468994140625, 368.30517578125, 375.1634826660156, 382.0217590332031]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 2.0, 3.0, 7.0, 9.0, 5.0, 9.0, 5.0, 12.0, 18.0, 19.0, 15.0, 18.0, 33.0, 27.0, 48.0, 31.0, 39.0, 47.0, 54.0, 46.0, 45.0, 38.0, 51.0, 43.0, 53.0, 38.0, 31.0, 32.0, 35.0, 32.0, 24.0, 25.0, 17.0, 24.0, 16.0, 11.0, 11.0, 7.0, 9.0, 6.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.00137710571289, -51.068233489990234, -49.13508987426758, -47.20195007324219, -45.26880645751953, -43.335662841796875, -41.40251922607422, -39.46937561035156, -37.536231994628906, -35.60308837890625, -33.669944763183594, -31.73680305480957, -29.803661346435547, -27.87051773071289, -25.937374114990234, -24.004230499267578, -22.071090698242188, -20.13794708251953, -18.204805374145508, -16.27166175842285, -14.338519096374512, -12.405376434326172, -10.472232818603516, -8.539090156555176, -6.605947494506836, -4.672804832458496, -2.739661693572998, -0.8065185546875, 1.1266241073608398, 3.0597667694091797, 4.992910385131836, 6.926053047180176, 8.85919189453125, 10.79233455657959, 12.72547721862793, 14.658620834350586, 16.59176254272461, 18.524906158447266, 20.458049774169922, 22.391193389892578, 24.3243350982666, 26.257478713989258, 28.19062042236328, 30.123764038085938, 32.056907653808594, 33.99005126953125, 35.923194885253906, 37.8563346862793, 39.78947830200195, 41.72262191772461, 43.655765533447266, 45.588905334472656, 47.52204895019531, 49.45519256591797, 51.388336181640625, 53.32147979736328, 55.25462341308594, 57.187767028808594, 59.12091064453125, 61.054054260253906, 62.9871940612793, 64.92033386230469, 66.85348510742188, 68.78662109375, 70.71976470947266]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 8.0, 3.0, 6.0, 10.0, 4.0, 6.0, 13.0, 10.0, 10.0, 15.0, 13.0, 26.0, 22.0, 27.0, 23.0, 36.0, 30.0, 33.0, 36.0, 36.0, 33.0, 38.0, 32.0, 34.0, 34.0, 39.0, 43.0, 39.0, 38.0, 42.0, 30.0, 32.0, 26.0, 21.0, 20.0, 13.0, 17.0, 15.0, 15.0, 7.0, 14.0, 11.0, 10.0, 5.0, 3.0, 3.0, 9.0, 3.0, 2.0, 3.0, 1.0, 6.0, 0.0, 1.0, 3.0], "bins": [-7.56640625, -7.3345947265625, -7.102783203125, -6.8709716796875, -6.63916015625, -6.4073486328125, -6.175537109375, -5.9437255859375, -5.7119140625, -5.4801025390625, -5.248291015625, -5.0164794921875, -4.78466796875, -4.5528564453125, -4.321044921875, -4.0892333984375, -3.857421875, -3.6256103515625, -3.393798828125, -3.1619873046875, -2.93017578125, -2.6983642578125, -2.466552734375, -2.2347412109375, -2.0029296875, -1.7711181640625, -1.539306640625, -1.3074951171875, -1.07568359375, -0.8438720703125, -0.612060546875, -0.3802490234375, -0.1484375, 0.0833740234375, 0.315185546875, 0.5469970703125, 0.77880859375, 1.0106201171875, 1.242431640625, 1.4742431640625, 1.7060546875, 1.9378662109375, 2.169677734375, 2.4014892578125, 2.63330078125, 2.8651123046875, 3.096923828125, 3.3287353515625, 3.560546875, 3.7923583984375, 4.024169921875, 4.2559814453125, 4.48779296875, 4.7196044921875, 4.951416015625, 5.1832275390625, 5.4150390625, 5.6468505859375, 5.878662109375, 6.1104736328125, 6.34228515625, 6.5740966796875, 6.805908203125, 7.0377197265625, 7.26953125]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 14.0, 5.0, 14.0, 29.0, 38.0, 58.0, 65.0, 107.0, 144.0, 194.0, 230.0, 351.0, 518.0, 750.0, 1201.0, 1737.0, 2614.0, 4209.0, 7273.0, 14554.0, 43590.0, 320458.0, 2506664.0, 1123498.0, 116027.0, 24461.0, 10410.0, 5635.0, 3239.0, 1958.0, 1338.0, 897.0, 611.0, 418.0, 282.0, 182.0, 134.0, 105.0, 67.0, 56.0, 47.0, 27.0, 20.0, 20.0, 18.0, 7.0, 4.0, 3.0, 3.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.109375, -14.565185546875, -14.02099609375, -13.476806640625, -12.9326171875, -12.388427734375, -11.84423828125, -11.300048828125, -10.755859375, -10.211669921875, -9.66748046875, -9.123291015625, -8.5791015625, -8.034912109375, -7.49072265625, -6.946533203125, -6.40234375, -5.858154296875, -5.31396484375, -4.769775390625, -4.2255859375, -3.681396484375, -3.13720703125, -2.593017578125, -2.048828125, -1.504638671875, -0.96044921875, -0.416259765625, 0.1279296875, 0.672119140625, 1.21630859375, 1.760498046875, 2.3046875, 2.848876953125, 3.39306640625, 3.937255859375, 4.4814453125, 5.025634765625, 5.56982421875, 6.114013671875, 6.658203125, 7.202392578125, 7.74658203125, 8.290771484375, 8.8349609375, 9.379150390625, 9.92333984375, 10.467529296875, 11.01171875, 11.555908203125, 12.10009765625, 12.644287109375, 13.1884765625, 13.732666015625, 14.27685546875, 14.821044921875, 15.365234375, 15.909423828125, 16.45361328125, 16.997802734375, 17.5419921875, 18.086181640625, 18.63037109375, 19.174560546875, 19.71875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 4.0, 1.0, 5.0, 12.0, 6.0, 12.0, 4.0, 16.0, 8.0, 15.0, 26.0, 28.0, 30.0, 33.0, 71.0, 94.0, 129.0, 235.0, 367.0, 625.0, 700.0, 590.0, 394.0, 224.0, 148.0, 78.0, 48.0, 42.0, 34.0, 29.0, 10.0, 6.0, 11.0, 4.0, 6.0, 9.0, 2.0, 4.0, 4.0, 1.0, 2.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-15.65625, -15.1591796875, -14.662109375, -14.1650390625, -13.66796875, -13.1708984375, -12.673828125, -12.1767578125, -11.6796875, -11.1826171875, -10.685546875, -10.1884765625, -9.69140625, -9.1943359375, -8.697265625, -8.2001953125, -7.703125, -7.2060546875, -6.708984375, -6.2119140625, -5.71484375, -5.2177734375, -4.720703125, -4.2236328125, -3.7265625, -3.2294921875, -2.732421875, -2.2353515625, -1.73828125, -1.2412109375, -0.744140625, -0.2470703125, 0.25, 0.7470703125, 1.244140625, 1.7412109375, 2.23828125, 2.7353515625, 3.232421875, 3.7294921875, 4.2265625, 4.7236328125, 5.220703125, 5.7177734375, 6.21484375, 6.7119140625, 7.208984375, 7.7060546875, 8.203125, 8.7001953125, 9.197265625, 9.6943359375, 10.19140625, 10.6884765625, 11.185546875, 11.6826171875, 12.1796875, 12.6767578125, 13.173828125, 13.6708984375, 14.16796875, 14.6650390625, 15.162109375, 15.6591796875, 16.15625]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 7.0, 4.0, 5.0, 12.0, 9.0, 19.0, 18.0, 22.0, 40.0, 56.0, 81.0, 93.0, 134.0, 189.0, 304.0, 412.0, 540.0, 857.0, 1332.0, 1923.0, 3000.0, 4633.0, 7712.0, 13368.0, 26342.0, 67700.0, 300590.0, 2483759.0, 1049262.0, 143220.0, 42768.0, 18761.0, 9863.0, 6054.0, 3778.0, 2434.0, 1585.0, 1012.0, 719.0, 487.0, 348.0, 231.0, 179.0, 117.0, 72.0, 76.0, 51.0, 29.0, 26.0, 16.0, 15.0, 8.0, 4.0, 11.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-18.3125, -17.736328125, -17.16015625, -16.583984375, -16.0078125, -15.431640625, -14.85546875, -14.279296875, -13.703125, -13.126953125, -12.55078125, -11.974609375, -11.3984375, -10.822265625, -10.24609375, -9.669921875, -9.09375, -8.517578125, -7.94140625, -7.365234375, -6.7890625, -6.212890625, -5.63671875, -5.060546875, -4.484375, -3.908203125, -3.33203125, -2.755859375, -2.1796875, -1.603515625, -1.02734375, -0.451171875, 0.125, 0.701171875, 1.27734375, 1.853515625, 2.4296875, 3.005859375, 3.58203125, 4.158203125, 4.734375, 5.310546875, 5.88671875, 6.462890625, 7.0390625, 7.615234375, 8.19140625, 8.767578125, 9.34375, 9.919921875, 10.49609375, 11.072265625, 11.6484375, 12.224609375, 12.80078125, 13.376953125, 13.953125, 14.529296875, 15.10546875, 15.681640625, 16.2578125, 16.833984375, 17.41015625, 17.986328125, 18.5625]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 11.0, 18.0, 44.0, 168.0, 374.0, 257.0, 94.0, 26.0, 10.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-202.83030700683594, -196.44622802734375, -190.0621337890625, -183.6780548095703, -177.29397583007812, -170.90988159179688, -164.5258026123047, -158.1417236328125, -151.75762939453125, -145.37355041503906, -138.9894561767578, -132.60537719726562, -126.2212905883789, -119.83720397949219, -113.453125, -107.06903839111328, -100.6849594116211, -94.30087280273438, -87.91679382324219, -81.53270721435547, -75.14862060546875, -68.76454162597656, -62.380455017089844, -55.996368408203125, -49.61228561401367, -43.22820281982422, -36.8441162109375, -30.460033416748047, -24.07594871520996, -17.691864013671875, -11.307781219482422, -4.923694610595703, 1.46038818359375, 7.844472408294678, 14.228556632995605, 20.612640380859375, 26.99672508239746, 33.38080978393555, 39.764892578125, 46.14897918701172, 52.53306198120117, 58.917144775390625, 65.30123138427734, 71.68531799316406, 78.06939697265625, 84.45348358154297, 90.83757019042969, 97.22164916992188, 103.6057357788086, 109.98982238769531, 116.3739013671875, 122.75798797607422, 129.14207458496094, 135.52615356445312, 141.91024780273438, 148.29432678222656, 154.67840576171875, 161.06248474121094, 167.4465789794922, 173.83065795898438, 180.21473693847656, 186.5988311767578, 192.98291015625, 199.36700439453125, 205.75108337402344]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 5.0, 7.0, 4.0, 6.0, 6.0, 8.0, 14.0, 9.0, 12.0, 17.0, 14.0, 23.0, 25.0, 26.0, 26.0, 29.0, 33.0, 33.0, 46.0, 40.0, 34.0, 55.0, 37.0, 36.0, 43.0, 40.0, 46.0, 35.0, 40.0, 34.0, 28.0, 36.0, 18.0, 24.0, 25.0, 21.0, 11.0, 13.0, 10.0, 7.0, 5.0, 8.0, 3.0, 4.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0], "bins": [-58.242889404296875, -56.551963806152344, -54.86104202270508, -53.17011642456055, -51.479190826416016, -49.78826904296875, -48.09734344482422, -46.40641784667969, -44.715492248535156, -43.024566650390625, -41.33364486694336, -39.64271926879883, -37.9517936706543, -36.26087188720703, -34.5699462890625, -32.87902069091797, -31.188098907470703, -29.497175216674805, -27.806249618530273, -26.115325927734375, -24.424400329589844, -22.733476638793945, -21.042552947998047, -19.351627349853516, -17.660703659057617, -15.969779014587402, -14.278854370117188, -12.587930679321289, -10.897006034851074, -9.20608139038086, -7.515157699584961, -5.824233055114746, -4.133308410644531, -2.4423840045928955, -0.7514595985412598, 0.9394645690917969, 2.6303892135620117, 4.321313858032227, 6.012237548828125, 7.70316219329834, 9.394086837768555, 11.08501148223877, 12.775936126708984, 14.466859817504883, 16.15778350830078, 17.848709106445312, 19.53963279724121, 21.23055648803711, 22.92148208618164, 24.61240577697754, 26.30333137512207, 27.99425506591797, 29.6851806640625, 31.3761043548584, 33.0670280456543, 34.75795364379883, 36.448875427246094, 38.139801025390625, 39.83072280883789, 41.52164840698242, 43.21257400512695, 44.90349578857422, 46.59442138671875, 48.28534698486328, 49.97627258300781]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 6.0, 1.0, 4.0, 7.0, 6.0, 5.0, 4.0, 13.0, 11.0, 14.0, 15.0, 24.0, 30.0, 22.0, 26.0, 18.0, 20.0, 29.0, 43.0, 32.0, 37.0, 43.0, 36.0, 42.0, 32.0, 41.0, 38.0, 39.0, 35.0, 32.0, 37.0, 32.0, 31.0, 22.0, 18.0, 32.0, 23.0, 14.0, 14.0, 12.0, 16.0, 10.0, 7.0, 11.0, 5.0, 4.0, 8.0, 3.0, 1.0, 5.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-8.0, -7.73876953125, -7.4775390625, -7.21630859375, -6.955078125, -6.69384765625, -6.4326171875, -6.17138671875, -5.91015625, -5.64892578125, -5.3876953125, -5.12646484375, -4.865234375, -4.60400390625, -4.3427734375, -4.08154296875, -3.8203125, -3.55908203125, -3.2978515625, -3.03662109375, -2.775390625, -2.51416015625, -2.2529296875, -1.99169921875, -1.73046875, -1.46923828125, -1.2080078125, -0.94677734375, -0.685546875, -0.42431640625, -0.1630859375, 0.09814453125, 0.359375, 0.62060546875, 0.8818359375, 1.14306640625, 1.404296875, 1.66552734375, 1.9267578125, 2.18798828125, 2.44921875, 2.71044921875, 2.9716796875, 3.23291015625, 3.494140625, 3.75537109375, 4.0166015625, 4.27783203125, 4.5390625, 4.80029296875, 5.0615234375, 5.32275390625, 5.583984375, 5.84521484375, 6.1064453125, 6.36767578125, 6.62890625, 6.89013671875, 7.1513671875, 7.41259765625, 7.673828125, 7.93505859375, 8.1962890625, 8.45751953125, 8.71875]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 17.0, 35.0, 23.0, 37.0, 60.0, 88.0, 141.0, 222.0, 295.0, 461.0, 705.0, 1022.0, 1571.0, 2418.0, 3492.0, 5059.0, 7827.0, 12034.0, 18059.0, 27853.0, 43539.0, 68164.0, 107490.0, 163204.0, 188080.0, 141310.0, 91236.0, 57510.0, 36736.0, 23747.0, 15430.0, 10277.0, 6643.0, 4600.0, 2993.0, 2015.0, 1414.0, 905.0, 583.0, 404.0, 265.0, 197.0, 136.0, 76.0, 69.0, 42.0, 23.0, 12.0, 15.0, 7.0, 2.0, 8.0, 5.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.849609375, -0.822479248046875, -0.79534912109375, -0.768218994140625, -0.7410888671875, -0.713958740234375, -0.68682861328125, -0.659698486328125, -0.632568359375, -0.605438232421875, -0.57830810546875, -0.551177978515625, -0.5240478515625, -0.496917724609375, -0.46978759765625, -0.442657470703125, -0.41552734375, -0.388397216796875, -0.36126708984375, -0.334136962890625, -0.3070068359375, -0.279876708984375, -0.25274658203125, -0.225616455078125, -0.198486328125, -0.171356201171875, -0.14422607421875, -0.117095947265625, -0.0899658203125, -0.062835693359375, -0.03570556640625, -0.008575439453125, 0.0185546875, 0.045684814453125, 0.07281494140625, 0.099945068359375, 0.1270751953125, 0.154205322265625, 0.18133544921875, 0.208465576171875, 0.235595703125, 0.262725830078125, 0.28985595703125, 0.316986083984375, 0.3441162109375, 0.371246337890625, 0.39837646484375, 0.425506591796875, 0.45263671875, 0.479766845703125, 0.50689697265625, 0.534027099609375, 0.5611572265625, 0.588287353515625, 0.61541748046875, 0.642547607421875, 0.669677734375, 0.696807861328125, 0.72393798828125, 0.751068115234375, 0.7781982421875, 0.805328369140625, 0.83245849609375, 0.859588623046875, 0.88671875]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 5.0, 0.0, 7.0, 6.0, 8.0, 15.0, 11.0, 13.0, 5.0, 26.0, 25.0, 19.0, 29.0, 25.0, 27.0, 41.0, 44.0, 50.0, 44.0, 50.0, 45.0, 1061.0, 42.0, 48.0, 51.0, 40.0, 36.0, 27.0, 33.0, 30.0, 27.0, 28.0, 22.0, 16.0, 20.0, 10.0, 10.0, 8.0, 8.0, 4.0, 12.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.53125, -6.34295654296875, -6.1546630859375, -5.96636962890625, -5.778076171875, -5.58978271484375, -5.4014892578125, -5.21319580078125, -5.02490234375, -4.83660888671875, -4.6483154296875, -4.46002197265625, -4.271728515625, -4.08343505859375, -3.8951416015625, -3.70684814453125, -3.5185546875, -3.33026123046875, -3.1419677734375, -2.95367431640625, -2.765380859375, -2.57708740234375, -2.3887939453125, -2.20050048828125, -2.01220703125, -1.82391357421875, -1.6356201171875, -1.44732666015625, -1.259033203125, -1.07073974609375, -0.8824462890625, -0.69415283203125, -0.505859375, -0.31756591796875, -0.1292724609375, 0.05902099609375, 0.247314453125, 0.43560791015625, 0.6239013671875, 0.81219482421875, 1.00048828125, 1.18878173828125, 1.3770751953125, 1.56536865234375, 1.753662109375, 1.94195556640625, 2.1302490234375, 2.31854248046875, 2.5068359375, 2.69512939453125, 2.8834228515625, 3.07171630859375, 3.260009765625, 3.44830322265625, 3.6365966796875, 3.82489013671875, 4.01318359375, 4.20147705078125, 4.3897705078125, 4.57806396484375, 4.766357421875, 4.95465087890625, 5.1429443359375, 5.33123779296875, 5.51953125]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 7.0, 4.0, 9.0, 20.0, 23.0, 24.0, 39.0, 51.0, 97.0, 149.0, 204.0, 286.0, 398.0, 499.0, 768.0, 1144.0, 1574.0, 2222.0, 3226.0, 4671.0, 6692.0, 9835.0, 14111.0, 21842.0, 33019.0, 51477.0, 82716.0, 128446.0, 1092886.0, 293341.0, 123222.0, 78757.0, 48826.0, 31606.0, 20623.0, 13895.0, 9386.0, 6394.0, 4391.0, 3062.0, 2117.0, 1501.0, 1072.0, 784.0, 545.0, 371.0, 225.0, 194.0, 136.0, 81.0, 64.0, 40.0, 26.0, 14.0, 10.0, 13.0, 4.0, 2.0, 4.0, 0.0, 1.0], "bins": [-0.583984375, -0.565704345703125, -0.54742431640625, -0.529144287109375, -0.5108642578125, -0.492584228515625, -0.47430419921875, -0.456024169921875, -0.437744140625, -0.419464111328125, -0.40118408203125, -0.382904052734375, -0.3646240234375, -0.346343994140625, -0.32806396484375, -0.309783935546875, -0.29150390625, -0.273223876953125, -0.25494384765625, -0.236663818359375, -0.2183837890625, -0.200103759765625, -0.18182373046875, -0.163543701171875, -0.145263671875, -0.126983642578125, -0.10870361328125, -0.090423583984375, -0.0721435546875, -0.053863525390625, -0.03558349609375, -0.017303466796875, 0.0009765625, 0.019256591796875, 0.03753662109375, 0.055816650390625, 0.0740966796875, 0.092376708984375, 0.11065673828125, 0.128936767578125, 0.147216796875, 0.165496826171875, 0.18377685546875, 0.202056884765625, 0.2203369140625, 0.238616943359375, 0.25689697265625, 0.275177001953125, 0.29345703125, 0.311737060546875, 0.33001708984375, 0.348297119140625, 0.3665771484375, 0.384857177734375, 0.40313720703125, 0.421417236328125, 0.439697265625, 0.457977294921875, 0.47625732421875, 0.494537353515625, 0.5128173828125, 0.531097412109375, 0.54937744140625, 0.567657470703125, 0.5859375]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 6.0, 5.0, 5.0, 6.0, 8.0, 17.0, 11.0, 21.0, 41.0, 45.0, 74.0, 145.0, 230.0, 136.0, 83.0, 43.0, 35.0, 13.0, 16.0, 11.0, 7.0, 8.0, 5.0, 5.0, 4.0, 2.0, 6.0, 5.0, 3.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.038970947265625, -0.0378718376159668, -0.036772727966308594, -0.03567361831665039, -0.03457450866699219, -0.033475399017333984, -0.03237628936767578, -0.03127717971801758, -0.030178070068359375, -0.029078960418701172, -0.02797985076904297, -0.026880741119384766, -0.025781631469726562, -0.02468252182006836, -0.023583412170410156, -0.022484302520751953, -0.02138519287109375, -0.020286083221435547, -0.019186973571777344, -0.01808786392211914, -0.016988754272460938, -0.015889644622802734, -0.014790534973144531, -0.013691425323486328, -0.012592315673828125, -0.011493206024169922, -0.010394096374511719, -0.009294986724853516, -0.008195877075195312, -0.007096767425537109, -0.005997657775878906, -0.004898548126220703, -0.0037994384765625, -0.002700328826904297, -0.0016012191772460938, -0.0005021095275878906, 0.0005970001220703125, 0.0016961097717285156, 0.0027952194213867188, 0.003894329071044922, 0.004993438720703125, 0.006092548370361328, 0.007191658020019531, 0.008290767669677734, 0.009389877319335938, 0.01048898696899414, 0.011588096618652344, 0.012687206268310547, 0.01378631591796875, 0.014885425567626953, 0.015984535217285156, 0.01708364486694336, 0.018182754516601562, 0.019281864166259766, 0.02038097381591797, 0.021480083465576172, 0.022579193115234375, 0.023678302764892578, 0.02477741241455078, 0.025876522064208984, 0.026975631713867188, 0.02807474136352539, 0.029173851013183594, 0.030272960662841797, 0.0313720703125]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 4.0, 9.0, 6.0, 9.0, 8.0, 13.0, 10.0, 10.0, 23.0, 29.0, 56.0, 70.0, 115.0, 167.0, 587.0, 32995.0, 1010690.0, 3036.0, 286.0, 135.0, 98.0, 65.0, 31.0, 20.0, 20.0, 10.0, 13.0, 9.0, 5.0, 5.0, 0.0, 6.0, 2.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.625, -0.6028900146484375, -0.580780029296875, -0.5586700439453125, -0.53656005859375, -0.5144500732421875, -0.492340087890625, -0.4702301025390625, -0.4481201171875, -0.4260101318359375, -0.403900146484375, -0.3817901611328125, -0.35968017578125, -0.3375701904296875, -0.315460205078125, -0.2933502197265625, -0.271240234375, -0.2491302490234375, -0.227020263671875, -0.2049102783203125, -0.18280029296875, -0.1606903076171875, -0.138580322265625, -0.1164703369140625, -0.0943603515625, -0.0722503662109375, -0.050140380859375, -0.0280303955078125, -0.00592041015625, 0.0161895751953125, 0.038299560546875, 0.0604095458984375, 0.08251953125, 0.1046295166015625, 0.126739501953125, 0.1488494873046875, 0.17095947265625, 0.1930694580078125, 0.215179443359375, 0.2372894287109375, 0.2593994140625, 0.2815093994140625, 0.303619384765625, 0.3257293701171875, 0.34783935546875, 0.3699493408203125, 0.392059326171875, 0.4141693115234375, 0.436279296875, 0.4583892822265625, 0.480499267578125, 0.5026092529296875, 0.52471923828125, 0.5468292236328125, 0.568939208984375, 0.5910491943359375, 0.6131591796875, 0.6352691650390625, 0.657379150390625, 0.6794891357421875, 0.70159912109375, 0.7237091064453125, 0.745819091796875, 0.7679290771484375, 0.7900390625]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 8.0, 31.0, 93.0, 583.0, 262.0, 33.0, 7.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.272876501083374, -0.2660271227359772, -0.2591777443885803, -0.25232839584350586, -0.24547900259494781, -0.23862963914871216, -0.2317802608013153, -0.22493088245391846, -0.2180815041065216, -0.21123212575912476, -0.2043827623128891, -0.19753338396549225, -0.1906840056180954, -0.18383464217185974, -0.1769852638244629, -0.17013588547706604, -0.16328652203083038, -0.15643714368343353, -0.14958778023719788, -0.14273840188980103, -0.13588902354240417, -0.12903964519500732, -0.12219028174877167, -0.11534090340137482, -0.10849153250455856, -0.10164216160774231, -0.09479278326034546, -0.0879434123635292, -0.08109404146671295, -0.0742446631193161, -0.06739529222249985, -0.060545917600393295, -0.05369654297828674, -0.04684716835618019, -0.03999779373407364, -0.033148422837257385, -0.026299048215150833, -0.01944967359304428, -0.012600302696228027, -0.005750928074121475, 0.001098446547985077, 0.007947820238769054, 0.014797193929553032, 0.021646566689014435, 0.028495941311120987, 0.03534531593322754, 0.04219468683004379, 0.049044061452150345, 0.0558934360742569, 0.06274280697107315, 0.06959218531847, 0.07644155621528625, 0.0832909345626831, 0.09014030545949936, 0.09698967635631561, 0.10383905470371246, 0.11068842560052872, 0.11753779649734497, 0.12438717484474182, 0.13123655319213867, 0.13808591663837433, 0.14493529498577118, 0.15178465843200684, 0.1586340367794037, 0.16548341512680054]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 7.0, 5.0, 5.0, 7.0, 7.0, 13.0, 19.0, 11.0, 15.0, 22.0, 24.0, 17.0, 20.0, 19.0, 39.0, 28.0, 28.0, 37.0, 44.0, 35.0, 44.0, 40.0, 46.0, 37.0, 41.0, 45.0, 34.0, 32.0, 34.0, 31.0, 42.0, 26.0, 25.0, 19.0, 22.0, 15.0, 16.0, 9.0, 14.0, 8.0, 7.0, 5.0, 5.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.022802889347076416, -0.022143829613924026, -0.021484771743416786, -0.020825713872909546, -0.020166654139757156, -0.019507594406604767, -0.018848536536097527, -0.018189478665590286, -0.017530418932437897, -0.016871359199285507, -0.016212301328778267, -0.015553242526948452, -0.014894183725118637, -0.014235124923288822, -0.013576066121459007, -0.012917007319629192, -0.012257948517799377, -0.011598889715969563, -0.010939830914139748, -0.010280772112309933, -0.009621713310480118, -0.008962654508650303, -0.008303595706820488, -0.007644536904990673, -0.006985478103160858, -0.006326419301331043, -0.005667360499501228, -0.005008301697671413, -0.0043492428958415985, -0.0036901840940117836, -0.0030311252921819687, -0.0023720664903521538, -0.0017130076885223389, -0.001053948886692524, -0.00039489008486270905, 0.00026416871696710587, 0.0009232275187969208, 0.0015822863206267357, 0.0022413451224565506, 0.0029004039242863655, 0.0035594627261161804, 0.004218521527945995, 0.00487758032977581, 0.005536639131605625, 0.00619569793343544, 0.006854756735265255, 0.00751381553709507, 0.008172874338924885, 0.0088319331407547, 0.009490991942584515, 0.01015005074441433, 0.010809109546244144, 0.01146816834807396, 0.012127227149903774, 0.01278628595173359, 0.013445344753563404, 0.014104403555393219, 0.014763462357223034, 0.015422521159052849, 0.01608157902956009, 0.01674063876271248, 0.017399698495864868, 0.01805875636637211, 0.01871781423687935, 0.01937687397003174]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 6.0, 1.0, 4.0, 7.0, 6.0, 5.0, 4.0, 13.0, 11.0, 14.0, 15.0, 24.0, 30.0, 22.0, 26.0, 18.0, 20.0, 28.0, 45.0, 31.0, 38.0, 42.0, 37.0, 41.0, 32.0, 41.0, 38.0, 39.0, 35.0, 32.0, 37.0, 32.0, 31.0, 22.0, 18.0, 32.0, 23.0, 14.0, 14.0, 11.0, 17.0, 10.0, 7.0, 11.0, 5.0, 4.0, 8.0, 3.0, 1.0, 5.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-8.0, -7.73876953125, -7.4775390625, -7.21630859375, -6.955078125, -6.69384765625, -6.4326171875, -6.17138671875, -5.91015625, -5.64892578125, -5.3876953125, -5.12646484375, -4.865234375, -4.60400390625, -4.3427734375, -4.08154296875, -3.8203125, -3.55908203125, -3.2978515625, -3.03662109375, -2.775390625, -2.51416015625, -2.2529296875, -1.99169921875, -1.73046875, -1.46923828125, -1.2080078125, -0.94677734375, -0.685546875, -0.42431640625, -0.1630859375, 0.09814453125, 0.359375, 0.62060546875, 0.8818359375, 1.14306640625, 1.404296875, 1.66552734375, 1.9267578125, 2.18798828125, 2.44921875, 2.71044921875, 2.9716796875, 3.23291015625, 3.494140625, 3.75537109375, 4.0166015625, 4.27783203125, 4.5390625, 4.80029296875, 5.0615234375, 5.32275390625, 5.583984375, 5.84521484375, 6.1064453125, 6.36767578125, 6.62890625, 6.89013671875, 7.1513671875, 7.41259765625, 7.673828125, 7.93505859375, 8.1962890625, 8.45751953125, 8.71875]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 2.0, 2.0, 3.0, 8.0, 16.0, 8.0, 20.0, 19.0, 33.0, 49.0, 61.0, 95.0, 112.0, 158.0, 236.0, 360.0, 546.0, 807.0, 1190.0, 1837.0, 2899.0, 4572.0, 8297.0, 15497.0, 31646.0, 73524.0, 242450.0, 433318.0, 132096.0, 48214.0, 22233.0, 11319.0, 6390.0, 3747.0, 2265.0, 1436.0, 976.0, 671.0, 436.0, 300.0, 189.0, 161.0, 113.0, 68.0, 42.0, 42.0, 30.0, 22.0, 9.0, 16.0, 6.0, 5.0, 9.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.109375, -10.7423095703125, -10.375244140625, -10.0081787109375, -9.64111328125, -9.2740478515625, -8.906982421875, -8.5399169921875, -8.1728515625, -7.8057861328125, -7.438720703125, -7.0716552734375, -6.70458984375, -6.3375244140625, -5.970458984375, -5.6033935546875, -5.236328125, -4.8692626953125, -4.502197265625, -4.1351318359375, -3.76806640625, -3.4010009765625, -3.033935546875, -2.6668701171875, -2.2998046875, -1.9327392578125, -1.565673828125, -1.1986083984375, -0.83154296875, -0.4644775390625, -0.097412109375, 0.2696533203125, 0.63671875, 1.0037841796875, 1.370849609375, 1.7379150390625, 2.10498046875, 2.4720458984375, 2.839111328125, 3.2061767578125, 3.5732421875, 3.9403076171875, 4.307373046875, 4.6744384765625, 5.04150390625, 5.4085693359375, 5.775634765625, 6.1427001953125, 6.509765625, 6.8768310546875, 7.243896484375, 7.6109619140625, 7.97802734375, 8.3450927734375, 8.712158203125, 9.0792236328125, 9.4462890625, 9.8133544921875, 10.180419921875, 10.5474853515625, 10.91455078125, 11.2816162109375, 11.648681640625, 12.0157470703125, 12.3828125]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 0.0, 5.0, 3.0, 7.0, 10.0, 11.0, 14.0, 7.0, 10.0, 16.0, 17.0, 28.0, 19.0, 26.0, 24.0, 32.0, 26.0, 41.0, 45.0, 67.0, 80.0, 102.0, 216.0, 1388.0, 248.0, 120.0, 94.0, 54.0, 38.0, 47.0, 27.0, 24.0, 27.0, 18.0, 24.0, 20.0, 10.0, 20.0, 21.0, 9.0, 14.0, 10.0, 11.0, 7.0, 6.0, 2.0, 3.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0], "bins": [-21.78125, -21.15185546875, -20.5224609375, -19.89306640625, -19.263671875, -18.63427734375, -18.0048828125, -17.37548828125, -16.74609375, -16.11669921875, -15.4873046875, -14.85791015625, -14.228515625, -13.59912109375, -12.9697265625, -12.34033203125, -11.7109375, -11.08154296875, -10.4521484375, -9.82275390625, -9.193359375, -8.56396484375, -7.9345703125, -7.30517578125, -6.67578125, -6.04638671875, -5.4169921875, -4.78759765625, -4.158203125, -3.52880859375, -2.8994140625, -2.27001953125, -1.640625, -1.01123046875, -0.3818359375, 0.24755859375, 0.876953125, 1.50634765625, 2.1357421875, 2.76513671875, 3.39453125, 4.02392578125, 4.6533203125, 5.28271484375, 5.912109375, 6.54150390625, 7.1708984375, 7.80029296875, 8.4296875, 9.05908203125, 9.6884765625, 10.31787109375, 10.947265625, 11.57666015625, 12.2060546875, 12.83544921875, 13.46484375, 14.09423828125, 14.7236328125, 15.35302734375, 15.982421875, 16.61181640625, 17.2412109375, 17.87060546875, 18.5]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 1.0, 4.0, 5.0, 5.0, 4.0, 11.0, 7.0, 11.0, 24.0, 20.0, 39.0, 60.0, 74.0, 118.0, 235.0, 501.0, 1783.0, 15571.0, 2630840.0, 485383.0, 8741.0, 1297.0, 405.0, 193.0, 122.0, 70.0, 48.0, 34.0, 20.0, 27.0, 10.0, 8.0, 12.0, 6.0, 5.0, 4.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-61.0, -59.1455078125, -57.291015625, -55.4365234375, -53.58203125, -51.7275390625, -49.873046875, -48.0185546875, -46.1640625, -44.3095703125, -42.455078125, -40.6005859375, -38.74609375, -36.8916015625, -35.037109375, -33.1826171875, -31.328125, -29.4736328125, -27.619140625, -25.7646484375, -23.91015625, -22.0556640625, -20.201171875, -18.3466796875, -16.4921875, -14.6376953125, -12.783203125, -10.9287109375, -9.07421875, -7.2197265625, -5.365234375, -3.5107421875, -1.65625, 0.1982421875, 2.052734375, 3.9072265625, 5.76171875, 7.6162109375, 9.470703125, 11.3251953125, 13.1796875, 15.0341796875, 16.888671875, 18.7431640625, 20.59765625, 22.4521484375, 24.306640625, 26.1611328125, 28.015625, 29.8701171875, 31.724609375, 33.5791015625, 35.43359375, 37.2880859375, 39.142578125, 40.9970703125, 42.8515625, 44.7060546875, 46.560546875, 48.4150390625, 50.26953125, 52.1240234375, 53.978515625, 55.8330078125, 57.6875]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 24.0, 522.0, 459.0, 12.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-464.90570068359375, -455.78759765625, -446.66949462890625, -437.5513610839844, -428.4332580566406, -419.3151550292969, -410.1970520019531, -401.0789489746094, -391.9608154296875, -382.84271240234375, -373.724609375, -364.6064758300781, -355.4883728027344, -346.3702697753906, -337.2521667480469, -328.1340637207031, -319.0159606933594, -309.8978576660156, -300.7797546386719, -291.66162109375, -282.54351806640625, -273.4254150390625, -264.30731201171875, -255.189208984375, -246.0710906982422, -236.95298767089844, -227.83486938476562, -218.71676635742188, -209.59866333007812, -200.4805450439453, -191.36244201660156, -182.24432373046875, -173.126220703125, -164.00811767578125, -154.88999938964844, -145.7718963623047, -136.65377807617188, -127.53567504882812, -118.41757202148438, -109.2994613647461, -100.18134307861328, -91.063232421875, -81.94512939453125, -72.82701873779297, -63.70890808105469, -54.590797424316406, -45.47269058227539, -36.354583740234375, -27.236473083496094, -18.118364334106445, -9.000255584716797, 0.11785316467285156, 9.2359619140625, 18.35407257080078, 27.472179412841797, 36.59028625488281, 45.708396911621094, 54.826507568359375, 63.94461441040039, 73.0627212524414, 82.18083190917969, 91.29894256591797, 100.41705322265625, 109.53515625, 118.65326690673828]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 5.0, 9.0, 14.0, 8.0, 9.0, 15.0, 10.0, 24.0, 25.0, 17.0, 37.0, 26.0, 45.0, 31.0, 21.0, 37.0, 33.0, 47.0, 45.0, 47.0, 49.0, 50.0, 40.0, 48.0, 23.0, 37.0, 29.0, 30.0, 32.0, 24.0, 15.0, 18.0, 14.0, 20.0, 15.0, 12.0, 7.0, 8.0, 8.0, 3.0, 8.0, 4.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-50.259281158447266, -48.63461685180664, -47.009952545166016, -45.38528823852539, -43.760623931884766, -42.13595962524414, -40.51129150390625, -38.886627197265625, -37.261962890625, -35.637298583984375, -34.01263427734375, -32.387969970703125, -30.7633056640625, -29.138641357421875, -27.513975143432617, -25.889310836791992, -24.2646484375, -22.639984130859375, -21.01531982421875, -19.390655517578125, -17.7659912109375, -16.141326904296875, -14.516660690307617, -12.891996383666992, -11.267332077026367, -9.642667770385742, -8.018003463745117, -6.393338203430176, -4.768673896789551, -3.144009590148926, -1.5193443298339844, 0.10531997680664062, 1.7299880981445312, 3.3546526432037354, 4.9793171882629395, 6.603981971740723, 8.228646278381348, 9.853310585021973, 11.477975845336914, 13.102640151977539, 14.727304458618164, 16.35196876525879, 17.976633071899414, 19.601299285888672, 21.225963592529297, 22.850627899169922, 24.475292205810547, 26.099956512451172, 27.724620819091797, 29.349285125732422, 30.973949432373047, 32.59861373901367, 34.2232780456543, 35.84794235229492, 37.47261047363281, 39.09727478027344, 40.72193908691406, 42.34660339355469, 43.97126770019531, 45.59593200683594, 47.22059631347656, 48.84526062011719, 50.46992492675781, 52.09458923339844, 53.71925354003906]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 4.0, 3.0, 8.0, 6.0, 7.0, 12.0, 8.0, 16.0, 21.0, 18.0, 16.0, 23.0, 22.0, 22.0, 24.0, 27.0, 40.0, 46.0, 39.0, 46.0, 34.0, 31.0, 45.0, 40.0, 36.0, 27.0, 36.0, 36.0, 28.0, 29.0, 39.0, 31.0, 22.0, 20.0, 13.0, 18.0, 18.0, 13.0, 11.0, 11.0, 13.0, 15.0, 5.0, 8.0, 7.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-8.3203125, -8.0587158203125, -7.797119140625, -7.5355224609375, -7.27392578125, -7.0123291015625, -6.750732421875, -6.4891357421875, -6.2275390625, -5.9659423828125, -5.704345703125, -5.4427490234375, -5.18115234375, -4.9195556640625, -4.657958984375, -4.3963623046875, -4.134765625, -3.8731689453125, -3.611572265625, -3.3499755859375, -3.08837890625, -2.8267822265625, -2.565185546875, -2.3035888671875, -2.0419921875, -1.7803955078125, -1.518798828125, -1.2572021484375, -0.99560546875, -0.7340087890625, -0.472412109375, -0.2108154296875, 0.05078125, 0.3123779296875, 0.573974609375, 0.8355712890625, 1.09716796875, 1.3587646484375, 1.620361328125, 1.8819580078125, 2.1435546875, 2.4051513671875, 2.666748046875, 2.9283447265625, 3.18994140625, 3.4515380859375, 3.713134765625, 3.9747314453125, 4.236328125, 4.4979248046875, 4.759521484375, 5.0211181640625, 5.28271484375, 5.5443115234375, 5.805908203125, 6.0675048828125, 6.3291015625, 6.5906982421875, 6.852294921875, 7.1138916015625, 7.37548828125, 7.6370849609375, 7.898681640625, 8.1602783203125, 8.421875]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 5.0, 4.0, 4.0, 10.0, 7.0, 10.0, 15.0, 15.0, 27.0, 30.0, 21.0, 31.0, 47.0, 48.0, 80.0, 105.0, 130.0, 211.0, 352.0, 661.0, 1601.0, 7606.0, 2301515.0, 1871348.0, 7077.0, 1513.0, 655.0, 348.0, 218.0, 147.0, 105.0, 61.0, 53.0, 52.0, 31.0, 22.0, 26.0, 17.0, 14.0, 16.0, 13.0, 8.0, 8.0, 1.0, 5.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-78.875, -76.4091796875, -73.943359375, -71.4775390625, -69.01171875, -66.5458984375, -64.080078125, -61.6142578125, -59.1484375, -56.6826171875, -54.216796875, -51.7509765625, -49.28515625, -46.8193359375, -44.353515625, -41.8876953125, -39.421875, -36.9560546875, -34.490234375, -32.0244140625, -29.55859375, -27.0927734375, -24.626953125, -22.1611328125, -19.6953125, -17.2294921875, -14.763671875, -12.2978515625, -9.83203125, -7.3662109375, -4.900390625, -2.4345703125, 0.03125, 2.4970703125, 4.962890625, 7.4287109375, 9.89453125, 12.3603515625, 14.826171875, 17.2919921875, 19.7578125, 22.2236328125, 24.689453125, 27.1552734375, 29.62109375, 32.0869140625, 34.552734375, 37.0185546875, 39.484375, 41.9501953125, 44.416015625, 46.8818359375, 49.34765625, 51.8134765625, 54.279296875, 56.7451171875, 59.2109375, 61.6767578125, 64.142578125, 66.6083984375, 69.07421875, 71.5400390625, 74.005859375, 76.4716796875, 78.9375]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 2.0, 4.0, 2.0, 7.0, 4.0, 4.0, 5.0, 4.0, 9.0, 11.0, 14.0, 17.0, 29.0, 32.0, 52.0, 69.0, 69.0, 114.0, 180.0, 315.0, 515.0, 720.0, 667.0, 432.0, 256.0, 168.0, 108.0, 57.0, 48.0, 38.0, 25.0, 27.0, 20.0, 11.0, 11.0, 9.0, 9.0, 9.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.9140625, -12.4500732421875, -11.986083984375, -11.5220947265625, -11.05810546875, -10.5941162109375, -10.130126953125, -9.6661376953125, -9.2021484375, -8.7381591796875, -8.274169921875, -7.8101806640625, -7.34619140625, -6.8822021484375, -6.418212890625, -5.9542236328125, -5.490234375, -5.0262451171875, -4.562255859375, -4.0982666015625, -3.63427734375, -3.1702880859375, -2.706298828125, -2.2423095703125, -1.7783203125, -1.3143310546875, -0.850341796875, -0.3863525390625, 0.07763671875, 0.5416259765625, 1.005615234375, 1.4696044921875, 1.93359375, 2.3975830078125, 2.861572265625, 3.3255615234375, 3.78955078125, 4.2535400390625, 4.717529296875, 5.1815185546875, 5.6455078125, 6.1094970703125, 6.573486328125, 7.0374755859375, 7.50146484375, 7.9654541015625, 8.429443359375, 8.8934326171875, 9.357421875, 9.8214111328125, 10.285400390625, 10.7493896484375, 11.21337890625, 11.6773681640625, 12.141357421875, 12.6053466796875, 13.0693359375, 13.5333251953125, 13.997314453125, 14.4613037109375, 14.92529296875, 15.3892822265625, 15.853271484375, 16.3172607421875, 16.78125]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 7.0, 3.0, 7.0, 11.0, 7.0, 9.0, 12.0, 17.0, 29.0, 28.0, 39.0, 47.0, 97.0, 143.0, 281.0, 578.0, 1362.0, 3750.0, 12159.0, 70420.0, 2531681.0, 1502151.0, 55510.0, 10341.0, 3185.0, 1200.0, 497.0, 280.0, 132.0, 79.0, 54.0, 35.0, 20.0, 27.0, 26.0, 13.0, 13.0, 5.0, 6.0, 4.0, 3.0, 3.0, 7.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.03125, -34.9033203125, -33.775390625, -32.6474609375, -31.51953125, -30.3916015625, -29.263671875, -28.1357421875, -27.0078125, -25.8798828125, -24.751953125, -23.6240234375, -22.49609375, -21.3681640625, -20.240234375, -19.1123046875, -17.984375, -16.8564453125, -15.728515625, -14.6005859375, -13.47265625, -12.3447265625, -11.216796875, -10.0888671875, -8.9609375, -7.8330078125, -6.705078125, -5.5771484375, -4.44921875, -3.3212890625, -2.193359375, -1.0654296875, 0.0625, 1.1904296875, 2.318359375, 3.4462890625, 4.57421875, 5.7021484375, 6.830078125, 7.9580078125, 9.0859375, 10.2138671875, 11.341796875, 12.4697265625, 13.59765625, 14.7255859375, 15.853515625, 16.9814453125, 18.109375, 19.2373046875, 20.365234375, 21.4931640625, 22.62109375, 23.7490234375, 24.876953125, 26.0048828125, 27.1328125, 28.2607421875, 29.388671875, 30.5166015625, 31.64453125, 32.7724609375, 33.900390625, 35.0283203125, 36.15625]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 16.0, 23.0, 30.0, 59.0, 108.0, 151.0, 186.0, 161.0, 106.0, 71.0, 44.0, 30.0, 11.0, 7.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-26.5049991607666, -24.248519897460938, -21.99203872680664, -19.735557556152344, -17.47907829284668, -15.2225980758667, -12.966117858886719, -10.709637641906738, -8.453157424926758, -6.196677207946777, -3.940196990966797, -1.6837167739868164, 0.5727634429931641, 2.8292436599731445, 5.085723876953125, 7.3422040939331055, 9.598684310913086, 11.855164527893066, 14.111644744873047, 16.368125915527344, 18.624605178833008, 20.881084442138672, 23.13756561279297, 25.394046783447266, 27.65052604675293, 29.907005310058594, 32.16348648071289, 34.41996765136719, 36.67644500732422, 38.932926177978516, 41.18940734863281, 43.44588851928711, 45.702362060546875, 47.95884323120117, 50.21532440185547, 52.4718017578125, 54.7282829284668, 56.984764099121094, 59.241241455078125, 61.49772262573242, 63.75420379638672, 66.01068115234375, 68.26716613769531, 70.52364349365234, 72.78012084960938, 75.03660583496094, 77.29308319091797, 79.54956817626953, 81.80604553222656, 84.0625228881836, 86.31900787353516, 88.57548522949219, 90.83197021484375, 93.08844757080078, 95.34492492675781, 97.60140991210938, 99.8578872680664, 102.11436462402344, 104.370849609375, 106.62732696533203, 108.88380432128906, 111.14028930664062, 113.39676666259766, 115.65325164794922, 117.90972900390625]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 8.0, 3.0, 1.0, 7.0, 4.0, 4.0, 10.0, 9.0, 15.0, 8.0, 14.0, 12.0, 24.0, 31.0, 21.0, 26.0, 29.0, 25.0, 33.0, 31.0, 32.0, 35.0, 35.0, 43.0, 40.0, 55.0, 39.0, 38.0, 30.0, 30.0, 30.0, 31.0, 29.0, 21.0, 28.0, 29.0, 19.0, 23.0, 16.0, 16.0, 13.0, 15.0, 11.0, 6.0, 9.0, 7.0, 2.0, 1.0, 6.0, 4.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-41.1014404296875, -39.82278823852539, -38.54413604736328, -37.26548767089844, -35.98683547973633, -34.70818328857422, -33.429534912109375, -32.150882720947266, -30.872230529785156, -29.593578338623047, -28.31492805480957, -27.036277770996094, -25.757625579833984, -24.478973388671875, -23.2003231048584, -21.921672821044922, -20.643020629882812, -19.364368438720703, -18.085718154907227, -16.80706787109375, -15.52841567993164, -14.249764442443848, -12.971113204956055, -11.692461967468262, -10.413810729980469, -9.135159492492676, -7.856508255004883, -6.57785701751709, -5.299205780029297, -4.020554542541504, -2.741903305053711, -1.463252067565918, -0.184600830078125, 1.094050407409668, 2.372701644897461, 3.651352882385254, 4.930004119873047, 6.20865535736084, 7.487306594848633, 8.765957832336426, 10.044609069824219, 11.323260307312012, 12.601911544799805, 13.880562782287598, 15.15921401977539, 16.4378662109375, 17.716516494750977, 18.995166778564453, 20.273818969726562, 21.552471160888672, 22.83112144470215, 24.109771728515625, 25.388423919677734, 26.667076110839844, 27.94572639465332, 29.224376678466797, 30.503028869628906, 31.781681060791016, 33.060333251953125, 34.33898162841797, 35.61763381958008, 36.89628601074219, 38.17493438720703, 39.45358657836914, 40.73223876953125]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 4.0, 10.0, 7.0, 8.0, 5.0, 7.0, 7.0, 8.0, 20.0, 11.0, 13.0, 12.0, 18.0, 22.0, 30.0, 28.0, 36.0, 37.0, 37.0, 48.0, 32.0, 49.0, 38.0, 42.0, 40.0, 42.0, 39.0, 30.0, 37.0, 27.0, 32.0, 22.0, 34.0, 28.0, 18.0, 10.0, 18.0, 17.0, 13.0, 10.0, 12.0, 13.0, 10.0, 7.0, 3.0, 3.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.84375, -7.58544921875, -7.3271484375, -7.06884765625, -6.810546875, -6.55224609375, -6.2939453125, -6.03564453125, -5.77734375, -5.51904296875, -5.2607421875, -5.00244140625, -4.744140625, -4.48583984375, -4.2275390625, -3.96923828125, -3.7109375, -3.45263671875, -3.1943359375, -2.93603515625, -2.677734375, -2.41943359375, -2.1611328125, -1.90283203125, -1.64453125, -1.38623046875, -1.1279296875, -0.86962890625, -0.611328125, -0.35302734375, -0.0947265625, 0.16357421875, 0.421875, 0.68017578125, 0.9384765625, 1.19677734375, 1.455078125, 1.71337890625, 1.9716796875, 2.22998046875, 2.48828125, 2.74658203125, 3.0048828125, 3.26318359375, 3.521484375, 3.77978515625, 4.0380859375, 4.29638671875, 4.5546875, 4.81298828125, 5.0712890625, 5.32958984375, 5.587890625, 5.84619140625, 6.1044921875, 6.36279296875, 6.62109375, 6.87939453125, 7.1376953125, 7.39599609375, 7.654296875, 7.91259765625, 8.1708984375, 8.42919921875, 8.6875]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 10.0, 22.0, 24.0, 47.0, 63.0, 103.0, 153.0, 225.0, 388.0, 607.0, 927.0, 1455.0, 2293.0, 3528.0, 5694.0, 9145.0, 14662.0, 23310.0, 37649.0, 61668.0, 101214.0, 161099.0, 208675.0, 158345.0, 98531.0, 60469.0, 37088.0, 22760.0, 14129.0, 8856.0, 5656.0, 3544.0, 2187.0, 1496.0, 927.0, 582.0, 361.0, 238.0, 162.0, 101.0, 57.0, 45.0, 17.0, 19.0, 12.0, 3.0, 9.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.029296875, -0.9976043701171875, -0.965911865234375, -0.9342193603515625, -0.90252685546875, -0.8708343505859375, -0.839141845703125, -0.8074493408203125, -0.7757568359375, -0.7440643310546875, -0.712371826171875, -0.6806793212890625, -0.64898681640625, -0.6172943115234375, -0.585601806640625, -0.5539093017578125, -0.522216796875, -0.4905242919921875, -0.458831787109375, -0.4271392822265625, -0.39544677734375, -0.3637542724609375, -0.332061767578125, -0.3003692626953125, -0.2686767578125, -0.2369842529296875, -0.205291748046875, -0.1735992431640625, -0.14190673828125, -0.1102142333984375, -0.078521728515625, -0.0468292236328125, -0.01513671875, 0.0165557861328125, 0.048248291015625, 0.0799407958984375, 0.11163330078125, 0.1433258056640625, 0.175018310546875, 0.2067108154296875, 0.2384033203125, 0.2700958251953125, 0.301788330078125, 0.3334808349609375, 0.36517333984375, 0.3968658447265625, 0.428558349609375, 0.4602508544921875, 0.491943359375, 0.5236358642578125, 0.555328369140625, 0.5870208740234375, 0.61871337890625, 0.6504058837890625, 0.682098388671875, 0.7137908935546875, 0.7454833984375, 0.7771759033203125, 0.808868408203125, 0.8405609130859375, 0.87225341796875, 0.9039459228515625, 0.935638427734375, 0.9673309326171875, 0.9990234375]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 10.0, 9.0, 3.0, 6.0, 13.0, 14.0, 21.0, 24.0, 17.0, 25.0, 33.0, 37.0, 28.0, 33.0, 34.0, 36.0, 36.0, 36.0, 56.0, 1063.0, 46.0, 35.0, 45.0, 38.0, 45.0, 43.0, 37.0, 28.0, 23.0, 21.0, 17.0, 17.0, 16.0, 21.0, 9.0, 4.0, 7.0, 2.0, 11.0, 7.0, 4.0, 2.0, 4.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.484375, -5.30426025390625, -5.1241455078125, -4.94403076171875, -4.763916015625, -4.58380126953125, -4.4036865234375, -4.22357177734375, -4.04345703125, -3.86334228515625, -3.6832275390625, -3.50311279296875, -3.322998046875, -3.14288330078125, -2.9627685546875, -2.78265380859375, -2.6025390625, -2.42242431640625, -2.2423095703125, -2.06219482421875, -1.882080078125, -1.70196533203125, -1.5218505859375, -1.34173583984375, -1.16162109375, -0.98150634765625, -0.8013916015625, -0.62127685546875, -0.441162109375, -0.26104736328125, -0.0809326171875, 0.09918212890625, 0.279296875, 0.45941162109375, 0.6395263671875, 0.81964111328125, 0.999755859375, 1.17987060546875, 1.3599853515625, 1.54010009765625, 1.72021484375, 1.90032958984375, 2.0804443359375, 2.26055908203125, 2.440673828125, 2.62078857421875, 2.8009033203125, 2.98101806640625, 3.1611328125, 3.34124755859375, 3.5213623046875, 3.70147705078125, 3.881591796875, 4.06170654296875, 4.2418212890625, 4.42193603515625, 4.60205078125, 4.78216552734375, 4.9622802734375, 5.14239501953125, 5.322509765625, 5.50262451171875, 5.6827392578125, 5.86285400390625, 6.04296875]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 8.0, 5.0, 10.0, 20.0, 43.0, 44.0, 67.0, 110.0, 138.0, 198.0, 269.0, 403.0, 621.0, 828.0, 1303.0, 1753.0, 2774.0, 3862.0, 5704.0, 8489.0, 12535.0, 18882.0, 28446.0, 44173.0, 68705.0, 107683.0, 157598.0, 1214421.0, 142399.0, 96536.0, 61696.0, 39130.0, 25773.0, 16889.0, 11339.0, 7594.0, 5228.0, 3638.0, 2444.0, 1679.0, 1159.0, 796.0, 525.0, 378.0, 250.0, 194.0, 137.0, 78.0, 65.0, 55.0, 22.0, 21.0, 8.0, 5.0, 5.0, 2.0, 3.0, 0.0, 4.0], "bins": [-0.61767578125, -0.5985946655273438, -0.5795135498046875, -0.5604324340820312, -0.541351318359375, -0.5222702026367188, -0.5031890869140625, -0.48410797119140625, -0.46502685546875, -0.44594573974609375, -0.4268646240234375, -0.40778350830078125, -0.388702392578125, -0.36962127685546875, -0.3505401611328125, -0.33145904541015625, -0.3123779296875, -0.29329681396484375, -0.2742156982421875, -0.25513458251953125, -0.236053466796875, -0.21697235107421875, -0.1978912353515625, -0.17881011962890625, -0.15972900390625, -0.14064788818359375, -0.1215667724609375, -0.10248565673828125, -0.083404541015625, -0.06432342529296875, -0.0452423095703125, -0.02616119384765625, -0.007080078125, 0.01200103759765625, 0.0310821533203125, 0.05016326904296875, 0.069244384765625, 0.08832550048828125, 0.1074066162109375, 0.12648773193359375, 0.14556884765625, 0.16464996337890625, 0.1837310791015625, 0.20281219482421875, 0.221893310546875, 0.24097442626953125, 0.2600555419921875, 0.27913665771484375, 0.2982177734375, 0.31729888916015625, 0.3363800048828125, 0.35546112060546875, 0.374542236328125, 0.39362335205078125, 0.4127044677734375, 0.43178558349609375, 0.45086669921875, 0.46994781494140625, 0.4890289306640625, 0.5081100463867188, 0.527191162109375, 0.5462722778320312, 0.5653533935546875, 0.5844345092773438, 0.603515625]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 4.0, 3.0, 6.0, 7.0, 1.0, 11.0, 7.0, 12.0, 21.0, 23.0, 32.0, 39.0, 80.0, 157.0, 210.0, 124.0, 70.0, 54.0, 34.0, 26.0, 22.0, 11.0, 5.0, 8.0, 3.0, 6.0, 5.0, 0.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.053466796875, -0.05195426940917969, -0.050441741943359375, -0.04892921447753906, -0.04741668701171875, -0.04590415954589844, -0.044391632080078125, -0.04287910461425781, -0.0413665771484375, -0.03985404968261719, -0.038341522216796875, -0.03682899475097656, -0.03531646728515625, -0.03380393981933594, -0.032291412353515625, -0.030778884887695312, -0.029266357421875, -0.027753829956054688, -0.026241302490234375, -0.024728775024414062, -0.02321624755859375, -0.021703720092773438, -0.020191192626953125, -0.018678665161132812, -0.0171661376953125, -0.015653610229492188, -0.014141082763671875, -0.012628555297851562, -0.01111602783203125, -0.009603500366210938, -0.008090972900390625, -0.0065784454345703125, -0.00506591796875, -0.0035533905029296875, -0.002040863037109375, -0.0005283355712890625, 0.00098419189453125, 0.0024967193603515625, 0.004009246826171875, 0.0055217742919921875, 0.0070343017578125, 0.008546829223632812, 0.010059356689453125, 0.011571884155273438, 0.01308441162109375, 0.014596939086914062, 0.016109466552734375, 0.017621994018554688, 0.019134521484375, 0.020647048950195312, 0.022159576416015625, 0.023672103881835938, 0.02518463134765625, 0.026697158813476562, 0.028209686279296875, 0.029722213745117188, 0.0312347412109375, 0.03274726867675781, 0.034259796142578125, 0.03577232360839844, 0.03728485107421875, 0.03879737854003906, 0.040309906005859375, 0.04182243347167969, 0.0433349609375]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 4.0, 0.0, 4.0, 2.0, 6.0, 4.0, 3.0, 13.0, 13.0, 20.0, 19.0, 28.0, 47.0, 70.0, 113.0, 170.0, 576.0, 5841.0, 1023166.0, 17090.0, 747.0, 208.0, 103.0, 92.0, 42.0, 39.0, 26.0, 23.0, 12.0, 10.0, 11.0, 8.0, 8.0, 3.0, 3.0, 7.0, 2.0, 4.0, 4.0, 4.0, 6.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.85595703125, -0.8260574340820312, -0.7961578369140625, -0.7662582397460938, -0.736358642578125, -0.7064590454101562, -0.6765594482421875, -0.6466598510742188, -0.61676025390625, -0.5868606567382812, -0.5569610595703125, -0.5270614624023438, -0.497161865234375, -0.46726226806640625, -0.4373626708984375, -0.40746307373046875, -0.3775634765625, -0.34766387939453125, -0.3177642822265625, -0.28786468505859375, -0.257965087890625, -0.22806549072265625, -0.1981658935546875, -0.16826629638671875, -0.13836669921875, -0.10846710205078125, -0.0785675048828125, -0.04866790771484375, -0.018768310546875, 0.01113128662109375, 0.0410308837890625, 0.07093048095703125, 0.100830078125, 0.13072967529296875, 0.1606292724609375, 0.19052886962890625, 0.220428466796875, 0.25032806396484375, 0.2802276611328125, 0.31012725830078125, 0.34002685546875, 0.36992645263671875, 0.3998260498046875, 0.42972564697265625, 0.459625244140625, 0.48952484130859375, 0.5194244384765625, 0.5493240356445312, 0.5792236328125, 0.6091232299804688, 0.6390228271484375, 0.6689224243164062, 0.698822021484375, 0.7287216186523438, 0.7586212158203125, 0.7885208129882812, 0.81842041015625, 0.8483200073242188, 0.8782196044921875, 0.9081192016601562, 0.938018798828125, 0.9679183959960938, 0.9978179931640625, 1.0277175903320312, 1.0576171875]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 3.0, 4.0, 6.0, 9.0, 9.0, 15.0, 17.0, 20.0, 29.0, 51.0, 83.0, 100.0, 140.0, 176.0, 112.0, 75.0, 49.0, 26.0, 21.0, 13.0, 15.0, 5.0, 6.0, 5.0, 4.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05558837205171585, -0.05386858060956001, -0.052148789167404175, -0.05042899772524834, -0.0487092062830925, -0.04698941484093666, -0.04526962339878082, -0.043549828231334686, -0.04183004051446915, -0.04011024907231331, -0.03839045763015747, -0.03667066618800163, -0.034950874745845795, -0.03323108330368996, -0.03151129186153412, -0.02979149855673313, -0.028071705251932144, -0.026351913809776306, -0.024632122367620468, -0.02291233092546463, -0.021192539483308792, -0.019472748041152954, -0.017752954736351967, -0.01603316329419613, -0.01431337185204029, -0.012593580409884453, -0.010873788967728615, -0.009153996594250202, -0.007434205152094364, -0.005714413709938526, -0.0039946213364601135, -0.0022748298943042755, -0.000555034726858139, 0.0011647569481283426, 0.0028845486231148243, 0.00460434053093195, 0.006324131973087788, 0.008043923415243626, 0.009763715788722038, 0.011483507230877876, 0.013203298673033714, 0.014923090115189552, 0.01664288155734539, 0.018362674862146378, 0.020082466304302216, 0.021802257746458054, 0.02352204918861389, 0.02524184063076973, 0.026961632072925568, 0.028681423515081406, 0.030401214957237244, 0.03212100639939308, 0.03384079784154892, 0.03556058928370476, 0.037280380725860596, 0.03900017589330673, 0.04071996361017227, 0.04243975505232811, 0.04415954649448395, 0.045879337936639786, 0.047599129378795624, 0.04931892082095146, 0.0510387122631073, 0.052758507430553436, 0.054478298872709274]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 1.0, 9.0, 9.0, 7.0, 11.0, 15.0, 11.0, 13.0, 21.0, 17.0, 27.0, 24.0, 33.0, 23.0, 25.0, 37.0, 41.0, 37.0, 61.0, 36.0, 44.0, 43.0, 52.0, 48.0, 33.0, 51.0, 25.0, 40.0, 35.0, 28.0, 22.0, 19.0, 18.0, 16.0, 22.0, 13.0, 8.0, 8.0, 8.0, 3.0, 5.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.023683011531829834, -0.022920023649930954, -0.022157037630677223, -0.021394051611423492, -0.020631063729524612, -0.019868075847625732, -0.019105089828372, -0.01834210380911827, -0.01757911592721939, -0.01681612804532051, -0.01605314202606678, -0.015290155075490475, -0.01452716812491417, -0.013764181174337864, -0.013001194223761559, -0.012238207273185253, -0.011475220322608948, -0.010712233372032642, -0.009949246421456337, -0.009186259470880032, -0.008423272520303726, -0.007660285569727421, -0.006897298619151115, -0.00613431166857481, -0.005371324717998505, -0.004608337767422199, -0.003845350816845894, -0.0030823638662695885, -0.002319376915693283, -0.0015563899651169777, -0.0007934030145406723, -3.0416063964366913e-05, 0.0007325708866119385, 0.0014955578371882439, 0.0022585447877645493, 0.0030215317383408546, 0.00378451868891716, 0.004547505639493465, 0.005310492590069771, 0.006073479540646076, 0.006836466491222382, 0.007599453441798687, 0.008362440392374992, 0.009125427342951298, 0.009888414293527603, 0.010651401244103909, 0.011414388194680214, 0.01217737514525652, 0.012940362095832825, 0.01370334904640913, 0.014466335996985435, 0.015229322947561741, 0.015992309898138046, 0.016755297780036926, 0.017518283799290657, 0.018281269818544388, 0.019044257700443268, 0.019807245582342148, 0.02057023160159588, 0.02133321762084961, 0.02209620550274849, 0.02285919338464737, 0.0236221794039011, 0.02438516542315483, 0.02514815330505371]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 4.0, 10.0, 7.0, 7.0, 6.0, 7.0, 7.0, 8.0, 19.0, 12.0, 13.0, 12.0, 17.0, 23.0, 30.0, 28.0, 36.0, 37.0, 37.0, 49.0, 31.0, 49.0, 37.0, 43.0, 40.0, 43.0, 37.0, 31.0, 37.0, 28.0, 31.0, 22.0, 34.0, 28.0, 18.0, 10.0, 17.0, 18.0, 13.0, 10.0, 12.0, 13.0, 10.0, 7.0, 3.0, 3.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.84375, -7.58544921875, -7.3271484375, -7.06884765625, -6.810546875, -6.55224609375, -6.2939453125, -6.03564453125, -5.77734375, -5.51904296875, -5.2607421875, -5.00244140625, -4.744140625, -4.48583984375, -4.2275390625, -3.96923828125, -3.7109375, -3.45263671875, -3.1943359375, -2.93603515625, -2.677734375, -2.41943359375, -2.1611328125, -1.90283203125, -1.64453125, -1.38623046875, -1.1279296875, -0.86962890625, -0.611328125, -0.35302734375, -0.0947265625, 0.16357421875, 0.421875, 0.68017578125, 0.9384765625, 1.19677734375, 1.455078125, 1.71337890625, 1.9716796875, 2.22998046875, 2.48828125, 2.74658203125, 3.0048828125, 3.26318359375, 3.521484375, 3.77978515625, 4.0380859375, 4.29638671875, 4.5546875, 4.81298828125, 5.0712890625, 5.32958984375, 5.587890625, 5.84619140625, 6.1044921875, 6.36279296875, 6.62109375, 6.87939453125, 7.1376953125, 7.39599609375, 7.654296875, 7.91259765625, 8.1708984375, 8.42919921875, 8.6875]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 4.0, 7.0, 3.0, 7.0, 9.0, 13.0, 19.0, 27.0, 27.0, 35.0, 37.0, 56.0, 72.0, 110.0, 145.0, 190.0, 252.0, 364.0, 483.0, 613.0, 866.0, 1162.0, 1851.0, 2975.0, 5495.0, 13590.0, 44036.0, 178886.0, 524879.0, 195624.0, 47099.0, 14398.0, 5887.0, 2970.0, 1773.0, 1202.0, 867.0, 634.0, 516.0, 320.0, 265.0, 190.0, 155.0, 110.0, 91.0, 65.0, 45.0, 47.0, 29.0, 18.0, 9.0, 12.0, 9.0, 7.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-13.359375, -12.9217529296875, -12.484130859375, -12.0465087890625, -11.60888671875, -11.1712646484375, -10.733642578125, -10.2960205078125, -9.8583984375, -9.4207763671875, -8.983154296875, -8.5455322265625, -8.10791015625, -7.6702880859375, -7.232666015625, -6.7950439453125, -6.357421875, -5.9197998046875, -5.482177734375, -5.0445556640625, -4.60693359375, -4.1693115234375, -3.731689453125, -3.2940673828125, -2.8564453125, -2.4188232421875, -1.981201171875, -1.5435791015625, -1.10595703125, -0.6683349609375, -0.230712890625, 0.2069091796875, 0.64453125, 1.0821533203125, 1.519775390625, 1.9573974609375, 2.39501953125, 2.8326416015625, 3.270263671875, 3.7078857421875, 4.1455078125, 4.5831298828125, 5.020751953125, 5.4583740234375, 5.89599609375, 6.3336181640625, 6.771240234375, 7.2088623046875, 7.646484375, 8.0841064453125, 8.521728515625, 8.9593505859375, 9.39697265625, 9.8345947265625, 10.272216796875, 10.7098388671875, 11.1474609375, 11.5850830078125, 12.022705078125, 12.4603271484375, 12.89794921875, 13.3355712890625, 13.773193359375, 14.2108154296875, 14.6484375]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 4.0, 4.0, 4.0, 7.0, 11.0, 7.0, 13.0, 15.0, 25.0, 23.0, 30.0, 43.0, 47.0, 42.0, 52.0, 39.0, 81.0, 204.0, 1532.0, 339.0, 126.0, 69.0, 52.0, 51.0, 49.0, 35.0, 29.0, 29.0, 14.0, 16.0, 20.0, 9.0, 8.0, 3.0, 5.0, 3.0, 2.0, 2.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-26.421875, -25.66162109375, -24.9013671875, -24.14111328125, -23.380859375, -22.62060546875, -21.8603515625, -21.10009765625, -20.33984375, -19.57958984375, -18.8193359375, -18.05908203125, -17.298828125, -16.53857421875, -15.7783203125, -15.01806640625, -14.2578125, -13.49755859375, -12.7373046875, -11.97705078125, -11.216796875, -10.45654296875, -9.6962890625, -8.93603515625, -8.17578125, -7.41552734375, -6.6552734375, -5.89501953125, -5.134765625, -4.37451171875, -3.6142578125, -2.85400390625, -2.09375, -1.33349609375, -0.5732421875, 0.18701171875, 0.947265625, 1.70751953125, 2.4677734375, 3.22802734375, 3.98828125, 4.74853515625, 5.5087890625, 6.26904296875, 7.029296875, 7.78955078125, 8.5498046875, 9.31005859375, 10.0703125, 10.83056640625, 11.5908203125, 12.35107421875, 13.111328125, 13.87158203125, 14.6318359375, 15.39208984375, 16.15234375, 16.91259765625, 17.6728515625, 18.43310546875, 19.193359375, 19.95361328125, 20.7138671875, 21.47412109375, 22.234375]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 3.0, 6.0, 4.0, 12.0, 11.0, 17.0, 24.0, 39.0, 50.0, 78.0, 143.0, 365.0, 1107.0, 32127.0, 3108021.0, 2555.0, 591.0, 207.0, 114.0, 69.0, 37.0, 36.0, 24.0, 20.0, 9.0, 13.0, 5.0, 8.0, 2.0, 2.0, 1.0, 7.0, 4.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.875, -73.25390625, -69.6328125, -66.01171875, -62.390625, -58.76953125, -55.1484375, -51.52734375, -47.90625, -44.28515625, -40.6640625, -37.04296875, -33.421875, -29.80078125, -26.1796875, -22.55859375, -18.9375, -15.31640625, -11.6953125, -8.07421875, -4.453125, -0.83203125, 2.7890625, 6.41015625, 10.03125, 13.65234375, 17.2734375, 20.89453125, 24.515625, 28.13671875, 31.7578125, 35.37890625, 39.0, 42.62109375, 46.2421875, 49.86328125, 53.484375, 57.10546875, 60.7265625, 64.34765625, 67.96875, 71.58984375, 75.2109375, 78.83203125, 82.453125, 86.07421875, 89.6953125, 93.31640625, 96.9375, 100.55859375, 104.1796875, 107.80078125, 111.421875, 115.04296875, 118.6640625, 122.28515625, 125.90625, 129.52734375, 133.1484375, 136.76953125, 140.390625, 144.01171875, 147.6328125, 151.25390625, 154.875]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 11.0, 53.0, 297.0, 463.0, 170.0, 21.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-152.4927215576172, -147.7690887451172, -143.04547119140625, -138.32183837890625, -133.59820556640625, -128.87457275390625, -124.15095520019531, -119.42732238769531, -114.70369720458984, -109.98007202148438, -105.25643920898438, -100.5328140258789, -95.80918884277344, -91.08555603027344, -86.36193084716797, -81.6383056640625, -76.9146728515625, -72.19104766845703, -67.46741485595703, -62.74378967285156, -58.02016067504883, -53.296531677246094, -48.572906494140625, -43.84927749633789, -39.125648498535156, -34.40201950073242, -29.67839241027832, -24.95476531982422, -20.231136322021484, -15.50750732421875, -10.783880233764648, -6.060253143310547, -1.336639404296875, 3.386988639831543, 8.110616683959961, 12.834244728088379, 17.557872772216797, 22.28150177001953, 27.005128860473633, 31.728755950927734, 36.45238494873047, 41.1760139465332, 45.89964294433594, 50.623268127441406, 55.34689712524414, 60.070526123046875, 64.79415130615234, 69.51777648925781, 74.24140930175781, 78.96503448486328, 83.68866729736328, 88.41229248046875, 93.13592529296875, 97.85955047607422, 102.58317565917969, 107.30680847167969, 112.03043365478516, 116.75405883789062, 121.47769165039062, 126.2013168334961, 130.92494201660156, 135.64857482910156, 140.37220764160156, 145.0958251953125, 149.8194580078125]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 4.0, 10.0, 5.0, 7.0, 14.0, 13.0, 23.0, 15.0, 21.0, 18.0, 35.0, 41.0, 37.0, 36.0, 42.0, 44.0, 33.0, 51.0, 48.0, 47.0, 47.0, 41.0, 40.0, 34.0, 35.0, 29.0, 31.0, 33.0, 32.0, 20.0, 23.0, 26.0, 12.0, 10.0, 15.0, 9.0, 5.0, 7.0, 5.0, 2.0, 1.0, 0.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-63.8980712890625, -62.054901123046875, -60.211727142333984, -58.36855697631836, -56.52538299560547, -54.682212829589844, -52.83904266357422, -50.99586868286133, -49.15269470214844, -47.30952453613281, -45.46635055541992, -43.6231803894043, -41.780006408691406, -39.93683624267578, -38.093666076660156, -36.250492095947266, -34.40732192993164, -32.564151763916016, -30.720977783203125, -28.8778076171875, -27.03463363647461, -25.191463470458984, -23.348291397094727, -21.50511932373047, -19.66194725036621, -17.818775177001953, -15.975603103637695, -14.132431983947754, -12.289259910583496, -10.446087837219238, -8.602916717529297, -6.759744644165039, -4.916576385498047, -3.073404550552368, -1.2302327156066895, 0.6129388809204102, 2.456110954284668, 4.299283027648926, 6.142454147338867, 7.985626220703125, 9.828798294067383, 11.67197036743164, 13.515142440795898, 15.35831356048584, 17.20148468017578, 19.044658660888672, 20.887828826904297, 22.731000900268555, 24.574172973632812, 26.41734504699707, 28.260517120361328, 30.103687286376953, 31.946861267089844, 33.79003143310547, 35.633201599121094, 37.476375579833984, 39.319549560546875, 41.1627197265625, 43.00589370727539, 44.849063873291016, 46.692237854003906, 48.53540802001953, 50.378578186035156, 52.22175216674805, 54.06492233276367]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 1.0, 4.0, 6.0, 9.0, 9.0, 4.0, 5.0, 5.0, 5.0, 11.0, 14.0, 12.0, 26.0, 25.0, 21.0, 34.0, 35.0, 24.0, 48.0, 36.0, 41.0, 44.0, 36.0, 39.0, 52.0, 38.0, 42.0, 40.0, 32.0, 34.0, 35.0, 21.0, 31.0, 29.0, 30.0, 20.0, 17.0, 26.0, 10.0, 11.0, 6.0, 9.0, 6.0, 6.0, 4.0, 3.0, 2.0, 5.0, 1.0, 2.0, 2.0, 2.0, 2.0], "bins": [-9.59375, -9.32025146484375, -9.0467529296875, -8.77325439453125, -8.499755859375, -8.22625732421875, -7.9527587890625, -7.67926025390625, -7.40576171875, -7.13226318359375, -6.8587646484375, -6.58526611328125, -6.311767578125, -6.03826904296875, -5.7647705078125, -5.49127197265625, -5.2177734375, -4.94427490234375, -4.6707763671875, -4.39727783203125, -4.123779296875, -3.85028076171875, -3.5767822265625, -3.30328369140625, -3.02978515625, -2.75628662109375, -2.4827880859375, -2.20928955078125, -1.935791015625, -1.66229248046875, -1.3887939453125, -1.11529541015625, -0.841796875, -0.56829833984375, -0.2947998046875, -0.02130126953125, 0.252197265625, 0.52569580078125, 0.7991943359375, 1.07269287109375, 1.34619140625, 1.61968994140625, 1.8931884765625, 2.16668701171875, 2.440185546875, 2.71368408203125, 2.9871826171875, 3.26068115234375, 3.5341796875, 3.80767822265625, 4.0811767578125, 4.35467529296875, 4.628173828125, 4.90167236328125, 5.1751708984375, 5.44866943359375, 5.72216796875, 5.99566650390625, 6.2691650390625, 6.54266357421875, 6.816162109375, 7.08966064453125, 7.3631591796875, 7.63665771484375, 7.91015625]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 1.0, 7.0, 6.0, 4.0, 21.0, 23.0, 24.0, 28.0, 63.0, 47.0, 122.0, 149.0, 227.0, 311.0, 539.0, 885.0, 1641.0, 3434.0, 8617.0, 33162.0, 369875.0, 2881233.0, 812165.0, 60564.0, 11930.0, 4371.0, 2018.0, 1064.0, 613.0, 338.0, 270.0, 152.0, 118.0, 70.0, 57.0, 33.0, 33.0, 28.0, 10.0, 9.0, 8.0, 6.0, 5.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-24.046875, -23.310302734375, -22.57373046875, -21.837158203125, -21.1005859375, -20.364013671875, -19.62744140625, -18.890869140625, -18.154296875, -17.417724609375, -16.68115234375, -15.944580078125, -15.2080078125, -14.471435546875, -13.73486328125, -12.998291015625, -12.26171875, -11.525146484375, -10.78857421875, -10.052001953125, -9.3154296875, -8.578857421875, -7.84228515625, -7.105712890625, -6.369140625, -5.632568359375, -4.89599609375, -4.159423828125, -3.4228515625, -2.686279296875, -1.94970703125, -1.213134765625, -0.4765625, 0.260009765625, 0.99658203125, 1.733154296875, 2.4697265625, 3.206298828125, 3.94287109375, 4.679443359375, 5.416015625, 6.152587890625, 6.88916015625, 7.625732421875, 8.3623046875, 9.098876953125, 9.83544921875, 10.572021484375, 11.30859375, 12.045166015625, 12.78173828125, 13.518310546875, 14.2548828125, 14.991455078125, 15.72802734375, 16.464599609375, 17.201171875, 17.937744140625, 18.67431640625, 19.410888671875, 20.1474609375, 20.884033203125, 21.62060546875, 22.357177734375, 23.09375]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 5.0, 8.0, 8.0, 2.0, 7.0, 18.0, 22.0, 32.0, 38.0, 65.0, 88.0, 136.0, 222.0, 398.0, 585.0, 784.0, 598.0, 372.0, 226.0, 144.0, 118.0, 64.0, 50.0, 33.0, 21.0, 12.0, 9.0, 8.0, 4.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.609375, -23.934814453125, -23.26025390625, -22.585693359375, -21.9111328125, -21.236572265625, -20.56201171875, -19.887451171875, -19.212890625, -18.538330078125, -17.86376953125, -17.189208984375, -16.5146484375, -15.840087890625, -15.16552734375, -14.490966796875, -13.81640625, -13.141845703125, -12.46728515625, -11.792724609375, -11.1181640625, -10.443603515625, -9.76904296875, -9.094482421875, -8.419921875, -7.745361328125, -7.07080078125, -6.396240234375, -5.7216796875, -5.047119140625, -4.37255859375, -3.697998046875, -3.0234375, -2.348876953125, -1.67431640625, -0.999755859375, -0.3251953125, 0.349365234375, 1.02392578125, 1.698486328125, 2.373046875, 3.047607421875, 3.72216796875, 4.396728515625, 5.0712890625, 5.745849609375, 6.42041015625, 7.094970703125, 7.76953125, 8.444091796875, 9.11865234375, 9.793212890625, 10.4677734375, 11.142333984375, 11.81689453125, 12.491455078125, 13.166015625, 13.840576171875, 14.51513671875, 15.189697265625, 15.8642578125, 16.538818359375, 17.21337890625, 17.887939453125, 18.5625]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 2.0, 8.0, 5.0, 14.0, 23.0, 26.0, 44.0, 70.0, 128.0, 231.0, 409.0, 871.0, 2167.0, 5995.0, 23773.0, 212179.0, 3480890.0, 420453.0, 34416.0, 7911.0, 2554.0, 1010.0, 472.0, 233.0, 161.0, 91.0, 55.0, 28.0, 15.0, 16.0, 13.0, 8.0, 4.0, 0.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.609375, -28.536865234375, -27.46435546875, -26.391845703125, -25.3193359375, -24.246826171875, -23.17431640625, -22.101806640625, -21.029296875, -19.956787109375, -18.88427734375, -17.811767578125, -16.7392578125, -15.666748046875, -14.59423828125, -13.521728515625, -12.44921875, -11.376708984375, -10.30419921875, -9.231689453125, -8.1591796875, -7.086669921875, -6.01416015625, -4.941650390625, -3.869140625, -2.796630859375, -1.72412109375, -0.651611328125, 0.4208984375, 1.493408203125, 2.56591796875, 3.638427734375, 4.7109375, 5.783447265625, 6.85595703125, 7.928466796875, 9.0009765625, 10.073486328125, 11.14599609375, 12.218505859375, 13.291015625, 14.363525390625, 15.43603515625, 16.508544921875, 17.5810546875, 18.653564453125, 19.72607421875, 20.798583984375, 21.87109375, 22.943603515625, 24.01611328125, 25.088623046875, 26.1611328125, 27.233642578125, 28.30615234375, 29.378662109375, 30.451171875, 31.523681640625, 32.59619140625, 33.668701171875, 34.7412109375, 35.813720703125, 36.88623046875, 37.958740234375, 39.03125]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 6.0, 25.0, 46.0, 106.0, 224.0, 286.0, 205.0, 76.0, 22.0, 11.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-139.05123901367188, -134.13015747070312, -129.2090606689453, -124.28797149658203, -119.36688232421875, -114.44580078125, -109.52471160888672, -104.60362243652344, -99.68253326416016, -94.76144409179688, -89.8403549194336, -84.91926574707031, -79.99818420410156, -75.07708740234375, -70.156005859375, -65.23491668701172, -60.31382751464844, -55.392738342285156, -50.471649169921875, -45.55056381225586, -40.62947463989258, -35.7083854675293, -30.78729820251465, -25.8662109375, -20.94512176513672, -16.024032592773438, -11.102945327758789, -6.181857109069824, -1.2607688903808594, 3.660320281982422, 8.58140754699707, 13.502494812011719, 18.423599243164062, 23.344688415527344, 28.265775680541992, 33.18686294555664, 38.10795211791992, 43.0290412902832, 47.95012664794922, 52.8712158203125, 57.79230499267578, 62.71339416503906, 67.63448333740234, 72.55557250976562, 77.47665405273438, 82.39775085449219, 87.31883239746094, 92.23992156982422, 97.1610107421875, 102.08209991455078, 107.00318908691406, 111.92427825927734, 116.84536743164062, 121.76644897460938, 126.68753814697266, 131.60862731933594, 136.52972412109375, 141.4508056640625, 146.3719024658203, 151.29298400878906, 156.21408081054688, 161.13516235351562, 166.05625915527344, 170.9773406982422, 175.89842224121094]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 6.0, 1.0, 3.0, 4.0, 5.0, 4.0, 4.0, 8.0, 7.0, 11.0, 14.0, 11.0, 20.0, 29.0, 20.0, 22.0, 29.0, 22.0, 38.0, 34.0, 38.0, 44.0, 46.0, 27.0, 47.0, 57.0, 42.0, 41.0, 43.0, 31.0, 35.0, 30.0, 30.0, 38.0, 32.0, 22.0, 30.0, 15.0, 14.0, 8.0, 8.0, 9.0, 4.0, 5.0, 11.0, 2.0, 8.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-51.902488708496094, -50.216556549072266, -48.53062438964844, -46.844688415527344, -45.158756256103516, -43.47282409667969, -41.786888122558594, -40.100955963134766, -38.41502380371094, -36.72909164428711, -35.04315948486328, -33.35722351074219, -31.67129135131836, -29.98535919189453, -28.29942512512207, -26.61349105834961, -24.92755889892578, -23.241626739501953, -21.555692672729492, -19.86975860595703, -18.183826446533203, -16.497894287109375, -14.811960220336914, -13.12602710723877, -11.440093994140625, -9.75416088104248, -8.068227767944336, -6.382294654846191, -4.696361541748047, -3.0104284286499023, -1.3244953155517578, 0.3614377975463867, 2.0473709106445312, 3.733304023742676, 5.41923713684082, 7.105170249938965, 8.79110336303711, 10.477036476135254, 12.162969589233398, 13.848902702331543, 15.534835815429688, 17.220767974853516, 18.906702041625977, 20.592636108398438, 22.278568267822266, 23.964500427246094, 25.650434494018555, 27.336368560791016, 29.022300720214844, 30.708232879638672, 32.3941650390625, 34.080101013183594, 35.76603317260742, 37.45196533203125, 39.137901306152344, 40.82383346557617, 42.509765625, 44.19569778442383, 45.881629943847656, 47.56756591796875, 49.25349807739258, 50.939430236816406, 52.6253662109375, 54.31129837036133, 55.997230529785156]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 7.0, 3.0, 3.0, 3.0, 8.0, 9.0, 9.0, 16.0, 6.0, 20.0, 14.0, 12.0, 20.0, 24.0, 34.0, 30.0, 36.0, 33.0, 36.0, 36.0, 36.0, 43.0, 50.0, 40.0, 48.0, 43.0, 31.0, 28.0, 44.0, 27.0, 29.0, 26.0, 31.0, 19.0, 19.0, 27.0, 19.0, 12.0, 15.0, 14.0, 7.0, 11.0, 4.0, 2.0, 4.0, 4.0, 4.0, 6.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-7.83203125, -7.6029052734375, -7.373779296875, -7.1446533203125, -6.91552734375, -6.6864013671875, -6.457275390625, -6.2281494140625, -5.9990234375, -5.7698974609375, -5.540771484375, -5.3116455078125, -5.08251953125, -4.8533935546875, -4.624267578125, -4.3951416015625, -4.166015625, -3.9368896484375, -3.707763671875, -3.4786376953125, -3.24951171875, -3.0203857421875, -2.791259765625, -2.5621337890625, -2.3330078125, -2.1038818359375, -1.874755859375, -1.6456298828125, -1.41650390625, -1.1873779296875, -0.958251953125, -0.7291259765625, -0.5, -0.2708740234375, -0.041748046875, 0.1873779296875, 0.41650390625, 0.6456298828125, 0.874755859375, 1.1038818359375, 1.3330078125, 1.5621337890625, 1.791259765625, 2.0203857421875, 2.24951171875, 2.4786376953125, 2.707763671875, 2.9368896484375, 3.166015625, 3.3951416015625, 3.624267578125, 3.8533935546875, 4.08251953125, 4.3116455078125, 4.540771484375, 4.7698974609375, 4.9990234375, 5.2281494140625, 5.457275390625, 5.6864013671875, 5.91552734375, 6.1446533203125, 6.373779296875, 6.6029052734375, 6.83203125]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 8.0, 6.0, 8.0, 16.0, 19.0, 31.0, 48.0, 71.0, 127.0, 149.0, 223.0, 362.0, 501.0, 739.0, 1062.0, 1669.0, 2408.0, 3340.0, 4972.0, 7164.0, 10550.0, 15550.0, 23211.0, 35116.0, 53681.0, 83694.0, 133664.0, 185920.0, 168059.0, 110537.0, 69967.0, 44921.0, 29312.0, 19712.0, 13193.0, 9068.0, 6117.0, 4168.0, 2852.0, 2021.0, 1401.0, 913.0, 650.0, 433.0, 306.0, 184.0, 142.0, 96.0, 75.0, 43.0, 27.0, 20.0, 13.0, 10.0, 8.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0], "bins": [-0.7412109375, -0.7171401977539062, -0.6930694580078125, -0.6689987182617188, -0.644927978515625, -0.6208572387695312, -0.5967864990234375, -0.5727157592773438, -0.54864501953125, -0.5245742797851562, -0.5005035400390625, -0.47643280029296875, -0.452362060546875, -0.42829132080078125, -0.4042205810546875, -0.38014984130859375, -0.3560791015625, -0.33200836181640625, -0.3079376220703125, -0.28386688232421875, -0.259796142578125, -0.23572540283203125, -0.2116546630859375, -0.18758392333984375, -0.16351318359375, -0.13944244384765625, -0.1153717041015625, -0.09130096435546875, -0.067230224609375, -0.04315948486328125, -0.0190887451171875, 0.00498199462890625, 0.029052734375, 0.05312347412109375, 0.0771942138671875, 0.10126495361328125, 0.125335693359375, 0.14940643310546875, 0.1734771728515625, 0.19754791259765625, 0.22161865234375, 0.24568939208984375, 0.2697601318359375, 0.29383087158203125, 0.317901611328125, 0.34197235107421875, 0.3660430908203125, 0.39011383056640625, 0.4141845703125, 0.43825531005859375, 0.4623260498046875, 0.48639678955078125, 0.510467529296875, 0.5345382690429688, 0.5586090087890625, 0.5826797485351562, 0.60675048828125, 0.6308212280273438, 0.6548919677734375, 0.6789627075195312, 0.703033447265625, 0.7271041870117188, 0.7511749267578125, 0.7752456665039062, 0.79931640625]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 7.0, 5.0, 7.0, 5.0, 7.0, 7.0, 10.0, 8.0, 14.0, 19.0, 20.0, 19.0, 26.0, 39.0, 27.0, 31.0, 33.0, 33.0, 40.0, 30.0, 46.0, 40.0, 1061.0, 47.0, 41.0, 34.0, 31.0, 36.0, 32.0, 32.0, 36.0, 36.0, 26.0, 22.0, 19.0, 14.0, 20.0, 10.0, 10.0, 14.0, 10.0, 9.0, 2.0, 5.0, 6.0, 5.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.00390625, -4.85333251953125, -4.7027587890625, -4.55218505859375, -4.401611328125, -4.25103759765625, -4.1004638671875, -3.94989013671875, -3.79931640625, -3.64874267578125, -3.4981689453125, -3.34759521484375, -3.197021484375, -3.04644775390625, -2.8958740234375, -2.74530029296875, -2.5947265625, -2.44415283203125, -2.2935791015625, -2.14300537109375, -1.992431640625, -1.84185791015625, -1.6912841796875, -1.54071044921875, -1.39013671875, -1.23956298828125, -1.0889892578125, -0.93841552734375, -0.787841796875, -0.63726806640625, -0.4866943359375, -0.33612060546875, -0.185546875, -0.03497314453125, 0.1156005859375, 0.26617431640625, 0.416748046875, 0.56732177734375, 0.7178955078125, 0.86846923828125, 1.01904296875, 1.16961669921875, 1.3201904296875, 1.47076416015625, 1.621337890625, 1.77191162109375, 1.9224853515625, 2.07305908203125, 2.2236328125, 2.37420654296875, 2.5247802734375, 2.67535400390625, 2.825927734375, 2.97650146484375, 3.1270751953125, 3.27764892578125, 3.42822265625, 3.57879638671875, 3.7293701171875, 3.87994384765625, 4.030517578125, 4.18109130859375, 4.3316650390625, 4.48223876953125, 4.6328125]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 7.0, 8.0, 9.0, 21.0, 28.0, 39.0, 66.0, 94.0, 149.0, 229.0, 342.0, 532.0, 780.0, 1129.0, 1533.0, 2227.0, 3190.0, 4656.0, 6548.0, 9252.0, 13262.0, 19194.0, 28491.0, 41829.0, 64505.0, 98093.0, 143036.0, 1211729.0, 144790.0, 99639.0, 65578.0, 43056.0, 28802.0, 19666.0, 13378.0, 9360.0, 6648.0, 4654.0, 3235.0, 2245.0, 1633.0, 1068.0, 721.0, 568.0, 376.0, 254.0, 165.0, 112.0, 67.0, 51.0, 32.0, 25.0, 14.0, 15.0, 8.0, 3.0], "bins": [-0.58056640625, -0.5642204284667969, -0.5478744506835938, -0.5315284729003906, -0.5151824951171875, -0.4988365173339844, -0.48249053955078125, -0.4661445617675781, -0.449798583984375, -0.4334526062011719, -0.41710662841796875, -0.4007606506347656, -0.3844146728515625, -0.3680686950683594, -0.35172271728515625, -0.3353767395019531, -0.31903076171875, -0.3026847839355469, -0.28633880615234375, -0.2699928283691406, -0.2536468505859375, -0.23730087280273438, -0.22095489501953125, -0.20460891723632812, -0.188262939453125, -0.17191696166992188, -0.15557098388671875, -0.13922500610351562, -0.1228790283203125, -0.10653305053710938, -0.09018707275390625, -0.07384109497070312, -0.0574951171875, -0.041149139404296875, -0.02480316162109375, -0.008457183837890625, 0.0078887939453125, 0.024234771728515625, 0.04058074951171875, 0.056926727294921875, 0.073272705078125, 0.08961868286132812, 0.10596466064453125, 0.12231063842773438, 0.1386566162109375, 0.15500259399414062, 0.17134857177734375, 0.18769454956054688, 0.20404052734375, 0.22038650512695312, 0.23673248291015625, 0.2530784606933594, 0.2694244384765625, 0.2857704162597656, 0.30211639404296875, 0.3184623718261719, 0.334808349609375, 0.3511543273925781, 0.36750030517578125, 0.3838462829589844, 0.4001922607421875, 0.4165382385253906, 0.43288421630859375, 0.4492301940917969, 0.465576171875]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 0.0, 2.0, 6.0, 4.0, 4.0, 5.0, 8.0, 6.0, 14.0, 15.0, 12.0, 26.0, 22.0, 26.0, 29.0, 35.0, 57.0, 78.0, 92.0, 111.0, 78.0, 77.0, 61.0, 52.0, 28.0, 18.0, 21.0, 13.0, 12.0, 14.0, 11.0, 12.0, 9.0, 14.0, 11.0, 5.0, 5.0, 4.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0236053466796875, -0.022921323776245117, -0.022237300872802734, -0.02155327796936035, -0.02086925506591797, -0.020185232162475586, -0.019501209259033203, -0.01881718635559082, -0.018133163452148438, -0.017449140548706055, -0.016765117645263672, -0.01608109474182129, -0.015397071838378906, -0.014713048934936523, -0.01402902603149414, -0.013345003128051758, -0.012660980224609375, -0.011976957321166992, -0.01129293441772461, -0.010608911514282227, -0.009924888610839844, -0.009240865707397461, -0.008556842803955078, -0.007872819900512695, -0.0071887969970703125, -0.00650477409362793, -0.005820751190185547, -0.005136728286743164, -0.004452705383300781, -0.0037686824798583984, -0.0030846595764160156, -0.002400636672973633, -0.00171661376953125, -0.0010325908660888672, -0.0003485679626464844, 0.00033545494079589844, 0.0010194778442382812, 0.001703500747680664, 0.002387523651123047, 0.0030715465545654297, 0.0037555694580078125, 0.004439592361450195, 0.005123615264892578, 0.005807638168334961, 0.006491661071777344, 0.0071756839752197266, 0.00785970687866211, 0.008543729782104492, 0.009227752685546875, 0.009911775588989258, 0.01059579849243164, 0.011279821395874023, 0.011963844299316406, 0.012647867202758789, 0.013331890106201172, 0.014015913009643555, 0.014699935913085938, 0.01538395881652832, 0.016067981719970703, 0.016752004623413086, 0.01743602752685547, 0.01812005043029785, 0.018804073333740234, 0.019488096237182617, 0.020172119140625]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 2.0, 2.0, 8.0, 11.0, 8.0, 17.0, 21.0, 26.0, 28.0, 27.0, 31.0, 37.0, 48.0, 65.0, 103.0, 157.0, 242.0, 384.0, 1223.0, 30799.0, 990903.0, 22285.0, 1015.0, 366.0, 202.0, 137.0, 99.0, 58.0, 55.0, 37.0, 40.0, 34.0, 14.0, 14.0, 13.0, 7.0, 7.0, 7.0, 6.0, 3.0, 2.0, 3.0, 5.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.359619140625, -0.347412109375, -0.335205078125, -0.322998046875, -0.310791015625, -0.298583984375, -0.286376953125, -0.274169921875, -0.261962890625, -0.249755859375, -0.237548828125, -0.225341796875, -0.213134765625, -0.200927734375, -0.188720703125, -0.176513671875, -0.164306640625, -0.152099609375, -0.139892578125, -0.127685546875, -0.115478515625, -0.103271484375, -0.091064453125, -0.078857421875, -0.066650390625, -0.054443359375, -0.042236328125, -0.030029296875, -0.017822265625, -0.005615234375, 0.006591796875, 0.018798828125, 0.031005859375, 0.043212890625, 0.055419921875, 0.067626953125, 0.079833984375, 0.092041015625, 0.104248046875, 0.116455078125, 0.128662109375, 0.140869140625, 0.153076171875, 0.165283203125, 0.177490234375, 0.189697265625, 0.201904296875, 0.214111328125, 0.226318359375, 0.238525390625, 0.250732421875, 0.262939453125, 0.275146484375, 0.287353515625, 0.299560546875, 0.311767578125, 0.323974609375, 0.336181640625, 0.348388671875, 0.360595703125, 0.372802734375, 0.385009765625, 0.397216796875, 0.409423828125, 0.421630859375]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 52.0, 406.0, 491.0, 49.0, 8.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1614478975534439, -0.15295201539993286, -0.14445611834526062, -0.13596022129058838, -0.12746433913707733, -0.11896844953298569, -0.11047255992889404, -0.1019766703248024, -0.09348078072071075, -0.08498489111661911, -0.07648900151252747, -0.06799311190843582, -0.05949722230434418, -0.05100133270025253, -0.04250544309616089, -0.034009553492069244, -0.0255136638879776, -0.017017774283885956, -0.008521884679794312, -2.5995075702667236e-05, 0.008469894528388977, 0.01696578413248062, 0.025461673736572266, 0.03395756334066391, 0.042453452944755554, 0.0509493425488472, 0.05944523215293884, 0.06794112175703049, 0.07643701136112213, 0.08493290096521378, 0.09342879056930542, 0.10192468017339706, 0.1104205846786499, 0.11891647428274155, 0.1274123638868332, 0.13590824604034424, 0.14440414309501648, 0.15290004014968872, 0.16139592230319977, 0.16989180445671082, 0.17838770151138306, 0.1868835985660553, 0.19537948071956635, 0.2038753628730774, 0.21237125992774963, 0.22086715698242188, 0.22936303913593292, 0.23785892128944397, 0.2463548183441162, 0.25485071539878845, 0.2633466124534607, 0.27184247970581055, 0.2803383767604828, 0.28883427381515503, 0.2973301410675049, 0.3058260381221771, 0.31432193517684937, 0.3228178322315216, 0.33131372928619385, 0.3398095965385437, 0.34830549359321594, 0.3568013906478882, 0.36529725790023804, 0.3737931549549103, 0.3822890520095825]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 6.0, 7.0, 2.0, 10.0, 7.0, 15.0, 12.0, 25.0, 16.0, 31.0, 40.0, 34.0, 38.0, 38.0, 39.0, 39.0, 54.0, 39.0, 45.0, 46.0, 46.0, 37.0, 39.0, 41.0, 40.0, 38.0, 37.0, 25.0, 31.0, 29.0, 24.0, 13.0, 11.0, 14.0, 9.0, 8.0, 4.0, 9.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.033541202545166016, -0.032430168241262436, -0.031319133937358856, -0.030208095908164978, -0.0290970616042614, -0.02798602730035782, -0.02687499113380909, -0.02576395496726036, -0.02465292066335678, -0.0235418863594532, -0.022430850192904472, -0.021319814026355743, -0.020208779722452164, -0.019097745418548584, -0.017986709251999855, -0.016875673085451126, -0.015764638781547546, -0.014653603546321392, -0.013542568311095238, -0.012431533075869083, -0.011320497840642929, -0.010209462605416775, -0.00909842737019062, -0.007987392134964466, -0.006876356899738312, -0.0057653216645121574, -0.004654286429286003, -0.003543251194059849, -0.0024322159588336945, -0.0013211807236075401, -0.0002101454883813858, 0.0009008897468447685, 0.002011924982070923, 0.003122960217297077, 0.0042339954525232315, 0.005345030687749386, 0.00645606592297554, 0.0075671011582016945, 0.008678136393427849, 0.009789171628654003, 0.010900206863880157, 0.012011242099106312, 0.013122277334332466, 0.01423331256955862, 0.015344347804784775, 0.016455382108688354, 0.017566418275237083, 0.018677454441785812, 0.019788488745689392, 0.020899523049592972, 0.0220105592161417, 0.02312159538269043, 0.02423262968659401, 0.02534366399049759, 0.026454700157046318, 0.027565736323595047, 0.028676770627498627, 0.029787804931402206, 0.030898841097950935, 0.032009877264499664, 0.033120911568403244, 0.034231945872306824, 0.0353429839015007, 0.03645401820540428, 0.03756505250930786]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 8.0, 2.0, 3.0, 3.0, 9.0, 8.0, 10.0, 15.0, 6.0, 20.0, 14.0, 12.0, 20.0, 25.0, 33.0, 30.0, 37.0, 31.0, 38.0, 34.0, 38.0, 42.0, 51.0, 39.0, 48.0, 43.0, 31.0, 28.0, 44.0, 27.0, 29.0, 26.0, 31.0, 19.0, 19.0, 27.0, 19.0, 12.0, 15.0, 14.0, 7.0, 11.0, 4.0, 2.0, 4.0, 4.0, 4.0, 6.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-7.82421875, -7.59527587890625, -7.3663330078125, -7.13739013671875, -6.908447265625, -6.67950439453125, -6.4505615234375, -6.22161865234375, -5.99267578125, -5.76373291015625, -5.5347900390625, -5.30584716796875, -5.076904296875, -4.84796142578125, -4.6190185546875, -4.39007568359375, -4.1611328125, -3.93218994140625, -3.7032470703125, -3.47430419921875, -3.245361328125, -3.01641845703125, -2.7874755859375, -2.55853271484375, -2.32958984375, -2.10064697265625, -1.8717041015625, -1.64276123046875, -1.413818359375, -1.18487548828125, -0.9559326171875, -0.72698974609375, -0.498046875, -0.26910400390625, -0.0401611328125, 0.18878173828125, 0.417724609375, 0.64666748046875, 0.8756103515625, 1.10455322265625, 1.33349609375, 1.56243896484375, 1.7913818359375, 2.02032470703125, 2.249267578125, 2.47821044921875, 2.7071533203125, 2.93609619140625, 3.1650390625, 3.39398193359375, 3.6229248046875, 3.85186767578125, 4.080810546875, 4.30975341796875, 4.5386962890625, 4.76763916015625, 4.99658203125, 5.22552490234375, 5.4544677734375, 5.68341064453125, 5.912353515625, 6.14129638671875, 6.3702392578125, 6.59918212890625, 6.828125]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 3.0, 6.0, 5.0, 4.0, 7.0, 14.0, 11.0, 20.0, 25.0, 32.0, 48.0, 78.0, 79.0, 140.0, 149.0, 244.0, 304.0, 531.0, 718.0, 1069.0, 1612.0, 2825.0, 5664.0, 17493.0, 118607.0, 739214.0, 127519.0, 18348.0, 5813.0, 2919.0, 1655.0, 1043.0, 679.0, 488.0, 335.0, 233.0, 160.0, 116.0, 91.0, 63.0, 45.0, 41.0, 34.0, 23.0, 10.0, 10.0, 8.0, 9.0, 7.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-19.015625, -18.371337890625, -17.72705078125, -17.082763671875, -16.4384765625, -15.794189453125, -15.14990234375, -14.505615234375, -13.861328125, -13.217041015625, -12.57275390625, -11.928466796875, -11.2841796875, -10.639892578125, -9.99560546875, -9.351318359375, -8.70703125, -8.062744140625, -7.41845703125, -6.774169921875, -6.1298828125, -5.485595703125, -4.84130859375, -4.197021484375, -3.552734375, -2.908447265625, -2.26416015625, -1.619873046875, -0.9755859375, -0.331298828125, 0.31298828125, 0.957275390625, 1.6015625, 2.245849609375, 2.89013671875, 3.534423828125, 4.1787109375, 4.822998046875, 5.46728515625, 6.111572265625, 6.755859375, 7.400146484375, 8.04443359375, 8.688720703125, 9.3330078125, 9.977294921875, 10.62158203125, 11.265869140625, 11.91015625, 12.554443359375, 13.19873046875, 13.843017578125, 14.4873046875, 15.131591796875, 15.77587890625, 16.420166015625, 17.064453125, 17.708740234375, 18.35302734375, 18.997314453125, 19.6416015625, 20.285888671875, 20.93017578125, 21.574462890625, 22.21875]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 6.0, 1.0, 5.0, 4.0, 9.0, 1.0, 5.0, 6.0, 8.0, 11.0, 10.0, 15.0, 21.0, 20.0, 21.0, 23.0, 48.0, 48.0, 53.0, 64.0, 96.0, 156.0, 1488.0, 357.0, 145.0, 93.0, 54.0, 42.0, 39.0, 38.0, 31.0, 27.0, 22.0, 18.0, 22.0, 8.0, 10.0, 11.0, 7.0, 6.0, 1.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-23.671875, -22.973388671875, -22.27490234375, -21.576416015625, -20.8779296875, -20.179443359375, -19.48095703125, -18.782470703125, -18.083984375, -17.385498046875, -16.68701171875, -15.988525390625, -15.2900390625, -14.591552734375, -13.89306640625, -13.194580078125, -12.49609375, -11.797607421875, -11.09912109375, -10.400634765625, -9.7021484375, -9.003662109375, -8.30517578125, -7.606689453125, -6.908203125, -6.209716796875, -5.51123046875, -4.812744140625, -4.1142578125, -3.415771484375, -2.71728515625, -2.018798828125, -1.3203125, -0.621826171875, 0.07666015625, 0.775146484375, 1.4736328125, 2.172119140625, 2.87060546875, 3.569091796875, 4.267578125, 4.966064453125, 5.66455078125, 6.363037109375, 7.0615234375, 7.760009765625, 8.45849609375, 9.156982421875, 9.85546875, 10.553955078125, 11.25244140625, 11.950927734375, 12.6494140625, 13.347900390625, 14.04638671875, 14.744873046875, 15.443359375, 16.141845703125, 16.84033203125, 17.538818359375, 18.2373046875, 18.935791015625, 19.63427734375, 20.332763671875, 21.03125]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 6.0, 5.0, 12.0, 11.0, 16.0, 27.0, 26.0, 45.0, 61.0, 94.0, 149.0, 243.0, 525.0, 1277.0, 59353.0, 3079315.0, 2978.0, 667.0, 338.0, 185.0, 94.0, 80.0, 53.0, 32.0, 34.0, 22.0, 21.0, 13.0, 5.0, 6.0, 4.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.625, -82.0771484375, -79.529296875, -76.9814453125, -74.43359375, -71.8857421875, -69.337890625, -66.7900390625, -64.2421875, -61.6943359375, -59.146484375, -56.5986328125, -54.05078125, -51.5029296875, -48.955078125, -46.4072265625, -43.859375, -41.3115234375, -38.763671875, -36.2158203125, -33.66796875, -31.1201171875, -28.572265625, -26.0244140625, -23.4765625, -20.9287109375, -18.380859375, -15.8330078125, -13.28515625, -10.7373046875, -8.189453125, -5.6416015625, -3.09375, -0.5458984375, 2.001953125, 4.5498046875, 7.09765625, 9.6455078125, 12.193359375, 14.7412109375, 17.2890625, 19.8369140625, 22.384765625, 24.9326171875, 27.48046875, 30.0283203125, 32.576171875, 35.1240234375, 37.671875, 40.2197265625, 42.767578125, 45.3154296875, 47.86328125, 50.4111328125, 52.958984375, 55.5068359375, 58.0546875, 60.6025390625, 63.150390625, 65.6982421875, 68.24609375, 70.7939453125, 73.341796875, 75.8896484375, 78.4375]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 15.0, 47.0, 139.0, 346.0, 300.0, 124.0, 33.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.02149200439453, -51.31443786621094, -46.60737991333008, -41.90032196044922, -37.193267822265625, -32.48621368408203, -27.779155731201172, -23.072097778320312, -18.36504364013672, -13.657987594604492, -8.950931549072266, -4.243875503540039, 0.4631805419921875, 5.170236587524414, 9.87729263305664, 14.5843505859375, 19.291404724121094, 23.99846076965332, 28.705516815185547, 33.412574768066406, 38.11962890625, 42.826683044433594, 47.53374099731445, 52.24079895019531, 56.947853088378906, 61.6549072265625, 66.36196899414062, 71.06902313232422, 75.77607727050781, 80.4831314086914, 85.190185546875, 89.89724731445312, 94.60430908203125, 99.31136322021484, 104.01841735839844, 108.72547912597656, 113.43253326416016, 118.13958740234375, 122.84664916992188, 127.55370330810547, 132.26075744628906, 136.9678192138672, 141.67486572265625, 146.38192749023438, 151.0889892578125, 155.79603576660156, 160.5030975341797, 165.21014404296875, 169.91720581054688, 174.624267578125, 179.33131408691406, 184.0383758544922, 188.74542236328125, 193.45248413085938, 198.1595458984375, 202.86660766601562, 207.5736541748047, 212.2807159423828, 216.98776245117188, 221.69482421875, 226.40188598632812, 231.1089324951172, 235.8159942626953, 240.52304077148438, 245.2301025390625]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 4.0, 3.0, 4.0, 7.0, 7.0, 8.0, 13.0, 12.0, 10.0, 26.0, 21.0, 17.0, 17.0, 21.0, 31.0, 36.0, 32.0, 34.0, 35.0, 39.0, 45.0, 46.0, 44.0, 41.0, 45.0, 53.0, 36.0, 39.0, 31.0, 26.0, 32.0, 28.0, 25.0, 19.0, 15.0, 11.0, 17.0, 10.0, 15.0, 15.0, 8.0, 10.0, 6.0, 5.0, 4.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-57.607154846191406, -55.86639404296875, -54.12563705444336, -52.3848762512207, -50.64411926269531, -48.903358459472656, -47.16259765625, -45.421836853027344, -43.68107986450195, -41.9403190612793, -40.199562072753906, -38.45880126953125, -36.718040466308594, -34.9772834777832, -33.23652267456055, -31.495763778686523, -29.7550048828125, -28.014245986938477, -26.273487091064453, -24.532726287841797, -22.791967391967773, -21.05120849609375, -19.310447692871094, -17.56968879699707, -15.828929901123047, -14.088171005249023, -12.347411155700684, -10.606651306152344, -8.86589241027832, -7.125133514404297, -5.384373664855957, -3.643613815307617, -1.9028549194335938, -0.1620955467224121, 1.5786638259887695, 3.319423198699951, 5.060182571411133, 6.800941467285156, 8.541701316833496, 10.282461166381836, 12.02322006225586, 13.763978958129883, 15.504738807678223, 17.245498657226562, 18.986257553100586, 20.72701644897461, 22.467777252197266, 24.20853614807129, 25.949295043945312, 27.690053939819336, 29.43081283569336, 31.171573638916016, 32.912330627441406, 34.65309143066406, 36.39385223388672, 38.134613037109375, 39.875370025634766, 41.61613082885742, 43.35688781738281, 45.09764862060547, 46.838409423828125, 48.579166412353516, 50.31992721557617, 52.06068420410156, 53.80144500732422]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 7.0, 1.0, 3.0, 1.0, 1.0, 3.0, 4.0, 3.0, 2.0, 5.0, 7.0, 5.0, 6.0, 11.0, 9.0, 18.0, 19.0, 11.0, 17.0, 21.0, 24.0, 17.0, 31.0, 27.0, 37.0, 34.0, 37.0, 31.0, 29.0, 41.0, 45.0, 37.0, 44.0, 44.0, 32.0, 25.0, 38.0, 26.0, 26.0, 28.0, 21.0, 28.0, 22.0, 29.0, 17.0, 18.0, 12.0, 17.0, 14.0, 4.0, 9.0, 6.0, 7.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-7.2421875, -7.01568603515625, -6.7891845703125, -6.56268310546875, -6.336181640625, -6.10968017578125, -5.8831787109375, -5.65667724609375, -5.43017578125, -5.20367431640625, -4.9771728515625, -4.75067138671875, -4.524169921875, -4.29766845703125, -4.0711669921875, -3.84466552734375, -3.6181640625, -3.39166259765625, -3.1651611328125, -2.93865966796875, -2.712158203125, -2.48565673828125, -2.2591552734375, -2.03265380859375, -1.80615234375, -1.57965087890625, -1.3531494140625, -1.12664794921875, -0.900146484375, -0.67364501953125, -0.4471435546875, -0.22064208984375, 0.005859375, 0.23236083984375, 0.4588623046875, 0.68536376953125, 0.911865234375, 1.13836669921875, 1.3648681640625, 1.59136962890625, 1.81787109375, 2.04437255859375, 2.2708740234375, 2.49737548828125, 2.723876953125, 2.95037841796875, 3.1768798828125, 3.40338134765625, 3.6298828125, 3.85638427734375, 4.0828857421875, 4.30938720703125, 4.535888671875, 4.76239013671875, 4.9888916015625, 5.21539306640625, 5.44189453125, 5.66839599609375, 5.8948974609375, 6.12139892578125, 6.347900390625, 6.57440185546875, 6.8009033203125, 7.02740478515625, 7.25390625]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 2.0, 2.0, 4.0, 7.0, 4.0, 11.0, 12.0, 21.0, 32.0, 35.0, 46.0, 46.0, 61.0, 105.0, 115.0, 162.0, 186.0, 242.0, 309.0, 362.0, 467.0, 548.0, 906.0, 1613.0, 3145.0, 7535.0, 23057.0, 176975.0, 2478511.0, 1381085.0, 89566.0, 15997.0, 5729.0, 2587.0, 1455.0, 871.0, 525.0, 413.0, 347.0, 250.0, 212.0, 171.0, 132.0, 105.0, 78.0, 62.0, 41.0, 27.0, 29.0, 19.0, 18.0, 15.0, 11.0, 11.0, 5.0, 7.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-21.765625, -21.08251953125, -20.3994140625, -19.71630859375, -19.033203125, -18.35009765625, -17.6669921875, -16.98388671875, -16.30078125, -15.61767578125, -14.9345703125, -14.25146484375, -13.568359375, -12.88525390625, -12.2021484375, -11.51904296875, -10.8359375, -10.15283203125, -9.4697265625, -8.78662109375, -8.103515625, -7.42041015625, -6.7373046875, -6.05419921875, -5.37109375, -4.68798828125, -4.0048828125, -3.32177734375, -2.638671875, -1.95556640625, -1.2724609375, -0.58935546875, 0.09375, 0.77685546875, 1.4599609375, 2.14306640625, 2.826171875, 3.50927734375, 4.1923828125, 4.87548828125, 5.55859375, 6.24169921875, 6.9248046875, 7.60791015625, 8.291015625, 8.97412109375, 9.6572265625, 10.34033203125, 11.0234375, 11.70654296875, 12.3896484375, 13.07275390625, 13.755859375, 14.43896484375, 15.1220703125, 15.80517578125, 16.48828125, 17.17138671875, 17.8544921875, 18.53759765625, 19.220703125, 19.90380859375, 20.5869140625, 21.27001953125, 21.953125]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 7.0, 2.0, 7.0, 10.0, 9.0, 25.0, 25.0, 50.0, 63.0, 106.0, 157.0, 299.0, 460.0, 667.0, 770.0, 507.0, 325.0, 201.0, 110.0, 103.0, 53.0, 48.0, 26.0, 13.0, 11.0, 9.0, 5.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.2421875, -13.6754150390625, -13.108642578125, -12.5418701171875, -11.97509765625, -11.4083251953125, -10.841552734375, -10.2747802734375, -9.7080078125, -9.1412353515625, -8.574462890625, -8.0076904296875, -7.44091796875, -6.8741455078125, -6.307373046875, -5.7406005859375, -5.173828125, -4.6070556640625, -4.040283203125, -3.4735107421875, -2.90673828125, -2.3399658203125, -1.773193359375, -1.2064208984375, -0.6396484375, -0.0728759765625, 0.493896484375, 1.0606689453125, 1.62744140625, 2.1942138671875, 2.760986328125, 3.3277587890625, 3.89453125, 4.4613037109375, 5.028076171875, 5.5948486328125, 6.16162109375, 6.7283935546875, 7.295166015625, 7.8619384765625, 8.4287109375, 8.9954833984375, 9.562255859375, 10.1290283203125, 10.69580078125, 11.2625732421875, 11.829345703125, 12.3961181640625, 12.962890625, 13.5296630859375, 14.096435546875, 14.6632080078125, 15.22998046875, 15.7967529296875, 16.363525390625, 16.9302978515625, 17.4970703125, 18.0638427734375, 18.630615234375, 19.1973876953125, 19.76416015625, 20.3309326171875, 20.897705078125, 21.4644775390625, 22.03125]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 4.0, 5.0, 3.0, 6.0, 11.0, 12.0, 24.0, 23.0, 46.0, 83.0, 127.0, 240.0, 464.0, 1211.0, 3792.0, 23922.0, 1217139.0, 2904382.0, 35606.0, 4727.0, 1350.0, 522.0, 236.0, 125.0, 78.0, 49.0, 45.0, 17.0, 7.0, 10.0, 5.0, 5.0, 4.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-47.125, -45.85400390625, -44.5830078125, -43.31201171875, -42.041015625, -40.77001953125, -39.4990234375, -38.22802734375, -36.95703125, -35.68603515625, -34.4150390625, -33.14404296875, -31.873046875, -30.60205078125, -29.3310546875, -28.06005859375, -26.7890625, -25.51806640625, -24.2470703125, -22.97607421875, -21.705078125, -20.43408203125, -19.1630859375, -17.89208984375, -16.62109375, -15.35009765625, -14.0791015625, -12.80810546875, -11.537109375, -10.26611328125, -8.9951171875, -7.72412109375, -6.453125, -5.18212890625, -3.9111328125, -2.64013671875, -1.369140625, -0.09814453125, 1.1728515625, 2.44384765625, 3.71484375, 4.98583984375, 6.2568359375, 7.52783203125, 8.798828125, 10.06982421875, 11.3408203125, 12.61181640625, 13.8828125, 15.15380859375, 16.4248046875, 17.69580078125, 18.966796875, 20.23779296875, 21.5087890625, 22.77978515625, 24.05078125, 25.32177734375, 26.5927734375, 27.86376953125, 29.134765625, 30.40576171875, 31.6767578125, 32.94775390625, 34.21875]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 5.0, 27.0, 39.0, 107.0, 225.0, 273.0, 194.0, 82.0, 33.0, 17.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-210.18653869628906, -205.9167022705078, -201.64686584472656, -197.3770294189453, -193.10720825195312, -188.83737182617188, -184.56753540039062, -180.29769897460938, -176.02786254882812, -171.75802612304688, -167.48818969726562, -163.21835327148438, -158.94851684570312, -154.67869567871094, -150.4088592529297, -146.13902282714844, -141.8691864013672, -137.59934997558594, -133.3295135498047, -129.05967712402344, -124.78984832763672, -120.52001190185547, -116.25018310546875, -111.9803466796875, -107.71051025390625, -103.440673828125, -99.17083740234375, -94.90100860595703, -90.63117218017578, -86.36133575439453, -82.09150695800781, -77.82167053222656, -73.55183410644531, -69.28199768066406, -65.01216125488281, -60.742332458496094, -56.472496032714844, -52.202659606933594, -47.93282699584961, -43.662994384765625, -39.393157958984375, -35.123321533203125, -30.85348892211914, -26.583654403686523, -22.313819885253906, -18.04398536682129, -13.774150848388672, -9.504316329956055, -5.2344818115234375, -0.9646472930908203, 3.305187225341797, 7.575021743774414, 11.844856262207031, 16.11469078063965, 20.384525299072266, 24.654359817504883, 28.9241943359375, 33.19403076171875, 37.463863372802734, 41.73369598388672, 46.00353240966797, 50.27336883544922, 54.5432014465332, 58.81303405761719, 63.08287048339844]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 7.0, 3.0, 9.0, 10.0, 6.0, 13.0, 12.0, 6.0, 16.0, 16.0, 20.0, 24.0, 20.0, 30.0, 36.0, 32.0, 29.0, 28.0, 55.0, 42.0, 39.0, 39.0, 46.0, 43.0, 30.0, 36.0, 32.0, 32.0, 36.0, 34.0, 29.0, 30.0, 27.0, 19.0, 30.0, 15.0, 10.0, 11.0, 10.0, 9.0, 7.0, 8.0, 7.0, 3.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-45.1527099609375, -43.715240478515625, -42.27777099609375, -40.840301513671875, -39.40283203125, -37.96535873413086, -36.527889251708984, -35.09041976928711, -33.652950286865234, -32.21548080444336, -30.778011322021484, -29.340539932250977, -27.9030704498291, -26.465600967407227, -25.02812957763672, -23.590660095214844, -22.15319061279297, -20.715721130371094, -19.27825164794922, -17.84078025817871, -16.403310775756836, -14.965841293334961, -13.52837085723877, -12.090900421142578, -10.653430938720703, -9.215961456298828, -7.778491020202637, -6.3410210609436035, -4.90355110168457, -3.466081142425537, -2.028611183166504, -0.5911407470703125, 0.8463287353515625, 2.2837986946105957, 3.721268653869629, 5.158738613128662, 6.596208572387695, 8.03367805480957, 9.471148490905762, 10.908618927001953, 12.346088409423828, 13.783557891845703, 15.221028327941895, 16.658498764038086, 18.09596824645996, 19.533437728881836, 20.970909118652344, 22.40837860107422, 23.845848083496094, 25.28331756591797, 26.720787048339844, 28.15825843811035, 29.595727920532227, 31.0331974029541, 32.47066879272461, 33.908138275146484, 35.34560775756836, 36.783077239990234, 38.22054672241211, 39.658016204833984, 41.095489501953125, 42.532958984375, 43.970428466796875, 45.40789794921875, 46.845367431640625]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 0.0, 2.0, 2.0, 3.0, 8.0, 10.0, 15.0, 11.0, 16.0, 10.0, 15.0, 20.0, 15.0, 15.0, 41.0, 28.0, 29.0, 34.0, 35.0, 40.0, 38.0, 41.0, 38.0, 47.0, 47.0, 49.0, 42.0, 44.0, 31.0, 38.0, 31.0, 38.0, 28.0, 25.0, 17.0, 23.0, 16.0, 15.0, 6.0, 7.0, 6.0, 6.0, 7.0, 2.0, 5.0, 5.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-7.4453125, -7.22900390625, -7.0126953125, -6.79638671875, -6.580078125, -6.36376953125, -6.1474609375, -5.93115234375, -5.71484375, -5.49853515625, -5.2822265625, -5.06591796875, -4.849609375, -4.63330078125, -4.4169921875, -4.20068359375, -3.984375, -3.76806640625, -3.5517578125, -3.33544921875, -3.119140625, -2.90283203125, -2.6865234375, -2.47021484375, -2.25390625, -2.03759765625, -1.8212890625, -1.60498046875, -1.388671875, -1.17236328125, -0.9560546875, -0.73974609375, -0.5234375, -0.30712890625, -0.0908203125, 0.12548828125, 0.341796875, 0.55810546875, 0.7744140625, 0.99072265625, 1.20703125, 1.42333984375, 1.6396484375, 1.85595703125, 2.072265625, 2.28857421875, 2.5048828125, 2.72119140625, 2.9375, 3.15380859375, 3.3701171875, 3.58642578125, 3.802734375, 4.01904296875, 4.2353515625, 4.45166015625, 4.66796875, 4.88427734375, 5.1005859375, 5.31689453125, 5.533203125, 5.74951171875, 5.9658203125, 6.18212890625, 6.3984375]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 4.0, 1.0, 9.0, 12.0, 14.0, 20.0, 33.0, 50.0, 64.0, 109.0, 115.0, 179.0, 235.0, 369.0, 508.0, 746.0, 1119.0, 1546.0, 2176.0, 3108.0, 4607.0, 6846.0, 9944.0, 14764.0, 22608.0, 33736.0, 52134.0, 82466.0, 132018.0, 190833.0, 172878.0, 110993.0, 69813.0, 44718.0, 29054.0, 19228.0, 13159.0, 8824.0, 6073.0, 4081.0, 2874.0, 1948.0, 1422.0, 916.0, 670.0, 464.0, 316.0, 229.0, 168.0, 102.0, 92.0, 49.0, 39.0, 30.0, 20.0, 15.0, 9.0, 5.0, 5.0, 3.0, 2.0], "bins": [-0.63037109375, -0.6111679077148438, -0.5919647216796875, -0.5727615356445312, -0.553558349609375, -0.5343551635742188, -0.5151519775390625, -0.49594879150390625, -0.47674560546875, -0.45754241943359375, -0.4383392333984375, -0.41913604736328125, -0.399932861328125, -0.38072967529296875, -0.3615264892578125, -0.34232330322265625, -0.3231201171875, -0.30391693115234375, -0.2847137451171875, -0.26551055908203125, -0.246307373046875, -0.22710418701171875, -0.2079010009765625, -0.18869781494140625, -0.16949462890625, -0.15029144287109375, -0.1310882568359375, -0.11188507080078125, -0.092681884765625, -0.07347869873046875, -0.0542755126953125, -0.03507232666015625, -0.015869140625, 0.00333404541015625, 0.0225372314453125, 0.04174041748046875, 0.060943603515625, 0.08014678955078125, 0.0993499755859375, 0.11855316162109375, 0.13775634765625, 0.15695953369140625, 0.1761627197265625, 0.19536590576171875, 0.214569091796875, 0.23377227783203125, 0.2529754638671875, 0.27217864990234375, 0.2913818359375, 0.31058502197265625, 0.3297882080078125, 0.34899139404296875, 0.368194580078125, 0.38739776611328125, 0.4066009521484375, 0.42580413818359375, 0.44500732421875, 0.46421051025390625, 0.4834136962890625, 0.5026168823242188, 0.521820068359375, 0.5410232543945312, 0.5602264404296875, 0.5794296264648438, 0.5986328125]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 5.0, 2.0, 8.0, 4.0, 10.0, 8.0, 12.0, 9.0, 9.0, 6.0, 14.0, 12.0, 22.0, 20.0, 26.0, 27.0, 45.0, 31.0, 22.0, 39.0, 39.0, 31.0, 34.0, 31.0, 35.0, 1072.0, 42.0, 31.0, 37.0, 28.0, 30.0, 31.0, 31.0, 32.0, 21.0, 25.0, 23.0, 20.0, 16.0, 21.0, 16.0, 8.0, 9.0, 4.0, 6.0, 7.0, 8.0, 3.0, 5.0, 2.0, 2.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.9140625, -3.78399658203125, -3.6539306640625, -3.52386474609375, -3.393798828125, -3.26373291015625, -3.1336669921875, -3.00360107421875, -2.87353515625, -2.74346923828125, -2.6134033203125, -2.48333740234375, -2.353271484375, -2.22320556640625, -2.0931396484375, -1.96307373046875, -1.8330078125, -1.70294189453125, -1.5728759765625, -1.44281005859375, -1.312744140625, -1.18267822265625, -1.0526123046875, -0.92254638671875, -0.79248046875, -0.66241455078125, -0.5323486328125, -0.40228271484375, -0.272216796875, -0.14215087890625, -0.0120849609375, 0.11798095703125, 0.248046875, 0.37811279296875, 0.5081787109375, 0.63824462890625, 0.768310546875, 0.89837646484375, 1.0284423828125, 1.15850830078125, 1.28857421875, 1.41864013671875, 1.5487060546875, 1.67877197265625, 1.808837890625, 1.93890380859375, 2.0689697265625, 2.19903564453125, 2.3291015625, 2.45916748046875, 2.5892333984375, 2.71929931640625, 2.849365234375, 2.97943115234375, 3.1094970703125, 3.23956298828125, 3.36962890625, 3.49969482421875, 3.6297607421875, 3.75982666015625, 3.889892578125, 4.01995849609375, 4.1500244140625, 4.28009033203125, 4.41015625]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 2.0, 2.0, 8.0, 12.0, 13.0, 36.0, 37.0, 60.0, 87.0, 148.0, 262.0, 398.0, 510.0, 875.0, 1282.0, 1859.0, 2943.0, 4553.0, 6928.0, 10692.0, 16568.0, 26284.0, 43599.0, 75220.0, 132054.0, 1120677.0, 335958.0, 128597.0, 73351.0, 42528.0, 25685.0, 15933.0, 10538.0, 6660.0, 4506.0, 2861.0, 1826.0, 1223.0, 816.0, 511.0, 364.0, 274.0, 158.0, 83.0, 58.0, 34.0, 29.0, 19.0, 8.0, 5.0, 2.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53076171875, -0.5130538940429688, -0.4953460693359375, -0.47763824462890625, -0.459930419921875, -0.44222259521484375, -0.4245147705078125, -0.40680694580078125, -0.38909912109375, -0.37139129638671875, -0.3536834716796875, -0.33597564697265625, -0.318267822265625, -0.30055999755859375, -0.2828521728515625, -0.26514434814453125, -0.2474365234375, -0.22972869873046875, -0.2120208740234375, -0.19431304931640625, -0.176605224609375, -0.15889739990234375, -0.1411895751953125, -0.12348175048828125, -0.10577392578125, -0.08806610107421875, -0.0703582763671875, -0.05265045166015625, -0.034942626953125, -0.01723480224609375, 0.0004730224609375, 0.01818084716796875, 0.035888671875, 0.05359649658203125, 0.0713043212890625, 0.08901214599609375, 0.106719970703125, 0.12442779541015625, 0.1421356201171875, 0.15984344482421875, 0.17755126953125, 0.19525909423828125, 0.2129669189453125, 0.23067474365234375, 0.248382568359375, 0.26609039306640625, 0.2837982177734375, 0.30150604248046875, 0.3192138671875, 0.33692169189453125, 0.3546295166015625, 0.37233734130859375, 0.390045166015625, 0.40775299072265625, 0.4254608154296875, 0.44316864013671875, 0.46087646484375, 0.47858428955078125, 0.4962921142578125, 0.5139999389648438, 0.531707763671875, 0.5494155883789062, 0.5671234130859375, 0.5848312377929688, 0.6025390625]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 0.0, 4.0, 4.0, 11.0, 11.0, 17.0, 25.0, 35.0, 47.0, 74.0, 87.0, 132.0, 122.0, 107.0, 77.0, 83.0, 52.0, 29.0, 24.0, 17.0, 6.0, 14.0, 4.0, 3.0, 1.0, 9.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0130157470703125, -0.012669086456298828, -0.012322425842285156, -0.011975765228271484, -0.011629104614257812, -0.01128244400024414, -0.010935783386230469, -0.010589122772216797, -0.010242462158203125, -0.009895801544189453, -0.009549140930175781, -0.00920248031616211, -0.008855819702148438, -0.008509159088134766, -0.008162498474121094, -0.007815837860107422, -0.00746917724609375, -0.007122516632080078, -0.006775856018066406, -0.006429195404052734, -0.0060825347900390625, -0.005735874176025391, -0.005389213562011719, -0.005042552947998047, -0.004695892333984375, -0.004349231719970703, -0.004002571105957031, -0.0036559104919433594, -0.0033092498779296875, -0.0029625892639160156, -0.0026159286499023438, -0.002269268035888672, -0.001922607421875, -0.0015759468078613281, -0.0012292861938476562, -0.0008826255798339844, -0.0005359649658203125, -0.00018930435180664062, 0.00015735626220703125, 0.0005040168762207031, 0.000850677490234375, 0.0011973381042480469, 0.0015439987182617188, 0.0018906593322753906, 0.0022373199462890625, 0.0025839805603027344, 0.0029306411743164062, 0.003277301788330078, 0.00362396240234375, 0.003970623016357422, 0.004317283630371094, 0.004663944244384766, 0.0050106048583984375, 0.005357265472412109, 0.005703926086425781, 0.006050586700439453, 0.006397247314453125, 0.006743907928466797, 0.007090568542480469, 0.007437229156494141, 0.0077838897705078125, 0.008130550384521484, 0.008477210998535156, 0.008823871612548828, 0.0091705322265625]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 5.0, 6.0, 7.0, 3.0, 9.0, 11.0, 26.0, 23.0, 26.0, 32.0, 58.0, 54.0, 111.0, 123.0, 214.0, 335.0, 508.0, 1674.0, 707806.0, 334451.0, 1527.0, 543.0, 315.0, 207.0, 130.0, 80.0, 66.0, 54.0, 31.0, 31.0, 27.0, 17.0, 8.0, 9.0, 5.0, 4.0, 1.0, 6.0, 6.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1705322265625, -0.1650257110595703, -0.15951919555664062, -0.15401268005371094, -0.14850616455078125, -0.14299964904785156, -0.13749313354492188, -0.1319866180419922, -0.1264801025390625, -0.12097358703613281, -0.11546707153320312, -0.10996055603027344, -0.10445404052734375, -0.09894752502441406, -0.09344100952148438, -0.08793449401855469, -0.082427978515625, -0.07692146301269531, -0.07141494750976562, -0.06590843200683594, -0.06040191650390625, -0.05489540100097656, -0.049388885498046875, -0.04388236999511719, -0.0383758544921875, -0.03286933898925781, -0.027362823486328125, -0.021856307983398438, -0.01634979248046875, -0.010843276977539062, -0.005336761474609375, 0.0001697540283203125, 0.00567626953125, 0.011182785034179688, 0.016689300537109375, 0.022195816040039062, 0.02770233154296875, 0.03320884704589844, 0.038715362548828125, 0.04422187805175781, 0.0497283935546875, 0.05523490905761719, 0.060741424560546875, 0.06624794006347656, 0.07175445556640625, 0.07726097106933594, 0.08276748657226562, 0.08827400207519531, 0.093780517578125, 0.09928703308105469, 0.10479354858398438, 0.11030006408691406, 0.11580657958984375, 0.12131309509277344, 0.12681961059570312, 0.1323261260986328, 0.1378326416015625, 0.1433391571044922, 0.14884567260742188, 0.15435218811035156, 0.15985870361328125, 0.16536521911621094, 0.17087173461914062, 0.1763782501220703, 0.181884765625]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 355.0, 648.0, 9.0], "bins": [-0.24799008667469025, -0.2439933568239212, -0.23999662697315216, -0.23599989712238312, -0.23200316727161407, -0.22800645232200623, -0.22400972247123718, -0.22001299262046814, -0.2160162627696991, -0.21201953291893005, -0.208022803068161, -0.20402607321739197, -0.20002934336662292, -0.19603261351585388, -0.19203588366508484, -0.188039168715477, -0.18404242396354675, -0.1800456941127777, -0.17604896426200867, -0.17205223441123962, -0.16805550456047058, -0.16405877470970154, -0.1600620448589325, -0.15606532990932465, -0.1520686000585556, -0.14807187020778656, -0.14407514035701752, -0.14007841050624847, -0.13608168065547943, -0.13208496570587158, -0.12808823585510254, -0.1240914985537529, -0.12009478360414505, -0.11609805375337601, -0.11210132390260696, -0.10810460150241852, -0.10410787165164948, -0.10011114180088043, -0.09611441195011139, -0.09211768209934235, -0.0881209596991539, -0.08412422984838486, -0.08012749999761581, -0.07613077759742737, -0.07213404774665833, -0.06813731789588928, -0.06414058804512024, -0.060143858194351196, -0.05614712834358215, -0.05215039849281311, -0.048153672367334366, -0.04415694251656532, -0.04016021639108658, -0.036163486540317535, -0.03216675668954849, -0.0281700287014246, -0.024173300713300705, -0.02017657272517681, -0.016179844737052917, -0.012183114886283875, -0.00818638689815998, -0.004189658910036087, -0.00019292905926704407, 0.0038037989288568497, 0.007800525985658169]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 5.0, 5.0, 5.0, 4.0, 6.0, 12.0, 22.0, 24.0, 19.0, 20.0, 41.0, 40.0, 29.0, 37.0, 47.0, 47.0, 42.0, 53.0, 50.0, 35.0, 54.0, 42.0, 55.0, 33.0, 40.0, 35.0, 47.0, 30.0, 29.0, 19.0, 16.0, 10.0, 13.0, 11.0, 9.0, 6.0, 5.0, 3.0, 5.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.006684422492980957, -0.006505077704787254, -0.006325732916593552, -0.006146388128399849, -0.005967043340206146, -0.0057876985520124435, -0.005608353763818741, -0.005429008975625038, -0.0052496641874313354, -0.005070319399237633, -0.00489097461104393, -0.004711629822850227, -0.004532285034656525, -0.004352940246462822, -0.004173595458269119, -0.0039942506700754166, -0.003814905881881714, -0.003635561093688011, -0.0034562163054943085, -0.0032768715173006058, -0.003097526729106903, -0.0029181819409132004, -0.0027388371527194977, -0.002559492364525795, -0.0023801475763320923, -0.0022008027881383896, -0.002021457999944687, -0.0018421132117509842, -0.0016627684235572815, -0.0014834236353635788, -0.001304078847169876, -0.0011247340589761734, -0.0009453892707824707, -0.000766044482588768, -0.0005866996943950653, -0.0004073549062013626, -0.0002280101180076599, -4.8665329813957214e-05, 0.00013067945837974548, 0.0003100242465734482, 0.0004893690347671509, 0.0006687138229608536, 0.0008480586111545563, 0.001027403399348259, 0.0012067481875419617, 0.0013860929757356644, 0.001565437763929367, 0.0017447825521230698, 0.0019241273403167725, 0.002103472128510475, 0.002282816916704178, 0.0024621617048978806, 0.0026415064930915833, 0.002820851281285286, 0.0030001960694789886, 0.0031795408576726913, 0.003358885645866394, 0.0035382304340600967, 0.0037175752222537994, 0.003896920010447502, 0.004076264798641205, 0.0042556095868349075, 0.00443495437502861, 0.004614299163222313, 0.004793643951416016]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 0.0, 2.0, 2.0, 3.0, 8.0, 10.0, 15.0, 10.0, 17.0, 10.0, 15.0, 20.0, 15.0, 15.0, 41.0, 28.0, 29.0, 34.0, 35.0, 40.0, 38.0, 40.0, 39.0, 47.0, 46.0, 50.0, 42.0, 44.0, 31.0, 38.0, 30.0, 39.0, 28.0, 25.0, 17.0, 23.0, 16.0, 14.0, 7.0, 7.0, 6.0, 6.0, 7.0, 2.0, 5.0, 5.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-7.4453125, -7.22906494140625, -7.0128173828125, -6.79656982421875, -6.580322265625, -6.36407470703125, -6.1478271484375, -5.93157958984375, -5.71533203125, -5.49908447265625, -5.2828369140625, -5.06658935546875, -4.850341796875, -4.63409423828125, -4.4178466796875, -4.20159912109375, -3.9853515625, -3.76910400390625, -3.5528564453125, -3.33660888671875, -3.120361328125, -2.90411376953125, -2.6878662109375, -2.47161865234375, -2.25537109375, -2.03912353515625, -1.8228759765625, -1.60662841796875, -1.390380859375, -1.17413330078125, -0.9578857421875, -0.74163818359375, -0.525390625, -0.30914306640625, -0.0928955078125, 0.12335205078125, 0.339599609375, 0.55584716796875, 0.7720947265625, 0.98834228515625, 1.20458984375, 1.42083740234375, 1.6370849609375, 1.85333251953125, 2.069580078125, 2.28582763671875, 2.5020751953125, 2.71832275390625, 2.9345703125, 3.15081787109375, 3.3670654296875, 3.58331298828125, 3.799560546875, 4.01580810546875, 4.2320556640625, 4.44830322265625, 4.66455078125, 4.88079833984375, 5.0970458984375, 5.31329345703125, 5.529541015625, 5.74578857421875, 5.9620361328125, 6.17828369140625, 6.39453125]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 4.0, 2.0, 4.0, 3.0, 3.0, 10.0, 6.0, 9.0, 17.0, 29.0, 32.0, 42.0, 53.0, 77.0, 85.0, 136.0, 153.0, 197.0, 335.0, 434.0, 754.0, 1276.0, 2470.0, 5084.0, 13306.0, 43767.0, 211011.0, 570344.0, 145750.0, 33017.0, 10446.0, 4270.0, 2096.0, 1108.0, 699.0, 437.0, 311.0, 209.0, 135.0, 123.0, 92.0, 46.0, 39.0, 28.0, 29.0, 21.0, 18.0, 12.0, 13.0, 6.0, 4.0, 6.0, 2.0, 6.0, 0.0, 1.0, 0.0, 3.0], "bins": [-11.1484375, -10.8145751953125, -10.480712890625, -10.1468505859375, -9.81298828125, -9.4791259765625, -9.145263671875, -8.8114013671875, -8.4775390625, -8.1436767578125, -7.809814453125, -7.4759521484375, -7.14208984375, -6.8082275390625, -6.474365234375, -6.1405029296875, -5.806640625, -5.4727783203125, -5.138916015625, -4.8050537109375, -4.47119140625, -4.1373291015625, -3.803466796875, -3.4696044921875, -3.1357421875, -2.8018798828125, -2.468017578125, -2.1341552734375, -1.80029296875, -1.4664306640625, -1.132568359375, -0.7987060546875, -0.46484375, -0.1309814453125, 0.202880859375, 0.5367431640625, 0.87060546875, 1.2044677734375, 1.538330078125, 1.8721923828125, 2.2060546875, 2.5399169921875, 2.873779296875, 3.2076416015625, 3.54150390625, 3.8753662109375, 4.209228515625, 4.5430908203125, 4.876953125, 5.2108154296875, 5.544677734375, 5.8785400390625, 6.21240234375, 6.5462646484375, 6.880126953125, 7.2139892578125, 7.5478515625, 7.8817138671875, 8.215576171875, 8.5494384765625, 8.88330078125, 9.2171630859375, 9.551025390625, 9.8848876953125, 10.21875]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 4.0, 1.0, 0.0, 4.0, 5.0, 3.0, 5.0, 2.0, 8.0, 11.0, 9.0, 10.0, 17.0, 9.0, 18.0, 24.0, 29.0, 27.0, 28.0, 39.0, 43.0, 50.0, 72.0, 178.0, 1464.0, 390.0, 148.0, 85.0, 70.0, 42.0, 39.0, 46.0, 35.0, 15.0, 23.0, 19.0, 22.0, 12.0, 11.0, 10.0, 8.0, 5.0, 5.0, 3.0, 6.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.34375, -16.74462890625, -16.1455078125, -15.54638671875, -14.947265625, -14.34814453125, -13.7490234375, -13.14990234375, -12.55078125, -11.95166015625, -11.3525390625, -10.75341796875, -10.154296875, -9.55517578125, -8.9560546875, -8.35693359375, -7.7578125, -7.15869140625, -6.5595703125, -5.96044921875, -5.361328125, -4.76220703125, -4.1630859375, -3.56396484375, -2.96484375, -2.36572265625, -1.7666015625, -1.16748046875, -0.568359375, 0.03076171875, 0.6298828125, 1.22900390625, 1.828125, 2.42724609375, 3.0263671875, 3.62548828125, 4.224609375, 4.82373046875, 5.4228515625, 6.02197265625, 6.62109375, 7.22021484375, 7.8193359375, 8.41845703125, 9.017578125, 9.61669921875, 10.2158203125, 10.81494140625, 11.4140625, 12.01318359375, 12.6123046875, 13.21142578125, 13.810546875, 14.40966796875, 15.0087890625, 15.60791015625, 16.20703125, 16.80615234375, 17.4052734375, 18.00439453125, 18.603515625, 19.20263671875, 19.8017578125, 20.40087890625, 21.0]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 5.0, 6.0, 4.0, 6.0, 8.0, 8.0, 6.0, 18.0, 17.0, 24.0, 30.0, 41.0, 61.0, 118.0, 189.0, 343.0, 507.0, 1316.0, 60195.0, 3077888.0, 3183.0, 707.0, 366.0, 226.0, 123.0, 88.0, 62.0, 48.0, 27.0, 27.0, 11.0, 8.0, 17.0, 4.0, 5.0, 6.0, 2.0, 3.0, 4.0, 1.0, 3.0, 0.0, 3.0, 0.0, 3.0, 1.0, 1.0], "bins": [-57.59375, -56.00439453125, -54.4150390625, -52.82568359375, -51.236328125, -49.64697265625, -48.0576171875, -46.46826171875, -44.87890625, -43.28955078125, -41.7001953125, -40.11083984375, -38.521484375, -36.93212890625, -35.3427734375, -33.75341796875, -32.1640625, -30.57470703125, -28.9853515625, -27.39599609375, -25.806640625, -24.21728515625, -22.6279296875, -21.03857421875, -19.44921875, -17.85986328125, -16.2705078125, -14.68115234375, -13.091796875, -11.50244140625, -9.9130859375, -8.32373046875, -6.734375, -5.14501953125, -3.5556640625, -1.96630859375, -0.376953125, 1.21240234375, 2.8017578125, 4.39111328125, 5.98046875, 7.56982421875, 9.1591796875, 10.74853515625, 12.337890625, 13.92724609375, 15.5166015625, 17.10595703125, 18.6953125, 20.28466796875, 21.8740234375, 23.46337890625, 25.052734375, 26.64208984375, 28.2314453125, 29.82080078125, 31.41015625, 32.99951171875, 34.5888671875, 36.17822265625, 37.767578125, 39.35693359375, 40.9462890625, 42.53564453125, 44.125]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [6.0, 602.0, 405.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.456827163696289, -7.366308212280273, 0.7242107391357422, 8.814729690551758, 16.905248641967773, 24.99576759338379, 33.08628845214844, 41.17680358886719, 49.26732635498047, 57.357845306396484, 65.4483642578125, 73.53887939453125, 81.62940216064453, 89.71992492675781, 97.81044006347656, 105.90095520019531, 113.9914779663086, 122.08200073242188, 130.17251586914062, 138.26303100585938, 146.35354614257812, 154.44407653808594, 162.5345916748047, 170.62510681152344, 178.7156219482422, 186.80613708496094, 194.89666748046875, 202.9871826171875, 211.07769775390625, 219.168212890625, 227.25872802734375, 235.34925842285156, 243.43975830078125, 251.5302734375, 259.62078857421875, 267.7113037109375, 275.80181884765625, 283.8923645019531, 291.9828796386719, 300.0733947753906, 308.1639099121094, 316.2544250488281, 324.3449401855469, 332.4354553222656, 340.5260009765625, 348.61651611328125, 356.70703125, 364.79754638671875, 372.8880615234375, 380.97857666015625, 389.069091796875, 397.15960693359375, 405.2501220703125, 413.3406677246094, 421.4311828613281, 429.5216979980469, 437.6122131347656, 445.7027282714844, 453.7932434082031, 461.8837585449219, 469.97430419921875, 478.0648193359375, 486.15533447265625, 494.245849609375, 502.33636474609375]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 3.0, 8.0, 6.0, 8.0, 13.0, 15.0, 18.0, 18.0, 19.0, 25.0, 24.0, 20.0, 51.0, 45.0, 24.0, 45.0, 42.0, 41.0, 53.0, 47.0, 37.0, 48.0, 38.0, 41.0, 45.0, 36.0, 33.0, 31.0, 32.0, 25.0, 22.0, 16.0, 14.0, 9.0, 12.0, 13.0, 7.0, 8.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-41.781192779541016, -40.37506866455078, -38.96894073486328, -37.56281280517578, -36.15668869018555, -34.75056457519531, -33.34443664550781, -31.938310623168945, -30.532184600830078, -29.12605857849121, -27.719932556152344, -26.313806533813477, -24.90768051147461, -23.501554489135742, -22.095428466796875, -20.689302444458008, -19.28317642211914, -17.877050399780273, -16.470924377441406, -15.064798355102539, -13.658672332763672, -12.252546310424805, -10.846420288085938, -9.44029426574707, -8.034168243408203, -6.628042221069336, -5.221916198730469, -3.8157901763916016, -2.4096641540527344, -1.0035381317138672, 0.402587890625, 1.8087139129638672, 3.2148361206054688, 4.620962142944336, 6.027088165283203, 7.43321418762207, 8.839340209960938, 10.245466232299805, 11.651592254638672, 13.057718276977539, 14.463844299316406, 15.869970321655273, 17.27609634399414, 18.682222366333008, 20.088348388671875, 21.494474411010742, 22.90060043334961, 24.306726455688477, 25.712852478027344, 27.11897850036621, 28.525104522705078, 29.931230545043945, 31.337356567382812, 32.74348449707031, 34.14960861206055, 35.55573272705078, 36.96186065673828, 38.36798858642578, 39.774112701416016, 41.18023681640625, 42.58636474609375, 43.99249267578125, 45.398616790771484, 46.80474090576172, 48.21086883544922]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 3.0, 4.0, 11.0, 11.0, 12.0, 16.0, 10.0, 24.0, 34.0, 24.0, 25.0, 25.0, 37.0, 40.0, 40.0, 44.0, 51.0, 51.0, 45.0, 45.0, 45.0, 45.0, 41.0, 46.0, 38.0, 37.0, 39.0, 26.0, 24.0, 13.0, 22.0, 11.0, 9.0, 12.0, 8.0, 10.0, 7.0, 4.0, 8.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1015625, -7.837646484375, -7.57373046875, -7.309814453125, -7.0458984375, -6.781982421875, -6.51806640625, -6.254150390625, -5.990234375, -5.726318359375, -5.46240234375, -5.198486328125, -4.9345703125, -4.670654296875, -4.40673828125, -4.142822265625, -3.87890625, -3.614990234375, -3.35107421875, -3.087158203125, -2.8232421875, -2.559326171875, -2.29541015625, -2.031494140625, -1.767578125, -1.503662109375, -1.23974609375, -0.975830078125, -0.7119140625, -0.447998046875, -0.18408203125, 0.079833984375, 0.34375, 0.607666015625, 0.87158203125, 1.135498046875, 1.3994140625, 1.663330078125, 1.92724609375, 2.191162109375, 2.455078125, 2.718994140625, 2.98291015625, 3.246826171875, 3.5107421875, 3.774658203125, 4.03857421875, 4.302490234375, 4.56640625, 4.830322265625, 5.09423828125, 5.358154296875, 5.6220703125, 5.885986328125, 6.14990234375, 6.413818359375, 6.677734375, 6.941650390625, 7.20556640625, 7.469482421875, 7.7333984375, 7.997314453125, 8.26123046875, 8.525146484375, 8.7890625]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 8.0, 7.0, 7.0, 7.0, 16.0, 20.0, 35.0, 42.0, 57.0, 77.0, 99.0, 123.0, 188.0, 281.0, 397.0, 637.0, 1168.0, 2761.0, 8557.0, 48924.0, 2799786.0, 1291074.0, 28682.0, 6300.0, 2251.0, 1003.0, 520.0, 376.0, 251.0, 167.0, 119.0, 92.0, 75.0, 51.0, 33.0, 23.0, 18.0, 12.0, 11.0, 9.0, 8.0, 7.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.09375, -38.79541015625, -37.4970703125, -36.19873046875, -34.900390625, -33.60205078125, -32.3037109375, -31.00537109375, -29.70703125, -28.40869140625, -27.1103515625, -25.81201171875, -24.513671875, -23.21533203125, -21.9169921875, -20.61865234375, -19.3203125, -18.02197265625, -16.7236328125, -15.42529296875, -14.126953125, -12.82861328125, -11.5302734375, -10.23193359375, -8.93359375, -7.63525390625, -6.3369140625, -5.03857421875, -3.740234375, -2.44189453125, -1.1435546875, 0.15478515625, 1.453125, 2.75146484375, 4.0498046875, 5.34814453125, 6.646484375, 7.94482421875, 9.2431640625, 10.54150390625, 11.83984375, 13.13818359375, 14.4365234375, 15.73486328125, 17.033203125, 18.33154296875, 19.6298828125, 20.92822265625, 22.2265625, 23.52490234375, 24.8232421875, 26.12158203125, 27.419921875, 28.71826171875, 30.0166015625, 31.31494140625, 32.61328125, 33.91162109375, 35.2099609375, 36.50830078125, 37.806640625, 39.10498046875, 40.4033203125, 41.70166015625, 43.0]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 2.0, 2.0, 7.0, 13.0, 5.0, 11.0, 13.0, 26.0, 29.0, 34.0, 58.0, 70.0, 103.0, 148.0, 226.0, 385.0, 542.0, 698.0, 594.0, 374.0, 256.0, 152.0, 92.0, 69.0, 49.0, 29.0, 20.0, 18.0, 8.0, 7.0, 3.0, 11.0, 8.0, 4.0, 2.0, 3.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.1953125, -12.6353759765625, -12.075439453125, -11.5155029296875, -10.95556640625, -10.3956298828125, -9.835693359375, -9.2757568359375, -8.7158203125, -8.1558837890625, -7.595947265625, -7.0360107421875, -6.47607421875, -5.9161376953125, -5.356201171875, -4.7962646484375, -4.236328125, -3.6763916015625, -3.116455078125, -2.5565185546875, -1.99658203125, -1.4366455078125, -0.876708984375, -0.3167724609375, 0.2431640625, 0.8031005859375, 1.363037109375, 1.9229736328125, 2.48291015625, 3.0428466796875, 3.602783203125, 4.1627197265625, 4.72265625, 5.2825927734375, 5.842529296875, 6.4024658203125, 6.96240234375, 7.5223388671875, 8.082275390625, 8.6422119140625, 9.2021484375, 9.7620849609375, 10.322021484375, 10.8819580078125, 11.44189453125, 12.0018310546875, 12.561767578125, 13.1217041015625, 13.681640625, 14.2415771484375, 14.801513671875, 15.3614501953125, 15.92138671875, 16.4813232421875, 17.041259765625, 17.6011962890625, 18.1611328125, 18.7210693359375, 19.281005859375, 19.8409423828125, 20.40087890625, 20.9608154296875, 21.520751953125, 22.0806884765625, 22.640625]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 6.0, 14.0, 24.0, 34.0, 54.0, 125.0, 252.0, 613.0, 1309.0, 3214.0, 8192.0, 23694.0, 100226.0, 1120731.0, 2681881.0, 197572.0, 37249.0, 11461.0, 4300.0, 1776.0, 865.0, 369.0, 159.0, 81.0, 36.0, 20.0, 15.0, 3.0, 7.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.71875, -16.103515625, -15.48828125, -14.873046875, -14.2578125, -13.642578125, -13.02734375, -12.412109375, -11.796875, -11.181640625, -10.56640625, -9.951171875, -9.3359375, -8.720703125, -8.10546875, -7.490234375, -6.875, -6.259765625, -5.64453125, -5.029296875, -4.4140625, -3.798828125, -3.18359375, -2.568359375, -1.953125, -1.337890625, -0.72265625, -0.107421875, 0.5078125, 1.123046875, 1.73828125, 2.353515625, 2.96875, 3.583984375, 4.19921875, 4.814453125, 5.4296875, 6.044921875, 6.66015625, 7.275390625, 7.890625, 8.505859375, 9.12109375, 9.736328125, 10.3515625, 10.966796875, 11.58203125, 12.197265625, 12.8125, 13.427734375, 14.04296875, 14.658203125, 15.2734375, 15.888671875, 16.50390625, 17.119140625, 17.734375, 18.349609375, 18.96484375, 19.580078125, 20.1953125, 20.810546875, 21.42578125, 22.041015625, 22.65625]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 4.0, 6.0, 10.0, 9.0, 12.0, 11.0, 17.0, 18.0, 24.0, 24.0, 36.0, 55.0, 54.0, 65.0, 85.0, 79.0, 81.0, 83.0, 67.0, 51.0, 43.0, 39.0, 29.0, 22.0, 15.0, 11.0, 13.0, 5.0, 6.0, 4.0, 5.0, 3.0, 0.0, 5.0, 4.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.84513092041016, -65.29803466796875, -62.75093078613281, -60.20383071899414, -57.65673065185547, -55.1096305847168, -52.562530517578125, -50.01543045043945, -47.46833038330078, -44.92123031616211, -42.37413024902344, -39.827030181884766, -37.279930114746094, -34.73283004760742, -32.18572998046875, -29.638629913330078, -27.091529846191406, -24.544429779052734, -21.997329711914062, -19.45022964477539, -16.90312957763672, -14.356029510498047, -11.808929443359375, -9.261829376220703, -6.714729309082031, -4.167629241943359, -1.6205291748046875, 0.9265708923339844, 3.4736709594726562, 6.020771026611328, 8.56787109375, 11.114971160888672, 13.662063598632812, 16.209163665771484, 18.756263732910156, 21.303363800048828, 23.8504638671875, 26.397563934326172, 28.944664001464844, 31.491764068603516, 34.03886413574219, 36.58596420288086, 39.13306427001953, 41.6801643371582, 44.227264404296875, 46.77436447143555, 49.32146453857422, 51.86856460571289, 54.41566467285156, 56.962764739990234, 59.509864807128906, 62.05696487426758, 64.60406494140625, 67.15116882324219, 69.6982650756836, 72.245361328125, 74.79246520996094, 77.33956909179688, 79.88666534423828, 82.43376159667969, 84.98086547851562, 87.52796936035156, 90.07506561279297, 92.62216186523438, 95.16926574707031]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 4.0, 5.0, 2.0, 6.0, 4.0, 11.0, 17.0, 11.0, 11.0, 19.0, 27.0, 29.0, 27.0, 32.0, 32.0, 35.0, 42.0, 39.0, 35.0, 30.0, 43.0, 36.0, 42.0, 58.0, 43.0, 28.0, 36.0, 29.0, 31.0, 32.0, 26.0, 18.0, 22.0, 24.0, 16.0, 15.0, 13.0, 13.0, 14.0, 10.0, 11.0, 4.0, 6.0, 4.0, 3.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-61.7271842956543, -59.909019470214844, -58.090850830078125, -56.27268600463867, -54.45451736450195, -52.6363525390625, -50.81818389892578, -49.00001907348633, -47.181854248046875, -45.36368942260742, -43.5455207824707, -41.72735595703125, -39.90918731689453, -38.09102249145508, -36.272857666015625, -34.454689025878906, -32.63652038574219, -30.8183536529541, -29.000186920166016, -27.182022094726562, -25.363855361938477, -23.54568862915039, -21.727521896362305, -19.90935516357422, -18.091190338134766, -16.27302360534668, -14.45485782623291, -12.636691093444824, -10.818525314331055, -9.000358581542969, -7.182191848754883, -5.364026069641113, -3.5458602905273438, -1.7276939153671265, 0.09047245979309082, 1.9086389541625977, 3.7268052101135254, 5.544971466064453, 7.363138198852539, 9.181303977966309, 10.999470710754395, 12.81763744354248, 14.63580322265625, 16.453969955444336, 18.272136688232422, 20.090301513671875, 21.908470153808594, 23.726634979248047, 25.544801712036133, 27.36296844482422, 29.181135177612305, 30.99930191040039, 32.817466735839844, 34.63563537597656, 36.453800201416016, 38.27196502685547, 40.09013366699219, 41.90829849243164, 43.72646713256836, 45.54463195800781, 47.36280059814453, 49.180965423583984, 50.99913024902344, 52.817298889160156, 54.63546371459961]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 4.0, 5.0, 2.0, 8.0, 3.0, 2.0, 14.0, 7.0, 15.0, 16.0, 22.0, 20.0, 34.0, 36.0, 24.0, 39.0, 26.0, 44.0, 49.0, 40.0, 35.0, 44.0, 55.0, 63.0, 37.0, 35.0, 39.0, 32.0, 34.0, 26.0, 28.0, 29.0, 13.0, 23.0, 18.0, 13.0, 8.0, 11.0, 20.0, 5.0, 5.0, 3.0, 8.0, 1.0, 9.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-113.5625, -110.328125, -107.09375, -103.859375, -100.625, -97.390625, -94.15625, -90.921875, -87.6875, -84.453125, -81.21875, -77.984375, -74.75, -71.515625, -68.28125, -65.046875, -61.8125, -58.578125, -55.34375, -52.109375, -48.875, -45.640625, -42.40625, -39.171875, -35.9375, -32.703125, -29.46875, -26.234375, -23.0, -19.765625, -16.53125, -13.296875, -10.0625, -6.828125, -3.59375, -0.359375, 2.875, 6.109375, 9.34375, 12.578125, 15.8125, 19.046875, 22.28125, 25.515625, 28.75, 31.984375, 35.21875, 38.453125, 41.6875, 44.921875, 48.15625, 51.390625, 54.625, 57.859375, 61.09375, 64.328125, 67.5625, 70.796875, 74.03125, 77.265625, 80.5, 83.734375, 86.96875, 90.203125, 93.4375]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 6.0, 14.0, 18.0, 14.0, 31.0, 44.0, 50.0, 92.0, 127.0, 185.0, 254.0, 357.0, 561.0, 828.0, 1094.0, 1590.0, 2291.0, 3427.0, 4870.0, 7568.0, 11777.0, 18989.0, 31306.0, 55693.0, 105002.0, 201601.0, 254912.0, 153540.0, 79290.0, 43140.0, 25238.0, 15376.0, 9704.0, 6216.0, 4198.0, 2845.0, 1877.0, 1365.0, 918.0, 628.0, 472.0, 323.0, 225.0, 164.0, 91.0, 87.0, 56.0, 46.0, 21.0, 12.0, 11.0, 6.0, 5.0, 2.0, 1.0, 2.0, 2.0, 4.0], "bins": [-10.71875, -10.38671875, -10.0546875, -9.72265625, -9.390625, -9.05859375, -8.7265625, -8.39453125, -8.0625, -7.73046875, -7.3984375, -7.06640625, -6.734375, -6.40234375, -6.0703125, -5.73828125, -5.40625, -5.07421875, -4.7421875, -4.41015625, -4.078125, -3.74609375, -3.4140625, -3.08203125, -2.75, -2.41796875, -2.0859375, -1.75390625, -1.421875, -1.08984375, -0.7578125, -0.42578125, -0.09375, 0.23828125, 0.5703125, 0.90234375, 1.234375, 1.56640625, 1.8984375, 2.23046875, 2.5625, 2.89453125, 3.2265625, 3.55859375, 3.890625, 4.22265625, 4.5546875, 4.88671875, 5.21875, 5.55078125, 5.8828125, 6.21484375, 6.546875, 6.87890625, 7.2109375, 7.54296875, 7.875, 8.20703125, 8.5390625, 8.87109375, 9.203125, 9.53515625, 9.8671875, 10.19921875, 10.53125]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 1.0, 2.0, 6.0, 3.0, 10.0, 7.0, 20.0, 18.0, 14.0, 18.0, 31.0, 30.0, 29.0, 34.0, 37.0, 42.0, 42.0, 53.0, 57.0, 54.0, 1074.0, 36.0, 52.0, 48.0, 37.0, 44.0, 31.0, 39.0, 25.0, 31.0, 14.0, 13.0, 21.0, 20.0, 16.0, 5.0, 3.0, 5.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.875, -64.5712890625, -62.267578125, -59.9638671875, -57.66015625, -55.3564453125, -53.052734375, -50.7490234375, -48.4453125, -46.1416015625, -43.837890625, -41.5341796875, -39.23046875, -36.9267578125, -34.623046875, -32.3193359375, -30.015625, -27.7119140625, -25.408203125, -23.1044921875, -20.80078125, -18.4970703125, -16.193359375, -13.8896484375, -11.5859375, -9.2822265625, -6.978515625, -4.6748046875, -2.37109375, -0.0673828125, 2.236328125, 4.5400390625, 6.84375, 9.1474609375, 11.451171875, 13.7548828125, 16.05859375, 18.3623046875, 20.666015625, 22.9697265625, 25.2734375, 27.5771484375, 29.880859375, 32.1845703125, 34.48828125, 36.7919921875, 39.095703125, 41.3994140625, 43.703125, 46.0068359375, 48.310546875, 50.6142578125, 52.91796875, 55.2216796875, 57.525390625, 59.8291015625, 62.1328125, 64.4365234375, 66.740234375, 69.0439453125, 71.34765625, 73.6513671875, 75.955078125, 78.2587890625, 80.5625]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 3.0, 7.0, 9.0, 15.0, 29.0, 43.0, 64.0, 107.0, 119.0, 202.0, 347.0, 462.0, 709.0, 1016.0, 1478.0, 2273.0, 3171.0, 4771.0, 6929.0, 10396.0, 15638.0, 23745.0, 38285.0, 65530.0, 117168.0, 192131.0, 1260437.0, 142462.0, 80170.0, 46061.0, 28198.0, 18238.0, 11937.0, 8062.0, 5408.0, 3733.0, 2598.0, 1696.0, 1186.0, 736.0, 528.0, 349.0, 254.0, 159.0, 89.0, 61.0, 49.0, 32.0, 18.0, 14.0, 6.0, 5.0, 7.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.3125, -7.0701904296875, -6.827880859375, -6.5855712890625, -6.34326171875, -6.1009521484375, -5.858642578125, -5.6163330078125, -5.3740234375, -5.1317138671875, -4.889404296875, -4.6470947265625, -4.40478515625, -4.1624755859375, -3.920166015625, -3.6778564453125, -3.435546875, -3.1932373046875, -2.950927734375, -2.7086181640625, -2.46630859375, -2.2239990234375, -1.981689453125, -1.7393798828125, -1.4970703125, -1.2547607421875, -1.012451171875, -0.7701416015625, -0.52783203125, -0.2855224609375, -0.043212890625, 0.1990966796875, 0.44140625, 0.6837158203125, 0.926025390625, 1.1683349609375, 1.41064453125, 1.6529541015625, 1.895263671875, 2.1375732421875, 2.3798828125, 2.6221923828125, 2.864501953125, 3.1068115234375, 3.34912109375, 3.5914306640625, 3.833740234375, 4.0760498046875, 4.318359375, 4.5606689453125, 4.802978515625, 5.0452880859375, 5.28759765625, 5.5299072265625, 5.772216796875, 6.0145263671875, 6.2568359375, 6.4991455078125, 6.741455078125, 6.9837646484375, 7.22607421875, 7.4683837890625, 7.710693359375, 7.9530029296875, 8.1953125]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 2.0, 7.0, 9.0, 9.0, 4.0, 9.0, 10.0, 17.0, 15.0, 16.0, 19.0, 28.0, 31.0, 32.0, 40.0, 42.0, 48.0, 47.0, 39.0, 44.0, 59.0, 39.0, 43.0, 44.0, 37.0, 35.0, 32.0, 32.0, 30.0, 32.0, 22.0, 22.0, 20.0, 19.0, 11.0, 13.0, 3.0, 7.0, 5.0, 5.0, 5.0, 4.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0238037109375, -0.023006916046142578, -0.022210121154785156, -0.021413326263427734, -0.020616531372070312, -0.01981973648071289, -0.01902294158935547, -0.018226146697998047, -0.017429351806640625, -0.016632556915283203, -0.01583576202392578, -0.01503896713256836, -0.014242172241210938, -0.013445377349853516, -0.012648582458496094, -0.011851787567138672, -0.01105499267578125, -0.010258197784423828, -0.009461402893066406, -0.008664608001708984, -0.007867813110351562, -0.007071018218994141, -0.006274223327636719, -0.005477428436279297, -0.004680633544921875, -0.003883838653564453, -0.0030870437622070312, -0.0022902488708496094, -0.0014934539794921875, -0.0006966590881347656, 0.00010013580322265625, 0.0008969306945800781, 0.0016937255859375, 0.002490520477294922, 0.0032873153686523438, 0.004084110260009766, 0.0048809051513671875, 0.005677700042724609, 0.006474494934082031, 0.007271289825439453, 0.008068084716796875, 0.008864879608154297, 0.009661674499511719, 0.01045846939086914, 0.011255264282226562, 0.012052059173583984, 0.012848854064941406, 0.013645648956298828, 0.01444244384765625, 0.015239238739013672, 0.016036033630371094, 0.016832828521728516, 0.017629623413085938, 0.01842641830444336, 0.01922321319580078, 0.020020008087158203, 0.020816802978515625, 0.021613597869873047, 0.02241039276123047, 0.02320718765258789, 0.024003982543945312, 0.024800777435302734, 0.025597572326660156, 0.026394367218017578, 0.027191162109375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 7.0, 5.0, 4.0, 5.0, 8.0, 7.0, 11.0, 19.0, 15.0, 36.0, 32.0, 42.0, 63.0, 99.0, 146.0, 251.0, 456.0, 1079.0, 3382.0, 14128.0, 103725.0, 639985.0, 247963.0, 28440.0, 5510.0, 1557.0, 661.0, 325.0, 200.0, 109.0, 88.0, 36.0, 27.0, 27.0, 25.0, 22.0, 13.0, 8.0, 7.0, 5.0, 7.0, 7.0, 3.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.316162109375, -0.3067779541015625, -0.297393798828125, -0.2880096435546875, -0.27862548828125, -0.2692413330078125, -0.259857177734375, -0.2504730224609375, -0.2410888671875, -0.2317047119140625, -0.222320556640625, -0.2129364013671875, -0.20355224609375, -0.1941680908203125, -0.184783935546875, -0.1753997802734375, -0.166015625, -0.1566314697265625, -0.147247314453125, -0.1378631591796875, -0.12847900390625, -0.1190948486328125, -0.109710693359375, -0.1003265380859375, -0.0909423828125, -0.0815582275390625, -0.072174072265625, -0.0627899169921875, -0.05340576171875, -0.0440216064453125, -0.034637451171875, -0.0252532958984375, -0.015869140625, -0.0064849853515625, 0.002899169921875, 0.0122833251953125, 0.02166748046875, 0.0310516357421875, 0.040435791015625, 0.0498199462890625, 0.0592041015625, 0.0685882568359375, 0.077972412109375, 0.0873565673828125, 0.09674072265625, 0.1061248779296875, 0.115509033203125, 0.1248931884765625, 0.13427734375, 0.1436614990234375, 0.153045654296875, 0.1624298095703125, 0.17181396484375, 0.1811981201171875, 0.190582275390625, 0.1999664306640625, 0.2093505859375, 0.2187347412109375, 0.228118896484375, 0.2375030517578125, 0.24688720703125, 0.2562713623046875, 0.265655517578125, 0.2750396728515625, 0.284423828125]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 9.0, 35.0, 61.0, 214.0, 448.0, 195.0, 35.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10440338402986526, -0.09808691591024399, -0.09177044034004211, -0.08545397222042084, -0.07913750410079956, -0.07282103598117828, -0.06650456041097641, -0.06018809229135513, -0.05387162044644356, -0.04755514860153198, -0.041238680481910706, -0.03492220863699913, -0.028605738654732704, -0.022289268672466278, -0.015972796827554703, -0.009656328707933426, -0.0033398568630218506, 0.002976613584905863, 0.009293084032833576, 0.015609554946422577, 0.021926024928689003, 0.02824249491095543, 0.034558966755867004, 0.04087543487548828, 0.04719190672039986, 0.05350837856531143, 0.05982484668493271, 0.06614132225513458, 0.07245779037475586, 0.07877425849437714, 0.08509072661399841, 0.09140719473361969, 0.09772367775440216, 0.10404014587402344, 0.11035662144422531, 0.11667308956384659, 0.12298955768346786, 0.12930603325366974, 0.13562250137329102, 0.1419389694929123, 0.14825543761253357, 0.15457190573215485, 0.16088837385177612, 0.1672048568725586, 0.17352132499217987, 0.17983779311180115, 0.18615426123142242, 0.1924707293510437, 0.19878721237182617, 0.20510368049144745, 0.21142014861106873, 0.2177366316318512, 0.22405309975147247, 0.23036956787109375, 0.23668603599071503, 0.2430025041103363, 0.24931897222995758, 0.25563544034957886, 0.26195192337036133, 0.2682683765888214, 0.2745848596096039, 0.28090131282806396, 0.28721779584884644, 0.2935342788696289, 0.299850732088089]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 8.0, 3.0, 6.0, 10.0, 15.0, 15.0, 16.0, 23.0, 15.0, 24.0, 19.0, 29.0, 17.0, 33.0, 30.0, 30.0, 26.0, 59.0, 33.0, 41.0, 36.0, 44.0, 28.0, 42.0, 41.0, 40.0, 33.0, 30.0, 29.0, 29.0, 27.0, 13.0, 20.0, 23.0, 24.0, 18.0, 14.0, 12.0, 16.0, 7.0, 4.0, 9.0, 3.0, 3.0, 5.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.02394580841064453, -0.023098502308130264, -0.022251196205615997, -0.02140389010310173, -0.020556584000587463, -0.019709277898073196, -0.01886197179555893, -0.018014665693044662, -0.017167359590530396, -0.01632005348801613, -0.015472747385501862, -0.014625441282987595, -0.013778135180473328, -0.01293082907795906, -0.012083522975444794, -0.011236216872930527, -0.01038891077041626, -0.009541604667901993, -0.008694298565387726, -0.007846992462873459, -0.006999686360359192, -0.006152380257844925, -0.005305074155330658, -0.004457768052816391, -0.003610461950302124, -0.002763155847787857, -0.00191584974527359, -0.0010685436427593231, -0.00022123754024505615, 0.0006260685622692108, 0.0014733746647834778, 0.0023206807672977448, 0.0031679868698120117, 0.004015292972326279, 0.004862599074840546, 0.005709905177354813, 0.00655721127986908, 0.0074045173823833466, 0.008251823484897614, 0.00909912958741188, 0.009946435689926147, 0.010793741792440414, 0.011641047894954681, 0.012488353997468948, 0.013335660099983215, 0.014182966202497482, 0.01503027230501175, 0.015877578407526016, 0.016724884510040283, 0.01757219061255455, 0.018419496715068817, 0.019266802817583084, 0.02011410892009735, 0.020961415022611618, 0.021808721125125885, 0.022656027227640152, 0.02350333333015442, 0.024350639432668686, 0.025197945535182953, 0.02604525163769722, 0.026892557740211487, 0.027739863842725754, 0.02858716994524002, 0.029434476047754288, 0.030281782150268555]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 4.0, 3.0, 8.0, 3.0, 2.0, 14.0, 7.0, 15.0, 16.0, 22.0, 20.0, 33.0, 36.0, 25.0, 38.0, 27.0, 43.0, 49.0, 40.0, 36.0, 43.0, 55.0, 62.0, 39.0, 35.0, 37.0, 34.0, 33.0, 25.0, 29.0, 30.0, 13.0, 22.0, 19.0, 11.0, 10.0, 10.0, 20.0, 6.0, 5.0, 3.0, 8.0, 1.0, 9.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-113.5625, -110.330078125, -107.09765625, -103.865234375, -100.6328125, -97.400390625, -94.16796875, -90.935546875, -87.703125, -84.470703125, -81.23828125, -78.005859375, -74.7734375, -71.541015625, -68.30859375, -65.076171875, -61.84375, -58.611328125, -55.37890625, -52.146484375, -48.9140625, -45.681640625, -42.44921875, -39.216796875, -35.984375, -32.751953125, -29.51953125, -26.287109375, -23.0546875, -19.822265625, -16.58984375, -13.357421875, -10.125, -6.892578125, -3.66015625, -0.427734375, 2.8046875, 6.037109375, 9.26953125, 12.501953125, 15.734375, 18.966796875, 22.19921875, 25.431640625, 28.6640625, 31.896484375, 35.12890625, 38.361328125, 41.59375, 44.826171875, 48.05859375, 51.291015625, 54.5234375, 57.755859375, 60.98828125, 64.220703125, 67.453125, 70.685546875, 73.91796875, 77.150390625, 80.3828125, 83.615234375, 86.84765625, 90.080078125, 93.3125]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 9.0, 9.0, 11.0, 16.0, 16.0, 19.0, 25.0, 29.0, 50.0, 53.0, 75.0, 128.0, 173.0, 282.0, 421.0, 712.0, 1321.0, 3020.0, 8485.0, 26752.0, 109766.0, 454466.0, 336853.0, 74866.0, 19453.0, 6203.0, 2439.0, 1108.0, 588.0, 387.0, 233.0, 141.0, 109.0, 77.0, 54.0, 60.0, 37.0, 26.0, 18.0, 16.0, 17.0, 15.0, 11.0, 7.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.328125, -16.784423828125, -16.24072265625, -15.697021484375, -15.1533203125, -14.609619140625, -14.06591796875, -13.522216796875, -12.978515625, -12.434814453125, -11.89111328125, -11.347412109375, -10.8037109375, -10.260009765625, -9.71630859375, -9.172607421875, -8.62890625, -8.085205078125, -7.54150390625, -6.997802734375, -6.4541015625, -5.910400390625, -5.36669921875, -4.822998046875, -4.279296875, -3.735595703125, -3.19189453125, -2.648193359375, -2.1044921875, -1.560791015625, -1.01708984375, -0.473388671875, 0.0703125, 0.614013671875, 1.15771484375, 1.701416015625, 2.2451171875, 2.788818359375, 3.33251953125, 3.876220703125, 4.419921875, 4.963623046875, 5.50732421875, 6.051025390625, 6.5947265625, 7.138427734375, 7.68212890625, 8.225830078125, 8.76953125, 9.313232421875, 9.85693359375, 10.400634765625, 10.9443359375, 11.488037109375, 12.03173828125, 12.575439453125, 13.119140625, 13.662841796875, 14.20654296875, 14.750244140625, 15.2939453125, 15.837646484375, 16.38134765625, 16.925048828125, 17.46875]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 5.0, 6.0, 6.0, 16.0, 24.0, 22.0, 28.0, 32.0, 56.0, 45.0, 51.0, 79.0, 60.0, 2118.0, 106.0, 69.0, 65.0, 61.0, 46.0, 29.0, 34.0, 29.0, 19.0, 13.0, 10.0, 10.0, 7.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-208.375, -201.568359375, -194.76171875, -187.955078125, -181.1484375, -174.341796875, -167.53515625, -160.728515625, -153.921875, -147.115234375, -140.30859375, -133.501953125, -126.6953125, -119.888671875, -113.08203125, -106.275390625, -99.46875, -92.662109375, -85.85546875, -79.048828125, -72.2421875, -65.435546875, -58.62890625, -51.822265625, -45.015625, -38.208984375, -31.40234375, -24.595703125, -17.7890625, -10.982421875, -4.17578125, 2.630859375, 9.4375, 16.244140625, 23.05078125, 29.857421875, 36.6640625, 43.470703125, 50.27734375, 57.083984375, 63.890625, 70.697265625, 77.50390625, 84.310546875, 91.1171875, 97.923828125, 104.73046875, 111.537109375, 118.34375, 125.150390625, 131.95703125, 138.763671875, 145.5703125, 152.376953125, 159.18359375, 165.990234375, 172.796875, 179.603515625, 186.41015625, 193.216796875, 200.0234375, 206.830078125, 213.63671875, 220.443359375, 227.25]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 9.0, 6.0, 16.0, 35.0, 37.0, 58.0, 113.0, 185.0, 370.0, 763.0, 1899.0, 10646.0, 598353.0, 2517830.0, 11785.0, 1935.0, 819.0, 387.0, 200.0, 100.0, 66.0, 47.0, 25.0, 7.0, 11.0, 5.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-49.53125, -48.03125, -46.53125, -45.03125, -43.53125, -42.03125, -40.53125, -39.03125, -37.53125, -36.03125, -34.53125, -33.03125, -31.53125, -30.03125, -28.53125, -27.03125, -25.53125, -24.03125, -22.53125, -21.03125, -19.53125, -18.03125, -16.53125, -15.03125, -13.53125, -12.03125, -10.53125, -9.03125, -7.53125, -6.03125, -4.53125, -3.03125, -1.53125, -0.03125, 1.46875, 2.96875, 4.46875, 5.96875, 7.46875, 8.96875, 10.46875, 11.96875, 13.46875, 14.96875, 16.46875, 17.96875, 19.46875, 20.96875, 22.46875, 23.96875, 25.46875, 26.96875, 28.46875, 29.96875, 31.46875, 32.96875, 34.46875, 35.96875, 37.46875, 38.96875, 40.46875, 41.96875, 43.46875, 44.96875, 46.46875]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 8.0, 24.0, 119.0, 275.0, 345.0, 145.0, 49.0, 21.0, 9.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-208.8161163330078, -191.63790893554688, -174.45970153808594, -157.281494140625, -140.10330200195312, -122.92508697509766, -105.74688720703125, -88.56867980957031, -71.39047241210938, -54.21226501464844, -37.034061431884766, -19.855857849121094, -2.6776504516601562, 14.500556945800781, 31.678756713867188, 48.856964111328125, 66.03517150878906, 83.21337890625, 100.39158630371094, 117.56978607177734, 134.74798583984375, 151.92620849609375, 169.10440063476562, 186.28260803222656, 203.4608154296875, 220.63902282714844, 237.81723022460938, 254.99542236328125, 272.17364501953125, 289.3518371582031, 306.530029296875, 323.708251953125, 340.88641357421875, 358.0646057128906, 375.2428283691406, 392.4210205078125, 409.5992431640625, 426.7774353027344, 443.95562744140625, 461.13385009765625, 478.31207275390625, 495.4902648925781, 512.66845703125, 529.8466796875, 547.02490234375, 564.203125, 581.3812866210938, 598.5595092773438, 615.7376708984375, 632.9158935546875, 650.0940551757812, 667.2722778320312, 684.4505004882812, 701.6287231445312, 718.806884765625, 735.985107421875, 753.163330078125, 770.341552734375, 787.5197143554688, 804.6979370117188, 821.8761596679688, 839.0543823242188, 856.2325439453125, 873.4107666015625, 890.5889892578125]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 5.0, 5.0, 7.0, 7.0, 8.0, 7.0, 13.0, 13.0, 16.0, 21.0, 32.0, 38.0, 30.0, 38.0, 48.0, 34.0, 44.0, 54.0, 45.0, 49.0, 45.0, 42.0, 36.0, 36.0, 63.0, 40.0, 39.0, 34.0, 27.0, 15.0, 20.0, 18.0, 15.0, 18.0, 9.0, 5.0, 9.0, 13.0, 8.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-209.4662628173828, -202.9014892578125, -196.3367156982422, -189.77194213867188, -183.20716857910156, -176.64239501953125, -170.07763671875, -163.51284790039062, -156.94808959960938, -150.38331604003906, -143.81854248046875, -137.25376892089844, -130.68899536132812, -124.12422180175781, -117.55945587158203, -110.99468231201172, -104.42990112304688, -97.86512756347656, -91.30035400390625, -84.73558044433594, -78.17080688476562, -71.60603332519531, -65.04126739501953, -58.47649383544922, -51.911720275878906, -45.346946716308594, -38.78217315673828, -32.217403411865234, -25.652629852294922, -19.08785629272461, -12.523086547851562, -5.95831298828125, 0.6064453125, 7.171217918395996, 13.735990524291992, 20.300762176513672, 26.865535736083984, 33.4303092956543, 39.995079040527344, 46.559852600097656, 53.12462615966797, 59.68939971923828, 66.2541732788086, 72.81893920898438, 79.38371276855469, 85.948486328125, 92.51325988769531, 99.07803344726562, 105.64280700683594, 112.20758056640625, 118.77235412597656, 125.33712768554688, 131.9019012451172, 138.4666748046875, 145.03143310546875, 151.59622192382812, 158.16098022460938, 164.7257537841797, 171.29052734375, 177.8553009033203, 184.42007446289062, 190.98484802246094, 197.54962158203125, 204.1143798828125, 210.67916870117188]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 5.0, 8.0, 8.0, 14.0, 16.0, 20.0, 31.0, 37.0, 40.0, 50.0, 71.0, 110.0, 141.0, 183.0, 257.0, 334.0, 523.0, 789.0, 1294.0, 1040768.0, 1265.0, 721.0, 524.0, 349.0, 250.0, 177.0, 135.0, 119.0, 64.0, 53.0, 33.0, 34.0, 36.0, 23.0, 7.0, 8.0, 15.0, 9.0, 8.0, 1.0, 2.0, 4.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-68.3751449584961, -66.1307144165039, -63.88628387451172, -61.64185333251953, -59.397422790527344, -57.152992248535156, -54.9085578918457, -52.664127349853516, -50.41969680786133, -48.17526626586914, -45.93083572387695, -43.686405181884766, -41.44197082519531, -39.197540283203125, -36.95310974121094, -34.70867919921875, -32.46424865722656, -30.219818115234375, -27.975387573242188, -25.730955123901367, -23.48652458190918, -21.242094039916992, -18.997661590576172, -16.753231048583984, -14.508800506591797, -12.26436996459961, -10.019938468933105, -7.77550745010376, -5.531076431274414, -3.2866458892822266, -1.0422143936157227, 1.2022171020507812, 3.4466552734375, 5.691086292266846, 7.935517311096191, 10.179948806762695, 12.424379348754883, 14.66880989074707, 16.91324234008789, 19.157672882080078, 21.402103424072266, 23.646533966064453, 25.89096450805664, 28.13539695739746, 30.37982749938965, 32.62425994873047, 34.868690490722656, 37.113121032714844, 39.35755157470703, 41.60198211669922, 43.846412658691406, 46.090843200683594, 48.33527374267578, 50.57970428466797, 52.82413864135742, 55.06856918334961, 57.3129997253418, 59.557430267333984, 61.80186080932617, 64.04629516601562, 66.29072570800781, 68.53515625, 70.77958679199219, 73.02401733398438, 75.26844787597656]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 0.0, 4.0, 5.0, 18.0, 15.0, 15.0, 23.0, 64.0, 125.0, 51436560.0, 26224.0, 72.0, 48.0, 17.0, 11.0, 9.0, 5.0, 2.0, 7.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2635.649169921875, -2541.3642578125, -2447.0791015625, -2352.7939453125, -2258.509033203125, -2164.22412109375, -2069.93896484375, -1975.6539306640625, -1881.368896484375, -1787.0838623046875, -1692.798828125, -1598.5137939453125, -1504.228759765625, -1409.9437255859375, -1315.65869140625, -1221.3736572265625, -1127.088623046875, -1032.8035888671875, -938.5185546875, -844.2335205078125, -749.948486328125, -655.6634521484375, -561.37841796875, -467.0933837890625, -372.808349609375, -278.5233154296875, -184.23828125, -89.9532470703125, 4.331787109375, 98.6168212890625, 192.90185546875, 287.1868896484375, 381.471923828125, 475.7569580078125, 570.0419921875, 664.3270263671875, 758.612060546875, 852.8970947265625, 947.18212890625, 1041.4671630859375, 1135.752197265625, 1230.0372314453125, 1324.322265625, 1418.6072998046875, 1512.892333984375, 1607.1773681640625, 1701.46240234375, 1795.7474365234375, 1890.032470703125, 1984.3175048828125, 2078.6025390625, 2172.8876953125, 2267.172607421875, 2361.45751953125, 2455.74267578125, 2550.02783203125, 2644.312744140625, 2738.59765625, 2832.8828125, 2927.16796875, 3021.452880859375, 3115.73779296875, 3210.02294921875, 3304.30810546875, 3398.593017578125]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 6.0, 11.0, 3.0, 13.0, 18.0, 25.0, 46.0, 60.0, 78.0, 122.0, 204.0, 260.0, 352.0, 484.0, 714.0, 1110.0, 1584.0, 2194.0, 3108.0, 4722.0, 7062.0, 10433.0, 15966.0, 24337.0, 37573.0, 60190.0, 97009.0, 161106.0, 266758.0, 412008.0, 3164188.0, 1013206.0, 378992.0, 239682.0, 144758.0, 87484.0, 54618.0, 34385.0, 22245.0, 14476.0, 9521.0, 6540.0, 4341.0, 2924.0, 2013.0, 1344.0, 962.0, 686.0, 446.0, 303.0, 232.0, 170.0, 132.0, 89.0, 59.0, 16.0, 17.0, 22.0, 17.0, 16.0, 7.0, 5.0, 3.0], "bins": [-2.04296875, -1.978912353515625, -1.91485595703125, -1.850799560546875, -1.7867431640625, -1.722686767578125, -1.65863037109375, -1.594573974609375, -1.530517578125, -1.466461181640625, -1.40240478515625, -1.338348388671875, -1.2742919921875, -1.210235595703125, -1.14617919921875, -1.082122802734375, -1.01806640625, -0.954010009765625, -0.88995361328125, -0.825897216796875, -0.7618408203125, -0.697784423828125, -0.63372802734375, -0.569671630859375, -0.505615234375, -0.441558837890625, -0.37750244140625, -0.313446044921875, -0.2493896484375, -0.185333251953125, -0.12127685546875, -0.057220458984375, 0.0068359375, 0.070892333984375, 0.13494873046875, 0.199005126953125, 0.2630615234375, 0.327117919921875, 0.39117431640625, 0.455230712890625, 0.519287109375, 0.583343505859375, 0.64739990234375, 0.711456298828125, 0.7755126953125, 0.839569091796875, 0.90362548828125, 0.967681884765625, 1.03173828125, 1.095794677734375, 1.15985107421875, 1.223907470703125, 1.2879638671875, 1.352020263671875, 1.41607666015625, 1.480133056640625, 1.544189453125, 1.608245849609375, 1.67230224609375, 1.736358642578125, 1.8004150390625, 1.864471435546875, 1.92852783203125, 1.992584228515625, 2.056640625]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [3.0, 3.0, 4.0, 0.0, 3.0, 1.0, 6.0, 4.0, 7.0, 6.0, 9.0, 2.0, 12.0, 10.0, 11.0, 12.0, 14.0, 19.0, 18.0, 18.0, 17.0, 22.0, 20.0, 32.0, 36.0, 42.0, 34.0, 34.0, 36.0, 34.0, 130.0, 846.0, 145.0, 38.0, 25.0, 34.0, 36.0, 38.0, 20.0, 28.0, 30.0, 20.0, 19.0, 23.0, 25.0, 17.0, 17.0, 17.0, 8.0, 9.0, 11.0, 8.0, 7.0, 6.0, 4.0, 2.0, 1.0, 2.0, 0.0, 4.0, 0.0, 5.0, 1.0, 3.0], "bins": [-17.84375, -17.2763671875, -16.708984375, -16.1416015625, -15.57421875, -15.0068359375, -14.439453125, -13.8720703125, -13.3046875, -12.7373046875, -12.169921875, -11.6025390625, -11.03515625, -10.4677734375, -9.900390625, -9.3330078125, -8.765625, -8.1982421875, -7.630859375, -7.0634765625, -6.49609375, -5.9287109375, -5.361328125, -4.7939453125, -4.2265625, -3.6591796875, -3.091796875, -2.5244140625, -1.95703125, -1.3896484375, -0.822265625, -0.2548828125, 0.3125, 0.8798828125, 1.447265625, 2.0146484375, 2.58203125, 3.1494140625, 3.716796875, 4.2841796875, 4.8515625, 5.4189453125, 5.986328125, 6.5537109375, 7.12109375, 7.6884765625, 8.255859375, 8.8232421875, 9.390625, 9.9580078125, 10.525390625, 11.0927734375, 11.66015625, 12.2275390625, 12.794921875, 13.3623046875, 13.9296875, 14.4970703125, 15.064453125, 15.6318359375, 16.19921875, 16.7666015625, 17.333984375, 17.9013671875, 18.46875]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 6.0, 7.0, 11.0, 15.0, 20.0, 32.0, 47.0, 84.0, 119.0, 188.0, 246.0, 397.0, 675.0, 978.0, 1539.0, 2548.0, 4100.0, 6430.0, 10448.0, 16949.0, 27420.0, 44406.0, 72342.0, 118071.0, 192147.0, 296640.0, 418137.0, 3475598.0, 612463.0, 356863.0, 240890.0, 150864.0, 92523.0, 56730.0, 35196.0, 21383.0, 13190.0, 8177.0, 5030.0, 3110.0, 1951.0, 1234.0, 738.0, 520.0, 353.0, 202.0, 146.0, 96.0, 52.0, 46.0, 28.0, 19.0, 16.0, 7.0, 7.0, 8.0, 3.0, 2.0], "bins": [-1.7060546875, -1.6555023193359375, -1.604949951171875, -1.5543975830078125, -1.50384521484375, -1.4532928466796875, -1.402740478515625, -1.3521881103515625, -1.3016357421875, -1.2510833740234375, -1.200531005859375, -1.1499786376953125, -1.09942626953125, -1.0488739013671875, -0.998321533203125, -0.9477691650390625, -0.897216796875, -0.8466644287109375, -0.796112060546875, -0.7455596923828125, -0.69500732421875, -0.6444549560546875, -0.593902587890625, -0.5433502197265625, -0.4927978515625, -0.4422454833984375, -0.391693115234375, -0.3411407470703125, -0.29058837890625, -0.2400360107421875, -0.189483642578125, -0.1389312744140625, -0.08837890625, -0.0378265380859375, 0.012725830078125, 0.0632781982421875, 0.11383056640625, 0.1643829345703125, 0.214935302734375, 0.2654876708984375, 0.3160400390625, 0.3665924072265625, 0.417144775390625, 0.4676971435546875, 0.51824951171875, 0.5688018798828125, 0.619354248046875, 0.6699066162109375, 0.720458984375, 0.7710113525390625, 0.821563720703125, 0.8721160888671875, 0.92266845703125, 0.9732208251953125, 1.023773193359375, 1.0743255615234375, 1.1248779296875, 1.1754302978515625, 1.225982666015625, 1.2765350341796875, 1.32708740234375, 1.3776397705078125, 1.428192138671875, 1.4787445068359375, 1.529296875]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 7.0, 2.0, 4.0, 7.0, 2.0, 6.0, 12.0, 14.0, 8.0, 20.0, 19.0, 17.0, 24.0, 27.0, 29.0, 28.0, 27.0, 34.0, 41.0, 41.0, 41.0, 41.0, 79.0, 972.0, 98.0, 35.0, 35.0, 39.0, 40.0, 34.0, 35.0, 29.0, 25.0, 23.0, 27.0, 27.0, 12.0, 12.0, 16.0, 14.0, 5.0, 6.0, 6.0, 3.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.9140625, -14.3897705078125, -13.865478515625, -13.3411865234375, -12.81689453125, -12.2926025390625, -11.768310546875, -11.2440185546875, -10.7197265625, -10.1954345703125, -9.671142578125, -9.1468505859375, -8.62255859375, -8.0982666015625, -7.573974609375, -7.0496826171875, -6.525390625, -6.0010986328125, -5.476806640625, -4.9525146484375, -4.42822265625, -3.9039306640625, -3.379638671875, -2.8553466796875, -2.3310546875, -1.8067626953125, -1.282470703125, -0.7581787109375, -0.23388671875, 0.2904052734375, 0.814697265625, 1.3389892578125, 1.86328125, 2.3875732421875, 2.911865234375, 3.4361572265625, 3.96044921875, 4.4847412109375, 5.009033203125, 5.5333251953125, 6.0576171875, 6.5819091796875, 7.106201171875, 7.6304931640625, 8.15478515625, 8.6790771484375, 9.203369140625, 9.7276611328125, 10.251953125, 10.7762451171875, 11.300537109375, 11.8248291015625, 12.34912109375, 12.8734130859375, 13.397705078125, 13.9219970703125, 14.4462890625, 14.9705810546875, 15.494873046875, 16.0191650390625, 16.54345703125, 17.0677490234375, 17.592041015625, 18.1163330078125, 18.640625]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 1.0, 6.0, 3.0, 7.0, 11.0, 18.0, 10.0, 23.0, 44.0, 43.0, 75.0, 93.0, 162.0, 199.0, 300.0, 412.0, 650.0, 882.0, 1325.0, 1988.0, 3033.0, 4553.0, 7174.0, 11100.0, 17320.0, 27974.0, 44461.0, 71650.0, 123970.0, 5609537.0, 149308.0, 80058.0, 49346.0, 31318.0, 19730.0, 12180.0, 7589.0, 5005.0, 3283.0, 2162.0, 1421.0, 941.0, 618.0, 408.0, 300.0, 196.0, 167.0, 129.0, 75.0, 67.0, 32.0, 25.0, 23.0, 13.0, 4.0, 5.0, 9.0, 8.0, 2.0, 3.0], "bins": [-3.751953125, -3.64031982421875, -3.5286865234375, -3.41705322265625, -3.305419921875, -3.19378662109375, -3.0821533203125, -2.97052001953125, -2.85888671875, -2.74725341796875, -2.6356201171875, -2.52398681640625, -2.412353515625, -2.30072021484375, -2.1890869140625, -2.07745361328125, -1.9658203125, -1.85418701171875, -1.7425537109375, -1.63092041015625, -1.519287109375, -1.40765380859375, -1.2960205078125, -1.18438720703125, -1.07275390625, -0.96112060546875, -0.8494873046875, -0.73785400390625, -0.626220703125, -0.51458740234375, -0.4029541015625, -0.29132080078125, -0.1796875, -0.06805419921875, 0.0435791015625, 0.15521240234375, 0.266845703125, 0.37847900390625, 0.4901123046875, 0.60174560546875, 0.71337890625, 0.82501220703125, 0.9366455078125, 1.04827880859375, 1.159912109375, 1.27154541015625, 1.3831787109375, 1.49481201171875, 1.6064453125, 1.71807861328125, 1.8297119140625, 1.94134521484375, 2.052978515625, 2.16461181640625, 2.2762451171875, 2.38787841796875, 2.49951171875, 2.61114501953125, 2.7227783203125, 2.83441162109375, 2.946044921875, 3.05767822265625, 3.1693115234375, 3.28094482421875, 3.392578125]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 3.0, 1.0, 10.0, 5.0, 5.0, 16.0, 11.0, 11.0, 16.0, 17.0, 18.0, 26.0, 27.0, 24.0, 27.0, 34.0, 28.0, 31.0, 37.0, 51.0, 39.0, 45.0, 802.0, 290.0, 44.0, 37.0, 37.0, 45.0, 38.0, 36.0, 31.0, 26.0, 24.0, 23.0, 21.0, 17.0, 10.0, 8.0, 21.0, 10.0, 5.0, 8.0, 6.0, 6.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.03125, -12.608154296875, -12.18505859375, -11.761962890625, -11.3388671875, -10.915771484375, -10.49267578125, -10.069580078125, -9.646484375, -9.223388671875, -8.80029296875, -8.377197265625, -7.9541015625, -7.531005859375, -7.10791015625, -6.684814453125, -6.26171875, -5.838623046875, -5.41552734375, -4.992431640625, -4.5693359375, -4.146240234375, -3.72314453125, -3.300048828125, -2.876953125, -2.453857421875, -2.03076171875, -1.607666015625, -1.1845703125, -0.761474609375, -0.33837890625, 0.084716796875, 0.5078125, 0.930908203125, 1.35400390625, 1.777099609375, 2.2001953125, 2.623291015625, 3.04638671875, 3.469482421875, 3.892578125, 4.315673828125, 4.73876953125, 5.161865234375, 5.5849609375, 6.008056640625, 6.43115234375, 6.854248046875, 7.27734375, 7.700439453125, 8.12353515625, 8.546630859375, 8.9697265625, 9.392822265625, 9.81591796875, 10.239013671875, 10.662109375, 11.085205078125, 11.50830078125, 11.931396484375, 12.3544921875, 12.777587890625, 13.20068359375, 13.623779296875, 14.046875]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 9.0, 5.0, 21.0, 63.0, 144.0, 316.0, 279.0, 101.0, 34.0, 23.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.8656234741211, -85.40959167480469, -82.95355224609375, -80.49751281738281, -78.0414810180664, -75.58544921875, -73.12940979003906, -70.67337036132812, -68.21733856201172, -65.76130676269531, -63.305267333984375, -60.8492317199707, -58.39319610595703, -55.93716049194336, -53.48112487792969, -51.025089263916016, -48.569053649902344, -46.11301803588867, -43.656982421875, -41.20094680786133, -38.744911193847656, -36.288875579833984, -33.83283996582031, -31.37680435180664, -28.92076873779297, -26.464733123779297, -24.008697509765625, -21.552661895751953, -19.09662628173828, -16.64059066772461, -14.184555053710938, -11.728519439697266, -9.272476196289062, -6.816440582275391, -4.360404968261719, -1.9043693542480469, 0.551666259765625, 3.007701873779297, 5.463737487792969, 7.919773101806641, 10.375808715820312, 12.831844329833984, 15.287879943847656, 17.743915557861328, 20.199951171875, 22.655986785888672, 25.112022399902344, 27.568058013916016, 30.024093627929688, 32.48012924194336, 34.93616485595703, 37.3922004699707, 39.848236083984375, 42.30427169799805, 44.76030731201172, 47.21634292602539, 49.67237854003906, 52.128414154052734, 54.584449768066406, 57.04048538208008, 59.49652099609375, 61.95255661010742, 64.4085922241211, 66.8646240234375, 69.32066345214844]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 5.0, 3.0, 1.0, 5.0, 6.0, 9.0, 9.0, 13.0, 13.0, 26.0, 22.0, 31.0, 34.0, 32.0, 48.0, 43.0, 49.0, 42.0, 59.0, 49.0, 52.0, 38.0, 43.0, 42.0, 47.0, 34.0, 42.0, 41.0, 24.0, 33.0, 26.0, 17.0, 21.0, 5.0, 16.0, 10.0, 4.0, 6.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-42.56077575683594, -41.389495849609375, -40.21821975708008, -39.046939849853516, -37.87565994262695, -36.704383850097656, -35.533103942871094, -34.36182403564453, -33.19054412841797, -32.019264221191406, -30.847986221313477, -29.676708221435547, -28.505428314208984, -27.334150314331055, -26.162872314453125, -24.991592407226562, -23.820316314697266, -22.649038314819336, -21.477758407592773, -20.306480407714844, -19.13520050048828, -17.96392250061035, -16.792644500732422, -15.621365547180176, -14.45008659362793, -13.278807640075684, -12.107528686523438, -10.936250686645508, -9.764971733093262, -8.593692779541016, -7.422414302825928, -6.25113582611084, -5.079856872558594, -3.9085781574249268, -2.7372994422912598, -1.5660207271575928, -0.3947420120239258, 0.7765369415283203, 1.9478154182434082, 3.119093894958496, 4.290372848510742, 5.461651802062988, 6.632930278778076, 7.804208755493164, 8.97548770904541, 10.146766662597656, 11.318044662475586, 12.489323616027832, 13.660602569580078, 14.831881523132324, 16.00316047668457, 17.1744384765625, 18.345718383789062, 19.516996383666992, 20.688274383544922, 21.859554290771484, 23.030832290649414, 24.202110290527344, 25.373390197753906, 26.544668197631836, 27.715946197509766, 28.887226104736328, 30.058504104614258, 31.229782104492188, 32.40106201171875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 5.0, 1.0, 8.0, 5.0, 9.0, 7.0, 10.0, 20.0, 29.0, 37.0, 66.0, 60.0, 148.0, 172.0, 363.0, 664.0, 1347.0, 2929.0, 8087.0, 39112.0, 4018355.0, 102597.0, 13263.0, 3880.0, 1591.0, 710.0, 333.0, 193.0, 112.0, 60.0, 36.0, 26.0, 12.0, 11.0, 4.0, 8.0, 3.0, 4.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.44384765625, -0.428375244140625, -0.41290283203125, -0.397430419921875, -0.3819580078125, -0.366485595703125, -0.35101318359375, -0.335540771484375, -0.320068359375, -0.304595947265625, -0.28912353515625, -0.273651123046875, -0.2581787109375, -0.242706298828125, -0.22723388671875, -0.211761474609375, -0.1962890625, -0.180816650390625, -0.16534423828125, -0.149871826171875, -0.1343994140625, -0.118927001953125, -0.10345458984375, -0.087982177734375, -0.072509765625, -0.057037353515625, -0.04156494140625, -0.026092529296875, -0.0106201171875, 0.004852294921875, 0.02032470703125, 0.035797119140625, 0.05126953125, 0.066741943359375, 0.08221435546875, 0.097686767578125, 0.1131591796875, 0.128631591796875, 0.14410400390625, 0.159576416015625, 0.175048828125, 0.190521240234375, 0.20599365234375, 0.221466064453125, 0.2369384765625, 0.252410888671875, 0.26788330078125, 0.283355712890625, 0.298828125, 0.314300537109375, 0.32977294921875, 0.345245361328125, 0.3607177734375, 0.376190185546875, 0.39166259765625, 0.407135009765625, 0.422607421875, 0.438079833984375, 0.45355224609375, 0.469024658203125, 0.4844970703125, 0.499969482421875, 0.51544189453125, 0.530914306640625, 0.54638671875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 5.0, 0.0, 2.0, 3.0, 2.0, 4.0, 1.0, 4.0, 6.0, 4.0, 7.0, 9.0, 14.0, 11.0, 13.0, 11.0, 23.0, 751.0, 37.0, 19.0, 11.0, 6.0, 12.0, 11.0, 7.0, 6.0, 7.0, 7.0, 3.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.17529296875, -0.17037391662597656, -0.16545486450195312, -0.1605358123779297, -0.15561676025390625, -0.1506977081298828, -0.14577865600585938, -0.14085960388183594, -0.1359405517578125, -0.13102149963378906, -0.12610244750976562, -0.12118339538574219, -0.11626434326171875, -0.11134529113769531, -0.10642623901367188, -0.10150718688964844, -0.096588134765625, -0.09166908264160156, -0.08675003051757812, -0.08183097839355469, -0.07691192626953125, -0.07199287414550781, -0.06707382202148438, -0.06215476989746094, -0.0572357177734375, -0.05231666564941406, -0.047397613525390625, -0.04247856140136719, -0.03755950927734375, -0.03264045715332031, -0.027721405029296875, -0.022802352905273438, -0.01788330078125, -0.012964248657226562, -0.008045196533203125, -0.0031261444091796875, 0.00179290771484375, 0.0067119598388671875, 0.011631011962890625, 0.016550064086914062, 0.0214691162109375, 0.026388168334960938, 0.031307220458984375, 0.03622627258300781, 0.04114532470703125, 0.04606437683105469, 0.050983428955078125, 0.05590248107910156, 0.060821533203125, 0.06574058532714844, 0.07065963745117188, 0.07557868957519531, 0.08049774169921875, 0.08541679382324219, 0.09033584594726562, 0.09525489807128906, 0.1001739501953125, 0.10509300231933594, 0.11001205444335938, 0.11493110656738281, 0.11985015869140625, 0.12476921081542969, 0.12968826293945312, 0.13460731506347656, 0.1395263671875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 8.0, 3.0, 5.0, 16.0, 18.0, 26.0, 38.0, 70.0, 120.0, 212.0, 370.0, 609.0, 1162.0, 2348.0, 4996.0, 11625.0, 33125.0, 155212.0, 3092514.0, 779167.0, 77507.0, 20900.0, 7443.0, 3272.0, 1503.0, 811.0, 445.0, 279.0, 174.0, 111.0, 50.0, 42.0, 31.0, 19.0, 15.0, 11.0, 12.0, 8.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.350341796875, -0.3408203125, -0.331298828125, -0.32177734375, -0.312255859375, -0.302734375, -0.293212890625, -0.28369140625, -0.274169921875, -0.2646484375, -0.255126953125, -0.24560546875, -0.236083984375, -0.2265625, -0.217041015625, -0.20751953125, -0.197998046875, -0.1884765625, -0.178955078125, -0.16943359375, -0.159912109375, -0.150390625, -0.140869140625, -0.13134765625, -0.121826171875, -0.1123046875, -0.102783203125, -0.09326171875, -0.083740234375, -0.07421875, -0.064697265625, -0.05517578125, -0.045654296875, -0.0361328125, -0.026611328125, -0.01708984375, -0.007568359375, 0.001953125, 0.011474609375, 0.02099609375, 0.030517578125, 0.0400390625, 0.049560546875, 0.05908203125, 0.068603515625, 0.078125, 0.087646484375, 0.09716796875, 0.106689453125, 0.1162109375, 0.125732421875, 0.13525390625, 0.144775390625, 0.154296875, 0.163818359375, 0.17333984375, 0.182861328125, 0.1923828125, 0.201904296875, 0.21142578125, 0.220947265625, 0.23046875, 0.239990234375, 0.24951171875, 0.259033203125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 6.0, 10.0, 7.0, 3.0, 6.0, 11.0, 12.0, 15.0, 20.0, 40.0, 45.0, 75.0, 169.0, 299.0, 841.0, 1364.0, 557.0, 223.0, 114.0, 75.0, 66.0, 31.0, 25.0, 13.0, 15.0, 10.0, 5.0, 2.0, 3.0, 3.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.145263671875, -0.1399364471435547, -0.13460922241210938, -0.12928199768066406, -0.12395477294921875, -0.11862754821777344, -0.11330032348632812, -0.10797309875488281, -0.1026458740234375, -0.09731864929199219, -0.09199142456054688, -0.08666419982910156, -0.08133697509765625, -0.07600975036621094, -0.07068252563476562, -0.06535530090332031, -0.060028076171875, -0.05470085144042969, -0.049373626708984375, -0.04404640197753906, -0.03871917724609375, -0.03339195251464844, -0.028064727783203125, -0.022737503051757812, -0.0174102783203125, -0.012083053588867188, -0.006755828857421875, -0.0014286041259765625, 0.00389862060546875, 0.009225845336914062, 0.014553070068359375, 0.019880294799804688, 0.02520751953125, 0.030534744262695312, 0.035861968994140625, 0.04118919372558594, 0.04651641845703125, 0.05184364318847656, 0.057170867919921875, 0.06249809265136719, 0.0678253173828125, 0.07315254211425781, 0.07847976684570312, 0.08380699157714844, 0.08913421630859375, 0.09446144104003906, 0.09978866577148438, 0.10511589050292969, 0.110443115234375, 0.11577033996582031, 0.12109756469726562, 0.12642478942871094, 0.13175201416015625, 0.13707923889160156, 0.14240646362304688, 0.1477336883544922, 0.1530609130859375, 0.1583881378173828, 0.16371536254882812, 0.16904258728027344, 0.17436981201171875, 0.17969703674316406, 0.18502426147460938, 0.1903514862060547, 0.1956787109375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 18.0, 108.0, 481.0, 327.0, 53.0, 12.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-3.786720037460327, -3.716315269470215, -3.6459105014801025, -3.5755057334899902, -3.505100965499878, -3.4346961975097656, -3.3642914295196533, -3.293886661529541, -3.223482131958008, -3.1530773639678955, -3.082672595977783, -3.012267827987671, -2.9418630599975586, -2.8714582920074463, -2.801053524017334, -2.730648994445801, -2.6602439880371094, -2.589839220046997, -2.5194344520568848, -2.4490296840667725, -2.37862491607666, -2.308220148086548, -2.2378153800964355, -2.1674108505249023, -2.097005844116211, -2.0266010761260986, -1.9561963081359863, -1.885791540145874, -1.8153867721557617, -1.7449820041656494, -1.6745773553848267, -1.6041725873947144, -1.5337679386138916, -1.4633631706237793, -1.392958402633667, -1.3225536346435547, -1.2521488666534424, -1.18174409866333, -1.1113394498825073, -1.040934681892395, -0.9705298542976379, -0.9001250863075256, -0.8297203779220581, -0.7593156099319458, -0.6889108419418335, -0.6185060739517212, -0.5481013059616089, -0.47769659757614136, -0.40729182958602905, -0.33688706159591675, -0.26648232340812683, -0.19607757031917572, -0.1256728172302246, -0.055268049240112305, 0.015136688947677612, 0.08554142713546753, 0.15594619512557983, 0.22635094821453094, 0.29675570130348206, 0.367160439491272, 0.4375652074813843, 0.5079699754714966, 0.5783747434616089, 0.6487794518470764, 0.7191842198371887]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 2.0, 10.0, 2.0, 9.0, 11.0, 14.0, 20.0, 30.0, 36.0, 40.0, 66.0, 63.0, 63.0, 67.0, 75.0, 79.0, 70.0, 78.0, 54.0, 46.0, 44.0, 37.0, 20.0, 16.0, 20.0, 14.0, 5.0, 6.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.6763163208961487, -0.6550523042678833, -0.6337883472442627, -0.6125243306159973, -0.5912603139877319, -0.5699962973594666, -0.5487322807312012, -0.5274683237075806, -0.5062043070793152, -0.4849402904510498, -0.4636763036251068, -0.4424123167991638, -0.42114830017089844, -0.39988428354263306, -0.37862029671669006, -0.35735630989074707, -0.3360922932624817, -0.3148282766342163, -0.2935642898082733, -0.2723003029823303, -0.25103628635406494, -0.22977228462696075, -0.20850828289985657, -0.18724428117275238, -0.1659802794456482, -0.144716277718544, -0.12345227599143982, -0.10218827426433563, -0.08092427253723145, -0.05966027081012726, -0.03839626908302307, -0.017132267355918884, 0.004131793975830078, 0.025395795702934265, 0.04665979743003845, 0.06792379915714264, 0.08918780088424683, 0.11045180261135101, 0.1317158043384552, 0.1529798060655594, 0.17424380779266357, 0.19550780951976776, 0.21677181124687195, 0.23803581297397614, 0.2592998147010803, 0.2805638313293457, 0.3018278181552887, 0.3230918049812317, 0.34435582160949707, 0.36561983823776245, 0.38688382506370544, 0.40814781188964844, 0.4294118285179138, 0.4506758451461792, 0.4719398319721222, 0.4932038187980652, 0.5144678354263306, 0.535731852054596, 0.5569958686828613, 0.5782598257064819, 0.5995238423347473, 0.6207878589630127, 0.6420518159866333, 0.6633158326148987, 0.6845798492431641]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 7.0, 3.0, 5.0, 6.0, 11.0, 15.0, 21.0, 40.0, 41.0, 65.0, 68.0, 130.0, 169.0, 274.0, 449.0, 672.0, 1157.0, 2015.0, 3678.0, 6718.0, 14294.0, 33401.0, 845278.0, 90388.0, 25353.0, 11327.0, 5641.0, 2948.0, 1681.0, 1000.0, 534.0, 385.0, 245.0, 165.0, 105.0, 68.0, 51.0, 38.0, 18.0, 25.0, 21.0, 12.0, 17.0, 12.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.82080078125, -0.7923507690429688, -0.7639007568359375, -0.7354507446289062, -0.707000732421875, -0.6785507202148438, -0.6501007080078125, -0.6216506958007812, -0.59320068359375, -0.5647506713867188, -0.5363006591796875, -0.5078506469726562, -0.479400634765625, -0.45095062255859375, -0.4225006103515625, -0.39405059814453125, -0.3656005859375, -0.33715057373046875, -0.3087005615234375, -0.28025054931640625, -0.251800537109375, -0.22335052490234375, -0.1949005126953125, -0.16645050048828125, -0.13800048828125, -0.10955047607421875, -0.0811004638671875, -0.05265045166015625, -0.024200439453125, 0.00424957275390625, 0.0326995849609375, 0.06114959716796875, 0.089599609375, 0.11804962158203125, 0.1464996337890625, 0.17494964599609375, 0.203399658203125, 0.23184967041015625, 0.2602996826171875, 0.28874969482421875, 0.31719970703125, 0.34564971923828125, 0.3740997314453125, 0.40254974365234375, 0.430999755859375, 0.45944976806640625, 0.4878997802734375, 0.5163497924804688, 0.5447998046875, 0.5732498168945312, 0.6016998291015625, 0.6301498413085938, 0.658599853515625, 0.6870498657226562, 0.7154998779296875, 0.7439498901367188, 0.77239990234375, 0.8008499145507812, 0.8292999267578125, 0.8577499389648438, 0.886199951171875, 0.9146499633789062, 0.9430999755859375, 0.9715499877929688, 1.0]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 4.0, 1.0, 4.0, 2.0, 4.0, 5.0, 4.0, 6.0, 9.0, 11.0, 9.0, 12.0, 18.0, 15.0, 269.0, 516.0, 22.0, 12.0, 14.0, 5.0, 10.0, 13.0, 5.0, 4.0, 8.0, 5.0, 4.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.164306640625, -0.15961074829101562, -0.15491485595703125, -0.15021896362304688, -0.1455230712890625, -0.14082717895507812, -0.13613128662109375, -0.13143539428710938, -0.126739501953125, -0.12204360961914062, -0.11734771728515625, -0.11265182495117188, -0.1079559326171875, -0.10326004028320312, -0.09856414794921875, -0.09386825561523438, -0.08917236328125, -0.08447647094726562, -0.07978057861328125, -0.07508468627929688, -0.0703887939453125, -0.06569290161132812, -0.06099700927734375, -0.056301116943359375, -0.051605224609375, -0.046909332275390625, -0.04221343994140625, -0.037517547607421875, -0.0328216552734375, -0.028125762939453125, -0.02342987060546875, -0.018733978271484375, -0.0140380859375, -0.009342193603515625, -0.00464630126953125, 4.9591064453125e-05, 0.0047454833984375, 0.009441375732421875, 0.01413726806640625, 0.018833160400390625, 0.023529052734375, 0.028224945068359375, 0.03292083740234375, 0.037616729736328125, 0.0423126220703125, 0.047008514404296875, 0.05170440673828125, 0.056400299072265625, 0.06109619140625, 0.06579208374023438, 0.07048797607421875, 0.07518386840820312, 0.0798797607421875, 0.08457565307617188, 0.08927154541015625, 0.09396743774414062, 0.098663330078125, 0.10335922241210938, 0.10805511474609375, 0.11275100708007812, 0.1174468994140625, 0.12214279174804688, 0.12683868408203125, 0.13153457641601562, 0.13623046875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 9.0, 3.0, 8.0, 20.0, 16.0, 22.0, 37.0, 45.0, 55.0, 90.0, 126.0, 177.0, 260.0, 441.0, 646.0, 1163.0, 2092.0, 3888.0, 7631.0, 16006.0, 35130.0, 82991.0, 199821.0, 343872.0, 202017.0, 83255.0, 35296.0, 16255.0, 7788.0, 4066.0, 2157.0, 1151.0, 708.0, 412.0, 276.0, 176.0, 115.0, 87.0, 59.0, 44.0, 42.0, 26.0, 30.0, 11.0, 8.0, 10.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.36376953125, -0.3522224426269531, -0.34067535400390625, -0.3291282653808594, -0.3175811767578125, -0.3060340881347656, -0.29448699951171875, -0.2829399108886719, -0.271392822265625, -0.2598457336425781, -0.24829864501953125, -0.23675155639648438, -0.2252044677734375, -0.21365737915039062, -0.20211029052734375, -0.19056320190429688, -0.17901611328125, -0.16746902465820312, -0.15592193603515625, -0.14437484741210938, -0.1328277587890625, -0.12128067016601562, -0.10973358154296875, -0.09818649291992188, -0.086639404296875, -0.07509231567382812, -0.06354522705078125, -0.051998138427734375, -0.0404510498046875, -0.028903961181640625, -0.01735687255859375, -0.005809783935546875, 0.0057373046875, 0.017284393310546875, 0.02883148193359375, 0.040378570556640625, 0.0519256591796875, 0.06347274780273438, 0.07501983642578125, 0.08656692504882812, 0.098114013671875, 0.10966110229492188, 0.12120819091796875, 0.13275527954101562, 0.1443023681640625, 0.15584945678710938, 0.16739654541015625, 0.17894363403320312, 0.19049072265625, 0.20203781127929688, 0.21358489990234375, 0.22513198852539062, 0.2366790771484375, 0.24822616577148438, 0.25977325439453125, 0.2713203430175781, 0.282867431640625, 0.2944145202636719, 0.30596160888671875, 0.3175086975097656, 0.3290557861328125, 0.3406028747558594, 0.35214996337890625, 0.3636970520019531, 0.375244140625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 2.0, 9.0, 7.0, 15.0, 13.0, 9.0, 18.0, 16.0, 18.0, 21.0, 24.0, 29.0, 32.0, 31.0, 31.0, 37.0, 45.0, 45.0, 48.0, 39.0, 35.0, 43.0, 40.0, 55.0, 43.0, 38.0, 35.0, 27.0, 33.0, 15.0, 26.0, 22.0, 17.0, 20.0, 11.0, 13.0, 10.0, 6.0, 9.0, 4.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.537109375, -0.5199966430664062, -0.5028839111328125, -0.48577117919921875, -0.468658447265625, -0.45154571533203125, -0.4344329833984375, -0.41732025146484375, -0.40020751953125, -0.38309478759765625, -0.3659820556640625, -0.34886932373046875, -0.331756591796875, -0.31464385986328125, -0.2975311279296875, -0.28041839599609375, -0.2633056640625, -0.24619293212890625, -0.2290802001953125, -0.21196746826171875, -0.194854736328125, -0.17774200439453125, -0.1606292724609375, -0.14351654052734375, -0.12640380859375, -0.10929107666015625, -0.0921783447265625, -0.07506561279296875, -0.057952880859375, -0.04084014892578125, -0.0237274169921875, -0.00661468505859375, 0.010498046875, 0.02761077880859375, 0.0447235107421875, 0.06183624267578125, 0.078948974609375, 0.09606170654296875, 0.1131744384765625, 0.13028717041015625, 0.14739990234375, 0.16451263427734375, 0.1816253662109375, 0.19873809814453125, 0.215850830078125, 0.23296356201171875, 0.2500762939453125, 0.26718902587890625, 0.2843017578125, 0.30141448974609375, 0.3185272216796875, 0.33563995361328125, 0.352752685546875, 0.36986541748046875, 0.3869781494140625, 0.40409088134765625, 0.42120361328125, 0.43831634521484375, 0.4554290771484375, 0.47254180908203125, 0.489654541015625, 0.5067672729492188, 0.5238800048828125, 0.5409927368164062, 0.55810546875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 3.0, 5.0, 7.0, 13.0, 17.0, 18.0, 38.0, 57.0, 102.0, 147.0, 259.0, 501.0, 1124.0, 2898.0, 10898.0, 114289.0, 871400.0, 36633.0, 6399.0, 2028.0, 779.0, 392.0, 215.0, 105.0, 65.0, 55.0, 33.0, 20.0, 15.0, 12.0, 12.0, 8.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.658203125, -0.6357498168945312, -0.6132965087890625, -0.5908432006835938, -0.568389892578125, -0.5459365844726562, -0.5234832763671875, -0.5010299682617188, -0.47857666015625, -0.45612335205078125, -0.4336700439453125, -0.41121673583984375, -0.388763427734375, -0.36631011962890625, -0.3438568115234375, -0.32140350341796875, -0.2989501953125, -0.27649688720703125, -0.2540435791015625, -0.23159027099609375, -0.209136962890625, -0.18668365478515625, -0.1642303466796875, -0.14177703857421875, -0.11932373046875, -0.09687042236328125, -0.0744171142578125, -0.05196380615234375, -0.029510498046875, -0.00705718994140625, 0.0153961181640625, 0.03784942626953125, 0.060302734375, 0.08275604248046875, 0.1052093505859375, 0.12766265869140625, 0.150115966796875, 0.17256927490234375, 0.1950225830078125, 0.21747589111328125, 0.23992919921875, 0.26238250732421875, 0.2848358154296875, 0.30728912353515625, 0.329742431640625, 0.35219573974609375, 0.3746490478515625, 0.39710235595703125, 0.4195556640625, 0.44200897216796875, 0.4644622802734375, 0.48691558837890625, 0.509368896484375, 0.5318222045898438, 0.5542755126953125, 0.5767288208007812, 0.59918212890625, 0.6216354370117188, 0.6440887451171875, 0.6665420532226562, 0.688995361328125, 0.7114486694335938, 0.7339019775390625, 0.7563552856445312, 0.77880859375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 3.0, 10.0, 14.0, 19.0, 23.0, 61.0, 70.0, 97.0, 161.0, 154.0, 135.0, 83.0, 56.0, 49.0, 23.0, 14.0, 12.0, 11.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.072355270385742e-05, -4.915241152048111e-05, -4.75812703371048e-05, -4.6010129153728485e-05, -4.443898797035217e-05, -4.286784678697586e-05, -4.129670560359955e-05, -3.9725564420223236e-05, -3.8154423236846924e-05, -3.658328205347061e-05, -3.50121408700943e-05, -3.344099968671799e-05, -3.1869858503341675e-05, -3.0298717319965363e-05, -2.872757613658905e-05, -2.7156434953212738e-05, -2.5585293769836426e-05, -2.4014152586460114e-05, -2.24430114030838e-05, -2.087187021970749e-05, -1.9300729036331177e-05, -1.7729587852954865e-05, -1.6158446669578552e-05, -1.458730548620224e-05, -1.3016164302825928e-05, -1.1445023119449615e-05, -9.873881936073303e-06, -8.302740752696991e-06, -6.731599569320679e-06, -5.1604583859443665e-06, -3.589317202568054e-06, -2.018176019191742e-06, -4.470348358154297e-07, 1.1241063475608826e-06, 2.695247530937195e-06, 4.266388714313507e-06, 5.837529897689819e-06, 7.408671081066132e-06, 8.979812264442444e-06, 1.0550953447818756e-05, 1.2122094631195068e-05, 1.369323581457138e-05, 1.5264376997947693e-05, 1.6835518181324005e-05, 1.8406659364700317e-05, 1.997780054807663e-05, 2.1548941731452942e-05, 2.3120082914829254e-05, 2.4691224098205566e-05, 2.626236528158188e-05, 2.783350646495819e-05, 2.9404647648334503e-05, 3.0975788831710815e-05, 3.254693001508713e-05, 3.411807119846344e-05, 3.568921238183975e-05, 3.7260353565216064e-05, 3.883149474859238e-05, 4.040263593196869e-05, 4.1973777115345e-05, 4.3544918298721313e-05, 4.5116059482097626e-05, 4.668720066547394e-05, 4.825834184885025e-05, 4.982948303222656e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 5.0, 1.0, 1.0, 3.0, 9.0, 12.0, 22.0, 16.0, 18.0, 34.0, 48.0, 65.0, 98.0, 136.0, 157.0, 311.0, 500.0, 712.0, 1239.0, 2217.0, 4069.0, 8727.0, 21787.0, 70175.0, 324699.0, 460006.0, 103002.0, 28707.0, 10685.0, 4791.0, 2522.0, 1385.0, 857.0, 515.0, 325.0, 207.0, 128.0, 100.0, 73.0, 41.0, 44.0, 24.0, 26.0, 17.0, 9.0, 10.0, 5.0, 4.0, 2.0, 4.0, 7.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.371337890625, -0.36013031005859375, -0.3489227294921875, -0.33771514892578125, -0.326507568359375, -0.31529998779296875, -0.3040924072265625, -0.29288482666015625, -0.28167724609375, -0.27046966552734375, -0.2592620849609375, -0.24805450439453125, -0.236846923828125, -0.22563934326171875, -0.2144317626953125, -0.20322418212890625, -0.1920166015625, -0.18080902099609375, -0.1696014404296875, -0.15839385986328125, -0.147186279296875, -0.13597869873046875, -0.1247711181640625, -0.11356353759765625, -0.10235595703125, -0.09114837646484375, -0.0799407958984375, -0.06873321533203125, -0.057525634765625, -0.04631805419921875, -0.0351104736328125, -0.02390289306640625, -0.0126953125, -0.00148773193359375, 0.0097198486328125, 0.02092742919921875, 0.032135009765625, 0.04334259033203125, 0.0545501708984375, 0.06575775146484375, 0.07696533203125, 0.08817291259765625, 0.0993804931640625, 0.11058807373046875, 0.121795654296875, 0.13300323486328125, 0.1442108154296875, 0.15541839599609375, 0.1666259765625, 0.17783355712890625, 0.1890411376953125, 0.20024871826171875, 0.211456298828125, 0.22266387939453125, 0.2338714599609375, 0.24507904052734375, 0.25628662109375, 0.26749420166015625, 0.2787017822265625, 0.28990936279296875, 0.301116943359375, 0.31232452392578125, 0.3235321044921875, 0.33473968505859375, 0.345947265625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 5.0, 4.0, 9.0, 11.0, 15.0, 17.0, 20.0, 31.0, 24.0, 27.0, 43.0, 32.0, 53.0, 67.0, 86.0, 77.0, 55.0, 76.0, 57.0, 60.0, 50.0, 35.0, 34.0, 19.0, 18.0, 21.0, 11.0, 11.0, 3.0, 3.0, 3.0, 1.0, 3.0, 2.0, 2.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.50634765625, -0.4898834228515625, -0.473419189453125, -0.4569549560546875, -0.44049072265625, -0.4240264892578125, -0.407562255859375, -0.3910980224609375, -0.3746337890625, -0.3581695556640625, -0.341705322265625, -0.3252410888671875, -0.30877685546875, -0.2923126220703125, -0.275848388671875, -0.2593841552734375, -0.242919921875, -0.2264556884765625, -0.209991455078125, -0.1935272216796875, -0.17706298828125, -0.1605987548828125, -0.144134521484375, -0.1276702880859375, -0.1112060546875, -0.0947418212890625, -0.078277587890625, -0.0618133544921875, -0.04534912109375, -0.0288848876953125, -0.012420654296875, 0.0040435791015625, 0.0205078125, 0.0369720458984375, 0.053436279296875, 0.0699005126953125, 0.08636474609375, 0.1028289794921875, 0.119293212890625, 0.1357574462890625, 0.1522216796875, 0.1686859130859375, 0.185150146484375, 0.2016143798828125, 0.21807861328125, 0.2345428466796875, 0.251007080078125, 0.2674713134765625, 0.283935546875, 0.3003997802734375, 0.316864013671875, 0.3333282470703125, 0.34979248046875, 0.3662567138671875, 0.382720947265625, 0.3991851806640625, 0.4156494140625, 0.4321136474609375, 0.448577880859375, 0.4650421142578125, 0.48150634765625, 0.4979705810546875, 0.514434814453125, 0.5308990478515625, 0.54736328125]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 1.0, 7.0, 10.0, 28.0, 52.0, 153.0, 386.0, 232.0, 90.0, 20.0, 13.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.209859848022461, -13.842630386352539, -13.4753999710083, -13.108170509338379, -12.740941047668457, -12.373710632324219, -12.006481170654297, -11.639251708984375, -11.272022247314453, -10.904792785644531, -10.537562370300293, -10.170332908630371, -9.80310344696045, -9.435873031616211, -9.068643569946289, -8.701414108276367, -8.334183692932129, -7.966953754425049, -7.599724292755127, -7.232494354248047, -6.865264892578125, -6.498034954071045, -6.130805015563965, -5.763575553894043, -5.396345615386963, -5.029115676879883, -4.661886215209961, -4.294656276702881, -3.92742657661438, -3.560196876525879, -3.192966938018799, -2.825737237930298, -2.4585084915161133, -2.0912787914276123, -1.7240489721298218, -1.3568191528320312, -0.9895894527435303, -0.6223597526550293, -0.2551298141479492, 0.11209988594055176, 0.47932958602905273, 0.8465593457221985, 1.2137891054153442, 1.5810189247131348, 1.9482486248016357, 2.3154783248901367, 2.682708263397217, 3.0499379634857178, 3.4171676635742188, 3.7843973636627197, 4.151627063751221, 4.518857002258301, 4.886086463928223, 5.253316402435303, 5.620546340942383, 5.987775802612305, 6.355005741119385, 6.722235679626465, 7.089465141296387, 7.456695079803467, 7.823925018310547, 8.191154479980469, 8.55838394165039, 8.925614356994629, 9.29284381866455]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 1.0, 2.0, 4.0, 2.0, 3.0, 5.0, 7.0, 3.0, 7.0, 17.0, 12.0, 17.0, 41.0, 37.0, 86.0, 111.0, 139.0, 134.0, 113.0, 76.0, 58.0, 46.0, 26.0, 14.0, 7.0, 7.0, 3.0, 7.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.37216567993164, -10.048008918762207, -9.723852157592773, -9.39969539642334, -9.075538635253906, -8.751382827758789, -8.427226066589355, -8.103069305419922, -7.778912544250488, -7.454755783081055, -7.130599021911621, -6.806442737579346, -6.482285976409912, -6.1581292152404785, -5.833972930908203, -5.5098161697387695, -5.185659408569336, -4.861502647399902, -4.537345886230469, -4.213189601898193, -3.8890328407287598, -3.564876079559326, -3.2407195568084717, -2.916563034057617, -2.5924062728881836, -2.26824951171875, -1.9440929889678955, -1.6199363470077515, -1.2957797050476074, -0.9716230630874634, -0.6474664211273193, -0.32330989837646484, 0.00084686279296875, 0.3250035047531128, 0.6491601467132568, 0.9733167886734009, 1.297473430633545, 1.621630072593689, 1.945786714553833, 2.2699432373046875, 2.594099998474121, 2.9182567596435547, 3.242413282394409, 3.5665698051452637, 3.8907265663146973, 4.214883327484131, 4.539039611816406, 4.86319637298584, 5.187353134155273, 5.511509895324707, 5.835666656494141, 6.159822940826416, 6.48397970199585, 6.808136463165283, 7.132292747497559, 7.456449508666992, 7.780606269836426, 8.10476303100586, 8.428919792175293, 8.753076553344727, 9.077232360839844, 9.401389122009277, 9.725545883178711, 10.049702644348145, 10.373859405517578]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 6.0, 6.0, 12.0, 17.0, 26.0, 49.0, 74.0, 152.0, 240.0, 477.0, 1016.0, 2413.0, 6504.0, 22931.0, 237135.0, 3864807.0, 44261.0, 9098.0, 2926.0, 1155.0, 451.0, 208.0, 132.0, 69.0, 44.0, 30.0, 10.0, 8.0, 11.0, 4.0, 2.0, 7.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.384765625, -1.33892822265625, -1.2930908203125, -1.24725341796875, -1.201416015625, -1.15557861328125, -1.1097412109375, -1.06390380859375, -1.01806640625, -0.97222900390625, -0.9263916015625, -0.88055419921875, -0.834716796875, -0.78887939453125, -0.7430419921875, -0.69720458984375, -0.6513671875, -0.60552978515625, -0.5596923828125, -0.51385498046875, -0.468017578125, -0.42218017578125, -0.3763427734375, -0.33050537109375, -0.28466796875, -0.23883056640625, -0.1929931640625, -0.14715576171875, -0.101318359375, -0.05548095703125, -0.0096435546875, 0.03619384765625, 0.08203125, 0.12786865234375, 0.1737060546875, 0.21954345703125, 0.265380859375, 0.31121826171875, 0.3570556640625, 0.40289306640625, 0.44873046875, 0.49456787109375, 0.5404052734375, 0.58624267578125, 0.632080078125, 0.67791748046875, 0.7237548828125, 0.76959228515625, 0.8154296875, 0.86126708984375, 0.9071044921875, 0.95294189453125, 0.998779296875, 1.04461669921875, 1.0904541015625, 1.13629150390625, 1.18212890625, 1.22796630859375, 1.2738037109375, 1.31964111328125, 1.365478515625, 1.41131591796875, 1.4571533203125, 1.50299072265625, 1.548828125]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 8.0, 6.0, 8.0, 7.0, 6.0, 10.0, 9.0, 11.0, 21.0, 29.0, 88.0, 254.0, 252.0, 136.0, 53.0, 24.0, 13.0, 12.0, 13.0, 6.0, 6.0, 3.0, 8.0, 4.0, 3.0, 2.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10723876953125, -0.10378456115722656, -0.10033035278320312, -0.09687614440917969, -0.09342193603515625, -0.08996772766113281, -0.08651351928710938, -0.08305931091308594, -0.0796051025390625, -0.07615089416503906, -0.07269668579101562, -0.06924247741699219, -0.06578826904296875, -0.06233406066894531, -0.058879852294921875, -0.05542564392089844, -0.051971435546875, -0.04851722717285156, -0.045063018798828125, -0.04160881042480469, -0.03815460205078125, -0.03470039367675781, -0.031246185302734375, -0.027791976928710938, -0.0243377685546875, -0.020883560180664062, -0.017429351806640625, -0.013975143432617188, -0.01052093505859375, -0.0070667266845703125, -0.003612518310546875, -0.0001583099365234375, 0.0032958984375, 0.0067501068115234375, 0.010204315185546875, 0.013658523559570312, 0.01711273193359375, 0.020566940307617188, 0.024021148681640625, 0.027475357055664062, 0.0309295654296875, 0.03438377380371094, 0.037837982177734375, 0.04129219055175781, 0.04474639892578125, 0.04820060729980469, 0.051654815673828125, 0.05510902404785156, 0.058563232421875, 0.06201744079589844, 0.06547164916992188, 0.06892585754394531, 0.07238006591796875, 0.07583427429199219, 0.07928848266601562, 0.08274269104003906, 0.0861968994140625, 0.08965110778808594, 0.09310531616210938, 0.09655952453613281, 0.10001373291015625, 0.10346794128417969, 0.10692214965820312, 0.11037635803222656, 0.11383056640625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 1.0, 10.0, 19.0, 28.0, 29.0, 48.0, 61.0, 84.0, 132.0, 202.0, 323.0, 600.0, 1029.0, 1852.0, 3746.0, 8169.0, 19684.0, 60572.0, 348907.0, 3339545.0, 317426.0, 57386.0, 18811.0, 7752.0, 3609.0, 1779.0, 976.0, 529.0, 329.0, 201.0, 131.0, 83.0, 63.0, 41.0, 41.0, 23.0, 13.0, 16.0, 9.0, 4.0, 3.0, 4.0, 3.0, 4.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.517578125, -0.5000228881835938, -0.4824676513671875, -0.46491241455078125, -0.447357177734375, -0.42980194091796875, -0.4122467041015625, -0.39469146728515625, -0.37713623046875, -0.35958099365234375, -0.3420257568359375, -0.32447052001953125, -0.306915283203125, -0.28936004638671875, -0.2718048095703125, -0.25424957275390625, -0.2366943359375, -0.21913909912109375, -0.2015838623046875, -0.18402862548828125, -0.166473388671875, -0.14891815185546875, -0.1313629150390625, -0.11380767822265625, -0.09625244140625, -0.07869720458984375, -0.0611419677734375, -0.04358673095703125, -0.026031494140625, -0.00847625732421875, 0.0090789794921875, 0.02663421630859375, 0.044189453125, 0.06174468994140625, 0.0792999267578125, 0.09685516357421875, 0.114410400390625, 0.13196563720703125, 0.1495208740234375, 0.16707611083984375, 0.18463134765625, 0.20218658447265625, 0.2197418212890625, 0.23729705810546875, 0.254852294921875, 0.27240753173828125, 0.2899627685546875, 0.30751800537109375, 0.3250732421875, 0.34262847900390625, 0.3601837158203125, 0.37773895263671875, 0.395294189453125, 0.41284942626953125, 0.4304046630859375, 0.44795989990234375, 0.46551513671875, 0.48307037353515625, 0.5006256103515625, 0.5181808471679688, 0.535736083984375, 0.5532913208007812, 0.5708465576171875, 0.5884017944335938, 0.60595703125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [5.0, 1.0, 2.0, 3.0, 4.0, 2.0, 4.0, 2.0, 7.0, 3.0, 2.0, 6.0, 8.0, 16.0, 9.0, 21.0, 28.0, 27.0, 35.0, 65.0, 89.0, 178.0, 323.0, 661.0, 1384.0, 571.0, 226.0, 132.0, 68.0, 44.0, 40.0, 28.0, 18.0, 12.0, 13.0, 8.0, 5.0, 11.0, 5.0, 6.0, 6.0, 4.0, 1.0, 3.0, 1.0, 0.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09295654296875, -0.0891561508178711, -0.08535575866699219, -0.08155536651611328, -0.07775497436523438, -0.07395458221435547, -0.07015419006347656, -0.06635379791259766, -0.06255340576171875, -0.058753013610839844, -0.05495262145996094, -0.05115222930908203, -0.047351837158203125, -0.04355144500732422, -0.03975105285644531, -0.035950660705566406, -0.0321502685546875, -0.028349876403808594, -0.024549484252929688, -0.02074909210205078, -0.016948699951171875, -0.013148307800292969, -0.009347915649414062, -0.005547523498535156, -0.00174713134765625, 0.0020532608032226562, 0.0058536529541015625, 0.009654045104980469, 0.013454437255859375, 0.01725482940673828, 0.021055221557617188, 0.024855613708496094, 0.028656005859375, 0.032456398010253906, 0.03625679016113281, 0.04005718231201172, 0.043857574462890625, 0.04765796661376953, 0.05145835876464844, 0.055258750915527344, 0.05905914306640625, 0.06285953521728516, 0.06665992736816406, 0.07046031951904297, 0.07426071166992188, 0.07806110382080078, 0.08186149597167969, 0.0856618881225586, 0.0894622802734375, 0.0932626724243164, 0.09706306457519531, 0.10086345672607422, 0.10466384887695312, 0.10846424102783203, 0.11226463317871094, 0.11606502532958984, 0.11986541748046875, 0.12366580963134766, 0.12746620178222656, 0.13126659393310547, 0.13506698608398438, 0.13886737823486328, 0.1426677703857422, 0.1464681625366211, 0.1502685546875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 8.0, 7.0, 17.0, 103.0, 657.0, 189.0, 14.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3823251724243164, -2.2728469371795654, -2.1633689403533936, -2.0538907051086426, -1.9444127082824707, -1.8349344730377197, -1.7254564762115479, -1.6159782409667969, -1.506500244140625, -1.3970221281051636, -1.2875440120697021, -1.1780658960342407, -1.0685877799987793, -0.9591096043586731, -0.8496314883232117, -0.7401533722877502, -0.630675196647644, -0.5211970806121826, -0.4117189645767212, -0.3022408187389374, -0.19276270270347595, -0.08328455686569214, 0.026193559169769287, 0.1356716752052307, 0.24514979124069214, 0.35462790727615356, 0.464106023311615, 0.5735841989517212, 0.6830623149871826, 0.792540431022644, 0.9020185470581055, 1.011496663093567, 1.1209747791290283, 1.2304528951644897, 1.3399310111999512, 1.4494091272354126, 1.558887243270874, 1.668365478515625, 1.7778434753417969, 1.8873217105865479, 1.9967997074127197, 2.1062779426574707, 2.2157559394836426, 2.3252341747283936, 2.4347121715545654, 2.5441904067993164, 2.6536684036254883, 2.7631466388702393, 2.8726248741149902, 2.982103109359741, 3.091581106185913, 3.201059341430664, 3.310537338256836, 3.420015573501587, 3.529493570327759, 3.6389718055725098, 3.7484498023986816, 3.8579280376434326, 3.9674060344696045, 4.0768842697143555, 4.186362266540527, 4.295840263366699, 4.405318737030029, 4.514796733856201, 4.624274730682373]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 8.0, 2.0, 4.0, 4.0, 6.0, 9.0, 16.0, 12.0, 27.0, 30.0, 31.0, 55.0, 58.0, 56.0, 85.0, 71.0, 86.0, 73.0, 81.0, 80.0, 44.0, 34.0, 35.0, 17.0, 20.0, 18.0, 7.0, 7.0, 4.0, 4.0, 6.0, 2.0, 1.0, 5.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7327967286109924, -0.7100450396537781, -0.6872933506965637, -0.6645417213439941, -0.6417900323867798, -0.6190383434295654, -0.5962866544723511, -0.5735349655151367, -0.5507832765579224, -0.528031587600708, -0.5052798986434937, -0.4825282394886017, -0.45977655053138733, -0.43702489137649536, -0.414273202419281, -0.39152151346206665, -0.3687698543071747, -0.3460181653499603, -0.32326650619506836, -0.300514817237854, -0.27776312828063965, -0.2550114393234253, -0.23225978016853333, -0.20950809121131897, -0.1867564171552658, -0.16400474309921265, -0.1412530541419983, -0.11850138008594513, -0.09574969857931137, -0.07299801707267761, -0.05024634301662445, -0.027494654059410095, -0.004742980003356934, 0.018008699640631676, 0.040760379284620285, 0.06351205706596375, 0.0862637385725975, 0.10901542007923126, 0.13176709413528442, 0.15451878309249878, 0.17727045714855194, 0.2000221312046051, 0.22277382016181946, 0.24552549421787262, 0.2682771682739258, 0.29102885723114014, 0.3137805461883545, 0.33653223514556885, 0.3592838943004608, 0.38203558325767517, 0.40478724241256714, 0.4275389313697815, 0.45029062032699585, 0.4730423092842102, 0.4957939684391022, 0.5185456275939941, 0.5412973165512085, 0.5640490055084229, 0.5868006944656372, 0.6095523834228516, 0.6323040127754211, 0.6550557017326355, 0.6778073906898499, 0.7005590796470642, 0.7233107686042786]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 5.0, 4.0, 13.0, 13.0, 18.0, 24.0, 29.0, 46.0, 49.0, 80.0, 128.0, 189.0, 293.0, 459.0, 721.0, 1155.0, 1926.0, 3389.0, 6515.0, 13029.0, 29355.0, 135659.0, 724044.0, 82336.0, 24356.0, 11247.0, 5765.0, 3071.0, 1751.0, 989.0, 636.0, 386.0, 269.0, 197.0, 133.0, 95.0, 61.0, 40.0, 28.0, 23.0, 8.0, 9.0, 7.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.724609375, -0.702239990234375, -0.67987060546875, -0.657501220703125, -0.6351318359375, -0.612762451171875, -0.59039306640625, -0.568023681640625, -0.545654296875, -0.523284912109375, -0.50091552734375, -0.478546142578125, -0.4561767578125, -0.433807373046875, -0.41143798828125, -0.389068603515625, -0.36669921875, -0.344329833984375, -0.32196044921875, -0.299591064453125, -0.2772216796875, -0.254852294921875, -0.23248291015625, -0.210113525390625, -0.187744140625, -0.165374755859375, -0.14300537109375, -0.120635986328125, -0.0982666015625, -0.075897216796875, -0.05352783203125, -0.031158447265625, -0.0087890625, 0.013580322265625, 0.03594970703125, 0.058319091796875, 0.0806884765625, 0.103057861328125, 0.12542724609375, 0.147796630859375, 0.170166015625, 0.192535400390625, 0.21490478515625, 0.237274169921875, 0.2596435546875, 0.282012939453125, 0.30438232421875, 0.326751708984375, 0.34912109375, 0.371490478515625, 0.39385986328125, 0.416229248046875, 0.4385986328125, 0.460968017578125, 0.48333740234375, 0.505706787109375, 0.528076171875, 0.550445556640625, 0.57281494140625, 0.595184326171875, 0.6175537109375, 0.639923095703125, 0.66229248046875, 0.684661865234375, 0.70703125]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 4.0, 3.0, 8.0, 9.0, 6.0, 11.0, 14.0, 12.0, 22.0, 36.0, 123.0, 212.0, 238.0, 141.0, 53.0, 37.0, 13.0, 13.0, 11.0, 8.0, 6.0, 1.0, 7.0, 1.0, 5.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10198974609375, -0.09858417510986328, -0.09517860412597656, -0.09177303314208984, -0.08836746215820312, -0.0849618911743164, -0.08155632019042969, -0.07815074920654297, -0.07474517822265625, -0.07133960723876953, -0.06793403625488281, -0.0645284652709961, -0.061122894287109375, -0.057717323303222656, -0.05431175231933594, -0.05090618133544922, -0.0475006103515625, -0.04409503936767578, -0.04068946838378906, -0.037283897399902344, -0.033878326416015625, -0.030472755432128906, -0.027067184448242188, -0.02366161346435547, -0.02025604248046875, -0.01685047149658203, -0.013444900512695312, -0.010039329528808594, -0.006633758544921875, -0.0032281875610351562, 0.0001773834228515625, 0.0035829544067382812, 0.006988525390625, 0.010394096374511719, 0.013799667358398438, 0.017205238342285156, 0.020610809326171875, 0.024016380310058594, 0.027421951293945312, 0.03082752227783203, 0.03423309326171875, 0.03763866424560547, 0.04104423522949219, 0.044449806213378906, 0.047855377197265625, 0.051260948181152344, 0.05466651916503906, 0.05807209014892578, 0.0614776611328125, 0.06488323211669922, 0.06828880310058594, 0.07169437408447266, 0.07509994506835938, 0.0785055160522461, 0.08191108703613281, 0.08531665802001953, 0.08872222900390625, 0.09212779998779297, 0.09553337097167969, 0.0989389419555664, 0.10234451293945312, 0.10575008392333984, 0.10915565490722656, 0.11256122589111328, 0.115966796875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 3.0, 12.0, 42.0, 155.0, 627.0, 2914.0, 25821.0, 500616.0, 489666.0, 24984.0, 2842.0, 649.0, 151.0, 30.0, 11.0, 10.0, 6.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.3525390625, -1.3169403076171875, -1.281341552734375, -1.2457427978515625, -1.21014404296875, -1.1745452880859375, -1.138946533203125, -1.1033477783203125, -1.0677490234375, -1.0321502685546875, -0.996551513671875, -0.9609527587890625, -0.92535400390625, -0.8897552490234375, -0.854156494140625, -0.8185577392578125, -0.782958984375, -0.7473602294921875, -0.711761474609375, -0.6761627197265625, -0.64056396484375, -0.6049652099609375, -0.569366455078125, -0.5337677001953125, -0.4981689453125, -0.4625701904296875, -0.426971435546875, -0.3913726806640625, -0.35577392578125, -0.3201751708984375, -0.284576416015625, -0.2489776611328125, -0.21337890625, -0.1777801513671875, -0.142181396484375, -0.1065826416015625, -0.07098388671875, -0.0353851318359375, 0.000213623046875, 0.0358123779296875, 0.0714111328125, 0.1070098876953125, 0.142608642578125, 0.1782073974609375, 0.21380615234375, 0.2494049072265625, 0.285003662109375, 0.3206024169921875, 0.356201171875, 0.3917999267578125, 0.427398681640625, 0.4629974365234375, 0.49859619140625, 0.5341949462890625, 0.569793701171875, 0.6053924560546875, 0.6409912109375, 0.6765899658203125, 0.712188720703125, 0.7477874755859375, 0.78338623046875, 0.8189849853515625, 0.854583740234375, 0.8901824951171875, 0.92578125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 9.0, 7.0, 11.0, 9.0, 16.0, 13.0, 18.0, 24.0, 23.0, 20.0, 35.0, 28.0, 41.0, 40.0, 45.0, 59.0, 46.0, 55.0, 46.0, 55.0, 53.0, 49.0, 42.0, 49.0, 24.0, 28.0, 35.0, 19.0, 23.0, 15.0, 14.0, 18.0, 13.0, 7.0, 9.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.404541015625, -0.39459228515625, -0.3846435546875, -0.37469482421875, -0.36474609375, -0.35479736328125, -0.3448486328125, -0.33489990234375, -0.324951171875, -0.31500244140625, -0.3050537109375, -0.29510498046875, -0.28515625, -0.27520751953125, -0.2652587890625, -0.25531005859375, -0.245361328125, -0.23541259765625, -0.2254638671875, -0.21551513671875, -0.20556640625, -0.19561767578125, -0.1856689453125, -0.17572021484375, -0.165771484375, -0.15582275390625, -0.1458740234375, -0.13592529296875, -0.1259765625, -0.11602783203125, -0.1060791015625, -0.09613037109375, -0.086181640625, -0.07623291015625, -0.0662841796875, -0.05633544921875, -0.04638671875, -0.03643798828125, -0.0264892578125, -0.01654052734375, -0.006591796875, 0.00335693359375, 0.0133056640625, 0.02325439453125, 0.033203125, 0.04315185546875, 0.0531005859375, 0.06304931640625, 0.072998046875, 0.08294677734375, 0.0928955078125, 0.10284423828125, 0.11279296875, 0.12274169921875, 0.1326904296875, 0.14263916015625, 0.152587890625, 0.16253662109375, 0.1724853515625, 0.18243408203125, 0.1923828125, 0.20233154296875, 0.2122802734375, 0.22222900390625, 0.232177734375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 1.0, 4.0, 8.0, 12.0, 4.0, 9.0, 28.0, 41.0, 40.0, 85.0, 154.0, 327.0, 976.0, 4774.0, 129978.0, 896073.0, 13231.0, 1800.0, 487.0, 234.0, 119.0, 55.0, 28.0, 30.0, 12.0, 10.0, 7.0, 6.0, 9.0, 8.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.662109375, -1.6149139404296875, -1.567718505859375, -1.5205230712890625, -1.47332763671875, -1.4261322021484375, -1.378936767578125, -1.3317413330078125, -1.2845458984375, -1.2373504638671875, -1.190155029296875, -1.1429595947265625, -1.09576416015625, -1.0485687255859375, -1.001373291015625, -0.9541778564453125, -0.906982421875, -0.8597869873046875, -0.812591552734375, -0.7653961181640625, -0.71820068359375, -0.6710052490234375, -0.623809814453125, -0.5766143798828125, -0.5294189453125, -0.4822235107421875, -0.435028076171875, -0.3878326416015625, -0.34063720703125, -0.2934417724609375, -0.246246337890625, -0.1990509033203125, -0.15185546875, -0.1046600341796875, -0.057464599609375, -0.0102691650390625, 0.03692626953125, 0.0841217041015625, 0.131317138671875, 0.1785125732421875, 0.2257080078125, 0.2729034423828125, 0.320098876953125, 0.3672943115234375, 0.41448974609375, 0.4616851806640625, 0.508880615234375, 0.5560760498046875, 0.603271484375, 0.6504669189453125, 0.697662353515625, 0.7448577880859375, 0.79205322265625, 0.8392486572265625, 0.886444091796875, 0.9336395263671875, 0.9808349609375, 1.0280303955078125, 1.075225830078125, 1.1224212646484375, 1.16961669921875, 1.2168121337890625, 1.264007568359375, 1.3112030029296875, 1.3583984375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 8.0, 3.0, 10.0, 11.0, 13.0, 18.0, 48.0, 53.0, 80.0, 113.0, 100.0, 164.0, 103.0, 75.0, 49.0, 44.0, 34.0, 13.0, 23.0, 11.0, 7.0, 4.0, 7.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8160552978515625e-05, -4.656333476305008e-05, -4.4966116547584534e-05, -4.336889833211899e-05, -4.177168011665344e-05, -4.01744619011879e-05, -3.857724368572235e-05, -3.6980025470256805e-05, -3.538280725479126e-05, -3.3785589039325714e-05, -3.218837082386017e-05, -3.059115260839462e-05, -2.8993934392929077e-05, -2.739671617746353e-05, -2.5799497961997986e-05, -2.420227974653244e-05, -2.2605061531066895e-05, -2.100784331560135e-05, -1.9410625100135803e-05, -1.7813406884670258e-05, -1.6216188669204712e-05, -1.4618970453739166e-05, -1.302175223827362e-05, -1.1424534022808075e-05, -9.82731580734253e-06, -8.230097591876984e-06, -6.632879376411438e-06, -5.035661160945892e-06, -3.4384429454803467e-06, -1.841224730014801e-06, -2.4400651454925537e-07, 1.3532117009162903e-06, 2.950429916381836e-06, 4.547648131847382e-06, 6.144866347312927e-06, 7.742084562778473e-06, 9.339302778244019e-06, 1.0936520993709564e-05, 1.253373920917511e-05, 1.4130957424640656e-05, 1.57281756401062e-05, 1.7325393855571747e-05, 1.8922612071037292e-05, 2.0519830286502838e-05, 2.2117048501968384e-05, 2.371426671743393e-05, 2.5311484932899475e-05, 2.690870314836502e-05, 2.8505921363830566e-05, 3.0103139579296112e-05, 3.170035779476166e-05, 3.32975760102272e-05, 3.489479422569275e-05, 3.6492012441158295e-05, 3.808923065662384e-05, 3.9686448872089386e-05, 4.128366708755493e-05, 4.288088530302048e-05, 4.447810351848602e-05, 4.607532173395157e-05, 4.7672539949417114e-05, 4.926975816488266e-05, 5.0866976380348206e-05, 5.246419459581375e-05, 5.40614128112793e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 3.0, 2.0, 8.0, 10.0, 14.0, 12.0, 32.0, 43.0, 68.0, 84.0, 163.0, 306.0, 507.0, 1072.0, 2495.0, 7182.0, 29450.0, 226701.0, 651595.0, 103442.0, 17182.0, 4607.0, 1752.0, 805.0, 383.0, 249.0, 132.0, 92.0, 49.0, 37.0, 18.0, 21.0, 12.0, 6.0, 4.0, 2.0, 5.0, 4.0, 4.0, 0.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.55712890625, -0.5393447875976562, -0.5215606689453125, -0.5037765502929688, -0.485992431640625, -0.46820831298828125, -0.4504241943359375, -0.43264007568359375, -0.41485595703125, -0.39707183837890625, -0.3792877197265625, -0.36150360107421875, -0.343719482421875, -0.32593536376953125, -0.3081512451171875, -0.29036712646484375, -0.2725830078125, -0.25479888916015625, -0.2370147705078125, -0.21923065185546875, -0.201446533203125, -0.18366241455078125, -0.1658782958984375, -0.14809417724609375, -0.13031005859375, -0.11252593994140625, -0.0947418212890625, -0.07695770263671875, -0.059173583984375, -0.04138946533203125, -0.0236053466796875, -0.00582122802734375, 0.011962890625, 0.02974700927734375, 0.0475311279296875, 0.06531524658203125, 0.083099365234375, 0.10088348388671875, 0.1186676025390625, 0.13645172119140625, 0.15423583984375, 0.17201995849609375, 0.1898040771484375, 0.20758819580078125, 0.225372314453125, 0.24315643310546875, 0.2609405517578125, 0.27872467041015625, 0.2965087890625, 0.31429290771484375, 0.3320770263671875, 0.34986114501953125, 0.367645263671875, 0.38542938232421875, 0.4032135009765625, 0.42099761962890625, 0.43878173828125, 0.45656585693359375, 0.4743499755859375, 0.49213409423828125, 0.509918212890625, 0.5277023315429688, 0.5454864501953125, 0.5632705688476562, 0.5810546875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 7.0, 10.0, 5.0, 10.0, 16.0, 21.0, 29.0, 52.0, 70.0, 88.0, 100.0, 132.0, 93.0, 101.0, 88.0, 57.0, 44.0, 25.0, 22.0, 16.0, 8.0, 5.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.433349609375, -0.4177589416503906, -0.40216827392578125, -0.3865776062011719, -0.3709869384765625, -0.3553962707519531, -0.33980560302734375, -0.3242149353027344, -0.308624267578125, -0.2930335998535156, -0.27744293212890625, -0.2618522644042969, -0.2462615966796875, -0.23067092895507812, -0.21508026123046875, -0.19948959350585938, -0.18389892578125, -0.16830825805664062, -0.15271759033203125, -0.13712692260742188, -0.1215362548828125, -0.10594558715820312, -0.09035491943359375, -0.07476425170898438, -0.059173583984375, -0.043582916259765625, -0.02799224853515625, -0.012401580810546875, 0.0031890869140625, 0.018779754638671875, 0.03437042236328125, 0.049961090087890625, 0.0655517578125, 0.08114242553710938, 0.09673309326171875, 0.11232376098632812, 0.1279144287109375, 0.14350509643554688, 0.15909576416015625, 0.17468643188476562, 0.190277099609375, 0.20586776733398438, 0.22145843505859375, 0.23704910278320312, 0.2526397705078125, 0.2682304382324219, 0.28382110595703125, 0.2994117736816406, 0.31500244140625, 0.3305931091308594, 0.34618377685546875, 0.3617744445800781, 0.3773651123046875, 0.3929557800292969, 0.40854644775390625, 0.4241371154785156, 0.439727783203125, 0.4553184509277344, 0.47090911865234375, 0.4864997863769531, 0.5020904541015625, 0.5176811218261719, 0.5332717895507812, 0.5488624572753906, 0.564453125]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 5.0, 4.0, 4.0, 16.0, 96.0, 649.0, 216.0, 14.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.4247407913208, -11.9757661819458, -11.5267915725708, -11.0778169631958, -10.6288423538208, -10.1798677444458, -9.730894088745117, -9.281919479370117, -8.832944869995117, -8.383970260620117, -7.934995651245117, -7.486021041870117, -7.037046432495117, -6.588071823120117, -6.139097690582275, -5.690123081207275, -5.241147994995117, -4.792173385620117, -4.343198776245117, -3.8942244052886963, -3.4452497959136963, -2.9962751865386963, -2.5473008155822754, -2.0983262062072754, -1.6493515968322754, -1.2003769874572754, -0.7514024972915649, -0.3024280071258545, 0.1465466022491455, 0.5955212116241455, 1.0444955825805664, 1.4934701919555664, 1.9424457550048828, 2.391420364379883, 2.840394973754883, 3.2893693447113037, 3.7383439540863037, 4.187318801879883, 4.636292934417725, 5.085267543792725, 5.534242153167725, 5.983216762542725, 6.432191371917725, 6.881165504455566, 7.330140113830566, 7.779114723205566, 8.228089332580566, 8.677063941955566, 9.126038551330566, 9.575013160705566, 10.023987770080566, 10.472962379455566, 10.921936988830566, 11.370911598205566, 11.81988525390625, 12.26885986328125, 12.71783447265625, 13.16680908203125, 13.61578369140625, 14.06475830078125, 14.51373291015625, 14.96270751953125, 15.41168212890625, 15.86065673828125, 16.30963134765625]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 5.0, 6.0, 4.0, 8.0, 10.0, 12.0, 12.0, 25.0, 34.0, 46.0, 65.0, 78.0, 98.0, 109.0, 101.0, 93.0, 61.0, 70.0, 52.0, 37.0, 22.0, 18.0, 13.0, 8.0, 5.0, 2.0, 3.0, 3.0, 0.0, 4.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.923542499542236, -4.799688816070557, -4.675835609436035, -4.5519819259643555, -4.428128242492676, -4.304275035858154, -4.180421352386475, -4.056567668914795, -3.9327144622802734, -3.808861017227173, -3.685007333755493, -3.5611538887023926, -3.437300443649292, -3.3134469985961914, -3.1895933151245117, -3.065739870071411, -2.9418861865997314, -2.818032741546631, -2.694179058074951, -2.5703256130218506, -2.44647216796875, -2.3226184844970703, -2.1987650394439697, -2.074911594390869, -1.951058030128479, -1.8272044658660889, -1.7033510208129883, -1.5794974565505981, -1.455643892288208, -1.3317904472351074, -1.2079368829727173, -1.0840833187103271, -0.9602298736572266, -0.8363763689994812, -0.7125228643417358, -0.5886693000793457, -0.46481579542160034, -0.340962290763855, -0.21710872650146484, -0.09325522184371948, 0.03059828281402588, 0.15445180237293243, 0.278305321931839, 0.40215885639190674, 0.5260123610496521, 0.6498658657073975, 0.7737194299697876, 0.897572934627533, 1.0214264392852783, 1.1452800035476685, 1.269133448600769, 1.3929870128631592, 1.5168404579162598, 1.64069402217865, 1.76454758644104, 1.8884010314941406, 2.0122547149658203, 2.136108160018921, 2.2599618434906006, 2.383815288543701, 2.5076687335968018, 2.6315221786499023, 2.755375862121582, 2.8792293071746826, 3.003082752227783]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 4.0, 2.0, 1.0, 6.0, 6.0, 4.0, 2.0, 12.0, 8.0, 16.0, 11.0, 20.0, 29.0, 37.0, 45.0, 56.0, 98.0, 116.0, 196.0, 313.0, 562.0, 1043.0, 2126.0, 5984.0, 40127.0, 4090465.0, 42854.0, 6186.0, 2020.0, 858.0, 425.0, 246.0, 120.0, 86.0, 65.0, 25.0, 31.0, 23.0, 16.0, 12.0, 7.0, 9.0, 5.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.775390625, -2.69256591796875, -2.6097412109375, -2.52691650390625, -2.444091796875, -2.36126708984375, -2.2784423828125, -2.19561767578125, -2.11279296875, -2.02996826171875, -1.9471435546875, -1.86431884765625, -1.781494140625, -1.69866943359375, -1.6158447265625, -1.53302001953125, -1.4501953125, -1.36737060546875, -1.2845458984375, -1.20172119140625, -1.118896484375, -1.03607177734375, -0.9532470703125, -0.87042236328125, -0.78759765625, -0.70477294921875, -0.6219482421875, -0.53912353515625, -0.456298828125, -0.37347412109375, -0.2906494140625, -0.20782470703125, -0.125, -0.04217529296875, 0.0406494140625, 0.12347412109375, 0.206298828125, 0.28912353515625, 0.3719482421875, 0.45477294921875, 0.53759765625, 0.62042236328125, 0.7032470703125, 0.78607177734375, 0.868896484375, 0.95172119140625, 1.0345458984375, 1.11737060546875, 1.2001953125, 1.28302001953125, 1.3658447265625, 1.44866943359375, 1.531494140625, 1.61431884765625, 1.6971435546875, 1.77996826171875, 1.86279296875, 1.94561767578125, 2.0284423828125, 2.11126708984375, 2.194091796875, 2.27691650390625, 2.3597412109375, 2.44256591796875, 2.525390625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 7.0, 3.0, 7.0, 13.0, 11.0, 11.0, 22.0, 50.0, 109.0, 210.0, 232.0, 159.0, 58.0, 40.0, 27.0, 17.0, 11.0, 4.0, 7.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12939453125, -0.12560462951660156, -0.12181472778320312, -0.11802482604980469, -0.11423492431640625, -0.11044502258300781, -0.10665512084960938, -0.10286521911621094, -0.0990753173828125, -0.09528541564941406, -0.09149551391601562, -0.08770561218261719, -0.08391571044921875, -0.08012580871582031, -0.07633590698242188, -0.07254600524902344, -0.068756103515625, -0.06496620178222656, -0.061176300048828125, -0.05738639831542969, -0.05359649658203125, -0.04980659484863281, -0.046016693115234375, -0.04222679138183594, -0.0384368896484375, -0.03464698791503906, -0.030857086181640625, -0.027067184448242188, -0.02327728271484375, -0.019487380981445312, -0.015697479248046875, -0.011907577514648438, -0.00811767578125, -0.0043277740478515625, -0.000537872314453125, 0.0032520294189453125, 0.00704193115234375, 0.010831832885742188, 0.014621734619140625, 0.018411636352539062, 0.0222015380859375, 0.025991439819335938, 0.029781341552734375, 0.03357124328613281, 0.03736114501953125, 0.04115104675292969, 0.044940948486328125, 0.04873085021972656, 0.052520751953125, 0.05631065368652344, 0.060100555419921875, 0.06389045715332031, 0.06768035888671875, 0.07147026062011719, 0.07526016235351562, 0.07905006408691406, 0.0828399658203125, 0.08662986755371094, 0.09041976928710938, 0.09420967102050781, 0.09799957275390625, 0.10178947448730469, 0.10557937622070312, 0.10936927795410156, 0.1131591796875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 3.0, 5.0, 7.0, 8.0, 7.0, 3.0, 17.0, 17.0, 47.0, 45.0, 139.0, 267.0, 849.0, 8828.0, 4024276.0, 155764.0, 3003.0, 525.0, 213.0, 90.0, 41.0, 28.0, 20.0, 11.0, 11.0, 10.0, 15.0, 4.0, 7.0, 4.0, 0.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.29296875, -3.182525634765625, -3.07208251953125, -2.961639404296875, -2.8511962890625, -2.740753173828125, -2.63031005859375, -2.519866943359375, -2.409423828125, -2.298980712890625, -2.18853759765625, -2.078094482421875, -1.9676513671875, -1.857208251953125, -1.74676513671875, -1.636322021484375, -1.52587890625, -1.415435791015625, -1.30499267578125, -1.194549560546875, -1.0841064453125, -0.973663330078125, -0.86322021484375, -0.752777099609375, -0.642333984375, -0.531890869140625, -0.42144775390625, -0.311004638671875, -0.2005615234375, -0.090118408203125, 0.02032470703125, 0.130767822265625, 0.2412109375, 0.351654052734375, 0.46209716796875, 0.572540283203125, 0.6829833984375, 0.793426513671875, 0.90386962890625, 1.014312744140625, 1.124755859375, 1.235198974609375, 1.34564208984375, 1.456085205078125, 1.5665283203125, 1.676971435546875, 1.78741455078125, 1.897857666015625, 2.00830078125, 2.118743896484375, 2.22918701171875, 2.339630126953125, 2.4500732421875, 2.560516357421875, 2.67095947265625, 2.781402587890625, 2.891845703125, 3.002288818359375, 3.11273193359375, 3.223175048828125, 3.3336181640625, 3.444061279296875, 3.55450439453125, 3.664947509765625, 3.775390625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 5.0, 8.0, 9.0, 5.0, 10.0, 18.0, 24.0, 30.0, 51.0, 76.0, 136.0, 380.0, 1337.0, 1249.0, 377.0, 154.0, 79.0, 49.0, 22.0, 9.0, 10.0, 11.0, 3.0, 8.0, 4.0, 1.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.205810546875, -0.200531005859375, -0.19525146484375, -0.189971923828125, -0.1846923828125, -0.179412841796875, -0.17413330078125, -0.168853759765625, -0.16357421875, -0.158294677734375, -0.15301513671875, -0.147735595703125, -0.1424560546875, -0.137176513671875, -0.13189697265625, -0.126617431640625, -0.121337890625, -0.116058349609375, -0.11077880859375, -0.105499267578125, -0.1002197265625, -0.094940185546875, -0.08966064453125, -0.084381103515625, -0.0791015625, -0.073822021484375, -0.06854248046875, -0.063262939453125, -0.0579833984375, -0.052703857421875, -0.04742431640625, -0.042144775390625, -0.036865234375, -0.031585693359375, -0.02630615234375, -0.021026611328125, -0.0157470703125, -0.010467529296875, -0.00518798828125, 9.1552734375e-05, 0.00537109375, 0.010650634765625, 0.01593017578125, 0.021209716796875, 0.0264892578125, 0.031768798828125, 0.03704833984375, 0.042327880859375, 0.047607421875, 0.052886962890625, 0.05816650390625, 0.063446044921875, 0.0687255859375, 0.074005126953125, 0.07928466796875, 0.084564208984375, 0.08984375, 0.095123291015625, 0.10040283203125, 0.105682373046875, 0.1109619140625, 0.116241455078125, 0.12152099609375, 0.126800537109375, 0.132080078125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 9.0, 10.0, 97.0, 587.0, 248.0, 36.0, 15.0, 8.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.7675652503967285, -7.60786247253418, -7.448160171508789, -7.28845739364624, -7.128754615783691, -6.969052314758301, -6.809349536895752, -6.649646759033203, -6.4899444580078125, -6.330241680145264, -6.170539379119873, -6.010836601257324, -5.851134300231934, -5.691431522369385, -5.531728744506836, -5.372026443481445, -5.2123236656188965, -5.052620887756348, -4.892918586730957, -4.733215808868408, -4.573513031005859, -4.413810729980469, -4.25410795211792, -4.094405174255371, -3.9347028732299805, -3.7750003337860107, -3.615297794342041, -3.455595016479492, -3.2958924770355225, -3.1361899375915527, -2.976487159729004, -2.816784620285034, -2.6570825576782227, -2.497380018234253, -2.337677478790283, -2.1779747009277344, -2.0182721614837646, -1.858569622039795, -1.6988669633865356, -1.5391643047332764, -1.3794617652893066, -1.219759225845337, -1.0600565671920776, -0.9003539681434631, -0.7406513690948486, -0.5809487700462341, -0.42124617099761963, -0.26154351234436035, -0.10184097290039062, 0.05786162614822388, 0.21756422519683838, 0.3772668242454529, 0.5369694232940674, 0.6966720223426819, 0.8563746213912964, 1.0160772800445557, 1.1757798194885254, 1.3354823589324951, 1.4951850175857544, 1.6548876762390137, 1.8145902156829834, 1.9742927551269531, 2.133995532989502, 2.2936980724334717, 2.4534006118774414]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 15.0, 32.0, 51.0, 92.0, 149.0, 198.0, 177.0, 144.0, 79.0, 36.0, 23.0, 11.0, 6.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.243463516235352, -4.161136150360107, -4.078808784484863, -3.9964816570281982, -3.914154291152954, -3.83182692527771, -3.749499559402466, -3.6671721935272217, -3.5848450660705566, -3.5025177001953125, -3.4201903343200684, -3.3378632068634033, -3.255535840988159, -3.173208475112915, -3.090881109237671, -3.0085537433624268, -2.9262263774871826, -2.8438990116119385, -2.7615716457366943, -2.6792445182800293, -2.596917152404785, -2.514589786529541, -2.432262420654297, -2.3499350547790527, -2.2676076889038086, -2.1852803230285645, -2.1029529571533203, -2.0206258296966553, -1.9382984638214111, -1.855971097946167, -1.7736437320709229, -1.6913163661956787, -1.6089894771575928, -1.5266621112823486, -1.444334864616394, -1.36200749874115, -1.2796802520751953, -1.1973528861999512, -1.115025520324707, -1.032698154449463, -0.9503709077835083, -0.8680436015129089, -0.7857162952423096, -0.7033889293670654, -0.6210616230964661, -0.5387343168258667, -0.45640698075294495, -0.3740796446800232, -0.29175233840942383, -0.20942501723766327, -0.1270976960659027, -0.04477037489414215, 0.03755694627761841, 0.11988425254821777, 0.20221158862113953, 0.2845389246940613, 0.36686623096466064, 0.44919353723526, 0.5315208435058594, 0.6138482093811035, 0.6961755156517029, 0.7785028219223022, 0.8608301877975464, 0.9431574940681458, 1.0254848003387451]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 8.0, 2.0, 6.0, 5.0, 7.0, 15.0, 12.0, 18.0, 29.0, 37.0, 42.0, 55.0, 52.0, 160.0, 10835.0, 1036351.0, 538.0, 83.0, 64.0, 51.0, 38.0, 32.0, 28.0, 19.0, 14.0, 13.0, 8.0, 2.0, 8.0, 9.0, 1.0, 3.0, 6.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.921875, -10.5350341796875, -10.148193359375, -9.7613525390625, -9.37451171875, -8.9876708984375, -8.600830078125, -8.2139892578125, -7.8271484375, -7.4403076171875, -7.053466796875, -6.6666259765625, -6.27978515625, -5.8929443359375, -5.506103515625, -5.1192626953125, -4.732421875, -4.3455810546875, -3.958740234375, -3.5718994140625, -3.18505859375, -2.7982177734375, -2.411376953125, -2.0245361328125, -1.6376953125, -1.2508544921875, -0.864013671875, -0.4771728515625, -0.09033203125, 0.2965087890625, 0.683349609375, 1.0701904296875, 1.45703125, 1.8438720703125, 2.230712890625, 2.6175537109375, 3.00439453125, 3.3912353515625, 3.778076171875, 4.1649169921875, 4.5517578125, 4.9385986328125, 5.325439453125, 5.7122802734375, 6.09912109375, 6.4859619140625, 6.872802734375, 7.2596435546875, 7.646484375, 8.0333251953125, 8.420166015625, 8.8070068359375, 9.19384765625, 9.5806884765625, 9.967529296875, 10.3543701171875, 10.7412109375, 11.1280517578125, 11.514892578125, 11.9017333984375, 12.28857421875, 12.6754150390625, 13.062255859375, 13.4490966796875, 13.8359375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 21.0, 98.0, 583.0, 270.0, 33.0, 7.0, 2.0, 1.0, 1.0], "bins": [-0.97705078125, -0.9601030349731445, -0.9431552886962891, -0.9262075424194336, -0.9092597961425781, -0.8923120498657227, -0.8753643035888672, -0.8584165573120117, -0.8414688110351562, -0.8245210647583008, -0.8075733184814453, -0.7906255722045898, -0.7736778259277344, -0.7567300796508789, -0.7397823333740234, -0.722834587097168, -0.7058868408203125, -0.688939094543457, -0.6719913482666016, -0.6550436019897461, -0.6380958557128906, -0.6211481094360352, -0.6042003631591797, -0.5872526168823242, -0.5703048706054688, -0.5533571243286133, -0.5364093780517578, -0.5194616317749023, -0.5025138854980469, -0.4855661392211914, -0.46861839294433594, -0.45167064666748047, -0.434722900390625, -0.41777515411376953, -0.40082740783691406, -0.3838796615600586, -0.3669319152832031, -0.34998416900634766, -0.3330364227294922, -0.3160886764526367, -0.29914093017578125, -0.2821931838989258, -0.2652454376220703, -0.24829769134521484, -0.23134994506835938, -0.2144021987915039, -0.19745445251464844, -0.18050670623779297, -0.1635589599609375, -0.14661121368408203, -0.12966346740722656, -0.1127157211303711, -0.09576797485351562, -0.07882022857666016, -0.06187248229980469, -0.04492473602294922, -0.02797698974609375, -0.011029243469238281, 0.0059185028076171875, 0.022866249084472656, 0.039813995361328125, 0.056761741638183594, 0.07370948791503906, 0.09065723419189453, 0.10760498046875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 2.0, 4.0, 4.0, 8.0, 13.0, 7.0, 19.0, 33.0, 40.0, 58.0, 98.0, 136.0, 239.0, 428.0, 913.0, 2368.0, 7774.0, 37346.0, 306776.0, 593258.0, 79468.0, 13321.0, 3610.0, 1289.0, 547.0, 294.0, 158.0, 107.0, 63.0, 50.0, 36.0, 24.0, 18.0, 13.0, 11.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-2.01953125, -1.9586944580078125, -1.897857666015625, -1.8370208740234375, -1.77618408203125, -1.7153472900390625, -1.654510498046875, -1.5936737060546875, -1.5328369140625, -1.4720001220703125, -1.411163330078125, -1.3503265380859375, -1.28948974609375, -1.2286529541015625, -1.167816162109375, -1.1069793701171875, -1.046142578125, -0.9853057861328125, -0.924468994140625, -0.8636322021484375, -0.80279541015625, -0.7419586181640625, -0.681121826171875, -0.6202850341796875, -0.5594482421875, -0.4986114501953125, -0.437774658203125, -0.3769378662109375, -0.31610107421875, -0.2552642822265625, -0.194427490234375, -0.1335906982421875, -0.07275390625, -0.0119171142578125, 0.048919677734375, 0.1097564697265625, 0.17059326171875, 0.2314300537109375, 0.292266845703125, 0.3531036376953125, 0.4139404296875, 0.4747772216796875, 0.535614013671875, 0.5964508056640625, 0.65728759765625, 0.7181243896484375, 0.778961181640625, 0.8397979736328125, 0.900634765625, 0.9614715576171875, 1.022308349609375, 1.0831451416015625, 1.14398193359375, 1.2048187255859375, 1.265655517578125, 1.3264923095703125, 1.3873291015625, 1.4481658935546875, 1.509002685546875, 1.5698394775390625, 1.63067626953125, 1.6915130615234375, 1.752349853515625, 1.8131866455078125, 1.8740234375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 4.0, 1.0, 2.0, 9.0, 9.0, 9.0, 12.0, 17.0, 16.0, 22.0, 23.0, 44.0, 32.0, 50.0, 60.0, 49.0, 55.0, 58.0, 77.0, 66.0, 64.0, 53.0, 52.0, 53.0, 43.0, 27.0, 25.0, 17.0, 14.0, 14.0, 6.0, 8.0, 4.0, 4.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75146484375, -0.7248458862304688, -0.6982269287109375, -0.6716079711914062, -0.644989013671875, -0.6183700561523438, -0.5917510986328125, -0.5651321411132812, -0.53851318359375, -0.5118942260742188, -0.4852752685546875, -0.45865631103515625, -0.432037353515625, -0.40541839599609375, -0.3787994384765625, -0.35218048095703125, -0.3255615234375, -0.29894256591796875, -0.2723236083984375, -0.24570465087890625, -0.219085693359375, -0.19246673583984375, -0.1658477783203125, -0.13922882080078125, -0.11260986328125, -0.08599090576171875, -0.0593719482421875, -0.03275299072265625, -0.006134033203125, 0.02048492431640625, 0.0471038818359375, 0.07372283935546875, 0.100341796875, 0.12696075439453125, 0.1535797119140625, 0.18019866943359375, 0.206817626953125, 0.23343658447265625, 0.2600555419921875, 0.28667449951171875, 0.31329345703125, 0.33991241455078125, 0.3665313720703125, 0.39315032958984375, 0.419769287109375, 0.44638824462890625, 0.4730072021484375, 0.49962615966796875, 0.5262451171875, 0.5528640747070312, 0.5794830322265625, 0.6061019897460938, 0.632720947265625, 0.6593399047851562, 0.6859588623046875, 0.7125778198242188, 0.73919677734375, 0.7658157348632812, 0.7924346923828125, 0.8190536499023438, 0.845672607421875, 0.8722915649414062, 0.8989105224609375, 0.9255294799804688, 0.9521484375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 4.0, 14.0, 21.0, 21.0, 34.0, 62.0, 126.0, 288.0, 637.0, 2071.0, 11878.0, 377765.0, 636795.0, 15105.0, 2415.0, 736.0, 267.0, 138.0, 53.0, 36.0, 30.0, 20.0, 6.0, 8.0, 5.0, 7.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.564453125, -1.490142822265625, -1.41583251953125, -1.341522216796875, -1.2672119140625, -1.192901611328125, -1.11859130859375, -1.044281005859375, -0.969970703125, -0.895660400390625, -0.82135009765625, -0.747039794921875, -0.6727294921875, -0.598419189453125, -0.52410888671875, -0.449798583984375, -0.37548828125, -0.301177978515625, -0.22686767578125, -0.152557373046875, -0.0782470703125, -0.003936767578125, 0.07037353515625, 0.144683837890625, 0.218994140625, 0.293304443359375, 0.36761474609375, 0.441925048828125, 0.5162353515625, 0.590545654296875, 0.66485595703125, 0.739166259765625, 0.8134765625, 0.887786865234375, 0.96209716796875, 1.036407470703125, 1.1107177734375, 1.185028076171875, 1.25933837890625, 1.333648681640625, 1.407958984375, 1.482269287109375, 1.55657958984375, 1.630889892578125, 1.7052001953125, 1.779510498046875, 1.85382080078125, 1.928131103515625, 2.00244140625, 2.076751708984375, 2.15106201171875, 2.225372314453125, 2.2996826171875, 2.373992919921875, 2.44830322265625, 2.522613525390625, 2.596923828125, 2.671234130859375, 2.74554443359375, 2.819854736328125, 2.8941650390625, 2.968475341796875, 3.04278564453125, 3.117095947265625, 3.19140625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 2.0, 12.0, 18.0, 24.0, 43.0, 67.0, 154.0, 247.0, 175.0, 91.0, 64.0, 34.0, 21.0, 13.0, 12.0, 3.0, 8.0, 1.0, 5.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001614093780517578, -0.00015537068247795105, -0.0001493319869041443, -0.00014329329133033752, -0.00013725459575653076, -0.000131215900182724, -0.00012517720460891724, -0.00011913850903511047, -0.00011309981346130371, -0.00010706111788749695, -0.00010102242231369019, -9.498372673988342e-05, -8.894503116607666e-05, -8.29063355922699e-05, -7.686764001846313e-05, -7.082894444465637e-05, -6.479024887084961e-05, -5.875155329704285e-05, -5.2712857723236084e-05, -4.667416214942932e-05, -4.063546657562256e-05, -3.4596771001815796e-05, -2.8558075428009033e-05, -2.251937985420227e-05, -1.6480684280395508e-05, -1.0441988706588745e-05, -4.403293132781982e-06, 1.6354024410247803e-06, 7.674098014831543e-06, 1.3712793588638306e-05, 1.975148916244507e-05, 2.579018473625183e-05, 3.1828880310058594e-05, 3.7867575883865356e-05, 4.390627145767212e-05, 4.994496703147888e-05, 5.5983662605285645e-05, 6.202235817909241e-05, 6.806105375289917e-05, 7.409974932670593e-05, 8.01384449005127e-05, 8.617714047431946e-05, 9.221583604812622e-05, 9.825453162193298e-05, 0.00010429322719573975, 0.00011033192276954651, 0.00011637061834335327, 0.00012240931391716003, 0.0001284480094909668, 0.00013448670506477356, 0.00014052540063858032, 0.00014656409621238708, 0.00015260279178619385, 0.0001586414873600006, 0.00016468018293380737, 0.00017071887850761414, 0.0001767575740814209, 0.00018279626965522766, 0.00018883496522903442, 0.0001948736608028412, 0.00020091235637664795, 0.0002069510519504547, 0.00021298974752426147, 0.00021902844309806824, 0.000225067138671875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 5.0, 3.0, 3.0, 6.0, 5.0, 6.0, 9.0, 9.0, 22.0, 25.0, 34.0, 59.0, 106.0, 205.0, 401.0, 1084.0, 2930.0, 10556.0, 97898.0, 863240.0, 59297.0, 8386.0, 2522.0, 924.0, 395.0, 158.0, 96.0, 48.0, 43.0, 26.0, 19.0, 9.0, 12.0, 8.0, 4.0, 3.0, 3.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.76171875, -1.7089996337890625, -1.656280517578125, -1.6035614013671875, -1.55084228515625, -1.4981231689453125, -1.445404052734375, -1.3926849365234375, -1.3399658203125, -1.2872467041015625, -1.234527587890625, -1.1818084716796875, -1.12908935546875, -1.0763702392578125, -1.023651123046875, -0.9709320068359375, -0.918212890625, -0.8654937744140625, -0.812774658203125, -0.7600555419921875, -0.70733642578125, -0.6546173095703125, -0.601898193359375, -0.5491790771484375, -0.4964599609375, -0.4437408447265625, -0.391021728515625, -0.3383026123046875, -0.28558349609375, -0.2328643798828125, -0.180145263671875, -0.1274261474609375, -0.07470703125, -0.0219879150390625, 0.030731201171875, 0.0834503173828125, 0.13616943359375, 0.1888885498046875, 0.241607666015625, 0.2943267822265625, 0.3470458984375, 0.3997650146484375, 0.452484130859375, 0.5052032470703125, 0.55792236328125, 0.6106414794921875, 0.663360595703125, 0.7160797119140625, 0.768798828125, 0.8215179443359375, 0.874237060546875, 0.9269561767578125, 0.97967529296875, 1.0323944091796875, 1.085113525390625, 1.1378326416015625, 1.1905517578125, 1.2432708740234375, 1.295989990234375, 1.3487091064453125, 1.40142822265625, 1.4541473388671875, 1.506866455078125, 1.5595855712890625, 1.6123046875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 7.0, 12.0, 14.0, 25.0, 37.0, 63.0, 84.0, 106.0, 130.0, 135.0, 116.0, 79.0, 58.0, 33.0, 25.0, 25.0, 13.0, 9.0, 4.0, 8.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53759765625, -0.5192184448242188, -0.5008392333984375, -0.48246002197265625, -0.464080810546875, -0.44570159912109375, -0.4273223876953125, -0.40894317626953125, -0.39056396484375, -0.37218475341796875, -0.3538055419921875, -0.33542633056640625, -0.317047119140625, -0.29866790771484375, -0.2802886962890625, -0.26190948486328125, -0.2435302734375, -0.22515106201171875, -0.2067718505859375, -0.18839263916015625, -0.170013427734375, -0.15163421630859375, -0.1332550048828125, -0.11487579345703125, -0.09649658203125, -0.07811737060546875, -0.0597381591796875, -0.04135894775390625, -0.022979736328125, -0.00460052490234375, 0.0137786865234375, 0.03215789794921875, 0.050537109375, 0.06891632080078125, 0.0872955322265625, 0.10567474365234375, 0.124053955078125, 0.14243316650390625, 0.1608123779296875, 0.17919158935546875, 0.19757080078125, 0.21595001220703125, 0.2343292236328125, 0.25270843505859375, 0.271087646484375, 0.28946685791015625, 0.3078460693359375, 0.32622528076171875, 0.3446044921875, 0.36298370361328125, 0.3813629150390625, 0.39974212646484375, 0.418121337890625, 0.43650054931640625, 0.4548797607421875, 0.47325897216796875, 0.49163818359375, 0.5100173950195312, 0.5283966064453125, 0.5467758178710938, 0.565155029296875, 0.5835342407226562, 0.6019134521484375, 0.6202926635742188, 0.638671875]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 28.0, 121.0, 338.0, 319.0, 126.0, 39.0, 13.0, 7.0, 4.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-21.267534255981445, -20.719139099121094, -20.17074203491211, -19.622344970703125, -19.073949813842773, -18.525554656982422, -17.977157592773438, -17.428760528564453, -16.8803653717041, -16.33197021484375, -15.783573150634766, -15.235177040100098, -14.68678092956543, -14.138384819030762, -13.589988708496094, -13.041592597961426, -12.493196487426758, -11.94480037689209, -11.396404266357422, -10.848008155822754, -10.299612045288086, -9.751215934753418, -9.20281982421875, -8.654423713684082, -8.106027603149414, -7.557631492614746, -7.009235382080078, -6.46083927154541, -5.912443161010742, -5.364047050476074, -4.815650939941406, -4.267254829406738, -3.7188568115234375, -3.1704607009887695, -2.6220645904541016, -2.0736684799194336, -1.5252723693847656, -0.9768762588500977, -0.4284801483154297, 0.11991596221923828, 0.6683120727539062, 1.2167081832885742, 1.7651042938232422, 2.31350040435791, 2.861896514892578, 3.410292625427246, 3.958688735961914, 4.507084846496582, 5.05548095703125, 5.603877067565918, 6.152273178100586, 6.700669288635254, 7.249065399169922, 7.79746150970459, 8.345857620239258, 8.894253730773926, 9.442649841308594, 9.991045951843262, 10.53944206237793, 11.087838172912598, 11.636234283447266, 12.184630393981934, 12.733026504516602, 13.28142261505127, 13.829818725585938]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 7.0, 2.0, 8.0, 6.0, 5.0, 17.0, 13.0, 16.0, 19.0, 23.0, 30.0, 32.0, 36.0, 31.0, 46.0, 54.0, 36.0, 43.0, 56.0, 65.0, 52.0, 59.0, 43.0, 36.0, 51.0, 35.0, 31.0, 25.0, 25.0, 13.0, 23.0, 14.0, 9.0, 7.0, 13.0, 6.0, 5.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.192131042480469, -5.040441989898682, -4.8887529373168945, -4.737063884735107, -4.58537483215332, -4.433686256408691, -4.281997203826904, -4.130308151245117, -3.97861909866333, -3.826930046081543, -3.675240993499756, -3.523552179336548, -3.3718631267547607, -3.2201740741729736, -3.0684852600097656, -2.9167962074279785, -2.7651071548461914, -2.6134181022644043, -2.461729049682617, -2.310040235519409, -2.158351182937622, -2.006662130355835, -1.8549731969833374, -1.7032842636108398, -1.5515952110290527, -1.3999061584472656, -1.248217225074768, -1.0965282917022705, -0.9448392391204834, -0.7931502461433411, -0.6414612531661987, -0.48977231979370117, -0.33808279037475586, -0.18639379739761353, -0.03470480442047119, 0.11698418855667114, 0.2686731815338135, 0.4203621745109558, 0.5720511674880981, 0.7237401008605957, 0.8754291534423828, 1.02711820602417, 1.1788071393966675, 1.330496072769165, 1.4821851253509521, 1.6338741779327393, 1.7855631113052368, 1.9372520446777344, 2.0889410972595215, 2.2406301498413086, 2.3923192024230957, 2.5440080165863037, 2.695697069168091, 2.847386121749878, 2.999074935913086, 3.150763988494873, 3.30245304107666, 3.4541420936584473, 3.6058311462402344, 3.7575199604034424, 3.9092090129852295, 4.0608978271484375, 4.212586879730225, 4.364275932312012, 4.515964984893799]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 1.0, 7.0, 4.0, 3.0, 9.0, 17.0, 13.0, 23.0, 23.0, 23.0, 34.0, 53.0, 54.0, 68.0, 145.0, 531.0, 3943929.0, 248943.0, 331.0, 49.0, 19.0, 5.0, 2.0, 4.0, 0.0, 0.0, 1.0], "bins": [-37.0, -36.3143310546875, -35.628662109375, -34.9429931640625, -34.25732421875, -33.5716552734375, -32.885986328125, -32.2003173828125, -31.5146484375, -30.8289794921875, -30.143310546875, -29.4576416015625, -28.77197265625, -28.0863037109375, -27.400634765625, -26.7149658203125, -26.029296875, -25.3436279296875, -24.657958984375, -23.9722900390625, -23.28662109375, -22.6009521484375, -21.915283203125, -21.2296142578125, -20.5439453125, -19.8582763671875, -19.172607421875, -18.4869384765625, -17.80126953125, -17.1156005859375, -16.429931640625, -15.7442626953125, -15.05859375, -14.3729248046875, -13.687255859375, -13.0015869140625, -12.31591796875, -11.6302490234375, -10.944580078125, -10.2589111328125, -9.5732421875, -8.8875732421875, -8.201904296875, -7.5162353515625, -6.83056640625, -6.1448974609375, -5.459228515625, -4.7735595703125, -4.087890625, -3.4022216796875, -2.716552734375, -2.0308837890625, -1.34521484375, -0.6595458984375, 0.026123046875, 0.7117919921875, 1.3974609375, 2.0831298828125, 2.768798828125, 3.4544677734375, 4.14013671875, 4.8258056640625, 5.511474609375, 6.1971435546875, 6.8828125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 7.0, 2.0, 16.0, 63.0, 177.0, 318.0, 267.0, 120.0, 30.0, 9.0, 5.0, 3.0, 0.0, 1.0], "bins": [-0.99853515625, -0.9806003570556641, -0.9626655578613281, -0.9447307586669922, -0.9267959594726562, -0.9088611602783203, -0.8909263610839844, -0.8729915618896484, -0.8550567626953125, -0.8371219635009766, -0.8191871643066406, -0.8012523651123047, -0.7833175659179688, -0.7653827667236328, -0.7474479675292969, -0.7295131683349609, -0.711578369140625, -0.6936435699462891, -0.6757087707519531, -0.6577739715576172, -0.6398391723632812, -0.6219043731689453, -0.6039695739746094, -0.5860347747802734, -0.5680999755859375, -0.5501651763916016, -0.5322303771972656, -0.5142955780029297, -0.49636077880859375, -0.4784259796142578, -0.4604911804199219, -0.44255638122558594, -0.42462158203125, -0.40668678283691406, -0.3887519836425781, -0.3708171844482422, -0.35288238525390625, -0.3349475860595703, -0.3170127868652344, -0.29907798767089844, -0.2811431884765625, -0.26320838928222656, -0.24527359008789062, -0.2273387908935547, -0.20940399169921875, -0.1914691925048828, -0.17353439331054688, -0.15559959411621094, -0.137664794921875, -0.11972999572753906, -0.10179519653320312, -0.08386039733886719, -0.06592559814453125, -0.04799079895019531, -0.030055999755859375, -0.012121200561523438, 0.0058135986328125, 0.023748397827148438, 0.041683197021484375, 0.05961799621582031, 0.07755279541015625, 0.09548759460449219, 0.11342239379882812, 0.13135719299316406, 0.1492919921875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 4.0, 3.0, 4.0, 11.0, 7.0, 11.0, 30.0, 30.0, 33.0, 45.0, 54.0, 80.0, 100.0, 134.0, 151.0, 174.0, 906.0, 4122480.0, 68775.0, 588.0, 178.0, 119.0, 119.0, 65.0, 47.0, 50.0, 29.0, 23.0, 10.0, 13.0, 11.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-26.203125, -25.191162109375, -24.17919921875, -23.167236328125, -22.1552734375, -21.143310546875, -20.13134765625, -19.119384765625, -18.107421875, -17.095458984375, -16.08349609375, -15.071533203125, -14.0595703125, -13.047607421875, -12.03564453125, -11.023681640625, -10.01171875, -8.999755859375, -7.98779296875, -6.975830078125, -5.9638671875, -4.951904296875, -3.93994140625, -2.927978515625, -1.916015625, -0.904052734375, 0.10791015625, 1.119873046875, 2.1318359375, 3.143798828125, 4.15576171875, 5.167724609375, 6.1796875, 7.191650390625, 8.20361328125, 9.215576171875, 10.2275390625, 11.239501953125, 12.25146484375, 13.263427734375, 14.275390625, 15.287353515625, 16.29931640625, 17.311279296875, 18.3232421875, 19.335205078125, 20.34716796875, 21.359130859375, 22.37109375, 23.383056640625, 24.39501953125, 25.406982421875, 26.4189453125, 27.430908203125, 28.44287109375, 29.454833984375, 30.466796875, 31.478759765625, 32.49072265625, 33.502685546875, 34.5146484375, 35.526611328125, 36.53857421875, 37.550537109375, 38.5625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 9.0, 31.0, 695.0, 3216.0, 95.0, 28.0, 7.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3046875, -5.2008514404296875, -5.097015380859375, -4.9931793212890625, -4.88934326171875, -4.7855072021484375, -4.681671142578125, -4.5778350830078125, -4.4739990234375, -4.3701629638671875, -4.266326904296875, -4.1624908447265625, -4.05865478515625, -3.9548187255859375, -3.850982666015625, -3.7471466064453125, -3.643310546875, -3.5394744873046875, -3.435638427734375, -3.3318023681640625, -3.22796630859375, -3.1241302490234375, -3.020294189453125, -2.9164581298828125, -2.8126220703125, -2.7087860107421875, -2.604949951171875, -2.5011138916015625, -2.39727783203125, -2.2934417724609375, -2.189605712890625, -2.0857696533203125, -1.98193359375, -1.8780975341796875, -1.774261474609375, -1.6704254150390625, -1.56658935546875, -1.4627532958984375, -1.358917236328125, -1.2550811767578125, -1.1512451171875, -1.0474090576171875, -0.943572998046875, -0.8397369384765625, -0.73590087890625, -0.6320648193359375, -0.528228759765625, -0.4243927001953125, -0.320556640625, -0.2167205810546875, -0.112884521484375, -0.0090484619140625, 0.09478759765625, 0.1986236572265625, 0.302459716796875, 0.4062957763671875, 0.5101318359375, 0.6139678955078125, 0.717803955078125, 0.8216400146484375, 0.92547607421875, 1.0293121337890625, 1.133148193359375, 1.2369842529296875, 1.3408203125]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 6.0, 11.0, 59.0, 191.0, 528.0, 132.0, 42.0, 13.0, 8.0, 10.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.91761016845703, -33.957275390625, -32.9969367980957, -32.03660202026367, -31.076265335083008, -30.115928649902344, -29.155593872070312, -28.19525718688965, -27.234920501708984, -26.27458381652832, -25.31424903869629, -24.353912353515625, -23.39357566833496, -22.433238983154297, -21.472904205322266, -20.5125675201416, -19.55223274230957, -18.591896057128906, -17.631561279296875, -16.67122459411621, -15.710887908935547, -14.7505521774292, -13.790216445922852, -12.829879760742188, -11.86954402923584, -10.909208297729492, -9.948871612548828, -8.98853588104248, -8.028200149536133, -7.067863464355469, -6.107527732849121, -5.147191524505615, -4.186855316162109, -3.2265191078186035, -2.2661831378936768, -1.30584716796875, -0.34551095962524414, 0.6148252487182617, 1.5751609802246094, 2.5354971885681152, 3.495833396911621, 4.456169605255127, 5.416505813598633, 6.3768415451049805, 7.337177753448486, 8.297513961791992, 9.25784969329834, 10.218185424804688, 11.178522109985352, 12.1388578414917, 13.099194526672363, 14.059530258178711, 15.019866943359375, 15.980202674865723, 16.94053840637207, 17.900875091552734, 18.861209869384766, 19.82154655456543, 20.78188133239746, 21.742218017578125, 22.70255470275879, 23.662891387939453, 24.623226165771484, 25.58356285095215, 26.543899536132812]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 18.0, 23.0, 42.0, 83.0, 137.0, 147.0, 143.0, 152.0, 104.0, 69.0, 42.0, 18.0, 10.0, 7.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.900402069091797, -17.323759078979492, -16.747116088867188, -16.170475006103516, -15.593832015991211, -15.017189025878906, -14.440546989440918, -13.86390495300293, -13.287261962890625, -12.71061897277832, -12.133976936340332, -11.557334899902344, -10.980691909790039, -10.404048919677734, -9.827406883239746, -9.250764846801758, -8.674121856689453, -8.097478866577148, -7.52083683013916, -6.944194316864014, -6.367551803588867, -5.790909290313721, -5.214266777038574, -4.637624263763428, -4.060981750488281, -3.4843392372131348, -2.9076967239379883, -2.331054210662842, -1.7544116973876953, -1.1777691841125488, -0.6011266708374023, -0.02448415756225586, 0.5521602630615234, 1.12880277633667, 1.7054452896118164, 2.282087802886963, 2.8587303161621094, 3.435372829437256, 4.012015342712402, 4.588657855987549, 5.165300369262695, 5.741942882537842, 6.318585395812988, 6.895227909088135, 7.471870422363281, 8.048513412475586, 8.625155448913574, 9.201797485351562, 9.778440475463867, 10.355083465576172, 10.93172550201416, 11.508367538452148, 12.085010528564453, 12.661653518676758, 13.238295555114746, 13.814937591552734, 14.391580581665039, 14.968223571777344, 15.544865608215332, 16.12150764465332, 16.698150634765625, 17.27479362487793, 17.851436614990234, 18.428077697753906, 19.00472068786621]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 2.0, 5.0, 8.0, 12.0, 8.0, 10.0, 19.0, 25.0, 42.0, 56.0, 82.0, 137.0, 223.0, 472.0, 1221.0, 4247.0, 36116.0, 846199.0, 146645.0, 9496.0, 2023.0, 728.0, 316.0, 156.0, 97.0, 61.0, 31.0, 34.0, 24.0, 18.0, 13.0, 9.0, 3.0, 10.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0], "bins": [-12.296875, -11.9873046875, -11.677734375, -11.3681640625, -11.05859375, -10.7490234375, -10.439453125, -10.1298828125, -9.8203125, -9.5107421875, -9.201171875, -8.8916015625, -8.58203125, -8.2724609375, -7.962890625, -7.6533203125, -7.34375, -7.0341796875, -6.724609375, -6.4150390625, -6.10546875, -5.7958984375, -5.486328125, -5.1767578125, -4.8671875, -4.5576171875, -4.248046875, -3.9384765625, -3.62890625, -3.3193359375, -3.009765625, -2.7001953125, -2.390625, -2.0810546875, -1.771484375, -1.4619140625, -1.15234375, -0.8427734375, -0.533203125, -0.2236328125, 0.0859375, 0.3955078125, 0.705078125, 1.0146484375, 1.32421875, 1.6337890625, 1.943359375, 2.2529296875, 2.5625, 2.8720703125, 3.181640625, 3.4912109375, 3.80078125, 4.1103515625, 4.419921875, 4.7294921875, 5.0390625, 5.3486328125, 5.658203125, 5.9677734375, 6.27734375, 6.5869140625, 6.896484375, 7.2060546875, 7.515625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 10.0, 33.0, 45.0, 82.0, 113.0, 175.0, 175.0, 148.0, 97.0, 70.0, 26.0, 16.0, 7.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.416015625, -1.3846282958984375, -1.353240966796875, -1.3218536376953125, -1.29046630859375, -1.2590789794921875, -1.227691650390625, -1.1963043212890625, -1.1649169921875, -1.1335296630859375, -1.102142333984375, -1.0707550048828125, -1.03936767578125, -1.0079803466796875, -0.976593017578125, -0.9452056884765625, -0.913818359375, -0.8824310302734375, -0.851043701171875, -0.8196563720703125, -0.78826904296875, -0.7568817138671875, -0.725494384765625, -0.6941070556640625, -0.6627197265625, -0.6313323974609375, -0.599945068359375, -0.5685577392578125, -0.53717041015625, -0.5057830810546875, -0.474395751953125, -0.4430084228515625, -0.41162109375, -0.3802337646484375, -0.348846435546875, -0.3174591064453125, -0.28607177734375, -0.2546844482421875, -0.223297119140625, -0.1919097900390625, -0.1605224609375, -0.1291351318359375, -0.097747802734375, -0.0663604736328125, -0.03497314453125, -0.0035858154296875, 0.027801513671875, 0.0591888427734375, 0.090576171875, 0.1219635009765625, 0.153350830078125, 0.1847381591796875, 0.21612548828125, 0.2475128173828125, 0.278900146484375, 0.3102874755859375, 0.3416748046875, 0.3730621337890625, 0.404449462890625, 0.4358367919921875, 0.46722412109375, 0.4986114501953125, 0.529998779296875, 0.5613861083984375, 0.5927734375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 10.0, 7.0, 15.0, 17.0, 30.0, 24.0, 41.0, 48.0, 85.0, 118.0, 205.0, 309.0, 522.0, 978.0, 2166.0, 5188.0, 14144.0, 50524.0, 264538.0, 562995.0, 106394.0, 25639.0, 8138.0, 3120.0, 1372.0, 696.0, 424.0, 245.0, 170.0, 105.0, 75.0, 56.0, 33.0, 27.0, 26.0, 19.0, 18.0, 9.0, 5.0, 6.0, 5.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.9296875, -2.838836669921875, -2.74798583984375, -2.657135009765625, -2.5662841796875, -2.475433349609375, -2.38458251953125, -2.293731689453125, -2.202880859375, -2.112030029296875, -2.02117919921875, -1.930328369140625, -1.8394775390625, -1.748626708984375, -1.65777587890625, -1.566925048828125, -1.47607421875, -1.385223388671875, -1.29437255859375, -1.203521728515625, -1.1126708984375, -1.021820068359375, -0.93096923828125, -0.840118408203125, -0.749267578125, -0.658416748046875, -0.56756591796875, -0.476715087890625, -0.3858642578125, -0.295013427734375, -0.20416259765625, -0.113311767578125, -0.0224609375, 0.068389892578125, 0.15924072265625, 0.250091552734375, 0.3409423828125, 0.431793212890625, 0.52264404296875, 0.613494873046875, 0.704345703125, 0.795196533203125, 0.88604736328125, 0.976898193359375, 1.0677490234375, 1.158599853515625, 1.24945068359375, 1.340301513671875, 1.43115234375, 1.522003173828125, 1.61285400390625, 1.703704833984375, 1.7945556640625, 1.885406494140625, 1.97625732421875, 2.067108154296875, 2.157958984375, 2.248809814453125, 2.33966064453125, 2.430511474609375, 2.5213623046875, 2.612213134765625, 2.70306396484375, 2.793914794921875, 2.884765625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 6.0, 4.0, 3.0, 4.0, 8.0, 6.0, 12.0, 12.0, 15.0, 26.0, 39.0, 44.0, 52.0, 57.0, 63.0, 64.0, 56.0, 55.0, 67.0, 57.0, 52.0, 52.0, 44.0, 47.0, 23.0, 26.0, 32.0, 16.0, 14.0, 8.0, 14.0, 7.0, 1.0, 8.0, 3.0, 2.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8857421875, -1.8245391845703125, -1.763336181640625, -1.7021331787109375, -1.64093017578125, -1.5797271728515625, -1.518524169921875, -1.4573211669921875, -1.3961181640625, -1.3349151611328125, -1.273712158203125, -1.2125091552734375, -1.15130615234375, -1.0901031494140625, -1.028900146484375, -0.9676971435546875, -0.906494140625, -0.8452911376953125, -0.784088134765625, -0.7228851318359375, -0.66168212890625, -0.6004791259765625, -0.539276123046875, -0.4780731201171875, -0.4168701171875, -0.3556671142578125, -0.294464111328125, -0.2332611083984375, -0.17205810546875, -0.1108551025390625, -0.049652099609375, 0.0115509033203125, 0.07275390625, 0.1339569091796875, 0.195159912109375, 0.2563629150390625, 0.31756591796875, 0.3787689208984375, 0.439971923828125, 0.5011749267578125, 0.5623779296875, 0.6235809326171875, 0.684783935546875, 0.7459869384765625, 0.80718994140625, 0.8683929443359375, 0.929595947265625, 0.9907989501953125, 1.052001953125, 1.1132049560546875, 1.174407958984375, 1.2356109619140625, 1.29681396484375, 1.3580169677734375, 1.419219970703125, 1.4804229736328125, 1.5416259765625, 1.6028289794921875, 1.664031982421875, 1.7252349853515625, 1.78643798828125, 1.8476409912109375, 1.908843994140625, 1.9700469970703125, 2.03125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 2.0, 8.0, 7.0, 12.0, 13.0, 20.0, 31.0, 67.0, 136.0, 321.0, 901.0, 3570.0, 30665.0, 967866.0, 39163.0, 4117.0, 1025.0, 339.0, 126.0, 73.0, 40.0, 24.0, 7.0, 6.0, 11.0, 2.0, 1.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.625, -8.4222412109375, -8.219482421875, -8.0167236328125, -7.81396484375, -7.6112060546875, -7.408447265625, -7.2056884765625, -7.0029296875, -6.8001708984375, -6.597412109375, -6.3946533203125, -6.19189453125, -5.9891357421875, -5.786376953125, -5.5836181640625, -5.380859375, -5.1781005859375, -4.975341796875, -4.7725830078125, -4.56982421875, -4.3670654296875, -4.164306640625, -3.9615478515625, -3.7587890625, -3.5560302734375, -3.353271484375, -3.1505126953125, -2.94775390625, -2.7449951171875, -2.542236328125, -2.3394775390625, -2.13671875, -1.9339599609375, -1.731201171875, -1.5284423828125, -1.32568359375, -1.1229248046875, -0.920166015625, -0.7174072265625, -0.5146484375, -0.3118896484375, -0.109130859375, 0.0936279296875, 0.29638671875, 0.4991455078125, 0.701904296875, 0.9046630859375, 1.107421875, 1.3101806640625, 1.512939453125, 1.7156982421875, 1.91845703125, 2.1212158203125, 2.323974609375, 2.5267333984375, 2.7294921875, 2.9322509765625, 3.135009765625, 3.3377685546875, 3.54052734375, 3.7432861328125, 3.946044921875, 4.1488037109375, 4.3515625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 3.0, 4.0, 6.0, 14.0, 18.0, 18.0, 37.0, 54.0, 104.0, 163.0, 242.0, 130.0, 72.0, 54.0, 29.0, 18.0, 14.0, 10.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004093647003173828, -0.0003977753221988678, -0.0003861859440803528, -0.00037459656596183777, -0.00036300718784332275, -0.00035141780972480774, -0.0003398284316062927, -0.0003282390534877777, -0.0003166496753692627, -0.0003050602972507477, -0.00029347091913223267, -0.00028188154101371765, -0.00027029216289520264, -0.0002587027847766876, -0.0002471134066581726, -0.0002355240285396576, -0.00022393465042114258, -0.00021234527230262756, -0.00020075589418411255, -0.00018916651606559753, -0.00017757713794708252, -0.0001659877598285675, -0.0001543983817100525, -0.00014280900359153748, -0.00013121962547302246, -0.00011963024735450745, -0.00010804086923599243, -9.645149111747742e-05, -8.48621129989624e-05, -7.327273488044739e-05, -6.168335676193237e-05, -5.009397864341736e-05, -3.8504600524902344e-05, -2.691522240638733e-05, -1.5325844287872314e-05, -3.7364661693573e-06, 7.852911949157715e-06, 1.944229006767273e-05, 3.1031668186187744e-05, 4.262104630470276e-05, 5.4210424423217773e-05, 6.579980254173279e-05, 7.73891806602478e-05, 8.897855877876282e-05, 0.00010056793689727783, 0.00011215731501579285, 0.00012374669313430786, 0.00013533607125282288, 0.0001469254493713379, 0.0001585148274898529, 0.00017010420560836792, 0.00018169358372688293, 0.00019328296184539795, 0.00020487233996391296, 0.00021646171808242798, 0.000228051096200943, 0.000239640474319458, 0.000251229852437973, 0.00026281923055648804, 0.00027440860867500305, 0.00028599798679351807, 0.0002975873649120331, 0.0003091767430305481, 0.0003207661211490631, 0.0003323554992675781]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 5.0, 1.0, 5.0, 4.0, 5.0, 13.0, 15.0, 21.0, 30.0, 41.0, 84.0, 152.0, 260.0, 622.0, 1559.0, 5368.0, 27997.0, 854306.0, 141064.0, 12005.0, 2997.0, 1016.0, 428.0, 235.0, 124.0, 75.0, 52.0, 24.0, 23.0, 8.0, 10.0, 5.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.53125, -4.39300537109375, -4.2547607421875, -4.11651611328125, -3.978271484375, -3.84002685546875, -3.7017822265625, -3.56353759765625, -3.42529296875, -3.28704833984375, -3.1488037109375, -3.01055908203125, -2.872314453125, -2.73406982421875, -2.5958251953125, -2.45758056640625, -2.3193359375, -2.18109130859375, -2.0428466796875, -1.90460205078125, -1.766357421875, -1.62811279296875, -1.4898681640625, -1.35162353515625, -1.21337890625, -1.07513427734375, -0.9368896484375, -0.79864501953125, -0.660400390625, -0.52215576171875, -0.3839111328125, -0.24566650390625, -0.107421875, 0.03082275390625, 0.1690673828125, 0.30731201171875, 0.445556640625, 0.58380126953125, 0.7220458984375, 0.86029052734375, 0.99853515625, 1.13677978515625, 1.2750244140625, 1.41326904296875, 1.551513671875, 1.68975830078125, 1.8280029296875, 1.96624755859375, 2.1044921875, 2.24273681640625, 2.3809814453125, 2.51922607421875, 2.657470703125, 2.79571533203125, 2.9339599609375, 3.07220458984375, 3.21044921875, 3.34869384765625, 3.4869384765625, 3.62518310546875, 3.763427734375, 3.90167236328125, 4.0399169921875, 4.17816162109375, 4.31640625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 4.0, 12.0, 8.0, 8.0, 18.0, 10.0, 32.0, 66.0, 116.0, 172.0, 194.0, 153.0, 75.0, 50.0, 31.0, 12.0, 11.0, 5.0, 5.0, 3.0, 4.0, 4.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.787109375, -1.72991943359375, -1.6727294921875, -1.61553955078125, -1.558349609375, -1.50115966796875, -1.4439697265625, -1.38677978515625, -1.32958984375, -1.27239990234375, -1.2152099609375, -1.15802001953125, -1.100830078125, -1.04364013671875, -0.9864501953125, -0.92926025390625, -0.8720703125, -0.81488037109375, -0.7576904296875, -0.70050048828125, -0.643310546875, -0.58612060546875, -0.5289306640625, -0.47174072265625, -0.41455078125, -0.35736083984375, -0.3001708984375, -0.24298095703125, -0.185791015625, -0.12860107421875, -0.0714111328125, -0.01422119140625, 0.04296875, 0.10015869140625, 0.1573486328125, 0.21453857421875, 0.271728515625, 0.32891845703125, 0.3861083984375, 0.44329833984375, 0.50048828125, 0.55767822265625, 0.6148681640625, 0.67205810546875, 0.729248046875, 0.78643798828125, 0.8436279296875, 0.90081787109375, 0.9580078125, 1.01519775390625, 1.0723876953125, 1.12957763671875, 1.186767578125, 1.24395751953125, 1.3011474609375, 1.35833740234375, 1.41552734375, 1.47271728515625, 1.5299072265625, 1.58709716796875, 1.644287109375, 1.70147705078125, 1.7586669921875, 1.81585693359375, 1.873046875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 24.0, 385.0, 554.0, 40.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-150.13058471679688, -147.133056640625, -144.1355438232422, -141.13803100585938, -138.1405029296875, -135.14297485351562, -132.1454620361328, -129.14794921875, -126.15042114257812, -123.15290069580078, -120.15538024902344, -117.1578598022461, -114.16033935546875, -111.1628189086914, -108.16529846191406, -105.16777801513672, -102.17025756835938, -99.17273712158203, -96.17521667480469, -93.17769622802734, -90.18017578125, -87.18265533447266, -84.18513488769531, -81.18761444091797, -78.19009399414062, -75.19257354736328, -72.19505310058594, -69.1975326538086, -66.20001220703125, -63.202491760253906, -60.20497131347656, -57.20745086669922, -54.209930419921875, -51.21240997314453, -48.21488952636719, -45.217369079589844, -42.2198486328125, -39.222328186035156, -36.22480773925781, -33.22728729248047, -30.229766845703125, -27.23224639892578, -24.234725952148438, -21.237205505371094, -18.23968505859375, -15.242164611816406, -12.244644165039062, -9.247123718261719, -6.249603271484375, -3.2520828247070312, -0.2545623779296875, 2.7429580688476562, 5.740478515625, 8.737998962402344, 11.735519409179688, 14.733039855957031, 17.730560302734375, 20.72808074951172, 23.725601196289062, 26.723121643066406, 29.72064208984375, 32.718162536621094, 35.71568298339844, 38.71320343017578, 41.710723876953125]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 5.0, 8.0, 12.0, 11.0, 20.0, 20.0, 26.0, 40.0, 40.0, 45.0, 36.0, 54.0, 54.0, 45.0, 69.0, 54.0, 46.0, 55.0, 60.0, 54.0, 54.0, 37.0, 27.0, 22.0, 20.0, 22.0, 13.0, 18.0, 9.0, 6.0, 5.0, 6.0, 5.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.633420944213867, -10.228638648986816, -9.823857307434082, -9.419075012207031, -9.01429271697998, -8.609511375427246, -8.204729080200195, -7.799947261810303, -7.39516544342041, -6.990383625030518, -6.585601329803467, -6.180819511413574, -5.776037693023682, -5.371255874633789, -4.966473579406738, -4.561691761016846, -4.156909465789795, -3.7521274089813232, -3.3473455905914307, -2.942563533782959, -2.5377817153930664, -2.1329996585845947, -1.728217601776123, -1.3234357833862305, -0.9186537265777588, -0.5138717889785767, -0.10908979177474976, 0.29569220542907715, 0.7004741430282593, 1.1052560806274414, 1.510038137435913, 1.9148199558258057, 2.3196020126342773, 2.724384069442749, 3.1291658878326416, 3.5339479446411133, 3.938729763031006, 4.343511581420898, 4.748293876647949, 5.153075695037842, 5.557857513427734, 5.962639331817627, 6.367421627044678, 6.77220344543457, 7.176985263824463, 7.5817670822143555, 7.986549377441406, 8.39133071899414, 8.796113967895508, 9.200896263122559, 9.605677604675293, 10.010459899902344, 10.415242195129395, 10.820023536682129, 11.22480583190918, 11.629587173461914, 12.034369468688965, 12.439151763916016, 12.84393310546875, 13.2487154006958, 13.653497695922852, 14.058279037475586, 14.463061332702637, 14.867843627929688, 15.272624969482422]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 7.0, 1.0, 3.0, 1.0, 5.0, 7.0, 8.0, 7.0, 7.0, 5.0, 12.0, 8.0, 19.0, 21.0, 25.0, 31.0, 52.0, 67.0, 102.0, 148.0, 252.0, 467.0, 1197.0, 4314.0, 26137.0, 4049533.0, 98200.0, 10349.0, 2191.0, 645.0, 249.0, 98.0, 61.0, 33.0, 15.0, 13.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-19.375, -18.96044921875, -18.5458984375, -18.13134765625, -17.716796875, -17.30224609375, -16.8876953125, -16.47314453125, -16.05859375, -15.64404296875, -15.2294921875, -14.81494140625, -14.400390625, -13.98583984375, -13.5712890625, -13.15673828125, -12.7421875, -12.32763671875, -11.9130859375, -11.49853515625, -11.083984375, -10.66943359375, -10.2548828125, -9.84033203125, -9.42578125, -9.01123046875, -8.5966796875, -8.18212890625, -7.767578125, -7.35302734375, -6.9384765625, -6.52392578125, -6.109375, -5.69482421875, -5.2802734375, -4.86572265625, -4.451171875, -4.03662109375, -3.6220703125, -3.20751953125, -2.79296875, -2.37841796875, -1.9638671875, -1.54931640625, -1.134765625, -0.72021484375, -0.3056640625, 0.10888671875, 0.5234375, 0.93798828125, 1.3525390625, 1.76708984375, 2.181640625, 2.59619140625, 3.0107421875, 3.42529296875, 3.83984375, 4.25439453125, 4.6689453125, 5.08349609375, 5.498046875, 5.91259765625, 6.3271484375, 6.74169921875, 7.15625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 8.0, 5.0, 13.0, 32.0, 52.0, 85.0, 106.0, 122.0, 141.0, 134.0, 116.0, 73.0, 46.0, 39.0, 18.0, 2.0, 2.0, 5.0, 6.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.287109375, -1.2593917846679688, -1.2316741943359375, -1.2039566040039062, -1.176239013671875, -1.1485214233398438, -1.1208038330078125, -1.0930862426757812, -1.06536865234375, -1.0376510620117188, -1.0099334716796875, -0.9822158813476562, -0.954498291015625, -0.9267807006835938, -0.8990631103515625, -0.8713455200195312, -0.8436279296875, -0.8159103393554688, -0.7881927490234375, -0.7604751586914062, -0.732757568359375, -0.7050399780273438, -0.6773223876953125, -0.6496047973632812, -0.62188720703125, -0.5941696166992188, -0.5664520263671875, -0.5387344360351562, -0.511016845703125, -0.48329925537109375, -0.4555816650390625, -0.42786407470703125, -0.400146484375, -0.37242889404296875, -0.3447113037109375, -0.31699371337890625, -0.289276123046875, -0.26155853271484375, -0.2338409423828125, -0.20612335205078125, -0.17840576171875, -0.15068817138671875, -0.1229705810546875, -0.09525299072265625, -0.067535400390625, -0.03981781005859375, -0.0121002197265625, 0.01561737060546875, 0.0433349609375, 0.07105255126953125, 0.0987701416015625, 0.12648773193359375, 0.154205322265625, 0.18192291259765625, 0.2096405029296875, 0.23735809326171875, 0.26507568359375, 0.29279327392578125, 0.3205108642578125, 0.34822845458984375, 0.375946044921875, 0.40366363525390625, 0.4313812255859375, 0.45909881591796875, 0.48681640625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 8.0, 8.0, 18.0, 20.0, 32.0, 46.0, 73.0, 108.0, 233.0, 381.0, 1162.0, 49429.0, 4138417.0, 3408.0, 479.0, 222.0, 95.0, 56.0, 37.0, 19.0, 15.0, 9.0, 4.0, 1.0, 6.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-36.375, -35.37060546875, -34.3662109375, -33.36181640625, -32.357421875, -31.35302734375, -30.3486328125, -29.34423828125, -28.33984375, -27.33544921875, -26.3310546875, -25.32666015625, -24.322265625, -23.31787109375, -22.3134765625, -21.30908203125, -20.3046875, -19.30029296875, -18.2958984375, -17.29150390625, -16.287109375, -15.28271484375, -14.2783203125, -13.27392578125, -12.26953125, -11.26513671875, -10.2607421875, -9.25634765625, -8.251953125, -7.24755859375, -6.2431640625, -5.23876953125, -4.234375, -3.22998046875, -2.2255859375, -1.22119140625, -0.216796875, 0.78759765625, 1.7919921875, 2.79638671875, 3.80078125, 4.80517578125, 5.8095703125, 6.81396484375, 7.818359375, 8.82275390625, 9.8271484375, 10.83154296875, 11.8359375, 12.84033203125, 13.8447265625, 14.84912109375, 15.853515625, 16.85791015625, 17.8623046875, 18.86669921875, 19.87109375, 20.87548828125, 21.8798828125, 22.88427734375, 23.888671875, 24.89306640625, 25.8974609375, 26.90185546875, 27.90625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 7.0, 20.0, 41.0, 89.0, 2745.0, 997.0, 90.0, 44.0, 24.0, 18.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.69140625, -5.583892822265625, -5.47637939453125, -5.368865966796875, -5.2613525390625, -5.153839111328125, -5.04632568359375, -4.938812255859375, -4.831298828125, -4.723785400390625, -4.61627197265625, -4.508758544921875, -4.4012451171875, -4.293731689453125, -4.18621826171875, -4.078704833984375, -3.97119140625, -3.863677978515625, -3.75616455078125, -3.648651123046875, -3.5411376953125, -3.433624267578125, -3.32611083984375, -3.218597412109375, -3.111083984375, -3.003570556640625, -2.89605712890625, -2.788543701171875, -2.6810302734375, -2.573516845703125, -2.46600341796875, -2.358489990234375, -2.2509765625, -2.143463134765625, -2.03594970703125, -1.928436279296875, -1.8209228515625, -1.713409423828125, -1.60589599609375, -1.498382568359375, -1.390869140625, -1.283355712890625, -1.17584228515625, -1.068328857421875, -0.9608154296875, -0.853302001953125, -0.74578857421875, -0.638275146484375, -0.53076171875, -0.423248291015625, -0.31573486328125, -0.208221435546875, -0.1007080078125, 0.006805419921875, 0.11431884765625, 0.221832275390625, 0.329345703125, 0.436859130859375, 0.54437255859375, 0.651885986328125, 0.7593994140625, 0.866912841796875, 0.97442626953125, 1.081939697265625, 1.189453125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 9.0, 15.0, 62.0, 485.0, 366.0, 48.0, 10.0, 9.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.46833038330078, -21.216089248657227, -19.963848114013672, -18.711606979370117, -17.459365844726562, -16.207122802734375, -14.95488166809082, -13.702640533447266, -12.450399398803711, -11.198158264160156, -9.945917129516602, -8.69367504119873, -7.441433906555176, -6.189192771911621, -4.936951160430908, -3.6847095489501953, -2.4324684143066406, -1.1802270412445068, 0.07201433181762695, 1.3242557048797607, 2.5764970779418945, 3.828738212585449, 5.080979824066162, 6.333221435546875, 7.58546257019043, 8.837703704833984, 10.089944839477539, 11.34218692779541, 12.594428062438965, 13.84666919708252, 15.09891128540039, 16.351152420043945, 17.603397369384766, 18.85563850402832, 20.107879638671875, 21.36012077331543, 22.612361907958984, 23.864604949951172, 25.116846084594727, 26.36908721923828, 27.621328353881836, 28.87356948852539, 30.125810623168945, 31.3780517578125, 32.63029479980469, 33.88253402709961, 35.1347770690918, 36.38701629638672, 37.639259338378906, 38.891502380371094, 40.143741607666016, 41.3959846496582, 42.648223876953125, 43.90046691894531, 45.152706146240234, 46.40494918823242, 47.657188415527344, 48.90943145751953, 50.16167068481445, 51.41391372680664, 52.66615295410156, 53.91839599609375, 55.17063522338867, 56.42287826538086, 57.67512130737305]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 10.0, 24.0, 37.0, 50.0, 67.0, 90.0, 97.0, 99.0, 91.0, 105.0, 74.0, 65.0, 60.0, 46.0, 31.0, 13.0, 9.0, 13.0, 5.0, 6.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.894081115722656, -8.588213920593262, -8.28234577178955, -7.976478099822998, -7.670610427856445, -7.364743232727051, -7.058875560760498, -6.753007888793945, -6.447140216827393, -6.14127254486084, -5.835404872894287, -5.529537200927734, -5.22367000579834, -4.917801856994629, -4.611934661865234, -4.306066989898682, -4.000199317932129, -3.694331645965576, -3.3884639739990234, -3.08259654045105, -2.776728868484497, -2.4708611965179443, -2.1649937629699707, -1.859126091003418, -1.5532584190368652, -1.2473907470703125, -0.9415231943130493, -0.6356555819511414, -0.3297879695892334, -0.023920297622680664, 0.2819472551345825, 0.5878148078918457, 0.8936834335327148, 1.1995511054992676, 1.5054186582565308, 1.811286211013794, 2.1171538829803467, 2.4230215549468994, 2.728888988494873, 3.034756660461426, 3.3406243324279785, 3.6464920043945312, 3.952359676361084, 4.258227348327637, 4.564094543457031, 4.869962692260742, 5.175829887390137, 5.4816975593566895, 5.787565231323242, 6.093432903289795, 6.399300575256348, 6.7051682472229, 7.011035919189453, 7.316903114318848, 7.6227707862854, 7.928638458251953, 8.234506607055664, 8.540373802185059, 8.84624195098877, 9.152109146118164, 9.457977294921875, 9.76384449005127, 10.06971263885498, 10.375579833984375, 10.68144702911377]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 6.0, 7.0, 8.0, 14.0, 15.0, 15.0, 30.0, 51.0, 62.0, 93.0, 121.0, 204.0, 297.0, 522.0, 1014.0, 2372.0, 7421.0, 32821.0, 291166.0, 636005.0, 58661.0, 11321.0, 3315.0, 1325.0, 635.0, 354.0, 217.0, 131.0, 83.0, 73.0, 51.0, 37.0, 19.0, 16.0, 18.0, 16.0, 12.0, 2.0, 11.0, 6.0, 1.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-6.29296875, -6.0972900390625, -5.901611328125, -5.7059326171875, -5.51025390625, -5.3145751953125, -5.118896484375, -4.9232177734375, -4.7275390625, -4.5318603515625, -4.336181640625, -4.1405029296875, -3.94482421875, -3.7491455078125, -3.553466796875, -3.3577880859375, -3.162109375, -2.9664306640625, -2.770751953125, -2.5750732421875, -2.37939453125, -2.1837158203125, -1.988037109375, -1.7923583984375, -1.5966796875, -1.4010009765625, -1.205322265625, -1.0096435546875, -0.81396484375, -0.6182861328125, -0.422607421875, -0.2269287109375, -0.03125, 0.1644287109375, 0.360107421875, 0.5557861328125, 0.75146484375, 0.9471435546875, 1.142822265625, 1.3385009765625, 1.5341796875, 1.7298583984375, 1.925537109375, 2.1212158203125, 2.31689453125, 2.5125732421875, 2.708251953125, 2.9039306640625, 3.099609375, 3.2952880859375, 3.490966796875, 3.6866455078125, 3.88232421875, 4.0780029296875, 4.273681640625, 4.4693603515625, 4.6650390625, 4.8607177734375, 5.056396484375, 5.2520751953125, 5.44775390625, 5.6434326171875, 5.839111328125, 6.0347900390625, 6.23046875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 11.0, 5.0, 13.0, 21.0, 27.0, 67.0, 73.0, 91.0, 104.0, 122.0, 114.0, 124.0, 82.0, 49.0, 36.0, 28.0, 21.0, 8.0, 4.0, 0.0, 4.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.330078125, -1.2981491088867188, -1.2662200927734375, -1.2342910766601562, -1.202362060546875, -1.1704330444335938, -1.1385040283203125, -1.1065750122070312, -1.07464599609375, -1.0427169799804688, -1.0107879638671875, -0.9788589477539062, -0.946929931640625, -0.9150009155273438, -0.8830718994140625, -0.8511428833007812, -0.8192138671875, -0.7872848510742188, -0.7553558349609375, -0.7234268188476562, -0.691497802734375, -0.6595687866210938, -0.6276397705078125, -0.5957107543945312, -0.56378173828125, -0.5318527221679688, -0.4999237060546875, -0.46799468994140625, -0.436065673828125, -0.40413665771484375, -0.3722076416015625, -0.34027862548828125, -0.308349609375, -0.27642059326171875, -0.2444915771484375, -0.21256256103515625, -0.180633544921875, -0.14870452880859375, -0.1167755126953125, -0.08484649658203125, -0.05291748046875, -0.02098846435546875, 0.0109405517578125, 0.04286956787109375, 0.074798583984375, 0.10672760009765625, 0.1386566162109375, 0.17058563232421875, 0.2025146484375, 0.23444366455078125, 0.2663726806640625, 0.29830169677734375, 0.330230712890625, 0.36215972900390625, 0.3940887451171875, 0.42601776123046875, 0.45794677734375, 0.48987579345703125, 0.5218048095703125, 0.5537338256835938, 0.585662841796875, 0.6175918579101562, 0.6495208740234375, 0.6814498901367188, 0.71337890625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 8.0, 10.0, 12.0, 12.0, 21.0, 26.0, 45.0, 62.0, 63.0, 112.0, 190.0, 263.0, 399.0, 656.0, 1131.0, 2052.0, 3952.0, 8366.0, 19560.0, 52918.0, 179884.0, 498880.0, 187312.0, 54275.0, 20514.0, 8718.0, 4052.0, 2041.0, 1118.0, 673.0, 395.0, 263.0, 164.0, 120.0, 76.0, 63.0, 36.0, 24.0, 22.0, 20.0, 16.0, 10.0, 8.0, 5.0, 5.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-2.650390625, -2.568878173828125, -2.48736572265625, -2.405853271484375, -2.3243408203125, -2.242828369140625, -2.16131591796875, -2.079803466796875, -1.998291015625, -1.916778564453125, -1.83526611328125, -1.753753662109375, -1.6722412109375, -1.590728759765625, -1.50921630859375, -1.427703857421875, -1.34619140625, -1.264678955078125, -1.18316650390625, -1.101654052734375, -1.0201416015625, -0.938629150390625, -0.85711669921875, -0.775604248046875, -0.694091796875, -0.612579345703125, -0.53106689453125, -0.449554443359375, -0.3680419921875, -0.286529541015625, -0.20501708984375, -0.123504638671875, -0.0419921875, 0.039520263671875, 0.12103271484375, 0.202545166015625, 0.2840576171875, 0.365570068359375, 0.44708251953125, 0.528594970703125, 0.610107421875, 0.691619873046875, 0.77313232421875, 0.854644775390625, 0.9361572265625, 1.017669677734375, 1.09918212890625, 1.180694580078125, 1.26220703125, 1.343719482421875, 1.42523193359375, 1.506744384765625, 1.5882568359375, 1.669769287109375, 1.75128173828125, 1.832794189453125, 1.914306640625, 1.995819091796875, 2.07733154296875, 2.158843994140625, 2.2403564453125, 2.321868896484375, 2.40338134765625, 2.484893798828125, 2.56640625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 9.0, 7.0, 8.0, 16.0, 9.0, 11.0, 20.0, 22.0, 26.0, 22.0, 22.0, 34.0, 38.0, 47.0, 55.0, 46.0, 29.0, 53.0, 49.0, 47.0, 51.0, 49.0, 48.0, 46.0, 34.0, 34.0, 31.0, 30.0, 24.0, 19.0, 13.0, 16.0, 8.0, 8.0, 6.0, 2.0, 2.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.421875, -2.350616455078125, -2.27935791015625, -2.208099365234375, -2.1368408203125, -2.065582275390625, -1.99432373046875, -1.923065185546875, -1.851806640625, -1.780548095703125, -1.70928955078125, -1.638031005859375, -1.5667724609375, -1.495513916015625, -1.42425537109375, -1.352996826171875, -1.28173828125, -1.210479736328125, -1.13922119140625, -1.067962646484375, -0.9967041015625, -0.925445556640625, -0.85418701171875, -0.782928466796875, -0.711669921875, -0.640411376953125, -0.56915283203125, -0.497894287109375, -0.4266357421875, -0.355377197265625, -0.28411865234375, -0.212860107421875, -0.1416015625, -0.070343017578125, 0.00091552734375, 0.072174072265625, 0.1434326171875, 0.214691162109375, 0.28594970703125, 0.357208251953125, 0.428466796875, 0.499725341796875, 0.57098388671875, 0.642242431640625, 0.7135009765625, 0.784759521484375, 0.85601806640625, 0.927276611328125, 0.99853515625, 1.069793701171875, 1.14105224609375, 1.212310791015625, 1.2835693359375, 1.354827880859375, 1.42608642578125, 1.497344970703125, 1.568603515625, 1.639862060546875, 1.71112060546875, 1.782379150390625, 1.8536376953125, 1.924896240234375, 1.99615478515625, 2.067413330078125, 2.138671875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 3.0, 2.0, 2.0, 14.0, 4.0, 16.0, 21.0, 29.0, 45.0, 79.0, 128.0, 228.0, 402.0, 922.0, 2523.0, 9003.0, 66907.0, 886867.0, 68004.0, 8983.0, 2517.0, 853.0, 413.0, 237.0, 121.0, 73.0, 59.0, 31.0, 25.0, 15.0, 8.0, 5.0, 8.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.5625, -4.444000244140625, -4.32550048828125, -4.207000732421875, -4.0885009765625, -3.970001220703125, -3.85150146484375, -3.733001708984375, -3.614501953125, -3.496002197265625, -3.37750244140625, -3.259002685546875, -3.1405029296875, -3.022003173828125, -2.90350341796875, -2.785003662109375, -2.66650390625, -2.548004150390625, -2.42950439453125, -2.311004638671875, -2.1925048828125, -2.074005126953125, -1.95550537109375, -1.837005615234375, -1.718505859375, -1.600006103515625, -1.48150634765625, -1.363006591796875, -1.2445068359375, -1.126007080078125, -1.00750732421875, -0.889007568359375, -0.7705078125, -0.652008056640625, -0.53350830078125, -0.415008544921875, -0.2965087890625, -0.178009033203125, -0.05950927734375, 0.058990478515625, 0.177490234375, 0.295989990234375, 0.41448974609375, 0.532989501953125, 0.6514892578125, 0.769989013671875, 0.88848876953125, 1.006988525390625, 1.12548828125, 1.243988037109375, 1.36248779296875, 1.480987548828125, 1.5994873046875, 1.717987060546875, 1.83648681640625, 1.954986572265625, 2.073486328125, 2.191986083984375, 2.31048583984375, 2.428985595703125, 2.5474853515625, 2.665985107421875, 2.78448486328125, 2.902984619140625, 3.021484375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 2.0, 7.0, 8.0, 18.0, 22.0, 29.0, 47.0, 70.0, 173.0, 236.0, 164.0, 70.0, 45.0, 26.0, 20.0, 18.0, 15.0, 7.0, 8.0, 3.0, 7.0, 3.0, 1.0, 1.0, 2.0, 5.0, 0.0, 1.0], "bins": [-0.0006036758422851562, -0.0005904026329517365, -0.0005771294236183167, -0.0005638562142848969, -0.000550583004951477, -0.0005373097956180573, -0.0005240365862846375, -0.0005107633769512177, -0.0004974901676177979, -0.00048421695828437805, -0.00047094374895095825, -0.00045767053961753845, -0.00044439733028411865, -0.00043112412095069885, -0.00041785091161727905, -0.00040457770228385925, -0.00039130449295043945, -0.00037803128361701965, -0.00036475807428359985, -0.00035148486495018005, -0.00033821165561676025, -0.00032493844628334045, -0.00031166523694992065, -0.00029839202761650085, -0.00028511881828308105, -0.00027184560894966125, -0.00025857239961624146, -0.00024529919028282166, -0.00023202598094940186, -0.00021875277161598206, -0.00020547956228256226, -0.00019220635294914246, -0.00017893314361572266, -0.00016565993428230286, -0.00015238672494888306, -0.00013911351561546326, -0.00012584030628204346, -0.00011256709694862366, -9.929388761520386e-05, -8.602067828178406e-05, -7.274746894836426e-05, -5.947425961494446e-05, -4.620105028152466e-05, -3.292784094810486e-05, -1.965463161468506e-05, -6.381422281265259e-06, 6.891787052154541e-06, 2.016499638557434e-05, 3.343820571899414e-05, 4.671141505241394e-05, 5.998462438583374e-05, 7.325783371925354e-05, 8.653104305267334e-05, 9.980425238609314e-05, 0.00011307746171951294, 0.00012635067105293274, 0.00013962388038635254, 0.00015289708971977234, 0.00016617029905319214, 0.00017944350838661194, 0.00019271671772003174, 0.00020598992705345154, 0.00021926313638687134, 0.00023253634572029114, 0.00024580955505371094]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 8.0, 14.0, 9.0, 13.0, 13.0, 24.0, 22.0, 38.0, 72.0, 75.0, 111.0, 207.0, 265.0, 490.0, 793.0, 1411.0, 2649.0, 5336.0, 12444.0, 36278.0, 183814.0, 670083.0, 92419.0, 23748.0, 8889.0, 4184.0, 2111.0, 1191.0, 660.0, 431.0, 263.0, 161.0, 105.0, 74.0, 39.0, 28.0, 23.0, 13.0, 14.0, 5.0, 4.0, 6.0, 5.0, 3.0, 5.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 1.0, 2.0], "bins": [-1.7705078125, -1.715728759765625, -1.66094970703125, -1.606170654296875, -1.5513916015625, -1.496612548828125, -1.44183349609375, -1.387054443359375, -1.332275390625, -1.277496337890625, -1.22271728515625, -1.167938232421875, -1.1131591796875, -1.058380126953125, -1.00360107421875, -0.948822021484375, -0.89404296875, -0.839263916015625, -0.78448486328125, -0.729705810546875, -0.6749267578125, -0.620147705078125, -0.56536865234375, -0.510589599609375, -0.455810546875, -0.401031494140625, -0.34625244140625, -0.291473388671875, -0.2366943359375, -0.181915283203125, -0.12713623046875, -0.072357177734375, -0.017578125, 0.037200927734375, 0.09197998046875, 0.146759033203125, 0.2015380859375, 0.256317138671875, 0.31109619140625, 0.365875244140625, 0.420654296875, 0.475433349609375, 0.53021240234375, 0.584991455078125, 0.6397705078125, 0.694549560546875, 0.74932861328125, 0.804107666015625, 0.85888671875, 0.913665771484375, 0.96844482421875, 1.023223876953125, 1.0780029296875, 1.132781982421875, 1.18756103515625, 1.242340087890625, 1.297119140625, 1.351898193359375, 1.40667724609375, 1.461456298828125, 1.5162353515625, 1.571014404296875, 1.62579345703125, 1.680572509765625, 1.7353515625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 3.0, 5.0, 10.0, 12.0, 13.0, 6.0, 16.0, 27.0, 35.0, 38.0, 54.0, 52.0, 84.0, 85.0, 104.0, 97.0, 61.0, 65.0, 48.0, 29.0, 29.0, 26.0, 22.0, 16.0, 10.0, 10.0, 6.0, 7.0, 7.0, 3.0, 3.0, 5.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0546875, -1.0212249755859375, -0.987762451171875, -0.9542999267578125, -0.92083740234375, -0.8873748779296875, -0.853912353515625, -0.8204498291015625, -0.7869873046875, -0.7535247802734375, -0.720062255859375, -0.6865997314453125, -0.65313720703125, -0.6196746826171875, -0.586212158203125, -0.5527496337890625, -0.519287109375, -0.4858245849609375, -0.452362060546875, -0.4188995361328125, -0.38543701171875, -0.3519744873046875, -0.318511962890625, -0.2850494384765625, -0.2515869140625, -0.2181243896484375, -0.184661865234375, -0.1511993408203125, -0.11773681640625, -0.0842742919921875, -0.050811767578125, -0.0173492431640625, 0.01611328125, 0.0495758056640625, 0.083038330078125, 0.1165008544921875, 0.14996337890625, 0.1834259033203125, 0.216888427734375, 0.2503509521484375, 0.2838134765625, 0.3172760009765625, 0.350738525390625, 0.3842010498046875, 0.41766357421875, 0.4511260986328125, 0.484588623046875, 0.5180511474609375, 0.551513671875, 0.5849761962890625, 0.618438720703125, 0.6519012451171875, 0.68536376953125, 0.7188262939453125, 0.752288818359375, 0.7857513427734375, 0.8192138671875, 0.8526763916015625, 0.886138916015625, 0.9196014404296875, 0.95306396484375, 0.9865264892578125, 1.019989013671875, 1.0534515380859375, 1.0869140625]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 33.0, 69.0, 156.0, 255.0, 224.0, 125.0, 62.0, 36.0, 11.0, 9.0, 9.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.6658992767334, -27.667036056518555, -26.668170928955078, -25.669307708740234, -24.67044448852539, -23.671581268310547, -22.67271614074707, -21.673852920532227, -20.67498779296875, -19.676124572753906, -18.67725944519043, -17.678396224975586, -16.679533004760742, -15.680668830871582, -14.681804656982422, -13.682941436767578, -12.684078216552734, -11.685214042663574, -10.68635082244873, -9.68748664855957, -8.688623428344727, -7.689759254455566, -6.690895080566406, -5.692031383514404, -4.693167686462402, -3.6943039894104004, -2.6954400539398193, -1.6965761184692383, -0.6977124214172363, 0.3011512756347656, 1.3000154495239258, 2.2988791465759277, 3.2977447509765625, 4.2966084480285645, 5.295472145080566, 6.294336318969727, 7.2932000160217285, 8.29206371307373, 9.29092788696289, 10.289791107177734, 11.288655281066895, 12.287519454956055, 13.286382675170898, 14.285246849060059, 15.284111022949219, 16.282974243164062, 17.281837463378906, 18.280702590942383, 19.279565811157227, 20.27842903137207, 21.277294158935547, 22.27615737915039, 23.275020599365234, 24.273883819580078, 25.272748947143555, 26.2716121673584, 27.270477294921875, 28.26934051513672, 29.268205642700195, 30.26706886291504, 31.265932083129883, 32.26479721069336, 33.2636604309082, 34.26252365112305, 35.26138687133789]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 4.0, 5.0, 9.0, 12.0, 19.0, 23.0, 22.0, 35.0, 35.0, 41.0, 60.0, 72.0, 73.0, 69.0, 77.0, 77.0, 57.0, 55.0, 63.0, 35.0, 36.0, 32.0, 28.0, 23.0, 15.0, 12.0, 6.0, 6.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.603023529052734, -10.003554344177246, -9.404086112976074, -8.804616928100586, -8.205147743225098, -7.605679035186768, -7.0062103271484375, -6.406741142272949, -5.807272434234619, -5.207803726196289, -4.608334541320801, -4.008865833282471, -3.4093968868255615, -2.8099279403686523, -2.2104592323303223, -1.610990047454834, -1.011521339416504, -0.4120524525642395, 0.1874164342880249, 0.7868852615356445, 1.3863542079925537, 1.985823154449463, 2.585291862487793, 3.1847610473632812, 3.7842297554016113, 4.383698463439941, 4.98316764831543, 5.58263635635376, 6.18210506439209, 6.781574249267578, 7.381042957305908, 7.9805121421813965, 8.579980850219727, 9.179450035095215, 9.778918266296387, 10.378387451171875, 10.977856636047363, 11.577325820922852, 12.176794052124023, 12.776263236999512, 13.375732421875, 13.975201606750488, 14.57466983795166, 15.174139022827148, 15.773608207702637, 16.373077392578125, 16.972545623779297, 17.57201385498047, 18.17148208618164, 18.770950317382812, 19.370420455932617, 19.96988868713379, 20.56935691833496, 21.168827056884766, 21.768295288085938, 22.36776351928711, 22.967233657836914, 23.566701889038086, 24.16617202758789, 24.765640258789062, 25.365108489990234, 25.96457862854004, 26.56404685974121, 27.163516998291016, 27.762985229492188]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 7.0, 5.0, 5.0, 7.0, 6.0, 12.0, 10.0, 16.0, 19.0, 17.0, 24.0, 27.0, 27.0, 41.0, 56.0, 82.0, 101.0, 137.0, 206.0, 409.0, 851.0, 1976.0, 5782.0, 21060.0, 3967749.0, 172456.0, 15320.0, 4585.0, 1646.0, 715.0, 395.0, 202.0, 113.0, 62.0, 54.0, 31.0, 21.0, 13.0, 10.0, 6.0, 7.0, 3.0, 3.0, 1.0, 4.0, 3.0, 1.0, 1.0], "bins": [-14.390625, -14.03857421875, -13.6865234375, -13.33447265625, -12.982421875, -12.63037109375, -12.2783203125, -11.92626953125, -11.57421875, -11.22216796875, -10.8701171875, -10.51806640625, -10.166015625, -9.81396484375, -9.4619140625, -9.10986328125, -8.7578125, -8.40576171875, -8.0537109375, -7.70166015625, -7.349609375, -6.99755859375, -6.6455078125, -6.29345703125, -5.94140625, -5.58935546875, -5.2373046875, -4.88525390625, -4.533203125, -4.18115234375, -3.8291015625, -3.47705078125, -3.125, -2.77294921875, -2.4208984375, -2.06884765625, -1.716796875, -1.36474609375, -1.0126953125, -0.66064453125, -0.30859375, 0.04345703125, 0.3955078125, 0.74755859375, 1.099609375, 1.45166015625, 1.8037109375, 2.15576171875, 2.5078125, 2.85986328125, 3.2119140625, 3.56396484375, 3.916015625, 4.26806640625, 4.6201171875, 4.97216796875, 5.32421875, 5.67626953125, 6.0283203125, 6.38037109375, 6.732421875, 7.08447265625, 7.4365234375, 7.78857421875, 8.140625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 5.0, 29.0, 42.0, 52.0, 79.0, 98.0, 115.0, 125.0, 138.0, 92.0, 77.0, 55.0, 34.0, 27.0, 10.0, 10.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3408203125, -1.3050918579101562, -1.2693634033203125, -1.2336349487304688, -1.197906494140625, -1.1621780395507812, -1.1264495849609375, -1.0907211303710938, -1.05499267578125, -1.0192642211914062, -0.9835357666015625, -0.9478073120117188, -0.912078857421875, -0.8763504028320312, -0.8406219482421875, -0.8048934936523438, -0.7691650390625, -0.7334365844726562, -0.6977081298828125, -0.6619796752929688, -0.626251220703125, -0.5905227661132812, -0.5547943115234375, -0.5190658569335938, -0.48333740234375, -0.44760894775390625, -0.4118804931640625, -0.37615203857421875, -0.340423583984375, -0.30469512939453125, -0.2689666748046875, -0.23323822021484375, -0.197509765625, -0.16178131103515625, -0.1260528564453125, -0.09032440185546875, -0.054595947265625, -0.01886749267578125, 0.0168609619140625, 0.05258941650390625, 0.08831787109375, 0.12404632568359375, 0.1597747802734375, 0.19550323486328125, 0.231231689453125, 0.26696014404296875, 0.3026885986328125, 0.33841705322265625, 0.3741455078125, 0.40987396240234375, 0.4456024169921875, 0.48133087158203125, 0.517059326171875, 0.5527877807617188, 0.5885162353515625, 0.6242446899414062, 0.65997314453125, 0.6957015991210938, 0.7314300537109375, 0.7671585083007812, 0.802886962890625, 0.8386154174804688, 0.8743438720703125, 0.9100723266601562, 0.94580078125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 8.0, 5.0, 16.0, 29.0, 35.0, 50.0, 79.0, 129.0, 223.0, 313.0, 491.0, 742.0, 1546.0, 3437.0, 9400.0, 40112.0, 3780604.0, 319205.0, 25076.0, 6956.0, 2566.0, 1274.0, 775.0, 433.0, 242.0, 155.0, 120.0, 77.0, 61.0, 37.0, 29.0, 17.0, 13.0, 10.0, 6.0, 4.0, 0.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.68359375, -7.4566650390625, -7.229736328125, -7.0028076171875, -6.77587890625, -6.5489501953125, -6.322021484375, -6.0950927734375, -5.8681640625, -5.6412353515625, -5.414306640625, -5.1873779296875, -4.96044921875, -4.7335205078125, -4.506591796875, -4.2796630859375, -4.052734375, -3.8258056640625, -3.598876953125, -3.3719482421875, -3.14501953125, -2.9180908203125, -2.691162109375, -2.4642333984375, -2.2373046875, -2.0103759765625, -1.783447265625, -1.5565185546875, -1.32958984375, -1.1026611328125, -0.875732421875, -0.6488037109375, -0.421875, -0.1949462890625, 0.031982421875, 0.2589111328125, 0.48583984375, 0.7127685546875, 0.939697265625, 1.1666259765625, 1.3935546875, 1.6204833984375, 1.847412109375, 2.0743408203125, 2.30126953125, 2.5281982421875, 2.755126953125, 2.9820556640625, 3.208984375, 3.4359130859375, 3.662841796875, 3.8897705078125, 4.11669921875, 4.3436279296875, 4.570556640625, 4.7974853515625, 5.0244140625, 5.2513427734375, 5.478271484375, 5.7052001953125, 5.93212890625, 6.1590576171875, 6.385986328125, 6.6129150390625, 6.83984375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 8.0, 12.0, 11.0, 15.0, 17.0, 41.0, 65.0, 142.0, 866.0, 2524.0, 167.0, 70.0, 45.0, 35.0, 13.0, 16.0, 9.0, 6.0, 5.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6279296875, -1.5720367431640625, -1.516143798828125, -1.4602508544921875, -1.40435791015625, -1.3484649658203125, -1.292572021484375, -1.2366790771484375, -1.1807861328125, -1.1248931884765625, -1.069000244140625, -1.0131072998046875, -0.95721435546875, -0.9013214111328125, -0.845428466796875, -0.7895355224609375, -0.733642578125, -0.6777496337890625, -0.621856689453125, -0.5659637451171875, -0.51007080078125, -0.4541778564453125, -0.398284912109375, -0.3423919677734375, -0.2864990234375, -0.2306060791015625, -0.174713134765625, -0.1188201904296875, -0.06292724609375, -0.0070343017578125, 0.048858642578125, 0.1047515869140625, 0.16064453125, 0.2165374755859375, 0.272430419921875, 0.3283233642578125, 0.38421630859375, 0.4401092529296875, 0.496002197265625, 0.5518951416015625, 0.6077880859375, 0.6636810302734375, 0.719573974609375, 0.7754669189453125, 0.83135986328125, 0.8872528076171875, 0.943145751953125, 0.9990386962890625, 1.054931640625, 1.1108245849609375, 1.166717529296875, 1.2226104736328125, 1.27850341796875, 1.3343963623046875, 1.390289306640625, 1.4461822509765625, 1.5020751953125, 1.5579681396484375, 1.613861083984375, 1.6697540283203125, 1.72564697265625, 1.7815399169921875, 1.837432861328125, 1.8933258056640625, 1.94921875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 5.0, 5.0, 5.0, 17.0, 26.0, 89.0, 210.0, 375.0, 153.0, 65.0, 30.0, 8.0, 9.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.586057662963867, -18.125606536865234, -17.66515350341797, -17.204702377319336, -16.744251251220703, -16.28380012512207, -15.823347091674805, -15.362895965576172, -14.902444839477539, -14.44199275970459, -13.981541633605957, -13.521089553833008, -13.060638427734375, -12.600186347961426, -12.139734268188477, -11.679283142089844, -11.218831062316895, -10.758378982543945, -10.297927856445312, -9.837475776672363, -9.37702465057373, -8.916572570800781, -8.456121444702148, -7.995669364929199, -7.535217761993408, -7.074766159057617, -6.614314556121826, -6.153862953186035, -5.693410873413086, -5.232959747314453, -4.772507667541504, -4.312056064605713, -3.8516054153442383, -3.3911538124084473, -2.9307022094726562, -2.470250368118286, -2.009798765182495, -1.549347162246704, -1.088895320892334, -0.628443717956543, -0.16799211502075195, 0.29245954751968384, 0.7529112100601196, 1.2133629322052002, 1.6738145351409912, 2.1342661380767822, 2.5947179794311523, 3.0551695823669434, 3.5156211853027344, 3.9760727882385254, 4.436524391174316, 4.896976470947266, 5.357427597045898, 5.817879676818848, 6.278331279754639, 6.73878288269043, 7.199234485626221, 7.659686088562012, 8.120138168334961, 8.580589294433594, 9.041041374206543, 9.501492500305176, 9.961944580078125, 10.422395706176758, 10.882847785949707]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 9.0, 5.0, 13.0, 18.0, 19.0, 23.0, 19.0, 23.0, 38.0, 34.0, 43.0, 60.0, 53.0, 63.0, 67.0, 69.0, 52.0, 64.0, 52.0, 49.0, 38.0, 26.0, 27.0, 32.0, 27.0, 20.0, 6.0, 12.0, 13.0, 6.0, 9.0, 4.0, 4.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.373544216156006, -5.224605560302734, -5.075666427612305, -4.926727771759033, -4.7777886390686035, -4.628849983215332, -4.479910850524902, -4.330972194671631, -4.182033538818359, -4.033094882965088, -3.884155750274658, -3.7352168560028076, -3.586277961730957, -3.4373393058776855, -3.288400411605835, -3.1394615173339844, -2.9905223846435547, -2.841583490371704, -2.6926445960998535, -2.543705701828003, -2.3947668075561523, -2.245828151702881, -2.0968892574310303, -1.9479503631591797, -1.799011468887329, -1.6500725746154785, -1.501133680343628, -1.352194905281067, -1.2032560110092163, -1.0543171167373657, -0.9053782820701599, -0.7564394474029541, -0.6075010299682617, -0.4585621654987335, -0.3096233010292053, -0.16068443655967712, -0.011745572090148926, 0.13719332218170166, 0.28613215684890747, 0.4350709915161133, 0.5840098857879639, 0.7329487800598145, 0.8818876147270203, 1.030826449394226, 1.1797653436660767, 1.3287042379379272, 1.4776430130004883, 1.6265819072723389, 1.7755208015441895, 1.92445969581604, 2.0733985900878906, 2.222337484359741, 2.371276378631592, 2.5202150344848633, 2.669153928756714, 2.8180928230285645, 2.967031717300415, 3.1159706115722656, 3.264909505844116, 3.413848400115967, 3.5627870559692383, 3.711726188659668, 3.8606648445129395, 4.009603500366211, 4.158542633056641]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 2.0, 2.0, 8.0, 8.0, 20.0, 24.0, 25.0, 54.0, 59.0, 127.0, 241.0, 469.0, 1122.0, 3346.0, 19682.0, 471591.0, 524810.0, 21185.0, 3490.0, 1117.0, 508.0, 273.0, 151.0, 69.0, 50.0, 44.0, 20.0, 18.0, 8.0, 10.0, 4.0, 2.0, 3.0, 6.0, 1.0, 1.0, 0.0, 2.0], "bins": [-14.09375, -13.75830078125, -13.4228515625, -13.08740234375, -12.751953125, -12.41650390625, -12.0810546875, -11.74560546875, -11.41015625, -11.07470703125, -10.7392578125, -10.40380859375, -10.068359375, -9.73291015625, -9.3974609375, -9.06201171875, -8.7265625, -8.39111328125, -8.0556640625, -7.72021484375, -7.384765625, -7.04931640625, -6.7138671875, -6.37841796875, -6.04296875, -5.70751953125, -5.3720703125, -5.03662109375, -4.701171875, -4.36572265625, -4.0302734375, -3.69482421875, -3.359375, -3.02392578125, -2.6884765625, -2.35302734375, -2.017578125, -1.68212890625, -1.3466796875, -1.01123046875, -0.67578125, -0.34033203125, -0.0048828125, 0.33056640625, 0.666015625, 1.00146484375, 1.3369140625, 1.67236328125, 2.0078125, 2.34326171875, 2.6787109375, 3.01416015625, 3.349609375, 3.68505859375, 4.0205078125, 4.35595703125, 4.69140625, 5.02685546875, 5.3623046875, 5.69775390625, 6.033203125, 6.36865234375, 6.7041015625, 7.03955078125, 7.375]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 7.0, 11.0, 25.0, 49.0, 47.0, 81.0, 91.0, 113.0, 110.0, 134.0, 105.0, 85.0, 52.0, 32.0, 28.0, 9.0, 13.0, 1.0, 3.0, 0.0, 0.0, 6.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5966796875, -1.5582046508789062, -1.5197296142578125, -1.4812545776367188, -1.442779541015625, -1.4043045043945312, -1.3658294677734375, -1.3273544311523438, -1.28887939453125, -1.2504043579101562, -1.2119293212890625, -1.1734542846679688, -1.134979248046875, -1.0965042114257812, -1.0580291748046875, -1.0195541381835938, -0.9810791015625, -0.9426040649414062, -0.9041290283203125, -0.8656539916992188, -0.827178955078125, -0.7887039184570312, -0.7502288818359375, -0.7117538452148438, -0.67327880859375, -0.6348037719726562, -0.5963287353515625, -0.5578536987304688, -0.519378662109375, -0.48090362548828125, -0.4424285888671875, -0.40395355224609375, -0.365478515625, -0.32700347900390625, -0.2885284423828125, -0.25005340576171875, -0.211578369140625, -0.17310333251953125, -0.1346282958984375, -0.09615325927734375, -0.05767822265625, -0.01920318603515625, 0.0192718505859375, 0.05774688720703125, 0.096221923828125, 0.13469696044921875, 0.1731719970703125, 0.21164703369140625, 0.2501220703125, 0.28859710693359375, 0.3270721435546875, 0.36554718017578125, 0.404022216796875, 0.44249725341796875, 0.4809722900390625, 0.5194473266601562, 0.55792236328125, 0.5963973999023438, 0.6348724365234375, 0.6733474731445312, 0.711822509765625, 0.7502975463867188, 0.7887725830078125, 0.8272476196289062, 0.86572265625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 4.0, 3.0, 9.0, 11.0, 13.0, 13.0, 30.0, 29.0, 47.0, 83.0, 106.0, 221.0, 417.0, 830.0, 1914.0, 5098.0, 17049.0, 92411.0, 674073.0, 213399.0, 30167.0, 7619.0, 2625.0, 1123.0, 549.0, 292.0, 165.0, 79.0, 67.0, 31.0, 27.0, 20.0, 8.0, 8.0, 5.0, 2.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7578125, -4.57952880859375, -4.4012451171875, -4.22296142578125, -4.044677734375, -3.86639404296875, -3.6881103515625, -3.50982666015625, -3.33154296875, -3.15325927734375, -2.9749755859375, -2.79669189453125, -2.618408203125, -2.44012451171875, -2.2618408203125, -2.08355712890625, -1.9052734375, -1.72698974609375, -1.5487060546875, -1.37042236328125, -1.192138671875, -1.01385498046875, -0.8355712890625, -0.65728759765625, -0.47900390625, -0.30072021484375, -0.1224365234375, 0.05584716796875, 0.234130859375, 0.41241455078125, 0.5906982421875, 0.76898193359375, 0.947265625, 1.12554931640625, 1.3038330078125, 1.48211669921875, 1.660400390625, 1.83868408203125, 2.0169677734375, 2.19525146484375, 2.37353515625, 2.55181884765625, 2.7301025390625, 2.90838623046875, 3.086669921875, 3.26495361328125, 3.4432373046875, 3.62152099609375, 3.7998046875, 3.97808837890625, 4.1563720703125, 4.33465576171875, 4.512939453125, 4.69122314453125, 4.8695068359375, 5.04779052734375, 5.22607421875, 5.40435791015625, 5.5826416015625, 5.76092529296875, 5.939208984375, 6.11749267578125, 6.2957763671875, 6.47406005859375, 6.65234375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 2.0, 6.0, 7.0, 10.0, 15.0, 23.0, 21.0, 28.0, 28.0, 30.0, 54.0, 65.0, 77.0, 73.0, 77.0, 64.0, 82.0, 62.0, 53.0, 44.0, 47.0, 41.0, 27.0, 18.0, 12.0, 7.0, 14.0, 4.0, 4.0, 3.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-5.25390625, -5.13104248046875, -5.0081787109375, -4.88531494140625, -4.762451171875, -4.63958740234375, -4.5167236328125, -4.39385986328125, -4.27099609375, -4.14813232421875, -4.0252685546875, -3.90240478515625, -3.779541015625, -3.65667724609375, -3.5338134765625, -3.41094970703125, -3.2880859375, -3.16522216796875, -3.0423583984375, -2.91949462890625, -2.796630859375, -2.67376708984375, -2.5509033203125, -2.42803955078125, -2.30517578125, -2.18231201171875, -2.0594482421875, -1.93658447265625, -1.813720703125, -1.69085693359375, -1.5679931640625, -1.44512939453125, -1.322265625, -1.19940185546875, -1.0765380859375, -0.95367431640625, -0.830810546875, -0.70794677734375, -0.5850830078125, -0.46221923828125, -0.33935546875, -0.21649169921875, -0.0936279296875, 0.02923583984375, 0.152099609375, 0.27496337890625, 0.3978271484375, 0.52069091796875, 0.6435546875, 0.76641845703125, 0.8892822265625, 1.01214599609375, 1.135009765625, 1.25787353515625, 1.3807373046875, 1.50360107421875, 1.62646484375, 1.74932861328125, 1.8721923828125, 1.99505615234375, 2.117919921875, 2.24078369140625, 2.3636474609375, 2.48651123046875, 2.609375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 9.0, 10.0, 11.0, 14.0, 14.0, 18.0, 32.0, 42.0, 81.0, 97.0, 182.0, 269.0, 549.0, 1037.0, 2174.0, 5177.0, 14085.0, 47862.0, 275760.0, 573292.0, 91188.0, 22845.0, 7671.0, 3069.0, 1345.0, 697.0, 374.0, 225.0, 149.0, 62.0, 72.0, 32.0, 28.0, 31.0, 15.0, 13.0, 8.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3427734375, -1.293426513671875, -1.24407958984375, -1.194732666015625, -1.1453857421875, -1.096038818359375, -1.04669189453125, -0.997344970703125, -0.947998046875, -0.898651123046875, -0.84930419921875, -0.799957275390625, -0.7506103515625, -0.701263427734375, -0.65191650390625, -0.602569580078125, -0.55322265625, -0.503875732421875, -0.45452880859375, -0.405181884765625, -0.3558349609375, -0.306488037109375, -0.25714111328125, -0.207794189453125, -0.158447265625, -0.109100341796875, -0.05975341796875, -0.010406494140625, 0.0389404296875, 0.088287353515625, 0.13763427734375, 0.186981201171875, 0.236328125, 0.285675048828125, 0.33502197265625, 0.384368896484375, 0.4337158203125, 0.483062744140625, 0.53240966796875, 0.581756591796875, 0.631103515625, 0.680450439453125, 0.72979736328125, 0.779144287109375, 0.8284912109375, 0.877838134765625, 0.92718505859375, 0.976531982421875, 1.02587890625, 1.075225830078125, 1.12457275390625, 1.173919677734375, 1.2232666015625, 1.272613525390625, 1.32196044921875, 1.371307373046875, 1.420654296875, 1.470001220703125, 1.51934814453125, 1.568695068359375, 1.6180419921875, 1.667388916015625, 1.71673583984375, 1.766082763671875, 1.8154296875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 3.0, 4.0, 2.0, 5.0, 7.0, 9.0, 10.0, 7.0, 14.0, 45.0, 74.0, 168.0, 273.0, 197.0, 72.0, 37.0, 31.0, 15.0, 10.0, 5.0, 4.0, 6.0, 6.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005288124084472656, -0.0005089044570922852, -0.0004889965057373047, -0.0004690885543823242, -0.00044918060302734375, -0.0004292726516723633, -0.0004093647003173828, -0.00038945674896240234, -0.0003695487976074219, -0.0003496408462524414, -0.00032973289489746094, -0.00030982494354248047, -0.0002899169921875, -0.00027000904083251953, -0.00025010108947753906, -0.0002301931381225586, -0.00021028518676757812, -0.00019037723541259766, -0.0001704692840576172, -0.00015056133270263672, -0.00013065338134765625, -0.00011074542999267578, -9.083747863769531e-05, -7.092952728271484e-05, -5.1021575927734375e-05, -3.1113624572753906e-05, -1.1205673217773438e-05, 8.702278137207031e-06, 2.86102294921875e-05, 4.851818084716797e-05, 6.842613220214844e-05, 8.83340835571289e-05, 0.00010824203491210938, 0.00012814998626708984, 0.0001480579376220703, 0.00016796588897705078, 0.00018787384033203125, 0.00020778179168701172, 0.0002276897430419922, 0.00024759769439697266, 0.0002675056457519531, 0.0002874135971069336, 0.00030732154846191406, 0.00032722949981689453, 0.000347137451171875, 0.00036704540252685547, 0.00038695335388183594, 0.0004068613052368164, 0.0004267692565917969, 0.00044667720794677734, 0.0004665851593017578, 0.0004864931106567383, 0.0005064010620117188, 0.0005263090133666992, 0.0005462169647216797, 0.0005661249160766602, 0.0005860328674316406, 0.0006059408187866211, 0.0006258487701416016, 0.000645756721496582, 0.0006656646728515625, 0.000685572624206543, 0.0007054805755615234, 0.0007253885269165039, 0.0007452964782714844]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 4.0, 3.0, 3.0, 10.0, 11.0, 19.0, 25.0, 34.0, 63.0, 77.0, 134.0, 215.0, 407.0, 761.0, 1657.0, 4027.0, 12506.0, 49634.0, 370933.0, 518415.0, 65541.0, 15136.0, 5055.0, 1980.0, 880.0, 399.0, 253.0, 128.0, 89.0, 46.0, 32.0, 23.0, 16.0, 10.0, 10.0, 4.0, 4.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.29296875, -1.241424560546875, -1.18988037109375, -1.138336181640625, -1.0867919921875, -1.035247802734375, -0.98370361328125, -0.932159423828125, -0.880615234375, -0.829071044921875, -0.77752685546875, -0.725982666015625, -0.6744384765625, -0.622894287109375, -0.57135009765625, -0.519805908203125, -0.46826171875, -0.416717529296875, -0.36517333984375, -0.313629150390625, -0.2620849609375, -0.210540771484375, -0.15899658203125, -0.107452392578125, -0.055908203125, -0.004364013671875, 0.04718017578125, 0.098724365234375, 0.1502685546875, 0.201812744140625, 0.25335693359375, 0.304901123046875, 0.3564453125, 0.407989501953125, 0.45953369140625, 0.511077880859375, 0.5626220703125, 0.614166259765625, 0.66571044921875, 0.717254638671875, 0.768798828125, 0.820343017578125, 0.87188720703125, 0.923431396484375, 0.9749755859375, 1.026519775390625, 1.07806396484375, 1.129608154296875, 1.18115234375, 1.232696533203125, 1.28424072265625, 1.335784912109375, 1.3873291015625, 1.438873291015625, 1.49041748046875, 1.541961669921875, 1.593505859375, 1.645050048828125, 1.69659423828125, 1.748138427734375, 1.7996826171875, 1.851226806640625, 1.90277099609375, 1.954315185546875, 2.005859375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 8.0, 6.0, 10.0, 10.0, 8.0, 28.0, 23.0, 41.0, 52.0, 78.0, 89.0, 89.0, 102.0, 92.0, 91.0, 61.0, 57.0, 41.0, 35.0, 17.0, 17.0, 15.0, 8.0, 6.0, 1.0, 8.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.390625, -1.3564834594726562, -1.3223419189453125, -1.2882003784179688, -1.254058837890625, -1.2199172973632812, -1.1857757568359375, -1.1516342163085938, -1.11749267578125, -1.0833511352539062, -1.0492095947265625, -1.0150680541992188, -0.980926513671875, -0.9467849731445312, -0.9126434326171875, -0.8785018920898438, -0.8443603515625, -0.8102188110351562, -0.7760772705078125, -0.7419357299804688, -0.707794189453125, -0.6736526489257812, -0.6395111083984375, -0.6053695678710938, -0.57122802734375, -0.5370864868164062, -0.5029449462890625, -0.46880340576171875, -0.434661865234375, -0.40052032470703125, -0.3663787841796875, -0.33223724365234375, -0.298095703125, -0.26395416259765625, -0.2298126220703125, -0.19567108154296875, -0.161529541015625, -0.12738800048828125, -0.0932464599609375, -0.05910491943359375, -0.02496337890625, 0.00917816162109375, 0.0433197021484375, 0.07746124267578125, 0.111602783203125, 0.14574432373046875, 0.1798858642578125, 0.21402740478515625, 0.2481689453125, 0.28231048583984375, 0.3164520263671875, 0.35059356689453125, 0.384735107421875, 0.41887664794921875, 0.4530181884765625, 0.48715972900390625, 0.52130126953125, 0.5554428100585938, 0.5895843505859375, 0.6237258911132812, 0.657867431640625, 0.6920089721679688, 0.7261505126953125, 0.7602920532226562, 0.79443359375]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 11.0, 56.0, 227.0, 464.0, 178.0, 45.0, 13.0, 10.0, 4.0, 5.0], "bins": [-138.11410522460938, -135.7060546875, -133.29798889160156, -130.8899383544922, -128.4818878173828, -126.0738296508789, -123.66577911376953, -121.25772094726562, -118.84967041015625, -116.44161224365234, -114.03356170654297, -111.62550354003906, -109.21745300292969, -106.80939483642578, -104.4013442993164, -101.9932861328125, -99.58523559570312, -97.17717742919922, -94.76912689208984, -92.36106872558594, -89.95301818847656, -87.54496002197266, -85.13690948486328, -82.72885131835938, -80.32079315185547, -77.91273498535156, -75.50468444824219, -73.09662628173828, -70.6885757446289, -68.280517578125, -65.87246704101562, -63.46440887451172, -61.05635070800781, -58.64829635620117, -56.24024200439453, -53.83218765258789, -51.42413330078125, -49.01607894897461, -46.60802459716797, -44.19996643066406, -41.79191589355469, -39.38386154174805, -36.975807189941406, -34.567752838134766, -32.159698486328125, -29.751644134521484, -27.34358787536621, -24.93553352355957, -22.52747917175293, -20.11942481994629, -17.71137046813965, -15.303315162658691, -12.89526081085205, -10.48720645904541, -8.079151153564453, -5.6710968017578125, -3.263042449951172, -0.8549878597259521, 1.5530667304992676, 3.9611215591430664, 6.369175910949707, 8.777230262756348, 11.185285568237305, 13.593339920043945, 16.001394271850586]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 5.0, 5.0, 6.0, 19.0, 8.0, 17.0, 20.0, 26.0, 42.0, 53.0, 53.0, 49.0, 70.0, 70.0, 70.0, 81.0, 72.0, 73.0, 60.0, 46.0, 40.0, 28.0, 34.0, 12.0, 13.0, 10.0, 8.0, 7.0, 8.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.717491149902344, -26.97990608215332, -26.242321014404297, -25.504735946655273, -24.76715087890625, -24.029565811157227, -23.291980743408203, -22.554393768310547, -21.816810607910156, -21.079225540161133, -20.34164047241211, -19.604055404663086, -18.866470336914062, -18.12888526916504, -17.391300201416016, -16.65371322631836, -15.916128158569336, -15.178543090820312, -14.440958023071289, -13.703372955322266, -12.965787887573242, -12.228202819824219, -11.490616798400879, -10.753031730651855, -10.015446662902832, -9.277861595153809, -8.540276527404785, -7.8026909828186035, -7.06510591506958, -6.327520847320557, -5.589935302734375, -4.852350234985352, -4.114765167236328, -3.3771800994873047, -2.639594793319702, -1.9020094871520996, -1.1644244194030762, -0.42683935165405273, 0.3107461929321289, 1.0483312606811523, 1.7859163284301758, 2.523501396179199, 3.2610867023468018, 3.9986720085144043, 4.736257076263428, 5.473842144012451, 6.211427688598633, 6.949012756347656, 7.68659782409668, 8.424182891845703, 9.161767959594727, 9.89935302734375, 10.636938095092773, 11.374523162841797, 12.112109184265137, 12.84969425201416, 13.587279319763184, 14.324864387512207, 15.06244945526123, 15.80003547668457, 16.537620544433594, 17.275205612182617, 18.01279067993164, 18.750375747680664, 19.487960815429688]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 3.0, 4.0, 4.0, 4.0, 2.0, 12.0, 4.0, 8.0, 6.0, 7.0, 5.0, 9.0, 16.0, 20.0, 31.0, 20.0, 37.0, 43.0, 48.0, 59.0, 49.0, 94.0, 120.0, 178.0, 270.0, 440.0, 884.0, 2121.0, 5556.0, 17471.0, 89500.0, 3990216.0, 64448.0, 14664.0, 4721.0, 1667.0, 709.0, 323.0, 162.0, 113.0, 74.0, 67.0, 44.0, 24.0, 9.0, 8.0, 6.0, 6.0, 1.0, 2.0], "bins": [-14.3046875, -13.98968505859375, -13.6746826171875, -13.35968017578125, -13.044677734375, -12.72967529296875, -12.4146728515625, -12.09967041015625, -11.78466796875, -11.46966552734375, -11.1546630859375, -10.83966064453125, -10.524658203125, -10.20965576171875, -9.8946533203125, -9.57965087890625, -9.2646484375, -8.94964599609375, -8.6346435546875, -8.31964111328125, -8.004638671875, -7.68963623046875, -7.3746337890625, -7.05963134765625, -6.74462890625, -6.42962646484375, -6.1146240234375, -5.79962158203125, -5.484619140625, -5.16961669921875, -4.8546142578125, -4.53961181640625, -4.224609375, -3.90960693359375, -3.5946044921875, -3.27960205078125, -2.964599609375, -2.64959716796875, -2.3345947265625, -2.01959228515625, -1.70458984375, -1.38958740234375, -1.0745849609375, -0.75958251953125, -0.444580078125, -0.12957763671875, 0.1854248046875, 0.50042724609375, 0.8154296875, 1.13043212890625, 1.4454345703125, 1.76043701171875, 2.075439453125, 2.39044189453125, 2.7054443359375, 3.02044677734375, 3.33544921875, 3.65045166015625, 3.9654541015625, 4.28045654296875, 4.595458984375, 4.91046142578125, 5.2254638671875, 5.54046630859375, 5.85546875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 6.0, 4.0, 4.0, 9.0, 15.0, 26.0, 35.0, 59.0, 67.0, 75.0, 117.0, 102.0, 118.0, 106.0, 80.0, 56.0, 57.0, 27.0, 22.0, 15.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.638671875, -1.6002883911132812, -1.5619049072265625, -1.5235214233398438, -1.485137939453125, -1.4467544555664062, -1.4083709716796875, -1.3699874877929688, -1.33160400390625, -1.2932205200195312, -1.2548370361328125, -1.2164535522460938, -1.178070068359375, -1.1396865844726562, -1.1013031005859375, -1.0629196166992188, -1.0245361328125, -0.9861526489257812, -0.9477691650390625, -0.9093856811523438, -0.871002197265625, -0.8326187133789062, -0.7942352294921875, -0.7558517456054688, -0.71746826171875, -0.6790847778320312, -0.6407012939453125, -0.6023178100585938, -0.563934326171875, -0.5255508422851562, -0.4871673583984375, -0.44878387451171875, -0.410400390625, -0.37201690673828125, -0.3336334228515625, -0.29524993896484375, -0.256866455078125, -0.21848297119140625, -0.1800994873046875, -0.14171600341796875, -0.10333251953125, -0.06494903564453125, -0.0265655517578125, 0.01181793212890625, 0.050201416015625, 0.08858489990234375, 0.1269683837890625, 0.16535186767578125, 0.2037353515625, 0.24211883544921875, 0.2805023193359375, 0.31888580322265625, 0.357269287109375, 0.39565277099609375, 0.4340362548828125, 0.47241973876953125, 0.51080322265625, 0.5491867065429688, 0.5875701904296875, 0.6259536743164062, 0.664337158203125, 0.7027206420898438, 0.7411041259765625, 0.7794876098632812, 0.81787109375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 5.0, 10.0, 10.0, 18.0, 21.0, 29.0, 46.0, 61.0, 126.0, 229.0, 491.0, 1173.0, 3850.0, 22350.0, 4026566.0, 127855.0, 8135.0, 1967.0, 687.0, 286.0, 128.0, 93.0, 50.0, 30.0, 22.0, 13.0, 11.0, 7.0, 8.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.953125, -13.3662109375, -12.779296875, -12.1923828125, -11.60546875, -11.0185546875, -10.431640625, -9.8447265625, -9.2578125, -8.6708984375, -8.083984375, -7.4970703125, -6.91015625, -6.3232421875, -5.736328125, -5.1494140625, -4.5625, -3.9755859375, -3.388671875, -2.8017578125, -2.21484375, -1.6279296875, -1.041015625, -0.4541015625, 0.1328125, 0.7197265625, 1.306640625, 1.8935546875, 2.48046875, 3.0673828125, 3.654296875, 4.2412109375, 4.828125, 5.4150390625, 6.001953125, 6.5888671875, 7.17578125, 7.7626953125, 8.349609375, 8.9365234375, 9.5234375, 10.1103515625, 10.697265625, 11.2841796875, 11.87109375, 12.4580078125, 13.044921875, 13.6318359375, 14.21875, 14.8056640625, 15.392578125, 15.9794921875, 16.56640625, 17.1533203125, 17.740234375, 18.3271484375, 18.9140625, 19.5009765625, 20.087890625, 20.6748046875, 21.26171875, 21.8486328125, 22.435546875, 23.0224609375, 23.609375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 11.0, 4.0, 22.0, 18.0, 35.0, 47.0, 116.0, 570.0, 2838.0, 228.0, 85.0, 39.0, 22.0, 16.0, 6.0, 5.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0], "bins": [-6.54296875, -6.4100799560546875, -6.277191162109375, -6.1443023681640625, -6.01141357421875, -5.8785247802734375, -5.745635986328125, -5.6127471923828125, -5.4798583984375, -5.3469696044921875, -5.214080810546875, -5.0811920166015625, -4.94830322265625, -4.8154144287109375, -4.682525634765625, -4.5496368408203125, -4.416748046875, -4.2838592529296875, -4.150970458984375, -4.0180816650390625, -3.88519287109375, -3.7523040771484375, -3.619415283203125, -3.4865264892578125, -3.3536376953125, -3.2207489013671875, -3.087860107421875, -2.9549713134765625, -2.82208251953125, -2.6891937255859375, -2.556304931640625, -2.4234161376953125, -2.29052734375, -2.1576385498046875, -2.024749755859375, -1.8918609619140625, -1.75897216796875, -1.6260833740234375, -1.493194580078125, -1.3603057861328125, -1.2274169921875, -1.0945281982421875, -0.961639404296875, -0.8287506103515625, -0.69586181640625, -0.5629730224609375, -0.430084228515625, -0.2971954345703125, -0.164306640625, -0.0314178466796875, 0.101470947265625, 0.2343597412109375, 0.36724853515625, 0.5001373291015625, 0.633026123046875, 0.7659149169921875, 0.8988037109375, 1.0316925048828125, 1.164581298828125, 1.2974700927734375, 1.43035888671875, 1.5632476806640625, 1.696136474609375, 1.8290252685546875, 1.9619140625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 1.0, 1.0, 3.0, 7.0, 11.0, 32.0, 78.0, 254.0, 381.0, 163.0, 47.0, 13.0, 11.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.16647720336914, -41.94157409667969, -40.71666717529297, -39.491764068603516, -38.26686096191406, -37.04195785522461, -35.817054748535156, -34.59214782714844, -33.367244720458984, -32.14234161376953, -30.917436599731445, -29.69253158569336, -28.467628479003906, -27.242725372314453, -26.017820358276367, -24.79291534423828, -23.568012237548828, -22.343109130859375, -21.11820411682129, -19.893299102783203, -18.66839599609375, -17.443492889404297, -16.21858787536621, -14.993683815002441, -13.768779754638672, -12.543875694274902, -11.318971633911133, -10.094067573547363, -8.869163513183594, -7.644259452819824, -6.419355392456055, -5.194451332092285, -3.96954345703125, -2.7446393966674805, -1.519735336303711, -0.2948312759399414, 0.9300727844238281, 2.1549768447875977, 3.379880905151367, 4.604784965515137, 5.829689025878906, 7.054593086242676, 8.279497146606445, 9.504401206970215, 10.729305267333984, 11.954209327697754, 13.179113388061523, 14.404017448425293, 15.628921508789062, 16.853824615478516, 18.0787296295166, 19.303634643554688, 20.52853775024414, 21.753440856933594, 22.97834587097168, 24.203250885009766, 25.42815399169922, 26.653057098388672, 27.877962112426758, 29.102867126464844, 30.327770233154297, 31.55267333984375, 32.77758026123047, 34.00248336791992, 35.227386474609375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 2.0, 7.0, 16.0, 17.0, 29.0, 51.0, 48.0, 82.0, 97.0, 101.0, 115.0, 110.0, 85.0, 73.0, 53.0, 45.0, 32.0, 14.0, 14.0, 7.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.67136001586914, -19.122207641601562, -18.573057174682617, -18.02390480041504, -17.47475242614746, -16.925601959228516, -16.376449584960938, -15.82729721069336, -15.278145790100098, -14.728994369506836, -14.179841995239258, -13.630690574645996, -13.081539154052734, -12.532386779785156, -11.983235359191895, -11.434083938598633, -10.884931564331055, -10.335780143737793, -9.786627769470215, -9.237476348876953, -8.688323974609375, -8.139172554016113, -7.590021133422852, -7.040869235992432, -6.491717338562012, -5.942565441131592, -5.393413543701172, -4.84426212310791, -4.29511022567749, -3.7459583282470703, -3.1968066692352295, -2.6476550102233887, -2.098504066467285, -1.5493522882461548, -1.0002005100250244, -0.45104873180389404, 0.09810304641723633, 0.6472549438476562, 1.196406602859497, 1.745558261871338, 2.294710159301758, 2.8438620567321777, 3.3930137157440186, 3.9421653747558594, 4.491317272186279, 5.040469169616699, 5.589620590209961, 6.138772487640381, 6.687924385070801, 7.237076282501221, 7.786228179931641, 8.335379600524902, 8.884531021118164, 9.433683395385742, 9.982834815979004, 10.531986236572266, 11.081138610839844, 11.630290031433105, 12.179442405700684, 12.728593826293945, 13.277746200561523, 13.826897621154785, 14.376049041748047, 14.925201416015625, 15.474352836608887]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 4.0, 1.0, 2.0, 4.0, 15.0, 11.0, 12.0, 23.0, 23.0, 29.0, 51.0, 72.0, 78.0, 142.0, 188.0, 314.0, 542.0, 1041.0, 2697.0, 11568.0, 90878.0, 786134.0, 133566.0, 15077.0, 3267.0, 1205.0, 581.0, 324.0, 223.0, 141.0, 91.0, 70.0, 45.0, 34.0, 27.0, 18.0, 14.0, 23.0, 4.0, 4.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.7890625, -8.52728271484375, -8.2655029296875, -8.00372314453125, -7.741943359375, -7.48016357421875, -7.2183837890625, -6.95660400390625, -6.69482421875, -6.43304443359375, -6.1712646484375, -5.90948486328125, -5.647705078125, -5.38592529296875, -5.1241455078125, -4.86236572265625, -4.6005859375, -4.33880615234375, -4.0770263671875, -3.81524658203125, -3.553466796875, -3.29168701171875, -3.0299072265625, -2.76812744140625, -2.50634765625, -2.24456787109375, -1.9827880859375, -1.72100830078125, -1.459228515625, -1.19744873046875, -0.9356689453125, -0.67388916015625, -0.412109375, -0.15032958984375, 0.1114501953125, 0.37322998046875, 0.635009765625, 0.89678955078125, 1.1585693359375, 1.42034912109375, 1.68212890625, 1.94390869140625, 2.2056884765625, 2.46746826171875, 2.729248046875, 2.99102783203125, 3.2528076171875, 3.51458740234375, 3.7763671875, 4.03814697265625, 4.2999267578125, 4.56170654296875, 4.823486328125, 5.08526611328125, 5.3470458984375, 5.60882568359375, 5.87060546875, 6.13238525390625, 6.3941650390625, 6.65594482421875, 6.917724609375, 7.17950439453125, 7.4412841796875, 7.70306396484375, 7.96484375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 6.0, 17.0, 24.0, 45.0, 51.0, 107.0, 100.0, 135.0, 154.0, 95.0, 89.0, 74.0, 42.0, 30.0, 17.0, 9.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8642578125, -1.817596435546875, -1.77093505859375, -1.724273681640625, -1.6776123046875, -1.630950927734375, -1.58428955078125, -1.537628173828125, -1.490966796875, -1.444305419921875, -1.39764404296875, -1.350982666015625, -1.3043212890625, -1.257659912109375, -1.21099853515625, -1.164337158203125, -1.11767578125, -1.071014404296875, -1.02435302734375, -0.977691650390625, -0.9310302734375, -0.884368896484375, -0.83770751953125, -0.791046142578125, -0.744384765625, -0.697723388671875, -0.65106201171875, -0.604400634765625, -0.5577392578125, -0.511077880859375, -0.46441650390625, -0.417755126953125, -0.37109375, -0.324432373046875, -0.27777099609375, -0.231109619140625, -0.1844482421875, -0.137786865234375, -0.09112548828125, -0.044464111328125, 0.002197265625, 0.048858642578125, 0.09552001953125, 0.142181396484375, 0.1888427734375, 0.235504150390625, 0.28216552734375, 0.328826904296875, 0.37548828125, 0.422149658203125, 0.46881103515625, 0.515472412109375, 0.5621337890625, 0.608795166015625, 0.65545654296875, 0.702117919921875, 0.748779296875, 0.795440673828125, 0.84210205078125, 0.888763427734375, 0.9354248046875, 0.982086181640625, 1.02874755859375, 1.075408935546875, 1.1220703125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 11.0, 15.0, 9.0, 19.0, 29.0, 34.0, 57.0, 96.0, 154.0, 261.0, 546.0, 1083.0, 2426.0, 5693.0, 15341.0, 46706.0, 186560.0, 538740.0, 180414.0, 45372.0, 14829.0, 5434.0, 2358.0, 1069.0, 556.0, 303.0, 170.0, 102.0, 59.0, 37.0, 24.0, 16.0, 8.0, 11.0, 2.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.921875, -3.8172607421875, -3.712646484375, -3.6080322265625, -3.50341796875, -3.3988037109375, -3.294189453125, -3.1895751953125, -3.0849609375, -2.9803466796875, -2.875732421875, -2.7711181640625, -2.66650390625, -2.5618896484375, -2.457275390625, -2.3526611328125, -2.248046875, -2.1434326171875, -2.038818359375, -1.9342041015625, -1.82958984375, -1.7249755859375, -1.620361328125, -1.5157470703125, -1.4111328125, -1.3065185546875, -1.201904296875, -1.0972900390625, -0.99267578125, -0.8880615234375, -0.783447265625, -0.6788330078125, -0.57421875, -0.4696044921875, -0.364990234375, -0.2603759765625, -0.15576171875, -0.0511474609375, 0.053466796875, 0.1580810546875, 0.2626953125, 0.3673095703125, 0.471923828125, 0.5765380859375, 0.68115234375, 0.7857666015625, 0.890380859375, 0.9949951171875, 1.099609375, 1.2042236328125, 1.308837890625, 1.4134521484375, 1.51806640625, 1.6226806640625, 1.727294921875, 1.8319091796875, 1.9365234375, 2.0411376953125, 2.145751953125, 2.2503662109375, 2.35498046875, 2.4595947265625, 2.564208984375, 2.6688232421875, 2.7734375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 1.0, 0.0, 4.0, 7.0, 7.0, 7.0, 6.0, 13.0, 10.0, 24.0, 18.0, 18.0, 25.0, 32.0, 23.0, 40.0, 38.0, 28.0, 39.0, 57.0, 38.0, 39.0, 41.0, 40.0, 50.0, 38.0, 35.0, 37.0, 44.0, 29.0, 34.0, 21.0, 30.0, 21.0, 17.0, 13.0, 13.0, 16.0, 7.0, 8.0, 10.0, 8.0, 6.0, 7.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.533203125, -2.457855224609375, -2.38250732421875, -2.307159423828125, -2.2318115234375, -2.156463623046875, -2.08111572265625, -2.005767822265625, -1.930419921875, -1.855072021484375, -1.77972412109375, -1.704376220703125, -1.6290283203125, -1.553680419921875, -1.47833251953125, -1.402984619140625, -1.32763671875, -1.252288818359375, -1.17694091796875, -1.101593017578125, -1.0262451171875, -0.950897216796875, -0.87554931640625, -0.800201416015625, -0.724853515625, -0.649505615234375, -0.57415771484375, -0.498809814453125, -0.4234619140625, -0.348114013671875, -0.27276611328125, -0.197418212890625, -0.1220703125, -0.046722412109375, 0.02862548828125, 0.103973388671875, 0.1793212890625, 0.254669189453125, 0.33001708984375, 0.405364990234375, 0.480712890625, 0.556060791015625, 0.63140869140625, 0.706756591796875, 0.7821044921875, 0.857452392578125, 0.93280029296875, 1.008148193359375, 1.08349609375, 1.158843994140625, 1.23419189453125, 1.309539794921875, 1.3848876953125, 1.460235595703125, 1.53558349609375, 1.610931396484375, 1.686279296875, 1.761627197265625, 1.83697509765625, 1.912322998046875, 1.9876708984375, 2.063018798828125, 2.13836669921875, 2.213714599609375, 2.2890625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 7.0, 12.0, 6.0, 4.0, 10.0, 11.0, 25.0, 44.0, 38.0, 52.0, 90.0, 162.0, 258.0, 540.0, 1113.0, 2742.0, 8099.0, 31990.0, 203831.0, 666326.0, 103744.0, 19912.0, 5653.0, 1993.0, 837.0, 431.0, 214.0, 144.0, 91.0, 45.0, 28.0, 34.0, 19.0, 11.0, 12.0, 5.0, 5.0, 5.0, 5.0, 6.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1328125, -2.06011962890625, -1.9874267578125, -1.91473388671875, -1.842041015625, -1.76934814453125, -1.6966552734375, -1.62396240234375, -1.55126953125, -1.47857666015625, -1.4058837890625, -1.33319091796875, -1.260498046875, -1.18780517578125, -1.1151123046875, -1.04241943359375, -0.9697265625, -0.89703369140625, -0.8243408203125, -0.75164794921875, -0.678955078125, -0.60626220703125, -0.5335693359375, -0.46087646484375, -0.38818359375, -0.31549072265625, -0.2427978515625, -0.17010498046875, -0.097412109375, -0.02471923828125, 0.0479736328125, 0.12066650390625, 0.193359375, 0.26605224609375, 0.3387451171875, 0.41143798828125, 0.484130859375, 0.55682373046875, 0.6295166015625, 0.70220947265625, 0.77490234375, 0.84759521484375, 0.9202880859375, 0.99298095703125, 1.065673828125, 1.13836669921875, 1.2110595703125, 1.28375244140625, 1.3564453125, 1.42913818359375, 1.5018310546875, 1.57452392578125, 1.647216796875, 1.71990966796875, 1.7926025390625, 1.86529541015625, 1.93798828125, 2.01068115234375, 2.0833740234375, 2.15606689453125, 2.228759765625, 2.30145263671875, 2.3741455078125, 2.44683837890625, 2.51953125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 5.0, 6.0, 9.0, 6.0, 12.0, 20.0, 17.0, 40.0, 44.0, 60.0, 62.0, 106.0, 130.0, 120.0, 105.0, 63.0, 52.0, 34.0, 39.0, 13.0, 12.0, 15.0, 6.0, 4.0, 7.0, 4.0, 4.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00032639503479003906, -0.00031581148505210876, -0.00030522793531417847, -0.00029464438557624817, -0.00028406083583831787, -0.0002734772861003876, -0.0002628937363624573, -0.000252310186624527, -0.00024172663688659668, -0.00023114308714866638, -0.00022055953741073608, -0.00020997598767280579, -0.0001993924379348755, -0.0001888088881969452, -0.0001782253384590149, -0.0001676417887210846, -0.0001570582389831543, -0.000146474689245224, -0.0001358911395072937, -0.0001253075897693634, -0.0001147240400314331, -0.00010414049029350281, -9.355694055557251e-05, -8.297339081764221e-05, -7.238984107971191e-05, -6.180629134178162e-05, -5.122274160385132e-05, -4.063919186592102e-05, -3.0055642127990723e-05, -1.9472092390060425e-05, -8.888542652130127e-06, 1.695007085800171e-06, 1.2278556823730469e-05, 2.2862106561660767e-05, 3.3445656299591064e-05, 4.402920603752136e-05, 5.461275577545166e-05, 6.519630551338196e-05, 7.577985525131226e-05, 8.636340498924255e-05, 9.694695472717285e-05, 0.00010753050446510315, 0.00011811405420303345, 0.00012869760394096375, 0.00013928115367889404, 0.00014986470341682434, 0.00016044825315475464, 0.00017103180289268494, 0.00018161535263061523, 0.00019219890236854553, 0.00020278245210647583, 0.00021336600184440613, 0.00022394955158233643, 0.00023453310132026672, 0.000245116651058197, 0.0002557002007961273, 0.0002662837505340576, 0.0002768673002719879, 0.0002874508500099182, 0.0002980343997478485, 0.0003086179494857788, 0.0003192014992237091, 0.0003297850489616394, 0.0003403685986995697, 0.0003509521484375]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 8.0, 7.0, 7.0, 13.0, 21.0, 39.0, 54.0, 100.0, 141.0, 221.0, 351.0, 630.0, 1200.0, 2626.0, 6335.0, 17884.0, 71663.0, 528840.0, 344210.0, 50695.0, 13788.0, 5075.0, 2114.0, 1102.0, 575.0, 328.0, 188.0, 112.0, 81.0, 50.0, 30.0, 23.0, 22.0, 7.0, 5.0, 6.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.181640625, -2.119110107421875, -2.05657958984375, -1.994049072265625, -1.9315185546875, -1.868988037109375, -1.80645751953125, -1.743927001953125, -1.681396484375, -1.618865966796875, -1.55633544921875, -1.493804931640625, -1.4312744140625, -1.368743896484375, -1.30621337890625, -1.243682861328125, -1.18115234375, -1.118621826171875, -1.05609130859375, -0.993560791015625, -0.9310302734375, -0.868499755859375, -0.80596923828125, -0.743438720703125, -0.680908203125, -0.618377685546875, -0.55584716796875, -0.493316650390625, -0.4307861328125, -0.368255615234375, -0.30572509765625, -0.243194580078125, -0.1806640625, -0.118133544921875, -0.05560302734375, 0.006927490234375, 0.0694580078125, 0.131988525390625, 0.19451904296875, 0.257049560546875, 0.319580078125, 0.382110595703125, 0.44464111328125, 0.507171630859375, 0.5697021484375, 0.632232666015625, 0.69476318359375, 0.757293701171875, 0.81982421875, 0.882354736328125, 0.94488525390625, 1.007415771484375, 1.0699462890625, 1.132476806640625, 1.19500732421875, 1.257537841796875, 1.320068359375, 1.382598876953125, 1.44512939453125, 1.507659912109375, 1.5701904296875, 1.632720947265625, 1.69525146484375, 1.757781982421875, 1.8203125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 5.0, 5.0, 4.0, 10.0, 17.0, 14.0, 21.0, 26.0, 52.0, 77.0, 71.0, 104.0, 106.0, 103.0, 106.0, 76.0, 44.0, 46.0, 27.0, 20.0, 13.0, 13.0, 12.0, 12.0, 6.0, 1.0, 4.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.736328125, -1.6866607666015625, -1.636993408203125, -1.5873260498046875, -1.53765869140625, -1.4879913330078125, -1.438323974609375, -1.3886566162109375, -1.3389892578125, -1.2893218994140625, -1.239654541015625, -1.1899871826171875, -1.14031982421875, -1.0906524658203125, -1.040985107421875, -0.9913177490234375, -0.941650390625, -0.8919830322265625, -0.842315673828125, -0.7926483154296875, -0.74298095703125, -0.6933135986328125, -0.643646240234375, -0.5939788818359375, -0.5443115234375, -0.4946441650390625, -0.444976806640625, -0.3953094482421875, -0.34564208984375, -0.2959747314453125, -0.246307373046875, -0.1966400146484375, -0.14697265625, -0.0973052978515625, -0.047637939453125, 0.0020294189453125, 0.05169677734375, 0.1013641357421875, 0.151031494140625, 0.2006988525390625, 0.2503662109375, 0.3000335693359375, 0.349700927734375, 0.3993682861328125, 0.44903564453125, 0.4987030029296875, 0.548370361328125, 0.5980377197265625, 0.647705078125, 0.6973724365234375, 0.747039794921875, 0.7967071533203125, 0.84637451171875, 0.8960418701171875, 0.945709228515625, 0.9953765869140625, 1.0450439453125, 1.0947113037109375, 1.144378662109375, 1.1940460205078125, 1.24371337890625, 1.2933807373046875, 1.343048095703125, 1.3927154541015625, 1.4423828125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 8.0, 19.0, 51.0, 187.0, 355.0, 221.0, 96.0, 39.0, 20.0, 8.0, 2.0, 4.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.96515655517578, -68.32442474365234, -66.68370056152344, -65.04296875, -63.40224075317383, -61.761512756347656, -60.12078094482422, -58.48005294799805, -56.839324951171875, -55.1985969543457, -53.557865142822266, -51.917137145996094, -50.27640914916992, -48.63568115234375, -46.99494934082031, -45.35422134399414, -43.71349334716797, -42.0727653503418, -40.43203353881836, -38.79130554199219, -37.150577545166016, -35.509849548339844, -33.869117736816406, -32.228389739990234, -30.587657928466797, -28.946928024291992, -27.30620002746582, -25.665470123291016, -24.024742126464844, -22.38401222229004, -20.743282318115234, -19.102554321289062, -17.46182632446289, -15.821097373962402, -14.180368423461914, -12.53963851928711, -10.898910522460938, -9.258180618286133, -7.6174516677856445, -5.976722717285156, -4.335993766784668, -2.6952648162841797, -1.0545356273651123, 0.5861935615539551, 2.2269225120544434, 3.86765193939209, 5.508380889892578, 7.149109840393066, 8.789838790893555, 10.430567741394043, 12.071296691894531, 13.712026596069336, 15.352754592895508, 16.993484497070312, 18.634212493896484, 20.27494239807129, 21.915672302246094, 23.5564022064209, 25.19713020324707, 26.837860107421875, 28.478588104248047, 30.11931800842285, 31.760047912597656, 33.40077590942383, 35.04150390625]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 6.0, 6.0, 10.0, 11.0, 16.0, 19.0, 27.0, 23.0, 19.0, 24.0, 33.0, 36.0, 43.0, 44.0, 52.0, 48.0, 45.0, 48.0, 36.0, 54.0, 43.0, 48.0, 57.0, 40.0, 27.0, 27.0, 28.0, 29.0, 22.0, 29.0, 9.0, 9.0, 8.0, 10.0, 8.0, 1.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-17.02634048461914, -16.503665924072266, -15.980989456176758, -15.458313941955566, -14.935638427734375, -14.412962913513184, -13.890287399291992, -13.367612838745117, -12.84493637084961, -12.322260856628418, -11.799585342407227, -11.276909828186035, -10.754234313964844, -10.231558799743652, -9.708883285522461, -9.186208724975586, -8.663533210754395, -8.140857696533203, -7.618182182312012, -7.09550666809082, -6.572831153869629, -6.0501556396484375, -5.527480602264404, -5.004805088043213, -4.4821295738220215, -3.95945405960083, -3.4367785453796387, -2.9141032695770264, -2.391427755355835, -1.8687522411346436, -1.3460769653320312, -0.8234014511108398, -0.30072593688964844, 0.2219495177268982, 0.7446249723434448, 1.2673003673553467, 1.789975881576538, 2.3126513957977295, 2.835326671600342, 3.358002185821533, 3.8806777000427246, 4.403353214263916, 4.926028728485107, 5.448703765869141, 5.971379280090332, 6.494054794311523, 7.016730308532715, 7.539405822753906, 8.062081336975098, 8.584756851196289, 9.10743236541748, 9.630107879638672, 10.152783393859863, 10.675458908081055, 11.19813346862793, 11.720809936523438, 12.243484497070312, 12.766160011291504, 13.288835525512695, 13.811511039733887, 14.334186553955078, 14.85686206817627, 15.379537582397461, 15.902212142944336, 16.424888610839844]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 2.0, 3.0, 4.0, 6.0, 3.0, 6.0, 9.0, 7.0, 11.0, 19.0, 19.0, 19.0, 25.0, 30.0, 39.0, 53.0, 69.0, 108.0, 167.0, 239.0, 593.0, 1606.0, 5917.0, 40207.0, 4105124.0, 31995.0, 5433.0, 1454.0, 524.0, 229.0, 134.0, 74.0, 53.0, 31.0, 24.0, 11.0, 12.0, 8.0, 7.0, 6.0, 2.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-18.890625, -18.423583984375, -17.95654296875, -17.489501953125, -17.0224609375, -16.555419921875, -16.08837890625, -15.621337890625, -15.154296875, -14.687255859375, -14.22021484375, -13.753173828125, -13.2861328125, -12.819091796875, -12.35205078125, -11.885009765625, -11.41796875, -10.950927734375, -10.48388671875, -10.016845703125, -9.5498046875, -9.082763671875, -8.61572265625, -8.148681640625, -7.681640625, -7.214599609375, -6.74755859375, -6.280517578125, -5.8134765625, -5.346435546875, -4.87939453125, -4.412353515625, -3.9453125, -3.478271484375, -3.01123046875, -2.544189453125, -2.0771484375, -1.610107421875, -1.14306640625, -0.676025390625, -0.208984375, 0.258056640625, 0.72509765625, 1.192138671875, 1.6591796875, 2.126220703125, 2.59326171875, 3.060302734375, 3.52734375, 3.994384765625, 4.46142578125, 4.928466796875, 5.3955078125, 5.862548828125, 6.32958984375, 6.796630859375, 7.263671875, 7.730712890625, 8.19775390625, 8.664794921875, 9.1318359375, 9.598876953125, 10.06591796875, 10.532958984375, 11.0]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 5.0, 10.0, 13.0, 25.0, 26.0, 48.0, 84.0, 94.0, 99.0, 128.0, 112.0, 94.0, 76.0, 81.0, 43.0, 26.0, 17.0, 13.0, 7.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.796875, -1.75164794921875, -1.7064208984375, -1.66119384765625, -1.615966796875, -1.57073974609375, -1.5255126953125, -1.48028564453125, -1.43505859375, -1.38983154296875, -1.3446044921875, -1.29937744140625, -1.254150390625, -1.20892333984375, -1.1636962890625, -1.11846923828125, -1.0732421875, -1.02801513671875, -0.9827880859375, -0.93756103515625, -0.892333984375, -0.84710693359375, -0.8018798828125, -0.75665283203125, -0.71142578125, -0.66619873046875, -0.6209716796875, -0.57574462890625, -0.530517578125, -0.48529052734375, -0.4400634765625, -0.39483642578125, -0.349609375, -0.30438232421875, -0.2591552734375, -0.21392822265625, -0.168701171875, -0.12347412109375, -0.0782470703125, -0.03302001953125, 0.01220703125, 0.05743408203125, 0.1026611328125, 0.14788818359375, 0.193115234375, 0.23834228515625, 0.2835693359375, 0.32879638671875, 0.3740234375, 0.41925048828125, 0.4644775390625, 0.50970458984375, 0.554931640625, 0.60015869140625, 0.6453857421875, 0.69061279296875, 0.73583984375, 0.78106689453125, 0.8262939453125, 0.87152099609375, 0.916748046875, 0.96197509765625, 1.0072021484375, 1.05242919921875, 1.09765625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 7.0, 4.0, 5.0, 4.0, 9.0, 17.0, 18.0, 21.0, 41.0, 61.0, 97.0, 125.0, 188.0, 364.0, 656.0, 1258.0, 2546.0, 5485.0, 13196.0, 43051.0, 1040174.0, 3013660.0, 47778.0, 13814.0, 5784.0, 2648.0, 1408.0, 774.0, 409.0, 241.0, 142.0, 85.0, 56.0, 55.0, 33.0, 16.0, 15.0, 11.0, 13.0, 4.0, 4.0, 5.0, 3.0, 3.0, 2.0], "bins": [-7.15625, -6.97747802734375, -6.7987060546875, -6.61993408203125, -6.441162109375, -6.26239013671875, -6.0836181640625, -5.90484619140625, -5.72607421875, -5.54730224609375, -5.3685302734375, -5.18975830078125, -5.010986328125, -4.83221435546875, -4.6534423828125, -4.47467041015625, -4.2958984375, -4.11712646484375, -3.9383544921875, -3.75958251953125, -3.580810546875, -3.40203857421875, -3.2232666015625, -3.04449462890625, -2.86572265625, -2.68695068359375, -2.5081787109375, -2.32940673828125, -2.150634765625, -1.97186279296875, -1.7930908203125, -1.61431884765625, -1.435546875, -1.25677490234375, -1.0780029296875, -0.89923095703125, -0.720458984375, -0.54168701171875, -0.3629150390625, -0.18414306640625, -0.00537109375, 0.17340087890625, 0.3521728515625, 0.53094482421875, 0.709716796875, 0.88848876953125, 1.0672607421875, 1.24603271484375, 1.4248046875, 1.60357666015625, 1.7823486328125, 1.96112060546875, 2.139892578125, 2.31866455078125, 2.4974365234375, 2.67620849609375, 2.85498046875, 3.03375244140625, 3.2125244140625, 3.39129638671875, 3.570068359375, 3.74884033203125, 3.9276123046875, 4.10638427734375, 4.28515625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 5.0, 1.0, 2.0, 3.0, 8.0, 9.0, 12.0, 10.0, 21.0, 21.0, 46.0, 61.0, 141.0, 590.0, 2597.0, 245.0, 120.0, 56.0, 36.0, 26.0, 16.0, 11.0, 5.0, 5.0, 6.0, 5.0, 3.0, 4.0, 3.0, 2.0, 7.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3974609375, -1.3373870849609375, -1.277313232421875, -1.2172393798828125, -1.15716552734375, -1.0970916748046875, -1.037017822265625, -0.9769439697265625, -0.9168701171875, -0.8567962646484375, -0.796722412109375, -0.7366485595703125, -0.67657470703125, -0.6165008544921875, -0.556427001953125, -0.4963531494140625, -0.436279296875, -0.3762054443359375, -0.316131591796875, -0.2560577392578125, -0.19598388671875, -0.1359100341796875, -0.075836181640625, -0.0157623291015625, 0.0443115234375, 0.1043853759765625, 0.164459228515625, 0.2245330810546875, 0.28460693359375, 0.3446807861328125, 0.404754638671875, 0.4648284912109375, 0.52490234375, 0.5849761962890625, 0.645050048828125, 0.7051239013671875, 0.76519775390625, 0.8252716064453125, 0.885345458984375, 0.9454193115234375, 1.0054931640625, 1.0655670166015625, 1.125640869140625, 1.1857147216796875, 1.24578857421875, 1.3058624267578125, 1.365936279296875, 1.4260101318359375, 1.486083984375, 1.5461578369140625, 1.606231689453125, 1.6663055419921875, 1.72637939453125, 1.7864532470703125, 1.846527099609375, 1.9066009521484375, 1.9666748046875, 2.0267486572265625, 2.086822509765625, 2.1468963623046875, 2.20697021484375, 2.2670440673828125, 2.327117919921875, 2.3871917724609375, 2.447265625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 14.0, 37.0, 53.0, 143.0, 366.0, 240.0, 98.0, 39.0, 14.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.569042205810547, -8.864547729492188, -8.160053253173828, -7.4555583000183105, -6.751063346862793, -6.046568870544434, -5.342074394226074, -4.637579441070557, -3.9330849647521973, -3.228590250015259, -2.5240955352783203, -1.819601058959961, -1.1151063442230225, -0.410611629486084, 0.2938828468322754, 0.998377799987793, 1.7028722763061523, 2.407366991043091, 3.1118617057800293, 3.8163561820983887, 4.520851135253906, 5.225345611572266, 5.929840087890625, 6.634335041046143, 7.338829517364502, 8.04332447052002, 8.747818946838379, 9.452313423156738, 10.156807899475098, 10.861303329467773, 11.565797805786133, 12.270292282104492, 12.974786758422852, 13.679281234741211, 14.38377571105957, 15.08827018737793, 15.792765617370605, 16.49726104736328, 17.20175552368164, 17.90625, 18.61074447631836, 19.31523895263672, 20.019733428955078, 20.724227905273438, 21.428722381591797, 22.133216857910156, 22.837711334228516, 23.542207717895508, 24.246700286865234, 24.951194763183594, 25.655689239501953, 26.360183715820312, 27.064678192138672, 27.76917266845703, 28.47366714477539, 29.178163528442383, 29.882658004760742, 30.5871524810791, 31.29164695739746, 31.99614143371582, 32.70063781738281, 33.40513229370117, 34.10962677001953, 34.81412124633789, 35.51861572265625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 2.0, 3.0, 3.0, 7.0, 9.0, 7.0, 9.0, 12.0, 9.0, 17.0, 22.0, 25.0, 18.0, 20.0, 33.0, 38.0, 35.0, 33.0, 40.0, 48.0, 48.0, 48.0, 47.0, 36.0, 41.0, 46.0, 32.0, 37.0, 38.0, 37.0, 26.0, 23.0, 21.0, 19.0, 24.0, 15.0, 14.0, 14.0, 15.0, 10.0, 6.0, 7.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.502102375030518, -4.361291408538818, -4.220480918884277, -4.079669952392578, -3.938858985900879, -3.7980480194091797, -3.6572372913360596, -3.5164265632629395, -3.3756155967712402, -3.234804630279541, -3.093993902206421, -2.953183174133301, -2.8123722076416016, -2.6715612411499023, -2.5307505130767822, -2.389939785003662, -2.249128818511963, -2.1083178520202637, -1.9675071239471436, -1.8266962766647339, -1.6858854293823242, -1.5450745820999146, -1.4042637348175049, -1.2634528875350952, -1.1226420402526855, -0.9818311929702759, -0.8410203456878662, -0.7002094984054565, -0.5593986511230469, -0.4185878038406372, -0.27777695655822754, -0.13696610927581787, 0.0038442611694335938, 0.14465510845184326, 0.28546595573425293, 0.4262768030166626, 0.5670876502990723, 0.7078984975814819, 0.8487093448638916, 0.9895201921463013, 1.130331039428711, 1.2711418867111206, 1.4119527339935303, 1.55276358127594, 1.6935744285583496, 1.8343852758407593, 1.975196123123169, 2.116006851196289, 2.2568178176879883, 2.3976287841796875, 2.5384395122528076, 2.6792502403259277, 2.820061206817627, 2.960872173309326, 3.1016829013824463, 3.2424936294555664, 3.3833045959472656, 3.524115562438965, 3.664926290512085, 3.805737018585205, 3.9465479850769043, 4.0873589515686035, 4.2281694412231445, 4.368980407714844, 4.509791374206543]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 4.0, 5.0, 4.0, 9.0, 4.0, 10.0, 10.0, 20.0, 27.0, 31.0, 44.0, 42.0, 72.0, 86.0, 141.0, 186.0, 291.0, 573.0, 1162.0, 2852.0, 9939.0, 49648.0, 470731.0, 449127.0, 48361.0, 9777.0, 2807.0, 1097.0, 506.0, 284.0, 226.0, 140.0, 94.0, 58.0, 44.0, 34.0, 37.0, 16.0, 19.0, 7.0, 5.0, 4.0, 8.0, 1.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.38671875, -6.15008544921875, -5.9134521484375, -5.67681884765625, -5.440185546875, -5.20355224609375, -4.9669189453125, -4.73028564453125, -4.49365234375, -4.25701904296875, -4.0203857421875, -3.78375244140625, -3.547119140625, -3.31048583984375, -3.0738525390625, -2.83721923828125, -2.6005859375, -2.36395263671875, -2.1273193359375, -1.89068603515625, -1.654052734375, -1.41741943359375, -1.1807861328125, -0.94415283203125, -0.70751953125, -0.47088623046875, -0.2342529296875, 0.00238037109375, 0.239013671875, 0.47564697265625, 0.7122802734375, 0.94891357421875, 1.185546875, 1.42218017578125, 1.6588134765625, 1.89544677734375, 2.132080078125, 2.36871337890625, 2.6053466796875, 2.84197998046875, 3.07861328125, 3.31524658203125, 3.5518798828125, 3.78851318359375, 4.025146484375, 4.26177978515625, 4.4984130859375, 4.73504638671875, 4.9716796875, 5.20831298828125, 5.4449462890625, 5.68157958984375, 5.918212890625, 6.15484619140625, 6.3914794921875, 6.62811279296875, 6.86474609375, 7.10137939453125, 7.3380126953125, 7.57464599609375, 7.811279296875, 8.04791259765625, 8.2845458984375, 8.52117919921875, 8.7578125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 10.0, 13.0, 20.0, 34.0, 40.0, 79.0, 90.0, 113.0, 118.0, 111.0, 99.0, 83.0, 79.0, 40.0, 35.0, 16.0, 13.0, 7.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8642578125, -1.8174896240234375, -1.770721435546875, -1.7239532470703125, -1.67718505859375, -1.6304168701171875, -1.583648681640625, -1.5368804931640625, -1.4901123046875, -1.4433441162109375, -1.396575927734375, -1.3498077392578125, -1.30303955078125, -1.2562713623046875, -1.209503173828125, -1.1627349853515625, -1.115966796875, -1.0691986083984375, -1.022430419921875, -0.9756622314453125, -0.92889404296875, -0.8821258544921875, -0.835357666015625, -0.7885894775390625, -0.7418212890625, -0.6950531005859375, -0.648284912109375, -0.6015167236328125, -0.55474853515625, -0.5079803466796875, -0.461212158203125, -0.4144439697265625, -0.36767578125, -0.3209075927734375, -0.274139404296875, -0.2273712158203125, -0.18060302734375, -0.1338348388671875, -0.087066650390625, -0.0402984619140625, 0.0064697265625, 0.0532379150390625, 0.100006103515625, 0.1467742919921875, 0.19354248046875, 0.2403106689453125, 0.287078857421875, 0.3338470458984375, 0.380615234375, 0.4273834228515625, 0.474151611328125, 0.5209197998046875, 0.56768798828125, 0.6144561767578125, 0.661224365234375, 0.7079925537109375, 0.7547607421875, 0.8015289306640625, 0.848297119140625, 0.8950653076171875, 0.94183349609375, 0.9886016845703125, 1.035369873046875, 1.0821380615234375, 1.12890625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 4.0, 0.0, 6.0, 6.0, 15.0, 10.0, 18.0, 25.0, 37.0, 48.0, 62.0, 111.0, 182.0, 315.0, 496.0, 824.0, 1678.0, 3114.0, 6576.0, 14697.0, 37467.0, 115752.0, 412144.0, 314975.0, 86827.0, 29617.0, 12138.0, 5418.0, 2736.0, 1351.0, 760.0, 411.0, 247.0, 158.0, 112.0, 83.0, 38.0, 32.0, 22.0, 19.0, 9.0, 5.0, 9.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.65625, -2.55743408203125, -2.4586181640625, -2.35980224609375, -2.260986328125, -2.16217041015625, -2.0633544921875, -1.96453857421875, -1.86572265625, -1.76690673828125, -1.6680908203125, -1.56927490234375, -1.470458984375, -1.37164306640625, -1.2728271484375, -1.17401123046875, -1.0751953125, -0.97637939453125, -0.8775634765625, -0.77874755859375, -0.679931640625, -0.58111572265625, -0.4822998046875, -0.38348388671875, -0.28466796875, -0.18585205078125, -0.0870361328125, 0.01177978515625, 0.110595703125, 0.20941162109375, 0.3082275390625, 0.40704345703125, 0.505859375, 0.60467529296875, 0.7034912109375, 0.80230712890625, 0.901123046875, 0.99993896484375, 1.0987548828125, 1.19757080078125, 1.29638671875, 1.39520263671875, 1.4940185546875, 1.59283447265625, 1.691650390625, 1.79046630859375, 1.8892822265625, 1.98809814453125, 2.0869140625, 2.18572998046875, 2.2845458984375, 2.38336181640625, 2.482177734375, 2.58099365234375, 2.6798095703125, 2.77862548828125, 2.87744140625, 2.97625732421875, 3.0750732421875, 3.17388916015625, 3.272705078125, 3.37152099609375, 3.4703369140625, 3.56915283203125, 3.66796875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 2.0, 7.0, 5.0, 5.0, 8.0, 13.0, 10.0, 10.0, 25.0, 15.0, 32.0, 19.0, 37.0, 25.0, 35.0, 36.0, 52.0, 40.0, 47.0, 54.0, 59.0, 49.0, 44.0, 42.0, 40.0, 36.0, 28.0, 37.0, 23.0, 24.0, 24.0, 16.0, 19.0, 17.0, 13.0, 12.0, 5.0, 9.0, 7.0, 3.0, 3.0, 4.0, 4.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-3.263671875, -3.17266845703125, -3.0816650390625, -2.99066162109375, -2.899658203125, -2.80865478515625, -2.7176513671875, -2.62664794921875, -2.53564453125, -2.44464111328125, -2.3536376953125, -2.26263427734375, -2.171630859375, -2.08062744140625, -1.9896240234375, -1.89862060546875, -1.8076171875, -1.71661376953125, -1.6256103515625, -1.53460693359375, -1.443603515625, -1.35260009765625, -1.2615966796875, -1.17059326171875, -1.07958984375, -0.98858642578125, -0.8975830078125, -0.80657958984375, -0.715576171875, -0.62457275390625, -0.5335693359375, -0.44256591796875, -0.3515625, -0.26055908203125, -0.1695556640625, -0.07855224609375, 0.012451171875, 0.10345458984375, 0.1944580078125, 0.28546142578125, 0.37646484375, 0.46746826171875, 0.5584716796875, 0.64947509765625, 0.740478515625, 0.83148193359375, 0.9224853515625, 1.01348876953125, 1.1044921875, 1.19549560546875, 1.2864990234375, 1.37750244140625, 1.468505859375, 1.55950927734375, 1.6505126953125, 1.74151611328125, 1.83251953125, 1.92352294921875, 2.0145263671875, 2.10552978515625, 2.196533203125, 2.28753662109375, 2.3785400390625, 2.46954345703125, 2.560546875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 2.0, 5.0, 12.0, 10.0, 11.0, 20.0, 24.0, 34.0, 58.0, 69.0, 98.0, 175.0, 270.0, 400.0, 780.0, 1568.0, 3321.0, 8562.0, 27594.0, 117833.0, 575363.0, 243454.0, 46196.0, 13351.0, 4689.0, 2159.0, 1019.0, 560.0, 361.0, 181.0, 114.0, 60.0, 55.0, 38.0, 27.0, 21.0, 12.0, 14.0, 11.0, 6.0, 2.0, 2.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.60546875, -1.5514068603515625, -1.497344970703125, -1.4432830810546875, -1.38922119140625, -1.3351593017578125, -1.281097412109375, -1.2270355224609375, -1.1729736328125, -1.1189117431640625, -1.064849853515625, -1.0107879638671875, -0.95672607421875, -0.9026641845703125, -0.848602294921875, -0.7945404052734375, -0.740478515625, -0.6864166259765625, -0.632354736328125, -0.5782928466796875, -0.52423095703125, -0.4701690673828125, -0.416107177734375, -0.3620452880859375, -0.3079833984375, -0.2539215087890625, -0.199859619140625, -0.1457977294921875, -0.09173583984375, -0.0376739501953125, 0.016387939453125, 0.0704498291015625, 0.12451171875, 0.1785736083984375, 0.232635498046875, 0.2866973876953125, 0.34075927734375, 0.3948211669921875, 0.448883056640625, 0.5029449462890625, 0.5570068359375, 0.6110687255859375, 0.665130615234375, 0.7191925048828125, 0.77325439453125, 0.8273162841796875, 0.881378173828125, 0.9354400634765625, 0.989501953125, 1.0435638427734375, 1.097625732421875, 1.1516876220703125, 1.20574951171875, 1.2598114013671875, 1.313873291015625, 1.3679351806640625, 1.4219970703125, 1.4760589599609375, 1.530120849609375, 1.5841827392578125, 1.63824462890625, 1.6923065185546875, 1.746368408203125, 1.8004302978515625, 1.8544921875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 2.0, 5.0, 4.0, 8.0, 9.0, 9.0, 8.0, 22.0, 24.0, 37.0, 39.0, 88.0, 117.0, 155.0, 152.0, 101.0, 67.0, 42.0, 24.0, 13.0, 18.0, 14.0, 15.0, 8.0, 7.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004165172576904297, -0.0004025474190711975, -0.00038857758045196533, -0.00037460774183273315, -0.000360637903213501, -0.0003466680645942688, -0.0003326982259750366, -0.00031872838735580444, -0.00030475854873657227, -0.0002907887101173401, -0.0002768188714981079, -0.00026284903287887573, -0.00024887919425964355, -0.00023490935564041138, -0.0002209395170211792, -0.00020696967840194702, -0.00019299983978271484, -0.00017903000116348267, -0.0001650601625442505, -0.0001510903239250183, -0.00013712048530578613, -0.00012315064668655396, -0.00010918080806732178, -9.52109694480896e-05, -8.124113082885742e-05, -6.727129220962524e-05, -5.3301453590393066e-05, -3.933161497116089e-05, -2.536177635192871e-05, -1.1391937732696533e-05, 2.5779008865356445e-06, 1.6547739505767822e-05, 3.0517578125e-05, 4.448741674423218e-05, 5.8457255363464355e-05, 7.242709398269653e-05, 8.639693260192871e-05, 0.00010036677122116089, 0.00011433660984039307, 0.00012830644845962524, 0.00014227628707885742, 0.0001562461256980896, 0.00017021596431732178, 0.00018418580293655396, 0.00019815564155578613, 0.0002121254801750183, 0.0002260953187942505, 0.00024006515741348267, 0.00025403499603271484, 0.000268004834651947, 0.0002819746732711792, 0.0002959445118904114, 0.00030991435050964355, 0.00032388418912887573, 0.0003378540277481079, 0.0003518238663673401, 0.00036579370498657227, 0.00037976354360580444, 0.0003937333822250366, 0.0004077032208442688, 0.000421673059463501, 0.00043564289808273315, 0.00044961273670196533, 0.0004635825753211975, 0.0004775524139404297]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 3.0, 5.0, 2.0, 3.0, 12.0, 7.0, 20.0, 15.0, 33.0, 46.0, 68.0, 108.0, 187.0, 308.0, 579.0, 1052.0, 2420.0, 6136.0, 19538.0, 91365.0, 571705.0, 290122.0, 45565.0, 11487.0, 3971.0, 1800.0, 897.0, 446.0, 247.0, 143.0, 95.0, 52.0, 47.0, 24.0, 20.0, 10.0, 10.0, 4.0, 1.0, 2.0, 6.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.111328125, -2.0569000244140625, -2.002471923828125, -1.9480438232421875, -1.89361572265625, -1.8391876220703125, -1.784759521484375, -1.7303314208984375, -1.6759033203125, -1.6214752197265625, -1.567047119140625, -1.5126190185546875, -1.45819091796875, -1.4037628173828125, -1.349334716796875, -1.2949066162109375, -1.240478515625, -1.1860504150390625, -1.131622314453125, -1.0771942138671875, -1.02276611328125, -0.9683380126953125, -0.913909912109375, -0.8594818115234375, -0.8050537109375, -0.7506256103515625, -0.696197509765625, -0.6417694091796875, -0.58734130859375, -0.5329132080078125, -0.478485107421875, -0.4240570068359375, -0.36962890625, -0.3152008056640625, -0.260772705078125, -0.2063446044921875, -0.15191650390625, -0.0974884033203125, -0.043060302734375, 0.0113677978515625, 0.0657958984375, 0.1202239990234375, 0.174652099609375, 0.2290802001953125, 0.28350830078125, 0.3379364013671875, 0.392364501953125, 0.4467926025390625, 0.501220703125, 0.5556488037109375, 0.610076904296875, 0.6645050048828125, 0.71893310546875, 0.7733612060546875, 0.827789306640625, 0.8822174072265625, 0.9366455078125, 0.9910736083984375, 1.045501708984375, 1.0999298095703125, 1.15435791015625, 1.2087860107421875, 1.263214111328125, 1.3176422119140625, 1.3720703125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 9.0, 9.0, 12.0, 23.0, 25.0, 31.0, 51.0, 59.0, 88.0, 107.0, 116.0, 102.0, 92.0, 67.0, 54.0, 46.0, 28.0, 25.0, 18.0, 7.0, 9.0, 6.0, 2.0, 0.0, 5.0, 4.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.36328125, -1.3189239501953125, -1.274566650390625, -1.2302093505859375, -1.18585205078125, -1.1414947509765625, -1.097137451171875, -1.0527801513671875, -1.0084228515625, -0.9640655517578125, -0.919708251953125, -0.8753509521484375, -0.83099365234375, -0.7866363525390625, -0.742279052734375, -0.6979217529296875, -0.653564453125, -0.6092071533203125, -0.564849853515625, -0.5204925537109375, -0.47613525390625, -0.4317779541015625, -0.387420654296875, -0.3430633544921875, -0.2987060546875, -0.2543487548828125, -0.209991455078125, -0.1656341552734375, -0.12127685546875, -0.0769195556640625, -0.032562255859375, 0.0117950439453125, 0.05615234375, 0.1005096435546875, 0.144866943359375, 0.1892242431640625, 0.23358154296875, 0.2779388427734375, 0.322296142578125, 0.3666534423828125, 0.4110107421875, 0.4553680419921875, 0.499725341796875, 0.5440826416015625, 0.58843994140625, 0.6327972412109375, 0.677154541015625, 0.7215118408203125, 0.765869140625, 0.8102264404296875, 0.854583740234375, 0.8989410400390625, 0.94329833984375, 0.9876556396484375, 1.032012939453125, 1.0763702392578125, 1.1207275390625, 1.1650848388671875, 1.209442138671875, 1.2537994384765625, 1.29815673828125, 1.3425140380859375, 1.386871337890625, 1.4312286376953125, 1.4755859375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 0.0, 7.0, 16.0, 96.0, 402.0, 381.0, 79.0, 24.0, 6.0, 1.0, 0.0, 1.0], "bins": [-163.84609985351562, -160.96719360351562, -158.0883026123047, -155.2093963623047, -152.33050537109375, -149.45159912109375, -146.5727081298828, -143.6938018798828, -140.81491088867188, -137.93600463867188, -135.05711364746094, -132.17820739746094, -129.29931640625, -126.42041778564453, -123.54151916503906, -120.6626205444336, -117.78372192382812, -114.90482330322266, -112.02592468261719, -109.14702606201172, -106.26812744140625, -103.38922882080078, -100.51033020019531, -97.63143157958984, -94.75252532958984, -91.87362670898438, -88.9947280883789, -86.11582946777344, -83.23693084716797, -80.3580322265625, -77.47913360595703, -74.60023498535156, -71.72134399414062, -68.84244537353516, -65.96354675292969, -63.08464813232422, -60.20574951171875, -57.32685089111328, -54.44795227050781, -51.569053649902344, -48.690147399902344, -45.811248779296875, -42.932350158691406, -40.05345153808594, -37.17455291748047, -34.295654296875, -31.4167537689209, -28.53785514831543, -25.658958435058594, -22.780059814453125, -19.901161193847656, -17.022262573242188, -14.143362998962402, -11.264464378356934, -8.385564804077148, -5.50666618347168, -2.627767562866211, 0.2511312961578369, 3.1300301551818848, 6.008929252624512, 8.88782787322998, 11.76672649383545, 14.645626068115234, 17.524524688720703, 20.403423309326172]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 6.0, 9.0, 9.0, 6.0, 6.0, 10.0, 16.0, 16.0, 24.0, 16.0, 13.0, 20.0, 33.0, 27.0, 25.0, 41.0, 46.0, 46.0, 48.0, 49.0, 46.0, 51.0, 43.0, 44.0, 34.0, 29.0, 30.0, 35.0, 36.0, 20.0, 36.0, 23.0, 16.0, 14.0, 10.0, 14.0, 9.0, 8.0, 6.0, 6.0, 4.0, 6.0, 4.0, 3.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 3.0], "bins": [-16.658592224121094, -16.147735595703125, -15.636880874633789, -15.12602424621582, -14.615168571472168, -14.104312896728516, -13.593456268310547, -13.082600593566895, -12.571744918823242, -12.06088924407959, -11.550033569335938, -11.039176940917969, -10.528321266174316, -10.017465591430664, -9.506608963012695, -8.995753288269043, -8.48489761352539, -7.974041938781738, -7.463185787200928, -6.952329635620117, -6.441473960876465, -5.9306182861328125, -5.419762134552002, -4.908905982971191, -4.398050308227539, -3.8871943950653076, -3.376338481903076, -2.8654825687408447, -2.3546266555786133, -1.8437707424163818, -1.3329148292541504, -0.822058916091919, -0.3112049102783203, 0.19965100288391113, 0.7105069160461426, 1.221362829208374, 1.7322187423706055, 2.243074655532837, 2.7539305686950684, 3.2647864818573, 3.7756423950195312, 4.286498069763184, 4.797354221343994, 5.308210372924805, 5.819066047668457, 6.329921722412109, 6.84077787399292, 7.3516340255737305, 7.862489700317383, 8.373345375061035, 8.884201049804688, 9.395057678222656, 9.905913352966309, 10.416769027709961, 10.92762565612793, 11.438481330871582, 11.949337005615234, 12.460192680358887, 12.971048355102539, 13.481904983520508, 13.99276065826416, 14.503616333007812, 15.014472961425781, 15.525328636169434, 16.036184310913086]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 4.0, 2.0, 3.0, 1.0, 3.0, 2.0, 10.0, 7.0, 10.0, 4.0, 7.0, 21.0, 13.0, 17.0, 19.0, 23.0, 34.0, 41.0, 41.0, 56.0, 67.0, 85.0, 182.0, 269.0, 535.0, 1267.0, 3139.0, 9761.0, 49327.0, 4038104.0, 72754.0, 11705.0, 3808.0, 1455.0, 655.0, 314.0, 191.0, 106.0, 72.0, 37.0, 44.0, 23.0, 17.0, 15.0, 13.0, 8.0, 4.0, 4.0, 3.0, 3.0, 4.0, 0.0, 0.0, 1.0], "bins": [-13.2890625, -12.9532470703125, -12.617431640625, -12.2816162109375, -11.94580078125, -11.6099853515625, -11.274169921875, -10.9383544921875, -10.6025390625, -10.2667236328125, -9.930908203125, -9.5950927734375, -9.25927734375, -8.9234619140625, -8.587646484375, -8.2518310546875, -7.916015625, -7.5802001953125, -7.244384765625, -6.9085693359375, -6.57275390625, -6.2369384765625, -5.901123046875, -5.5653076171875, -5.2294921875, -4.8936767578125, -4.557861328125, -4.2220458984375, -3.88623046875, -3.5504150390625, -3.214599609375, -2.8787841796875, -2.54296875, -2.2071533203125, -1.871337890625, -1.5355224609375, -1.19970703125, -0.8638916015625, -0.528076171875, -0.1922607421875, 0.1435546875, 0.4793701171875, 0.815185546875, 1.1510009765625, 1.48681640625, 1.8226318359375, 2.158447265625, 2.4942626953125, 2.830078125, 3.1658935546875, 3.501708984375, 3.8375244140625, 4.17333984375, 4.5091552734375, 4.844970703125, 5.1807861328125, 5.5166015625, 5.8524169921875, 6.188232421875, 6.5240478515625, 6.85986328125, 7.1956787109375, 7.531494140625, 7.8673095703125, 8.203125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 2.0, 11.0, 13.0, 16.0, 27.0, 36.0, 45.0, 53.0, 73.0, 89.0, 89.0, 107.0, 88.0, 83.0, 75.0, 60.0, 47.0, 28.0, 19.0, 17.0, 9.0, 9.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7119140625, -1.6672515869140625, -1.622589111328125, -1.5779266357421875, -1.53326416015625, -1.4886016845703125, -1.443939208984375, -1.3992767333984375, -1.3546142578125, -1.3099517822265625, -1.265289306640625, -1.2206268310546875, -1.17596435546875, -1.1313018798828125, -1.086639404296875, -1.0419769287109375, -0.997314453125, -0.9526519775390625, -0.907989501953125, -0.8633270263671875, -0.81866455078125, -0.7740020751953125, -0.729339599609375, -0.6846771240234375, -0.6400146484375, -0.5953521728515625, -0.550689697265625, -0.5060272216796875, -0.46136474609375, -0.4167022705078125, -0.372039794921875, -0.3273773193359375, -0.28271484375, -0.2380523681640625, -0.193389892578125, -0.1487274169921875, -0.10406494140625, -0.0594024658203125, -0.014739990234375, 0.0299224853515625, 0.0745849609375, 0.1192474365234375, 0.163909912109375, 0.2085723876953125, 0.25323486328125, 0.2978973388671875, 0.342559814453125, 0.3872222900390625, 0.431884765625, 0.4765472412109375, 0.521209716796875, 0.5658721923828125, 0.61053466796875, 0.6551971435546875, 0.699859619140625, 0.7445220947265625, 0.7891845703125, 0.8338470458984375, 0.878509521484375, 0.9231719970703125, 0.96783447265625, 1.0124969482421875, 1.057159423828125, 1.1018218994140625, 1.146484375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 9.0, 4.0, 14.0, 24.0, 29.0, 55.0, 50.0, 82.0, 182.0, 309.0, 559.0, 1232.0, 2962.0, 8207.0, 30413.0, 340601.0, 3736659.0, 53523.0, 12118.0, 4021.0, 1599.0, 732.0, 393.0, 205.0, 121.0, 57.0, 38.0, 24.0, 16.0, 11.0, 11.0, 9.0, 3.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.3984375, -6.1539306640625, -5.909423828125, -5.6649169921875, -5.42041015625, -5.1759033203125, -4.931396484375, -4.6868896484375, -4.4423828125, -4.1978759765625, -3.953369140625, -3.7088623046875, -3.46435546875, -3.2198486328125, -2.975341796875, -2.7308349609375, -2.486328125, -2.2418212890625, -1.997314453125, -1.7528076171875, -1.50830078125, -1.2637939453125, -1.019287109375, -0.7747802734375, -0.5302734375, -0.2857666015625, -0.041259765625, 0.2032470703125, 0.44775390625, 0.6922607421875, 0.936767578125, 1.1812744140625, 1.42578125, 1.6702880859375, 1.914794921875, 2.1593017578125, 2.40380859375, 2.6483154296875, 2.892822265625, 3.1373291015625, 3.3818359375, 3.6263427734375, 3.870849609375, 4.1153564453125, 4.35986328125, 4.6043701171875, 4.848876953125, 5.0933837890625, 5.337890625, 5.5823974609375, 5.826904296875, 6.0714111328125, 6.31591796875, 6.5604248046875, 6.804931640625, 7.0494384765625, 7.2939453125, 7.5384521484375, 7.782958984375, 8.0274658203125, 8.27197265625, 8.5164794921875, 8.760986328125, 9.0054931640625, 9.25]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 5.0, 7.0, 8.0, 17.0, 12.0, 13.0, 32.0, 50.0, 71.0, 167.0, 911.0, 2331.0, 218.0, 84.0, 54.0, 31.0, 19.0, 14.0, 9.0, 4.0, 7.0, 2.0, 1.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.19921875, -4.104034423828125, -4.00885009765625, -3.913665771484375, -3.8184814453125, -3.723297119140625, -3.62811279296875, -3.532928466796875, -3.437744140625, -3.342559814453125, -3.24737548828125, -3.152191162109375, -3.0570068359375, -2.961822509765625, -2.86663818359375, -2.771453857421875, -2.67626953125, -2.581085205078125, -2.48590087890625, -2.390716552734375, -2.2955322265625, -2.200347900390625, -2.10516357421875, -2.009979248046875, -1.914794921875, -1.819610595703125, -1.72442626953125, -1.629241943359375, -1.5340576171875, -1.438873291015625, -1.34368896484375, -1.248504638671875, -1.1533203125, -1.058135986328125, -0.96295166015625, -0.867767333984375, -0.7725830078125, -0.677398681640625, -0.58221435546875, -0.487030029296875, -0.391845703125, -0.296661376953125, -0.20147705078125, -0.106292724609375, -0.0111083984375, 0.084075927734375, 0.17926025390625, 0.274444580078125, 0.36962890625, 0.464813232421875, 0.55999755859375, 0.655181884765625, 0.7503662109375, 0.845550537109375, 0.94073486328125, 1.035919189453125, 1.131103515625, 1.226287841796875, 1.32147216796875, 1.416656494140625, 1.5118408203125, 1.607025146484375, 1.70220947265625, 1.797393798828125, 1.892578125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 5.0, 12.0, 5.0, 17.0, 27.0, 63.0, 83.0, 142.0, 204.0, 178.0, 133.0, 52.0, 41.0, 15.0, 6.0, 5.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.175186157226562, -19.668771743774414, -19.162357330322266, -18.655942916870117, -18.14952850341797, -17.643112182617188, -17.13669776916504, -16.63028335571289, -16.123868942260742, -15.617454528808594, -15.111040115356445, -14.60462474822998, -14.098210334777832, -13.591795921325684, -13.085380554199219, -12.57896614074707, -12.072551727294922, -11.566137313842773, -11.059722900390625, -10.55330753326416, -10.046893119812012, -9.540478706359863, -9.034063339233398, -8.52764892578125, -8.021234512329102, -7.514820098876953, -7.0084052085876465, -6.50199031829834, -5.995575904846191, -5.489161491394043, -4.982746601104736, -4.47633171081543, -3.969916343688965, -3.4635016918182373, -2.9570870399475098, -2.4506723880767822, -1.9442577362060547, -1.4378430843353271, -0.9314284324645996, -0.42501378059387207, 0.08140087127685547, 0.587815523147583, 1.0942301750183105, 1.600644826889038, 2.1070594787597656, 2.613474130630493, 3.1198887825012207, 3.6263034343719482, 4.132718086242676, 4.639132499694824, 5.145547389984131, 5.6519622802734375, 6.158376693725586, 6.664791107177734, 7.171205997467041, 7.677620887756348, 8.184035301208496, 8.690449714660645, 9.19686508178711, 9.703279495239258, 10.209693908691406, 10.716108322143555, 11.222522735595703, 11.728938102722168, 12.235352516174316]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 6.0, 5.0, 4.0, 6.0, 7.0, 8.0, 12.0, 17.0, 12.0, 23.0, 28.0, 23.0, 22.0, 45.0, 45.0, 52.0, 48.0, 53.0, 53.0, 47.0, 57.0, 55.0, 44.0, 49.0, 38.0, 45.0, 32.0, 24.0, 30.0, 30.0, 15.0, 12.0, 13.0, 24.0, 8.0, 5.0, 2.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.596019268035889, -5.365468502044678, -5.134917259216309, -4.904366493225098, -4.6738152503967285, -4.443264484405518, -4.212713241577148, -3.9821624755859375, -3.7516114711761475, -3.5210604667663574, -3.2905094623565674, -3.0599584579467773, -2.8294076919555664, -2.5988564491271973, -2.3683056831359863, -2.1377546787261963, -1.9072036743164062, -1.6766526699066162, -1.4461016654968262, -1.2155507802963257, -0.9849997758865356, -0.7544487714767456, -0.5238978862762451, -0.2933468818664551, -0.06279587745666504, 0.1677550971508026, 0.39830607175827026, 0.6288570165634155, 0.8594080209732056, 1.0899590253829956, 1.320509910583496, 1.5510609149932861, 1.7816123962402344, 2.0121634006500244, 2.2427144050598145, 2.4732651710510254, 2.7038164138793945, 2.9343671798706055, 3.1649181842803955, 3.3954691886901855, 3.6260201930999756, 3.8565711975097656, 4.087121963500977, 4.317673206329346, 4.548223972320557, 4.778775215148926, 5.009325981140137, 5.239876747131348, 5.470427989959717, 5.700978755950928, 5.931529998779297, 6.162080764770508, 6.392632007598877, 6.623182773590088, 6.853734016418457, 7.084284782409668, 7.314835548400879, 7.54538631439209, 7.775937557220459, 8.006488800048828, 8.237039566040039, 8.46759033203125, 8.698141098022461, 8.928691864013672, 9.1592435836792]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 0.0, 5.0, 17.0, 13.0, 22.0, 33.0, 44.0, 59.0, 135.0, 234.0, 502.0, 1130.0, 4868.0, 36163.0, 860690.0, 130830.0, 10361.0, 2049.0, 678.0, 316.0, 160.0, 90.0, 41.0, 38.0, 21.0, 12.0, 11.0, 17.0, 2.0, 4.0, 0.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.5, -10.0916748046875, -9.683349609375, -9.2750244140625, -8.86669921875, -8.4583740234375, -8.050048828125, -7.6417236328125, -7.2333984375, -6.8250732421875, -6.416748046875, -6.0084228515625, -5.60009765625, -5.1917724609375, -4.783447265625, -4.3751220703125, -3.966796875, -3.5584716796875, -3.150146484375, -2.7418212890625, -2.33349609375, -1.9251708984375, -1.516845703125, -1.1085205078125, -0.7001953125, -0.2918701171875, 0.116455078125, 0.5247802734375, 0.93310546875, 1.3414306640625, 1.749755859375, 2.1580810546875, 2.56640625, 2.9747314453125, 3.383056640625, 3.7913818359375, 4.19970703125, 4.6080322265625, 5.016357421875, 5.4246826171875, 5.8330078125, 6.2413330078125, 6.649658203125, 7.0579833984375, 7.46630859375, 7.8746337890625, 8.282958984375, 8.6912841796875, 9.099609375, 9.5079345703125, 9.916259765625, 10.3245849609375, 10.73291015625, 11.1412353515625, 11.549560546875, 11.9578857421875, 12.3662109375, 12.7745361328125, 13.182861328125, 13.5911865234375, 13.99951171875, 14.4078369140625, 14.816162109375, 15.2244873046875, 15.6328125]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 11.0, 20.0, 21.0, 32.0, 30.0, 58.0, 65.0, 82.0, 111.0, 106.0, 100.0, 78.0, 82.0, 71.0, 42.0, 26.0, 26.0, 16.0, 12.0, 1.0, 3.0, 6.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8740234375, -1.826690673828125, -1.77935791015625, -1.732025146484375, -1.6846923828125, -1.637359619140625, -1.59002685546875, -1.542694091796875, -1.495361328125, -1.448028564453125, -1.40069580078125, -1.353363037109375, -1.3060302734375, -1.258697509765625, -1.21136474609375, -1.164031982421875, -1.11669921875, -1.069366455078125, -1.02203369140625, -0.974700927734375, -0.9273681640625, -0.880035400390625, -0.83270263671875, -0.785369873046875, -0.738037109375, -0.690704345703125, -0.64337158203125, -0.596038818359375, -0.5487060546875, -0.501373291015625, -0.45404052734375, -0.406707763671875, -0.359375, -0.312042236328125, -0.26470947265625, -0.217376708984375, -0.1700439453125, -0.122711181640625, -0.07537841796875, -0.028045654296875, 0.019287109375, 0.066619873046875, 0.11395263671875, 0.161285400390625, 0.2086181640625, 0.255950927734375, 0.30328369140625, 0.350616455078125, 0.39794921875, 0.445281982421875, 0.49261474609375, 0.539947509765625, 0.5872802734375, 0.634613037109375, 0.68194580078125, 0.729278564453125, 0.776611328125, 0.823944091796875, 0.87127685546875, 0.918609619140625, 0.9659423828125, 1.013275146484375, 1.06060791015625, 1.107940673828125, 1.1552734375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 4.0, 5.0, 3.0, 10.0, 9.0, 12.0, 18.0, 27.0, 26.0, 39.0, 40.0, 74.0, 93.0, 145.0, 212.0, 334.0, 538.0, 932.0, 1802.0, 3622.0, 7689.0, 18222.0, 49942.0, 181667.0, 555042.0, 153113.0, 44087.0, 16310.0, 6885.0, 3458.0, 1731.0, 914.0, 550.0, 319.0, 210.0, 139.0, 86.0, 70.0, 45.0, 34.0, 31.0, 17.0, 19.0, 7.0, 5.0, 6.0, 4.0, 7.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0], "bins": [-3.5, -3.39837646484375, -3.2967529296875, -3.19512939453125, -3.093505859375, -2.99188232421875, -2.8902587890625, -2.78863525390625, -2.68701171875, -2.58538818359375, -2.4837646484375, -2.38214111328125, -2.280517578125, -2.17889404296875, -2.0772705078125, -1.97564697265625, -1.8740234375, -1.77239990234375, -1.6707763671875, -1.56915283203125, -1.467529296875, -1.36590576171875, -1.2642822265625, -1.16265869140625, -1.06103515625, -0.95941162109375, -0.8577880859375, -0.75616455078125, -0.654541015625, -0.55291748046875, -0.4512939453125, -0.34967041015625, -0.248046875, -0.14642333984375, -0.0447998046875, 0.05682373046875, 0.158447265625, 0.26007080078125, 0.3616943359375, 0.46331787109375, 0.56494140625, 0.66656494140625, 0.7681884765625, 0.86981201171875, 0.971435546875, 1.07305908203125, 1.1746826171875, 1.27630615234375, 1.3779296875, 1.47955322265625, 1.5811767578125, 1.68280029296875, 1.784423828125, 1.88604736328125, 1.9876708984375, 2.08929443359375, 2.19091796875, 2.29254150390625, 2.3941650390625, 2.49578857421875, 2.597412109375, 2.69903564453125, 2.8006591796875, 2.90228271484375, 3.00390625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 6.0, 1.0, 7.0, 14.0, 15.0, 18.0, 25.0, 32.0, 23.0, 33.0, 36.0, 38.0, 39.0, 38.0, 53.0, 54.0, 50.0, 44.0, 50.0, 57.0, 52.0, 49.0, 46.0, 45.0, 34.0, 25.0, 22.0, 29.0, 18.0, 13.0, 8.0, 6.0, 1.0, 7.0, 2.0, 2.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.626953125, -3.5125732421875, -3.398193359375, -3.2838134765625, -3.16943359375, -3.0550537109375, -2.940673828125, -2.8262939453125, -2.7119140625, -2.5975341796875, -2.483154296875, -2.3687744140625, -2.25439453125, -2.1400146484375, -2.025634765625, -1.9112548828125, -1.796875, -1.6824951171875, -1.568115234375, -1.4537353515625, -1.33935546875, -1.2249755859375, -1.110595703125, -0.9962158203125, -0.8818359375, -0.7674560546875, -0.653076171875, -0.5386962890625, -0.42431640625, -0.3099365234375, -0.195556640625, -0.0811767578125, 0.033203125, 0.1475830078125, 0.261962890625, 0.3763427734375, 0.49072265625, 0.6051025390625, 0.719482421875, 0.8338623046875, 0.9482421875, 1.0626220703125, 1.177001953125, 1.2913818359375, 1.40576171875, 1.5201416015625, 1.634521484375, 1.7489013671875, 1.86328125, 1.9776611328125, 2.092041015625, 2.2064208984375, 2.32080078125, 2.4351806640625, 2.549560546875, 2.6639404296875, 2.7783203125, 2.8927001953125, 3.007080078125, 3.1214599609375, 3.23583984375, 3.3502197265625, 3.464599609375, 3.5789794921875, 3.693359375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 4.0, 7.0, 4.0, 15.0, 23.0, 32.0, 50.0, 99.0, 185.0, 367.0, 852.0, 2473.0, 10883.0, 127834.0, 857846.0, 38888.0, 6100.0, 1690.0, 619.0, 256.0, 138.0, 61.0, 40.0, 27.0, 16.0, 15.0, 8.0, 8.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.658203125, -3.537506103515625, -3.41680908203125, -3.296112060546875, -3.1754150390625, -3.054718017578125, -2.93402099609375, -2.813323974609375, -2.692626953125, -2.571929931640625, -2.45123291015625, -2.330535888671875, -2.2098388671875, -2.089141845703125, -1.96844482421875, -1.847747802734375, -1.72705078125, -1.606353759765625, -1.48565673828125, -1.364959716796875, -1.2442626953125, -1.123565673828125, -1.00286865234375, -0.882171630859375, -0.761474609375, -0.640777587890625, -0.52008056640625, -0.399383544921875, -0.2786865234375, -0.157989501953125, -0.03729248046875, 0.083404541015625, 0.2041015625, 0.324798583984375, 0.44549560546875, 0.566192626953125, 0.6868896484375, 0.807586669921875, 0.92828369140625, 1.048980712890625, 1.169677734375, 1.290374755859375, 1.41107177734375, 1.531768798828125, 1.6524658203125, 1.773162841796875, 1.89385986328125, 2.014556884765625, 2.13525390625, 2.255950927734375, 2.37664794921875, 2.497344970703125, 2.6180419921875, 2.738739013671875, 2.85943603515625, 2.980133056640625, 3.100830078125, 3.221527099609375, 3.34222412109375, 3.462921142578125, 3.5836181640625, 3.704315185546875, 3.82501220703125, 3.945709228515625, 4.06640625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 0.0, 3.0, 7.0, 9.0, 21.0, 27.0, 33.0, 82.0, 184.0, 273.0, 165.0, 92.0, 44.0, 19.0, 15.0, 9.0, 10.0, 4.0, 4.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005245208740234375, -0.0005054250359535217, -0.00048632919788360596, -0.0004672333598136902, -0.0004481375217437744, -0.00042904168367385864, -0.00040994584560394287, -0.0003908500075340271, -0.00037175416946411133, -0.00035265833139419556, -0.0003335624933242798, -0.000314466655254364, -0.00029537081718444824, -0.00027627497911453247, -0.0002571791410446167, -0.00023808330297470093, -0.00021898746490478516, -0.00019989162683486938, -0.0001807957887649536, -0.00016169995069503784, -0.00014260411262512207, -0.0001235082745552063, -0.00010441243648529053, -8.531659841537476e-05, -6.622076034545898e-05, -4.712492227554321e-05, -2.802908420562744e-05, -8.93324613571167e-06, 1.0162591934204102e-05, 2.9258430004119873e-05, 4.8354268074035645e-05, 6.745010614395142e-05, 8.654594421386719e-05, 0.00010564178228378296, 0.00012473762035369873, 0.0001438334584236145, 0.00016292929649353027, 0.00018202513456344604, 0.00020112097263336182, 0.0002202168107032776, 0.00023931264877319336, 0.00025840848684310913, 0.0002775043249130249, 0.0002966001629829407, 0.00031569600105285645, 0.0003347918391227722, 0.000353887677192688, 0.00037298351526260376, 0.00039207935333251953, 0.0004111751914024353, 0.0004302710294723511, 0.00044936686754226685, 0.0004684627056121826, 0.0004875585436820984, 0.0005066543817520142, 0.0005257502198219299, 0.0005448460578918457, 0.0005639418959617615, 0.0005830377340316772, 0.000602133572101593, 0.0006212294101715088, 0.0006403252482414246, 0.0006594210863113403, 0.0006785169243812561, 0.0006976127624511719]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 6.0, 7.0, 12.0, 21.0, 21.0, 44.0, 44.0, 61.0, 119.0, 200.0, 481.0, 1578.0, 8545.0, 188721.0, 828651.0, 16272.0, 2456.0, 651.0, 262.0, 141.0, 93.0, 57.0, 49.0, 19.0, 16.0, 8.0, 2.0, 6.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.96484375, -3.813232421875, -3.66162109375, -3.510009765625, -3.3583984375, -3.206787109375, -3.05517578125, -2.903564453125, -2.751953125, -2.600341796875, -2.44873046875, -2.297119140625, -2.1455078125, -1.993896484375, -1.84228515625, -1.690673828125, -1.5390625, -1.387451171875, -1.23583984375, -1.084228515625, -0.9326171875, -0.781005859375, -0.62939453125, -0.477783203125, -0.326171875, -0.174560546875, -0.02294921875, 0.128662109375, 0.2802734375, 0.431884765625, 0.58349609375, 0.735107421875, 0.88671875, 1.038330078125, 1.18994140625, 1.341552734375, 1.4931640625, 1.644775390625, 1.79638671875, 1.947998046875, 2.099609375, 2.251220703125, 2.40283203125, 2.554443359375, 2.7060546875, 2.857666015625, 3.00927734375, 3.160888671875, 3.3125, 3.464111328125, 3.61572265625, 3.767333984375, 3.9189453125, 4.070556640625, 4.22216796875, 4.373779296875, 4.525390625, 4.677001953125, 4.82861328125, 4.980224609375, 5.1318359375, 5.283447265625, 5.43505859375, 5.586669921875, 5.73828125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 7.0, 5.0, 15.0, 19.0, 59.0, 179.0, 443.0, 187.0, 50.0, 20.0, 12.0, 8.0, 4.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.734375, -5.5814208984375, -5.428466796875, -5.2755126953125, -5.12255859375, -4.9696044921875, -4.816650390625, -4.6636962890625, -4.5107421875, -4.3577880859375, -4.204833984375, -4.0518798828125, -3.89892578125, -3.7459716796875, -3.593017578125, -3.4400634765625, -3.287109375, -3.1341552734375, -2.981201171875, -2.8282470703125, -2.67529296875, -2.5223388671875, -2.369384765625, -2.2164306640625, -2.0634765625, -1.9105224609375, -1.757568359375, -1.6046142578125, -1.45166015625, -1.2987060546875, -1.145751953125, -0.9927978515625, -0.83984375, -0.6868896484375, -0.533935546875, -0.3809814453125, -0.22802734375, -0.0750732421875, 0.077880859375, 0.2308349609375, 0.3837890625, 0.5367431640625, 0.689697265625, 0.8426513671875, 0.99560546875, 1.1485595703125, 1.301513671875, 1.4544677734375, 1.607421875, 1.7603759765625, 1.913330078125, 2.0662841796875, 2.21923828125, 2.3721923828125, 2.525146484375, 2.6781005859375, 2.8310546875, 2.9840087890625, 3.136962890625, 3.2899169921875, 3.44287109375, 3.5958251953125, 3.748779296875, 3.9017333984375, 4.0546875]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 8.0, 13.0, 19.0, 67.0, 110.0, 194.0, 189.0, 157.0, 112.0, 60.0, 34.0, 22.0, 10.0, 4.0, 6.0, 0.0, 2.0, 2.0, 3.0], "bins": [-59.06610107421875, -57.913002014160156, -56.75990295410156, -55.60680389404297, -54.453704833984375, -53.30060577392578, -52.14750671386719, -50.99440383911133, -49.841304779052734, -48.68820571899414, -47.53510665893555, -46.38200759887695, -45.22890853881836, -44.0758056640625, -42.922706604003906, -41.76960754394531, -40.61650848388672, -39.463409423828125, -38.31031036376953, -37.15721130371094, -36.004112243652344, -34.85101318359375, -33.697914123535156, -32.5448112487793, -31.39171600341797, -30.238616943359375, -29.08551788330078, -27.932418823242188, -26.77931785583496, -25.626218795776367, -24.473119735717773, -23.320018768310547, -22.166919708251953, -21.01382064819336, -19.860721588134766, -18.707622528076172, -17.554521560668945, -16.40142250061035, -15.248323440551758, -14.095223426818848, -12.942124366760254, -11.78902530670166, -10.63592529296875, -9.482826232910156, -8.329727172851562, -7.176627159118652, -6.023528099060059, -4.870428085327148, -3.7173290252685547, -2.5642294883728027, -1.4111301898956299, -0.25803089141845703, 0.8950686454772949, 2.048168182373047, 3.2012672424316406, 4.354367256164551, 5.5074663162231445, 6.6605658531188965, 7.813665390014648, 8.966764450073242, 10.119863510131836, 11.272963523864746, 12.42606258392334, 13.57916259765625, 14.732261657714844]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 6.0, 8.0, 6.0, 16.0, 15.0, 26.0, 26.0, 23.0, 30.0, 22.0, 30.0, 29.0, 41.0, 37.0, 56.0, 41.0, 42.0, 46.0, 39.0, 51.0, 45.0, 33.0, 32.0, 36.0, 27.0, 31.0, 33.0, 28.0, 20.0, 25.0, 14.0, 21.0, 11.0, 10.0, 11.0, 10.0, 2.0, 7.0, 7.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.634029388427734, -16.133546829223633, -15.633064270019531, -15.13258171081543, -14.632099151611328, -14.131616592407227, -13.631133079528809, -13.130650520324707, -12.630167961120605, -12.129685401916504, -11.629202842712402, -11.1287202835083, -10.628236770629883, -10.127754211425781, -9.62727165222168, -9.126789093017578, -8.626306533813477, -8.125823974609375, -7.625341415405273, -7.124858379364014, -6.624375820159912, -6.1238932609558105, -5.623410224914551, -5.122927665710449, -4.622445106506348, -4.121962547302246, -3.6214797496795654, -3.1209969520568848, -2.620514392852783, -2.1200318336486816, -1.619549036026001, -1.1190662384033203, -0.6185817718505859, -0.11809909343719482, 0.3823835849761963, 0.8828662633895874, 1.3833489418029785, 1.88383150100708, 2.3843142986297607, 2.8847970962524414, 3.385279655456543, 3.8857622146606445, 4.386244773864746, 4.886727809906006, 5.387210369110107, 5.887692928314209, 6.388175964355469, 6.88865852355957, 7.389141082763672, 7.889623641967773, 8.390106201171875, 8.890588760375977, 9.391071319580078, 9.89155387878418, 10.392037391662598, 10.8925199508667, 11.3930025100708, 11.893485069274902, 12.393967628479004, 12.894450187683105, 13.394933700561523, 13.895416259765625, 14.395898818969727, 14.896381378173828, 15.39686393737793]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 5.0, 2.0, 4.0, 8.0, 5.0, 7.0, 3.0, 1.0, 7.0, 9.0, 14.0, 14.0, 21.0, 27.0, 45.0, 86.0, 111.0, 186.0, 567.0, 1565.0, 5225.0, 35587.0, 4105473.0, 37296.0, 5293.0, 1621.0, 591.0, 216.0, 127.0, 63.0, 27.0, 30.0, 18.0, 12.0, 10.0, 8.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-17.09375, -16.6717529296875, -16.249755859375, -15.8277587890625, -15.40576171875, -14.9837646484375, -14.561767578125, -14.1397705078125, -13.7177734375, -13.2957763671875, -12.873779296875, -12.4517822265625, -12.02978515625, -11.6077880859375, -11.185791015625, -10.7637939453125, -10.341796875, -9.9197998046875, -9.497802734375, -9.0758056640625, -8.65380859375, -8.2318115234375, -7.809814453125, -7.3878173828125, -6.9658203125, -6.5438232421875, -6.121826171875, -5.6998291015625, -5.27783203125, -4.8558349609375, -4.433837890625, -4.0118408203125, -3.58984375, -3.1678466796875, -2.745849609375, -2.3238525390625, -1.90185546875, -1.4798583984375, -1.057861328125, -0.6358642578125, -0.2138671875, 0.2081298828125, 0.630126953125, 1.0521240234375, 1.47412109375, 1.8961181640625, 2.318115234375, 2.7401123046875, 3.162109375, 3.5841064453125, 4.006103515625, 4.4281005859375, 4.85009765625, 5.2720947265625, 5.694091796875, 6.1160888671875, 6.5380859375, 6.9600830078125, 7.382080078125, 7.8040771484375, 8.22607421875, 8.6480712890625, 9.070068359375, 9.4920654296875, 9.9140625]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 7.0, 13.0, 11.0, 20.0, 29.0, 30.0, 43.0, 53.0, 79.0, 72.0, 92.0, 98.0, 70.0, 87.0, 93.0, 56.0, 53.0, 33.0, 25.0, 15.0, 10.0, 12.0, 4.0, 3.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.884765625, -1.8371429443359375, -1.789520263671875, -1.7418975830078125, -1.69427490234375, -1.6466522216796875, -1.599029541015625, -1.5514068603515625, -1.5037841796875, -1.4561614990234375, -1.408538818359375, -1.3609161376953125, -1.31329345703125, -1.2656707763671875, -1.218048095703125, -1.1704254150390625, -1.122802734375, -1.0751800537109375, -1.027557373046875, -0.9799346923828125, -0.93231201171875, -0.8846893310546875, -0.837066650390625, -0.7894439697265625, -0.7418212890625, -0.6941986083984375, -0.646575927734375, -0.5989532470703125, -0.55133056640625, -0.5037078857421875, -0.456085205078125, -0.4084625244140625, -0.36083984375, -0.3132171630859375, -0.265594482421875, -0.2179718017578125, -0.17034912109375, -0.1227264404296875, -0.075103759765625, -0.0274810791015625, 0.0201416015625, 0.0677642822265625, 0.115386962890625, 0.1630096435546875, 0.21063232421875, 0.2582550048828125, 0.305877685546875, 0.3535003662109375, 0.401123046875, 0.4487457275390625, 0.496368408203125, 0.5439910888671875, 0.59161376953125, 0.6392364501953125, 0.686859130859375, 0.7344818115234375, 0.7821044921875, 0.8297271728515625, 0.877349853515625, 0.9249725341796875, 0.97259521484375, 1.0202178955078125, 1.067840576171875, 1.1154632568359375, 1.1630859375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 7.0, 6.0, 5.0, 11.0, 6.0, 16.0, 38.0, 43.0, 54.0, 72.0, 100.0, 155.0, 245.0, 361.0, 545.0, 794.0, 1325.0, 2311.0, 3839.0, 7082.0, 14463.0, 39211.0, 256737.0, 3743239.0, 78326.0, 22609.0, 9997.0, 5131.0, 2908.0, 1676.0, 1033.0, 646.0, 415.0, 257.0, 194.0, 102.0, 93.0, 78.0, 50.0, 27.0, 17.0, 17.0, 15.0, 14.0, 6.0, 2.0, 5.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-4.26953125, -4.12835693359375, -3.9871826171875, -3.84600830078125, -3.704833984375, -3.56365966796875, -3.4224853515625, -3.28131103515625, -3.14013671875, -2.99896240234375, -2.8577880859375, -2.71661376953125, -2.575439453125, -2.43426513671875, -2.2930908203125, -2.15191650390625, -2.0107421875, -1.86956787109375, -1.7283935546875, -1.58721923828125, -1.446044921875, -1.30487060546875, -1.1636962890625, -1.02252197265625, -0.88134765625, -0.74017333984375, -0.5989990234375, -0.45782470703125, -0.316650390625, -0.17547607421875, -0.0343017578125, 0.10687255859375, 0.248046875, 0.38922119140625, 0.5303955078125, 0.67156982421875, 0.812744140625, 0.95391845703125, 1.0950927734375, 1.23626708984375, 1.37744140625, 1.51861572265625, 1.6597900390625, 1.80096435546875, 1.942138671875, 2.08331298828125, 2.2244873046875, 2.36566162109375, 2.5068359375, 2.64801025390625, 2.7891845703125, 2.93035888671875, 3.071533203125, 3.21270751953125, 3.3538818359375, 3.49505615234375, 3.63623046875, 3.77740478515625, 3.9185791015625, 4.05975341796875, 4.200927734375, 4.34210205078125, 4.4832763671875, 4.62445068359375, 4.765625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 3.0, 6.0, 2.0, 6.0, 4.0, 5.0, 6.0, 5.0, 6.0, 10.0, 19.0, 34.0, 41.0, 63.0, 207.0, 2882.0, 469.0, 127.0, 53.0, 23.0, 33.0, 16.0, 14.0, 9.0, 8.0, 3.0, 6.0, 3.0, 2.0, 4.0, 3.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.33203125, -2.262908935546875, -2.19378662109375, -2.124664306640625, -2.0555419921875, -1.986419677734375, -1.91729736328125, -1.848175048828125, -1.779052734375, -1.709930419921875, -1.64080810546875, -1.571685791015625, -1.5025634765625, -1.433441162109375, -1.36431884765625, -1.295196533203125, -1.22607421875, -1.156951904296875, -1.08782958984375, -1.018707275390625, -0.9495849609375, -0.880462646484375, -0.81134033203125, -0.742218017578125, -0.673095703125, -0.603973388671875, -0.53485107421875, -0.465728759765625, -0.3966064453125, -0.327484130859375, -0.25836181640625, -0.189239501953125, -0.1201171875, -0.050994873046875, 0.01812744140625, 0.087249755859375, 0.1563720703125, 0.225494384765625, 0.29461669921875, 0.363739013671875, 0.432861328125, 0.501983642578125, 0.57110595703125, 0.640228271484375, 0.7093505859375, 0.778472900390625, 0.84759521484375, 0.916717529296875, 0.98583984375, 1.054962158203125, 1.12408447265625, 1.193206787109375, 1.2623291015625, 1.331451416015625, 1.40057373046875, 1.469696044921875, 1.538818359375, 1.607940673828125, 1.67706298828125, 1.746185302734375, 1.8153076171875, 1.884429931640625, 1.95355224609375, 2.022674560546875, 2.091796875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 4.0, 4.0, 8.0, 17.0, 23.0, 41.0, 71.0, 95.0, 136.0, 189.0, 135.0, 105.0, 63.0, 35.0, 30.0, 13.0, 11.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.80157470703125, -9.445779800415039, -9.089984893798828, -8.734189987182617, -8.378395080566406, -8.022600173950195, -7.666804790496826, -7.311009883880615, -6.955214977264404, -6.599420070648193, -6.243625164031982, -5.887829780578613, -5.532034873962402, -5.176239967346191, -4.8204450607299805, -4.4646501541137695, -4.108855247497559, -3.7530603408813477, -3.3972654342651367, -3.0414702892303467, -2.6856753826141357, -2.329880475997925, -1.9740853309631348, -1.6182904243469238, -1.262495517730713, -0.9067005515098572, -0.5509055852890015, -0.19511055946350098, 0.16068434715270996, 0.5164792537689209, 0.8722743988037109, 1.2280693054199219, 1.5838651657104492, 1.9396600723266602, 2.295454978942871, 2.651250123977661, 3.007045030593872, 3.362839937210083, 3.718635082244873, 4.074429988861084, 4.430224895477295, 4.786019802093506, 5.141814708709717, 5.497610092163086, 5.853404998779297, 6.209199905395508, 6.564994812011719, 6.92078971862793, 7.276584625244141, 7.632379531860352, 7.9881744384765625, 8.343969345092773, 8.699764251708984, 9.055559158325195, 9.411354064941406, 9.767148971557617, 10.122943878173828, 10.478738784790039, 10.83453369140625, 11.190328598022461, 11.546123504638672, 11.901918411254883, 12.257713317871094, 12.613508224487305, 12.969304084777832]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 4.0, 5.0, 4.0, 3.0, 1.0, 5.0, 4.0, 6.0, 10.0, 9.0, 8.0, 13.0, 12.0, 26.0, 21.0, 15.0, 32.0, 27.0, 35.0, 24.0, 36.0, 42.0, 39.0, 48.0, 38.0, 38.0, 45.0, 44.0, 40.0, 34.0, 43.0, 35.0, 34.0, 37.0, 25.0, 21.0, 25.0, 13.0, 18.0, 18.0, 15.0, 12.0, 9.0, 9.0, 4.0, 3.0, 7.0, 1.0, 3.0, 7.0, 5.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.343256950378418, -4.184394836425781, -4.0255327224731445, -3.8666703701019287, -3.707808256149292, -3.5489461421966553, -3.3900837898254395, -3.2312216758728027, -3.072359561920166, -2.9134974479675293, -2.7546353340148926, -2.5957729816436768, -2.43691086769104, -2.2780487537384033, -2.1191864013671875, -1.9603242874145508, -1.801462173461914, -1.6426000595092773, -1.483737826347351, -1.3248755931854248, -1.166013479232788, -1.0071513652801514, -0.8482891321182251, -0.6894268989562988, -0.5305647850036621, -0.3717026114463806, -0.21284043788909912, -0.05397826433181763, 0.10488390922546387, 0.26374608278274536, 0.42260825634002686, 0.5814704895019531, 0.740333080291748, 0.8991952538490295, 1.058057427406311, 1.2169196605682373, 1.375781774520874, 1.5346438884735107, 1.693506121635437, 1.8523683547973633, 2.01123046875, 2.1700925827026367, 2.3289546966552734, 2.4878170490264893, 2.646679162979126, 2.8055412769317627, 2.9644036293029785, 3.1232657432556152, 3.282127857208252, 3.4409899711608887, 3.5998520851135254, 3.758714437484741, 3.917576551437378, 4.076438903808594, 4.2353010177612305, 4.394163131713867, 4.553025245666504, 4.711887359619141, 4.870749473571777, 5.029611587524414, 5.188473701477051, 5.347336292266846, 5.506198406219482, 5.665060520172119, 5.823922634124756]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 12.0, 8.0, 7.0, 10.0, 20.0, 45.0, 54.0, 101.0, 167.0, 364.0, 804.0, 2706.0, 14783.0, 312132.0, 689839.0, 22110.0, 3484.0, 979.0, 426.0, 199.0, 115.0, 66.0, 45.0, 26.0, 10.0, 10.0, 12.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 2.0, 1.0], "bins": [-14.09375, -13.7237548828125, -13.353759765625, -12.9837646484375, -12.61376953125, -12.2437744140625, -11.873779296875, -11.5037841796875, -11.1337890625, -10.7637939453125, -10.393798828125, -10.0238037109375, -9.65380859375, -9.2838134765625, -8.913818359375, -8.5438232421875, -8.173828125, -7.8038330078125, -7.433837890625, -7.0638427734375, -6.69384765625, -6.3238525390625, -5.953857421875, -5.5838623046875, -5.2138671875, -4.8438720703125, -4.473876953125, -4.1038818359375, -3.73388671875, -3.3638916015625, -2.993896484375, -2.6239013671875, -2.25390625, -1.8839111328125, -1.513916015625, -1.1439208984375, -0.77392578125, -0.4039306640625, -0.033935546875, 0.3360595703125, 0.7060546875, 1.0760498046875, 1.446044921875, 1.8160400390625, 2.18603515625, 2.5560302734375, 2.926025390625, 3.2960205078125, 3.666015625, 4.0360107421875, 4.406005859375, 4.7760009765625, 5.14599609375, 5.5159912109375, 5.885986328125, 6.2559814453125, 6.6259765625, 6.9959716796875, 7.365966796875, 7.7359619140625, 8.10595703125, 8.4759521484375, 8.845947265625, 9.2159423828125, 9.5859375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 7.0, 11.0, 20.0, 27.0, 24.0, 34.0, 61.0, 67.0, 81.0, 101.0, 85.0, 78.0, 86.0, 75.0, 80.0, 50.0, 38.0, 22.0, 14.0, 20.0, 10.0, 4.0, 3.0, 1.0, 3.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.87109375, -1.82293701171875, -1.7747802734375, -1.72662353515625, -1.678466796875, -1.63031005859375, -1.5821533203125, -1.53399658203125, -1.48583984375, -1.43768310546875, -1.3895263671875, -1.34136962890625, -1.293212890625, -1.24505615234375, -1.1968994140625, -1.14874267578125, -1.1005859375, -1.05242919921875, -1.0042724609375, -0.95611572265625, -0.907958984375, -0.85980224609375, -0.8116455078125, -0.76348876953125, -0.71533203125, -0.66717529296875, -0.6190185546875, -0.57086181640625, -0.522705078125, -0.47454833984375, -0.4263916015625, -0.37823486328125, -0.330078125, -0.28192138671875, -0.2337646484375, -0.18560791015625, -0.137451171875, -0.08929443359375, -0.0411376953125, 0.00701904296875, 0.05517578125, 0.10333251953125, 0.1514892578125, 0.19964599609375, 0.247802734375, 0.29595947265625, 0.3441162109375, 0.39227294921875, 0.4404296875, 0.48858642578125, 0.5367431640625, 0.58489990234375, 0.633056640625, 0.68121337890625, 0.7293701171875, 0.77752685546875, 0.82568359375, 0.87384033203125, 0.9219970703125, 0.97015380859375, 1.018310546875, 1.06646728515625, 1.1146240234375, 1.16278076171875, 1.2109375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 4.0, 11.0, 11.0, 24.0, 40.0, 61.0, 98.0, 159.0, 231.0, 496.0, 929.0, 2079.0, 4648.0, 11175.0, 31728.0, 114240.0, 561352.0, 237333.0, 53903.0, 17406.0, 6702.0, 2965.0, 1374.0, 697.0, 328.0, 215.0, 134.0, 80.0, 39.0, 33.0, 12.0, 11.0, 8.0, 6.0, 5.0, 0.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0], "bins": [-3.3828125, -3.272705078125, -3.16259765625, -3.052490234375, -2.9423828125, -2.832275390625, -2.72216796875, -2.612060546875, -2.501953125, -2.391845703125, -2.28173828125, -2.171630859375, -2.0615234375, -1.951416015625, -1.84130859375, -1.731201171875, -1.62109375, -1.510986328125, -1.40087890625, -1.290771484375, -1.1806640625, -1.070556640625, -0.96044921875, -0.850341796875, -0.740234375, -0.630126953125, -0.52001953125, -0.409912109375, -0.2998046875, -0.189697265625, -0.07958984375, 0.030517578125, 0.140625, 0.250732421875, 0.36083984375, 0.470947265625, 0.5810546875, 0.691162109375, 0.80126953125, 0.911376953125, 1.021484375, 1.131591796875, 1.24169921875, 1.351806640625, 1.4619140625, 1.572021484375, 1.68212890625, 1.792236328125, 1.90234375, 2.012451171875, 2.12255859375, 2.232666015625, 2.3427734375, 2.452880859375, 2.56298828125, 2.673095703125, 2.783203125, 2.893310546875, 3.00341796875, 3.113525390625, 3.2236328125, 3.333740234375, 3.44384765625, 3.553955078125, 3.6640625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 7.0, 3.0, 5.0, 5.0, 1.0, 11.0, 8.0, 15.0, 13.0, 16.0, 22.0, 19.0, 25.0, 21.0, 28.0, 28.0, 36.0, 37.0, 47.0, 45.0, 39.0, 42.0, 44.0, 38.0, 54.0, 58.0, 32.0, 34.0, 39.0, 24.0, 31.0, 35.0, 19.0, 13.0, 18.0, 23.0, 11.0, 14.0, 15.0, 7.0, 8.0, 8.0, 8.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-3.75390625, -3.65057373046875, -3.5472412109375, -3.44390869140625, -3.340576171875, -3.23724365234375, -3.1339111328125, -3.03057861328125, -2.92724609375, -2.82391357421875, -2.7205810546875, -2.61724853515625, -2.513916015625, -2.41058349609375, -2.3072509765625, -2.20391845703125, -2.1005859375, -1.99725341796875, -1.8939208984375, -1.79058837890625, -1.687255859375, -1.58392333984375, -1.4805908203125, -1.37725830078125, -1.27392578125, -1.17059326171875, -1.0672607421875, -0.96392822265625, -0.860595703125, -0.75726318359375, -0.6539306640625, -0.55059814453125, -0.447265625, -0.34393310546875, -0.2406005859375, -0.13726806640625, -0.033935546875, 0.06939697265625, 0.1727294921875, 0.27606201171875, 0.37939453125, 0.48272705078125, 0.5860595703125, 0.68939208984375, 0.792724609375, 0.89605712890625, 0.9993896484375, 1.10272216796875, 1.2060546875, 1.30938720703125, 1.4127197265625, 1.51605224609375, 1.619384765625, 1.72271728515625, 1.8260498046875, 1.92938232421875, 2.03271484375, 2.13604736328125, 2.2393798828125, 2.34271240234375, 2.446044921875, 2.54937744140625, 2.6527099609375, 2.75604248046875, 2.859375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 1.0, 8.0, 9.0, 9.0, 20.0, 33.0, 40.0, 73.0, 116.0, 201.0, 462.0, 1041.0, 2841.0, 9824.0, 63134.0, 887241.0, 68268.0, 10193.0, 2892.0, 1097.0, 499.0, 232.0, 119.0, 68.0, 42.0, 28.0, 15.0, 8.0, 6.0, 4.0, 10.0, 4.0, 6.0, 1.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.5234375, -4.402862548828125, -4.28228759765625, -4.161712646484375, -4.0411376953125, -3.920562744140625, -3.79998779296875, -3.679412841796875, -3.558837890625, -3.438262939453125, -3.31768798828125, -3.197113037109375, -3.0765380859375, -2.955963134765625, -2.83538818359375, -2.714813232421875, -2.59423828125, -2.473663330078125, -2.35308837890625, -2.232513427734375, -2.1119384765625, -1.991363525390625, -1.87078857421875, -1.750213623046875, -1.629638671875, -1.509063720703125, -1.38848876953125, -1.267913818359375, -1.1473388671875, -1.026763916015625, -0.90618896484375, -0.785614013671875, -0.6650390625, -0.544464111328125, -0.42388916015625, -0.303314208984375, -0.1827392578125, -0.062164306640625, 0.05841064453125, 0.178985595703125, 0.299560546875, 0.420135498046875, 0.54071044921875, 0.661285400390625, 0.7818603515625, 0.902435302734375, 1.02301025390625, 1.143585205078125, 1.26416015625, 1.384735107421875, 1.50531005859375, 1.625885009765625, 1.7464599609375, 1.867034912109375, 1.98760986328125, 2.108184814453125, 2.228759765625, 2.349334716796875, 2.46990966796875, 2.590484619140625, 2.7110595703125, 2.831634521484375, 2.95220947265625, 3.072784423828125, 3.193359375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 3.0, 7.0, 19.0, 25.0, 35.0, 78.0, 194.0, 349.0, 155.0, 63.0, 24.0, 13.0, 15.0, 8.0, 7.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0010242462158203125, -0.001001652330160141, -0.0009790584444999695, -0.000956464558839798, -0.0009338706731796265, -0.000911276787519455, -0.0008886829018592834, -0.0008660890161991119, -0.0008434951305389404, -0.0008209012448787689, -0.0007983073592185974, -0.0007757134735584259, -0.0007531195878982544, -0.0007305257022380829, -0.0007079318165779114, -0.0006853379309177399, -0.0006627440452575684, -0.0006401501595973969, -0.0006175562739372253, -0.0005949623882770538, -0.0005723685026168823, -0.0005497746169567108, -0.0005271807312965393, -0.0005045868456363678, -0.0004819929599761963, -0.0004593990743160248, -0.00043680518865585327, -0.00041421130299568176, -0.00039161741733551025, -0.00036902353167533875, -0.00034642964601516724, -0.00032383576035499573, -0.0003012418746948242, -0.0002786479890346527, -0.0002560541033744812, -0.0002334602177143097, -0.00021086633205413818, -0.00018827244639396667, -0.00016567856073379517, -0.00014308467507362366, -0.00012049078941345215, -9.789690375328064e-05, -7.530301809310913e-05, -5.270913243293762e-05, -3.0115246772766113e-05, -7.5213611125946045e-06, 1.5072524547576904e-05, 3.766641020774841e-05, 6.026029586791992e-05, 8.285418152809143e-05, 0.00010544806718826294, 0.00012804195284843445, 0.00015063583850860596, 0.00017322972416877747, 0.00019582360982894897, 0.00021841749548912048, 0.000241011381149292, 0.0002636052668094635, 0.000286199152469635, 0.0003087930381298065, 0.00033138692378997803, 0.00035398080945014954, 0.00037657469511032104, 0.00039916858077049255, 0.00042176246643066406]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 6.0, 5.0, 9.0, 17.0, 24.0, 28.0, 53.0, 105.0, 151.0, 331.0, 601.0, 1408.0, 3355.0, 11965.0, 153834.0, 844813.0, 23212.0, 5072.0, 1854.0, 771.0, 402.0, 214.0, 133.0, 67.0, 40.0, 29.0, 18.0, 15.0, 7.0, 4.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.74609375, -5.599456787109375, -5.45281982421875, -5.306182861328125, -5.1595458984375, -5.012908935546875, -4.86627197265625, -4.719635009765625, -4.572998046875, -4.426361083984375, -4.27972412109375, -4.133087158203125, -3.9864501953125, -3.839813232421875, -3.69317626953125, -3.546539306640625, -3.39990234375, -3.253265380859375, -3.10662841796875, -2.959991455078125, -2.8133544921875, -2.666717529296875, -2.52008056640625, -2.373443603515625, -2.226806640625, -2.080169677734375, -1.93353271484375, -1.786895751953125, -1.6402587890625, -1.493621826171875, -1.34698486328125, -1.200347900390625, -1.0537109375, -0.907073974609375, -0.76043701171875, -0.613800048828125, -0.4671630859375, -0.320526123046875, -0.17388916015625, -0.027252197265625, 0.119384765625, 0.266021728515625, 0.41265869140625, 0.559295654296875, 0.7059326171875, 0.852569580078125, 0.99920654296875, 1.145843505859375, 1.29248046875, 1.439117431640625, 1.58575439453125, 1.732391357421875, 1.8790283203125, 2.025665283203125, 2.17230224609375, 2.318939208984375, 2.465576171875, 2.612213134765625, 2.75885009765625, 2.905487060546875, 3.0521240234375, 3.198760986328125, 3.34539794921875, 3.492034912109375, 3.638671875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 7.0, 5.0, 9.0, 8.0, 8.0, 16.0, 23.0, 51.0, 67.0, 156.0, 261.0, 175.0, 80.0, 41.0, 30.0, 16.0, 13.0, 6.0, 5.0, 5.0, 4.0, 1.0, 5.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.080078125, -1.9920654296875, -1.904052734375, -1.8160400390625, -1.72802734375, -1.6400146484375, -1.552001953125, -1.4639892578125, -1.3759765625, -1.2879638671875, -1.199951171875, -1.1119384765625, -1.02392578125, -0.9359130859375, -0.847900390625, -0.7598876953125, -0.671875, -0.5838623046875, -0.495849609375, -0.4078369140625, -0.31982421875, -0.2318115234375, -0.143798828125, -0.0557861328125, 0.0322265625, 0.1202392578125, 0.208251953125, 0.2962646484375, 0.38427734375, 0.4722900390625, 0.560302734375, 0.6483154296875, 0.736328125, 0.8243408203125, 0.912353515625, 1.0003662109375, 1.08837890625, 1.1763916015625, 1.264404296875, 1.3524169921875, 1.4404296875, 1.5284423828125, 1.616455078125, 1.7044677734375, 1.79248046875, 1.8804931640625, 1.968505859375, 2.0565185546875, 2.14453125, 2.2325439453125, 2.320556640625, 2.4085693359375, 2.49658203125, 2.5845947265625, 2.672607421875, 2.7606201171875, 2.8486328125, 2.9366455078125, 3.024658203125, 3.1126708984375, 3.20068359375, 3.2886962890625, 3.376708984375, 3.4647216796875, 3.552734375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 7.0, 15.0, 74.0, 199.0, 337.0, 218.0, 103.0, 32.0, 15.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.05762481689453, -81.14897155761719, -79.24031829833984, -77.3316650390625, -75.42301177978516, -73.51435852050781, -71.60570526123047, -69.69705200195312, -67.78840637207031, -65.87975311279297, -63.971099853515625, -62.06244659423828, -60.15379333496094, -58.245140075683594, -56.336490631103516, -54.42783737182617, -52.51918029785156, -50.61052703857422, -48.701873779296875, -46.79322052001953, -44.88456726074219, -42.975914001464844, -41.067264556884766, -39.15861129760742, -37.24995803833008, -35.341304779052734, -33.43265151977539, -31.52400016784668, -29.615346908569336, -27.706693649291992, -25.79804229736328, -23.889389038085938, -21.980735778808594, -20.07208251953125, -18.163429260253906, -16.254777908325195, -14.346124649047852, -12.437471389770508, -10.52881908416748, -8.620166778564453, -6.711513519287109, -4.802860736846924, -2.8942079544067383, -0.9855551719665527, 0.9230976104736328, 2.8317508697509766, 4.740403175354004, 6.649055480957031, 8.557708740234375, 10.466361999511719, 12.375014305114746, 14.283666610717773, 16.192319869995117, 18.10097312927246, 20.009624481201172, 21.918277740478516, 23.82693099975586, 25.735584259033203, 27.644237518310547, 29.552888870239258, 31.4615421295166, 33.37019348144531, 35.278846740722656, 37.1875, 39.096153259277344]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 4.0, 2.0, 7.0, 7.0, 3.0, 8.0, 11.0, 7.0, 12.0, 22.0, 14.0, 17.0, 20.0, 22.0, 10.0, 16.0, 26.0, 40.0, 35.0, 39.0, 30.0, 38.0, 42.0, 31.0, 40.0, 29.0, 51.0, 38.0, 43.0, 29.0, 38.0, 35.0, 29.0, 31.0, 30.0, 23.0, 21.0, 20.0, 10.0, 22.0, 8.0, 10.0, 8.0, 6.0, 6.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0], "bins": [-13.920467376708984, -13.482731819152832, -13.044995307922363, -12.607259750366211, -12.169523239135742, -11.73178768157959, -11.294052124023438, -10.856315612792969, -10.4185791015625, -9.980843544006348, -9.543107032775879, -9.105371475219727, -8.667634963989258, -8.229899406433105, -7.792163372039795, -7.354427337646484, -6.916691780090332, -6.4789557456970215, -6.041219711303711, -5.603484153747559, -5.16574764251709, -4.7280120849609375, -4.290276050567627, -3.8525400161743164, -3.414803981781006, -2.9770679473876953, -2.5393319129943848, -2.1015961170196533, -1.6638600826263428, -1.2261240482330322, -0.7883882522583008, -0.35065221786499023, 0.0870828628540039, 0.5248188376426697, 0.9625548124313354, 1.4002907276153564, 1.838026762008667, 2.2757627964019775, 2.713498592376709, 3.1512346267700195, 3.58897066116333, 4.026706695556641, 4.464442729949951, 4.902178764343262, 5.339914321899414, 5.777650833129883, 6.215386390686035, 6.653122425079346, 7.090858459472656, 7.528594493865967, 7.966330528259277, 8.40406608581543, 8.841802597045898, 9.27953815460205, 9.717273712158203, 10.155010223388672, 10.59274673461914, 11.030482292175293, 11.468218803405762, 11.905954360961914, 12.343690872192383, 12.781426429748535, 13.219161987304688, 13.656898498535156, 14.094634056091309]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 4.0, 3.0, 4.0, 6.0, 10.0, 5.0, 9.0, 17.0, 12.0, 15.0, 21.0, 28.0, 56.0, 47.0, 103.0, 132.0, 315.0, 743.0, 2148.0, 7209.0, 36555.0, 4038083.0, 91605.0, 11863.0, 3190.0, 1086.0, 479.0, 200.0, 122.0, 76.0, 37.0, 31.0, 23.0, 8.0, 14.0, 8.0, 4.0, 4.0, 0.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-16.734375, -16.3126220703125, -15.890869140625, -15.4691162109375, -15.04736328125, -14.6256103515625, -14.203857421875, -13.7821044921875, -13.3603515625, -12.9385986328125, -12.516845703125, -12.0950927734375, -11.67333984375, -11.2515869140625, -10.829833984375, -10.4080810546875, -9.986328125, -9.5645751953125, -9.142822265625, -8.7210693359375, -8.29931640625, -7.8775634765625, -7.455810546875, -7.0340576171875, -6.6123046875, -6.1905517578125, -5.768798828125, -5.3470458984375, -4.92529296875, -4.5035400390625, -4.081787109375, -3.6600341796875, -3.23828125, -2.8165283203125, -2.394775390625, -1.9730224609375, -1.55126953125, -1.1295166015625, -0.707763671875, -0.2860107421875, 0.1357421875, 0.5574951171875, 0.979248046875, 1.4010009765625, 1.82275390625, 2.2445068359375, 2.666259765625, 3.0880126953125, 3.509765625, 3.9315185546875, 4.353271484375, 4.7750244140625, 5.19677734375, 5.6185302734375, 6.040283203125, 6.4620361328125, 6.8837890625, 7.3055419921875, 7.727294921875, 8.1490478515625, 8.57080078125, 8.9925537109375, 9.414306640625, 9.8360595703125, 10.2578125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 7.0, 5.0, 5.0, 17.0, 16.0, 15.0, 29.0, 38.0, 47.0, 60.0, 74.0, 69.0, 91.0, 81.0, 68.0, 79.0, 73.0, 62.0, 51.0, 39.0, 20.0, 19.0, 12.0, 11.0, 11.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7470703125, -1.7003631591796875, -1.653656005859375, -1.6069488525390625, -1.56024169921875, -1.5135345458984375, -1.466827392578125, -1.4201202392578125, -1.3734130859375, -1.3267059326171875, -1.279998779296875, -1.2332916259765625, -1.18658447265625, -1.1398773193359375, -1.093170166015625, -1.0464630126953125, -0.999755859375, -0.9530487060546875, -0.906341552734375, -0.8596343994140625, -0.81292724609375, -0.7662200927734375, -0.719512939453125, -0.6728057861328125, -0.6260986328125, -0.5793914794921875, -0.532684326171875, -0.4859771728515625, -0.43927001953125, -0.3925628662109375, -0.345855712890625, -0.2991485595703125, -0.25244140625, -0.2057342529296875, -0.159027099609375, -0.1123199462890625, -0.06561279296875, -0.0189056396484375, 0.027801513671875, 0.0745086669921875, 0.1212158203125, 0.1679229736328125, 0.214630126953125, 0.2613372802734375, 0.30804443359375, 0.3547515869140625, 0.401458740234375, 0.4481658935546875, 0.494873046875, 0.5415802001953125, 0.588287353515625, 0.6349945068359375, 0.68170166015625, 0.7284088134765625, 0.775115966796875, 0.8218231201171875, 0.8685302734375, 0.9152374267578125, 0.961944580078125, 1.0086517333984375, 1.05535888671875, 1.1020660400390625, 1.148773193359375, 1.1954803466796875, 1.2421875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 5.0, 1.0, 2.0, 6.0, 11.0, 14.0, 18.0, 28.0, 29.0, 45.0, 65.0, 110.0, 150.0, 189.0, 309.0, 443.0, 827.0, 1419.0, 2745.0, 5344.0, 12362.0, 34020.0, 163122.0, 3817841.0, 107365.0, 27148.0, 10289.0, 4641.0, 2305.0, 1338.0, 748.0, 440.0, 294.0, 180.0, 124.0, 78.0, 50.0, 50.0, 35.0, 28.0, 18.0, 16.0, 10.0, 4.0, 7.0, 5.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.45703125, -5.27752685546875, -5.0980224609375, -4.91851806640625, -4.739013671875, -4.55950927734375, -4.3800048828125, -4.20050048828125, -4.02099609375, -3.84149169921875, -3.6619873046875, -3.48248291015625, -3.302978515625, -3.12347412109375, -2.9439697265625, -2.76446533203125, -2.5849609375, -2.40545654296875, -2.2259521484375, -2.04644775390625, -1.866943359375, -1.68743896484375, -1.5079345703125, -1.32843017578125, -1.14892578125, -0.96942138671875, -0.7899169921875, -0.61041259765625, -0.430908203125, -0.25140380859375, -0.0718994140625, 0.10760498046875, 0.287109375, 0.46661376953125, 0.6461181640625, 0.82562255859375, 1.005126953125, 1.18463134765625, 1.3641357421875, 1.54364013671875, 1.72314453125, 1.90264892578125, 2.0821533203125, 2.26165771484375, 2.441162109375, 2.62066650390625, 2.8001708984375, 2.97967529296875, 3.1591796875, 3.33868408203125, 3.5181884765625, 3.69769287109375, 3.877197265625, 4.05670166015625, 4.2362060546875, 4.41571044921875, 4.59521484375, 4.77471923828125, 4.9542236328125, 5.13372802734375, 5.313232421875, 5.49273681640625, 5.6722412109375, 5.85174560546875, 6.03125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 5.0, 4.0, 7.0, 7.0, 5.0, 14.0, 23.0, 20.0, 30.0, 51.0, 111.0, 429.0, 2929.0, 190.0, 77.0, 53.0, 34.0, 18.0, 11.0, 11.0, 8.0, 9.0, 5.0, 2.0, 7.0, 1.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.66015625, -2.580230712890625, -2.50030517578125, -2.420379638671875, -2.3404541015625, -2.260528564453125, -2.18060302734375, -2.100677490234375, -2.020751953125, -1.940826416015625, -1.86090087890625, -1.780975341796875, -1.7010498046875, -1.621124267578125, -1.54119873046875, -1.461273193359375, -1.38134765625, -1.301422119140625, -1.22149658203125, -1.141571044921875, -1.0616455078125, -0.981719970703125, -0.90179443359375, -0.821868896484375, -0.741943359375, -0.662017822265625, -0.58209228515625, -0.502166748046875, -0.4222412109375, -0.342315673828125, -0.26239013671875, -0.182464599609375, -0.1025390625, -0.022613525390625, 0.05731201171875, 0.137237548828125, 0.2171630859375, 0.297088623046875, 0.37701416015625, 0.456939697265625, 0.536865234375, 0.616790771484375, 0.69671630859375, 0.776641845703125, 0.8565673828125, 0.936492919921875, 1.01641845703125, 1.096343994140625, 1.17626953125, 1.256195068359375, 1.33612060546875, 1.416046142578125, 1.4959716796875, 1.575897216796875, 1.65582275390625, 1.735748291015625, 1.815673828125, 1.895599365234375, 1.97552490234375, 2.055450439453125, 2.1353759765625, 2.215301513671875, 2.29522705078125, 2.375152587890625, 2.455078125]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 8.0, 12.0, 33.0, 61.0, 148.0, 262.0, 244.0, 126.0, 51.0, 24.0, 11.0, 7.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.324113845825195, -23.756994247436523, -23.18987274169922, -22.622753143310547, -22.055631637573242, -21.48851203918457, -20.921390533447266, -20.354270935058594, -19.78714942932129, -19.220029830932617, -18.652908325195312, -18.08578872680664, -17.518667221069336, -16.951547622680664, -16.38442611694336, -15.817306518554688, -15.2501859664917, -14.683065414428711, -14.115944862365723, -13.548824310302734, -12.981703758239746, -12.414583206176758, -11.847463607788086, -11.280342102050781, -10.71322250366211, -10.146101951599121, -9.578981399536133, -9.011860847473145, -8.444740295410156, -7.877619743347168, -7.310499668121338, -6.74337911605835, -6.176258087158203, -5.609137535095215, -5.042016983032227, -4.474896430969238, -3.907776117324829, -3.340655565261841, -2.7735352516174316, -2.2064146995544434, -1.639294147491455, -1.0721735954284668, -0.5050531625747681, 0.062067270278930664, 0.629187822341919, 1.1963083744049072, 1.7634286880493164, 2.3305492401123047, 2.897669792175293, 3.4647903442382812, 4.0319108963012695, 4.599031448364258, 5.166152000427246, 5.733272552490234, 6.3003926277160645, 6.867513179779053, 7.434633731842041, 8.001753807067871, 8.56887435913086, 9.135994911193848, 9.703115463256836, 10.270236015319824, 10.837356567382812, 11.4044771194458, 11.971597671508789]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 2.0, 3.0, 3.0, 9.0, 11.0, 16.0, 14.0, 20.0, 31.0, 22.0, 35.0, 35.0, 41.0, 46.0, 42.0, 60.0, 66.0, 49.0, 59.0, 47.0, 53.0, 48.0, 62.0, 55.0, 35.0, 27.0, 14.0, 24.0, 20.0, 20.0, 10.0, 11.0, 7.0, 2.0, 3.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.483158588409424, -6.265747547149658, -6.048336505889893, -5.830925464630127, -5.613514423370361, -5.396103858947754, -5.178692817687988, -4.961281776428223, -4.743870735168457, -4.526459693908691, -4.309048652648926, -4.09163761138916, -3.8742268085479736, -3.656815767288208, -3.4394047260284424, -3.221993923187256, -3.004582643508911, -2.7871716022491455, -2.56976056098938, -2.3523497581481934, -2.1349387168884277, -1.917527675628662, -1.7001166343688965, -1.4827057123184204, -1.2652946710586548, -1.0478836297988892, -0.8304727077484131, -0.6130616664886475, -0.3956506848335266, -0.17823970317840576, 0.03917133808135986, 0.25658226013183594, 0.47399330139160156, 0.6914042830467224, 0.9088152647018433, 1.1262263059616089, 1.343637228012085, 1.5610482692718506, 1.7784593105316162, 1.9958702325820923, 2.2132811546325684, 2.430692195892334, 2.6481032371520996, 2.8655142784118652, 3.0829250812530518, 3.3003361225128174, 3.517747163772583, 3.7351579666137695, 3.9525692462921143, 4.169980049133301, 4.387391090393066, 4.604802131652832, 4.822213172912598, 5.039624214172363, 5.257035255432129, 5.4744462966918945, 5.69185733795166, 5.909268379211426, 6.126679420471191, 6.344090461730957, 6.561501502990723, 6.778912544250488, 6.996323585510254, 7.213734149932861, 7.431145191192627]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 1.0, 6.0, 8.0, 2.0, 4.0, 7.0, 10.0, 18.0, 16.0, 18.0, 39.0, 43.0, 80.0, 96.0, 165.0, 248.0, 484.0, 1021.0, 2342.0, 6329.0, 21104.0, 94924.0, 591379.0, 266460.0, 44881.0, 11693.0, 3909.0, 1564.0, 699.0, 372.0, 177.0, 123.0, 71.0, 74.0, 47.0, 31.0, 33.0, 16.0, 11.0, 15.0, 9.0, 6.0, 4.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-7.421875, -7.20208740234375, -6.9822998046875, -6.76251220703125, -6.542724609375, -6.32293701171875, -6.1031494140625, -5.88336181640625, -5.66357421875, -5.44378662109375, -5.2239990234375, -5.00421142578125, -4.784423828125, -4.56463623046875, -4.3448486328125, -4.12506103515625, -3.9052734375, -3.68548583984375, -3.4656982421875, -3.24591064453125, -3.026123046875, -2.80633544921875, -2.5865478515625, -2.36676025390625, -2.14697265625, -1.92718505859375, -1.7073974609375, -1.48760986328125, -1.267822265625, -1.04803466796875, -0.8282470703125, -0.60845947265625, -0.388671875, -0.16888427734375, 0.0509033203125, 0.27069091796875, 0.490478515625, 0.71026611328125, 0.9300537109375, 1.14984130859375, 1.36962890625, 1.58941650390625, 1.8092041015625, 2.02899169921875, 2.248779296875, 2.46856689453125, 2.6883544921875, 2.90814208984375, 3.1279296875, 3.34771728515625, 3.5675048828125, 3.78729248046875, 4.007080078125, 4.22686767578125, 4.4466552734375, 4.66644287109375, 4.88623046875, 5.10601806640625, 5.3258056640625, 5.54559326171875, 5.765380859375, 5.98516845703125, 6.2049560546875, 6.42474365234375, 6.64453125]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 3.0, 8.0, 10.0, 14.0, 15.0, 27.0, 36.0, 36.0, 48.0, 64.0, 86.0, 65.0, 89.0, 73.0, 65.0, 71.0, 65.0, 62.0, 45.0, 40.0, 22.0, 20.0, 14.0, 8.0, 6.0, 6.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.8291015625, -1.781097412109375, -1.73309326171875, -1.685089111328125, -1.6370849609375, -1.589080810546875, -1.54107666015625, -1.493072509765625, -1.445068359375, -1.397064208984375, -1.34906005859375, -1.301055908203125, -1.2530517578125, -1.205047607421875, -1.15704345703125, -1.109039306640625, -1.06103515625, -1.013031005859375, -0.96502685546875, -0.917022705078125, -0.8690185546875, -0.821014404296875, -0.77301025390625, -0.725006103515625, -0.677001953125, -0.628997802734375, -0.58099365234375, -0.532989501953125, -0.4849853515625, -0.436981201171875, -0.38897705078125, -0.340972900390625, -0.29296875, -0.244964599609375, -0.19696044921875, -0.148956298828125, -0.1009521484375, -0.052947998046875, -0.00494384765625, 0.043060302734375, 0.091064453125, 0.139068603515625, 0.18707275390625, 0.235076904296875, 0.2830810546875, 0.331085205078125, 0.37908935546875, 0.427093505859375, 0.47509765625, 0.523101806640625, 0.57110595703125, 0.619110107421875, 0.6671142578125, 0.715118408203125, 0.76312255859375, 0.811126708984375, 0.859130859375, 0.907135009765625, 0.95513916015625, 1.003143310546875, 1.0511474609375, 1.099151611328125, 1.14715576171875, 1.195159912109375, 1.2431640625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 6.0, 1.0, 7.0, 11.0, 8.0, 10.0, 14.0, 16.0, 20.0, 38.0, 63.0, 97.0, 143.0, 248.0, 510.0, 920.0, 1748.0, 3511.0, 7839.0, 18242.0, 49481.0, 166528.0, 511218.0, 194949.0, 55909.0, 20601.0, 8416.0, 3856.0, 1883.0, 979.0, 525.0, 286.0, 176.0, 101.0, 53.0, 44.0, 28.0, 21.0, 16.0, 13.0, 13.0, 3.0, 0.0, 4.0, 4.0, 1.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0703125, -3.949005126953125, -3.82769775390625, -3.706390380859375, -3.5850830078125, -3.463775634765625, -3.34246826171875, -3.221160888671875, -3.099853515625, -2.978546142578125, -2.85723876953125, -2.735931396484375, -2.6146240234375, -2.493316650390625, -2.37200927734375, -2.250701904296875, -2.12939453125, -2.008087158203125, -1.88677978515625, -1.765472412109375, -1.6441650390625, -1.522857666015625, -1.40155029296875, -1.280242919921875, -1.158935546875, -1.037628173828125, -0.91632080078125, -0.795013427734375, -0.6737060546875, -0.552398681640625, -0.43109130859375, -0.309783935546875, -0.1884765625, -0.067169189453125, 0.05413818359375, 0.175445556640625, 0.2967529296875, 0.418060302734375, 0.53936767578125, 0.660675048828125, 0.781982421875, 0.903289794921875, 1.02459716796875, 1.145904541015625, 1.2672119140625, 1.388519287109375, 1.50982666015625, 1.631134033203125, 1.75244140625, 1.873748779296875, 1.99505615234375, 2.116363525390625, 2.2376708984375, 2.358978271484375, 2.48028564453125, 2.601593017578125, 2.722900390625, 2.844207763671875, 2.96551513671875, 3.086822509765625, 3.2081298828125, 3.329437255859375, 3.45074462890625, 3.572052001953125, 3.693359375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 7.0, 12.0, 10.0, 8.0, 14.0, 10.0, 16.0, 19.0, 32.0, 23.0, 28.0, 39.0, 50.0, 47.0, 38.0, 42.0, 52.0, 54.0, 49.0, 56.0, 45.0, 53.0, 45.0, 27.0, 31.0, 28.0, 25.0, 25.0, 19.0, 22.0, 11.0, 11.0, 16.0, 5.0, 4.0, 8.0, 4.0, 2.0, 1.0, 3.0, 4.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4765625, -4.3333740234375, -4.190185546875, -4.0469970703125, -3.90380859375, -3.7606201171875, -3.617431640625, -3.4742431640625, -3.3310546875, -3.1878662109375, -3.044677734375, -2.9014892578125, -2.75830078125, -2.6151123046875, -2.471923828125, -2.3287353515625, -2.185546875, -2.0423583984375, -1.899169921875, -1.7559814453125, -1.61279296875, -1.4696044921875, -1.326416015625, -1.1832275390625, -1.0400390625, -0.8968505859375, -0.753662109375, -0.6104736328125, -0.46728515625, -0.3240966796875, -0.180908203125, -0.0377197265625, 0.10546875, 0.2486572265625, 0.391845703125, 0.5350341796875, 0.67822265625, 0.8214111328125, 0.964599609375, 1.1077880859375, 1.2509765625, 1.3941650390625, 1.537353515625, 1.6805419921875, 1.82373046875, 1.9669189453125, 2.110107421875, 2.2532958984375, 2.396484375, 2.5396728515625, 2.682861328125, 2.8260498046875, 2.96923828125, 3.1124267578125, 3.255615234375, 3.3988037109375, 3.5419921875, 3.6851806640625, 3.828369140625, 3.9715576171875, 4.11474609375, 4.2579345703125, 4.401123046875, 4.5443115234375, 4.6875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 0.0, 4.0, 3.0, 6.0, 8.0, 22.0, 10.0, 15.0, 28.0, 46.0, 64.0, 123.0, 192.0, 375.0, 684.0, 1636.0, 3951.0, 12443.0, 55162.0, 560452.0, 357627.0, 39715.0, 9815.0, 3358.0, 1443.0, 638.0, 283.0, 154.0, 105.0, 59.0, 32.0, 29.0, 20.0, 18.0, 12.0, 9.0, 3.0, 1.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-3.025390625, -2.941131591796875, -2.85687255859375, -2.772613525390625, -2.6883544921875, -2.604095458984375, -2.51983642578125, -2.435577392578125, -2.351318359375, -2.267059326171875, -2.18280029296875, -2.098541259765625, -2.0142822265625, -1.930023193359375, -1.84576416015625, -1.761505126953125, -1.67724609375, -1.592987060546875, -1.50872802734375, -1.424468994140625, -1.3402099609375, -1.255950927734375, -1.17169189453125, -1.087432861328125, -1.003173828125, -0.918914794921875, -0.83465576171875, -0.750396728515625, -0.6661376953125, -0.581878662109375, -0.49761962890625, -0.413360595703125, -0.3291015625, -0.244842529296875, -0.16058349609375, -0.076324462890625, 0.0079345703125, 0.092193603515625, 0.17645263671875, 0.260711669921875, 0.344970703125, 0.429229736328125, 0.51348876953125, 0.597747802734375, 0.6820068359375, 0.766265869140625, 0.85052490234375, 0.934783935546875, 1.01904296875, 1.103302001953125, 1.18756103515625, 1.271820068359375, 1.3560791015625, 1.440338134765625, 1.52459716796875, 1.608856201171875, 1.693115234375, 1.777374267578125, 1.86163330078125, 1.945892333984375, 2.0301513671875, 2.114410400390625, 2.19866943359375, 2.282928466796875, 2.3671875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 4.0, 6.0, 10.0, 11.0, 20.0, 42.0, 52.0, 81.0, 140.0, 209.0, 158.0, 94.0, 60.0, 42.0, 28.0, 11.0, 15.0, 8.0, 7.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005521774291992188, -0.0005362518131732941, -0.0005203261971473694, -0.0005044005811214447, -0.00048847496509552, -0.00047254934906959534, -0.00045662373304367065, -0.00044069811701774597, -0.0004247725009918213, -0.0004088468849658966, -0.0003929212689399719, -0.00037699565291404724, -0.00036107003688812256, -0.0003451444208621979, -0.0003292188048362732, -0.0003132931888103485, -0.00029736757278442383, -0.00028144195675849915, -0.00026551634073257446, -0.0002495907247066498, -0.0002336651086807251, -0.00021773949265480042, -0.00020181387662887573, -0.00018588826060295105, -0.00016996264457702637, -0.00015403702855110168, -0.000138111412525177, -0.00012218579649925232, -0.00010626018047332764, -9.033456444740295e-05, -7.440894842147827e-05, -5.848333239555359e-05, -4.2557716369628906e-05, -2.6632100343704224e-05, -1.0706484317779541e-05, 5.219131708145142e-06, 2.1144747734069824e-05, 3.707036375999451e-05, 5.299597978591919e-05, 6.892159581184387e-05, 8.484721183776855e-05, 0.00010077282786369324, 0.00011669844388961792, 0.0001326240599155426, 0.00014854967594146729, 0.00016447529196739197, 0.00018040090799331665, 0.00019632652401924133, 0.00021225214004516602, 0.0002281777560710907, 0.00024410337209701538, 0.00026002898812294006, 0.00027595460414886475, 0.00029188022017478943, 0.0003078058362007141, 0.0003237314522266388, 0.0003396570682525635, 0.00035558268427848816, 0.00037150830030441284, 0.0003874339163303375, 0.0004033595323562622, 0.0004192851483821869, 0.00043521076440811157, 0.00045113638043403625, 0.00046706199645996094]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 2.0, 5.0, 7.0, 20.0, 23.0, 29.0, 33.0, 51.0, 80.0, 112.0, 190.0, 277.0, 424.0, 701.0, 1078.0, 1998.0, 3555.0, 6961.0, 14763.0, 38492.0, 131167.0, 480257.0, 259164.0, 65748.0, 22644.0, 9644.0, 4713.0, 2534.0, 1488.0, 831.0, 558.0, 341.0, 232.0, 136.0, 100.0, 72.0, 41.0, 23.0, 18.0, 10.0, 14.0, 6.0, 8.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3955078125, -1.34857177734375, -1.3016357421875, -1.25469970703125, -1.207763671875, -1.16082763671875, -1.1138916015625, -1.06695556640625, -1.02001953125, -0.97308349609375, -0.9261474609375, -0.87921142578125, -0.832275390625, -0.78533935546875, -0.7384033203125, -0.69146728515625, -0.64453125, -0.59759521484375, -0.5506591796875, -0.50372314453125, -0.456787109375, -0.40985107421875, -0.3629150390625, -0.31597900390625, -0.26904296875, -0.22210693359375, -0.1751708984375, -0.12823486328125, -0.081298828125, -0.03436279296875, 0.0125732421875, 0.05950927734375, 0.1064453125, 0.15338134765625, 0.2003173828125, 0.24725341796875, 0.294189453125, 0.34112548828125, 0.3880615234375, 0.43499755859375, 0.48193359375, 0.52886962890625, 0.5758056640625, 0.62274169921875, 0.669677734375, 0.71661376953125, 0.7635498046875, 0.81048583984375, 0.857421875, 0.90435791015625, 0.9512939453125, 0.99822998046875, 1.045166015625, 1.09210205078125, 1.1390380859375, 1.18597412109375, 1.23291015625, 1.27984619140625, 1.3267822265625, 1.37371826171875, 1.420654296875, 1.46759033203125, 1.5145263671875, 1.56146240234375, 1.6083984375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 4.0, 3.0, 2.0, 3.0, 6.0, 5.0, 8.0, 14.0, 14.0, 13.0, 32.0, 28.0, 29.0, 57.0, 75.0, 95.0, 81.0, 102.0, 88.0, 82.0, 51.0, 46.0, 34.0, 21.0, 27.0, 19.0, 13.0, 11.0, 11.0, 4.0, 7.0, 5.0, 3.0, 3.0, 3.0, 3.0, 1.0, 4.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7265625, -1.66583251953125, -1.6051025390625, -1.54437255859375, -1.483642578125, -1.42291259765625, -1.3621826171875, -1.30145263671875, -1.24072265625, -1.17999267578125, -1.1192626953125, -1.05853271484375, -0.997802734375, -0.93707275390625, -0.8763427734375, -0.81561279296875, -0.7548828125, -0.69415283203125, -0.6334228515625, -0.57269287109375, -0.511962890625, -0.45123291015625, -0.3905029296875, -0.32977294921875, -0.26904296875, -0.20831298828125, -0.1475830078125, -0.08685302734375, -0.026123046875, 0.03460693359375, 0.0953369140625, 0.15606689453125, 0.216796875, 0.27752685546875, 0.3382568359375, 0.39898681640625, 0.459716796875, 0.52044677734375, 0.5811767578125, 0.64190673828125, 0.70263671875, 0.76336669921875, 0.8240966796875, 0.88482666015625, 0.945556640625, 1.00628662109375, 1.0670166015625, 1.12774658203125, 1.1884765625, 1.24920654296875, 1.3099365234375, 1.37066650390625, 1.431396484375, 1.49212646484375, 1.5528564453125, 1.61358642578125, 1.67431640625, 1.73504638671875, 1.7957763671875, 1.85650634765625, 1.917236328125, 1.97796630859375, 2.0386962890625, 2.09942626953125, 2.16015625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 4.0, 0.0, 4.0, 4.0, 11.0, 20.0, 29.0, 52.0, 79.0, 96.0, 133.0, 130.0, 137.0, 111.0, 70.0, 43.0, 22.0, 25.0, 13.0, 9.0, 7.0, 2.0, 4.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-45.897438049316406, -44.8162727355957, -43.735103607177734, -42.65393829345703, -41.57277297973633, -40.491607666015625, -39.410438537597656, -38.32927322387695, -37.24810791015625, -36.16694259643555, -35.08577346801758, -34.004608154296875, -32.92344284057617, -31.842275619506836, -30.7611083984375, -29.679943084716797, -28.598773956298828, -27.517606735229492, -26.43644142150879, -25.355274200439453, -24.27410888671875, -23.192941665649414, -22.111774444580078, -21.030609130859375, -19.94944190979004, -18.868274688720703, -17.787109375, -16.705942153930664, -15.624775886535645, -14.543609619140625, -13.462442398071289, -12.38127613067627, -11.300107955932617, -10.218941688537598, -9.137775421142578, -8.056608200073242, -6.975441932678223, -5.894275665283203, -4.813108921051025, -3.7319421768188477, -2.650775909423828, -1.5696094036102295, -0.48844289779663086, 0.5927236080169678, 1.6738901138305664, 2.755056381225586, 3.8362231254577637, 4.917389869689941, 5.998556137084961, 7.0797224044799805, 8.160888671875, 9.242055892944336, 10.323222160339355, 11.404388427734375, 12.485555648803711, 13.56672191619873, 14.64788818359375, 15.72905445098877, 16.81022071838379, 17.891387939453125, 18.972553253173828, 20.053720474243164, 21.1348876953125, 22.216053009033203, 23.29722023010254]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 2.0, 8.0, 8.0, 9.0, 12.0, 9.0, 19.0, 23.0, 21.0, 26.0, 15.0, 26.0, 28.0, 28.0, 35.0, 23.0, 42.0, 30.0, 37.0, 37.0, 44.0, 41.0, 39.0, 32.0, 41.0, 33.0, 42.0, 33.0, 23.0, 23.0, 33.0, 24.0, 22.0, 19.0, 17.0, 15.0, 16.0, 11.0, 14.0, 12.0, 1.0, 5.0, 3.0, 3.0, 0.0, 3.0, 1.0, 6.0, 1.0, 2.0, 3.0, 1.0, 2.0], "bins": [-20.260244369506836, -19.632579803466797, -19.004913330078125, -18.377246856689453, -17.749582290649414, -17.121917724609375, -16.494251251220703, -15.866585731506348, -15.238920211791992, -14.611254692077637, -13.983589172363281, -13.355923652648926, -12.72825813293457, -12.100592613220215, -11.47292709350586, -10.845261573791504, -10.217596054077148, -9.589930534362793, -8.962265014648438, -8.334599494934082, -7.706933975219727, -7.079268455505371, -6.451602935791016, -5.82393741607666, -5.196271896362305, -4.568606376647949, -3.9409408569335938, -3.3132753372192383, -2.685609817504883, -2.0579442977905273, -1.4302787780761719, -0.8026132583618164, -0.17494773864746094, 0.45271778106689453, 1.08038330078125, 1.7080488204956055, 2.335714340209961, 2.9633798599243164, 3.591045379638672, 4.218710899353027, 4.846376419067383, 5.474041938781738, 6.101707458496094, 6.729372978210449, 7.357038497924805, 7.98470401763916, 8.612369537353516, 9.240035057067871, 9.867700576782227, 10.495366096496582, 11.123031616210938, 11.750697135925293, 12.378362655639648, 13.006028175354004, 13.63369369506836, 14.261359214782715, 14.88902473449707, 15.516690254211426, 16.14435577392578, 16.772022247314453, 17.399686813354492, 18.02735137939453, 18.655017852783203, 19.282684326171875, 19.910348892211914]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 11.0, 6.0, 4.0, 7.0, 10.0, 12.0, 13.0, 19.0, 29.0, 37.0, 64.0, 90.0, 163.0, 344.0, 859.0, 2472.0, 8527.0, 47512.0, 3984588.0, 128450.0, 14845.0, 3898.0, 1292.0, 539.0, 227.0, 110.0, 52.0, 34.0, 22.0, 14.0, 12.0, 4.0, 7.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.625, -14.2564697265625, -13.887939453125, -13.5194091796875, -13.15087890625, -12.7823486328125, -12.413818359375, -12.0452880859375, -11.6767578125, -11.3082275390625, -10.939697265625, -10.5711669921875, -10.20263671875, -9.8341064453125, -9.465576171875, -9.0970458984375, -8.728515625, -8.3599853515625, -7.991455078125, -7.6229248046875, -7.25439453125, -6.8858642578125, -6.517333984375, -6.1488037109375, -5.7802734375, -5.4117431640625, -5.043212890625, -4.6746826171875, -4.30615234375, -3.9376220703125, -3.569091796875, -3.2005615234375, -2.83203125, -2.4635009765625, -2.094970703125, -1.7264404296875, -1.35791015625, -0.9893798828125, -0.620849609375, -0.2523193359375, 0.1162109375, 0.4847412109375, 0.853271484375, 1.2218017578125, 1.59033203125, 1.9588623046875, 2.327392578125, 2.6959228515625, 3.064453125, 3.4329833984375, 3.801513671875, 4.1700439453125, 4.53857421875, 4.9071044921875, 5.275634765625, 5.6441650390625, 6.0126953125, 6.3812255859375, 6.749755859375, 7.1182861328125, 7.48681640625, 7.8553466796875, 8.223876953125, 8.5924072265625, 8.9609375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 11.0, 8.0, 8.0, 22.0, 27.0, 20.0, 36.0, 46.0, 47.0, 51.0, 63.0, 68.0, 60.0, 74.0, 68.0, 52.0, 62.0, 58.0, 47.0, 37.0, 24.0, 25.0, 23.0, 18.0, 17.0, 10.0, 6.0, 7.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.7607421875, -1.713623046875, -1.66650390625, -1.619384765625, -1.572265625, -1.525146484375, -1.47802734375, -1.430908203125, -1.3837890625, -1.336669921875, -1.28955078125, -1.242431640625, -1.1953125, -1.148193359375, -1.10107421875, -1.053955078125, -1.0068359375, -0.959716796875, -0.91259765625, -0.865478515625, -0.818359375, -0.771240234375, -0.72412109375, -0.677001953125, -0.6298828125, -0.582763671875, -0.53564453125, -0.488525390625, -0.44140625, -0.394287109375, -0.34716796875, -0.300048828125, -0.2529296875, -0.205810546875, -0.15869140625, -0.111572265625, -0.064453125, -0.017333984375, 0.02978515625, 0.076904296875, 0.1240234375, 0.171142578125, 0.21826171875, 0.265380859375, 0.3125, 0.359619140625, 0.40673828125, 0.453857421875, 0.5009765625, 0.548095703125, 0.59521484375, 0.642333984375, 0.689453125, 0.736572265625, 0.78369140625, 0.830810546875, 0.8779296875, 0.925048828125, 0.97216796875, 1.019287109375, 1.06640625, 1.113525390625, 1.16064453125, 1.207763671875, 1.2548828125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 3.0, 2.0, 7.0, 12.0, 15.0, 15.0, 18.0, 27.0, 40.0, 56.0, 67.0, 100.0, 152.0, 234.0, 396.0, 626.0, 1023.0, 1924.0, 3742.0, 8030.0, 19312.0, 61909.0, 777065.0, 3205312.0, 74273.0, 22015.0, 8841.0, 4082.0, 1998.0, 1187.0, 628.0, 394.0, 269.0, 139.0, 105.0, 77.0, 48.0, 35.0, 39.0, 26.0, 13.0, 10.0, 8.0, 3.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.13671875, -5.93914794921875, -5.7415771484375, -5.54400634765625, -5.346435546875, -5.14886474609375, -4.9512939453125, -4.75372314453125, -4.55615234375, -4.35858154296875, -4.1610107421875, -3.96343994140625, -3.765869140625, -3.56829833984375, -3.3707275390625, -3.17315673828125, -2.9755859375, -2.77801513671875, -2.5804443359375, -2.38287353515625, -2.185302734375, -1.98773193359375, -1.7901611328125, -1.59259033203125, -1.39501953125, -1.19744873046875, -0.9998779296875, -0.80230712890625, -0.604736328125, -0.40716552734375, -0.2095947265625, -0.01202392578125, 0.185546875, 0.38311767578125, 0.5806884765625, 0.77825927734375, 0.975830078125, 1.17340087890625, 1.3709716796875, 1.56854248046875, 1.76611328125, 1.96368408203125, 2.1612548828125, 2.35882568359375, 2.556396484375, 2.75396728515625, 2.9515380859375, 3.14910888671875, 3.3466796875, 3.54425048828125, 3.7418212890625, 3.93939208984375, 4.136962890625, 4.33453369140625, 4.5321044921875, 4.72967529296875, 4.92724609375, 5.12481689453125, 5.3223876953125, 5.51995849609375, 5.717529296875, 5.91510009765625, 6.1126708984375, 6.31024169921875, 6.5078125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 3.0, 3.0, 3.0, 13.0, 10.0, 13.0, 23.0, 24.0, 35.0, 106.0, 240.0, 2818.0, 421.0, 127.0, 80.0, 40.0, 32.0, 22.0, 14.0, 13.0, 4.0, 9.0, 5.0, 9.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.79296875, -4.665771484375, -4.53857421875, -4.411376953125, -4.2841796875, -4.156982421875, -4.02978515625, -3.902587890625, -3.775390625, -3.648193359375, -3.52099609375, -3.393798828125, -3.2666015625, -3.139404296875, -3.01220703125, -2.885009765625, -2.7578125, -2.630615234375, -2.50341796875, -2.376220703125, -2.2490234375, -2.121826171875, -1.99462890625, -1.867431640625, -1.740234375, -1.613037109375, -1.48583984375, -1.358642578125, -1.2314453125, -1.104248046875, -0.97705078125, -0.849853515625, -0.72265625, -0.595458984375, -0.46826171875, -0.341064453125, -0.2138671875, -0.086669921875, 0.04052734375, 0.167724609375, 0.294921875, 0.422119140625, 0.54931640625, 0.676513671875, 0.8037109375, 0.930908203125, 1.05810546875, 1.185302734375, 1.3125, 1.439697265625, 1.56689453125, 1.694091796875, 1.8212890625, 1.948486328125, 2.07568359375, 2.202880859375, 2.330078125, 2.457275390625, 2.58447265625, 2.711669921875, 2.8388671875, 2.966064453125, 3.09326171875, 3.220458984375, 3.34765625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 4.0, 5.0, 10.0, 19.0, 19.0, 40.0, 47.0, 67.0, 110.0, 146.0, 177.0, 136.0, 90.0, 54.0, 22.0, 17.0, 16.0, 4.0, 5.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.25238037109375, -11.67287826538086, -11.093375205993652, -10.513872146606445, -9.934370040893555, -9.354867935180664, -8.775364875793457, -8.19586181640625, -7.616359710693359, -7.0368571281433105, -6.457354545593262, -5.877851963043213, -5.298349380493164, -4.718846797943115, -4.139344215393066, -3.5598416328430176, -2.9803390502929688, -2.40083646774292, -1.821333885192871, -1.2418313026428223, -0.6623287200927734, -0.08282613754272461, 0.4966764450073242, 1.076179027557373, 1.6556816101074219, 2.2351841926574707, 2.8146867752075195, 3.3941893577575684, 3.973691940307617, 4.553194522857666, 5.132697105407715, 5.712199687957764, 6.291704177856445, 6.871206760406494, 7.450709342956543, 8.03021240234375, 8.60971450805664, 9.189216613769531, 9.768719673156738, 10.348222732543945, 10.927724838256836, 11.507226943969727, 12.086730003356934, 12.66623306274414, 13.245735168457031, 13.825237274169922, 14.404740333557129, 14.984243392944336, 15.563745498657227, 16.143247604370117, 16.72275161743164, 17.30225372314453, 17.881755828857422, 18.461257934570312, 19.040760040283203, 19.620264053344727, 20.199766159057617, 20.779268264770508, 21.35877227783203, 21.938274383544922, 22.517776489257812, 23.097278594970703, 23.676780700683594, 24.256284713745117, 24.835786819458008]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 1.0, 7.0, 4.0, 3.0, 6.0, 10.0, 8.0, 13.0, 16.0, 23.0, 18.0, 21.0, 36.0, 26.0, 25.0, 38.0, 39.0, 33.0, 53.0, 39.0, 42.0, 40.0, 48.0, 41.0, 39.0, 30.0, 41.0, 29.0, 36.0, 41.0, 31.0, 25.0, 28.0, 17.0, 25.0, 11.0, 16.0, 11.0, 5.0, 8.0, 6.0, 3.0, 2.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.516212463378906, -8.23979663848877, -7.963380813598633, -7.686964988708496, -7.410549163818359, -7.134133338928223, -6.857717990875244, -6.581302165985107, -6.304886341094971, -6.028470516204834, -5.752054691314697, -5.4756388664245605, -5.199223518371582, -4.922807693481445, -4.646391868591309, -4.369976043701172, -4.093560218811035, -3.8171443939208984, -3.5407285690307617, -3.264312982559204, -2.9878971576690674, -2.7114813327789307, -2.435065746307373, -2.1586499214172363, -1.8822340965270996, -1.605818271636963, -1.3294025659561157, -1.0529868602752686, -0.7765710353851318, -0.5001552104949951, -0.22373950481414795, 0.05267620086669922, 0.32909297943115234, 0.6055087447166443, 0.8819245100021362, 1.1583402156829834, 1.4347560405731201, 1.7111718654632568, 1.987587571144104, 2.264003276824951, 2.540419101715088, 2.8168349266052246, 3.0932507514953613, 3.369666337966919, 3.6460821628570557, 3.9224979877471924, 4.19891357421875, 4.475329399108887, 4.751745223999023, 5.02816104888916, 5.304576873779297, 5.580992698669434, 5.85740852355957, 6.133824348449707, 6.4102396965026855, 6.686655521392822, 6.963071346282959, 7.239487171173096, 7.515902996063232, 7.792318820953369, 8.068734169006348, 8.345149993896484, 8.621565818786621, 8.897981643676758, 9.174397468566895]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 3.0, 6.0, 5.0, 1.0, 13.0, 14.0, 32.0, 46.0, 78.0, 163.0, 296.0, 717.0, 1808.0, 6168.0, 27666.0, 164463.0, 642326.0, 167212.0, 28067.0, 6296.0, 1821.0, 697.0, 290.0, 143.0, 83.0, 54.0, 28.0, 23.0, 15.0, 8.0, 10.0, 5.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.3125, -9.0345458984375, -8.756591796875, -8.4786376953125, -8.20068359375, -7.9227294921875, -7.644775390625, -7.3668212890625, -7.0888671875, -6.8109130859375, -6.532958984375, -6.2550048828125, -5.97705078125, -5.6990966796875, -5.421142578125, -5.1431884765625, -4.865234375, -4.5872802734375, -4.309326171875, -4.0313720703125, -3.75341796875, -3.4754638671875, -3.197509765625, -2.9195556640625, -2.6416015625, -2.3636474609375, -2.085693359375, -1.8077392578125, -1.52978515625, -1.2518310546875, -0.973876953125, -0.6959228515625, -0.41796875, -0.1400146484375, 0.137939453125, 0.4158935546875, 0.69384765625, 0.9718017578125, 1.249755859375, 1.5277099609375, 1.8056640625, 2.0836181640625, 2.361572265625, 2.6395263671875, 2.91748046875, 3.1954345703125, 3.473388671875, 3.7513427734375, 4.029296875, 4.3072509765625, 4.585205078125, 4.8631591796875, 5.14111328125, 5.4190673828125, 5.697021484375, 5.9749755859375, 6.2529296875, 6.5308837890625, 6.808837890625, 7.0867919921875, 7.36474609375, 7.6427001953125, 7.920654296875, 8.1986083984375, 8.4765625]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 9.0, 4.0, 7.0, 7.0, 18.0, 20.0, 21.0, 34.0, 32.0, 36.0, 44.0, 58.0, 66.0, 57.0, 68.0, 75.0, 53.0, 60.0, 57.0, 37.0, 44.0, 37.0, 36.0, 30.0, 26.0, 19.0, 10.0, 16.0, 13.0, 6.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.7177734375, -1.6693572998046875, -1.620941162109375, -1.5725250244140625, -1.52410888671875, -1.4756927490234375, -1.427276611328125, -1.3788604736328125, -1.3304443359375, -1.2820281982421875, -1.233612060546875, -1.1851959228515625, -1.13677978515625, -1.0883636474609375, -1.039947509765625, -0.9915313720703125, -0.943115234375, -0.8946990966796875, -0.846282958984375, -0.7978668212890625, -0.74945068359375, -0.7010345458984375, -0.652618408203125, -0.6042022705078125, -0.5557861328125, -0.5073699951171875, -0.458953857421875, -0.4105377197265625, -0.36212158203125, -0.3137054443359375, -0.265289306640625, -0.2168731689453125, -0.16845703125, -0.1200408935546875, -0.071624755859375, -0.0232086181640625, 0.02520751953125, 0.0736236572265625, 0.122039794921875, 0.1704559326171875, 0.2188720703125, 0.2672882080078125, 0.315704345703125, 0.3641204833984375, 0.41253662109375, 0.4609527587890625, 0.509368896484375, 0.5577850341796875, 0.606201171875, 0.6546173095703125, 0.703033447265625, 0.7514495849609375, 0.79986572265625, 0.8482818603515625, 0.896697998046875, 0.9451141357421875, 0.9935302734375, 1.0419464111328125, 1.090362548828125, 1.1387786865234375, 1.18719482421875, 1.2356109619140625, 1.284027099609375, 1.3324432373046875, 1.380859375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 6.0, 7.0, 10.0, 15.0, 15.0, 14.0, 34.0, 45.0, 69.0, 111.0, 191.0, 320.0, 551.0, 1065.0, 2120.0, 4427.0, 10339.0, 26018.0, 74634.0, 266680.0, 455038.0, 135344.0, 42525.0, 16106.0, 6540.0, 3030.0, 1489.0, 762.0, 408.0, 211.0, 158.0, 66.0, 60.0, 42.0, 26.0, 19.0, 20.0, 12.0, 9.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-5.26171875, -5.10345458984375, -4.9451904296875, -4.78692626953125, -4.628662109375, -4.47039794921875, -4.3121337890625, -4.15386962890625, -3.99560546875, -3.83734130859375, -3.6790771484375, -3.52081298828125, -3.362548828125, -3.20428466796875, -3.0460205078125, -2.88775634765625, -2.7294921875, -2.57122802734375, -2.4129638671875, -2.25469970703125, -2.096435546875, -1.93817138671875, -1.7799072265625, -1.62164306640625, -1.46337890625, -1.30511474609375, -1.1468505859375, -0.98858642578125, -0.830322265625, -0.67205810546875, -0.5137939453125, -0.35552978515625, -0.197265625, -0.03900146484375, 0.1192626953125, 0.27752685546875, 0.435791015625, 0.59405517578125, 0.7523193359375, 0.91058349609375, 1.06884765625, 1.22711181640625, 1.3853759765625, 1.54364013671875, 1.701904296875, 1.86016845703125, 2.0184326171875, 2.17669677734375, 2.3349609375, 2.49322509765625, 2.6514892578125, 2.80975341796875, 2.968017578125, 3.12628173828125, 3.2845458984375, 3.44281005859375, 3.60107421875, 3.75933837890625, 3.9176025390625, 4.07586669921875, 4.234130859375, 4.39239501953125, 4.5506591796875, 4.70892333984375, 4.8671875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 3.0, 3.0, 3.0, 8.0, 7.0, 10.0, 12.0, 16.0, 10.0, 21.0, 25.0, 21.0, 19.0, 26.0, 26.0, 40.0, 44.0, 42.0, 52.0, 39.0, 48.0, 53.0, 46.0, 56.0, 45.0, 47.0, 38.0, 33.0, 24.0, 27.0, 31.0, 22.0, 22.0, 8.0, 13.0, 14.0, 9.0, 7.0, 7.0, 8.0, 3.0, 1.0, 6.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.48828125, -5.2955322265625, -5.102783203125, -4.9100341796875, -4.71728515625, -4.5245361328125, -4.331787109375, -4.1390380859375, -3.9462890625, -3.7535400390625, -3.560791015625, -3.3680419921875, -3.17529296875, -2.9825439453125, -2.789794921875, -2.5970458984375, -2.404296875, -2.2115478515625, -2.018798828125, -1.8260498046875, -1.63330078125, -1.4405517578125, -1.247802734375, -1.0550537109375, -0.8623046875, -0.6695556640625, -0.476806640625, -0.2840576171875, -0.09130859375, 0.1014404296875, 0.294189453125, 0.4869384765625, 0.6796875, 0.8724365234375, 1.065185546875, 1.2579345703125, 1.45068359375, 1.6434326171875, 1.836181640625, 2.0289306640625, 2.2216796875, 2.4144287109375, 2.607177734375, 2.7999267578125, 2.99267578125, 3.1854248046875, 3.378173828125, 3.5709228515625, 3.763671875, 3.9564208984375, 4.149169921875, 4.3419189453125, 4.53466796875, 4.7274169921875, 4.920166015625, 5.1129150390625, 5.3056640625, 5.4984130859375, 5.691162109375, 5.8839111328125, 6.07666015625, 6.2694091796875, 6.462158203125, 6.6549072265625, 6.84765625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 2.0, 6.0, 6.0, 12.0, 9.0, 13.0, 14.0, 33.0, 44.0, 38.0, 66.0, 115.0, 180.0, 293.0, 505.0, 1071.0, 2376.0, 6267.0, 20951.0, 106920.0, 668924.0, 195018.0, 30974.0, 8703.0, 3092.0, 1316.0, 660.0, 318.0, 211.0, 130.0, 85.0, 46.0, 46.0, 30.0, 20.0, 13.0, 16.0, 7.0, 8.0, 6.0, 2.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0], "bins": [-3.828125, -3.710845947265625, -3.59356689453125, -3.476287841796875, -3.3590087890625, -3.241729736328125, -3.12445068359375, -3.007171630859375, -2.889892578125, -2.772613525390625, -2.65533447265625, -2.538055419921875, -2.4207763671875, -2.303497314453125, -2.18621826171875, -2.068939208984375, -1.95166015625, -1.834381103515625, -1.71710205078125, -1.599822998046875, -1.4825439453125, -1.365264892578125, -1.24798583984375, -1.130706787109375, -1.013427734375, -0.896148681640625, -0.77886962890625, -0.661590576171875, -0.5443115234375, -0.427032470703125, -0.30975341796875, -0.192474365234375, -0.0751953125, 0.042083740234375, 0.15936279296875, 0.276641845703125, 0.3939208984375, 0.511199951171875, 0.62847900390625, 0.745758056640625, 0.863037109375, 0.980316162109375, 1.09759521484375, 1.214874267578125, 1.3321533203125, 1.449432373046875, 1.56671142578125, 1.683990478515625, 1.80126953125, 1.918548583984375, 2.03582763671875, 2.153106689453125, 2.2703857421875, 2.387664794921875, 2.50494384765625, 2.622222900390625, 2.739501953125, 2.856781005859375, 2.97406005859375, 3.091339111328125, 3.2086181640625, 3.325897216796875, 3.44317626953125, 3.560455322265625, 3.677734375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 10.0, 12.0, 24.0, 47.0, 79.0, 176.0, 218.0, 191.0, 105.0, 72.0, 33.0, 14.0, 8.0, 6.0, 3.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001316070556640625, -0.0012836754322052002, -0.0012512803077697754, -0.0012188851833343506, -0.0011864900588989258, -0.001154094934463501, -0.0011216998100280762, -0.0010893046855926514, -0.0010569095611572266, -0.0010245144367218018, -0.000992119312286377, -0.0009597241878509521, -0.0009273290634155273, -0.0008949339389801025, -0.0008625388145446777, -0.0008301436901092529, -0.0007977485656738281, -0.0007653534412384033, -0.0007329583168029785, -0.0007005631923675537, -0.0006681680679321289, -0.0006357729434967041, -0.0006033778190612793, -0.0005709826946258545, -0.0005385875701904297, -0.0005061924457550049, -0.0004737973213195801, -0.0004414021968841553, -0.00040900707244873047, -0.00037661194801330566, -0.00034421682357788086, -0.00031182169914245605, -0.00027942657470703125, -0.00024703145027160645, -0.00021463632583618164, -0.00018224120140075684, -0.00014984607696533203, -0.00011745095252990723, -8.505582809448242e-05, -5.266070365905762e-05, -2.0265579223632812e-05, 1.2129545211791992e-05, 4.45246696472168e-05, 7.69197940826416e-05, 0.0001093149185180664, 0.0001417100429534912, 0.00017410516738891602, 0.00020650029182434082, 0.00023889541625976562, 0.00027129054069519043, 0.00030368566513061523, 0.00033608078956604004, 0.00036847591400146484, 0.00040087103843688965, 0.00043326616287231445, 0.00046566128730773926, 0.0004980564117431641, 0.0005304515361785889, 0.0005628466606140137, 0.0005952417850494385, 0.0006276369094848633, 0.0006600320339202881, 0.0006924271583557129, 0.0007248222827911377, 0.0007572174072265625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 11.0, 14.0, 15.0, 30.0, 45.0, 87.0, 168.0, 269.0, 518.0, 1171.0, 2629.0, 7074.0, 24345.0, 144566.0, 712564.0, 121969.0, 21876.0, 6562.0, 2521.0, 1037.0, 476.0, 254.0, 163.0, 94.0, 35.0, 28.0, 12.0, 9.0, 5.0, 6.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.2421875, -5.109344482421875, -4.97650146484375, -4.843658447265625, -4.7108154296875, -4.577972412109375, -4.44512939453125, -4.312286376953125, -4.179443359375, -4.046600341796875, -3.91375732421875, -3.780914306640625, -3.6480712890625, -3.515228271484375, -3.38238525390625, -3.249542236328125, -3.11669921875, -2.983856201171875, -2.85101318359375, -2.718170166015625, -2.5853271484375, -2.452484130859375, -2.31964111328125, -2.186798095703125, -2.053955078125, -1.921112060546875, -1.78826904296875, -1.655426025390625, -1.5225830078125, -1.389739990234375, -1.25689697265625, -1.124053955078125, -0.9912109375, -0.858367919921875, -0.72552490234375, -0.592681884765625, -0.4598388671875, -0.326995849609375, -0.19415283203125, -0.061309814453125, 0.071533203125, 0.204376220703125, 0.33721923828125, 0.470062255859375, 0.6029052734375, 0.735748291015625, 0.86859130859375, 1.001434326171875, 1.13427734375, 1.267120361328125, 1.39996337890625, 1.532806396484375, 1.6656494140625, 1.798492431640625, 1.93133544921875, 2.064178466796875, 2.197021484375, 2.329864501953125, 2.46270751953125, 2.595550537109375, 2.7283935546875, 2.861236572265625, 2.99407958984375, 3.126922607421875, 3.259765625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 5.0, 3.0, 5.0, 3.0, 2.0, 10.0, 13.0, 10.0, 20.0, 24.0, 22.0, 41.0, 69.0, 109.0, 148.0, 148.0, 124.0, 70.0, 60.0, 27.0, 20.0, 14.0, 11.0, 9.0, 11.0, 9.0, 1.0, 5.0, 5.0, 0.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.623046875, -3.484832763671875, -3.34661865234375, -3.208404541015625, -3.0701904296875, -2.931976318359375, -2.79376220703125, -2.655548095703125, -2.517333984375, -2.379119873046875, -2.24090576171875, -2.102691650390625, -1.9644775390625, -1.826263427734375, -1.68804931640625, -1.549835205078125, -1.41162109375, -1.273406982421875, -1.13519287109375, -0.996978759765625, -0.8587646484375, -0.720550537109375, -0.58233642578125, -0.444122314453125, -0.305908203125, -0.167694091796875, -0.02947998046875, 0.108734130859375, 0.2469482421875, 0.385162353515625, 0.52337646484375, 0.661590576171875, 0.7998046875, 0.938018798828125, 1.07623291015625, 1.214447021484375, 1.3526611328125, 1.490875244140625, 1.62908935546875, 1.767303466796875, 1.905517578125, 2.043731689453125, 2.18194580078125, 2.320159912109375, 2.4583740234375, 2.596588134765625, 2.73480224609375, 2.873016357421875, 3.01123046875, 3.149444580078125, 3.28765869140625, 3.425872802734375, 3.5640869140625, 3.702301025390625, 3.84051513671875, 3.978729248046875, 4.116943359375, 4.255157470703125, 4.39337158203125, 4.531585693359375, 4.6697998046875, 4.808013916015625, 4.94622802734375, 5.084442138671875, 5.22265625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 7.0, 20.0, 82.0, 249.0, 367.0, 186.0, 67.0, 25.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-225.08436584472656, -220.86749267578125, -216.65060424804688, -212.43373107910156, -208.21685791015625, -203.99996948242188, -199.78309631347656, -195.56622314453125, -191.34933471679688, -187.13246154785156, -182.9155731201172, -178.69869995117188, -174.48182678222656, -170.2649383544922, -166.04806518554688, -161.83119201660156, -157.61431884765625, -153.39744567871094, -149.18055725097656, -144.96368408203125, -140.74681091308594, -136.52992248535156, -132.31304931640625, -128.09617614746094, -123.87928771972656, -119.66240692138672, -115.4455337524414, -111.22865295410156, -107.01177215576172, -102.79489135742188, -98.57801818847656, -94.36113739013672, -90.14424896240234, -85.9273681640625, -81.71049499511719, -77.49361419677734, -73.2767333984375, -69.05986022949219, -64.84297943115234, -60.6260986328125, -56.40922164916992, -52.192344665527344, -47.9754638671875, -43.75858688354492, -39.541709899902344, -35.3248291015625, -31.107952117919922, -26.89107322692871, -22.6741943359375, -18.45731544494629, -14.240437507629395, -10.0235595703125, -5.806680679321289, -1.5898017883300781, 2.6270751953125, 6.843954086303711, 11.060832977294922, 15.277711868286133, 19.494590759277344, 23.711467742919922, 27.928346633911133, 32.145225524902344, 36.36210250854492, 40.5789794921875, 44.795860290527344]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 6.0, 6.0, 3.0, 9.0, 12.0, 17.0, 14.0, 18.0, 25.0, 22.0, 34.0, 40.0, 40.0, 58.0, 52.0, 53.0, 51.0, 63.0, 57.0, 54.0, 61.0, 46.0, 52.0, 31.0, 37.0, 36.0, 23.0, 17.0, 18.0, 16.0, 10.0, 10.0, 9.0, 3.0, 2.0, 5.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.235107421875, -39.83210372924805, -38.42909622192383, -37.026092529296875, -35.62308883666992, -34.2200813293457, -32.81707763671875, -31.414072036743164, -30.011066436767578, -28.608060836791992, -27.20505714416504, -25.802051544189453, -24.399045944213867, -22.99604034423828, -21.593036651611328, -20.190031051635742, -18.78702735900879, -17.384021759033203, -15.981017112731934, -14.578012466430664, -13.175006866455078, -11.772002220153809, -10.368997573852539, -8.965991973876953, -7.562987327575684, -6.159982204437256, -4.756977081298828, -3.3539724349975586, -1.9509673118591309, -0.5479621887207031, 0.8550424575805664, 2.2580480575561523, 3.661052703857422, 5.06405782699585, 6.467062950134277, 7.870067596435547, 9.273073196411133, 10.676077842712402, 12.079082489013672, 13.482088088989258, 14.885092735290527, 16.288097381591797, 17.691102981567383, 19.09410858154297, 20.497112274169922, 21.900117874145508, 23.303123474121094, 24.706127166748047, 26.109132766723633, 27.51213836669922, 28.915142059326172, 30.318147659301758, 31.721153259277344, 33.1241569519043, 34.52716064453125, 35.93016815185547, 37.33317184448242, 38.736175537109375, 40.139183044433594, 41.54218673706055, 42.9451904296875, 44.34819793701172, 45.75120162963867, 47.154205322265625, 48.557212829589844]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 11.0, 8.0, 9.0, 19.0, 31.0, 37.0, 52.0, 75.0, 133.0, 190.0, 314.0, 505.0, 784.0, 1538.0, 3576.0, 13073.0, 4101776.0, 59965.0, 6846.0, 2303.0, 1201.0, 674.0, 416.0, 250.0, 156.0, 116.0, 74.0, 54.0, 26.0, 22.0, 9.0, 7.0, 5.0, 7.0, 5.0, 3.0, 7.0, 0.0, 3.0, 1.0, 1.0, 2.0], "bins": [-15.453125, -15.0546875, -14.65625, -14.2578125, -13.859375, -13.4609375, -13.0625, -12.6640625, -12.265625, -11.8671875, -11.46875, -11.0703125, -10.671875, -10.2734375, -9.875, -9.4765625, -9.078125, -8.6796875, -8.28125, -7.8828125, -7.484375, -7.0859375, -6.6875, -6.2890625, -5.890625, -5.4921875, -5.09375, -4.6953125, -4.296875, -3.8984375, -3.5, -3.1015625, -2.703125, -2.3046875, -1.90625, -1.5078125, -1.109375, -0.7109375, -0.3125, 0.0859375, 0.484375, 0.8828125, 1.28125, 1.6796875, 2.078125, 2.4765625, 2.875, 3.2734375, 3.671875, 4.0703125, 4.46875, 4.8671875, 5.265625, 5.6640625, 6.0625, 6.4609375, 6.859375, 7.2578125, 7.65625, 8.0546875, 8.453125, 8.8515625, 9.25, 9.6484375, 10.046875]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 10.0, 5.0, 10.0, 11.0, 18.0, 24.0, 28.0, 33.0, 40.0, 41.0, 37.0, 39.0, 50.0, 67.0, 65.0, 59.0, 50.0, 62.0, 64.0, 44.0, 51.0, 39.0, 35.0, 25.0, 19.0, 13.0, 20.0, 8.0, 11.0, 3.0, 6.0, 4.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.00390625, -1.94525146484375, -1.8865966796875, -1.82794189453125, -1.769287109375, -1.71063232421875, -1.6519775390625, -1.59332275390625, -1.53466796875, -1.47601318359375, -1.4173583984375, -1.35870361328125, -1.300048828125, -1.24139404296875, -1.1827392578125, -1.12408447265625, -1.0654296875, -1.00677490234375, -0.9481201171875, -0.88946533203125, -0.830810546875, -0.77215576171875, -0.7135009765625, -0.65484619140625, -0.59619140625, -0.53753662109375, -0.4788818359375, -0.42022705078125, -0.361572265625, -0.30291748046875, -0.2442626953125, -0.18560791015625, -0.126953125, -0.06829833984375, -0.0096435546875, 0.04901123046875, 0.107666015625, 0.16632080078125, 0.2249755859375, 0.28363037109375, 0.34228515625, 0.40093994140625, 0.4595947265625, 0.51824951171875, 0.576904296875, 0.63555908203125, 0.6942138671875, 0.75286865234375, 0.8115234375, 0.87017822265625, 0.9288330078125, 0.98748779296875, 1.046142578125, 1.10479736328125, 1.1634521484375, 1.22210693359375, 1.28076171875, 1.33941650390625, 1.3980712890625, 1.45672607421875, 1.515380859375, 1.57403564453125, 1.6326904296875, 1.69134521484375, 1.75]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 5.0, 3.0, 8.0, 6.0, 5.0, 17.0, 12.0, 27.0, 26.0, 51.0, 65.0, 88.0, 117.0, 160.0, 244.0, 296.0, 428.0, 579.0, 852.0, 1207.0, 1781.0, 2674.0, 4212.0, 7428.0, 16433.0, 66223.0, 4003701.0, 53721.0, 14761.0, 6982.0, 3927.0, 2557.0, 1618.0, 1134.0, 795.0, 588.0, 445.0, 280.0, 230.0, 154.0, 124.0, 93.0, 60.0, 46.0, 30.0, 31.0, 16.0, 14.0, 15.0, 11.0, 7.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.4296875, -5.24530029296875, -5.0609130859375, -4.87652587890625, -4.692138671875, -4.50775146484375, -4.3233642578125, -4.13897705078125, -3.95458984375, -3.77020263671875, -3.5858154296875, -3.40142822265625, -3.217041015625, -3.03265380859375, -2.8482666015625, -2.66387939453125, -2.4794921875, -2.29510498046875, -2.1107177734375, -1.92633056640625, -1.741943359375, -1.55755615234375, -1.3731689453125, -1.18878173828125, -1.00439453125, -0.82000732421875, -0.6356201171875, -0.45123291015625, -0.266845703125, -0.08245849609375, 0.1019287109375, 0.28631591796875, 0.470703125, 0.65509033203125, 0.8394775390625, 1.02386474609375, 1.208251953125, 1.39263916015625, 1.5770263671875, 1.76141357421875, 1.94580078125, 2.13018798828125, 2.3145751953125, 2.49896240234375, 2.683349609375, 2.86773681640625, 3.0521240234375, 3.23651123046875, 3.4208984375, 3.60528564453125, 3.7896728515625, 3.97406005859375, 4.158447265625, 4.34283447265625, 4.5272216796875, 4.71160888671875, 4.89599609375, 5.08038330078125, 5.2647705078125, 5.44915771484375, 5.633544921875, 5.81793212890625, 6.0023193359375, 6.18670654296875, 6.37109375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 1.0, 5.0, 4.0, 2.0, 1.0, 3.0, 10.0, 7.0, 15.0, 23.0, 39.0, 225.0, 3527.0, 89.0, 38.0, 25.0, 12.0, 7.0, 8.0, 5.0, 4.0, 1.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-1.6611328125, -1.612640380859375, -1.56414794921875, -1.515655517578125, -1.4671630859375, -1.418670654296875, -1.37017822265625, -1.321685791015625, -1.273193359375, -1.224700927734375, -1.17620849609375, -1.127716064453125, -1.0792236328125, -1.030731201171875, -0.98223876953125, -0.933746337890625, -0.88525390625, -0.836761474609375, -0.78826904296875, -0.739776611328125, -0.6912841796875, -0.642791748046875, -0.59429931640625, -0.545806884765625, -0.497314453125, -0.448822021484375, -0.40032958984375, -0.351837158203125, -0.3033447265625, -0.254852294921875, -0.20635986328125, -0.157867431640625, -0.109375, -0.060882568359375, -0.01239013671875, 0.036102294921875, 0.0845947265625, 0.133087158203125, 0.18157958984375, 0.230072021484375, 0.278564453125, 0.327056884765625, 0.37554931640625, 0.424041748046875, 0.4725341796875, 0.521026611328125, 0.56951904296875, 0.618011474609375, 0.66650390625, 0.714996337890625, 0.76348876953125, 0.811981201171875, 0.8604736328125, 0.908966064453125, 0.95745849609375, 1.005950927734375, 1.054443359375, 1.102935791015625, 1.15142822265625, 1.199920654296875, 1.2484130859375, 1.296905517578125, 1.34539794921875, 1.393890380859375, 1.4423828125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 9.0, 32.0, 96.0, 202.0, 276.0, 227.0, 108.0, 33.0, 17.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.639272689819336, -22.182661056518555, -21.726049423217773, -21.269437789916992, -20.81282615661621, -20.356212615966797, -19.899600982666016, -19.442989349365234, -18.986377716064453, -18.529766082763672, -18.07315444946289, -17.61654281616211, -17.159931182861328, -16.703319549560547, -16.246707916259766, -15.790095329284668, -15.333483695983887, -14.876872062683105, -14.420260429382324, -13.963647842407227, -13.507036209106445, -13.050424575805664, -12.593812942504883, -12.137201309204102, -11.68058967590332, -11.223978042602539, -10.767366409301758, -10.310754776000977, -9.854142189025879, -9.397530555725098, -8.940918922424316, -8.484307289123535, -8.027694702148438, -7.571083068847656, -7.114470958709717, -6.6578593254089355, -6.201247215270996, -5.744635581970215, -5.288023948669434, -4.831412315368652, -4.374800205230713, -3.9181883335113525, -3.461576461791992, -3.004964828491211, -2.5483529567718506, -2.0917410850524902, -1.635129451751709, -1.1785175800323486, -0.7219057083129883, -0.2652938961982727, 0.19131791591644287, 0.6479296684265137, 1.104541540145874, 1.5611534118652344, 2.0177650451660156, 2.474376916885376, 2.9309887886047363, 3.3876006603240967, 3.844212532043457, 4.300824165344238, 4.7574357986450195, 5.214047908782959, 5.67065954208374, 6.12727165222168, 6.583883285522461]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 0.0, 4.0, 2.0, 10.0, 9.0, 11.0, 16.0, 22.0, 21.0, 14.0, 15.0, 28.0, 30.0, 31.0, 34.0, 34.0, 40.0, 41.0, 48.0, 43.0, 55.0, 50.0, 45.0, 55.0, 51.0, 38.0, 34.0, 23.0, 29.0, 31.0, 21.0, 15.0, 22.0, 12.0, 15.0, 12.0, 11.0, 12.0, 3.0, 4.0, 7.0, 5.0, 1.0, 4.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.6851954460144043, -3.5713894367218018, -3.45758318901062, -3.3437771797180176, -3.229970932006836, -3.1161649227142334, -3.002358913421631, -2.888552665710449, -2.7747466564178467, -2.660940647125244, -2.5471343994140625, -2.43332839012146, -2.3195221424102783, -2.205716133117676, -2.091909885406494, -1.9781038761138916, -1.8642977476119995, -1.7504916191101074, -1.6366854906082153, -1.5228793621063232, -1.4090733528137207, -1.2952672243118286, -1.1814610958099365, -1.067655086517334, -0.9538488984107971, -0.840042769908905, -0.7262367010116577, -0.6124305725097656, -0.4986244738101959, -0.3848183751106262, -0.27101224660873413, -0.15720617771148682, -0.04340004920959473, 0.07040605694055557, 0.18421216309070587, 0.29801827669143677, 0.41182437539100647, 0.5256304740905762, 0.6394366025924683, 0.7532426714897156, 0.8670487999916077, 0.9808549284934998, 1.094660997390747, 1.2084671258926392, 1.3222732543945312, 1.4360792636871338, 1.5498855113983154, 1.663691520690918, 1.77749764919281, 1.8913037776947021, 2.0051097869873047, 2.1189160346984863, 2.232722043991089, 2.3465280532836914, 2.460334300994873, 2.5741403102874756, 2.6879465579986572, 2.8017525672912598, 2.9155588150024414, 3.029364824295044, 3.1431710720062256, 3.256977081298828, 3.3707833290100098, 3.4845893383026123, 3.598395347595215]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 4.0, 6.0, 5.0, 10.0, 13.0, 17.0, 24.0, 35.0, 46.0, 77.0, 128.0, 180.0, 330.0, 570.0, 959.0, 1657.0, 2968.0, 5650.0, 11720.0, 26172.0, 62940.0, 160723.0, 346856.0, 252312.0, 99873.0, 40431.0, 17358.0, 8184.0, 4138.0, 2144.0, 1239.0, 696.0, 382.0, 267.0, 138.0, 101.0, 62.0, 45.0, 29.0, 29.0, 17.0, 9.0, 4.0, 2.0, 6.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0], "bins": [-5.99609375, -5.828369140625, -5.66064453125, -5.492919921875, -5.3251953125, -5.157470703125, -4.98974609375, -4.822021484375, -4.654296875, -4.486572265625, -4.31884765625, -4.151123046875, -3.9833984375, -3.815673828125, -3.64794921875, -3.480224609375, -3.3125, -3.144775390625, -2.97705078125, -2.809326171875, -2.6416015625, -2.473876953125, -2.30615234375, -2.138427734375, -1.970703125, -1.802978515625, -1.63525390625, -1.467529296875, -1.2998046875, -1.132080078125, -0.96435546875, -0.796630859375, -0.62890625, -0.461181640625, -0.29345703125, -0.125732421875, 0.0419921875, 0.209716796875, 0.37744140625, 0.545166015625, 0.712890625, 0.880615234375, 1.04833984375, 1.216064453125, 1.3837890625, 1.551513671875, 1.71923828125, 1.886962890625, 2.0546875, 2.222412109375, 2.39013671875, 2.557861328125, 2.7255859375, 2.893310546875, 3.06103515625, 3.228759765625, 3.396484375, 3.564208984375, 3.73193359375, 3.899658203125, 4.0673828125, 4.235107421875, 4.40283203125, 4.570556640625, 4.73828125]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 11.0, 4.0, 12.0, 12.0, 7.0, 14.0, 20.0, 17.0, 30.0, 31.0, 51.0, 43.0, 34.0, 50.0, 45.0, 50.0, 53.0, 65.0, 47.0, 62.0, 59.0, 50.0, 42.0, 37.0, 29.0, 36.0, 18.0, 21.0, 12.0, 9.0, 7.0, 7.0, 5.0, 5.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7802734375, -1.7207183837890625, -1.661163330078125, -1.6016082763671875, -1.54205322265625, -1.4824981689453125, -1.422943115234375, -1.3633880615234375, -1.3038330078125, -1.2442779541015625, -1.184722900390625, -1.1251678466796875, -1.06561279296875, -1.0060577392578125, -0.946502685546875, -0.8869476318359375, -0.827392578125, -0.7678375244140625, -0.708282470703125, -0.6487274169921875, -0.58917236328125, -0.5296173095703125, -0.470062255859375, -0.4105072021484375, -0.3509521484375, -0.2913970947265625, -0.231842041015625, -0.1722869873046875, -0.11273193359375, -0.0531768798828125, 0.006378173828125, 0.0659332275390625, 0.12548828125, 0.1850433349609375, 0.244598388671875, 0.3041534423828125, 0.36370849609375, 0.4232635498046875, 0.482818603515625, 0.5423736572265625, 0.6019287109375, 0.6614837646484375, 0.721038818359375, 0.7805938720703125, 0.84014892578125, 0.8997039794921875, 0.959259033203125, 1.0188140869140625, 1.078369140625, 1.1379241943359375, 1.197479248046875, 1.2570343017578125, 1.31658935546875, 1.3761444091796875, 1.435699462890625, 1.4952545166015625, 1.5548095703125, 1.6143646240234375, 1.673919677734375, 1.7334747314453125, 1.79302978515625, 1.8525848388671875, 1.912139892578125, 1.9716949462890625, 2.03125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 0.0, 5.0, 3.0, 7.0, 7.0, 15.0, 18.0, 19.0, 39.0, 58.0, 76.0, 152.0, 175.0, 317.0, 576.0, 1162.0, 2609.0, 6148.0, 16854.0, 54773.0, 236089.0, 542910.0, 132317.0, 34177.0, 11491.0, 4482.0, 1963.0, 939.0, 429.0, 268.0, 157.0, 101.0, 61.0, 46.0, 30.0, 30.0, 17.0, 12.0, 7.0, 6.0, 5.0, 5.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.27734375, -7.03729248046875, -6.7972412109375, -6.55718994140625, -6.317138671875, -6.07708740234375, -5.8370361328125, -5.59698486328125, -5.35693359375, -5.11688232421875, -4.8768310546875, -4.63677978515625, -4.396728515625, -4.15667724609375, -3.9166259765625, -3.67657470703125, -3.4365234375, -3.19647216796875, -2.9564208984375, -2.71636962890625, -2.476318359375, -2.23626708984375, -1.9962158203125, -1.75616455078125, -1.51611328125, -1.27606201171875, -1.0360107421875, -0.79595947265625, -0.555908203125, -0.31585693359375, -0.0758056640625, 0.16424560546875, 0.404296875, 0.64434814453125, 0.8843994140625, 1.12445068359375, 1.364501953125, 1.60455322265625, 1.8446044921875, 2.08465576171875, 2.32470703125, 2.56475830078125, 2.8048095703125, 3.04486083984375, 3.284912109375, 3.52496337890625, 3.7650146484375, 4.00506591796875, 4.2451171875, 4.48516845703125, 4.7252197265625, 4.96527099609375, 5.205322265625, 5.44537353515625, 5.6854248046875, 5.92547607421875, 6.16552734375, 6.40557861328125, 6.6456298828125, 6.88568115234375, 7.125732421875, 7.36578369140625, 7.6058349609375, 7.84588623046875, 8.0859375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 5.0, 0.0, 0.0, 2.0, 2.0, 8.0, 11.0, 3.0, 9.0, 9.0, 10.0, 30.0, 28.0, 27.0, 46.0, 57.0, 54.0, 64.0, 65.0, 75.0, 62.0, 63.0, 66.0, 54.0, 40.0, 42.0, 43.0, 29.0, 27.0, 21.0, 17.0, 11.0, 12.0, 7.0, 6.0, 5.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1015625, -8.6771240234375, -8.252685546875, -7.8282470703125, -7.40380859375, -6.9793701171875, -6.554931640625, -6.1304931640625, -5.7060546875, -5.2816162109375, -4.857177734375, -4.4327392578125, -4.00830078125, -3.5838623046875, -3.159423828125, -2.7349853515625, -2.310546875, -1.8861083984375, -1.461669921875, -1.0372314453125, -0.61279296875, -0.1883544921875, 0.236083984375, 0.6605224609375, 1.0849609375, 1.5093994140625, 1.933837890625, 2.3582763671875, 2.78271484375, 3.2071533203125, 3.631591796875, 4.0560302734375, 4.48046875, 4.9049072265625, 5.329345703125, 5.7537841796875, 6.17822265625, 6.6026611328125, 7.027099609375, 7.4515380859375, 7.8759765625, 8.3004150390625, 8.724853515625, 9.1492919921875, 9.57373046875, 9.9981689453125, 10.422607421875, 10.8470458984375, 11.271484375, 11.6959228515625, 12.120361328125, 12.5447998046875, 12.96923828125, 13.3936767578125, 13.818115234375, 14.2425537109375, 14.6669921875, 15.0914306640625, 15.515869140625, 15.9403076171875, 16.36474609375, 16.7891845703125, 17.213623046875, 17.6380615234375, 18.0625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 1.0, 6.0, 5.0, 4.0, 15.0, 22.0, 36.0, 57.0, 115.0, 267.0, 1150.0, 10152.0, 1002562.0, 31500.0, 1888.0, 419.0, 169.0, 85.0, 46.0, 20.0, 17.0, 7.0, 8.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.984375, -19.234375, -18.484375, -17.734375, -16.984375, -16.234375, -15.484375, -14.734375, -13.984375, -13.234375, -12.484375, -11.734375, -10.984375, -10.234375, -9.484375, -8.734375, -7.984375, -7.234375, -6.484375, -5.734375, -4.984375, -4.234375, -3.484375, -2.734375, -1.984375, -1.234375, -0.484375, 0.265625, 1.015625, 1.765625, 2.515625, 3.265625, 4.015625, 4.765625, 5.515625, 6.265625, 7.015625, 7.765625, 8.515625, 9.265625, 10.015625, 10.765625, 11.515625, 12.265625, 13.015625, 13.765625, 14.515625, 15.265625, 16.015625, 16.765625, 17.515625, 18.265625, 19.015625, 19.765625, 20.515625, 21.265625, 22.015625, 22.765625, 23.515625, 24.265625, 25.015625, 25.765625, 26.515625, 27.265625, 28.015625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 4.0, 16.0, 7.0, 17.0, 28.0, 41.0, 58.0, 109.0, 137.0, 148.0, 143.0, 96.0, 78.0, 31.0, 32.0, 16.0, 9.0, 2.0, 7.0, 7.0, 6.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0011081695556640625, -0.0010814517736434937, -0.0010547339916229248, -0.001028016209602356, -0.0010012984275817871, -0.0009745806455612183, -0.0009478628635406494, -0.0009211450815200806, -0.0008944272994995117, -0.0008677095174789429, -0.000840991735458374, -0.0008142739534378052, -0.0007875561714172363, -0.0007608383893966675, -0.0007341206073760986, -0.0007074028253555298, -0.0006806850433349609, -0.0006539672613143921, -0.0006272494792938232, -0.0006005316972732544, -0.0005738139152526855, -0.0005470961332321167, -0.0005203783512115479, -0.000493660569190979, -0.00046694278717041016, -0.0004402250051498413, -0.00041350722312927246, -0.0003867894411087036, -0.00036007165908813477, -0.0003333538770675659, -0.00030663609504699707, -0.0002799183130264282, -0.0002532005310058594, -0.00022648274898529053, -0.00019976496696472168, -0.00017304718494415283, -0.00014632940292358398, -0.00011961162090301514, -9.289383888244629e-05, -6.617605686187744e-05, -3.9458274841308594e-05, -1.2740492820739746e-05, 1.3977289199829102e-05, 4.069507122039795e-05, 6.74128532409668e-05, 9.413063526153564e-05, 0.00012084841728210449, 0.00014756619930267334, 0.0001742839813232422, 0.00020100176334381104, 0.00022771954536437988, 0.00025443732738494873, 0.0002811551094055176, 0.0003078728914260864, 0.0003345906734466553, 0.0003613084554672241, 0.00038802623748779297, 0.0004147440195083618, 0.00044146180152893066, 0.0004681795835494995, 0.0004948973655700684, 0.0005216151475906372, 0.0005483329296112061, 0.0005750507116317749, 0.0006017684936523438]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 4.0, 4.0, 7.0, 11.0, 15.0, 29.0, 45.0, 96.0, 205.0, 529.0, 1372.0, 4733.0, 36193.0, 893134.0, 101272.0, 7584.0, 2024.0, 765.0, 294.0, 128.0, 51.0, 21.0, 13.0, 11.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.6171875, -11.27197265625, -10.9267578125, -10.58154296875, -10.236328125, -9.89111328125, -9.5458984375, -9.20068359375, -8.85546875, -8.51025390625, -8.1650390625, -7.81982421875, -7.474609375, -7.12939453125, -6.7841796875, -6.43896484375, -6.09375, -5.74853515625, -5.4033203125, -5.05810546875, -4.712890625, -4.36767578125, -4.0224609375, -3.67724609375, -3.33203125, -2.98681640625, -2.6416015625, -2.29638671875, -1.951171875, -1.60595703125, -1.2607421875, -0.91552734375, -0.5703125, -0.22509765625, 0.1201171875, 0.46533203125, 0.810546875, 1.15576171875, 1.5009765625, 1.84619140625, 2.19140625, 2.53662109375, 2.8818359375, 3.22705078125, 3.572265625, 3.91748046875, 4.2626953125, 4.60791015625, 4.953125, 5.29833984375, 5.6435546875, 5.98876953125, 6.333984375, 6.67919921875, 7.0244140625, 7.36962890625, 7.71484375, 8.06005859375, 8.4052734375, 8.75048828125, 9.095703125, 9.44091796875, 9.7861328125, 10.13134765625, 10.4765625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 3.0, 11.0, 10.0, 19.0, 30.0, 74.0, 130.0, 213.0, 225.0, 122.0, 66.0, 30.0, 21.0, 8.0, 10.0, 2.0, 7.0, 6.0, 1.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.5078125, -11.1221923828125, -10.736572265625, -10.3509521484375, -9.96533203125, -9.5797119140625, -9.194091796875, -8.8084716796875, -8.4228515625, -8.0372314453125, -7.651611328125, -7.2659912109375, -6.88037109375, -6.4947509765625, -6.109130859375, -5.7235107421875, -5.337890625, -4.9522705078125, -4.566650390625, -4.1810302734375, -3.79541015625, -3.4097900390625, -3.024169921875, -2.6385498046875, -2.2529296875, -1.8673095703125, -1.481689453125, -1.0960693359375, -0.71044921875, -0.3248291015625, 0.060791015625, 0.4464111328125, 0.83203125, 1.2176513671875, 1.603271484375, 1.9888916015625, 2.37451171875, 2.7601318359375, 3.145751953125, 3.5313720703125, 3.9169921875, 4.3026123046875, 4.688232421875, 5.0738525390625, 5.45947265625, 5.8450927734375, 6.230712890625, 6.6163330078125, 7.001953125, 7.3875732421875, 7.773193359375, 8.1588134765625, 8.54443359375, 8.9300537109375, 9.315673828125, 9.7012939453125, 10.0869140625, 10.4725341796875, 10.858154296875, 11.2437744140625, 11.62939453125, 12.0150146484375, 12.400634765625, 12.7862548828125, 13.171875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 8.0, 16.0, 27.0, 44.0, 71.0, 121.0, 198.0, 202.0, 136.0, 84.0, 50.0, 23.0, 11.0, 9.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-161.56695556640625, -157.62384033203125, -153.6807098388672, -149.7375946044922, -145.79446411132812, -141.85134887695312, -137.90823364257812, -133.96510314941406, -130.02198791503906, -126.07886505126953, -122.1357421875, -118.192626953125, -114.24950408935547, -110.30638122558594, -106.3632583618164, -102.42013549804688, -98.47701263427734, -94.53388977050781, -90.59076690673828, -86.64764404296875, -82.70452880859375, -78.76140594482422, -74.81828308105469, -70.87516021728516, -66.93203735351562, -62.988914489746094, -59.04579544067383, -55.1026725769043, -51.15955352783203, -47.2164306640625, -43.27330780029297, -39.33018493652344, -35.38706970214844, -31.44394874572754, -27.50082778930664, -23.55770492553711, -19.61458396911621, -15.671463012695312, -11.728340148925781, -7.785219192504883, -3.8420982360839844, 0.10102319717407227, 4.044144630432129, 7.987266540527344, 11.930387496948242, 15.87350845336914, 19.816631317138672, 23.75975227355957, 27.70287322998047, 31.645994186401367, 35.589115142822266, 39.5322380065918, 43.47535705566406, 47.418479919433594, 51.361602783203125, 55.304725646972656, 59.24784469604492, 63.19096755981445, 67.13408660888672, 71.07720947265625, 75.02033233642578, 78.96345520019531, 82.90657043457031, 86.84969329833984, 90.79281616210938]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 1.0, 3.0, 2.0, 4.0, 4.0, 6.0, 7.0, 4.0, 9.0, 8.0, 10.0, 16.0, 19.0, 20.0, 27.0, 21.0, 30.0, 37.0, 39.0, 59.0, 49.0, 59.0, 41.0, 50.0, 57.0, 66.0, 41.0, 40.0, 41.0, 37.0, 24.0, 31.0, 26.0, 21.0, 22.0, 12.0, 16.0, 15.0, 9.0, 9.0, 8.0, 0.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.79658508300781, -64.80411529541016, -62.81165313720703, -60.819183349609375, -58.826717376708984, -56.834251403808594, -54.8417854309082, -52.84931945800781, -50.856849670410156, -48.864383697509766, -46.871917724609375, -44.87944793701172, -42.88698196411133, -40.89451599121094, -38.90205001831055, -36.909584045410156, -34.917118072509766, -32.924652099609375, -30.93218421936035, -28.93971824645996, -26.947250366210938, -24.954784393310547, -22.962318420410156, -20.969852447509766, -18.977384567260742, -16.98491859436035, -14.992450714111328, -12.999984741210938, -11.00751781463623, -9.015050888061523, -7.022584915161133, -5.030117988586426, -3.0376548767089844, -1.0451881885528564, 0.9472784996032715, 2.9397449493408203, 4.932211875915527, 6.924678802490234, 8.917144775390625, 10.909611701965332, 12.902078628540039, 14.894545555114746, 16.887012481689453, 18.879478454589844, 20.871944427490234, 22.864412307739258, 24.85687828063965, 26.849346160888672, 28.841812133789062, 30.834278106689453, 32.826744079589844, 34.8192138671875, 36.81167984008789, 38.80414581298828, 40.79661178588867, 42.78907775878906, 44.78154754638672, 46.77401351928711, 48.7664794921875, 50.758949279785156, 52.75141525268555, 54.74388122558594, 56.73634719848633, 58.72881317138672, 60.72127914428711]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 6.0, 3.0, 7.0, 1.0, 11.0, 13.0, 18.0, 21.0, 37.0, 54.0, 81.0, 148.0, 213.0, 479.0, 1095.0, 3102.0, 14801.0, 4131848.0, 34851.0, 4874.0, 1425.0, 552.0, 286.0, 139.0, 80.0, 34.0, 38.0, 21.0, 9.0, 15.0, 8.0, 4.0, 1.0, 2.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.234375, -23.5732421875, -22.912109375, -22.2509765625, -21.58984375, -20.9287109375, -20.267578125, -19.6064453125, -18.9453125, -18.2841796875, -17.623046875, -16.9619140625, -16.30078125, -15.6396484375, -14.978515625, -14.3173828125, -13.65625, -12.9951171875, -12.333984375, -11.6728515625, -11.01171875, -10.3505859375, -9.689453125, -9.0283203125, -8.3671875, -7.7060546875, -7.044921875, -6.3837890625, -5.72265625, -5.0615234375, -4.400390625, -3.7392578125, -3.078125, -2.4169921875, -1.755859375, -1.0947265625, -0.43359375, 0.2275390625, 0.888671875, 1.5498046875, 2.2109375, 2.8720703125, 3.533203125, 4.1943359375, 4.85546875, 5.5166015625, 6.177734375, 6.8388671875, 7.5, 8.1611328125, 8.822265625, 9.4833984375, 10.14453125, 10.8056640625, 11.466796875, 12.1279296875, 12.7890625, 13.4501953125, 14.111328125, 14.7724609375, 15.43359375, 16.0947265625, 16.755859375, 17.4169921875, 18.078125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 5.0, 4.0, 3.0, 4.0, 0.0, 5.0, 4.0, 7.0, 9.0, 18.0, 12.0, 16.0, 16.0, 33.0, 33.0, 43.0, 39.0, 57.0, 61.0, 69.0, 79.0, 50.0, 56.0, 69.0, 52.0, 45.0, 31.0, 42.0, 33.0, 28.0, 19.0, 21.0, 4.0, 8.0, 10.0, 7.0, 7.0, 6.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.943359375, -2.863616943359375, -2.78387451171875, -2.704132080078125, -2.6243896484375, -2.544647216796875, -2.46490478515625, -2.385162353515625, -2.305419921875, -2.225677490234375, -2.14593505859375, -2.066192626953125, -1.9864501953125, -1.906707763671875, -1.82696533203125, -1.747222900390625, -1.66748046875, -1.587738037109375, -1.50799560546875, -1.428253173828125, -1.3485107421875, -1.268768310546875, -1.18902587890625, -1.109283447265625, -1.029541015625, -0.949798583984375, -0.87005615234375, -0.790313720703125, -0.7105712890625, -0.630828857421875, -0.55108642578125, -0.471343994140625, -0.3916015625, -0.311859130859375, -0.23211669921875, -0.152374267578125, -0.0726318359375, 0.007110595703125, 0.08685302734375, 0.166595458984375, 0.246337890625, 0.326080322265625, 0.40582275390625, 0.485565185546875, 0.5653076171875, 0.645050048828125, 0.72479248046875, 0.804534912109375, 0.88427734375, 0.964019775390625, 1.04376220703125, 1.123504638671875, 1.2032470703125, 1.282989501953125, 1.36273193359375, 1.442474365234375, 1.522216796875, 1.601959228515625, 1.68170166015625, 1.761444091796875, 1.8411865234375, 1.920928955078125, 2.00067138671875, 2.080413818359375, 2.16015625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 4.0, 7.0, 4.0, 8.0, 9.0, 9.0, 13.0, 19.0, 27.0, 34.0, 58.0, 54.0, 67.0, 94.0, 123.0, 171.0, 241.0, 279.0, 439.0, 586.0, 902.0, 1245.0, 2144.0, 3376.0, 6464.0, 14350.0, 51175.0, 3920379.0, 147577.0, 23570.0, 8789.0, 4341.0, 2555.0, 1611.0, 1006.0, 680.0, 483.0, 324.0, 242.0, 208.0, 121.0, 99.0, 99.0, 73.0, 55.0, 49.0, 32.0, 22.0, 17.0, 24.0, 7.0, 10.0, 4.0, 3.0, 5.0, 6.0, 2.0, 2.0, 0.0, 1.0], "bins": [-10.265625, -9.9420166015625, -9.618408203125, -9.2947998046875, -8.97119140625, -8.6475830078125, -8.323974609375, -8.0003662109375, -7.6767578125, -7.3531494140625, -7.029541015625, -6.7059326171875, -6.38232421875, -6.0587158203125, -5.735107421875, -5.4114990234375, -5.087890625, -4.7642822265625, -4.440673828125, -4.1170654296875, -3.79345703125, -3.4698486328125, -3.146240234375, -2.8226318359375, -2.4990234375, -2.1754150390625, -1.851806640625, -1.5281982421875, -1.20458984375, -0.8809814453125, -0.557373046875, -0.2337646484375, 0.08984375, 0.4134521484375, 0.737060546875, 1.0606689453125, 1.38427734375, 1.7078857421875, 2.031494140625, 2.3551025390625, 2.6787109375, 3.0023193359375, 3.325927734375, 3.6495361328125, 3.97314453125, 4.2967529296875, 4.620361328125, 4.9439697265625, 5.267578125, 5.5911865234375, 5.914794921875, 6.2384033203125, 6.56201171875, 6.8856201171875, 7.209228515625, 7.5328369140625, 7.8564453125, 8.1800537109375, 8.503662109375, 8.8272705078125, 9.15087890625, 9.4744873046875, 9.798095703125, 10.1217041015625, 10.4453125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 2.0, 5.0, 3.0, 1.0, 3.0, 8.0, 13.0, 16.0, 29.0, 52.0, 173.0, 3371.0, 240.0, 64.0, 32.0, 18.0, 9.0, 8.0, 5.0, 9.0, 2.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.1953125, -4.08648681640625, -3.9776611328125, -3.86883544921875, -3.760009765625, -3.65118408203125, -3.5423583984375, -3.43353271484375, -3.32470703125, -3.21588134765625, -3.1070556640625, -2.99822998046875, -2.889404296875, -2.78057861328125, -2.6717529296875, -2.56292724609375, -2.4541015625, -2.34527587890625, -2.2364501953125, -2.12762451171875, -2.018798828125, -1.90997314453125, -1.8011474609375, -1.69232177734375, -1.58349609375, -1.47467041015625, -1.3658447265625, -1.25701904296875, -1.148193359375, -1.03936767578125, -0.9305419921875, -0.82171630859375, -0.712890625, -0.60406494140625, -0.4952392578125, -0.38641357421875, -0.277587890625, -0.16876220703125, -0.0599365234375, 0.04888916015625, 0.15771484375, 0.26654052734375, 0.3753662109375, 0.48419189453125, 0.593017578125, 0.70184326171875, 0.8106689453125, 0.91949462890625, 1.0283203125, 1.13714599609375, 1.2459716796875, 1.35479736328125, 1.463623046875, 1.57244873046875, 1.6812744140625, 1.79010009765625, 1.89892578125, 2.00775146484375, 2.1165771484375, 2.22540283203125, 2.334228515625, 2.44305419921875, 2.5518798828125, 2.66070556640625, 2.76953125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 8.0, 10.0, 30.0, 41.0, 58.0, 90.0, 143.0, 191.0, 160.0, 125.0, 77.0, 29.0, 20.0, 8.0, 9.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.60069465637207, -27.964872360229492, -27.32904815673828, -26.693225860595703, -26.057403564453125, -25.421579360961914, -24.785757064819336, -24.149932861328125, -23.514110565185547, -22.87828826904297, -22.242464065551758, -21.60664176940918, -20.9708194732666, -20.33499526977539, -19.699172973632812, -19.063350677490234, -18.427528381347656, -17.791706085205078, -17.155881881713867, -16.52005958557129, -15.884236335754395, -15.2484130859375, -14.612590789794922, -13.976767539978027, -13.340944290161133, -12.705121040344238, -12.06929874420166, -11.433475494384766, -10.797652244567871, -10.161828994750977, -9.526006698608398, -8.890183448791504, -8.25436019897461, -7.618537425994873, -6.9827141761779785, -6.346891403198242, -5.711068153381348, -5.075245380401611, -4.439422607421875, -3.8035993576049805, -3.167776584625244, -2.5319535732269287, -1.8961306810379028, -1.260307788848877, -0.6244847774505615, 0.011338233947753906, 0.6471610069274902, 1.2829842567443848, 1.918807029724121, 2.5546300411224365, 3.190453052520752, 3.8262758255004883, 4.462099075317383, 5.097921848297119, 5.7337446212768555, 6.36956787109375, 7.005390644073486, 7.641213417053223, 8.277036666870117, 8.912858963012695, 9.54868221282959, 10.184505462646484, 10.820327758789062, 11.456151962280273, 12.091974258422852]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 4.0, 3.0, 5.0, 2.0, 8.0, 6.0, 13.0, 8.0, 17.0, 8.0, 17.0, 27.0, 26.0, 23.0, 22.0, 39.0, 39.0, 46.0, 43.0, 38.0, 37.0, 31.0, 56.0, 44.0, 45.0, 37.0, 37.0, 30.0, 40.0, 22.0, 36.0, 31.0, 20.0, 23.0, 25.0, 14.0, 20.0, 20.0, 6.0, 5.0, 8.0, 9.0, 4.0, 5.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.977933883666992, -6.733251094818115, -6.488568305969238, -6.243885517120361, -5.999202728271484, -5.754519939422607, -5.5098371505737305, -5.265154838562012, -5.020471572875977, -4.7757887840271, -4.531105995178223, -4.286423206329346, -4.041740417480469, -3.797057628631592, -3.552375078201294, -3.307692289352417, -3.063009738922119, -2.818326950073242, -2.5736441612243652, -2.3289613723754883, -2.0842785835266113, -1.839595913887024, -1.5949132442474365, -1.3502304553985596, -1.1055476665496826, -0.8608648777008057, -0.6161821484565735, -0.3714994192123413, -0.12681663036346436, 0.1178661584854126, 0.362548828125, 0.607231616973877, 0.8519144058227539, 1.0965971946716309, 1.3412799835205078, 1.5859626531600952, 1.8306454420089722, 2.0753283500671387, 2.3200109004974365, 2.5646936893463135, 2.8093764781951904, 3.0540592670440674, 3.2987420558929443, 3.543424606323242, 3.788107395172119, 4.032790184020996, 4.277472972869873, 4.52215576171875, 4.766838550567627, 5.011521339416504, 5.256204128265381, 5.500886917114258, 5.745569705963135, 5.990252494812012, 6.2349348068237305, 6.479618072509766, 6.724300384521484, 6.968983173370361, 7.213665962219238, 7.458348751068115, 7.703031539916992, 7.947714328765869, 8.192397117614746, 8.437079429626465, 8.6817626953125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 9.0, 7.0, 17.0, 13.0, 28.0, 38.0, 43.0, 90.0, 121.0, 165.0, 316.0, 460.0, 853.0, 1482.0, 2908.0, 5766.0, 12194.0, 27774.0, 68676.0, 194655.0, 408165.0, 201181.0, 70299.0, 28286.0, 12450.0, 5829.0, 3032.0, 1585.0, 817.0, 473.0, 295.0, 191.0, 117.0, 69.0, 50.0, 22.0, 26.0, 17.0, 12.0, 12.0, 6.0, 4.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.89453125, -6.69476318359375, -6.4949951171875, -6.29522705078125, -6.095458984375, -5.89569091796875, -5.6959228515625, -5.49615478515625, -5.29638671875, -5.09661865234375, -4.8968505859375, -4.69708251953125, -4.497314453125, -4.29754638671875, -4.0977783203125, -3.89801025390625, -3.6982421875, -3.49847412109375, -3.2987060546875, -3.09893798828125, -2.899169921875, -2.69940185546875, -2.4996337890625, -2.29986572265625, -2.10009765625, -1.90032958984375, -1.7005615234375, -1.50079345703125, -1.301025390625, -1.10125732421875, -0.9014892578125, -0.70172119140625, -0.501953125, -0.30218505859375, -0.1024169921875, 0.09735107421875, 0.297119140625, 0.49688720703125, 0.6966552734375, 0.89642333984375, 1.09619140625, 1.29595947265625, 1.4957275390625, 1.69549560546875, 1.895263671875, 2.09503173828125, 2.2947998046875, 2.49456787109375, 2.6943359375, 2.89410400390625, 3.0938720703125, 3.29364013671875, 3.493408203125, 3.69317626953125, 3.8929443359375, 4.09271240234375, 4.29248046875, 4.49224853515625, 4.6920166015625, 4.89178466796875, 5.091552734375, 5.29132080078125, 5.4910888671875, 5.69085693359375, 5.890625]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 6.0, 6.0, 8.0, 4.0, 10.0, 12.0, 17.0, 14.0, 31.0, 27.0, 28.0, 39.0, 53.0, 50.0, 53.0, 56.0, 72.0, 75.0, 68.0, 61.0, 63.0, 42.0, 37.0, 24.0, 21.0, 31.0, 20.0, 15.0, 14.0, 15.0, 6.0, 5.0, 6.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.89453125, -2.808990478515625, -2.72344970703125, -2.637908935546875, -2.5523681640625, -2.466827392578125, -2.38128662109375, -2.295745849609375, -2.210205078125, -2.124664306640625, -2.03912353515625, -1.953582763671875, -1.8680419921875, -1.782501220703125, -1.69696044921875, -1.611419677734375, -1.52587890625, -1.440338134765625, -1.35479736328125, -1.269256591796875, -1.1837158203125, -1.098175048828125, -1.01263427734375, -0.927093505859375, -0.841552734375, -0.756011962890625, -0.67047119140625, -0.584930419921875, -0.4993896484375, -0.413848876953125, -0.32830810546875, -0.242767333984375, -0.1572265625, -0.071685791015625, 0.01385498046875, 0.099395751953125, 0.1849365234375, 0.270477294921875, 0.35601806640625, 0.441558837890625, 0.527099609375, 0.612640380859375, 0.69818115234375, 0.783721923828125, 0.8692626953125, 0.954803466796875, 1.04034423828125, 1.125885009765625, 1.21142578125, 1.296966552734375, 1.38250732421875, 1.468048095703125, 1.5535888671875, 1.639129638671875, 1.72467041015625, 1.810211181640625, 1.895751953125, 1.981292724609375, 2.06683349609375, 2.152374267578125, 2.2379150390625, 2.323455810546875, 2.40899658203125, 2.494537353515625, 2.580078125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 2.0, 7.0, 13.0, 9.0, 15.0, 35.0, 48.0, 83.0, 124.0, 308.0, 761.0, 2046.0, 7790.0, 41056.0, 460571.0, 481695.0, 42445.0, 8032.0, 2150.0, 680.0, 291.0, 134.0, 84.0, 60.0, 29.0, 35.0, 11.0, 14.0, 10.0, 5.0, 1.0, 7.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-19.703125, -19.22265625, -18.7421875, -18.26171875, -17.78125, -17.30078125, -16.8203125, -16.33984375, -15.859375, -15.37890625, -14.8984375, -14.41796875, -13.9375, -13.45703125, -12.9765625, -12.49609375, -12.015625, -11.53515625, -11.0546875, -10.57421875, -10.09375, -9.61328125, -9.1328125, -8.65234375, -8.171875, -7.69140625, -7.2109375, -6.73046875, -6.25, -5.76953125, -5.2890625, -4.80859375, -4.328125, -3.84765625, -3.3671875, -2.88671875, -2.40625, -1.92578125, -1.4453125, -0.96484375, -0.484375, -0.00390625, 0.4765625, 0.95703125, 1.4375, 1.91796875, 2.3984375, 2.87890625, 3.359375, 3.83984375, 4.3203125, 4.80078125, 5.28125, 5.76171875, 6.2421875, 6.72265625, 7.203125, 7.68359375, 8.1640625, 8.64453125, 9.125, 9.60546875, 10.0859375, 10.56640625, 11.046875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 6.0, 5.0, 6.0, 8.0, 21.0, 13.0, 17.0, 20.0, 23.0, 26.0, 27.0, 33.0, 27.0, 53.0, 50.0, 47.0, 59.0, 40.0, 51.0, 42.0, 36.0, 43.0, 41.0, 54.0, 39.0, 36.0, 27.0, 17.0, 23.0, 25.0, 13.0, 13.0, 10.0, 6.0, 9.0, 9.0, 4.0, 4.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.4453125, -12.058837890625, -11.67236328125, -11.285888671875, -10.8994140625, -10.512939453125, -10.12646484375, -9.739990234375, -9.353515625, -8.967041015625, -8.58056640625, -8.194091796875, -7.8076171875, -7.421142578125, -7.03466796875, -6.648193359375, -6.26171875, -5.875244140625, -5.48876953125, -5.102294921875, -4.7158203125, -4.329345703125, -3.94287109375, -3.556396484375, -3.169921875, -2.783447265625, -2.39697265625, -2.010498046875, -1.6240234375, -1.237548828125, -0.85107421875, -0.464599609375, -0.078125, 0.308349609375, 0.69482421875, 1.081298828125, 1.4677734375, 1.854248046875, 2.24072265625, 2.627197265625, 3.013671875, 3.400146484375, 3.78662109375, 4.173095703125, 4.5595703125, 4.946044921875, 5.33251953125, 5.718994140625, 6.10546875, 6.491943359375, 6.87841796875, 7.264892578125, 7.6513671875, 8.037841796875, 8.42431640625, 8.810791015625, 9.197265625, 9.583740234375, 9.97021484375, 10.356689453125, 10.7431640625, 11.129638671875, 11.51611328125, 11.902587890625, 12.2890625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 0.0, 5.0, 9.0, 9.0, 11.0, 21.0, 24.0, 43.0, 42.0, 90.0, 116.0, 182.0, 294.0, 586.0, 1190.0, 3218.0, 13153.0, 116395.0, 811553.0, 85442.0, 10849.0, 2955.0, 1143.0, 490.0, 267.0, 179.0, 87.0, 59.0, 37.0, 29.0, 31.0, 8.0, 13.0, 8.0, 7.0, 8.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3671875, -8.11700439453125, -7.8668212890625, -7.61663818359375, -7.366455078125, -7.11627197265625, -6.8660888671875, -6.61590576171875, -6.36572265625, -6.11553955078125, -5.8653564453125, -5.61517333984375, -5.364990234375, -5.11480712890625, -4.8646240234375, -4.61444091796875, -4.3642578125, -4.11407470703125, -3.8638916015625, -3.61370849609375, -3.363525390625, -3.11334228515625, -2.8631591796875, -2.61297607421875, -2.36279296875, -2.11260986328125, -1.8624267578125, -1.61224365234375, -1.362060546875, -1.11187744140625, -0.8616943359375, -0.61151123046875, -0.361328125, -0.11114501953125, 0.1390380859375, 0.38922119140625, 0.639404296875, 0.88958740234375, 1.1397705078125, 1.38995361328125, 1.64013671875, 1.89031982421875, 2.1405029296875, 2.39068603515625, 2.640869140625, 2.89105224609375, 3.1412353515625, 3.39141845703125, 3.6416015625, 3.89178466796875, 4.1419677734375, 4.39215087890625, 4.642333984375, 4.89251708984375, 5.1427001953125, 5.39288330078125, 5.64306640625, 5.89324951171875, 6.1434326171875, 6.39361572265625, 6.643798828125, 6.89398193359375, 7.1441650390625, 7.39434814453125, 7.64453125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 2.0, 5.0, 5.0, 12.0, 22.0, 22.0, 25.0, 37.0, 64.0, 90.0, 98.0, 124.0, 112.0, 100.0, 94.0, 60.0, 34.0, 21.0, 22.0, 17.0, 11.0, 8.0, 6.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0011615753173828125, -0.0011324509978294373, -0.001103326678276062, -0.0010742023587226868, -0.0010450780391693115, -0.0010159537196159363, -0.000986829400062561, -0.0009577050805091858, -0.0009285807609558105, -0.0008994564414024353, -0.0008703321218490601, -0.0008412078022956848, -0.0008120834827423096, -0.0007829591631889343, -0.0007538348436355591, -0.0007247105240821838, -0.0006955862045288086, -0.0006664618849754333, -0.0006373375654220581, -0.0006082132458686829, -0.0005790889263153076, -0.0005499646067619324, -0.0005208402872085571, -0.0004917159676551819, -0.00046259164810180664, -0.0004334673285484314, -0.00040434300899505615, -0.0003752186894416809, -0.00034609436988830566, -0.0003169700503349304, -0.0002878457307815552, -0.00025872141122817993, -0.0002295970916748047, -0.00020047277212142944, -0.0001713484525680542, -0.00014222413301467896, -0.00011309981346130371, -8.397549390792847e-05, -5.485117435455322e-05, -2.572685480117798e-05, 3.3974647521972656e-06, 3.252178430557251e-05, 6.164610385894775e-05, 9.0770423412323e-05, 0.00011989474296569824, 0.00014901906251907349, 0.00017814338207244873, 0.00020726770162582397, 0.00023639202117919922, 0.00026551634073257446, 0.0002946406602859497, 0.00032376497983932495, 0.0003528892993927002, 0.00038201361894607544, 0.0004111379384994507, 0.00044026225805282593, 0.00046938657760620117, 0.0004985108971595764, 0.0005276352167129517, 0.0005567595362663269, 0.0005858838558197021, 0.0006150081753730774, 0.0006441324949264526, 0.0006732568144798279, 0.0007023811340332031]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 4.0, 6.0, 5.0, 14.0, 12.0, 28.0, 38.0, 59.0, 121.0, 202.0, 408.0, 841.0, 2146.0, 6469.0, 34596.0, 630993.0, 341956.0, 22387.0, 4983.0, 1795.0, 740.0, 303.0, 153.0, 108.0, 58.0, 46.0, 28.0, 19.0, 18.0, 4.0, 2.0, 3.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-7.7421875, -7.4742431640625, -7.206298828125, -6.9383544921875, -6.67041015625, -6.4024658203125, -6.134521484375, -5.8665771484375, -5.5986328125, -5.3306884765625, -5.062744140625, -4.7947998046875, -4.52685546875, -4.2589111328125, -3.990966796875, -3.7230224609375, -3.455078125, -3.1871337890625, -2.919189453125, -2.6512451171875, -2.38330078125, -2.1153564453125, -1.847412109375, -1.5794677734375, -1.3115234375, -1.0435791015625, -0.775634765625, -0.5076904296875, -0.23974609375, 0.0281982421875, 0.296142578125, 0.5640869140625, 0.83203125, 1.0999755859375, 1.367919921875, 1.6358642578125, 1.90380859375, 2.1717529296875, 2.439697265625, 2.7076416015625, 2.9755859375, 3.2435302734375, 3.511474609375, 3.7794189453125, 4.04736328125, 4.3153076171875, 4.583251953125, 4.8511962890625, 5.119140625, 5.3870849609375, 5.655029296875, 5.9229736328125, 6.19091796875, 6.4588623046875, 6.726806640625, 6.9947509765625, 7.2626953125, 7.5306396484375, 7.798583984375, 8.0665283203125, 8.33447265625, 8.6024169921875, 8.870361328125, 9.1383056640625, 9.40625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 6.0, 0.0, 4.0, 3.0, 6.0, 10.0, 10.0, 16.0, 16.0, 26.0, 27.0, 40.0, 64.0, 68.0, 102.0, 101.0, 87.0, 94.0, 79.0, 61.0, 44.0, 40.0, 20.0, 31.0, 14.0, 11.0, 7.0, 3.0, 8.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-6.8359375, -6.6517333984375, -6.467529296875, -6.2833251953125, -6.09912109375, -5.9149169921875, -5.730712890625, -5.5465087890625, -5.3623046875, -5.1781005859375, -4.993896484375, -4.8096923828125, -4.62548828125, -4.4412841796875, -4.257080078125, -4.0728759765625, -3.888671875, -3.7044677734375, -3.520263671875, -3.3360595703125, -3.15185546875, -2.9676513671875, -2.783447265625, -2.5992431640625, -2.4150390625, -2.2308349609375, -2.046630859375, -1.8624267578125, -1.67822265625, -1.4940185546875, -1.309814453125, -1.1256103515625, -0.94140625, -0.7572021484375, -0.572998046875, -0.3887939453125, -0.20458984375, -0.0203857421875, 0.163818359375, 0.3480224609375, 0.5322265625, 0.7164306640625, 0.900634765625, 1.0848388671875, 1.26904296875, 1.4532470703125, 1.637451171875, 1.8216552734375, 2.005859375, 2.1900634765625, 2.374267578125, 2.5584716796875, 2.74267578125, 2.9268798828125, 3.111083984375, 3.2952880859375, 3.4794921875, 3.6636962890625, 3.847900390625, 4.0321044921875, 4.21630859375, 4.4005126953125, 4.584716796875, 4.7689208984375, 4.953125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 12.0, 24.0, 67.0, 105.0, 212.0, 249.0, 169.0, 92.0, 42.0, 21.0, 5.0, 5.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-189.49513244628906, -184.24549865722656, -178.99588012695312, -173.74624633789062, -168.4966278076172, -163.2469940185547, -157.99737548828125, -152.74774169921875, -147.49810791015625, -142.24847412109375, -136.9988555908203, -131.7492218017578, -126.49960327148438, -121.24996948242188, -116.0003433227539, -110.75071716308594, -105.5010986328125, -100.25147247314453, -95.00184631347656, -89.7522201538086, -84.50259399414062, -79.25296020507812, -74.00333404541016, -68.75370788574219, -63.50408172607422, -58.25445556640625, -53.00482940673828, -47.75519943237305, -42.50557327270508, -37.25594711303711, -32.006317138671875, -26.756690979003906, -21.507080078125, -16.25745391845703, -11.00782585144043, -5.7581987380981445, -0.5085716247558594, 4.741054534912109, 9.990682601928711, 15.240310668945312, 20.48993682861328, 25.73956298828125, 30.98919105529785, 36.23881912231445, 41.48844528198242, 46.73807144165039, 51.987701416015625, 57.237327575683594, 62.48695373535156, 67.73657989501953, 72.9862060546875, 78.23583221435547, 83.48545837402344, 88.73509216308594, 93.9847183227539, 99.23434448242188, 104.48397064208984, 109.73359680175781, 114.98322296142578, 120.23284912109375, 125.48248291015625, 130.7321014404297, 135.9817352294922, 141.23135375976562, 146.48098754882812]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 7.0, 4.0, 6.0, 4.0, 9.0, 13.0, 15.0, 15.0, 21.0, 19.0, 23.0, 21.0, 18.0, 42.0, 33.0, 48.0, 41.0, 49.0, 43.0, 49.0, 55.0, 48.0, 55.0, 49.0, 33.0, 41.0, 33.0, 37.0, 37.0, 25.0, 24.0, 12.0, 19.0, 14.0, 8.0, 12.0, 3.0, 6.0, 2.0, 5.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.035037994384766, -58.16160583496094, -56.288177490234375, -54.41474533081055, -52.541316986083984, -50.667884826660156, -48.794456481933594, -46.921024322509766, -45.04759216308594, -43.17416000366211, -41.30073165893555, -39.42729949951172, -37.553871154785156, -35.68043899536133, -33.8070068359375, -31.933578491210938, -30.060150146484375, -28.18671989440918, -26.313289642333984, -24.439857482910156, -22.566429138183594, -20.692996978759766, -18.81956672668457, -16.946136474609375, -15.07270622253418, -13.199275970458984, -11.325845718383789, -9.452414512634277, -7.578984260559082, -5.705554008483887, -3.832122802734375, -1.9586925506591797, -0.08525848388671875, 1.7881720066070557, 3.66160249710083, 5.535033226013184, 7.408463478088379, 9.281893730163574, 11.155324935913086, 13.028755187988281, 14.902185440063477, 16.775615692138672, 18.649045944213867, 20.522476196289062, 22.39590835571289, 24.269336700439453, 26.14276885986328, 28.016199111938477, 29.889629364013672, 31.763059616088867, 33.63648986816406, 35.50992202758789, 37.38335037231445, 39.25678253173828, 41.130210876464844, 43.00364303588867, 44.8770751953125, 46.75050735473633, 48.62393569946289, 50.49736785888672, 52.37079620361328, 54.24422836303711, 56.11766052246094, 57.9910888671875, 59.86451721191406]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 11.0, 8.0, 13.0, 24.0, 31.0, 71.0, 140.0, 281.0, 680.0, 2494.0, 45764.0, 4139747.0, 3503.0, 880.0, 313.0, 142.0, 75.0, 43.0, 23.0, 12.0, 11.0, 3.0, 4.0, 3.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-53.78125, -52.533203125, -51.28515625, -50.037109375, -48.7890625, -47.541015625, -46.29296875, -45.044921875, -43.796875, -42.548828125, -41.30078125, -40.052734375, -38.8046875, -37.556640625, -36.30859375, -35.060546875, -33.8125, -32.564453125, -31.31640625, -30.068359375, -28.8203125, -27.572265625, -26.32421875, -25.076171875, -23.828125, -22.580078125, -21.33203125, -20.083984375, -18.8359375, -17.587890625, -16.33984375, -15.091796875, -13.84375, -12.595703125, -11.34765625, -10.099609375, -8.8515625, -7.603515625, -6.35546875, -5.107421875, -3.859375, -2.611328125, -1.36328125, -0.115234375, 1.1328125, 2.380859375, 3.62890625, 4.876953125, 6.125, 7.373046875, 8.62109375, 9.869140625, 11.1171875, 12.365234375, 13.61328125, 14.861328125, 16.109375, 17.357421875, 18.60546875, 19.853515625, 21.1015625, 22.349609375, 23.59765625, 24.845703125, 26.09375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 4.0, 4.0, 7.0, 5.0, 8.0, 9.0, 10.0, 11.0, 23.0, 20.0, 37.0, 52.0, 59.0, 59.0, 63.0, 82.0, 67.0, 75.0, 66.0, 66.0, 66.0, 60.0, 19.0, 24.0, 17.0, 22.0, 25.0, 10.0, 5.0, 12.0, 7.0, 2.0, 1.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.947265625, -3.833465576171875, -3.71966552734375, -3.605865478515625, -3.4920654296875, -3.378265380859375, -3.26446533203125, -3.150665283203125, -3.036865234375, -2.923065185546875, -2.80926513671875, -2.695465087890625, -2.5816650390625, -2.467864990234375, -2.35406494140625, -2.240264892578125, -2.12646484375, -2.012664794921875, -1.89886474609375, -1.785064697265625, -1.6712646484375, -1.557464599609375, -1.44366455078125, -1.329864501953125, -1.216064453125, -1.102264404296875, -0.98846435546875, -0.874664306640625, -0.7608642578125, -0.647064208984375, -0.53326416015625, -0.419464111328125, -0.3056640625, -0.191864013671875, -0.07806396484375, 0.035736083984375, 0.1495361328125, 0.263336181640625, 0.37713623046875, 0.490936279296875, 0.604736328125, 0.718536376953125, 0.83233642578125, 0.946136474609375, 1.0599365234375, 1.173736572265625, 1.28753662109375, 1.401336669921875, 1.51513671875, 1.628936767578125, 1.74273681640625, 1.856536865234375, 1.9703369140625, 2.084136962890625, 2.19793701171875, 2.311737060546875, 2.425537109375, 2.539337158203125, 2.65313720703125, 2.766937255859375, 2.8807373046875, 2.994537353515625, 3.10833740234375, 3.222137451171875, 3.3359375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 7.0, 4.0, 7.0, 12.0, 17.0, 23.0, 23.0, 42.0, 36.0, 51.0, 102.0, 123.0, 178.0, 222.0, 319.0, 449.0, 636.0, 853.0, 1327.0, 1953.0, 3427.0, 6679.0, 18890.0, 3973290.0, 156936.0, 14272.0, 5597.0, 2923.0, 1740.0, 1135.0, 831.0, 643.0, 419.0, 285.0, 206.0, 165.0, 117.0, 93.0, 74.0, 57.0, 38.0, 27.0, 16.0, 18.0, 7.0, 4.0, 4.0, 2.0, 5.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.515625, -12.1351318359375, -11.754638671875, -11.3741455078125, -10.99365234375, -10.6131591796875, -10.232666015625, -9.8521728515625, -9.4716796875, -9.0911865234375, -8.710693359375, -8.3302001953125, -7.94970703125, -7.5692138671875, -7.188720703125, -6.8082275390625, -6.427734375, -6.0472412109375, -5.666748046875, -5.2862548828125, -4.90576171875, -4.5252685546875, -4.144775390625, -3.7642822265625, -3.3837890625, -3.0032958984375, -2.622802734375, -2.2423095703125, -1.86181640625, -1.4813232421875, -1.100830078125, -0.7203369140625, -0.33984375, 0.0406494140625, 0.421142578125, 0.8016357421875, 1.18212890625, 1.5626220703125, 1.943115234375, 2.3236083984375, 2.7041015625, 3.0845947265625, 3.465087890625, 3.8455810546875, 4.22607421875, 4.6065673828125, 4.987060546875, 5.3675537109375, 5.748046875, 6.1285400390625, 6.509033203125, 6.8895263671875, 7.27001953125, 7.6505126953125, 8.031005859375, 8.4114990234375, 8.7919921875, 9.1724853515625, 9.552978515625, 9.9334716796875, 10.31396484375, 10.6944580078125, 11.074951171875, 11.4554443359375, 11.8359375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 3.0, 2.0, 1.0, 4.0, 6.0, 7.0, 4.0, 13.0, 15.0, 14.0, 65.0, 3606.0, 240.0, 47.0, 15.0, 7.0, 6.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.248046875, -3.14593505859375, -3.0438232421875, -2.94171142578125, -2.839599609375, -2.73748779296875, -2.6353759765625, -2.53326416015625, -2.43115234375, -2.32904052734375, -2.2269287109375, -2.12481689453125, -2.022705078125, -1.92059326171875, -1.8184814453125, -1.71636962890625, -1.6142578125, -1.51214599609375, -1.4100341796875, -1.30792236328125, -1.205810546875, -1.10369873046875, -1.0015869140625, -0.89947509765625, -0.79736328125, -0.69525146484375, -0.5931396484375, -0.49102783203125, -0.388916015625, -0.28680419921875, -0.1846923828125, -0.08258056640625, 0.01953125, 0.12164306640625, 0.2237548828125, 0.32586669921875, 0.427978515625, 0.53009033203125, 0.6322021484375, 0.73431396484375, 0.83642578125, 0.93853759765625, 1.0406494140625, 1.14276123046875, 1.244873046875, 1.34698486328125, 1.4490966796875, 1.55120849609375, 1.6533203125, 1.75543212890625, 1.8575439453125, 1.95965576171875, 2.061767578125, 2.16387939453125, 2.2659912109375, 2.36810302734375, 2.47021484375, 2.57232666015625, 2.6744384765625, 2.77655029296875, 2.878662109375, 2.98077392578125, 3.0828857421875, 3.18499755859375, 3.287109375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 10.0, 16.0, 9.0, 25.0, 53.0, 63.0, 97.0, 143.0, 164.0, 161.0, 107.0, 69.0, 37.0, 25.0, 10.0, 8.0, 2.0, 3.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.264812469482422, -17.76633644104004, -17.267860412597656, -16.769384384155273, -16.270906448364258, -15.772430419921875, -15.273954391479492, -14.77547836303711, -14.277002334594727, -13.778526306152344, -13.280049324035645, -12.781573295593262, -12.283097267150879, -11.78462028503418, -11.286144256591797, -10.787668228149414, -10.289192199707031, -9.790716171264648, -9.29223918914795, -8.793763160705566, -8.295287132263184, -7.796810626983643, -7.298334121704102, -6.799858093261719, -6.3013811111450195, -5.8029046058654785, -5.304428577423096, -4.805952072143555, -4.307476043701172, -3.808999538421631, -3.310523271560669, -2.812047004699707, -2.313570976257324, -1.8150947093963623, -1.3166184425354004, -0.8181420564651489, -0.319665789604187, 0.17881059646606445, 0.6772868633270264, 1.1757631301879883, 1.6742393970489502, 2.172715663909912, 2.671191930770874, 3.169668197631836, 3.668144702911377, 4.166621208190918, 4.665097236633301, 5.163573265075684, 5.662049770355225, 6.160526275634766, 6.659002304077148, 7.1574788093566895, 7.655954837799072, 8.154431343078613, 8.652907371520996, 9.151384353637695, 9.649860382080078, 10.148336410522461, 10.64681339263916, 11.145289421081543, 11.643765449523926, 12.142242431640625, 12.640718460083008, 13.13919448852539, 13.637670516967773]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 7.0, 1.0, 5.0, 3.0, 9.0, 7.0, 9.0, 7.0, 15.0, 14.0, 16.0, 20.0, 31.0, 29.0, 34.0, 44.0, 45.0, 33.0, 44.0, 43.0, 43.0, 42.0, 41.0, 44.0, 49.0, 37.0, 33.0, 40.0, 45.0, 30.0, 26.0, 25.0, 23.0, 21.0, 14.0, 12.0, 16.0, 10.0, 6.0, 9.0, 9.0, 5.0, 4.0, 4.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.868834495544434, -5.685405731201172, -5.50197696685791, -5.318548202514648, -5.135119438171387, -4.951690673828125, -4.768261909484863, -4.584833145141602, -4.40140438079834, -4.217975616455078, -4.034546852111816, -3.8511180877685547, -3.667689323425293, -3.4842605590820312, -3.3008315563201904, -3.1174027919769287, -2.933973789215088, -2.750545024871826, -2.5671162605285645, -2.3836874961853027, -2.200258731842041, -2.0168299674987793, -1.8334009647369385, -1.6499722003936768, -1.466543436050415, -1.2831146717071533, -1.0996859073638916, -0.9162570238113403, -0.7328282594680786, -0.5493994951248169, -0.3659706115722656, -0.1825418472290039, 0.0008864402770996094, 0.18431523442268372, 0.3677440285682678, 0.5511728525161743, 0.734601616859436, 0.9180303812026978, 1.101459264755249, 1.2848880290985107, 1.4683167934417725, 1.6517455577850342, 1.835174322128296, 2.0186033248901367, 2.2020320892333984, 2.38546085357666, 2.568889617919922, 2.7523183822631836, 2.9357471466064453, 3.119175910949707, 3.3026046752929688, 3.4860334396362305, 3.669462203979492, 3.852890968322754, 4.036319732666016, 4.219748497009277, 4.403177261352539, 4.586606025695801, 4.7700347900390625, 4.953463554382324, 5.136892318725586, 5.320321083068848, 5.503749847412109, 5.687178611755371, 5.870607852935791]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 3.0, 7.0, 7.0, 21.0, 22.0, 31.0, 41.0, 79.0, 114.0, 172.0, 328.0, 501.0, 1028.0, 2097.0, 4898.0, 13427.0, 46217.0, 215392.0, 564336.0, 147565.0, 33723.0, 10617.0, 4025.0, 1771.0, 901.0, 478.0, 278.0, 174.0, 98.0, 65.0, 40.0, 25.0, 19.0, 12.0, 9.0, 4.0, 9.0, 6.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.640625, -9.3233642578125, -9.006103515625, -8.6888427734375, -8.37158203125, -8.0543212890625, -7.737060546875, -7.4197998046875, -7.1025390625, -6.7852783203125, -6.468017578125, -6.1507568359375, -5.83349609375, -5.5162353515625, -5.198974609375, -4.8817138671875, -4.564453125, -4.2471923828125, -3.929931640625, -3.6126708984375, -3.29541015625, -2.9781494140625, -2.660888671875, -2.3436279296875, -2.0263671875, -1.7091064453125, -1.391845703125, -1.0745849609375, -0.75732421875, -0.4400634765625, -0.122802734375, 0.1944580078125, 0.51171875, 0.8289794921875, 1.146240234375, 1.4635009765625, 1.78076171875, 2.0980224609375, 2.415283203125, 2.7325439453125, 3.0498046875, 3.3670654296875, 3.684326171875, 4.0015869140625, 4.31884765625, 4.6361083984375, 4.953369140625, 5.2706298828125, 5.587890625, 5.9051513671875, 6.222412109375, 6.5396728515625, 6.85693359375, 7.1741943359375, 7.491455078125, 7.8087158203125, 8.1259765625, 8.4432373046875, 8.760498046875, 9.0777587890625, 9.39501953125, 9.7122802734375, 10.029541015625, 10.3468017578125, 10.6640625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 9.0, 7.0, 6.0, 9.0, 15.0, 13.0, 17.0, 27.0, 36.0, 52.0, 55.0, 67.0, 68.0, 51.0, 69.0, 75.0, 69.0, 62.0, 54.0, 56.0, 41.0, 29.0, 25.0, 20.0, 18.0, 12.0, 8.0, 11.0, 5.0, 4.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.56640625, -4.44580078125, -4.3251953125, -4.20458984375, -4.083984375, -3.96337890625, -3.8427734375, -3.72216796875, -3.6015625, -3.48095703125, -3.3603515625, -3.23974609375, -3.119140625, -2.99853515625, -2.8779296875, -2.75732421875, -2.63671875, -2.51611328125, -2.3955078125, -2.27490234375, -2.154296875, -2.03369140625, -1.9130859375, -1.79248046875, -1.671875, -1.55126953125, -1.4306640625, -1.31005859375, -1.189453125, -1.06884765625, -0.9482421875, -0.82763671875, -0.70703125, -0.58642578125, -0.4658203125, -0.34521484375, -0.224609375, -0.10400390625, 0.0166015625, 0.13720703125, 0.2578125, 0.37841796875, 0.4990234375, 0.61962890625, 0.740234375, 0.86083984375, 0.9814453125, 1.10205078125, 1.22265625, 1.34326171875, 1.4638671875, 1.58447265625, 1.705078125, 1.82568359375, 1.9462890625, 2.06689453125, 2.1875, 2.30810546875, 2.4287109375, 2.54931640625, 2.669921875, 2.79052734375, 2.9111328125, 3.03173828125, 3.15234375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 4.0, 5.0, 13.0, 13.0, 28.0, 27.0, 38.0, 56.0, 86.0, 163.0, 291.0, 555.0, 1410.0, 4467.0, 19493.0, 154886.0, 737583.0, 108463.0, 15120.0, 3600.0, 1142.0, 483.0, 232.0, 123.0, 88.0, 52.0, 42.0, 23.0, 24.0, 11.0, 10.0, 5.0, 5.0, 1.0, 3.0, 3.0, 0.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.125, -15.6697998046875, -15.214599609375, -14.7593994140625, -14.30419921875, -13.8489990234375, -13.393798828125, -12.9385986328125, -12.4833984375, -12.0281982421875, -11.572998046875, -11.1177978515625, -10.66259765625, -10.2073974609375, -9.752197265625, -9.2969970703125, -8.841796875, -8.3865966796875, -7.931396484375, -7.4761962890625, -7.02099609375, -6.5657958984375, -6.110595703125, -5.6553955078125, -5.2001953125, -4.7449951171875, -4.289794921875, -3.8345947265625, -3.37939453125, -2.9241943359375, -2.468994140625, -2.0137939453125, -1.55859375, -1.1033935546875, -0.648193359375, -0.1929931640625, 0.26220703125, 0.7174072265625, 1.172607421875, 1.6278076171875, 2.0830078125, 2.5382080078125, 2.993408203125, 3.4486083984375, 3.90380859375, 4.3590087890625, 4.814208984375, 5.2694091796875, 5.724609375, 6.1798095703125, 6.635009765625, 7.0902099609375, 7.54541015625, 8.0006103515625, 8.455810546875, 8.9110107421875, 9.3662109375, 9.8214111328125, 10.276611328125, 10.7318115234375, 11.18701171875, 11.6422119140625, 12.097412109375, 12.5526123046875, 13.0078125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 11.0, 6.0, 5.0, 10.0, 16.0, 15.0, 19.0, 18.0, 19.0, 33.0, 35.0, 41.0, 26.0, 35.0, 42.0, 48.0, 43.0, 53.0, 49.0, 57.0, 52.0, 38.0, 31.0, 35.0, 39.0, 44.0, 25.0, 38.0, 25.0, 19.0, 8.0, 16.0, 2.0, 12.0, 10.0, 2.0, 2.0, 7.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.359375, -12.899169921875, -12.43896484375, -11.978759765625, -11.5185546875, -11.058349609375, -10.59814453125, -10.137939453125, -9.677734375, -9.217529296875, -8.75732421875, -8.297119140625, -7.8369140625, -7.376708984375, -6.91650390625, -6.456298828125, -5.99609375, -5.535888671875, -5.07568359375, -4.615478515625, -4.1552734375, -3.695068359375, -3.23486328125, -2.774658203125, -2.314453125, -1.854248046875, -1.39404296875, -0.933837890625, -0.4736328125, -0.013427734375, 0.44677734375, 0.906982421875, 1.3671875, 1.827392578125, 2.28759765625, 2.747802734375, 3.2080078125, 3.668212890625, 4.12841796875, 4.588623046875, 5.048828125, 5.509033203125, 5.96923828125, 6.429443359375, 6.8896484375, 7.349853515625, 7.81005859375, 8.270263671875, 8.73046875, 9.190673828125, 9.65087890625, 10.111083984375, 10.5712890625, 11.031494140625, 11.49169921875, 11.951904296875, 12.412109375, 12.872314453125, 13.33251953125, 13.792724609375, 14.2529296875, 14.713134765625, 15.17333984375, 15.633544921875, 16.09375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 8.0, 10.0, 9.0, 10.0, 18.0, 44.0, 49.0, 89.0, 168.0, 375.0, 1292.0, 11516.0, 912388.0, 117803.0, 3574.0, 701.0, 248.0, 109.0, 46.0, 42.0, 15.0, 16.0, 5.0, 8.0, 5.0, 7.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.8515625, -14.3690185546875, -13.886474609375, -13.4039306640625, -12.92138671875, -12.4388427734375, -11.956298828125, -11.4737548828125, -10.9912109375, -10.5086669921875, -10.026123046875, -9.5435791015625, -9.06103515625, -8.5784912109375, -8.095947265625, -7.6134033203125, -7.130859375, -6.6483154296875, -6.165771484375, -5.6832275390625, -5.20068359375, -4.7181396484375, -4.235595703125, -3.7530517578125, -3.2705078125, -2.7879638671875, -2.305419921875, -1.8228759765625, -1.34033203125, -0.8577880859375, -0.375244140625, 0.1072998046875, 0.58984375, 1.0723876953125, 1.554931640625, 2.0374755859375, 2.52001953125, 3.0025634765625, 3.485107421875, 3.9676513671875, 4.4501953125, 4.9327392578125, 5.415283203125, 5.8978271484375, 6.38037109375, 6.8629150390625, 7.345458984375, 7.8280029296875, 8.310546875, 8.7930908203125, 9.275634765625, 9.7581787109375, 10.24072265625, 10.7232666015625, 11.205810546875, 11.6883544921875, 12.1708984375, 12.6534423828125, 13.135986328125, 13.6185302734375, 14.10107421875, 14.5836181640625, 15.066162109375, 15.5487060546875, 16.03125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 0.0, 8.0, 8.0, 12.0, 20.0, 26.0, 38.0, 60.0, 69.0, 118.0, 146.0, 147.0, 103.0, 90.0, 47.0, 27.0, 24.0, 18.0, 17.0, 11.0, 6.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00070953369140625, -0.0006800591945648193, -0.0006505846977233887, -0.000621110200881958, -0.0005916357040405273, -0.0005621612071990967, -0.000532686710357666, -0.0005032122135162354, -0.0004737377166748047, -0.000444263219833374, -0.00041478872299194336, -0.0003853142261505127, -0.00035583972930908203, -0.00032636523246765137, -0.0002968907356262207, -0.00026741623878479004, -0.00023794174194335938, -0.0002084672451019287, -0.00017899274826049805, -0.00014951825141906738, -0.00012004375457763672, -9.056925773620605e-05, -6.109476089477539e-05, -3.1620264053344727e-05, -2.1457672119140625e-06, 2.73287296295166e-05, 5.6803226470947266e-05, 8.627772331237793e-05, 0.0001157522201538086, 0.00014522671699523926, 0.00017470121383666992, 0.00020417571067810059, 0.00023365020751953125, 0.0002631247043609619, 0.0002925992012023926, 0.00032207369804382324, 0.0003515481948852539, 0.00038102269172668457, 0.00041049718856811523, 0.0004399716854095459, 0.00046944618225097656, 0.0004989206790924072, 0.0005283951759338379, 0.0005578696727752686, 0.0005873441696166992, 0.0006168186664581299, 0.0006462931632995605, 0.0006757676601409912, 0.0007052421569824219, 0.0007347166538238525, 0.0007641911506652832, 0.0007936656475067139, 0.0008231401443481445, 0.0008526146411895752, 0.0008820891380310059, 0.0009115636348724365, 0.0009410381317138672, 0.0009705126285552979, 0.0009999871253967285, 0.0010294616222381592, 0.0010589361190795898, 0.0010884106159210205, 0.0011178851127624512, 0.0011473596096038818, 0.0011768341064453125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 8.0, 8.0, 11.0, 19.0, 17.0, 50.0, 68.0, 108.0, 173.0, 367.0, 835.0, 2784.0, 15000.0, 229812.0, 754321.0, 37396.0, 5172.0, 1364.0, 508.0, 223.0, 124.0, 66.0, 48.0, 28.0, 17.0, 11.0, 11.0, 2.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.453125, -7.1888427734375, -6.924560546875, -6.6602783203125, -6.39599609375, -6.1317138671875, -5.867431640625, -5.6031494140625, -5.3388671875, -5.0745849609375, -4.810302734375, -4.5460205078125, -4.28173828125, -4.0174560546875, -3.753173828125, -3.4888916015625, -3.224609375, -2.9603271484375, -2.696044921875, -2.4317626953125, -2.16748046875, -1.9031982421875, -1.638916015625, -1.3746337890625, -1.1103515625, -0.8460693359375, -0.581787109375, -0.3175048828125, -0.05322265625, 0.2110595703125, 0.475341796875, 0.7396240234375, 1.00390625, 1.2681884765625, 1.532470703125, 1.7967529296875, 2.06103515625, 2.3253173828125, 2.589599609375, 2.8538818359375, 3.1181640625, 3.3824462890625, 3.646728515625, 3.9110107421875, 4.17529296875, 4.4395751953125, 4.703857421875, 4.9681396484375, 5.232421875, 5.4967041015625, 5.760986328125, 6.0252685546875, 6.28955078125, 6.5538330078125, 6.818115234375, 7.0823974609375, 7.3466796875, 7.6109619140625, 7.875244140625, 8.1395263671875, 8.40380859375, 8.6680908203125, 8.932373046875, 9.1966552734375, 9.4609375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 8.0, 7.0, 13.0, 23.0, 22.0, 28.0, 55.0, 85.0, 129.0, 146.0, 174.0, 92.0, 67.0, 56.0, 39.0, 19.0, 16.0, 12.0, 4.0, 3.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-12.265625, -11.9852294921875, -11.704833984375, -11.4244384765625, -11.14404296875, -10.8636474609375, -10.583251953125, -10.3028564453125, -10.0224609375, -9.7420654296875, -9.461669921875, -9.1812744140625, -8.90087890625, -8.6204833984375, -8.340087890625, -8.0596923828125, -7.779296875, -7.4989013671875, -7.218505859375, -6.9381103515625, -6.65771484375, -6.3773193359375, -6.096923828125, -5.8165283203125, -5.5361328125, -5.2557373046875, -4.975341796875, -4.6949462890625, -4.41455078125, -4.1341552734375, -3.853759765625, -3.5733642578125, -3.29296875, -3.0125732421875, -2.732177734375, -2.4517822265625, -2.17138671875, -1.8909912109375, -1.610595703125, -1.3302001953125, -1.0498046875, -0.7694091796875, -0.489013671875, -0.2086181640625, 0.07177734375, 0.3521728515625, 0.632568359375, 0.9129638671875, 1.193359375, 1.4737548828125, 1.754150390625, 2.0345458984375, 2.31494140625, 2.5953369140625, 2.875732421875, 3.1561279296875, 3.4365234375, 3.7169189453125, 3.997314453125, 4.2777099609375, 4.55810546875, 4.8385009765625, 5.118896484375, 5.3992919921875, 5.6796875]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 7.0, 18.0, 47.0, 279.0, 436.0, 173.0, 45.0, 9.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-85.34608459472656, -76.08837890625, -66.8306655883789, -57.57295608520508, -48.31524658203125, -39.05753707885742, -29.799827575683594, -20.5421142578125, -11.284408569335938, -2.0266990661621094, 7.231010437011719, 16.488719940185547, 25.746429443359375, 35.0041389465332, 44.26184844970703, 53.519561767578125, 62.77726745605469, 72.03497314453125, 81.29268646240234, 90.55039978027344, 99.80810546875, 109.06581115722656, 118.32352447509766, 127.58123779296875, 136.8389434814453, 146.09664916992188, 155.3543701171875, 164.61207580566406, 173.86978149414062, 183.1274871826172, 192.38519287109375, 201.64291381835938, 210.900634765625, 220.15834045410156, 229.41604614257812, 238.67376708984375, 247.9314727783203, 257.1891784667969, 266.4468994140625, 275.70458984375, 284.9623107910156, 294.22003173828125, 303.47772216796875, 312.7354431152344, 321.9931640625, 331.2508544921875, 340.5085754394531, 349.76629638671875, 359.02398681640625, 368.2817077636719, 377.5393981933594, 386.797119140625, 396.0548095703125, 405.3125305175781, 414.57025146484375, 423.82794189453125, 433.0856628417969, 442.3433837890625, 451.60107421875, 460.8587951660156, 470.11651611328125, 479.37420654296875, 488.6319274902344, 497.8896484375, 507.1473388671875]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 5.0, 3.0, 6.0, 5.0, 6.0, 11.0, 6.0, 13.0, 16.0, 20.0, 18.0, 16.0, 17.0, 20.0, 22.0, 34.0, 22.0, 38.0, 45.0, 36.0, 35.0, 46.0, 50.0, 35.0, 31.0, 45.0, 45.0, 48.0, 34.0, 32.0, 28.0, 28.0, 36.0, 18.0, 17.0, 20.0, 18.0, 11.0, 15.0, 13.0, 6.0, 9.0, 9.0, 2.0, 3.0, 2.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0], "bins": [-64.68049621582031, -62.86137771606445, -61.04225540161133, -59.22313690185547, -57.404014587402344, -55.584896087646484, -53.765777587890625, -51.9466552734375, -50.12753677368164, -48.30841827392578, -46.489295959472656, -44.6701774597168, -42.85105895996094, -41.03193664550781, -39.21281814575195, -37.393699645996094, -35.57457733154297, -33.75545883178711, -31.936336517333984, -30.117218017578125, -28.298097610473633, -26.47897720336914, -24.65985870361328, -22.84073829650879, -21.021617889404297, -19.202497482299805, -17.383377075195312, -15.564258575439453, -13.745138168334961, -11.926017761230469, -10.106898307800293, -8.287778854370117, -6.468658447265625, -4.649538516998291, -2.830418586730957, -1.011298656463623, 0.8078212738037109, 2.626941680908203, 4.446061134338379, 6.265180587768555, 8.084300994873047, 9.903421401977539, 11.722540855407715, 13.54166030883789, 15.360780715942383, 17.179901123046875, 18.999019622802734, 20.818140029907227, 22.63726043701172, 24.45638084411621, 26.275501251220703, 28.094619750976562, 29.913740158081055, 31.732860565185547, 33.551979064941406, 35.37110137939453, 37.19021987915039, 39.00933837890625, 40.828460693359375, 42.647579193115234, 44.466697692871094, 46.28582000732422, 48.10493850708008, 49.92405700683594, 51.74317932128906]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 5.0, 7.0, 7.0, 18.0, 20.0, 48.0, 71.0, 120.0, 255.0, 518.0, 1223.0, 4968.0, 4084158.0, 97152.0, 3818.0, 1052.0, 404.0, 199.0, 106.0, 57.0, 34.0, 15.0, 9.0, 7.0, 5.0, 7.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-42.8125, -41.837646484375, -40.86279296875, -39.887939453125, -38.9130859375, -37.938232421875, -36.96337890625, -35.988525390625, -35.013671875, -34.038818359375, -33.06396484375, -32.089111328125, -31.1142578125, -30.139404296875, -29.16455078125, -28.189697265625, -27.21484375, -26.239990234375, -25.26513671875, -24.290283203125, -23.3154296875, -22.340576171875, -21.36572265625, -20.390869140625, -19.416015625, -18.441162109375, -17.46630859375, -16.491455078125, -15.5166015625, -14.541748046875, -13.56689453125, -12.592041015625, -11.6171875, -10.642333984375, -9.66748046875, -8.692626953125, -7.7177734375, -6.742919921875, -5.76806640625, -4.793212890625, -3.818359375, -2.843505859375, -1.86865234375, -0.893798828125, 0.0810546875, 1.055908203125, 2.03076171875, 3.005615234375, 3.98046875, 4.955322265625, 5.93017578125, 6.905029296875, 7.8798828125, 8.854736328125, 9.82958984375, 10.804443359375, 11.779296875, 12.754150390625, 13.72900390625, 14.703857421875, 15.6787109375, 16.653564453125, 17.62841796875, 18.603271484375, 19.578125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 5.0, 5.0, 5.0, 4.0, 6.0, 8.0, 9.0, 13.0, 16.0, 23.0, 24.0, 34.0, 47.0, 57.0, 49.0, 62.0, 59.0, 72.0, 67.0, 74.0, 63.0, 48.0, 50.0, 51.0, 37.0, 30.0, 18.0, 12.0, 9.0, 12.0, 9.0, 5.0, 4.0, 6.0, 2.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.603515625, -3.49700927734375, -3.3905029296875, -3.28399658203125, -3.177490234375, -3.07098388671875, -2.9644775390625, -2.85797119140625, -2.75146484375, -2.64495849609375, -2.5384521484375, -2.43194580078125, -2.325439453125, -2.21893310546875, -2.1124267578125, -2.00592041015625, -1.8994140625, -1.79290771484375, -1.6864013671875, -1.57989501953125, -1.473388671875, -1.36688232421875, -1.2603759765625, -1.15386962890625, -1.04736328125, -0.94085693359375, -0.8343505859375, -0.72784423828125, -0.621337890625, -0.51483154296875, -0.4083251953125, -0.30181884765625, -0.1953125, -0.08880615234375, 0.0177001953125, 0.12420654296875, 0.230712890625, 0.33721923828125, 0.4437255859375, 0.55023193359375, 0.65673828125, 0.76324462890625, 0.8697509765625, 0.97625732421875, 1.082763671875, 1.18927001953125, 1.2957763671875, 1.40228271484375, 1.5087890625, 1.61529541015625, 1.7218017578125, 1.82830810546875, 1.934814453125, 2.04132080078125, 2.1478271484375, 2.25433349609375, 2.36083984375, 2.46734619140625, 2.5738525390625, 2.68035888671875, 2.786865234375, 2.89337158203125, 2.9998779296875, 3.10638427734375, 3.212890625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 6.0, 6.0, 24.0, 21.0, 28.0, 57.0, 58.0, 106.0, 166.0, 220.0, 393.0, 628.0, 1057.0, 1901.0, 3485.0, 6726.0, 13618.0, 40896.0, 3926265.0, 155373.0, 22511.0, 9383.0, 4979.0, 2610.0, 1548.0, 798.0, 559.0, 304.0, 173.0, 113.0, 81.0, 64.0, 31.0, 27.0, 31.0, 10.0, 9.0, 5.0, 3.0, 2.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.1328125, -9.8236083984375, -9.514404296875, -9.2052001953125, -8.89599609375, -8.5867919921875, -8.277587890625, -7.9683837890625, -7.6591796875, -7.3499755859375, -7.040771484375, -6.7315673828125, -6.42236328125, -6.1131591796875, -5.803955078125, -5.4947509765625, -5.185546875, -4.8763427734375, -4.567138671875, -4.2579345703125, -3.94873046875, -3.6395263671875, -3.330322265625, -3.0211181640625, -2.7119140625, -2.4027099609375, -2.093505859375, -1.7843017578125, -1.47509765625, -1.1658935546875, -0.856689453125, -0.5474853515625, -0.23828125, 0.0709228515625, 0.380126953125, 0.6893310546875, 0.99853515625, 1.3077392578125, 1.616943359375, 1.9261474609375, 2.2353515625, 2.5445556640625, 2.853759765625, 3.1629638671875, 3.47216796875, 3.7813720703125, 4.090576171875, 4.3997802734375, 4.708984375, 5.0181884765625, 5.327392578125, 5.6365966796875, 5.94580078125, 6.2550048828125, 6.564208984375, 6.8734130859375, 7.1826171875, 7.4918212890625, 7.801025390625, 8.1102294921875, 8.41943359375, 8.7286376953125, 9.037841796875, 9.3470458984375, 9.65625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 3.0, 4.0, 1.0, 3.0, 6.0, 3.0, 4.0, 11.0, 7.0, 9.0, 10.0, 15.0, 12.0, 35.0, 88.0, 792.0, 2821.0, 121.0, 41.0, 28.0, 13.0, 13.0, 6.0, 5.0, 3.0, 3.0, 3.0, 7.0, 5.0, 1.0, 1.0, 1.0, 5.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.28515625, -4.1375732421875, -3.989990234375, -3.8424072265625, -3.69482421875, -3.5472412109375, -3.399658203125, -3.2520751953125, -3.1044921875, -2.9569091796875, -2.809326171875, -2.6617431640625, -2.51416015625, -2.3665771484375, -2.218994140625, -2.0714111328125, -1.923828125, -1.7762451171875, -1.628662109375, -1.4810791015625, -1.33349609375, -1.1859130859375, -1.038330078125, -0.8907470703125, -0.7431640625, -0.5955810546875, -0.447998046875, -0.3004150390625, -0.15283203125, -0.0052490234375, 0.142333984375, 0.2899169921875, 0.4375, 0.5850830078125, 0.732666015625, 0.8802490234375, 1.02783203125, 1.1754150390625, 1.322998046875, 1.4705810546875, 1.6181640625, 1.7657470703125, 1.913330078125, 2.0609130859375, 2.20849609375, 2.3560791015625, 2.503662109375, 2.6512451171875, 2.798828125, 2.9464111328125, 3.093994140625, 3.2415771484375, 3.38916015625, 3.5367431640625, 3.684326171875, 3.8319091796875, 3.9794921875, 4.1270751953125, 4.274658203125, 4.4222412109375, 4.56982421875, 4.7174072265625, 4.864990234375, 5.0125732421875, 5.16015625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 6.0, 9.0, 23.0, 48.0, 88.0, 172.0, 236.0, 205.0, 126.0, 51.0, 18.0, 10.0, 3.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.96001434326172, -44.80512619018555, -43.65024185180664, -42.49535369873047, -41.3404655456543, -40.185577392578125, -39.03069305419922, -37.87580490112305, -36.720916748046875, -35.5660285949707, -34.4111442565918, -33.256256103515625, -32.10136795043945, -30.946481704711914, -29.791595458984375, -28.636707305908203, -27.481822967529297, -26.326936721801758, -25.172048568725586, -24.017162322998047, -22.862274169921875, -21.707387924194336, -20.552501678466797, -19.397613525390625, -18.242727279663086, -17.087841033935547, -15.932952880859375, -14.778066635131836, -13.62317943572998, -12.468292236328125, -11.313405990600586, -10.15851879119873, -9.00363540649414, -7.848748207092285, -6.693861484527588, -5.538974761962891, -4.384087562561035, -3.2292003631591797, -2.0743136405944824, -0.9194269180297852, 0.2354602813720703, 1.3903472423553467, 2.545234203338623, 3.7001211643218994, 4.855008125305176, 6.009895324707031, 7.1647820472717285, 8.319668769836426, 9.474555969238281, 10.629443168640137, 11.784330368041992, 12.939216613769531, 14.094103813171387, 15.248991012573242, 16.40387725830078, 17.558765411376953, 18.713651657104492, 19.86853790283203, 21.023426055908203, 22.178312301635742, 23.33319854736328, 24.488086700439453, 25.642972946166992, 26.79785919189453, 27.952747344970703]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 5.0, 10.0, 10.0, 11.0, 10.0, 12.0, 26.0, 28.0, 35.0, 29.0, 43.0, 49.0, 59.0, 44.0, 55.0, 61.0, 57.0, 65.0, 54.0, 45.0, 47.0, 36.0, 42.0, 28.0, 38.0, 18.0, 16.0, 22.0, 9.0, 9.0, 7.0, 4.0, 11.0, 3.0, 2.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.56656265258789, -11.110664367675781, -10.654765129089355, -10.198866844177246, -9.742968559265137, -9.287069320678711, -8.831171035766602, -8.375272750854492, -7.919373989105225, -7.463475227355957, -7.007576942443848, -6.55167818069458, -6.0957794189453125, -5.639881134033203, -5.1839823722839355, -4.728083610534668, -4.272185325622559, -3.81628680229187, -3.3603882789611816, -2.904489517211914, -2.4485909938812256, -1.992692470550537, -1.5367937088012695, -1.080895185470581, -0.6249966621398926, -0.16909807920455933, 0.2868005037307739, 0.742699146270752, 1.1985976696014404, 1.654496192932129, 2.1103949546813965, 2.566293478012085, 3.0221920013427734, 3.478090524673462, 3.9339890480041504, 4.389887809753418, 4.845786094665527, 5.301684856414795, 5.7575836181640625, 6.213481903076172, 6.6693806648254395, 7.125279426574707, 7.581177711486816, 8.037076950073242, 8.492975234985352, 8.948873519897461, 9.40477180480957, 9.860671043395996, 10.316569328308105, 10.772467613220215, 11.22836685180664, 11.68426513671875, 12.14016342163086, 12.596061706542969, 13.051960945129395, 13.507859230041504, 13.96375846862793, 14.419656753540039, 14.875555992126465, 15.331454277038574, 15.787352561950684, 16.24325180053711, 16.69915008544922, 17.155048370361328, 17.610946655273438]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 8.0, 14.0, 26.0, 47.0, 91.0, 172.0, 469.0, 1263.0, 4493.0, 18780.0, 112637.0, 642259.0, 225274.0, 32893.0, 7020.0, 2016.0, 607.0, 272.0, 100.0, 49.0, 29.0, 15.0, 6.0, 11.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4140625, -8.0257568359375, -7.637451171875, -7.2491455078125, -6.86083984375, -6.4725341796875, -6.084228515625, -5.6959228515625, -5.3076171875, -4.9193115234375, -4.531005859375, -4.1427001953125, -3.75439453125, -3.3660888671875, -2.977783203125, -2.5894775390625, -2.201171875, -1.8128662109375, -1.424560546875, -1.0362548828125, -0.64794921875, -0.2596435546875, 0.128662109375, 0.5169677734375, 0.9052734375, 1.2935791015625, 1.681884765625, 2.0701904296875, 2.45849609375, 2.8468017578125, 3.235107421875, 3.6234130859375, 4.01171875, 4.4000244140625, 4.788330078125, 5.1766357421875, 5.56494140625, 5.9532470703125, 6.341552734375, 6.7298583984375, 7.1181640625, 7.5064697265625, 7.894775390625, 8.2830810546875, 8.67138671875, 9.0596923828125, 9.447998046875, 9.8363037109375, 10.224609375, 10.6129150390625, 11.001220703125, 11.3895263671875, 11.77783203125, 12.1661376953125, 12.554443359375, 12.9427490234375, 13.3310546875, 13.7193603515625, 14.107666015625, 14.4959716796875, 14.88427734375, 15.2725830078125, 15.660888671875, 16.0491943359375, 16.4375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 3.0, 11.0, 3.0, 8.0, 9.0, 7.0, 11.0, 23.0, 27.0, 25.0, 47.0, 35.0, 61.0, 39.0, 54.0, 67.0, 75.0, 79.0, 47.0, 60.0, 53.0, 44.0, 46.0, 33.0, 36.0, 17.0, 17.0, 9.0, 16.0, 8.0, 8.0, 3.0, 6.0, 2.0, 5.0, 2.0, 0.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2421875, -3.13330078125, -3.0244140625, -2.91552734375, -2.806640625, -2.69775390625, -2.5888671875, -2.47998046875, -2.37109375, -2.26220703125, -2.1533203125, -2.04443359375, -1.935546875, -1.82666015625, -1.7177734375, -1.60888671875, -1.5, -1.39111328125, -1.2822265625, -1.17333984375, -1.064453125, -0.95556640625, -0.8466796875, -0.73779296875, -0.62890625, -0.52001953125, -0.4111328125, -0.30224609375, -0.193359375, -0.08447265625, 0.0244140625, 0.13330078125, 0.2421875, 0.35107421875, 0.4599609375, 0.56884765625, 0.677734375, 0.78662109375, 0.8955078125, 1.00439453125, 1.11328125, 1.22216796875, 1.3310546875, 1.43994140625, 1.548828125, 1.65771484375, 1.7666015625, 1.87548828125, 1.984375, 2.09326171875, 2.2021484375, 2.31103515625, 2.419921875, 2.52880859375, 2.6376953125, 2.74658203125, 2.85546875, 2.96435546875, 3.0732421875, 3.18212890625, 3.291015625, 3.39990234375, 3.5087890625, 3.61767578125, 3.7265625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 4.0, 1.0, 0.0, 5.0, 12.0, 13.0, 14.0, 17.0, 31.0, 42.0, 54.0, 106.0, 170.0, 310.0, 578.0, 1252.0, 3514.0, 12748.0, 70121.0, 598147.0, 310463.0, 38422.0, 8046.0, 2407.0, 982.0, 436.0, 244.0, 139.0, 75.0, 68.0, 44.0, 37.0, 14.0, 9.0, 7.0, 9.0, 7.0, 2.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.3125, -10.9456787109375, -10.578857421875, -10.2120361328125, -9.84521484375, -9.4783935546875, -9.111572265625, -8.7447509765625, -8.3779296875, -8.0111083984375, -7.644287109375, -7.2774658203125, -6.91064453125, -6.5438232421875, -6.177001953125, -5.8101806640625, -5.443359375, -5.0765380859375, -4.709716796875, -4.3428955078125, -3.97607421875, -3.6092529296875, -3.242431640625, -2.8756103515625, -2.5087890625, -2.1419677734375, -1.775146484375, -1.4083251953125, -1.04150390625, -0.6746826171875, -0.307861328125, 0.0589599609375, 0.42578125, 0.7926025390625, 1.159423828125, 1.5262451171875, 1.89306640625, 2.2598876953125, 2.626708984375, 2.9935302734375, 3.3603515625, 3.7271728515625, 4.093994140625, 4.4608154296875, 4.82763671875, 5.1944580078125, 5.561279296875, 5.9281005859375, 6.294921875, 6.6617431640625, 7.028564453125, 7.3953857421875, 7.76220703125, 8.1290283203125, 8.495849609375, 8.8626708984375, 9.2294921875, 9.5963134765625, 9.963134765625, 10.3299560546875, 10.69677734375, 11.0635986328125, 11.430419921875, 11.7972412109375, 12.1640625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 6.0, 7.0, 7.0, 8.0, 11.0, 7.0, 13.0, 19.0, 16.0, 17.0, 25.0, 18.0, 36.0, 30.0, 39.0, 35.0, 30.0, 44.0, 51.0, 55.0, 37.0, 58.0, 41.0, 57.0, 36.0, 33.0, 46.0, 32.0, 33.0, 23.0, 21.0, 18.0, 16.0, 17.0, 10.0, 13.0, 11.0, 6.0, 8.0, 2.0, 6.0, 1.0, 5.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-13.3359375, -12.9610595703125, -12.586181640625, -12.2113037109375, -11.83642578125, -11.4615478515625, -11.086669921875, -10.7117919921875, -10.3369140625, -9.9620361328125, -9.587158203125, -9.2122802734375, -8.83740234375, -8.4625244140625, -8.087646484375, -7.7127685546875, -7.337890625, -6.9630126953125, -6.588134765625, -6.2132568359375, -5.83837890625, -5.4635009765625, -5.088623046875, -4.7137451171875, -4.3388671875, -3.9639892578125, -3.589111328125, -3.2142333984375, -2.83935546875, -2.4644775390625, -2.089599609375, -1.7147216796875, -1.33984375, -0.9649658203125, -0.590087890625, -0.2152099609375, 0.15966796875, 0.5345458984375, 0.909423828125, 1.2843017578125, 1.6591796875, 2.0340576171875, 2.408935546875, 2.7838134765625, 3.15869140625, 3.5335693359375, 3.908447265625, 4.2833251953125, 4.658203125, 5.0330810546875, 5.407958984375, 5.7828369140625, 6.15771484375, 6.5325927734375, 6.907470703125, 7.2823486328125, 7.6572265625, 8.0321044921875, 8.406982421875, 8.7818603515625, 9.15673828125, 9.5316162109375, 9.906494140625, 10.2813720703125, 10.65625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 11.0, 6.0, 12.0, 24.0, 29.0, 45.0, 57.0, 99.0, 188.0, 376.0, 781.0, 2478.0, 18574.0, 797596.0, 217309.0, 8045.0, 1612.0, 628.0, 263.0, 159.0, 90.0, 55.0, 36.0, 20.0, 12.0, 6.0, 4.0, 5.0, 2.0, 7.0, 4.0, 4.0, 1.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.66015625, -7.41168212890625, -7.1632080078125, -6.91473388671875, -6.666259765625, -6.41778564453125, -6.1693115234375, -5.92083740234375, -5.67236328125, -5.42388916015625, -5.1754150390625, -4.92694091796875, -4.678466796875, -4.42999267578125, -4.1815185546875, -3.93304443359375, -3.6845703125, -3.43609619140625, -3.1876220703125, -2.93914794921875, -2.690673828125, -2.44219970703125, -2.1937255859375, -1.94525146484375, -1.69677734375, -1.44830322265625, -1.1998291015625, -0.95135498046875, -0.702880859375, -0.45440673828125, -0.2059326171875, 0.04254150390625, 0.291015625, 0.53948974609375, 0.7879638671875, 1.03643798828125, 1.284912109375, 1.53338623046875, 1.7818603515625, 2.03033447265625, 2.27880859375, 2.52728271484375, 2.7757568359375, 3.02423095703125, 3.272705078125, 3.52117919921875, 3.7696533203125, 4.01812744140625, 4.2666015625, 4.51507568359375, 4.7635498046875, 5.01202392578125, 5.260498046875, 5.50897216796875, 5.7574462890625, 6.00592041015625, 6.25439453125, 6.50286865234375, 6.7513427734375, 6.99981689453125, 7.248291015625, 7.49676513671875, 7.7452392578125, 7.99371337890625, 8.2421875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 8.0, 7.0, 5.0, 11.0, 16.0, 13.0, 24.0, 35.0, 48.0, 48.0, 62.0, 81.0, 99.0, 116.0, 83.0, 83.0, 67.0, 54.0, 40.0, 39.0, 28.0, 11.0, 10.0, 5.0, 3.0, 4.0, 2.0, 1.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008020401000976562, -0.000781819224357605, -0.0007615983486175537, -0.0007413774728775024, -0.0007211565971374512, -0.0007009357213973999, -0.0006807148456573486, -0.0006604939699172974, -0.0006402730941772461, -0.0006200522184371948, -0.0005998313426971436, -0.0005796104669570923, -0.000559389591217041, -0.0005391687154769897, -0.0005189478397369385, -0.0004987269639968872, -0.00047850608825683594, -0.00045828521251678467, -0.0004380643367767334, -0.00041784346103668213, -0.00039762258529663086, -0.0003774017095565796, -0.0003571808338165283, -0.00033695995807647705, -0.0003167390823364258, -0.0002965182065963745, -0.00027629733085632324, -0.00025607645511627197, -0.0002358555793762207, -0.00021563470363616943, -0.00019541382789611816, -0.0001751929521560669, -0.00015497207641601562, -0.00013475120067596436, -0.00011453032493591309, -9.430944919586182e-05, -7.408857345581055e-05, -5.386769771575928e-05, -3.364682197570801e-05, -1.3425946235656738e-05, 6.794929504394531e-06, 2.70158052444458e-05, 4.723668098449707e-05, 6.745755672454834e-05, 8.767843246459961e-05, 0.00010789930820465088, 0.00012812018394470215, 0.00014834105968475342, 0.0001685619354248047, 0.00018878281116485596, 0.00020900368690490723, 0.0002292245626449585, 0.00024944543838500977, 0.00026966631412506104, 0.0002898871898651123, 0.0003101080656051636, 0.00033032894134521484, 0.0003505498170852661, 0.0003707706928253174, 0.00039099156856536865, 0.0004112124443054199, 0.0004314333200454712, 0.00045165419578552246, 0.00047187507152557373, 0.000492095947265625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 1.0, 3.0, 1.0, 3.0, 4.0, 6.0, 9.0, 15.0, 29.0, 30.0, 62.0, 116.0, 163.0, 386.0, 1010.0, 3463.0, 21982.0, 601215.0, 398751.0, 16866.0, 2796.0, 890.0, 383.0, 146.0, 77.0, 50.0, 33.0, 26.0, 6.0, 9.0, 6.0, 7.0, 1.0, 5.0, 3.0, 6.0, 1.0, 1.0, 2.0, 1.0], "bins": [-9.0546875, -8.83880615234375, -8.6229248046875, -8.40704345703125, -8.191162109375, -7.97528076171875, -7.7593994140625, -7.54351806640625, -7.32763671875, -7.11175537109375, -6.8958740234375, -6.67999267578125, -6.464111328125, -6.24822998046875, -6.0323486328125, -5.81646728515625, -5.6005859375, -5.38470458984375, -5.1688232421875, -4.95294189453125, -4.737060546875, -4.52117919921875, -4.3052978515625, -4.08941650390625, -3.87353515625, -3.65765380859375, -3.4417724609375, -3.22589111328125, -3.010009765625, -2.79412841796875, -2.5782470703125, -2.36236572265625, -2.146484375, -1.93060302734375, -1.7147216796875, -1.49884033203125, -1.282958984375, -1.06707763671875, -0.8511962890625, -0.63531494140625, -0.41943359375, -0.20355224609375, 0.0123291015625, 0.22821044921875, 0.444091796875, 0.65997314453125, 0.8758544921875, 1.09173583984375, 1.3076171875, 1.52349853515625, 1.7393798828125, 1.95526123046875, 2.171142578125, 2.38702392578125, 2.6029052734375, 2.81878662109375, 3.03466796875, 3.25054931640625, 3.4664306640625, 3.68231201171875, 3.898193359375, 4.11407470703125, 4.3299560546875, 4.54583740234375, 4.76171875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 5.0, 15.0, 23.0, 40.0, 70.0, 109.0, 158.0, 187.0, 139.0, 95.0, 66.0, 34.0, 11.0, 14.0, 11.0, 2.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.7421875, -10.49493408203125, -10.2476806640625, -10.00042724609375, -9.753173828125, -9.50592041015625, -9.2586669921875, -9.01141357421875, -8.76416015625, -8.51690673828125, -8.2696533203125, -8.02239990234375, -7.775146484375, -7.52789306640625, -7.2806396484375, -7.03338623046875, -6.7861328125, -6.53887939453125, -6.2916259765625, -6.04437255859375, -5.797119140625, -5.54986572265625, -5.3026123046875, -5.05535888671875, -4.80810546875, -4.56085205078125, -4.3135986328125, -4.06634521484375, -3.819091796875, -3.57183837890625, -3.3245849609375, -3.07733154296875, -2.830078125, -2.58282470703125, -2.3355712890625, -2.08831787109375, -1.841064453125, -1.59381103515625, -1.3465576171875, -1.09930419921875, -0.85205078125, -0.60479736328125, -0.3575439453125, -0.11029052734375, 0.136962890625, 0.38421630859375, 0.6314697265625, 0.87872314453125, 1.1259765625, 1.37322998046875, 1.6204833984375, 1.86773681640625, 2.114990234375, 2.36224365234375, 2.6094970703125, 2.85675048828125, 3.10400390625, 3.35125732421875, 3.5985107421875, 3.84576416015625, 4.093017578125, 4.34027099609375, 4.5875244140625, 4.83477783203125, 5.08203125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 2.0, 0.0, 3.0, 9.0, 19.0, 23.0, 48.0, 96.0, 174.0, 230.0, 188.0, 112.0, 58.0, 26.0, 10.0, 10.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.55062484741211, -42.87131118774414, -39.19200134277344, -35.51268768310547, -31.833375930786133, -28.154064178466797, -24.474750518798828, -20.795438766479492, -17.116127014160156, -13.43681526184082, -9.757502555847168, -6.078189849853516, -2.3988780975341797, 1.2804336547851562, 4.959747314453125, 8.639059066772461, 12.318370819091797, 15.997682571411133, 19.67699432373047, 23.356307983398438, 27.035619735717773, 30.71493148803711, 34.39424514770508, 38.07355499267578, 41.75286865234375, 45.43218231201172, 49.11149215698242, 52.79080581665039, 56.470115661621094, 60.14942932128906, 63.82874298095703, 67.508056640625, 71.18736267089844, 74.8666763305664, 78.54598999023438, 82.22529602050781, 85.90460968017578, 89.58392333984375, 93.26323699951172, 96.94255065917969, 100.62185668945312, 104.3011703491211, 107.98048400878906, 111.6597900390625, 115.33910369873047, 119.01841735839844, 122.6977310180664, 126.37704467773438, 130.05636596679688, 133.7356719970703, 137.4149932861328, 141.09429931640625, 144.77362060546875, 148.4529266357422, 152.13223266601562, 155.81155395507812, 159.49085998535156, 163.170166015625, 166.8494873046875, 170.52879333496094, 174.20811462402344, 177.88742065429688, 181.56674194335938, 185.2460479736328, 188.92535400390625]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 3.0, 12.0, 11.0, 12.0, 13.0, 19.0, 21.0, 32.0, 29.0, 48.0, 48.0, 49.0, 56.0, 48.0, 59.0, 55.0, 57.0, 58.0, 61.0, 51.0, 40.0, 33.0, 37.0, 33.0, 30.0, 19.0, 20.0, 8.0, 7.0, 6.0, 8.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-60.157470703125, -57.98529815673828, -55.8131217956543, -53.64094924926758, -51.468772888183594, -49.296600341796875, -47.124427795410156, -44.95225524902344, -42.78007888793945, -40.607906341552734, -38.43572998046875, -36.26355743408203, -34.09138488769531, -31.919208526611328, -29.74703598022461, -27.574861526489258, -25.402687072753906, -23.230512619018555, -21.058338165283203, -18.886165618896484, -16.713991165161133, -14.541816711425781, -12.369643211364746, -10.197469711303711, -8.02529525756836, -5.853121280670166, -3.6809473037719727, -1.5087733268737793, 0.6634006500244141, 2.8355751037597656, 5.007748603820801, 7.179922103881836, 9.352096557617188, 11.524271011352539, 13.696444511413574, 15.86861801147461, 18.04079246520996, 20.212966918945312, 22.38513946533203, 24.557313919067383, 26.729488372802734, 28.901662826538086, 31.073837280273438, 33.246009826660156, 35.418182373046875, 37.59035873413086, 39.76253128051758, 41.93470764160156, 44.10688018798828, 46.279052734375, 48.451229095458984, 50.6234016418457, 52.79557800292969, 54.967750549316406, 57.139923095703125, 59.312095642089844, 61.48427200317383, 63.65644454956055, 65.82862091064453, 68.00079345703125, 70.17296600341797, 72.34513854980469, 74.51731872558594, 76.68949127197266, 78.86166381835938]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 5.0, 7.0, 9.0, 8.0, 7.0, 14.0, 23.0, 31.0, 44.0, 64.0, 122.0, 230.0, 520.0, 1415.0, 4756.0, 20186.0, 172647.0, 3870601.0, 102783.0, 14670.0, 3834.0, 1219.0, 501.0, 247.0, 121.0, 66.0, 48.0, 27.0, 25.0, 21.0, 17.0, 2.0, 7.0, 5.0, 1.0, 4.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.5390625, -7.2027587890625, -6.866455078125, -6.5301513671875, -6.19384765625, -5.8575439453125, -5.521240234375, -5.1849365234375, -4.8486328125, -4.5123291015625, -4.176025390625, -3.8397216796875, -3.50341796875, -3.1671142578125, -2.830810546875, -2.4945068359375, -2.158203125, -1.8218994140625, -1.485595703125, -1.1492919921875, -0.81298828125, -0.4766845703125, -0.140380859375, 0.1959228515625, 0.5322265625, 0.8685302734375, 1.204833984375, 1.5411376953125, 1.87744140625, 2.2137451171875, 2.550048828125, 2.8863525390625, 3.22265625, 3.5589599609375, 3.895263671875, 4.2315673828125, 4.56787109375, 4.9041748046875, 5.240478515625, 5.5767822265625, 5.9130859375, 6.2493896484375, 6.585693359375, 6.9219970703125, 7.25830078125, 7.5946044921875, 7.930908203125, 8.2672119140625, 8.603515625, 8.9398193359375, 9.276123046875, 9.6124267578125, 9.94873046875, 10.2850341796875, 10.621337890625, 10.9576416015625, 11.2939453125, 11.6302490234375, 11.966552734375, 12.3028564453125, 12.63916015625, 12.9754638671875, 13.311767578125, 13.6480712890625, 13.984375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 11.0, 19.0, 28.0, 51.0, 92.0, 95.0, 95.0, 110.0, 123.0, 103.0, 92.0, 69.0, 53.0, 28.0, 15.0, 8.0, 6.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.884765625, -3.699371337890625, -3.51397705078125, -3.328582763671875, -3.1431884765625, -2.957794189453125, -2.77239990234375, -2.587005615234375, -2.401611328125, -2.216217041015625, -2.03082275390625, -1.845428466796875, -1.6600341796875, -1.474639892578125, -1.28924560546875, -1.103851318359375, -0.91845703125, -0.733062744140625, -0.54766845703125, -0.362274169921875, -0.1768798828125, 0.008514404296875, 0.19390869140625, 0.379302978515625, 0.564697265625, 0.750091552734375, 0.93548583984375, 1.120880126953125, 1.3062744140625, 1.491668701171875, 1.67706298828125, 1.862457275390625, 2.0478515625, 2.233245849609375, 2.41864013671875, 2.604034423828125, 2.7894287109375, 2.974822998046875, 3.16021728515625, 3.345611572265625, 3.531005859375, 3.716400146484375, 3.90179443359375, 4.087188720703125, 4.2725830078125, 4.457977294921875, 4.64337158203125, 4.828765869140625, 5.01416015625, 5.199554443359375, 5.38494873046875, 5.570343017578125, 5.7557373046875, 5.941131591796875, 6.12652587890625, 6.311920166015625, 6.497314453125, 6.682708740234375, 6.86810302734375, 7.053497314453125, 7.2388916015625, 7.424285888671875, 7.60968017578125, 7.795074462890625, 7.98046875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 2.0, 4.0, 11.0, 8.0, 11.0, 24.0, 30.0, 42.0, 69.0, 147.0, 262.0, 459.0, 960.0, 2151.0, 6049.0, 20371.0, 95416.0, 3246476.0, 744294.0, 56254.0, 13537.0, 4277.0, 1710.0, 776.0, 360.0, 215.0, 124.0, 68.0, 50.0, 37.0, 24.0, 16.0, 9.0, 11.0, 7.0, 7.0, 3.0, 2.0, 2.0, 5.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.4296875, -7.142333984375, -6.85498046875, -6.567626953125, -6.2802734375, -5.992919921875, -5.70556640625, -5.418212890625, -5.130859375, -4.843505859375, -4.55615234375, -4.268798828125, -3.9814453125, -3.694091796875, -3.40673828125, -3.119384765625, -2.83203125, -2.544677734375, -2.25732421875, -1.969970703125, -1.6826171875, -1.395263671875, -1.10791015625, -0.820556640625, -0.533203125, -0.245849609375, 0.04150390625, 0.328857421875, 0.6162109375, 0.903564453125, 1.19091796875, 1.478271484375, 1.765625, 2.052978515625, 2.34033203125, 2.627685546875, 2.9150390625, 3.202392578125, 3.48974609375, 3.777099609375, 4.064453125, 4.351806640625, 4.63916015625, 4.926513671875, 5.2138671875, 5.501220703125, 5.78857421875, 6.075927734375, 6.36328125, 6.650634765625, 6.93798828125, 7.225341796875, 7.5126953125, 7.800048828125, 8.08740234375, 8.374755859375, 8.662109375, 8.949462890625, 9.23681640625, 9.524169921875, 9.8115234375, 10.098876953125, 10.38623046875, 10.673583984375, 10.9609375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 4.0, 2.0, 2.0, 11.0, 8.0, 13.0, 14.0, 24.0, 37.0, 54.0, 77.0, 116.0, 247.0, 728.0, 1584.0, 650.0, 205.0, 111.0, 55.0, 42.0, 22.0, 20.0, 12.0, 8.0, 9.0, 8.0, 3.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.98828125, -7.66168212890625, -7.3350830078125, -7.00848388671875, -6.681884765625, -6.35528564453125, -6.0286865234375, -5.70208740234375, -5.37548828125, -5.04888916015625, -4.7222900390625, -4.39569091796875, -4.069091796875, -3.74249267578125, -3.4158935546875, -3.08929443359375, -2.7626953125, -2.43609619140625, -2.1094970703125, -1.78289794921875, -1.456298828125, -1.12969970703125, -0.8031005859375, -0.47650146484375, -0.14990234375, 0.17669677734375, 0.5032958984375, 0.82989501953125, 1.156494140625, 1.48309326171875, 1.8096923828125, 2.13629150390625, 2.462890625, 2.78948974609375, 3.1160888671875, 3.44268798828125, 3.769287109375, 4.09588623046875, 4.4224853515625, 4.74908447265625, 5.07568359375, 5.40228271484375, 5.7288818359375, 6.05548095703125, 6.382080078125, 6.70867919921875, 7.0352783203125, 7.36187744140625, 7.6884765625, 8.01507568359375, 8.3416748046875, 8.66827392578125, 8.994873046875, 9.32147216796875, 9.6480712890625, 9.97467041015625, 10.30126953125, 10.62786865234375, 10.9544677734375, 11.28106689453125, 11.607666015625, 11.93426513671875, 12.2608642578125, 12.58746337890625, 12.9140625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 7.0, 10.0, 7.0, 13.0, 28.0, 36.0, 90.0, 173.0, 237.0, 200.0, 107.0, 51.0, 27.0, 7.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-104.2810287475586, -101.19893646240234, -98.11685180664062, -95.03475952148438, -91.95267486572266, -88.8705825805664, -85.78849792480469, -82.70640563964844, -79.62431335449219, -76.54222106933594, -73.46013641357422, -70.37804412841797, -67.29595947265625, -64.2138671875, -61.131778717041016, -58.04969024658203, -54.96760559082031, -51.88551712036133, -48.803428649902344, -45.721336364746094, -42.639251708984375, -39.557159423828125, -36.47507095336914, -33.392982482910156, -30.310894012451172, -27.228805541992188, -24.146717071533203, -21.064626693725586, -17.9825382232666, -14.900449752807617, -11.818359375, -8.736270904541016, -5.6541748046875, -2.5720858573913574, 0.5100030899047852, 3.592092514038086, 6.67418098449707, 9.756269454956055, 12.838359832763672, 15.920448303222656, 19.00253677368164, 22.084625244140625, 25.16671371459961, 28.248804092407227, 31.33089256286621, 34.41297912597656, 37.49507141113281, 40.5771598815918, 43.65924835205078, 46.741336822509766, 49.82342529296875, 52.905517578125, 55.98760223388672, 59.06969451904297, 62.15178298950195, 65.23387145996094, 68.31596374511719, 71.39805603027344, 74.48014068603516, 77.5622329711914, 80.64431762695312, 83.72640991210938, 86.80850219726562, 89.89058685302734, 92.97267150878906]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 4.0, 1.0, 7.0, 5.0, 10.0, 11.0, 11.0, 11.0, 20.0, 31.0, 28.0, 36.0, 37.0, 55.0, 53.0, 53.0, 41.0, 59.0, 50.0, 56.0, 41.0, 45.0, 46.0, 47.0, 43.0, 38.0, 30.0, 23.0, 39.0, 22.0, 23.0, 12.0, 4.0, 6.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.659873962402344, -41.1981315612793, -39.736385345458984, -38.27464294433594, -36.812896728515625, -35.35115432739258, -33.889408111572266, -32.42766571044922, -30.965919494628906, -29.504175186157227, -28.042430877685547, -26.580686569213867, -25.118942260742188, -23.657197952270508, -22.195453643798828, -20.73371124267578, -19.2719669342041, -17.810222625732422, -16.348478317260742, -14.886734008789062, -13.424989700317383, -11.963245391845703, -10.50150203704834, -9.03975772857666, -7.5780134201049805, -6.116269111633301, -4.654524803161621, -3.1927809715270996, -1.73103666305542, -0.26929235458374023, 1.1924514770507812, 2.654195785522461, 4.115940093994141, 5.57768440246582, 7.0394287109375, 8.50117301940918, 9.96291732788086, 11.424661636352539, 12.886404991149902, 14.348149299621582, 15.809893608093262, 17.271636962890625, 18.733381271362305, 20.195125579833984, 21.656869888305664, 23.118614196777344, 24.580358505249023, 26.042102813720703, 27.503847122192383, 28.965591430664062, 30.427335739135742, 31.889080047607422, 33.35082244873047, 34.81256866455078, 36.27431106567383, 37.73605728149414, 39.19779968261719, 40.659542083740234, 42.12128829956055, 43.583030700683594, 45.044776916503906, 46.50651931762695, 47.968265533447266, 49.43000793457031, 50.891754150390625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 6.0, 9.0, 6.0, 13.0, 12.0, 23.0, 28.0, 56.0, 84.0, 137.0, 232.0, 358.0, 645.0, 1200.0, 2365.0, 4960.0, 11105.0, 27430.0, 71735.0, 199896.0, 406447.0, 200985.0, 72188.0, 27349.0, 11045.0, 5026.0, 2391.0, 1236.0, 622.0, 388.0, 222.0, 129.0, 84.0, 47.0, 33.0, 30.0, 5.0, 9.0, 8.0, 5.0, 4.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.96875, -5.79058837890625, -5.6124267578125, -5.43426513671875, -5.256103515625, -5.07794189453125, -4.8997802734375, -4.72161865234375, -4.54345703125, -4.36529541015625, -4.1871337890625, -4.00897216796875, -3.830810546875, -3.65264892578125, -3.4744873046875, -3.29632568359375, -3.1181640625, -2.94000244140625, -2.7618408203125, -2.58367919921875, -2.405517578125, -2.22735595703125, -2.0491943359375, -1.87103271484375, -1.69287109375, -1.51470947265625, -1.3365478515625, -1.15838623046875, -0.980224609375, -0.80206298828125, -0.6239013671875, -0.44573974609375, -0.267578125, -0.08941650390625, 0.0887451171875, 0.26690673828125, 0.445068359375, 0.62322998046875, 0.8013916015625, 0.97955322265625, 1.15771484375, 1.33587646484375, 1.5140380859375, 1.69219970703125, 1.870361328125, 2.04852294921875, 2.2266845703125, 2.40484619140625, 2.5830078125, 2.76116943359375, 2.9393310546875, 3.11749267578125, 3.295654296875, 3.47381591796875, 3.6519775390625, 3.83013916015625, 4.00830078125, 4.18646240234375, 4.3646240234375, 4.54278564453125, 4.720947265625, 4.89910888671875, 5.0772705078125, 5.25543212890625, 5.43359375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 4.0, 7.0, 16.0, 9.0, 14.0, 24.0, 23.0, 44.0, 25.0, 42.0, 47.0, 51.0, 71.0, 69.0, 66.0, 53.0, 58.0, 56.0, 62.0, 61.0, 41.0, 37.0, 29.0, 18.0, 22.0, 18.0, 9.0, 9.0, 7.0, 4.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6796875, -2.5723876953125, -2.465087890625, -2.3577880859375, -2.25048828125, -2.1431884765625, -2.035888671875, -1.9285888671875, -1.8212890625, -1.7139892578125, -1.606689453125, -1.4993896484375, -1.39208984375, -1.2847900390625, -1.177490234375, -1.0701904296875, -0.962890625, -0.8555908203125, -0.748291015625, -0.6409912109375, -0.53369140625, -0.4263916015625, -0.319091796875, -0.2117919921875, -0.1044921875, 0.0028076171875, 0.110107421875, 0.2174072265625, 0.32470703125, 0.4320068359375, 0.539306640625, 0.6466064453125, 0.75390625, 0.8612060546875, 0.968505859375, 1.0758056640625, 1.18310546875, 1.2904052734375, 1.397705078125, 1.5050048828125, 1.6123046875, 1.7196044921875, 1.826904296875, 1.9342041015625, 2.04150390625, 2.1488037109375, 2.256103515625, 2.3634033203125, 2.470703125, 2.5780029296875, 2.685302734375, 2.7926025390625, 2.89990234375, 3.0072021484375, 3.114501953125, 3.2218017578125, 3.3291015625, 3.4364013671875, 3.543701171875, 3.6510009765625, 3.75830078125, 3.8656005859375, 3.972900390625, 4.0802001953125, 4.1875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 4.0, 5.0, 4.0, 9.0, 7.0, 19.0, 22.0, 32.0, 37.0, 59.0, 86.0, 155.0, 242.0, 364.0, 649.0, 1190.0, 2459.0, 6882.0, 26061.0, 157826.0, 686275.0, 132465.0, 22858.0, 5983.0, 2241.0, 1082.0, 572.0, 353.0, 229.0, 124.0, 76.0, 54.0, 40.0, 28.0, 22.0, 11.0, 10.0, 6.0, 8.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.78125, -9.4888916015625, -9.196533203125, -8.9041748046875, -8.61181640625, -8.3194580078125, -8.027099609375, -7.7347412109375, -7.4423828125, -7.1500244140625, -6.857666015625, -6.5653076171875, -6.27294921875, -5.9805908203125, -5.688232421875, -5.3958740234375, -5.103515625, -4.8111572265625, -4.518798828125, -4.2264404296875, -3.93408203125, -3.6417236328125, -3.349365234375, -3.0570068359375, -2.7646484375, -2.4722900390625, -2.179931640625, -1.8875732421875, -1.59521484375, -1.3028564453125, -1.010498046875, -0.7181396484375, -0.42578125, -0.1334228515625, 0.158935546875, 0.4512939453125, 0.74365234375, 1.0360107421875, 1.328369140625, 1.6207275390625, 1.9130859375, 2.2054443359375, 2.497802734375, 2.7901611328125, 3.08251953125, 3.3748779296875, 3.667236328125, 3.9595947265625, 4.251953125, 4.5443115234375, 4.836669921875, 5.1290283203125, 5.42138671875, 5.7137451171875, 6.006103515625, 6.2984619140625, 6.5908203125, 6.8831787109375, 7.175537109375, 7.4678955078125, 7.76025390625, 8.0526123046875, 8.344970703125, 8.6373291015625, 8.9296875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 2.0, 1.0, 5.0, 9.0, 11.0, 9.0, 14.0, 18.0, 20.0, 27.0, 29.0, 30.0, 23.0, 41.0, 45.0, 51.0, 58.0, 54.0, 52.0, 42.0, 55.0, 57.0, 55.0, 45.0, 38.0, 28.0, 38.0, 29.0, 19.0, 22.0, 11.0, 11.0, 15.0, 8.0, 13.0, 4.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6640625, -10.2723388671875, -9.880615234375, -9.4888916015625, -9.09716796875, -8.7054443359375, -8.313720703125, -7.9219970703125, -7.5302734375, -7.1385498046875, -6.746826171875, -6.3551025390625, -5.96337890625, -5.5716552734375, -5.179931640625, -4.7882080078125, -4.396484375, -4.0047607421875, -3.613037109375, -3.2213134765625, -2.82958984375, -2.4378662109375, -2.046142578125, -1.6544189453125, -1.2626953125, -0.8709716796875, -0.479248046875, -0.0875244140625, 0.30419921875, 0.6959228515625, 1.087646484375, 1.4793701171875, 1.87109375, 2.2628173828125, 2.654541015625, 3.0462646484375, 3.43798828125, 3.8297119140625, 4.221435546875, 4.6131591796875, 5.0048828125, 5.3966064453125, 5.788330078125, 6.1800537109375, 6.57177734375, 6.9635009765625, 7.355224609375, 7.7469482421875, 8.138671875, 8.5303955078125, 8.922119140625, 9.3138427734375, 9.70556640625, 10.0972900390625, 10.489013671875, 10.8807373046875, 11.2724609375, 11.6641845703125, 12.055908203125, 12.4476318359375, 12.83935546875, 13.2310791015625, 13.622802734375, 14.0145263671875, 14.40625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 5.0, 4.0, 3.0, 5.0, 12.0, 12.0, 22.0, 21.0, 38.0, 64.0, 101.0, 198.0, 350.0, 718.0, 2063.0, 7927.0, 57870.0, 780844.0, 176598.0, 16249.0, 3282.0, 1106.0, 490.0, 243.0, 120.0, 91.0, 34.0, 25.0, 19.0, 11.0, 10.0, 9.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.12109375, -4.9776611328125, -4.834228515625, -4.6907958984375, -4.54736328125, -4.4039306640625, -4.260498046875, -4.1170654296875, -3.9736328125, -3.8302001953125, -3.686767578125, -3.5433349609375, -3.39990234375, -3.2564697265625, -3.113037109375, -2.9696044921875, -2.826171875, -2.6827392578125, -2.539306640625, -2.3958740234375, -2.25244140625, -2.1090087890625, -1.965576171875, -1.8221435546875, -1.6787109375, -1.5352783203125, -1.391845703125, -1.2484130859375, -1.10498046875, -0.9615478515625, -0.818115234375, -0.6746826171875, -0.53125, -0.3878173828125, -0.244384765625, -0.1009521484375, 0.04248046875, 0.1859130859375, 0.329345703125, 0.4727783203125, 0.6162109375, 0.7596435546875, 0.903076171875, 1.0465087890625, 1.18994140625, 1.3333740234375, 1.476806640625, 1.6202392578125, 1.763671875, 1.9071044921875, 2.050537109375, 2.1939697265625, 2.33740234375, 2.4808349609375, 2.624267578125, 2.7677001953125, 2.9111328125, 3.0545654296875, 3.197998046875, 3.3414306640625, 3.48486328125, 3.6282958984375, 3.771728515625, 3.9151611328125, 4.05859375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 6.0, 3.0, 11.0, 3.0, 5.0, 7.0, 12.0, 13.0, 22.0, 27.0, 29.0, 42.0, 62.0, 66.0, 81.0, 94.0, 102.0, 85.0, 68.0, 56.0, 51.0, 32.0, 30.0, 23.0, 12.0, 11.0, 10.0, 12.0, 8.0, 7.0, 2.0, 1.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.0006971359252929688, -0.0006788335740566254, -0.000660531222820282, -0.0006422288715839386, -0.0006239265203475952, -0.0006056241691112518, -0.0005873218178749084, -0.0005690194666385651, -0.0005507171154022217, -0.0005324147641658783, -0.0005141124129295349, -0.0004958100616931915, -0.00047750771045684814, -0.00045920535922050476, -0.0004409030079841614, -0.000422600656747818, -0.0004042983055114746, -0.0003859959542751312, -0.00036769360303878784, -0.00034939125180244446, -0.0003310889005661011, -0.0003127865493297577, -0.0002944841980934143, -0.0002761818468570709, -0.00025787949562072754, -0.00023957714438438416, -0.00022127479314804077, -0.0002029724419116974, -0.000184670090675354, -0.00016636773943901062, -0.00014806538820266724, -0.00012976303696632385, -0.00011146068572998047, -9.315833449363708e-05, -7.48559832572937e-05, -5.655363202095032e-05, -3.8251280784606934e-05, -1.994892954826355e-05, -1.646578311920166e-06, 1.6655772924423218e-05, 3.49581241607666e-05, 5.3260475397109985e-05, 7.156282663345337e-05, 8.986517786979675e-05, 0.00010816752910614014, 0.00012646988034248352, 0.0001447722315788269, 0.0001630745828151703, 0.00018137693405151367, 0.00019967928528785706, 0.00021798163652420044, 0.00023628398776054382, 0.0002545863389968872, 0.0002728886902332306, 0.000291191041469574, 0.00030949339270591736, 0.00032779574394226074, 0.0003460980951786041, 0.0003644004464149475, 0.0003827027976512909, 0.0004010051488876343, 0.00041930750012397766, 0.00043760985136032104, 0.00045591220259666443, 0.0004742145538330078]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 5.0, 6.0, 3.0, 5.0, 7.0, 11.0, 15.0, 23.0, 33.0, 60.0, 128.0, 214.0, 406.0, 960.0, 2871.0, 12059.0, 101226.0, 804268.0, 108709.0, 12569.0, 2959.0, 1066.0, 422.0, 212.0, 131.0, 69.0, 44.0, 19.0, 17.0, 7.0, 9.0, 6.0, 6.0, 3.0, 6.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.61328125, -4.4796142578125, -4.345947265625, -4.2122802734375, -4.07861328125, -3.9449462890625, -3.811279296875, -3.6776123046875, -3.5439453125, -3.4102783203125, -3.276611328125, -3.1429443359375, -3.00927734375, -2.8756103515625, -2.741943359375, -2.6082763671875, -2.474609375, -2.3409423828125, -2.207275390625, -2.0736083984375, -1.93994140625, -1.8062744140625, -1.672607421875, -1.5389404296875, -1.4052734375, -1.2716064453125, -1.137939453125, -1.0042724609375, -0.87060546875, -0.7369384765625, -0.603271484375, -0.4696044921875, -0.3359375, -0.2022705078125, -0.068603515625, 0.0650634765625, 0.19873046875, 0.3323974609375, 0.466064453125, 0.5997314453125, 0.7333984375, 0.8670654296875, 1.000732421875, 1.1343994140625, 1.26806640625, 1.4017333984375, 1.535400390625, 1.6690673828125, 1.802734375, 1.9364013671875, 2.070068359375, 2.2037353515625, 2.33740234375, 2.4710693359375, 2.604736328125, 2.7384033203125, 2.8720703125, 3.0057373046875, 3.139404296875, 3.2730712890625, 3.40673828125, 3.5404052734375, 3.674072265625, 3.8077392578125, 3.94140625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 12.0, 8.0, 8.0, 5.0, 11.0, 25.0, 22.0, 29.0, 37.0, 50.0, 63.0, 67.0, 83.0, 99.0, 77.0, 67.0, 67.0, 64.0, 35.0, 37.0, 28.0, 22.0, 14.0, 20.0, 13.0, 10.0, 4.0, 7.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.365234375, -3.251861572265625, -3.13848876953125, -3.025115966796875, -2.9117431640625, -2.798370361328125, -2.68499755859375, -2.571624755859375, -2.458251953125, -2.344879150390625, -2.23150634765625, -2.118133544921875, -2.0047607421875, -1.891387939453125, -1.77801513671875, -1.664642333984375, -1.55126953125, -1.437896728515625, -1.32452392578125, -1.211151123046875, -1.0977783203125, -0.984405517578125, -0.87103271484375, -0.757659912109375, -0.644287109375, -0.530914306640625, -0.41754150390625, -0.304168701171875, -0.1907958984375, -0.077423095703125, 0.03594970703125, 0.149322509765625, 0.2626953125, 0.376068115234375, 0.48944091796875, 0.602813720703125, 0.7161865234375, 0.829559326171875, 0.94293212890625, 1.056304931640625, 1.169677734375, 1.283050537109375, 1.39642333984375, 1.509796142578125, 1.6231689453125, 1.736541748046875, 1.84991455078125, 1.963287353515625, 2.07666015625, 2.190032958984375, 2.30340576171875, 2.416778564453125, 2.5301513671875, 2.643524169921875, 2.75689697265625, 2.870269775390625, 2.983642578125, 3.097015380859375, 3.21038818359375, 3.323760986328125, 3.4371337890625, 3.550506591796875, 3.66387939453125, 3.777252197265625, 3.890625]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 10.0, 21.0, 59.0, 142.0, 294.0, 245.0, 134.0, 53.0, 19.0, 6.0, 6.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.8255844116211, -77.13379669189453, -73.44200897216797, -69.7502212524414, -66.05843353271484, -62.36664581298828, -58.67485427856445, -54.98306655883789, -51.29127883911133, -47.599491119384766, -43.9077033996582, -40.215911865234375, -36.52412414550781, -32.83233642578125, -29.140548706054688, -25.448760986328125, -21.756973266601562, -18.065185546875, -14.373396873474121, -10.681608200073242, -6.98982048034668, -3.298032760620117, 0.3937568664550781, 4.085544586181641, 7.777332305908203, 11.469120025634766, 15.160908699035645, 18.852697372436523, 22.544485092163086, 26.23627281188965, 29.928062438964844, 33.619850158691406, 37.31163024902344, 41.00341796875, 44.69520568847656, 48.386993408203125, 52.07878112792969, 55.77056884765625, 59.46236038208008, 63.15414810180664, 66.84593200683594, 70.5377197265625, 74.22950744628906, 77.92129516601562, 81.61308288574219, 85.30487060546875, 88.99665832519531, 92.68844604492188, 96.38024139404297, 100.07202911376953, 103.7638168334961, 107.45560455322266, 111.14739227294922, 114.83917999267578, 118.53097534179688, 122.22276306152344, 125.91455078125, 129.60633850097656, 133.29812622070312, 136.9899139404297, 140.68170166015625, 144.3734893798828, 148.06527709960938, 151.75706481933594, 155.4488525390625]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 5.0, 4.0, 6.0, 12.0, 13.0, 18.0, 15.0, 30.0, 39.0, 47.0, 45.0, 50.0, 67.0, 81.0, 95.0, 86.0, 69.0, 57.0, 56.0, 46.0, 28.0, 32.0, 26.0, 17.0, 18.0, 15.0, 11.0, 6.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.80537414550781, -81.68424224853516, -79.56311798095703, -77.44198608398438, -75.32085418701172, -73.19972229003906, -71.07859802246094, -68.95746612548828, -66.83633422851562, -64.71520233154297, -62.59407424926758, -60.47294616699219, -58.35181427001953, -56.23068618774414, -54.10955810546875, -51.988426208496094, -49.86730194091797, -47.74617385864258, -45.62504196166992, -43.50391387939453, -41.382781982421875, -39.261653900146484, -37.140525817871094, -35.01939392089844, -32.89826583862305, -30.777135848999023, -28.656005859375, -26.53487777709961, -24.413747787475586, -22.292617797851562, -20.171489715576172, -18.05035972595215, -15.929237365722656, -13.808107376098633, -11.686978340148926, -9.565849304199219, -7.444719314575195, -5.323589324951172, -3.202460289001465, -1.0813312530517578, 1.0397987365722656, 3.160928249359131, 5.282057762145996, 7.403187274932861, 9.524316787719727, 11.64544677734375, 13.766575813293457, 15.887704849243164, 18.008834838867188, 20.12996482849121, 22.251094818115234, 24.372222900390625, 26.49335289001465, 28.614482879638672, 30.735610961914062, 32.85674285888672, 34.97787094116211, 37.0989990234375, 39.220130920410156, 41.34125900268555, 43.46238708496094, 45.583518981933594, 47.704647064208984, 49.825775146484375, 51.94690704345703]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 7.0, 3.0, 7.0, 9.0, 15.0, 15.0, 13.0, 27.0, 39.0, 62.0, 84.0, 154.0, 246.0, 533.0, 1909.0, 10233.0, 221264.0, 3922615.0, 31313.0, 4014.0, 988.0, 314.0, 166.0, 75.0, 45.0, 39.0, 24.0, 16.0, 11.0, 13.0, 4.0, 3.0, 5.0, 2.0, 3.0, 7.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.90625, -11.468994140625, -11.03173828125, -10.594482421875, -10.1572265625, -9.719970703125, -9.28271484375, -8.845458984375, -8.408203125, -7.970947265625, -7.53369140625, -7.096435546875, -6.6591796875, -6.221923828125, -5.78466796875, -5.347412109375, -4.91015625, -4.472900390625, -4.03564453125, -3.598388671875, -3.1611328125, -2.723876953125, -2.28662109375, -1.849365234375, -1.412109375, -0.974853515625, -0.53759765625, -0.100341796875, 0.3369140625, 0.774169921875, 1.21142578125, 1.648681640625, 2.0859375, 2.523193359375, 2.96044921875, 3.397705078125, 3.8349609375, 4.272216796875, 4.70947265625, 5.146728515625, 5.583984375, 6.021240234375, 6.45849609375, 6.895751953125, 7.3330078125, 7.770263671875, 8.20751953125, 8.644775390625, 9.08203125, 9.519287109375, 9.95654296875, 10.393798828125, 10.8310546875, 11.268310546875, 11.70556640625, 12.142822265625, 12.580078125, 13.017333984375, 13.45458984375, 13.891845703125, 14.3291015625, 14.766357421875, 15.20361328125, 15.640869140625, 16.078125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 6.0, 6.0, 18.0, 21.0, 35.0, 55.0, 68.0, 79.0, 105.0, 88.0, 88.0, 103.0, 93.0, 62.0, 54.0, 34.0, 43.0, 23.0, 13.0, 7.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.37109375, -7.21484375, -7.05859375, -6.90234375, -6.74609375, -6.58984375, -6.43359375, -6.27734375, -6.12109375, -5.96484375, -5.80859375, -5.65234375, -5.49609375, -5.33984375, -5.18359375, -5.02734375, -4.87109375, -4.71484375, -4.55859375, -4.40234375, -4.24609375, -4.08984375, -3.93359375, -3.77734375, -3.62109375, -3.46484375, -3.30859375, -3.15234375, -2.99609375, -2.83984375, -2.68359375, -2.52734375, -2.37109375, -2.21484375, -2.05859375, -1.90234375, -1.74609375, -1.58984375, -1.43359375, -1.27734375, -1.12109375, -0.96484375, -0.80859375, -0.65234375, -0.49609375, -0.33984375, -0.18359375, -0.02734375, 0.12890625, 0.28515625, 0.44140625, 0.59765625, 0.75390625, 0.91015625, 1.06640625, 1.22265625, 1.37890625, 1.53515625, 1.69140625, 1.84765625, 2.00390625, 2.16015625, 2.31640625, 2.47265625, 2.62890625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 5.0, 9.0, 11.0, 16.0, 17.0, 36.0, 65.0, 114.0, 209.0, 421.0, 947.0, 1970.0, 4483.0, 11180.0, 30235.0, 116562.0, 2621217.0, 1282348.0, 85756.0, 23408.0, 8729.0, 3540.0, 1552.0, 708.0, 318.0, 182.0, 103.0, 38.0, 45.0, 20.0, 16.0, 12.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4453125, -5.2633056640625, -5.081298828125, -4.8992919921875, -4.71728515625, -4.5352783203125, -4.353271484375, -4.1712646484375, -3.9892578125, -3.8072509765625, -3.625244140625, -3.4432373046875, -3.26123046875, -3.0792236328125, -2.897216796875, -2.7152099609375, -2.533203125, -2.3511962890625, -2.169189453125, -1.9871826171875, -1.80517578125, -1.6231689453125, -1.441162109375, -1.2591552734375, -1.0771484375, -0.8951416015625, -0.713134765625, -0.5311279296875, -0.34912109375, -0.1671142578125, 0.014892578125, 0.1968994140625, 0.37890625, 0.5609130859375, 0.742919921875, 0.9249267578125, 1.10693359375, 1.2889404296875, 1.470947265625, 1.6529541015625, 1.8349609375, 2.0169677734375, 2.198974609375, 2.3809814453125, 2.56298828125, 2.7449951171875, 2.927001953125, 3.1090087890625, 3.291015625, 3.4730224609375, 3.655029296875, 3.8370361328125, 4.01904296875, 4.2010498046875, 4.383056640625, 4.5650634765625, 4.7470703125, 4.9290771484375, 5.111083984375, 5.2930908203125, 5.47509765625, 5.6571044921875, 5.839111328125, 6.0211181640625, 6.203125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 6.0, 5.0, 8.0, 4.0, 11.0, 21.0, 18.0, 22.0, 20.0, 50.0, 44.0, 77.0, 118.0, 212.0, 448.0, 999.0, 958.0, 449.0, 200.0, 154.0, 72.0, 50.0, 32.0, 17.0, 13.0, 5.0, 12.0, 5.0, 7.0, 5.0, 6.0, 7.0, 5.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.64453125, -5.46246337890625, -5.2803955078125, -5.09832763671875, -4.916259765625, -4.73419189453125, -4.5521240234375, -4.37005615234375, -4.18798828125, -4.00592041015625, -3.8238525390625, -3.64178466796875, -3.459716796875, -3.27764892578125, -3.0955810546875, -2.91351318359375, -2.7314453125, -2.54937744140625, -2.3673095703125, -2.18524169921875, -2.003173828125, -1.82110595703125, -1.6390380859375, -1.45697021484375, -1.27490234375, -1.09283447265625, -0.9107666015625, -0.72869873046875, -0.546630859375, -0.36456298828125, -0.1824951171875, -0.00042724609375, 0.181640625, 0.36370849609375, 0.5457763671875, 0.72784423828125, 0.909912109375, 1.09197998046875, 1.2740478515625, 1.45611572265625, 1.63818359375, 1.82025146484375, 2.0023193359375, 2.18438720703125, 2.366455078125, 2.54852294921875, 2.7305908203125, 2.91265869140625, 3.0947265625, 3.27679443359375, 3.4588623046875, 3.64093017578125, 3.822998046875, 4.00506591796875, 4.1871337890625, 4.36920166015625, 4.55126953125, 4.73333740234375, 4.9154052734375, 5.09747314453125, 5.279541015625, 5.46160888671875, 5.6436767578125, 5.82574462890625, 6.0078125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 12.0, 7.0, 15.0, 50.0, 150.0, 276.0, 250.0, 161.0, 35.0, 15.0, 8.0, 2.0, 5.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-102.70965576171875, -100.08948516845703, -97.46932220458984, -94.84915161132812, -92.22898864746094, -89.60881805419922, -86.9886474609375, -84.36848449707031, -81.7483139038086, -79.12814331054688, -76.50798034667969, -73.88780975341797, -71.26763916015625, -68.64747619628906, -66.02730560302734, -63.40713882446289, -60.78697204589844, -58.166805267333984, -55.54663848876953, -52.92646789550781, -50.30630111694336, -47.686134338378906, -45.06596374511719, -42.445796966552734, -39.82563018798828, -37.20546340942383, -34.585296630859375, -31.965126037597656, -29.344959259033203, -26.72479248046875, -24.104623794555664, -21.484455108642578, -18.864295959472656, -16.244129180908203, -13.623960494995117, -11.003792762756348, -8.383625030517578, -5.763457298278809, -3.143289566040039, -0.5231208801269531, 2.0970458984375, 4.7172136306762695, 7.337381362915039, 9.957549095153809, 12.577716827392578, 15.197884559631348, 17.818052291870117, 20.438220977783203, 23.058387756347656, 25.67855453491211, 28.298723220825195, 30.91889190673828, 33.539058685302734, 36.15922546386719, 38.779396057128906, 41.39956283569336, 44.01972961425781, 46.639896392822266, 49.26006317138672, 51.88023376464844, 54.50040054321289, 57.120567321777344, 59.74073791503906, 62.360904693603516, 64.98107147216797]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 6.0, 6.0, 2.0, 7.0, 18.0, 15.0, 18.0, 23.0, 35.0, 48.0, 38.0, 54.0, 61.0, 61.0, 73.0, 65.0, 64.0, 55.0, 51.0, 60.0, 56.0, 42.0, 41.0, 22.0, 23.0, 22.0, 13.0, 12.0, 10.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-46.1634521484375, -44.91395568847656, -43.664459228515625, -42.41495895385742, -41.165462493896484, -39.91596603393555, -38.666465759277344, -37.416969299316406, -36.16747283935547, -34.91797637939453, -33.668479919433594, -32.41897964477539, -31.169483184814453, -29.919986724853516, -28.670488357543945, -27.420989990234375, -26.171493530273438, -24.9219970703125, -23.67249870300293, -22.42300033569336, -21.173503875732422, -19.924007415771484, -18.674509048461914, -17.425010681152344, -16.175514221191406, -14.926016807556152, -13.676519393920898, -12.427021980285645, -11.17752456665039, -9.928027153015137, -8.678529739379883, -7.429032325744629, -6.179534912109375, -4.930037498474121, -3.680540084838867, -2.4310426712036133, -1.1815452575683594, 0.06795215606689453, 1.3174495697021484, 2.5669469833374023, 3.8164443969726562, 5.06594181060791, 6.315439224243164, 7.564936637878418, 8.814434051513672, 10.063931465148926, 11.31342887878418, 12.562926292419434, 13.812423706054688, 15.061921119689941, 16.311418533325195, 17.560916900634766, 18.810413360595703, 20.05990982055664, 21.30940818786621, 22.55890655517578, 23.80840301513672, 25.057899475097656, 26.307397842407227, 27.556896209716797, 28.806392669677734, 30.055889129638672, 31.305387496948242, 32.55488586425781, 33.80438232421875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 3.0, 6.0, 4.0, 7.0, 12.0, 20.0, 30.0, 34.0, 49.0, 98.0, 132.0, 221.0, 352.0, 651.0, 1063.0, 1959.0, 3707.0, 7069.0, 14741.0, 32462.0, 75728.0, 192327.0, 384120.0, 194358.0, 76276.0, 32673.0, 15038.0, 7057.0, 3727.0, 1965.0, 1078.0, 625.0, 361.0, 215.0, 140.0, 76.0, 46.0, 38.0, 33.0, 20.0, 12.0, 5.0, 8.0, 9.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.45703125, -4.30596923828125, -4.1549072265625, -4.00384521484375, -3.852783203125, -3.70172119140625, -3.5506591796875, -3.39959716796875, -3.24853515625, -3.09747314453125, -2.9464111328125, -2.79534912109375, -2.644287109375, -2.49322509765625, -2.3421630859375, -2.19110107421875, -2.0400390625, -1.88897705078125, -1.7379150390625, -1.58685302734375, -1.435791015625, -1.28472900390625, -1.1336669921875, -0.98260498046875, -0.83154296875, -0.68048095703125, -0.5294189453125, -0.37835693359375, -0.227294921875, -0.07623291015625, 0.0748291015625, 0.22589111328125, 0.376953125, 0.52801513671875, 0.6790771484375, 0.83013916015625, 0.981201171875, 1.13226318359375, 1.2833251953125, 1.43438720703125, 1.58544921875, 1.73651123046875, 1.8875732421875, 2.03863525390625, 2.189697265625, 2.34075927734375, 2.4918212890625, 2.64288330078125, 2.7939453125, 2.94500732421875, 3.0960693359375, 3.24713134765625, 3.398193359375, 3.54925537109375, 3.7003173828125, 3.85137939453125, 4.00244140625, 4.15350341796875, 4.3045654296875, 4.45562744140625, 4.606689453125, 4.75775146484375, 4.9088134765625, 5.05987548828125, 5.2109375]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 6.0, 8.0, 12.0, 15.0, 18.0, 28.0, 28.0, 37.0, 42.0, 52.0, 53.0, 54.0, 50.0, 51.0, 62.0, 64.0, 49.0, 49.0, 61.0, 48.0, 28.0, 40.0, 31.0, 27.0, 26.0, 18.0, 11.0, 13.0, 3.0, 8.0, 5.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-4.16796875, -4.0679931640625, -3.968017578125, -3.8680419921875, -3.76806640625, -3.6680908203125, -3.568115234375, -3.4681396484375, -3.3681640625, -3.2681884765625, -3.168212890625, -3.0682373046875, -2.96826171875, -2.8682861328125, -2.768310546875, -2.6683349609375, -2.568359375, -2.4683837890625, -2.368408203125, -2.2684326171875, -2.16845703125, -2.0684814453125, -1.968505859375, -1.8685302734375, -1.7685546875, -1.6685791015625, -1.568603515625, -1.4686279296875, -1.36865234375, -1.2686767578125, -1.168701171875, -1.0687255859375, -0.96875, -0.8687744140625, -0.768798828125, -0.6688232421875, -0.56884765625, -0.4688720703125, -0.368896484375, -0.2689208984375, -0.1689453125, -0.0689697265625, 0.031005859375, 0.1309814453125, 0.23095703125, 0.3309326171875, 0.430908203125, 0.5308837890625, 0.630859375, 0.7308349609375, 0.830810546875, 0.9307861328125, 1.03076171875, 1.1307373046875, 1.230712890625, 1.3306884765625, 1.4306640625, 1.5306396484375, 1.630615234375, 1.7305908203125, 1.83056640625, 1.9305419921875, 2.030517578125, 2.1304931640625, 2.23046875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 4.0, 4.0, 4.0, 4.0, 8.0, 11.0, 13.0, 16.0, 30.0, 35.0, 73.0, 133.0, 223.0, 600.0, 1705.0, 6711.0, 46955.0, 683045.0, 278784.0, 23894.0, 4179.0, 1191.0, 487.0, 192.0, 114.0, 53.0, 36.0, 18.0, 7.0, 9.0, 6.0, 5.0, 6.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0], "bins": [-17.234375, -16.822509765625, -16.41064453125, -15.998779296875, -15.5869140625, -15.175048828125, -14.76318359375, -14.351318359375, -13.939453125, -13.527587890625, -13.11572265625, -12.703857421875, -12.2919921875, -11.880126953125, -11.46826171875, -11.056396484375, -10.64453125, -10.232666015625, -9.82080078125, -9.408935546875, -8.9970703125, -8.585205078125, -8.17333984375, -7.761474609375, -7.349609375, -6.937744140625, -6.52587890625, -6.114013671875, -5.7021484375, -5.290283203125, -4.87841796875, -4.466552734375, -4.0546875, -3.642822265625, -3.23095703125, -2.819091796875, -2.4072265625, -1.995361328125, -1.58349609375, -1.171630859375, -0.759765625, -0.347900390625, 0.06396484375, 0.475830078125, 0.8876953125, 1.299560546875, 1.71142578125, 2.123291015625, 2.53515625, 2.947021484375, 3.35888671875, 3.770751953125, 4.1826171875, 4.594482421875, 5.00634765625, 5.418212890625, 5.830078125, 6.241943359375, 6.65380859375, 7.065673828125, 7.4775390625, 7.889404296875, 8.30126953125, 8.713134765625, 9.125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 5.0, 2.0, 4.0, 4.0, 3.0, 7.0, 9.0, 10.0, 13.0, 16.0, 15.0, 34.0, 27.0, 28.0, 37.0, 48.0, 32.0, 42.0, 48.0, 65.0, 55.0, 57.0, 56.0, 53.0, 40.0, 41.0, 25.0, 34.0, 33.0, 33.0, 29.0, 24.0, 14.0, 14.0, 7.0, 8.0, 4.0, 6.0, 4.0, 7.0, 3.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.609375, -10.2681884765625, -9.927001953125, -9.5858154296875, -9.24462890625, -8.9034423828125, -8.562255859375, -8.2210693359375, -7.8798828125, -7.5386962890625, -7.197509765625, -6.8563232421875, -6.51513671875, -6.1739501953125, -5.832763671875, -5.4915771484375, -5.150390625, -4.8092041015625, -4.468017578125, -4.1268310546875, -3.78564453125, -3.4444580078125, -3.103271484375, -2.7620849609375, -2.4208984375, -2.0797119140625, -1.738525390625, -1.3973388671875, -1.05615234375, -0.7149658203125, -0.373779296875, -0.0325927734375, 0.30859375, 0.6497802734375, 0.990966796875, 1.3321533203125, 1.67333984375, 2.0145263671875, 2.355712890625, 2.6968994140625, 3.0380859375, 3.3792724609375, 3.720458984375, 4.0616455078125, 4.40283203125, 4.7440185546875, 5.085205078125, 5.4263916015625, 5.767578125, 6.1087646484375, 6.449951171875, 6.7911376953125, 7.13232421875, 7.4735107421875, 7.814697265625, 8.1558837890625, 8.4970703125, 8.8382568359375, 9.179443359375, 9.5206298828125, 9.86181640625, 10.2030029296875, 10.544189453125, 10.8853759765625, 11.2265625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 5.0, 6.0, 14.0, 9.0, 24.0, 41.0, 50.0, 93.0, 181.0, 448.0, 1416.0, 8536.0, 724529.0, 304932.0, 6261.0, 1234.0, 393.0, 156.0, 85.0, 55.0, 32.0, 23.0, 12.0, 7.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8125, -8.51806640625, -8.2236328125, -7.92919921875, -7.634765625, -7.34033203125, -7.0458984375, -6.75146484375, -6.45703125, -6.16259765625, -5.8681640625, -5.57373046875, -5.279296875, -4.98486328125, -4.6904296875, -4.39599609375, -4.1015625, -3.80712890625, -3.5126953125, -3.21826171875, -2.923828125, -2.62939453125, -2.3349609375, -2.04052734375, -1.74609375, -1.45166015625, -1.1572265625, -0.86279296875, -0.568359375, -0.27392578125, 0.0205078125, 0.31494140625, 0.609375, 0.90380859375, 1.1982421875, 1.49267578125, 1.787109375, 2.08154296875, 2.3759765625, 2.67041015625, 2.96484375, 3.25927734375, 3.5537109375, 3.84814453125, 4.142578125, 4.43701171875, 4.7314453125, 5.02587890625, 5.3203125, 5.61474609375, 5.9091796875, 6.20361328125, 6.498046875, 6.79248046875, 7.0869140625, 7.38134765625, 7.67578125, 7.97021484375, 8.2646484375, 8.55908203125, 8.853515625, 9.14794921875, 9.4423828125, 9.73681640625, 10.03125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 7.0, 8.0, 9.0, 23.0, 44.0, 125.0, 304.0, 275.0, 127.0, 54.0, 23.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0021839141845703125, -0.002117753028869629, -0.0020515918731689453, -0.0019854307174682617, -0.0019192695617675781, -0.0018531084060668945, -0.001786947250366211, -0.0017207860946655273, -0.0016546249389648438, -0.0015884637832641602, -0.0015223026275634766, -0.001456141471862793, -0.0013899803161621094, -0.0013238191604614258, -0.0012576580047607422, -0.0011914968490600586, -0.001125335693359375, -0.0010591745376586914, -0.0009930133819580078, -0.0009268522262573242, -0.0008606910705566406, -0.000794529914855957, -0.0007283687591552734, -0.0006622076034545898, -0.0005960464477539062, -0.0005298852920532227, -0.00046372413635253906, -0.00039756298065185547, -0.0003314018249511719, -0.0002652406692504883, -0.0001990795135498047, -0.0001329183578491211, -6.67572021484375e-05, -5.960464477539062e-07, 6.556510925292969e-05, 0.00013172626495361328, 0.00019788742065429688, 0.00026404857635498047, 0.00033020973205566406, 0.00039637088775634766, 0.00046253204345703125, 0.0005286931991577148, 0.0005948543548583984, 0.000661015510559082, 0.0007271766662597656, 0.0007933378219604492, 0.0008594989776611328, 0.0009256601333618164, 0.0009918212890625, 0.0010579824447631836, 0.0011241436004638672, 0.0011903047561645508, 0.0012564659118652344, 0.001322627067565918, 0.0013887882232666016, 0.0014549493789672852, 0.0015211105346679688, 0.0015872716903686523, 0.001653432846069336, 0.0017195940017700195, 0.0017857551574707031, 0.0018519163131713867, 0.0019180774688720703, 0.001984238624572754, 0.0020503997802734375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 6.0, 9.0, 14.0, 23.0, 48.0, 104.0, 214.0, 610.0, 2685.0, 28948.0, 944713.0, 65908.0, 3969.0, 785.0, 268.0, 111.0, 62.0, 24.0, 24.0, 14.0, 7.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.59765625, -5.36053466796875, -5.1234130859375, -4.88629150390625, -4.649169921875, -4.41204833984375, -4.1749267578125, -3.93780517578125, -3.70068359375, -3.46356201171875, -3.2264404296875, -2.98931884765625, -2.752197265625, -2.51507568359375, -2.2779541015625, -2.04083251953125, -1.8037109375, -1.56658935546875, -1.3294677734375, -1.09234619140625, -0.855224609375, -0.61810302734375, -0.3809814453125, -0.14385986328125, 0.09326171875, 0.33038330078125, 0.5675048828125, 0.80462646484375, 1.041748046875, 1.27886962890625, 1.5159912109375, 1.75311279296875, 1.990234375, 2.22735595703125, 2.4644775390625, 2.70159912109375, 2.938720703125, 3.17584228515625, 3.4129638671875, 3.65008544921875, 3.88720703125, 4.12432861328125, 4.3614501953125, 4.59857177734375, 4.835693359375, 5.07281494140625, 5.3099365234375, 5.54705810546875, 5.7841796875, 6.02130126953125, 6.2584228515625, 6.49554443359375, 6.732666015625, 6.96978759765625, 7.2069091796875, 7.44403076171875, 7.68115234375, 7.91827392578125, 8.1553955078125, 8.39251708984375, 8.629638671875, 8.86676025390625, 9.1038818359375, 9.34100341796875, 9.578125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 6.0, 2.0, 2.0, 5.0, 10.0, 16.0, 25.0, 27.0, 64.0, 86.0, 144.0, 173.0, 155.0, 110.0, 74.0, 42.0, 26.0, 12.0, 8.0, 8.0, 1.0, 7.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.89453125, -7.704833984375, -7.51513671875, -7.325439453125, -7.1357421875, -6.946044921875, -6.75634765625, -6.566650390625, -6.376953125, -6.187255859375, -5.99755859375, -5.807861328125, -5.6181640625, -5.428466796875, -5.23876953125, -5.049072265625, -4.859375, -4.669677734375, -4.47998046875, -4.290283203125, -4.1005859375, -3.910888671875, -3.72119140625, -3.531494140625, -3.341796875, -3.152099609375, -2.96240234375, -2.772705078125, -2.5830078125, -2.393310546875, -2.20361328125, -2.013916015625, -1.82421875, -1.634521484375, -1.44482421875, -1.255126953125, -1.0654296875, -0.875732421875, -0.68603515625, -0.496337890625, -0.306640625, -0.116943359375, 0.07275390625, 0.262451171875, 0.4521484375, 0.641845703125, 0.83154296875, 1.021240234375, 1.2109375, 1.400634765625, 1.59033203125, 1.780029296875, 1.9697265625, 2.159423828125, 2.34912109375, 2.538818359375, 2.728515625, 2.918212890625, 3.10791015625, 3.297607421875, 3.4873046875, 3.677001953125, 3.86669921875, 4.056396484375, 4.24609375]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 4.0, 6.0, 7.0, 18.0, 35.0, 56.0, 131.0, 219.0, 209.0, 133.0, 74.0, 44.0, 34.0, 11.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.428253173828125, -54.912776947021484, -52.397300720214844, -49.8818244934082, -47.36634826660156, -44.85087203979492, -42.33539581298828, -39.81991958618164, -37.304443359375, -34.78896713256836, -32.27349090576172, -29.758014678955078, -27.242538452148438, -24.727062225341797, -22.211585998535156, -19.696109771728516, -17.180633544921875, -14.665157318115234, -12.149681091308594, -9.634204864501953, -7.1187286376953125, -4.603252410888672, -2.0877761840820312, 0.4277000427246094, 2.94317626953125, 5.458652496337891, 7.974128723144531, 10.489604949951172, 13.005081176757812, 15.520557403564453, 18.036033630371094, 20.551509857177734, 23.066986083984375, 25.582462310791016, 28.097938537597656, 30.613414764404297, 33.12889099121094, 35.64436721801758, 38.15984344482422, 40.67531967163086, 43.1907958984375, 45.70627212524414, 48.22174835205078, 50.73722457885742, 53.25270080566406, 55.7681770324707, 58.283653259277344, 60.799129486083984, 63.314605712890625, 65.830078125, 68.3455581665039, 70.86103820800781, 73.37651062011719, 75.89198303222656, 78.40746307373047, 80.92294311523438, 83.43841552734375, 85.95388793945312, 88.46936798095703, 90.98484802246094, 93.50032043457031, 96.01579284667969, 98.5312728881836, 101.0467529296875, 103.56222534179688]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 0.0, 3.0, 1.0, 5.0, 5.0, 8.0, 5.0, 11.0, 6.0, 13.0, 15.0, 19.0, 22.0, 18.0, 28.0, 24.0, 32.0, 36.0, 29.0, 30.0, 38.0, 48.0, 43.0, 65.0, 51.0, 45.0, 43.0, 41.0, 41.0, 47.0, 36.0, 41.0, 22.0, 17.0, 14.0, 20.0, 13.0, 18.0, 10.0, 7.0, 6.0, 5.0, 6.0, 5.0, 4.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-44.51716232299805, -43.176795959472656, -41.83642578125, -40.49605941772461, -39.15569305419922, -37.81532287597656, -36.47495651245117, -35.13459014892578, -33.794219970703125, -32.453853607177734, -31.113483428955078, -29.773117065429688, -28.432748794555664, -27.09238052368164, -25.75201416015625, -24.411645889282227, -23.071277618408203, -21.73090934753418, -20.390541076660156, -19.050174713134766, -17.709806442260742, -16.36943817138672, -15.029070854187012, -13.688703536987305, -12.348335266113281, -11.007966995239258, -9.66759967803955, -8.327232360839844, -6.98686408996582, -5.646496295928955, -4.30612850189209, -2.965761184692383, -1.625396728515625, -0.28502893447875977, 1.0553388595581055, 2.3957066535949707, 3.736074447631836, 5.076442241668701, 6.416810035705566, 7.757177352905273, 9.097545623779297, 10.43791389465332, 11.778281211853027, 13.118648529052734, 14.459016799926758, 15.799385070800781, 17.139751434326172, 18.480119705200195, 19.82048797607422, 21.160856246948242, 22.501224517822266, 23.841590881347656, 25.18195915222168, 26.522327423095703, 27.862693786621094, 29.203062057495117, 30.54343032836914, 31.883798599243164, 33.22416687011719, 34.56453323364258, 35.90489959716797, 37.245269775390625, 38.585636138916016, 39.926002502441406, 41.26637268066406]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 9.0, 7.0, 8.0, 17.0, 23.0, 31.0, 26.0, 72.0, 97.0, 137.0, 274.0, 542.0, 1373.0, 4228.0, 17865.0, 137991.0, 3441790.0, 541490.0, 37580.0, 7118.0, 2042.0, 765.0, 337.0, 168.0, 115.0, 62.0, 29.0, 23.0, 17.0, 7.0, 10.0, 7.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.4765625, -7.2728271484375, -7.069091796875, -6.8653564453125, -6.66162109375, -6.4578857421875, -6.254150390625, -6.0504150390625, -5.8466796875, -5.6429443359375, -5.439208984375, -5.2354736328125, -5.03173828125, -4.8280029296875, -4.624267578125, -4.4205322265625, -4.216796875, -4.0130615234375, -3.809326171875, -3.6055908203125, -3.40185546875, -3.1981201171875, -2.994384765625, -2.7906494140625, -2.5869140625, -2.3831787109375, -2.179443359375, -1.9757080078125, -1.77197265625, -1.5682373046875, -1.364501953125, -1.1607666015625, -0.95703125, -0.7532958984375, -0.549560546875, -0.3458251953125, -0.14208984375, 0.0616455078125, 0.265380859375, 0.4691162109375, 0.6728515625, 0.8765869140625, 1.080322265625, 1.2840576171875, 1.48779296875, 1.6915283203125, 1.895263671875, 2.0989990234375, 2.302734375, 2.5064697265625, 2.710205078125, 2.9139404296875, 3.11767578125, 3.3214111328125, 3.525146484375, 3.7288818359375, 3.9326171875, 4.1363525390625, 4.340087890625, 4.5438232421875, 4.74755859375, 4.9512939453125, 5.155029296875, 5.3587646484375, 5.5625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 4.0, 4.0, 7.0, 10.0, 5.0, 13.0, 16.0, 17.0, 27.0, 33.0, 32.0, 31.0, 42.0, 34.0, 44.0, 48.0, 39.0, 41.0, 59.0, 49.0, 62.0, 46.0, 37.0, 50.0, 42.0, 42.0, 35.0, 14.0, 23.0, 16.0, 18.0, 13.0, 11.0, 16.0, 10.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.751953125, -2.6784210205078125, -2.604888916015625, -2.5313568115234375, -2.45782470703125, -2.3842926025390625, -2.310760498046875, -2.2372283935546875, -2.1636962890625, -2.0901641845703125, -2.016632080078125, -1.9430999755859375, -1.86956787109375, -1.7960357666015625, -1.722503662109375, -1.6489715576171875, -1.575439453125, -1.5019073486328125, -1.428375244140625, -1.3548431396484375, -1.28131103515625, -1.2077789306640625, -1.134246826171875, -1.0607147216796875, -0.9871826171875, -0.9136505126953125, -0.840118408203125, -0.7665863037109375, -0.69305419921875, -0.6195220947265625, -0.545989990234375, -0.4724578857421875, -0.39892578125, -0.3253936767578125, -0.251861572265625, -0.1783294677734375, -0.10479736328125, -0.0312652587890625, 0.042266845703125, 0.1157989501953125, 0.1893310546875, 0.2628631591796875, 0.336395263671875, 0.4099273681640625, 0.48345947265625, 0.5569915771484375, 0.630523681640625, 0.7040557861328125, 0.777587890625, 0.8511199951171875, 0.924652099609375, 0.9981842041015625, 1.07171630859375, 1.1452484130859375, 1.218780517578125, 1.2923126220703125, 1.3658447265625, 1.4393768310546875, 1.512908935546875, 1.5864410400390625, 1.65997314453125, 1.7335052490234375, 1.807037353515625, 1.8805694580078125, 1.9541015625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 7.0, 3.0, 12.0, 17.0, 30.0, 35.0, 53.0, 91.0, 170.0, 325.0, 622.0, 1508.0, 4054.0, 14799.0, 82807.0, 2314445.0, 1679478.0, 74498.0, 14643.0, 4132.0, 1430.0, 552.0, 256.0, 127.0, 77.0, 39.0, 24.0, 25.0, 9.0, 7.0, 0.0, 5.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.49609375, -5.26678466796875, -5.0374755859375, -4.80816650390625, -4.578857421875, -4.34954833984375, -4.1202392578125, -3.89093017578125, -3.66162109375, -3.43231201171875, -3.2030029296875, -2.97369384765625, -2.744384765625, -2.51507568359375, -2.2857666015625, -2.05645751953125, -1.8271484375, -1.59783935546875, -1.3685302734375, -1.13922119140625, -0.909912109375, -0.68060302734375, -0.4512939453125, -0.22198486328125, 0.00732421875, 0.23663330078125, 0.4659423828125, 0.69525146484375, 0.924560546875, 1.15386962890625, 1.3831787109375, 1.61248779296875, 1.841796875, 2.07110595703125, 2.3004150390625, 2.52972412109375, 2.759033203125, 2.98834228515625, 3.2176513671875, 3.44696044921875, 3.67626953125, 3.90557861328125, 4.1348876953125, 4.36419677734375, 4.593505859375, 4.82281494140625, 5.0521240234375, 5.28143310546875, 5.5107421875, 5.74005126953125, 5.9693603515625, 6.19866943359375, 6.427978515625, 6.65728759765625, 6.8865966796875, 7.11590576171875, 7.34521484375, 7.57452392578125, 7.8038330078125, 8.03314208984375, 8.262451171875, 8.49176025390625, 8.7210693359375, 8.95037841796875, 9.1796875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 5.0, 3.0, 5.0, 7.0, 10.0, 15.0, 16.0, 42.0, 43.0, 69.0, 89.0, 133.0, 245.0, 491.0, 1022.0, 889.0, 395.0, 184.0, 123.0, 83.0, 53.0, 40.0, 22.0, 20.0, 20.0, 13.0, 5.0, 12.0, 4.0, 3.0, 2.0, 7.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.5078125, -8.28277587890625, -8.0577392578125, -7.83270263671875, -7.607666015625, -7.38262939453125, -7.1575927734375, -6.93255615234375, -6.70751953125, -6.48248291015625, -6.2574462890625, -6.03240966796875, -5.807373046875, -5.58233642578125, -5.3572998046875, -5.13226318359375, -4.9072265625, -4.68218994140625, -4.4571533203125, -4.23211669921875, -4.007080078125, -3.78204345703125, -3.5570068359375, -3.33197021484375, -3.10693359375, -2.88189697265625, -2.6568603515625, -2.43182373046875, -2.206787109375, -1.98175048828125, -1.7567138671875, -1.53167724609375, -1.306640625, -1.08160400390625, -0.8565673828125, -0.63153076171875, -0.406494140625, -0.18145751953125, 0.0435791015625, 0.26861572265625, 0.49365234375, 0.71868896484375, 0.9437255859375, 1.16876220703125, 1.393798828125, 1.61883544921875, 1.8438720703125, 2.06890869140625, 2.2939453125, 2.51898193359375, 2.7440185546875, 2.96905517578125, 3.194091796875, 3.41912841796875, 3.6441650390625, 3.86920166015625, 4.09423828125, 4.31927490234375, 4.5443115234375, 4.76934814453125, 4.994384765625, 5.21942138671875, 5.4444580078125, 5.66949462890625, 5.89453125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 15.0, 24.0, 82.0, 191.0, 330.0, 229.0, 75.0, 23.0, 12.0, 5.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-117.02490997314453, -113.55226135253906, -110.0796127319336, -106.60696411132812, -103.13431549072266, -99.66166687011719, -96.18901824951172, -92.71636962890625, -89.24372100830078, -85.77107238769531, -82.29842376708984, -78.82577514648438, -75.3531265258789, -71.88047790527344, -68.40782928466797, -64.9351806640625, -61.462528228759766, -57.9898796081543, -54.51723098754883, -51.04458236694336, -47.57193374633789, -44.099281311035156, -40.62663269042969, -37.15398406982422, -33.68133544921875, -30.20868682861328, -26.736038208007812, -23.263389587402344, -19.790740966796875, -16.318090438842773, -12.845441818237305, -9.372793197631836, -5.900146484375, -2.427497625350952, 1.0451512336730957, 4.517800331115723, 7.990448951721191, 11.463098526000977, 14.935747146606445, 18.408395767211914, 21.881044387817383, 25.35369300842285, 28.82634162902832, 32.29899215698242, 35.77164077758789, 39.24428939819336, 42.71693801879883, 46.1895866394043, 49.662235260009766, 53.134883880615234, 56.6075325012207, 60.08018112182617, 63.55282974243164, 67.02548217773438, 70.49813079833984, 73.97077941894531, 77.44342803955078, 80.91607666015625, 84.38872528076172, 87.86137390136719, 91.33402252197266, 94.80667114257812, 98.2793197631836, 101.75196838378906, 105.22461700439453]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 2.0, 7.0, 10.0, 4.0, 4.0, 6.0, 7.0, 15.0, 13.0, 16.0, 25.0, 29.0, 37.0, 24.0, 41.0, 31.0, 57.0, 61.0, 56.0, 57.0, 50.0, 50.0, 47.0, 53.0, 38.0, 40.0, 36.0, 30.0, 30.0, 29.0, 14.0, 17.0, 18.0, 20.0, 9.0, 8.0, 3.0, 3.0, 5.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-34.60093688964844, -33.525184631347656, -32.449432373046875, -31.373676300048828, -30.297924041748047, -29.222171783447266, -28.14641761779785, -27.070663452148438, -25.994911193847656, -24.919158935546875, -23.84340476989746, -22.767650604248047, -21.691898345947266, -20.616146087646484, -19.54039192199707, -18.464637756347656, -17.388885498046875, -16.313133239746094, -15.23737907409668, -14.161625862121582, -13.085872650146484, -12.010119438171387, -10.934366226196289, -9.858613014221191, -8.782859802246094, -7.707106590270996, -6.631353378295898, -5.555600166320801, -4.479846954345703, -3.4040937423706055, -2.328340530395508, -1.2525873184204102, -0.1768341064453125, 0.8989191055297852, 1.9746723175048828, 3.0504255294799805, 4.126178741455078, 5.201931953430176, 6.277685165405273, 7.353438377380371, 8.429191589355469, 9.504944801330566, 10.580698013305664, 11.656451225280762, 12.73220443725586, 13.807957649230957, 14.883710861206055, 15.959464073181152, 17.03521728515625, 18.11096954345703, 19.186723709106445, 20.26247787475586, 21.33823013305664, 22.413982391357422, 23.489736557006836, 24.56549072265625, 25.64124298095703, 26.716995239257812, 27.792749404907227, 28.86850357055664, 29.944255828857422, 31.020008087158203, 32.09576416015625, 33.17151641845703, 34.24726867675781]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 3.0, 8.0, 11.0, 11.0, 16.0, 31.0, 62.0, 65.0, 133.0, 265.0, 405.0, 903.0, 1924.0, 4605.0, 11090.0, 28385.0, 75346.0, 194819.0, 380616.0, 213410.0, 83325.0, 31603.0, 12332.0, 4955.0, 2147.0, 985.0, 500.0, 234.0, 128.0, 86.0, 60.0, 31.0, 19.0, 13.0, 15.0, 6.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8984375, -4.75244140625, -4.6064453125, -4.46044921875, -4.314453125, -4.16845703125, -4.0224609375, -3.87646484375, -3.73046875, -3.58447265625, -3.4384765625, -3.29248046875, -3.146484375, -3.00048828125, -2.8544921875, -2.70849609375, -2.5625, -2.41650390625, -2.2705078125, -2.12451171875, -1.978515625, -1.83251953125, -1.6865234375, -1.54052734375, -1.39453125, -1.24853515625, -1.1025390625, -0.95654296875, -0.810546875, -0.66455078125, -0.5185546875, -0.37255859375, -0.2265625, -0.08056640625, 0.0654296875, 0.21142578125, 0.357421875, 0.50341796875, 0.6494140625, 0.79541015625, 0.94140625, 1.08740234375, 1.2333984375, 1.37939453125, 1.525390625, 1.67138671875, 1.8173828125, 1.96337890625, 2.109375, 2.25537109375, 2.4013671875, 2.54736328125, 2.693359375, 2.83935546875, 2.9853515625, 3.13134765625, 3.27734375, 3.42333984375, 3.5693359375, 3.71533203125, 3.861328125, 4.00732421875, 4.1533203125, 4.29931640625, 4.4453125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 2.0, 6.0, 4.0, 6.0, 12.0, 10.0, 14.0, 17.0, 20.0, 18.0, 28.0, 32.0, 32.0, 33.0, 40.0, 32.0, 41.0, 31.0, 40.0, 56.0, 43.0, 40.0, 36.0, 36.0, 33.0, 40.0, 41.0, 30.0, 26.0, 29.0, 19.0, 17.0, 26.0, 21.0, 20.0, 20.0, 17.0, 10.0, 8.0, 4.0, 3.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.361328125, -2.296875, -2.232421875, -2.16796875, -2.103515625, -2.0390625, -1.974609375, -1.91015625, -1.845703125, -1.78125, -1.716796875, -1.65234375, -1.587890625, -1.5234375, -1.458984375, -1.39453125, -1.330078125, -1.265625, -1.201171875, -1.13671875, -1.072265625, -1.0078125, -0.943359375, -0.87890625, -0.814453125, -0.75, -0.685546875, -0.62109375, -0.556640625, -0.4921875, -0.427734375, -0.36328125, -0.298828125, -0.234375, -0.169921875, -0.10546875, -0.041015625, 0.0234375, 0.087890625, 0.15234375, 0.216796875, 0.28125, 0.345703125, 0.41015625, 0.474609375, 0.5390625, 0.603515625, 0.66796875, 0.732421875, 0.796875, 0.861328125, 0.92578125, 0.990234375, 1.0546875, 1.119140625, 1.18359375, 1.248046875, 1.3125, 1.376953125, 1.44140625, 1.505859375, 1.5703125, 1.634765625, 1.69921875, 1.763671875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 6.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 9.0, 3.0, 11.0, 14.0, 26.0, 28.0, 28.0, 49.0, 53.0, 75.0, 94.0, 126.0, 175.0, 223.0, 403.0, 586.0, 955.0, 1581.0, 3227.0, 9017.0, 35099.0, 190668.0, 647998.0, 120773.0, 24080.0, 6707.0, 2704.0, 1333.0, 812.0, 505.0, 359.0, 256.0, 158.0, 125.0, 82.0, 61.0, 47.0, 28.0, 24.0, 11.0, 9.0, 5.0, 6.0, 3.0, 3.0, 1.0, 3.0, 4.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.8203125, -6.59576416015625, -6.3712158203125, -6.14666748046875, -5.922119140625, -5.69757080078125, -5.4730224609375, -5.24847412109375, -5.02392578125, -4.79937744140625, -4.5748291015625, -4.35028076171875, -4.125732421875, -3.90118408203125, -3.6766357421875, -3.45208740234375, -3.2275390625, -3.00299072265625, -2.7784423828125, -2.55389404296875, -2.329345703125, -2.10479736328125, -1.8802490234375, -1.65570068359375, -1.43115234375, -1.20660400390625, -0.9820556640625, -0.75750732421875, -0.532958984375, -0.30841064453125, -0.0838623046875, 0.14068603515625, 0.365234375, 0.58978271484375, 0.8143310546875, 1.03887939453125, 1.263427734375, 1.48797607421875, 1.7125244140625, 1.93707275390625, 2.16162109375, 2.38616943359375, 2.6107177734375, 2.83526611328125, 3.059814453125, 3.28436279296875, 3.5089111328125, 3.73345947265625, 3.9580078125, 4.18255615234375, 4.4071044921875, 4.63165283203125, 4.856201171875, 5.08074951171875, 5.3052978515625, 5.52984619140625, 5.75439453125, 5.97894287109375, 6.2034912109375, 6.42803955078125, 6.652587890625, 6.87713623046875, 7.1016845703125, 7.32623291015625, 7.55078125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 8.0, 7.0, 7.0, 14.0, 16.0, 12.0, 16.0, 15.0, 18.0, 32.0, 27.0, 30.0, 37.0, 34.0, 43.0, 52.0, 40.0, 31.0, 35.0, 46.0, 53.0, 46.0, 36.0, 44.0, 37.0, 35.0, 36.0, 15.0, 26.0, 26.0, 21.0, 13.0, 16.0, 16.0, 15.0, 13.0, 6.0, 3.0, 5.0, 9.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5390625, -9.2373046875, -8.935546875, -8.6337890625, -8.33203125, -8.0302734375, -7.728515625, -7.4267578125, -7.125, -6.8232421875, -6.521484375, -6.2197265625, -5.91796875, -5.6162109375, -5.314453125, -5.0126953125, -4.7109375, -4.4091796875, -4.107421875, -3.8056640625, -3.50390625, -3.2021484375, -2.900390625, -2.5986328125, -2.296875, -1.9951171875, -1.693359375, -1.3916015625, -1.08984375, -0.7880859375, -0.486328125, -0.1845703125, 0.1171875, 0.4189453125, 0.720703125, 1.0224609375, 1.32421875, 1.6259765625, 1.927734375, 2.2294921875, 2.53125, 2.8330078125, 3.134765625, 3.4365234375, 3.73828125, 4.0400390625, 4.341796875, 4.6435546875, 4.9453125, 5.2470703125, 5.548828125, 5.8505859375, 6.15234375, 6.4541015625, 6.755859375, 7.0576171875, 7.359375, 7.6611328125, 7.962890625, 8.2646484375, 8.56640625, 8.8681640625, 9.169921875, 9.4716796875, 9.7734375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 1.0, 2.0, 5.0, 4.0, 15.0, 11.0, 10.0, 13.0, 30.0, 45.0, 55.0, 63.0, 104.0, 187.0, 302.0, 550.0, 1152.0, 2484.0, 6705.0, 26663.0, 271036.0, 675863.0, 47316.0, 9557.0, 3270.0, 1471.0, 664.0, 358.0, 187.0, 143.0, 91.0, 46.0, 37.0, 17.0, 24.0, 16.0, 15.0, 13.0, 10.0, 10.0, 1.0, 2.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.525390625, -2.438751220703125, -2.35211181640625, -2.265472412109375, -2.1788330078125, -2.092193603515625, -2.00555419921875, -1.918914794921875, -1.832275390625, -1.745635986328125, -1.65899658203125, -1.572357177734375, -1.4857177734375, -1.399078369140625, -1.31243896484375, -1.225799560546875, -1.13916015625, -1.052520751953125, -0.96588134765625, -0.879241943359375, -0.7926025390625, -0.705963134765625, -0.61932373046875, -0.532684326171875, -0.446044921875, -0.359405517578125, -0.27276611328125, -0.186126708984375, -0.0994873046875, -0.012847900390625, 0.07379150390625, 0.160430908203125, 0.2470703125, 0.333709716796875, 0.42034912109375, 0.506988525390625, 0.5936279296875, 0.680267333984375, 0.76690673828125, 0.853546142578125, 0.940185546875, 1.026824951171875, 1.11346435546875, 1.200103759765625, 1.2867431640625, 1.373382568359375, 1.46002197265625, 1.546661376953125, 1.63330078125, 1.719940185546875, 1.80657958984375, 1.893218994140625, 1.9798583984375, 2.066497802734375, 2.15313720703125, 2.239776611328125, 2.326416015625, 2.413055419921875, 2.49969482421875, 2.586334228515625, 2.6729736328125, 2.759613037109375, 2.84625244140625, 2.932891845703125, 3.01953125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 0.0, 4.0, 0.0, 1.0, 3.0, 6.0, 4.0, 7.0, 10.0, 5.0, 21.0, 29.0, 68.0, 76.0, 137.0, 199.0, 140.0, 99.0, 60.0, 43.0, 20.0, 20.0, 11.0, 15.0, 2.0, 10.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009512901306152344, -0.0009212866425514221, -0.0008912831544876099, -0.0008612796664237976, -0.0008312761783599854, -0.0008012726902961731, -0.0007712692022323608, -0.0007412657141685486, -0.0007112622261047363, -0.0006812587380409241, -0.0006512552499771118, -0.0006212517619132996, -0.0005912482738494873, -0.000561244785785675, -0.0005312412977218628, -0.0005012378096580505, -0.0004712343215942383, -0.000441230833530426, -0.00041122734546661377, -0.0003812238574028015, -0.00035122036933898926, -0.000321216881275177, -0.00029121339321136475, -0.0002612099051475525, -0.00023120641708374023, -0.00020120292901992798, -0.00017119944095611572, -0.00014119595289230347, -0.00011119246482849121, -8.118897676467896e-05, -5.11854887008667e-05, -2.1182000637054443e-05, 8.821487426757812e-06, 3.882497549057007e-05, 6.882846355438232e-05, 9.883195161819458e-05, 0.00012883543968200684, 0.0001588389277458191, 0.00018884241580963135, 0.0002188459038734436, 0.00024884939193725586, 0.0002788528800010681, 0.00030885636806488037, 0.0003388598561286926, 0.0003688633441925049, 0.00039886683225631714, 0.0004288703203201294, 0.00045887380838394165, 0.0004888772964477539, 0.0005188807845115662, 0.0005488842725753784, 0.0005788877606391907, 0.0006088912487030029, 0.0006388947367668152, 0.0006688982248306274, 0.0006989017128944397, 0.000728905200958252, 0.0007589086890220642, 0.0007889121770858765, 0.0008189156651496887, 0.000848919153213501, 0.0008789226412773132, 0.0009089261293411255, 0.0009389296174049377, 0.00096893310546875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 9.0, 8.0, 14.0, 18.0, 28.0, 63.0, 98.0, 158.0, 339.0, 895.0, 2470.0, 11107.0, 141754.0, 847102.0, 36272.0, 5434.0, 1583.0, 605.0, 280.0, 140.0, 69.0, 48.0, 25.0, 17.0, 9.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.5390625, -4.420501708984375, -4.30194091796875, -4.183380126953125, -4.0648193359375, -3.946258544921875, -3.82769775390625, -3.709136962890625, -3.590576171875, -3.472015380859375, -3.35345458984375, -3.234893798828125, -3.1163330078125, -2.997772216796875, -2.87921142578125, -2.760650634765625, -2.64208984375, -2.523529052734375, -2.40496826171875, -2.286407470703125, -2.1678466796875, -2.049285888671875, -1.93072509765625, -1.812164306640625, -1.693603515625, -1.575042724609375, -1.45648193359375, -1.337921142578125, -1.2193603515625, -1.100799560546875, -0.98223876953125, -0.863677978515625, -0.7451171875, -0.626556396484375, -0.50799560546875, -0.389434814453125, -0.2708740234375, -0.152313232421875, -0.03375244140625, 0.084808349609375, 0.203369140625, 0.321929931640625, 0.44049072265625, 0.559051513671875, 0.6776123046875, 0.796173095703125, 0.91473388671875, 1.033294677734375, 1.15185546875, 1.270416259765625, 1.38897705078125, 1.507537841796875, 1.6260986328125, 1.744659423828125, 1.86322021484375, 1.981781005859375, 2.100341796875, 2.218902587890625, 2.33746337890625, 2.456024169921875, 2.5745849609375, 2.693145751953125, 2.81170654296875, 2.930267333984375, 3.048828125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 3.0, 1.0, 3.0, 2.0, 2.0, 3.0, 7.0, 12.0, 11.0, 8.0, 14.0, 20.0, 43.0, 45.0, 51.0, 62.0, 63.0, 92.0, 89.0, 92.0, 72.0, 49.0, 56.0, 42.0, 37.0, 36.0, 19.0, 17.0, 15.0, 6.0, 5.0, 5.0, 4.0, 0.0, 6.0, 3.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.03125, -1.96014404296875, -1.8890380859375, -1.81793212890625, -1.746826171875, -1.67572021484375, -1.6046142578125, -1.53350830078125, -1.46240234375, -1.39129638671875, -1.3201904296875, -1.24908447265625, -1.177978515625, -1.10687255859375, -1.0357666015625, -0.96466064453125, -0.8935546875, -0.82244873046875, -0.7513427734375, -0.68023681640625, -0.609130859375, -0.53802490234375, -0.4669189453125, -0.39581298828125, -0.32470703125, -0.25360107421875, -0.1824951171875, -0.11138916015625, -0.040283203125, 0.03082275390625, 0.1019287109375, 0.17303466796875, 0.244140625, 0.31524658203125, 0.3863525390625, 0.45745849609375, 0.528564453125, 0.59967041015625, 0.6707763671875, 0.74188232421875, 0.81298828125, 0.88409423828125, 0.9552001953125, 1.02630615234375, 1.097412109375, 1.16851806640625, 1.2396240234375, 1.31072998046875, 1.3818359375, 1.45294189453125, 1.5240478515625, 1.59515380859375, 1.666259765625, 1.73736572265625, 1.8084716796875, 1.87957763671875, 1.95068359375, 2.02178955078125, 2.0928955078125, 2.16400146484375, 2.235107421875, 2.30621337890625, 2.3773193359375, 2.44842529296875, 2.51953125]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 6.0, 7.0, 16.0, 33.0, 41.0, 77.0, 113.0, 180.0, 171.0, 130.0, 93.0, 45.0, 27.0, 18.0, 10.0, 6.0, 7.0, 3.0, 2.0, 2.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-51.031551361083984, -49.385169982910156, -47.73878860473633, -46.0924072265625, -44.446022033691406, -42.79964065551758, -41.15325927734375, -39.50687789916992, -37.860496520996094, -36.214115142822266, -34.56773376464844, -32.921348571777344, -31.27496910095215, -29.628585815429688, -27.98220443725586, -26.33582305908203, -24.68943977355957, -23.043058395385742, -21.39667510986328, -19.750293731689453, -18.103912353515625, -16.457530975341797, -14.811147689819336, -13.164766311645508, -11.518383979797363, -9.872001647949219, -8.22562026977539, -6.579237937927246, -4.93285608291626, -3.2864742279052734, -1.640091896057129, 0.006289482116699219, 1.6526718139648438, 3.29905366897583, 4.945435523986816, 6.591817855834961, 8.238199234008789, 9.884581565856934, 11.530963897705078, 13.177345275878906, 14.82372760772705, 16.470109939575195, 18.116491317749023, 19.762874603271484, 21.409255981445312, 23.05563735961914, 24.70201873779297, 26.348400115966797, 27.994783401489258, 29.641164779663086, 31.287548065185547, 32.933929443359375, 34.5803108215332, 36.22669219970703, 37.873077392578125, 39.51945495605469, 41.16584014892578, 42.81222152709961, 44.45860290527344, 46.10498809814453, 47.75136947631836, 49.39775085449219, 51.044132232666016, 52.690513610839844, 54.33689498901367]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 2.0, 3.0, 5.0, 11.0, 11.0, 3.0, 7.0, 13.0, 10.0, 15.0, 19.0, 23.0, 27.0, 19.0, 28.0, 26.0, 33.0, 33.0, 29.0, 38.0, 44.0, 62.0, 74.0, 72.0, 48.0, 41.0, 34.0, 32.0, 30.0, 40.0, 24.0, 26.0, 16.0, 13.0, 26.0, 11.0, 8.0, 8.0, 8.0, 7.0, 6.0, 10.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-34.02223205566406, -32.83033752441406, -31.638442993164062, -30.44654655456543, -29.25465202331543, -28.06275749206543, -26.870861053466797, -25.678966522216797, -24.487071990966797, -23.295177459716797, -22.103282928466797, -20.911386489868164, -19.719491958618164, -18.527597427368164, -17.33570098876953, -16.14380645751953, -14.951911926269531, -13.760017395019531, -12.568121910095215, -11.376226425170898, -10.184331893920898, -8.992437362670898, -7.800541877746582, -6.608646392822266, -5.416751861572266, -4.224856853485107, -3.032961845397949, -1.841066837310791, -0.6491718292236328, 0.5427231788635254, 1.7346181869506836, 2.926513671875, 4.118404388427734, 5.310299396514893, 6.502194404602051, 7.694089412689209, 8.885984420776367, 10.077878952026367, 11.269774436950684, 12.461669921875, 13.653564453125, 14.845458984375, 16.037353515625, 17.229249954223633, 18.421144485473633, 19.613039016723633, 20.804935455322266, 21.996829986572266, 23.188724517822266, 24.380619049072266, 25.572513580322266, 26.7644100189209, 27.9563045501709, 29.1481990814209, 30.34009552001953, 31.53199005126953, 32.72388458251953, 33.91577911376953, 35.10767364501953, 36.29956817626953, 37.49146270751953, 38.6833610534668, 39.8752555847168, 41.0671501159668, 42.2590446472168]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 5.0, 2.0, 5.0, 2.0, 3.0, 2.0, 5.0, 3.0, 5.0, 9.0, 8.0, 12.0, 17.0, 16.0, 27.0, 46.0, 51.0, 80.0, 171.0, 314.0, 609.0, 1525.0, 3810.0, 11193.0, 43563.0, 391369.0, 3148358.0, 518841.0, 52754.0, 13908.0, 4459.0, 1670.0, 735.0, 315.0, 172.0, 90.0, 53.0, 28.0, 19.0, 13.0, 7.0, 7.0, 5.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.06640625, -4.94146728515625, -4.8165283203125, -4.69158935546875, -4.566650390625, -4.44171142578125, -4.3167724609375, -4.19183349609375, -4.06689453125, -3.94195556640625, -3.8170166015625, -3.69207763671875, -3.567138671875, -3.44219970703125, -3.3172607421875, -3.19232177734375, -3.0673828125, -2.94244384765625, -2.8175048828125, -2.69256591796875, -2.567626953125, -2.44268798828125, -2.3177490234375, -2.19281005859375, -2.06787109375, -1.94293212890625, -1.8179931640625, -1.69305419921875, -1.568115234375, -1.44317626953125, -1.3182373046875, -1.19329833984375, -1.068359375, -0.94342041015625, -0.8184814453125, -0.69354248046875, -0.568603515625, -0.44366455078125, -0.3187255859375, -0.19378662109375, -0.06884765625, 0.05609130859375, 0.1810302734375, 0.30596923828125, 0.430908203125, 0.55584716796875, 0.6807861328125, 0.80572509765625, 0.9306640625, 1.05560302734375, 1.1805419921875, 1.30548095703125, 1.430419921875, 1.55535888671875, 1.6802978515625, 1.80523681640625, 1.93017578125, 2.05511474609375, 2.1800537109375, 2.30499267578125, 2.429931640625, 2.55487060546875, 2.6798095703125, 2.80474853515625, 2.9296875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 8.0, 6.0, 11.0, 16.0, 21.0, 23.0, 29.0, 49.0, 56.0, 50.0, 51.0, 62.0, 70.0, 78.0, 53.0, 61.0, 71.0, 56.0, 59.0, 57.0, 20.0, 24.0, 27.0, 11.0, 12.0, 13.0, 4.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.34375, -4.2392578125, -4.134765625, -4.0302734375, -3.92578125, -3.8212890625, -3.716796875, -3.6123046875, -3.5078125, -3.4033203125, -3.298828125, -3.1943359375, -3.08984375, -2.9853515625, -2.880859375, -2.7763671875, -2.671875, -2.5673828125, -2.462890625, -2.3583984375, -2.25390625, -2.1494140625, -2.044921875, -1.9404296875, -1.8359375, -1.7314453125, -1.626953125, -1.5224609375, -1.41796875, -1.3134765625, -1.208984375, -1.1044921875, -1.0, -0.8955078125, -0.791015625, -0.6865234375, -0.58203125, -0.4775390625, -0.373046875, -0.2685546875, -0.1640625, -0.0595703125, 0.044921875, 0.1494140625, 0.25390625, 0.3583984375, 0.462890625, 0.5673828125, 0.671875, 0.7763671875, 0.880859375, 0.9853515625, 1.08984375, 1.1943359375, 1.298828125, 1.4033203125, 1.5078125, 1.6123046875, 1.716796875, 1.8212890625, 1.92578125, 2.0302734375, 2.134765625, 2.2392578125, 2.34375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 6.0, 14.0, 13.0, 24.0, 39.0, 52.0, 77.0, 90.0, 186.0, 305.0, 723.0, 2132.0, 10438.0, 100929.0, 3781255.0, 272394.0, 19792.0, 3887.0, 1120.0, 467.0, 154.0, 86.0, 51.0, 25.0, 8.0, 8.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3125, -8.0498046875, -7.787109375, -7.5244140625, -7.26171875, -6.9990234375, -6.736328125, -6.4736328125, -6.2109375, -5.9482421875, -5.685546875, -5.4228515625, -5.16015625, -4.8974609375, -4.634765625, -4.3720703125, -4.109375, -3.8466796875, -3.583984375, -3.3212890625, -3.05859375, -2.7958984375, -2.533203125, -2.2705078125, -2.0078125, -1.7451171875, -1.482421875, -1.2197265625, -0.95703125, -0.6943359375, -0.431640625, -0.1689453125, 0.09375, 0.3564453125, 0.619140625, 0.8818359375, 1.14453125, 1.4072265625, 1.669921875, 1.9326171875, 2.1953125, 2.4580078125, 2.720703125, 2.9833984375, 3.24609375, 3.5087890625, 3.771484375, 4.0341796875, 4.296875, 4.5595703125, 4.822265625, 5.0849609375, 5.34765625, 5.6103515625, 5.873046875, 6.1357421875, 6.3984375, 6.6611328125, 6.923828125, 7.1865234375, 7.44921875, 7.7119140625, 7.974609375, 8.2373046875, 8.5]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 3.0, 2.0, 4.0, 12.0, 20.0, 27.0, 42.0, 67.0, 132.0, 273.0, 735.0, 1298.0, 746.0, 347.0, 141.0, 78.0, 43.0, 45.0, 19.0, 9.0, 10.0, 9.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.8046875, -10.544677734375, -10.28466796875, -10.024658203125, -9.7646484375, -9.504638671875, -9.24462890625, -8.984619140625, -8.724609375, -8.464599609375, -8.20458984375, -7.944580078125, -7.6845703125, -7.424560546875, -7.16455078125, -6.904541015625, -6.64453125, -6.384521484375, -6.12451171875, -5.864501953125, -5.6044921875, -5.344482421875, -5.08447265625, -4.824462890625, -4.564453125, -4.304443359375, -4.04443359375, -3.784423828125, -3.5244140625, -3.264404296875, -3.00439453125, -2.744384765625, -2.484375, -2.224365234375, -1.96435546875, -1.704345703125, -1.4443359375, -1.184326171875, -0.92431640625, -0.664306640625, -0.404296875, -0.144287109375, 0.11572265625, 0.375732421875, 0.6357421875, 0.895751953125, 1.15576171875, 1.415771484375, 1.67578125, 1.935791015625, 2.19580078125, 2.455810546875, 2.7158203125, 2.975830078125, 3.23583984375, 3.495849609375, 3.755859375, 4.015869140625, 4.27587890625, 4.535888671875, 4.7958984375, 5.055908203125, 5.31591796875, 5.575927734375, 5.8359375]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 7.0, 10.0, 22.0, 55.0, 128.0, 275.0, 249.0, 129.0, 70.0, 25.0, 13.0, 8.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.22256469726562, -69.8890151977539, -67.55547332763672, -65.221923828125, -62.88837814331055, -60.554832458496094, -58.221282958984375, -55.88773727416992, -53.55419158935547, -51.220645904541016, -48.88710021972656, -46.553550720214844, -44.22000503540039, -41.88645935058594, -39.55290985107422, -37.219364166259766, -34.88581848144531, -32.55227279663086, -30.218725204467773, -27.885177612304688, -25.551631927490234, -23.21808624267578, -20.884538650512695, -18.55099105834961, -16.217445373535156, -13.883898735046387, -11.550352096557617, -9.216805458068848, -6.883258819580078, -4.549712181091309, -2.216165542602539, 0.11738204956054688, 2.450927734375, 4.7844743728637695, 7.118021011352539, 9.451567649841309, 11.785114288330078, 14.118660926818848, 16.452207565307617, 18.785755157470703, 21.119300842285156, 23.45284652709961, 25.786394119262695, 28.11994171142578, 30.453487396240234, 32.78703308105469, 35.120582580566406, 37.45412826538086, 39.78767395019531, 42.121219635009766, 44.45476531982422, 46.78831481933594, 49.12186050415039, 51.455406188964844, 53.78895568847656, 56.122501373291016, 58.45604705810547, 60.78959274291992, 63.123138427734375, 65.4566879272461, 67.79023742675781, 70.123779296875, 72.45732879638672, 74.79087829589844, 77.12442016601562]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 1.0, 6.0, 6.0, 10.0, 9.0, 9.0, 20.0, 13.0, 16.0, 27.0, 24.0, 30.0, 24.0, 38.0, 53.0, 39.0, 42.0, 48.0, 57.0, 67.0, 51.0, 45.0, 46.0, 54.0, 37.0, 33.0, 30.0, 32.0, 27.0, 24.0, 17.0, 15.0, 19.0, 10.0, 7.0, 4.0, 5.0, 5.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-31.07762908935547, -30.16109275817871, -29.24455451965332, -28.328018188476562, -27.411479949951172, -26.494943618774414, -25.578407287597656, -24.661869049072266, -23.745330810546875, -22.828794479370117, -21.912256240844727, -20.99571990966797, -20.079181671142578, -19.16264533996582, -18.246109008789062, -17.329570770263672, -16.413034439086914, -15.49649715423584, -14.579959869384766, -13.663423538208008, -12.746885299682617, -11.83034896850586, -10.913811683654785, -9.997274398803711, -9.080737113952637, -8.164199829101562, -7.247662544250488, -6.331125736236572, -5.414588451385498, -4.498051166534424, -3.581514358520508, -2.6649770736694336, -1.7484397888183594, -0.8319026231765747, 0.08463454246520996, 1.001171588897705, 1.9177088737487793, 2.8342461585998535, 3.7507829666137695, 4.667320251464844, 5.583857536315918, 6.500394821166992, 7.416932106018066, 8.33346939086914, 9.250005722045898, 10.166543960571289, 11.083080291748047, 11.999617576599121, 12.916154861450195, 13.83269214630127, 14.749229431152344, 15.665765762329102, 16.582304000854492, 17.49884033203125, 18.41537857055664, 19.3319149017334, 20.248451232910156, 21.164987564086914, 22.081525802612305, 22.998062133789062, 23.914600372314453, 24.83113670349121, 25.74767303466797, 26.66421127319336, 27.58074951171875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 5.0, 14.0, 11.0, 22.0, 43.0, 53.0, 93.0, 183.0, 320.0, 626.0, 1448.0, 3273.0, 8488.0, 24083.0, 74022.0, 246198.0, 448098.0, 162993.0, 50713.0, 17040.0, 6107.0, 2480.0, 1087.0, 510.0, 253.0, 157.0, 77.0, 48.0, 37.0, 23.0, 15.0, 6.0, 10.0, 9.0, 2.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.96484375, -4.79559326171875, -4.6263427734375, -4.45709228515625, -4.287841796875, -4.11859130859375, -3.9493408203125, -3.78009033203125, -3.61083984375, -3.44158935546875, -3.2723388671875, -3.10308837890625, -2.933837890625, -2.76458740234375, -2.5953369140625, -2.42608642578125, -2.2568359375, -2.08758544921875, -1.9183349609375, -1.74908447265625, -1.579833984375, -1.41058349609375, -1.2413330078125, -1.07208251953125, -0.90283203125, -0.73358154296875, -0.5643310546875, -0.39508056640625, -0.225830078125, -0.05657958984375, 0.1126708984375, 0.28192138671875, 0.451171875, 0.62042236328125, 0.7896728515625, 0.95892333984375, 1.128173828125, 1.29742431640625, 1.4666748046875, 1.63592529296875, 1.80517578125, 1.97442626953125, 2.1436767578125, 2.31292724609375, 2.482177734375, 2.65142822265625, 2.8206787109375, 2.98992919921875, 3.1591796875, 3.32843017578125, 3.4976806640625, 3.66693115234375, 3.836181640625, 4.00543212890625, 4.1746826171875, 4.34393310546875, 4.51318359375, 4.68243408203125, 4.8516845703125, 5.02093505859375, 5.190185546875, 5.35943603515625, 5.5286865234375, 5.69793701171875, 5.8671875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 9.0, 1.0, 6.0, 9.0, 10.0, 11.0, 22.0, 17.0, 14.0, 23.0, 26.0, 30.0, 32.0, 33.0, 48.0, 45.0, 46.0, 46.0, 65.0, 44.0, 45.0, 54.0, 62.0, 44.0, 37.0, 44.0, 19.0, 30.0, 30.0, 24.0, 17.0, 15.0, 15.0, 12.0, 10.0, 5.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.5078125, -2.43206787109375, -2.3563232421875, -2.28057861328125, -2.204833984375, -2.12908935546875, -2.0533447265625, -1.97760009765625, -1.90185546875, -1.82611083984375, -1.7503662109375, -1.67462158203125, -1.598876953125, -1.52313232421875, -1.4473876953125, -1.37164306640625, -1.2958984375, -1.22015380859375, -1.1444091796875, -1.06866455078125, -0.992919921875, -0.91717529296875, -0.8414306640625, -0.76568603515625, -0.68994140625, -0.61419677734375, -0.5384521484375, -0.46270751953125, -0.386962890625, -0.31121826171875, -0.2354736328125, -0.15972900390625, -0.083984375, -0.00823974609375, 0.0675048828125, 0.14324951171875, 0.218994140625, 0.29473876953125, 0.3704833984375, 0.44622802734375, 0.52197265625, 0.59771728515625, 0.6734619140625, 0.74920654296875, 0.824951171875, 0.90069580078125, 0.9764404296875, 1.05218505859375, 1.1279296875, 1.20367431640625, 1.2794189453125, 1.35516357421875, 1.430908203125, 1.50665283203125, 1.5823974609375, 1.65814208984375, 1.73388671875, 1.80963134765625, 1.8853759765625, 1.96112060546875, 2.036865234375, 2.11260986328125, 2.1883544921875, 2.26409912109375, 2.33984375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 0.0, 6.0, 2.0, 1.0, 3.0, 3.0, 7.0, 4.0, 6.0, 5.0, 10.0, 21.0, 23.0, 33.0, 35.0, 50.0, 67.0, 100.0, 171.0, 241.0, 448.0, 782.0, 1808.0, 5072.0, 23253.0, 187452.0, 723556.0, 86263.0, 12546.0, 3461.0, 1413.0, 657.0, 358.0, 253.0, 134.0, 109.0, 56.0, 45.0, 34.0, 25.0, 10.0, 9.0, 13.0, 6.0, 2.0, 1.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.5546875, -8.2725830078125, -7.990478515625, -7.7083740234375, -7.42626953125, -7.1441650390625, -6.862060546875, -6.5799560546875, -6.2978515625, -6.0157470703125, -5.733642578125, -5.4515380859375, -5.16943359375, -4.8873291015625, -4.605224609375, -4.3231201171875, -4.041015625, -3.7589111328125, -3.476806640625, -3.1947021484375, -2.91259765625, -2.6304931640625, -2.348388671875, -2.0662841796875, -1.7841796875, -1.5020751953125, -1.219970703125, -0.9378662109375, -0.65576171875, -0.3736572265625, -0.091552734375, 0.1905517578125, 0.47265625, 0.7547607421875, 1.036865234375, 1.3189697265625, 1.60107421875, 1.8831787109375, 2.165283203125, 2.4473876953125, 2.7294921875, 3.0115966796875, 3.293701171875, 3.5758056640625, 3.85791015625, 4.1400146484375, 4.422119140625, 4.7042236328125, 4.986328125, 5.2684326171875, 5.550537109375, 5.8326416015625, 6.11474609375, 6.3968505859375, 6.678955078125, 6.9610595703125, 7.2431640625, 7.5252685546875, 7.807373046875, 8.0894775390625, 8.37158203125, 8.6536865234375, 8.935791015625, 9.2178955078125, 9.5]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 5.0, 2.0, 3.0, 17.0, 4.0, 14.0, 13.0, 9.0, 19.0, 21.0, 28.0, 41.0, 44.0, 57.0, 45.0, 50.0, 58.0, 69.0, 71.0, 52.0, 52.0, 42.0, 54.0, 46.0, 43.0, 32.0, 25.0, 22.0, 15.0, 23.0, 13.0, 6.0, 6.0, 5.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.0859375, -12.7550048828125, -12.424072265625, -12.0931396484375, -11.76220703125, -11.4312744140625, -11.100341796875, -10.7694091796875, -10.4384765625, -10.1075439453125, -9.776611328125, -9.4456787109375, -9.11474609375, -8.7838134765625, -8.452880859375, -8.1219482421875, -7.791015625, -7.4600830078125, -7.129150390625, -6.7982177734375, -6.46728515625, -6.1363525390625, -5.805419921875, -5.4744873046875, -5.1435546875, -4.8126220703125, -4.481689453125, -4.1507568359375, -3.81982421875, -3.4888916015625, -3.157958984375, -2.8270263671875, -2.49609375, -2.1651611328125, -1.834228515625, -1.5032958984375, -1.17236328125, -0.8414306640625, -0.510498046875, -0.1795654296875, 0.1513671875, 0.4822998046875, 0.813232421875, 1.1441650390625, 1.47509765625, 1.8060302734375, 2.136962890625, 2.4678955078125, 2.798828125, 3.1297607421875, 3.460693359375, 3.7916259765625, 4.12255859375, 4.4534912109375, 4.784423828125, 5.1153564453125, 5.4462890625, 5.7772216796875, 6.108154296875, 6.4390869140625, 6.77001953125, 7.1009521484375, 7.431884765625, 7.7628173828125, 8.09375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 4.0, 3.0, 6.0, 8.0, 17.0, 26.0, 37.0, 57.0, 96.0, 199.0, 334.0, 753.0, 2236.0, 9302.0, 66224.0, 707834.0, 229751.0, 24632.0, 4589.0, 1353.0, 521.0, 223.0, 152.0, 65.0, 51.0, 32.0, 11.0, 13.0, 8.0, 1.0, 4.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.50390625, -2.42974853515625, -2.3555908203125, -2.28143310546875, -2.207275390625, -2.13311767578125, -2.0589599609375, -1.98480224609375, -1.91064453125, -1.83648681640625, -1.7623291015625, -1.68817138671875, -1.614013671875, -1.53985595703125, -1.4656982421875, -1.39154052734375, -1.3173828125, -1.24322509765625, -1.1690673828125, -1.09490966796875, -1.020751953125, -0.94659423828125, -0.8724365234375, -0.79827880859375, -0.72412109375, -0.64996337890625, -0.5758056640625, -0.50164794921875, -0.427490234375, -0.35333251953125, -0.2791748046875, -0.20501708984375, -0.130859375, -0.05670166015625, 0.0174560546875, 0.09161376953125, 0.165771484375, 0.23992919921875, 0.3140869140625, 0.38824462890625, 0.46240234375, 0.53656005859375, 0.6107177734375, 0.68487548828125, 0.759033203125, 0.83319091796875, 0.9073486328125, 0.98150634765625, 1.0556640625, 1.12982177734375, 1.2039794921875, 1.27813720703125, 1.352294921875, 1.42645263671875, 1.5006103515625, 1.57476806640625, 1.64892578125, 1.72308349609375, 1.7972412109375, 1.87139892578125, 1.945556640625, 2.01971435546875, 2.0938720703125, 2.16802978515625, 2.2421875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 3.0, 1.0, 2.0, 6.0, 7.0, 5.0, 9.0, 13.0, 9.0, 18.0, 17.0, 19.0, 20.0, 34.0, 34.0, 47.0, 56.0, 83.0, 73.0, 80.0, 79.0, 77.0, 74.0, 41.0, 41.0, 24.0, 19.0, 19.0, 18.0, 10.0, 8.0, 15.0, 5.0, 9.0, 8.0, 5.0, 4.0, 2.0, 1.0, 5.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.00042724609375, -0.0004131719470024109, -0.0003990978002548218, -0.00038502365350723267, -0.00037094950675964355, -0.00035687536001205444, -0.00034280121326446533, -0.0003287270665168762, -0.0003146529197692871, -0.000300578773021698, -0.0002865046262741089, -0.0002724304795265198, -0.00025835633277893066, -0.00024428218603134155, -0.00023020803928375244, -0.00021613389253616333, -0.00020205974578857422, -0.0001879855990409851, -0.000173911452293396, -0.00015983730554580688, -0.00014576315879821777, -0.00013168901205062866, -0.00011761486530303955, -0.00010354071855545044, -8.946657180786133e-05, -7.539242506027222e-05, -6.13182783126831e-05, -4.7244131565093994e-05, -3.316998481750488e-05, -1.909583806991577e-05, -5.02169132232666e-06, 9.052455425262451e-06, 2.3126602172851562e-05, 3.7200748920440674e-05, 5.1274895668029785e-05, 6.53490424156189e-05, 7.942318916320801e-05, 9.349733591079712e-05, 0.00010757148265838623, 0.00012164562940597534, 0.00013571977615356445, 0.00014979392290115356, 0.00016386806964874268, 0.0001779422163963318, 0.0001920163631439209, 0.00020609050989151, 0.00022016465663909912, 0.00023423880338668823, 0.00024831295013427734, 0.00026238709688186646, 0.00027646124362945557, 0.0002905353903770447, 0.0003046095371246338, 0.0003186836838722229, 0.000332757830619812, 0.0003468319773674011, 0.00036090612411499023, 0.00037498027086257935, 0.00038905441761016846, 0.00040312856435775757, 0.0004172027111053467, 0.0004312768578529358, 0.0004453510046005249, 0.000459425151348114, 0.0004734992980957031]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 13.0, 20.0, 41.0, 87.0, 211.0, 715.0, 3185.0, 48161.0, 927427.0, 63745.0, 3720.0, 803.0, 284.0, 80.0, 29.0, 19.0, 6.0, 7.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.62890625, -2.5068359375, -2.384765625, -2.2626953125, -2.140625, -2.0185546875, -1.896484375, -1.7744140625, -1.65234375, -1.5302734375, -1.408203125, -1.2861328125, -1.1640625, -1.0419921875, -0.919921875, -0.7978515625, -0.67578125, -0.5537109375, -0.431640625, -0.3095703125, -0.1875, -0.0654296875, 0.056640625, 0.1787109375, 0.30078125, 0.4228515625, 0.544921875, 0.6669921875, 0.7890625, 0.9111328125, 1.033203125, 1.1552734375, 1.27734375, 1.3994140625, 1.521484375, 1.6435546875, 1.765625, 1.8876953125, 2.009765625, 2.1318359375, 2.25390625, 2.3759765625, 2.498046875, 2.6201171875, 2.7421875, 2.8642578125, 2.986328125, 3.1083984375, 3.23046875, 3.3525390625, 3.474609375, 3.5966796875, 3.71875, 3.8408203125, 3.962890625, 4.0849609375, 4.20703125, 4.3291015625, 4.451171875, 4.5732421875, 4.6953125, 4.8173828125, 4.939453125, 5.0615234375, 5.18359375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 5.0, 7.0, 6.0, 17.0, 17.0, 19.0, 18.0, 26.0, 41.0, 25.0, 46.0, 51.0, 55.0, 50.0, 58.0, 67.0, 60.0, 72.0, 51.0, 46.0, 56.0, 42.0, 25.0, 30.0, 22.0, 23.0, 13.0, 12.0, 5.0, 10.0, 10.0, 4.0, 7.0, 1.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0419921875, -0.99627685546875, -0.9505615234375, -0.90484619140625, -0.859130859375, -0.81341552734375, -0.7677001953125, -0.72198486328125, -0.67626953125, -0.63055419921875, -0.5848388671875, -0.53912353515625, -0.493408203125, -0.44769287109375, -0.4019775390625, -0.35626220703125, -0.310546875, -0.26483154296875, -0.2191162109375, -0.17340087890625, -0.127685546875, -0.08197021484375, -0.0362548828125, 0.00946044921875, 0.05517578125, 0.10089111328125, 0.1466064453125, 0.19232177734375, 0.238037109375, 0.28375244140625, 0.3294677734375, 0.37518310546875, 0.4208984375, 0.46661376953125, 0.5123291015625, 0.55804443359375, 0.603759765625, 0.64947509765625, 0.6951904296875, 0.74090576171875, 0.78662109375, 0.83233642578125, 0.8780517578125, 0.92376708984375, 0.969482421875, 1.01519775390625, 1.0609130859375, 1.10662841796875, 1.15234375, 1.19805908203125, 1.2437744140625, 1.28948974609375, 1.335205078125, 1.38092041015625, 1.4266357421875, 1.47235107421875, 1.51806640625, 1.56378173828125, 1.6094970703125, 1.65521240234375, 1.700927734375, 1.74664306640625, 1.7923583984375, 1.83807373046875, 1.8837890625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 7.0, 9.0, 31.0, 102.0, 375.0, 298.0, 118.0, 35.0, 16.0, 8.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.57394409179688, -61.31277084350586, -58.05160140991211, -54.790428161621094, -51.529258728027344, -48.26808547973633, -45.00691223144531, -41.74574279785156, -38.48456954956055, -35.22339630126953, -31.96222686767578, -28.701053619384766, -25.439882278442383, -22.1787109375, -18.917537689208984, -15.656366348266602, -12.395195007324219, -9.134023666381836, -5.872851371765137, -2.6116790771484375, 0.6494922637939453, 3.910663604736328, 7.171836853027344, 10.433008193969727, 13.69417953491211, 16.955350875854492, 20.216522216796875, 23.47769546508789, 26.738866806030273, 30.000038146972656, 33.26121139526367, 36.52238464355469, 39.78355407714844, 43.04472732543945, 46.3058967590332, 49.56707000732422, 52.82823944091797, 56.089412689208984, 59.3505859375, 62.61175537109375, 65.8729248046875, 69.13409423828125, 72.39527130126953, 75.65644073486328, 78.91761016845703, 82.17878723144531, 85.43995666503906, 88.70112609863281, 91.9623031616211, 95.22347259521484, 98.48464965820312, 101.74581909179688, 105.00698852539062, 108.26815795898438, 111.52933502197266, 114.7905044555664, 118.05168151855469, 121.31285095214844, 124.57402801513672, 127.83519744873047, 131.09637451171875, 134.3575439453125, 137.61871337890625, 140.8798828125, 144.14105224609375]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 4.0, 2.0, 5.0, 1.0, 8.0, 9.0, 9.0, 9.0, 12.0, 17.0, 14.0, 16.0, 12.0, 19.0, 35.0, 18.0, 31.0, 30.0, 39.0, 46.0, 46.0, 73.0, 70.0, 63.0, 56.0, 43.0, 41.0, 34.0, 37.0, 21.0, 22.0, 21.0, 19.0, 17.0, 19.0, 8.0, 9.0, 14.0, 7.0, 12.0, 9.0, 10.0, 3.0, 6.0, 6.0, 2.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-34.876930236816406, -33.84788131713867, -32.81883239746094, -31.78978729248047, -30.760738372802734, -29.731689453125, -28.7026424407959, -27.673595428466797, -26.644546508789062, -25.615497589111328, -24.586450576782227, -23.557403564453125, -22.52835464477539, -21.499305725097656, -20.470258712768555, -19.441211700439453, -18.41216278076172, -17.383113861083984, -16.354066848754883, -15.325018882751465, -14.295970916748047, -13.266922950744629, -12.237874984741211, -11.208827018737793, -10.179779052734375, -9.150731086730957, -8.121683120727539, -7.092635154724121, -6.063587188720703, -5.034539222717285, -4.005491256713867, -2.976443290710449, -1.947397232055664, -0.9183492660522461, 0.11069869995117188, 1.1397466659545898, 2.168794631958008, 3.197842597961426, 4.226890563964844, 5.255938529968262, 6.28498649597168, 7.314034461975098, 8.343082427978516, 9.372130393981934, 10.401178359985352, 11.43022632598877, 12.459274291992188, 13.488322257995605, 14.517370223999023, 15.546418190002441, 16.57546615600586, 17.604515075683594, 18.633562088012695, 19.662609100341797, 20.69165802001953, 21.720706939697266, 22.749753952026367, 23.77880096435547, 24.807849884033203, 25.836898803710938, 26.86594581604004, 27.89499282836914, 28.924041748046875, 29.95309066772461, 30.98213768005371]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 4.0, 12.0, 12.0, 5.0, 13.0, 11.0, 38.0, 57.0, 107.0, 261.0, 546.0, 1885.0, 9168.0, 97411.0, 3435140.0, 619677.0, 24588.0, 3721.0, 911.0, 374.0, 156.0, 90.0, 48.0, 15.0, 10.0, 10.0, 7.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.43359375, -7.2510986328125, -7.068603515625, -6.8861083984375, -6.70361328125, -6.5211181640625, -6.338623046875, -6.1561279296875, -5.9736328125, -5.7911376953125, -5.608642578125, -5.4261474609375, -5.24365234375, -5.0611572265625, -4.878662109375, -4.6961669921875, -4.513671875, -4.3311767578125, -4.148681640625, -3.9661865234375, -3.78369140625, -3.6011962890625, -3.418701171875, -3.2362060546875, -3.0537109375, -2.8712158203125, -2.688720703125, -2.5062255859375, -2.32373046875, -2.1412353515625, -1.958740234375, -1.7762451171875, -1.59375, -1.4112548828125, -1.228759765625, -1.0462646484375, -0.86376953125, -0.6812744140625, -0.498779296875, -0.3162841796875, -0.1337890625, 0.0487060546875, 0.231201171875, 0.4136962890625, 0.59619140625, 0.7786865234375, 0.961181640625, 1.1436767578125, 1.326171875, 1.5086669921875, 1.691162109375, 1.8736572265625, 2.05615234375, 2.2386474609375, 2.421142578125, 2.6036376953125, 2.7861328125, 2.9686279296875, 3.151123046875, 3.3336181640625, 3.51611328125, 3.6986083984375, 3.881103515625, 4.0635986328125, 4.24609375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 6.0, 2.0, 7.0, 7.0, 17.0, 16.0, 16.0, 21.0, 26.0, 36.0, 27.0, 35.0, 43.0, 29.0, 47.0, 49.0, 49.0, 59.0, 60.0, 49.0, 45.0, 49.0, 55.0, 42.0, 29.0, 29.0, 28.0, 29.0, 24.0, 19.0, 13.0, 13.0, 9.0, 7.0, 4.0, 5.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.48828125, -2.417266845703125, -2.34625244140625, -2.275238037109375, -2.2042236328125, -2.133209228515625, -2.06219482421875, -1.991180419921875, -1.920166015625, -1.849151611328125, -1.77813720703125, -1.707122802734375, -1.6361083984375, -1.565093994140625, -1.49407958984375, -1.423065185546875, -1.35205078125, -1.281036376953125, -1.21002197265625, -1.139007568359375, -1.0679931640625, -0.996978759765625, -0.92596435546875, -0.854949951171875, -0.783935546875, -0.712921142578125, -0.64190673828125, -0.570892333984375, -0.4998779296875, -0.428863525390625, -0.35784912109375, -0.286834716796875, -0.2158203125, -0.144805908203125, -0.07379150390625, -0.002777099609375, 0.0682373046875, 0.139251708984375, 0.21026611328125, 0.281280517578125, 0.352294921875, 0.423309326171875, 0.49432373046875, 0.565338134765625, 0.6363525390625, 0.707366943359375, 0.77838134765625, 0.849395751953125, 0.92041015625, 0.991424560546875, 1.06243896484375, 1.133453369140625, 1.2044677734375, 1.275482177734375, 1.34649658203125, 1.417510986328125, 1.488525390625, 1.559539794921875, 1.63055419921875, 1.701568603515625, 1.7725830078125, 1.843597412109375, 1.91461181640625, 1.985626220703125, 2.056640625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 6.0, 5.0, 9.0, 7.0, 15.0, 17.0, 21.0, 37.0, 59.0, 71.0, 135.0, 168.0, 322.0, 602.0, 1319.0, 3105.0, 9084.0, 36312.0, 307519.0, 3554973.0, 237992.0, 30193.0, 7652.0, 2469.0, 988.0, 457.0, 240.0, 146.0, 100.0, 55.0, 59.0, 38.0, 25.0, 22.0, 13.0, 7.0, 8.0, 10.0, 7.0, 6.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.83203125, -4.68316650390625, -4.5343017578125, -4.38543701171875, -4.236572265625, -4.08770751953125, -3.9388427734375, -3.78997802734375, -3.64111328125, -3.49224853515625, -3.3433837890625, -3.19451904296875, -3.045654296875, -2.89678955078125, -2.7479248046875, -2.59906005859375, -2.4501953125, -2.30133056640625, -2.1524658203125, -2.00360107421875, -1.854736328125, -1.70587158203125, -1.5570068359375, -1.40814208984375, -1.25927734375, -1.11041259765625, -0.9615478515625, -0.81268310546875, -0.663818359375, -0.51495361328125, -0.3660888671875, -0.21722412109375, -0.068359375, 0.08050537109375, 0.2293701171875, 0.37823486328125, 0.527099609375, 0.67596435546875, 0.8248291015625, 0.97369384765625, 1.12255859375, 1.27142333984375, 1.4202880859375, 1.56915283203125, 1.718017578125, 1.86688232421875, 2.0157470703125, 2.16461181640625, 2.3134765625, 2.46234130859375, 2.6112060546875, 2.76007080078125, 2.908935546875, 3.05780029296875, 3.2066650390625, 3.35552978515625, 3.50439453125, 3.65325927734375, 3.8021240234375, 3.95098876953125, 4.099853515625, 4.24871826171875, 4.3975830078125, 4.54644775390625, 4.6953125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 4.0, 0.0, 1.0, 4.0, 3.0, 2.0, 10.0, 3.0, 1.0, 14.0, 13.0, 9.0, 29.0, 34.0, 33.0, 54.0, 58.0, 99.0, 184.0, 312.0, 513.0, 833.0, 728.0, 422.0, 253.0, 151.0, 99.0, 55.0, 38.0, 35.0, 18.0, 27.0, 10.0, 10.0, 6.0, 4.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.71875, -4.5833740234375, -4.447998046875, -4.3126220703125, -4.17724609375, -4.0418701171875, -3.906494140625, -3.7711181640625, -3.6357421875, -3.5003662109375, -3.364990234375, -3.2296142578125, -3.09423828125, -2.9588623046875, -2.823486328125, -2.6881103515625, -2.552734375, -2.4173583984375, -2.281982421875, -2.1466064453125, -2.01123046875, -1.8758544921875, -1.740478515625, -1.6051025390625, -1.4697265625, -1.3343505859375, -1.198974609375, -1.0635986328125, -0.92822265625, -0.7928466796875, -0.657470703125, -0.5220947265625, -0.38671875, -0.2513427734375, -0.115966796875, 0.0194091796875, 0.15478515625, 0.2901611328125, 0.425537109375, 0.5609130859375, 0.6962890625, 0.8316650390625, 0.967041015625, 1.1024169921875, 1.23779296875, 1.3731689453125, 1.508544921875, 1.6439208984375, 1.779296875, 1.9146728515625, 2.050048828125, 2.1854248046875, 2.32080078125, 2.4561767578125, 2.591552734375, 2.7269287109375, 2.8623046875, 2.9976806640625, 3.133056640625, 3.2684326171875, 3.40380859375, 3.5391845703125, 3.674560546875, 3.8099365234375, 3.9453125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 6.0, 4.0, 8.0, 7.0, 19.0, 26.0, 57.0, 139.0, 212.0, 237.0, 155.0, 70.0, 30.0, 11.0, 9.0, 7.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-66.54733276367188, -65.01029968261719, -63.473262786865234, -61.93622970581055, -60.399192810058594, -58.862159729003906, -57.32512283325195, -55.788089752197266, -54.25105285644531, -52.714019775390625, -51.17698287963867, -49.639949798583984, -48.10291290283203, -46.565879821777344, -45.02884292602539, -43.4918098449707, -41.95477294921875, -40.41773986816406, -38.88070297241211, -37.34366989135742, -35.80663299560547, -34.26959991455078, -32.73256301879883, -31.19552993774414, -29.658496856689453, -28.121461868286133, -26.584426879882812, -25.047391891479492, -23.510356903076172, -21.97332191467285, -20.43628692626953, -18.899253845214844, -17.362218856811523, -15.825183868408203, -14.288148880004883, -12.751113891601562, -11.214078903198242, -9.677043914794922, -8.140009880065918, -6.602974891662598, -5.065939903259277, -3.528904914855957, -1.9918701648712158, -0.4548354148864746, 1.0821995735168457, 2.619234561920166, 4.156269073486328, 5.693304061889648, 7.230339050292969, 8.767374038696289, 10.30440902709961, 11.84144401550293, 13.37847900390625, 14.91551399230957, 16.45254898071289, 17.989582061767578, 19.52661895751953, 21.06365394592285, 22.600688934326172, 24.137723922729492, 25.674758911132812, 27.211793899536133, 28.748828887939453, 30.28586196899414, 31.82289695739746]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 3.0, 7.0, 16.0, 13.0, 10.0, 24.0, 32.0, 20.0, 39.0, 51.0, 65.0, 56.0, 53.0, 59.0, 70.0, 64.0, 54.0, 48.0, 56.0, 40.0, 42.0, 29.0, 35.0, 26.0, 27.0, 14.0, 9.0, 7.0, 10.0, 7.0, 5.0, 9.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-27.269634246826172, -26.519567489624023, -25.769500732421875, -25.01943588256836, -24.26936912536621, -23.519302368164062, -22.769235610961914, -22.019168853759766, -21.26910400390625, -20.5190372467041, -19.768970489501953, -19.018905639648438, -18.26883888244629, -17.51877212524414, -16.768705368041992, -16.018638610839844, -15.268571853637695, -14.518505096435547, -13.768439292907715, -13.018372535705566, -12.268306732177734, -11.518239974975586, -10.768173217773438, -10.018106460571289, -9.268040657043457, -8.517973899841309, -7.767908096313477, -7.017841339111328, -6.267775058746338, -5.517708778381348, -4.767642021179199, -4.017575740814209, -3.2675113677978516, -2.5174450874328613, -1.767378568649292, -1.0173120498657227, -0.2672457695007324, 0.4828205108642578, 1.2328872680664062, 1.9829535484313965, 2.7330198287963867, 3.483086109161377, 4.233152389526367, 4.983219146728516, 5.733285427093506, 6.483351707458496, 7.2334184646606445, 7.983484745025635, 8.733551025390625, 9.483617782592773, 10.233683586120605, 10.983750343322754, 11.733816146850586, 12.483882904052734, 13.233949661254883, 13.984016418457031, 14.734082221984863, 15.484148979187012, 16.234214782714844, 16.984281539916992, 17.73434829711914, 18.484413146972656, 19.234481811523438, 19.984546661376953, 20.7346134185791]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 5.0, 6.0, 11.0, 13.0, 17.0, 14.0, 33.0, 34.0, 81.0, 95.0, 158.0, 234.0, 358.0, 597.0, 1059.0, 1845.0, 3230.0, 6724.0, 13715.0, 31389.0, 74660.0, 171750.0, 297995.0, 241279.0, 114721.0, 47844.0, 20543.0, 9562.0, 4682.0, 2449.0, 1326.0, 797.0, 470.0, 292.0, 188.0, 125.0, 89.0, 52.0, 26.0, 27.0, 25.0, 13.0, 10.0, 4.0, 5.0, 1.0, 6.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0], "bins": [-3.12890625, -3.03619384765625, -2.9434814453125, -2.85076904296875, -2.758056640625, -2.66534423828125, -2.5726318359375, -2.47991943359375, -2.38720703125, -2.29449462890625, -2.2017822265625, -2.10906982421875, -2.016357421875, -1.92364501953125, -1.8309326171875, -1.73822021484375, -1.6455078125, -1.55279541015625, -1.4600830078125, -1.36737060546875, -1.274658203125, -1.18194580078125, -1.0892333984375, -0.99652099609375, -0.90380859375, -0.81109619140625, -0.7183837890625, -0.62567138671875, -0.532958984375, -0.44024658203125, -0.3475341796875, -0.25482177734375, -0.162109375, -0.06939697265625, 0.0233154296875, 0.11602783203125, 0.208740234375, 0.30145263671875, 0.3941650390625, 0.48687744140625, 0.57958984375, 0.67230224609375, 0.7650146484375, 0.85772705078125, 0.950439453125, 1.04315185546875, 1.1358642578125, 1.22857666015625, 1.3212890625, 1.41400146484375, 1.5067138671875, 1.59942626953125, 1.692138671875, 1.78485107421875, 1.8775634765625, 1.97027587890625, 2.06298828125, 2.15570068359375, 2.2484130859375, 2.34112548828125, 2.433837890625, 2.52655029296875, 2.6192626953125, 2.71197509765625, 2.8046875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 2.0, 8.0, 3.0, 17.0, 13.0, 17.0, 25.0, 22.0, 32.0, 28.0, 45.0, 37.0, 30.0, 35.0, 49.0, 51.0, 45.0, 57.0, 44.0, 52.0, 49.0, 53.0, 37.0, 45.0, 33.0, 40.0, 32.0, 22.0, 22.0, 13.0, 9.0, 8.0, 12.0, 7.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.478515625, -2.406524658203125, -2.33453369140625, -2.262542724609375, -2.1905517578125, -2.118560791015625, -2.04656982421875, -1.974578857421875, -1.902587890625, -1.830596923828125, -1.75860595703125, -1.686614990234375, -1.6146240234375, -1.542633056640625, -1.47064208984375, -1.398651123046875, -1.32666015625, -1.254669189453125, -1.18267822265625, -1.110687255859375, -1.0386962890625, -0.966705322265625, -0.89471435546875, -0.822723388671875, -0.750732421875, -0.678741455078125, -0.60675048828125, -0.534759521484375, -0.4627685546875, -0.390777587890625, -0.31878662109375, -0.246795654296875, -0.1748046875, -0.102813720703125, -0.03082275390625, 0.041168212890625, 0.1131591796875, 0.185150146484375, 0.25714111328125, 0.329132080078125, 0.401123046875, 0.473114013671875, 0.54510498046875, 0.617095947265625, 0.6890869140625, 0.761077880859375, 0.83306884765625, 0.905059814453125, 0.97705078125, 1.049041748046875, 1.12103271484375, 1.193023681640625, 1.2650146484375, 1.337005615234375, 1.40899658203125, 1.480987548828125, 1.552978515625, 1.624969482421875, 1.69696044921875, 1.768951416015625, 1.8409423828125, 1.912933349609375, 1.98492431640625, 2.056915283203125, 2.12890625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 4.0, 10.0, 5.0, 16.0, 9.0, 7.0, 9.0, 19.0, 26.0, 44.0, 41.0, 60.0, 81.0, 165.0, 335.0, 844.0, 2362.0, 9133.0, 48273.0, 336074.0, 573438.0, 61725.0, 11240.0, 2769.0, 934.0, 354.0, 197.0, 107.0, 56.0, 43.0, 39.0, 29.0, 18.0, 18.0, 12.0, 9.0, 11.0, 8.0, 8.0, 10.0, 3.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.90625, -5.70306396484375, -5.4998779296875, -5.29669189453125, -5.093505859375, -4.89031982421875, -4.6871337890625, -4.48394775390625, -4.28076171875, -4.07757568359375, -3.8743896484375, -3.67120361328125, -3.468017578125, -3.26483154296875, -3.0616455078125, -2.85845947265625, -2.6552734375, -2.45208740234375, -2.2489013671875, -2.04571533203125, -1.842529296875, -1.63934326171875, -1.4361572265625, -1.23297119140625, -1.02978515625, -0.82659912109375, -0.6234130859375, -0.42022705078125, -0.217041015625, -0.01385498046875, 0.1893310546875, 0.39251708984375, 0.595703125, 0.79888916015625, 1.0020751953125, 1.20526123046875, 1.408447265625, 1.61163330078125, 1.8148193359375, 2.01800537109375, 2.22119140625, 2.42437744140625, 2.6275634765625, 2.83074951171875, 3.033935546875, 3.23712158203125, 3.4403076171875, 3.64349365234375, 3.8466796875, 4.04986572265625, 4.2530517578125, 4.45623779296875, 4.659423828125, 4.86260986328125, 5.0657958984375, 5.26898193359375, 5.47216796875, 5.67535400390625, 5.8785400390625, 6.08172607421875, 6.284912109375, 6.48809814453125, 6.6912841796875, 6.89447021484375, 7.09765625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 5.0, 3.0, 8.0, 3.0, 3.0, 8.0, 7.0, 15.0, 9.0, 12.0, 21.0, 21.0, 29.0, 31.0, 31.0, 35.0, 45.0, 55.0, 39.0, 44.0, 41.0, 39.0, 53.0, 59.0, 37.0, 43.0, 36.0, 39.0, 33.0, 30.0, 33.0, 24.0, 17.0, 14.0, 12.0, 13.0, 14.0, 5.0, 12.0, 3.0, 6.0, 1.0, 4.0, 6.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.09765625, -5.887451171875, -5.67724609375, -5.467041015625, -5.2568359375, -5.046630859375, -4.83642578125, -4.626220703125, -4.416015625, -4.205810546875, -3.99560546875, -3.785400390625, -3.5751953125, -3.364990234375, -3.15478515625, -2.944580078125, -2.734375, -2.524169921875, -2.31396484375, -2.103759765625, -1.8935546875, -1.683349609375, -1.47314453125, -1.262939453125, -1.052734375, -0.842529296875, -0.63232421875, -0.422119140625, -0.2119140625, -0.001708984375, 0.20849609375, 0.418701171875, 0.62890625, 0.839111328125, 1.04931640625, 1.259521484375, 1.4697265625, 1.679931640625, 1.89013671875, 2.100341796875, 2.310546875, 2.520751953125, 2.73095703125, 2.941162109375, 3.1513671875, 3.361572265625, 3.57177734375, 3.781982421875, 3.9921875, 4.202392578125, 4.41259765625, 4.622802734375, 4.8330078125, 5.043212890625, 5.25341796875, 5.463623046875, 5.673828125, 5.884033203125, 6.09423828125, 6.304443359375, 6.5146484375, 6.724853515625, 6.93505859375, 7.145263671875, 7.35546875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 8.0, 18.0, 21.0, 31.0, 47.0, 110.0, 254.0, 758.0, 3155.0, 22904.0, 338482.0, 645935.0, 31303.0, 4062.0, 945.0, 260.0, 119.0, 45.0, 29.0, 21.0, 13.0, 8.0, 5.0, 7.0, 8.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.9921875, -2.9068603515625, -2.821533203125, -2.7362060546875, -2.65087890625, -2.5655517578125, -2.480224609375, -2.3948974609375, -2.3095703125, -2.2242431640625, -2.138916015625, -2.0535888671875, -1.96826171875, -1.8829345703125, -1.797607421875, -1.7122802734375, -1.626953125, -1.5416259765625, -1.456298828125, -1.3709716796875, -1.28564453125, -1.2003173828125, -1.114990234375, -1.0296630859375, -0.9443359375, -0.8590087890625, -0.773681640625, -0.6883544921875, -0.60302734375, -0.5177001953125, -0.432373046875, -0.3470458984375, -0.26171875, -0.1763916015625, -0.091064453125, -0.0057373046875, 0.07958984375, 0.1649169921875, 0.250244140625, 0.3355712890625, 0.4208984375, 0.5062255859375, 0.591552734375, 0.6768798828125, 0.76220703125, 0.8475341796875, 0.932861328125, 1.0181884765625, 1.103515625, 1.1888427734375, 1.274169921875, 1.3594970703125, 1.44482421875, 1.5301513671875, 1.615478515625, 1.7008056640625, 1.7861328125, 1.8714599609375, 1.956787109375, 2.0421142578125, 2.12744140625, 2.2127685546875, 2.298095703125, 2.3834228515625, 2.46875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 4.0, 5.0, 7.0, 4.0, 1.0, 8.0, 13.0, 9.0, 18.0, 19.0, 21.0, 37.0, 58.0, 52.0, 75.0, 83.0, 78.0, 87.0, 71.0, 75.0, 62.0, 50.0, 24.0, 34.0, 26.0, 18.0, 15.0, 13.0, 9.0, 9.0, 6.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00036454200744628906, -0.0003500916063785553, -0.00033564120531082153, -0.00032119080424308777, -0.000306740403175354, -0.00029229000210762024, -0.0002778396010398865, -0.0002633891999721527, -0.00024893879890441895, -0.00023448839783668518, -0.00022003799676895142, -0.00020558759570121765, -0.0001911371946334839, -0.00017668679356575012, -0.00016223639249801636, -0.0001477859914302826, -0.00013333559036254883, -0.00011888518929481506, -0.0001044347882270813, -8.998438715934753e-05, -7.553398609161377e-05, -6.108358502388e-05, -4.663318395614624e-05, -3.2182782888412476e-05, -1.773238182067871e-05, -3.2819807529449463e-06, 1.1168420314788818e-05, 2.5618821382522583e-05, 4.006922245025635e-05, 5.451962351799011e-05, 6.897002458572388e-05, 8.342042565345764e-05, 9.78708267211914e-05, 0.00011232122778892517, 0.00012677162885665894, 0.0001412220299243927, 0.00015567243099212646, 0.00017012283205986023, 0.000184573233127594, 0.00019902363419532776, 0.00021347403526306152, 0.0002279244363307953, 0.00024237483739852905, 0.0002568252384662628, 0.0002712756395339966, 0.00028572604060173035, 0.0003001764416694641, 0.0003146268427371979, 0.00032907724380493164, 0.0003435276448726654, 0.00035797804594039917, 0.00037242844700813293, 0.0003868788480758667, 0.00040132924914360046, 0.00041577965021133423, 0.000430230051279068, 0.00044468045234680176, 0.0004591308534145355, 0.0004735812544822693, 0.00048803165555000305, 0.0005024820566177368, 0.0005169324576854706, 0.0005313828587532043, 0.0005458332598209381, 0.0005602836608886719]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 1.0, 4.0, 5.0, 8.0, 5.0, 9.0, 14.0, 21.0, 34.0, 24.0, 48.0, 95.0, 144.0, 293.0, 538.0, 1253.0, 3270.0, 12021.0, 61173.0, 526390.0, 369669.0, 56161.0, 11631.0, 3267.0, 1267.0, 554.0, 250.0, 138.0, 93.0, 63.0, 36.0, 26.0, 13.0, 12.0, 5.0, 9.0, 5.0, 5.0, 3.0, 2.0, 0.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.263671875, -1.20867919921875, -1.1536865234375, -1.09869384765625, -1.043701171875, -0.98870849609375, -0.9337158203125, -0.87872314453125, -0.82373046875, -0.76873779296875, -0.7137451171875, -0.65875244140625, -0.603759765625, -0.54876708984375, -0.4937744140625, -0.43878173828125, -0.3837890625, -0.32879638671875, -0.2738037109375, -0.21881103515625, -0.163818359375, -0.10882568359375, -0.0538330078125, 0.00115966796875, 0.05615234375, 0.11114501953125, 0.1661376953125, 0.22113037109375, 0.276123046875, 0.33111572265625, 0.3861083984375, 0.44110107421875, 0.49609375, 0.55108642578125, 0.6060791015625, 0.66107177734375, 0.716064453125, 0.77105712890625, 0.8260498046875, 0.88104248046875, 0.93603515625, 0.99102783203125, 1.0460205078125, 1.10101318359375, 1.156005859375, 1.21099853515625, 1.2659912109375, 1.32098388671875, 1.3759765625, 1.43096923828125, 1.4859619140625, 1.54095458984375, 1.595947265625, 1.65093994140625, 1.7059326171875, 1.76092529296875, 1.81591796875, 1.87091064453125, 1.9259033203125, 1.98089599609375, 2.035888671875, 2.09088134765625, 2.1458740234375, 2.20086669921875, 2.255859375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 8.0, 15.0, 19.0, 29.0, 42.0, 60.0, 89.0, 94.0, 122.0, 99.0, 113.0, 81.0, 60.0, 47.0, 38.0, 26.0, 13.0, 8.0, 12.0, 7.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8134765625, -1.7393646240234375, -1.665252685546875, -1.5911407470703125, -1.51702880859375, -1.4429168701171875, -1.368804931640625, -1.2946929931640625, -1.2205810546875, -1.1464691162109375, -1.072357177734375, -0.9982452392578125, -0.92413330078125, -0.8500213623046875, -0.775909423828125, -0.7017974853515625, -0.627685546875, -0.5535736083984375, -0.479461669921875, -0.4053497314453125, -0.33123779296875, -0.2571258544921875, -0.183013916015625, -0.1089019775390625, -0.0347900390625, 0.0393218994140625, 0.113433837890625, 0.1875457763671875, 0.26165771484375, 0.3357696533203125, 0.409881591796875, 0.4839935302734375, 0.55810546875, 0.6322174072265625, 0.706329345703125, 0.7804412841796875, 0.85455322265625, 0.9286651611328125, 1.002777099609375, 1.0768890380859375, 1.1510009765625, 1.2251129150390625, 1.299224853515625, 1.3733367919921875, 1.44744873046875, 1.5215606689453125, 1.595672607421875, 1.6697845458984375, 1.743896484375, 1.8180084228515625, 1.892120361328125, 1.9662322998046875, 2.04034423828125, 2.1144561767578125, 2.188568115234375, 2.2626800537109375, 2.3367919921875, 2.4109039306640625, 2.485015869140625, 2.5591278076171875, 2.63323974609375, 2.7073516845703125, 2.781463623046875, 2.8555755615234375, 2.9296875]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 3.0, 3.0, 5.0, 3.0, 7.0, 9.0, 11.0, 18.0, 38.0, 46.0, 100.0, 140.0, 234.0, 130.0, 84.0, 63.0, 37.0, 30.0, 16.0, 7.0, 6.0, 5.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.138591766357422, -23.064472198486328, -21.9903507232666, -20.916229248046875, -19.84210968017578, -18.767990112304688, -17.69386863708496, -16.619747161865234, -15.54562759399414, -14.47150707244873, -13.39738655090332, -12.32326602935791, -11.2491455078125, -10.17502498626709, -9.10090446472168, -8.02678394317627, -6.952663421630859, -5.878542900085449, -4.804422378540039, -3.730301856994629, -2.6561813354492188, -1.5820608139038086, -0.5079402923583984, 0.5661802291870117, 1.6403007507324219, 2.714421272277832, 3.788541793823242, 4.862662315368652, 5.9367828369140625, 7.010903358459473, 8.085023880004883, 9.159144401550293, 10.233261108398438, 11.307381629943848, 12.381502151489258, 13.455622673034668, 14.529743194580078, 15.603863716125488, 16.6779842376709, 17.752105712890625, 18.82622528076172, 19.900344848632812, 20.97446632385254, 22.048587799072266, 23.12270736694336, 24.196826934814453, 25.27094841003418, 26.345069885253906, 27.419189453125, 28.493309020996094, 29.56743049621582, 30.641551971435547, 31.71567153930664, 32.789791107177734, 33.863914489746094, 34.93803405761719, 36.01215362548828, 37.086273193359375, 38.16039276123047, 39.23451614379883, 40.30863571166992, 41.382755279541016, 42.456878662109375, 43.53099822998047, 44.60511779785156]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 2.0, 3.0, 2.0, 2.0, 8.0, 11.0, 13.0, 11.0, 18.0, 16.0, 6.0, 17.0, 11.0, 18.0, 28.0, 26.0, 17.0, 29.0, 35.0, 28.0, 37.0, 61.0, 58.0, 78.0, 69.0, 60.0, 51.0, 30.0, 34.0, 32.0, 19.0, 34.0, 15.0, 19.0, 16.0, 10.0, 8.0, 13.0, 16.0, 8.0, 5.0, 13.0, 3.0, 4.0, 6.0, 3.0, 4.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-26.756919860839844, -25.931365966796875, -25.105810165405273, -24.280256271362305, -23.454700469970703, -22.629146575927734, -21.803592681884766, -20.978036880493164, -20.152481079101562, -19.326927185058594, -18.501371383666992, -17.675817489624023, -16.850261688232422, -16.024707794189453, -15.199152946472168, -14.373598098754883, -13.548044204711914, -12.722489356994629, -11.896934509277344, -11.071380615234375, -10.245824813842773, -9.420270919799805, -8.59471607208252, -7.769161224365234, -6.943606376647949, -6.118051528930664, -5.292496681213379, -4.466942310333252, -3.641387462615967, -2.8158326148986816, -1.9902782440185547, -1.1647233963012695, -0.3391685485839844, 0.48638617992401123, 1.3119409084320068, 2.137495517730713, 2.963050365447998, 3.788605213165283, 4.61415958404541, 5.439714431762695, 6.2652692794799805, 7.090824127197266, 7.916378974914551, 8.741933822631836, 9.567487716674805, 10.393043518066406, 11.218597412109375, 12.04415225982666, 12.869707107543945, 13.69526195526123, 14.520816802978516, 15.346370697021484, 16.171926498413086, 16.997480392456055, 17.823036193847656, 18.648590087890625, 19.474143981933594, 20.299697875976562, 21.125253677368164, 21.950807571411133, 22.776363372802734, 23.601917266845703, 24.427471160888672, 25.253026962280273, 26.078582763671875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 6.0, 1.0, 4.0, 5.0, 4.0, 8.0, 7.0, 16.0, 19.0, 25.0, 42.0, 58.0, 100.0, 136.0, 299.0, 563.0, 1229.0, 3537.0, 12279.0, 92444.0, 2439006.0, 1559680.0, 68187.0, 11159.0, 3118.0, 1149.0, 534.0, 276.0, 140.0, 89.0, 43.0, 43.0, 22.0, 18.0, 13.0, 10.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0], "bins": [-5.4296875, -5.300201416015625, -5.17071533203125, -5.041229248046875, -4.9117431640625, -4.782257080078125, -4.65277099609375, -4.523284912109375, -4.393798828125, -4.264312744140625, -4.13482666015625, -4.005340576171875, -3.8758544921875, -3.746368408203125, -3.61688232421875, -3.487396240234375, -3.35791015625, -3.228424072265625, -3.09893798828125, -2.969451904296875, -2.8399658203125, -2.710479736328125, -2.58099365234375, -2.451507568359375, -2.322021484375, -2.192535400390625, -2.06304931640625, -1.933563232421875, -1.8040771484375, -1.674591064453125, -1.54510498046875, -1.415618896484375, -1.2861328125, -1.156646728515625, -1.02716064453125, -0.897674560546875, -0.7681884765625, -0.638702392578125, -0.50921630859375, -0.379730224609375, -0.250244140625, -0.120758056640625, 0.00872802734375, 0.138214111328125, 0.2677001953125, 0.397186279296875, 0.52667236328125, 0.656158447265625, 0.78564453125, 0.915130615234375, 1.04461669921875, 1.174102783203125, 1.3035888671875, 1.433074951171875, 1.56256103515625, 1.692047119140625, 1.821533203125, 1.951019287109375, 2.08050537109375, 2.209991455078125, 2.3394775390625, 2.468963623046875, 2.59844970703125, 2.727935791015625, 2.857421875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 7.0, 3.0, 5.0, 11.0, 10.0, 12.0, 18.0, 21.0, 29.0, 30.0, 33.0, 51.0, 38.0, 49.0, 39.0, 31.0, 46.0, 61.0, 49.0, 58.0, 55.0, 55.0, 58.0, 38.0, 45.0, 31.0, 30.0, 24.0, 8.0, 24.0, 11.0, 9.0, 5.0, 5.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4765625, -2.405242919921875, -2.33392333984375, -2.262603759765625, -2.1912841796875, -2.119964599609375, -2.04864501953125, -1.977325439453125, -1.906005859375, -1.834686279296875, -1.76336669921875, -1.692047119140625, -1.6207275390625, -1.549407958984375, -1.47808837890625, -1.406768798828125, -1.33544921875, -1.264129638671875, -1.19281005859375, -1.121490478515625, -1.0501708984375, -0.978851318359375, -0.90753173828125, -0.836212158203125, -0.764892578125, -0.693572998046875, -0.62225341796875, -0.550933837890625, -0.4796142578125, -0.408294677734375, -0.33697509765625, -0.265655517578125, -0.1943359375, -0.123016357421875, -0.05169677734375, 0.019622802734375, 0.0909423828125, 0.162261962890625, 0.23358154296875, 0.304901123046875, 0.376220703125, 0.447540283203125, 0.51885986328125, 0.590179443359375, 0.6614990234375, 0.732818603515625, 0.80413818359375, 0.875457763671875, 0.94677734375, 1.018096923828125, 1.08941650390625, 1.160736083984375, 1.2320556640625, 1.303375244140625, 1.37469482421875, 1.446014404296875, 1.517333984375, 1.588653564453125, 1.65997314453125, 1.731292724609375, 1.8026123046875, 1.873931884765625, 1.94525146484375, 2.016571044921875, 2.087890625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 9.0, 12.0, 24.0, 35.0, 56.0, 111.0, 229.0, 544.0, 2629.0, 38200.0, 4063786.0, 83900.0, 3665.0, 606.0, 220.0, 105.0, 56.0, 38.0, 27.0, 17.0, 3.0, 6.0, 2.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.9609375, -9.612548828125, -9.26416015625, -8.915771484375, -8.5673828125, -8.218994140625, -7.87060546875, -7.522216796875, -7.173828125, -6.825439453125, -6.47705078125, -6.128662109375, -5.7802734375, -5.431884765625, -5.08349609375, -4.735107421875, -4.38671875, -4.038330078125, -3.68994140625, -3.341552734375, -2.9931640625, -2.644775390625, -2.29638671875, -1.947998046875, -1.599609375, -1.251220703125, -0.90283203125, -0.554443359375, -0.2060546875, 0.142333984375, 0.49072265625, 0.839111328125, 1.1875, 1.535888671875, 1.88427734375, 2.232666015625, 2.5810546875, 2.929443359375, 3.27783203125, 3.626220703125, 3.974609375, 4.322998046875, 4.67138671875, 5.019775390625, 5.3681640625, 5.716552734375, 6.06494140625, 6.413330078125, 6.76171875, 7.110107421875, 7.45849609375, 7.806884765625, 8.1552734375, 8.503662109375, 8.85205078125, 9.200439453125, 9.548828125, 9.897216796875, 10.24560546875, 10.593994140625, 10.9423828125, 11.290771484375, 11.63916015625, 11.987548828125, 12.3359375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 5.0, 7.0, 10.0, 17.0, 18.0, 32.0, 54.0, 112.0, 192.0, 459.0, 1036.0, 1095.0, 534.0, 232.0, 96.0, 71.0, 25.0, 24.0, 20.0, 11.0, 9.0, 5.0, 2.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.1484375, -7.96759033203125, -7.7867431640625, -7.60589599609375, -7.425048828125, -7.24420166015625, -7.0633544921875, -6.88250732421875, -6.70166015625, -6.52081298828125, -6.3399658203125, -6.15911865234375, -5.978271484375, -5.79742431640625, -5.6165771484375, -5.43572998046875, -5.2548828125, -5.07403564453125, -4.8931884765625, -4.71234130859375, -4.531494140625, -4.35064697265625, -4.1697998046875, -3.98895263671875, -3.80810546875, -3.62725830078125, -3.4464111328125, -3.26556396484375, -3.084716796875, -2.90386962890625, -2.7230224609375, -2.54217529296875, -2.361328125, -2.18048095703125, -1.9996337890625, -1.81878662109375, -1.637939453125, -1.45709228515625, -1.2762451171875, -1.09539794921875, -0.91455078125, -0.73370361328125, -0.5528564453125, -0.37200927734375, -0.191162109375, -0.01031494140625, 0.1705322265625, 0.35137939453125, 0.5322265625, 0.71307373046875, 0.8939208984375, 1.07476806640625, 1.255615234375, 1.43646240234375, 1.6173095703125, 1.79815673828125, 1.97900390625, 2.15985107421875, 2.3406982421875, 2.52154541015625, 2.702392578125, 2.88323974609375, 3.0640869140625, 3.24493408203125, 3.42578125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 25.0, 88.0, 355.0, 396.0, 96.0, 34.0, 6.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.89376449584961, -50.90268325805664, -47.91160202026367, -44.9205207824707, -41.929439544677734, -38.938358306884766, -35.9472770690918, -32.95619583129883, -29.96511459350586, -26.97403335571289, -23.982952117919922, -20.991870880126953, -18.000789642333984, -15.009708404541016, -12.018627166748047, -9.027545928955078, -6.036464691162109, -3.0453834533691406, -0.054302215576171875, 2.936779022216797, 5.927860260009766, 8.918941497802734, 11.910022735595703, 14.901103973388672, 17.89218521118164, 20.88326644897461, 23.874347686767578, 26.865428924560547, 29.856510162353516, 32.847591400146484, 35.83867263793945, 38.82975387573242, 41.820831298828125, 44.811912536621094, 47.80299377441406, 50.79407501220703, 53.78515625, 56.77623748779297, 59.76731872558594, 62.758399963378906, 65.74948120117188, 68.74056243896484, 71.73164367675781, 74.72272491455078, 77.71380615234375, 80.70488739013672, 83.69596862792969, 86.68704986572266, 89.67813110351562, 92.6692123413086, 95.66029357910156, 98.65137481689453, 101.6424560546875, 104.63353729248047, 107.62461853027344, 110.6156997680664, 113.60678100585938, 116.59786224365234, 119.58894348144531, 122.58002471923828, 125.57110595703125, 128.56219482421875, 131.5532684326172, 134.54434204101562, 137.53543090820312]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 7.0, 6.0, 4.0, 4.0, 7.0, 8.0, 8.0, 17.0, 19.0, 13.0, 22.0, 22.0, 29.0, 20.0, 29.0, 32.0, 31.0, 37.0, 35.0, 50.0, 49.0, 40.0, 50.0, 52.0, 48.0, 41.0, 45.0, 41.0, 22.0, 27.0, 30.0, 25.0, 19.0, 19.0, 16.0, 17.0, 16.0, 13.0, 7.0, 7.0, 7.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.770204544067383, -16.2814998626709, -15.792797088623047, -15.304093360900879, -14.815389633178711, -14.326684951782227, -13.837981224060059, -13.34927749633789, -12.860573768615723, -12.371870040893555, -11.883166313171387, -11.394462585449219, -10.905757904052734, -10.417055130004883, -9.928350448608398, -9.43964672088623, -8.950942993164062, -8.462239265441895, -7.973535537719727, -7.4848313331604, -6.996127605438232, -6.5074238777160645, -6.018719673156738, -5.53001594543457, -5.041312217712402, -4.552608489990234, -4.063904762268066, -3.5752005577087402, -3.0864968299865723, -2.5977931022644043, -2.1090891361236572, -1.6203851699829102, -1.1316814422607422, -0.6429775953292847, -0.15427374839782715, 0.33443009853363037, 0.8231339454650879, 1.3118376731872559, 1.800541639328003, 2.28924560546875, 2.777949333190918, 3.266653060913086, 3.755357027053833, 4.24406099319458, 4.732764720916748, 5.221468448638916, 5.710172653198242, 6.19887638092041, 6.687580108642578, 7.176283836364746, 7.664987564086914, 8.153691291809082, 8.64239501953125, 9.131099700927734, 9.619803428649902, 10.10850715637207, 10.597210884094238, 11.085914611816406, 11.574618339538574, 12.063322067260742, 12.552026748657227, 13.040729522705078, 13.529434204101562, 14.01813793182373, 14.506841659545898]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 5.0, 6.0, 9.0, 17.0, 22.0, 26.0, 39.0, 87.0, 109.0, 185.0, 291.0, 528.0, 932.0, 1686.0, 3393.0, 6872.0, 15279.0, 37109.0, 94123.0, 247677.0, 362401.0, 167365.0, 63470.0, 25371.0, 10956.0, 4951.0, 2448.0, 1365.0, 729.0, 406.0, 264.0, 172.0, 88.0, 57.0, 37.0, 18.0, 21.0, 16.0, 3.0, 12.0, 2.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.220703125, -3.12396240234375, -3.0272216796875, -2.93048095703125, -2.833740234375, -2.73699951171875, -2.6402587890625, -2.54351806640625, -2.44677734375, -2.35003662109375, -2.2532958984375, -2.15655517578125, -2.059814453125, -1.96307373046875, -1.8663330078125, -1.76959228515625, -1.6728515625, -1.57611083984375, -1.4793701171875, -1.38262939453125, -1.285888671875, -1.18914794921875, -1.0924072265625, -0.99566650390625, -0.89892578125, -0.80218505859375, -0.7054443359375, -0.60870361328125, -0.511962890625, -0.41522216796875, -0.3184814453125, -0.22174072265625, -0.125, -0.02825927734375, 0.0684814453125, 0.16522216796875, 0.261962890625, 0.35870361328125, 0.4554443359375, 0.55218505859375, 0.64892578125, 0.74566650390625, 0.8424072265625, 0.93914794921875, 1.035888671875, 1.13262939453125, 1.2293701171875, 1.32611083984375, 1.4228515625, 1.51959228515625, 1.6163330078125, 1.71307373046875, 1.809814453125, 1.90655517578125, 2.0032958984375, 2.10003662109375, 2.19677734375, 2.29351806640625, 2.3902587890625, 2.48699951171875, 2.583740234375, 2.68048095703125, 2.7772216796875, 2.87396240234375, 2.970703125]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 5.0, 8.0, 14.0, 18.0, 16.0, 19.0, 30.0, 25.0, 40.0, 42.0, 50.0, 49.0, 41.0, 44.0, 51.0, 58.0, 61.0, 51.0, 58.0, 41.0, 54.0, 55.0, 30.0, 29.0, 32.0, 16.0, 14.0, 15.0, 7.0, 10.0, 1.0, 6.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.654296875, -2.57916259765625, -2.5040283203125, -2.42889404296875, -2.353759765625, -2.27862548828125, -2.2034912109375, -2.12835693359375, -2.05322265625, -1.97808837890625, -1.9029541015625, -1.82781982421875, -1.752685546875, -1.67755126953125, -1.6024169921875, -1.52728271484375, -1.4521484375, -1.37701416015625, -1.3018798828125, -1.22674560546875, -1.151611328125, -1.07647705078125, -1.0013427734375, -0.92620849609375, -0.85107421875, -0.77593994140625, -0.7008056640625, -0.62567138671875, -0.550537109375, -0.47540283203125, -0.4002685546875, -0.32513427734375, -0.25, -0.17486572265625, -0.0997314453125, -0.02459716796875, 0.050537109375, 0.12567138671875, 0.2008056640625, 0.27593994140625, 0.35107421875, 0.42620849609375, 0.5013427734375, 0.57647705078125, 0.651611328125, 0.72674560546875, 0.8018798828125, 0.87701416015625, 0.9521484375, 1.02728271484375, 1.1024169921875, 1.17755126953125, 1.252685546875, 1.32781982421875, 1.4029541015625, 1.47808837890625, 1.55322265625, 1.62835693359375, 1.7034912109375, 1.77862548828125, 1.853759765625, 1.92889404296875, 2.0040283203125, 2.07916259765625, 2.154296875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 8.0, 9.0, 10.0, 17.0, 11.0, 23.0, 39.0, 52.0, 76.0, 133.0, 210.0, 316.0, 584.0, 1179.0, 2846.0, 10319.0, 55768.0, 642580.0, 285686.0, 36795.0, 7467.0, 2155.0, 887.0, 482.0, 306.0, 172.0, 126.0, 64.0, 78.0, 38.0, 37.0, 18.0, 15.0, 11.0, 6.0, 7.0, 11.0, 7.0, 5.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-6.0859375, -5.89508056640625, -5.7042236328125, -5.51336669921875, -5.322509765625, -5.13165283203125, -4.9407958984375, -4.74993896484375, -4.55908203125, -4.36822509765625, -4.1773681640625, -3.98651123046875, -3.795654296875, -3.60479736328125, -3.4139404296875, -3.22308349609375, -3.0322265625, -2.84136962890625, -2.6505126953125, -2.45965576171875, -2.268798828125, -2.07794189453125, -1.8870849609375, -1.69622802734375, -1.50537109375, -1.31451416015625, -1.1236572265625, -0.93280029296875, -0.741943359375, -0.55108642578125, -0.3602294921875, -0.16937255859375, 0.021484375, 0.21234130859375, 0.4031982421875, 0.59405517578125, 0.784912109375, 0.97576904296875, 1.1666259765625, 1.35748291015625, 1.54833984375, 1.73919677734375, 1.9300537109375, 2.12091064453125, 2.311767578125, 2.50262451171875, 2.6934814453125, 2.88433837890625, 3.0751953125, 3.26605224609375, 3.4569091796875, 3.64776611328125, 3.838623046875, 4.02947998046875, 4.2203369140625, 4.41119384765625, 4.60205078125, 4.79290771484375, 4.9837646484375, 5.17462158203125, 5.365478515625, 5.55633544921875, 5.7471923828125, 5.93804931640625, 6.12890625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 6.0, 6.0, 3.0, 5.0, 8.0, 14.0, 13.0, 20.0, 19.0, 22.0, 24.0, 25.0, 36.0, 38.0, 39.0, 41.0, 54.0, 42.0, 52.0, 49.0, 55.0, 50.0, 45.0, 31.0, 35.0, 31.0, 36.0, 39.0, 22.0, 34.0, 20.0, 17.0, 15.0, 11.0, 7.0, 9.0, 11.0, 4.0, 2.0, 4.0, 1.0, 2.0, 3.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-6.4375, -6.229248046875, -6.02099609375, -5.812744140625, -5.6044921875, -5.396240234375, -5.18798828125, -4.979736328125, -4.771484375, -4.563232421875, -4.35498046875, -4.146728515625, -3.9384765625, -3.730224609375, -3.52197265625, -3.313720703125, -3.10546875, -2.897216796875, -2.68896484375, -2.480712890625, -2.2724609375, -2.064208984375, -1.85595703125, -1.647705078125, -1.439453125, -1.231201171875, -1.02294921875, -0.814697265625, -0.6064453125, -0.398193359375, -0.18994140625, 0.018310546875, 0.2265625, 0.434814453125, 0.64306640625, 0.851318359375, 1.0595703125, 1.267822265625, 1.47607421875, 1.684326171875, 1.892578125, 2.100830078125, 2.30908203125, 2.517333984375, 2.7255859375, 2.933837890625, 3.14208984375, 3.350341796875, 3.55859375, 3.766845703125, 3.97509765625, 4.183349609375, 4.3916015625, 4.599853515625, 4.80810546875, 5.016357421875, 5.224609375, 5.432861328125, 5.64111328125, 5.849365234375, 6.0576171875, 6.265869140625, 6.47412109375, 6.682373046875, 6.890625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 5.0, 9.0, 11.0, 12.0, 20.0, 30.0, 42.0, 69.0, 97.0, 143.0, 269.0, 578.0, 1257.0, 3236.0, 10550.0, 40918.0, 219564.0, 661394.0, 82879.0, 18673.0, 5155.0, 1889.0, 780.0, 388.0, 240.0, 125.0, 75.0, 58.0, 23.0, 22.0, 9.0, 15.0, 7.0, 7.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4990234375, -1.4564666748046875, -1.413909912109375, -1.3713531494140625, -1.32879638671875, -1.2862396240234375, -1.243682861328125, -1.2011260986328125, -1.1585693359375, -1.1160125732421875, -1.073455810546875, -1.0308990478515625, -0.98834228515625, -0.9457855224609375, -0.903228759765625, -0.8606719970703125, -0.818115234375, -0.7755584716796875, -0.733001708984375, -0.6904449462890625, -0.64788818359375, -0.6053314208984375, -0.562774658203125, -0.5202178955078125, -0.4776611328125, -0.4351043701171875, -0.392547607421875, -0.3499908447265625, -0.30743408203125, -0.2648773193359375, -0.222320556640625, -0.1797637939453125, -0.13720703125, -0.0946502685546875, -0.052093505859375, -0.0095367431640625, 0.03302001953125, 0.0755767822265625, 0.118133544921875, 0.1606903076171875, 0.2032470703125, 0.2458038330078125, 0.288360595703125, 0.3309173583984375, 0.37347412109375, 0.4160308837890625, 0.458587646484375, 0.5011444091796875, 0.543701171875, 0.5862579345703125, 0.628814697265625, 0.6713714599609375, 0.71392822265625, 0.7564849853515625, 0.799041748046875, 0.8415985107421875, 0.8841552734375, 0.9267120361328125, 0.969268798828125, 1.0118255615234375, 1.05438232421875, 1.0969390869140625, 1.139495849609375, 1.1820526123046875, 1.224609375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 4.0, 10.0, 13.0, 10.0, 14.0, 17.0, 24.0, 26.0, 40.0, 39.0, 66.0, 64.0, 89.0, 77.0, 82.0, 98.0, 77.0, 48.0, 49.0, 25.0, 35.0, 16.0, 12.0, 14.0, 8.0, 11.0, 4.0, 7.0, 5.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000293731689453125, -0.00028191879391670227, -0.00027010589838027954, -0.0002582930028438568, -0.0002464801073074341, -0.00023466721177101135, -0.00022285431623458862, -0.0002110414206981659, -0.00019922852516174316, -0.00018741562962532043, -0.0001756027340888977, -0.00016378983855247498, -0.00015197694301605225, -0.00014016404747962952, -0.0001283511519432068, -0.00011653825640678406, -0.00010472536087036133, -9.29124653339386e-05, -8.109956979751587e-05, -6.928667426109314e-05, -5.747377872467041e-05, -4.566088318824768e-05, -3.384798765182495e-05, -2.203509211540222e-05, -1.0222196578979492e-05, 1.5906989574432373e-06, 1.3403594493865967e-05, 2.5216490030288696e-05, 3.7029385566711426e-05, 4.8842281103134155e-05, 6.0655176639556885e-05, 7.246807217597961e-05, 8.428096771240234e-05, 9.609386324882507e-05, 0.0001079067587852478, 0.00011971965432167053, 0.00013153254985809326, 0.000143345445394516, 0.00015515834093093872, 0.00016697123646736145, 0.00017878413200378418, 0.0001905970275402069, 0.00020240992307662964, 0.00021422281861305237, 0.0002260357141494751, 0.00023784860968589783, 0.00024966150522232056, 0.0002614744007587433, 0.000273287296295166, 0.00028510019183158875, 0.0002969130873680115, 0.0003087259829044342, 0.00032053887844085693, 0.00033235177397727966, 0.0003441646695137024, 0.0003559775650501251, 0.00036779046058654785, 0.0003796033561229706, 0.0003914162516593933, 0.00040322914719581604, 0.00041504204273223877, 0.0004268549382686615, 0.00043866783380508423, 0.00045048072934150696, 0.0004622936248779297]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 6.0, 11.0, 14.0, 12.0, 26.0, 36.0, 64.0, 72.0, 131.0, 204.0, 328.0, 638.0, 1346.0, 3176.0, 9318.0, 33069.0, 156495.0, 682980.0, 120653.0, 26780.0, 7788.0, 2770.0, 1253.0, 602.0, 284.0, 167.0, 91.0, 77.0, 55.0, 40.0, 25.0, 7.0, 10.0, 8.0, 7.0, 4.0, 3.0, 5.0, 0.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.4345703125, -1.394073486328125, -1.35357666015625, -1.313079833984375, -1.2725830078125, -1.232086181640625, -1.19158935546875, -1.151092529296875, -1.110595703125, -1.070098876953125, -1.02960205078125, -0.989105224609375, -0.9486083984375, -0.908111572265625, -0.86761474609375, -0.827117919921875, -0.78662109375, -0.746124267578125, -0.70562744140625, -0.665130615234375, -0.6246337890625, -0.584136962890625, -0.54364013671875, -0.503143310546875, -0.462646484375, -0.422149658203125, -0.38165283203125, -0.341156005859375, -0.3006591796875, -0.260162353515625, -0.21966552734375, -0.179168701171875, -0.138671875, -0.098175048828125, -0.05767822265625, -0.017181396484375, 0.0233154296875, 0.063812255859375, 0.10430908203125, 0.144805908203125, 0.185302734375, 0.225799560546875, 0.26629638671875, 0.306793212890625, 0.3472900390625, 0.387786865234375, 0.42828369140625, 0.468780517578125, 0.50927734375, 0.549774169921875, 0.59027099609375, 0.630767822265625, 0.6712646484375, 0.711761474609375, 0.75225830078125, 0.792755126953125, 0.833251953125, 0.873748779296875, 0.91424560546875, 0.954742431640625, 0.9952392578125, 1.035736083984375, 1.07623291015625, 1.116729736328125, 1.1572265625]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 12.0, 8.0, 15.0, 12.0, 22.0, 24.0, 43.0, 40.0, 61.0, 94.0, 117.0, 104.0, 101.0, 88.0, 63.0, 52.0, 32.0, 27.0, 28.0, 10.0, 5.0, 8.0, 10.0, 4.0, 9.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3974609375, -1.3499755859375, -1.302490234375, -1.2550048828125, -1.20751953125, -1.1600341796875, -1.112548828125, -1.0650634765625, -1.017578125, -0.9700927734375, -0.922607421875, -0.8751220703125, -0.82763671875, -0.7801513671875, -0.732666015625, -0.6851806640625, -0.6376953125, -0.5902099609375, -0.542724609375, -0.4952392578125, -0.44775390625, -0.4002685546875, -0.352783203125, -0.3052978515625, -0.2578125, -0.2103271484375, -0.162841796875, -0.1153564453125, -0.06787109375, -0.0203857421875, 0.027099609375, 0.0745849609375, 0.1220703125, 0.1695556640625, 0.217041015625, 0.2645263671875, 0.31201171875, 0.3594970703125, 0.406982421875, 0.4544677734375, 0.501953125, 0.5494384765625, 0.596923828125, 0.6444091796875, 0.69189453125, 0.7393798828125, 0.786865234375, 0.8343505859375, 0.8818359375, 0.9293212890625, 0.976806640625, 1.0242919921875, 1.07177734375, 1.1192626953125, 1.166748046875, 1.2142333984375, 1.26171875, 1.3092041015625, 1.356689453125, 1.4041748046875, 1.45166015625, 1.4991455078125, 1.546630859375, 1.5941162109375, 1.6416015625]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 11.0, 19.0, 51.0, 154.0, 417.0, 202.0, 90.0, 38.0, 12.0, 3.0, 6.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.793182373046875, -34.68589782714844, -32.57861328125, -30.471332550048828, -28.36404800415039, -26.256763458251953, -24.14948081970215, -22.042198181152344, -19.934913635253906, -17.82762908935547, -15.720346450805664, -13.613062858581543, -11.505779266357422, -9.3984956741333, -7.29121208190918, -5.183928489685059, -3.0766448974609375, -0.9693613052368164, 1.1379222869873047, 3.245205879211426, 5.352489471435547, 7.459773063659668, 9.567056655883789, 11.67434024810791, 13.781623840332031, 15.888907432556152, 17.996191024780273, 20.103473663330078, 22.210758209228516, 24.318042755126953, 26.425325393676758, 28.532608032226562, 30.639892578125, 32.74717712402344, 34.854461669921875, 36.96174240112305, 39.069026947021484, 41.17631149291992, 43.283592224121094, 45.39087677001953, 47.49816131591797, 49.605445861816406, 51.712730407714844, 53.820011138916016, 55.92729568481445, 58.03458023071289, 60.14186096191406, 62.2491455078125, 64.35643005371094, 66.46371459960938, 68.57099914550781, 70.67828369140625, 72.78556823730469, 74.8928451538086, 77.00012969970703, 79.10741424560547, 81.2146987915039, 83.32198333740234, 85.42926788330078, 87.53655242919922, 89.64382934570312, 91.75111389160156, 93.8583984375, 95.96568298339844, 98.07296752929688]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 6.0, 4.0, 4.0, 5.0, 8.0, 11.0, 14.0, 13.0, 10.0, 25.0, 17.0, 17.0, 17.0, 20.0, 28.0, 32.0, 46.0, 42.0, 66.0, 104.0, 94.0, 67.0, 50.0, 32.0, 32.0, 33.0, 26.0, 21.0, 20.0, 23.0, 23.0, 13.0, 12.0, 12.0, 16.0, 17.0, 8.0, 5.0, 5.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0], "bins": [-31.447511672973633, -30.556249618530273, -29.664987564086914, -28.773725509643555, -27.882461547851562, -26.991199493408203, -26.099937438964844, -25.208675384521484, -24.317413330078125, -23.426151275634766, -22.534889221191406, -21.643627166748047, -20.752365112304688, -19.861103057861328, -18.969839096069336, -18.078577041625977, -17.187314987182617, -16.296052932739258, -15.404790878295898, -14.513527870178223, -13.622265815734863, -12.731003761291504, -11.839740753173828, -10.948478698730469, -10.05721664428711, -9.16595458984375, -8.27469253540039, -7.383429527282715, -6.4921674728393555, -5.600905418395996, -4.7096428871154785, -3.818380355834961, -2.9271163940429688, -2.0358541011810303, -1.1445918083190918, -0.2533295154571533, 0.6379327774047852, 1.5291948318481445, 2.420457363128662, 3.3117198944091797, 4.202981948852539, 5.094244003295898, 5.985506534576416, 6.876769065856934, 7.768031120300293, 8.659293174743652, 9.550556182861328, 10.441818237304688, 11.333080291748047, 12.224342346191406, 13.115604400634766, 14.006867408752441, 14.8981294631958, 15.78939151763916, 16.680654525756836, 17.571916580200195, 18.463178634643555, 19.354440689086914, 20.245702743530273, 21.136964797973633, 22.028228759765625, 22.919490814208984, 23.810752868652344, 24.702014923095703, 25.593276977539062]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 5.0, 3.0, 3.0, 11.0, 12.0, 13.0, 26.0, 33.0, 52.0, 84.0, 154.0, 265.0, 573.0, 1276.0, 3131.0, 9517.0, 41679.0, 393486.0, 2860709.0, 784722.0, 74952.0, 15611.0, 4813.0, 1728.0, 689.0, 337.0, 163.0, 93.0, 43.0, 36.0, 26.0, 17.0, 6.0, 4.0, 6.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.17578125, -4.0704345703125, -3.965087890625, -3.8597412109375, -3.75439453125, -3.6490478515625, -3.543701171875, -3.4383544921875, -3.3330078125, -3.2276611328125, -3.122314453125, -3.0169677734375, -2.91162109375, -2.8062744140625, -2.700927734375, -2.5955810546875, -2.490234375, -2.3848876953125, -2.279541015625, -2.1741943359375, -2.06884765625, -1.9635009765625, -1.858154296875, -1.7528076171875, -1.6474609375, -1.5421142578125, -1.436767578125, -1.3314208984375, -1.22607421875, -1.1207275390625, -1.015380859375, -0.9100341796875, -0.8046875, -0.6993408203125, -0.593994140625, -0.4886474609375, -0.38330078125, -0.2779541015625, -0.172607421875, -0.0672607421875, 0.0380859375, 0.1434326171875, 0.248779296875, 0.3541259765625, 0.45947265625, 0.5648193359375, 0.670166015625, 0.7755126953125, 0.880859375, 0.9862060546875, 1.091552734375, 1.1968994140625, 1.30224609375, 1.4075927734375, 1.512939453125, 1.6182861328125, 1.7236328125, 1.8289794921875, 1.934326171875, 2.0396728515625, 2.14501953125, 2.2503662109375, 2.355712890625, 2.4610595703125, 2.56640625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 4.0, 2.0, 10.0, 12.0, 9.0, 15.0, 18.0, 21.0, 26.0, 33.0, 50.0, 37.0, 45.0, 49.0, 44.0, 42.0, 48.0, 70.0, 59.0, 52.0, 49.0, 48.0, 37.0, 38.0, 40.0, 30.0, 25.0, 18.0, 17.0, 12.0, 13.0, 7.0, 5.0, 4.0, 2.0, 2.0, 5.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.669921875, -2.6013641357421875, -2.532806396484375, -2.4642486572265625, -2.39569091796875, -2.3271331787109375, -2.258575439453125, -2.1900177001953125, -2.1214599609375, -2.0529022216796875, -1.984344482421875, -1.9157867431640625, -1.84722900390625, -1.7786712646484375, -1.710113525390625, -1.6415557861328125, -1.572998046875, -1.5044403076171875, -1.435882568359375, -1.3673248291015625, -1.29876708984375, -1.2302093505859375, -1.161651611328125, -1.0930938720703125, -1.0245361328125, -0.9559783935546875, -0.887420654296875, -0.8188629150390625, -0.75030517578125, -0.6817474365234375, -0.613189697265625, -0.5446319580078125, -0.47607421875, -0.4075164794921875, -0.338958740234375, -0.2704010009765625, -0.20184326171875, -0.1332855224609375, -0.064727783203125, 0.0038299560546875, 0.0723876953125, 0.1409454345703125, 0.209503173828125, 0.2780609130859375, 0.34661865234375, 0.4151763916015625, 0.483734130859375, 0.5522918701171875, 0.620849609375, 0.6894073486328125, 0.757965087890625, 0.8265228271484375, 0.89508056640625, 0.9636383056640625, 1.032196044921875, 1.1007537841796875, 1.1693115234375, 1.2378692626953125, 1.306427001953125, 1.3749847412109375, 1.44354248046875, 1.5121002197265625, 1.580657958984375, 1.6492156982421875, 1.7177734375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 2.0, 1.0, 4.0, 2.0, 5.0, 15.0, 17.0, 34.0, 67.0, 99.0, 182.0, 469.0, 1486.0, 10113.0, 1423508.0, 2743348.0, 12301.0, 1658.0, 545.0, 196.0, 109.0, 52.0, 29.0, 16.0, 8.0, 7.0, 6.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.890625, -9.537841796875, -9.18505859375, -8.832275390625, -8.4794921875, -8.126708984375, -7.77392578125, -7.421142578125, -7.068359375, -6.715576171875, -6.36279296875, -6.010009765625, -5.6572265625, -5.304443359375, -4.95166015625, -4.598876953125, -4.24609375, -3.893310546875, -3.54052734375, -3.187744140625, -2.8349609375, -2.482177734375, -2.12939453125, -1.776611328125, -1.423828125, -1.071044921875, -0.71826171875, -0.365478515625, -0.0126953125, 0.340087890625, 0.69287109375, 1.045654296875, 1.3984375, 1.751220703125, 2.10400390625, 2.456787109375, 2.8095703125, 3.162353515625, 3.51513671875, 3.867919921875, 4.220703125, 4.573486328125, 4.92626953125, 5.279052734375, 5.6318359375, 5.984619140625, 6.33740234375, 6.690185546875, 7.04296875, 7.395751953125, 7.74853515625, 8.101318359375, 8.4541015625, 8.806884765625, 9.15966796875, 9.512451171875, 9.865234375, 10.218017578125, 10.57080078125, 10.923583984375, 11.2763671875, 11.629150390625, 11.98193359375, 12.334716796875, 12.6875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 9.0, 3.0, 10.0, 9.0, 12.0, 21.0, 33.0, 55.0, 106.0, 195.0, 457.0, 988.0, 1101.0, 545.0, 251.0, 128.0, 43.0, 41.0, 28.0, 11.0, 10.0, 10.0, 7.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-8.96875, -8.75567626953125, -8.5426025390625, -8.32952880859375, -8.116455078125, -7.90338134765625, -7.6903076171875, -7.47723388671875, -7.26416015625, -7.05108642578125, -6.8380126953125, -6.62493896484375, -6.411865234375, -6.19879150390625, -5.9857177734375, -5.77264404296875, -5.5595703125, -5.34649658203125, -5.1334228515625, -4.92034912109375, -4.707275390625, -4.49420166015625, -4.2811279296875, -4.06805419921875, -3.85498046875, -3.64190673828125, -3.4288330078125, -3.21575927734375, -3.002685546875, -2.78961181640625, -2.5765380859375, -2.36346435546875, -2.150390625, -1.93731689453125, -1.7242431640625, -1.51116943359375, -1.298095703125, -1.08502197265625, -0.8719482421875, -0.65887451171875, -0.44580078125, -0.23272705078125, -0.0196533203125, 0.19342041015625, 0.406494140625, 0.61956787109375, 0.8326416015625, 1.04571533203125, 1.2587890625, 1.47186279296875, 1.6849365234375, 1.89801025390625, 2.111083984375, 2.32415771484375, 2.5372314453125, 2.75030517578125, 2.96337890625, 3.17645263671875, 3.3895263671875, 3.60260009765625, 3.815673828125, 4.02874755859375, 4.2418212890625, 4.45489501953125, 4.66796875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 9.0, 14.0, 27.0, 50.0, 102.0, 206.0, 241.0, 183.0, 86.0, 35.0, 20.0, 9.0, 7.0, 2.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.060401916503906, -34.367637634277344, -32.67487716674805, -30.982112884521484, -29.289350509643555, -27.596588134765625, -25.903823852539062, -24.211061477661133, -22.518299102783203, -20.825536727905273, -19.13277244567871, -17.44001007080078, -15.747247695922852, -14.054484367370605, -12.36172103881836, -10.66895866394043, -8.976194381713867, -7.283431529998779, -5.590668678283691, -3.8979053497314453, -2.2051424980163574, -0.5123796463012695, 1.1803836822509766, 2.8731460571289062, 4.565909385681152, 6.25867223739624, 7.951435089111328, 9.644198417663574, 11.33696174621582, 13.02972412109375, 14.722487449645996, 16.41524887084961, 18.108013153076172, 19.8007755279541, 21.493539810180664, 23.186302185058594, 24.879064559936523, 26.571826934814453, 28.264591217041016, 29.957353591918945, 31.650115966796875, 33.34288024902344, 35.035640716552734, 36.7284049987793, 38.42116928100586, 40.113929748535156, 41.80669403076172, 43.49945831298828, 45.192222595214844, 46.884986877441406, 48.5777473449707, 50.270511627197266, 51.96327590942383, 53.656036376953125, 55.34880065917969, 57.04156494140625, 58.73432540893555, 60.42708969116211, 62.119850158691406, 63.81261444091797, 65.50537872314453, 67.1981430053711, 68.89089965820312, 70.58366394042969, 72.27642822265625]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 5.0, 4.0, 7.0, 9.0, 14.0, 15.0, 14.0, 17.0, 22.0, 24.0, 21.0, 27.0, 44.0, 39.0, 46.0, 55.0, 68.0, 54.0, 38.0, 43.0, 46.0, 51.0, 55.0, 49.0, 43.0, 28.0, 24.0, 17.0, 21.0, 19.0, 18.0, 18.0, 12.0, 10.0, 3.0, 6.0, 6.0, 3.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.67736053466797, -21.046173095703125, -20.41498565673828, -19.783798217773438, -19.152610778808594, -18.52142333984375, -17.890235900878906, -17.259050369262695, -16.62786293029785, -15.996675491333008, -15.365488052368164, -14.73430061340332, -14.103114128112793, -13.47192668914795, -12.840739250183105, -12.209552764892578, -11.578364372253418, -10.947176933288574, -10.31598949432373, -9.684803009033203, -9.05361557006836, -8.422428131103516, -7.791240692138672, -7.160053730010986, -6.528866291046143, -5.897678852081299, -5.266491889953613, -4.6353044509887695, -4.004117012023926, -3.3729300498962402, -2.7417426109313965, -2.110555648803711, -1.4793682098388672, -0.8481809496879578, -0.21699368953704834, 0.41419363021850586, 1.0453808307647705, 1.6765680313110352, 2.307755470275879, 2.9389424324035645, 3.570129871368408, 4.201317310333252, 4.8325042724609375, 5.463691711425781, 6.094879150390625, 6.7260661125183105, 7.357253551483154, 7.98844051361084, 8.619627952575684, 9.250815391540527, 9.882002830505371, 10.513189315795898, 11.144376754760742, 11.775564193725586, 12.40675163269043, 13.037939071655273, 13.669126510620117, 14.300313949584961, 14.931501388549805, 15.562688827514648, 16.193876266479492, 16.825061798095703, 17.456249237060547, 18.08743667602539, 18.718624114990234]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 9.0, 7.0, 17.0, 16.0, 28.0, 39.0, 87.0, 119.0, 163.0, 294.0, 610.0, 1132.0, 2327.0, 5475.0, 13610.0, 39737.0, 140063.0, 476652.0, 262550.0, 69019.0, 21739.0, 8170.0, 3336.0, 1555.0, 789.0, 446.0, 209.0, 120.0, 86.0, 57.0, 23.0, 18.0, 16.0, 11.0, 7.0, 6.0, 8.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.07421875, -4.9281005859375, -4.781982421875, -4.6358642578125, -4.48974609375, -4.3436279296875, -4.197509765625, -4.0513916015625, -3.9052734375, -3.7591552734375, -3.613037109375, -3.4669189453125, -3.32080078125, -3.1746826171875, -3.028564453125, -2.8824462890625, -2.736328125, -2.5902099609375, -2.444091796875, -2.2979736328125, -2.15185546875, -2.0057373046875, -1.859619140625, -1.7135009765625, -1.5673828125, -1.4212646484375, -1.275146484375, -1.1290283203125, -0.98291015625, -0.8367919921875, -0.690673828125, -0.5445556640625, -0.3984375, -0.2523193359375, -0.106201171875, 0.0399169921875, 0.18603515625, 0.3321533203125, 0.478271484375, 0.6243896484375, 0.7705078125, 0.9166259765625, 1.062744140625, 1.2088623046875, 1.35498046875, 1.5010986328125, 1.647216796875, 1.7933349609375, 1.939453125, 2.0855712890625, 2.231689453125, 2.3778076171875, 2.52392578125, 2.6700439453125, 2.816162109375, 2.9622802734375, 3.1083984375, 3.2545166015625, 3.400634765625, 3.5467529296875, 3.69287109375, 3.8389892578125, 3.985107421875, 4.1312255859375, 4.27734375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 1.0, 4.0, 2.0, 11.0, 7.0, 8.0, 22.0, 23.0, 19.0, 30.0, 43.0, 34.0, 46.0, 33.0, 43.0, 46.0, 57.0, 41.0, 56.0, 71.0, 53.0, 47.0, 44.0, 49.0, 39.0, 39.0, 25.0, 29.0, 18.0, 12.0, 10.0, 9.0, 6.0, 6.0, 6.0, 3.0, 6.0, 3.0, 3.0, 0.0, 2.0, 2.0], "bins": [-2.947265625, -2.8737030029296875, -2.800140380859375, -2.7265777587890625, -2.65301513671875, -2.5794525146484375, -2.505889892578125, -2.4323272705078125, -2.3587646484375, -2.2852020263671875, -2.211639404296875, -2.1380767822265625, -2.06451416015625, -1.9909515380859375, -1.917388916015625, -1.8438262939453125, -1.770263671875, -1.6967010498046875, -1.623138427734375, -1.5495758056640625, -1.47601318359375, -1.4024505615234375, -1.328887939453125, -1.2553253173828125, -1.1817626953125, -1.1082000732421875, -1.034637451171875, -0.9610748291015625, -0.88751220703125, -0.8139495849609375, -0.740386962890625, -0.6668243408203125, -0.59326171875, -0.5196990966796875, -0.446136474609375, -0.3725738525390625, -0.29901123046875, -0.2254486083984375, -0.151885986328125, -0.0783233642578125, -0.0047607421875, 0.0688018798828125, 0.142364501953125, 0.2159271240234375, 0.28948974609375, 0.3630523681640625, 0.436614990234375, 0.5101776123046875, 0.583740234375, 0.6573028564453125, 0.730865478515625, 0.8044281005859375, 0.87799072265625, 0.9515533447265625, 1.025115966796875, 1.0986785888671875, 1.1722412109375, 1.2458038330078125, 1.319366455078125, 1.3929290771484375, 1.46649169921875, 1.5400543212890625, 1.613616943359375, 1.6871795654296875, 1.7607421875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 7.0, 6.0, 5.0, 12.0, 11.0, 21.0, 21.0, 22.0, 46.0, 52.0, 114.0, 153.0, 280.0, 475.0, 909.0, 2020.0, 6633.0, 50993.0, 841448.0, 127707.0, 12193.0, 2855.0, 1138.0, 597.0, 320.0, 193.0, 107.0, 75.0, 38.0, 35.0, 23.0, 15.0, 6.0, 7.0, 4.0, 7.0, 5.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.2890625, -8.02734375, -7.765625, -7.50390625, -7.2421875, -6.98046875, -6.71875, -6.45703125, -6.1953125, -5.93359375, -5.671875, -5.41015625, -5.1484375, -4.88671875, -4.625, -4.36328125, -4.1015625, -3.83984375, -3.578125, -3.31640625, -3.0546875, -2.79296875, -2.53125, -2.26953125, -2.0078125, -1.74609375, -1.484375, -1.22265625, -0.9609375, -0.69921875, -0.4375, -0.17578125, 0.0859375, 0.34765625, 0.609375, 0.87109375, 1.1328125, 1.39453125, 1.65625, 1.91796875, 2.1796875, 2.44140625, 2.703125, 2.96484375, 3.2265625, 3.48828125, 3.75, 4.01171875, 4.2734375, 4.53515625, 4.796875, 5.05859375, 5.3203125, 5.58203125, 5.84375, 6.10546875, 6.3671875, 6.62890625, 6.890625, 7.15234375, 7.4140625, 7.67578125, 7.9375, 8.19921875, 8.4609375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 7.0, 6.0, 9.0, 19.0, 16.0, 34.0, 29.0, 36.0, 41.0, 56.0, 40.0, 54.0, 69.0, 85.0, 90.0, 74.0, 54.0, 59.0, 43.0, 45.0, 34.0, 21.0, 25.0, 19.0, 16.0, 6.0, 3.0, 7.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-11.9765625, -11.66839599609375, -11.3602294921875, -11.05206298828125, -10.743896484375, -10.43572998046875, -10.1275634765625, -9.81939697265625, -9.51123046875, -9.20306396484375, -8.8948974609375, -8.58673095703125, -8.278564453125, -7.97039794921875, -7.6622314453125, -7.35406494140625, -7.0458984375, -6.73773193359375, -6.4295654296875, -6.12139892578125, -5.813232421875, -5.50506591796875, -5.1968994140625, -4.88873291015625, -4.58056640625, -4.27239990234375, -3.9642333984375, -3.65606689453125, -3.347900390625, -3.03973388671875, -2.7315673828125, -2.42340087890625, -2.115234375, -1.80706787109375, -1.4989013671875, -1.19073486328125, -0.882568359375, -0.57440185546875, -0.2662353515625, 0.04193115234375, 0.35009765625, 0.65826416015625, 0.9664306640625, 1.27459716796875, 1.582763671875, 1.89093017578125, 2.1990966796875, 2.50726318359375, 2.8154296875, 3.12359619140625, 3.4317626953125, 3.73992919921875, 4.048095703125, 4.35626220703125, 4.6644287109375, 4.97259521484375, 5.28076171875, 5.58892822265625, 5.8970947265625, 6.20526123046875, 6.513427734375, 6.82159423828125, 7.1297607421875, 7.43792724609375, 7.74609375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 4.0, 9.0, 7.0, 17.0, 14.0, 19.0, 35.0, 44.0, 87.0, 134.0, 261.0, 604.0, 1600.0, 5242.0, 24739.0, 253499.0, 714588.0, 37295.0, 6948.0, 2002.0, 728.0, 288.0, 147.0, 84.0, 49.0, 30.0, 17.0, 18.0, 7.0, 9.0, 5.0, 10.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.533203125, -2.464935302734375, -2.39666748046875, -2.328399658203125, -2.2601318359375, -2.191864013671875, -2.12359619140625, -2.055328369140625, -1.987060546875, -1.918792724609375, -1.85052490234375, -1.782257080078125, -1.7139892578125, -1.645721435546875, -1.57745361328125, -1.509185791015625, -1.44091796875, -1.372650146484375, -1.30438232421875, -1.236114501953125, -1.1678466796875, -1.099578857421875, -1.03131103515625, -0.963043212890625, -0.894775390625, -0.826507568359375, -0.75823974609375, -0.689971923828125, -0.6217041015625, -0.553436279296875, -0.48516845703125, -0.416900634765625, -0.3486328125, -0.280364990234375, -0.21209716796875, -0.143829345703125, -0.0755615234375, -0.007293701171875, 0.06097412109375, 0.129241943359375, 0.197509765625, 0.265777587890625, 0.33404541015625, 0.402313232421875, 0.4705810546875, 0.538848876953125, 0.60711669921875, 0.675384521484375, 0.74365234375, 0.811920166015625, 0.88018798828125, 0.948455810546875, 1.0167236328125, 1.084991455078125, 1.15325927734375, 1.221527099609375, 1.289794921875, 1.358062744140625, 1.42633056640625, 1.494598388671875, 1.5628662109375, 1.631134033203125, 1.69940185546875, 1.767669677734375, 1.8359375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 6.0, 7.0, 3.0, 5.0, 7.0, 12.0, 6.0, 13.0, 9.0, 14.0, 11.0, 19.0, 26.0, 38.0, 34.0, 45.0, 65.0, 78.0, 87.0, 105.0, 82.0, 63.0, 35.0, 39.0, 33.0, 25.0, 26.0, 24.0, 21.0, 9.0, 14.0, 10.0, 8.0, 5.0, 7.0, 2.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0004477500915527344, -0.00043338537216186523, -0.0004190206527709961, -0.00040465593338012695, -0.0003902912139892578, -0.00037592649459838867, -0.00036156177520751953, -0.0003471970558166504, -0.00033283233642578125, -0.0003184676170349121, -0.00030410289764404297, -0.00028973817825317383, -0.0002753734588623047, -0.00026100873947143555, -0.0002466440200805664, -0.00023227930068969727, -0.00021791458129882812, -0.00020354986190795898, -0.00018918514251708984, -0.0001748204231262207, -0.00016045570373535156, -0.00014609098434448242, -0.00013172626495361328, -0.00011736154556274414, -0.000102996826171875, -8.863210678100586e-05, -7.426738739013672e-05, -5.990266799926758e-05, -4.553794860839844e-05, -3.11732292175293e-05, -1.6808509826660156e-05, -2.4437904357910156e-06, 1.1920928955078125e-05, 2.6285648345947266e-05, 4.0650367736816406e-05, 5.501508712768555e-05, 6.937980651855469e-05, 8.374452590942383e-05, 9.810924530029297e-05, 0.00011247396469116211, 0.00012683868408203125, 0.0001412034034729004, 0.00015556812286376953, 0.00016993284225463867, 0.0001842975616455078, 0.00019866228103637695, 0.0002130270004272461, 0.00022739171981811523, 0.00024175643920898438, 0.0002561211585998535, 0.00027048587799072266, 0.0002848505973815918, 0.00029921531677246094, 0.0003135800361633301, 0.0003279447555541992, 0.00034230947494506836, 0.0003566741943359375, 0.00037103891372680664, 0.0003854036331176758, 0.0003997683525085449, 0.00041413307189941406, 0.0004284977912902832, 0.00044286251068115234, 0.0004572272300720215, 0.0004715919494628906]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 5.0, 5.0, 8.0, 5.0, 10.0, 20.0, 19.0, 24.0, 61.0, 69.0, 110.0, 240.0, 488.0, 1052.0, 2912.0, 11142.0, 78724.0, 827970.0, 106455.0, 13546.0, 3359.0, 1182.0, 502.0, 279.0, 148.0, 76.0, 56.0, 25.0, 27.0, 14.0, 9.0, 9.0, 3.0, 4.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.12109375, -2.057891845703125, -1.99468994140625, -1.931488037109375, -1.8682861328125, -1.805084228515625, -1.74188232421875, -1.678680419921875, -1.615478515625, -1.552276611328125, -1.48907470703125, -1.425872802734375, -1.3626708984375, -1.299468994140625, -1.23626708984375, -1.173065185546875, -1.10986328125, -1.046661376953125, -0.98345947265625, -0.920257568359375, -0.8570556640625, -0.793853759765625, -0.73065185546875, -0.667449951171875, -0.604248046875, -0.541046142578125, -0.47784423828125, -0.414642333984375, -0.3514404296875, -0.288238525390625, -0.22503662109375, -0.161834716796875, -0.0986328125, -0.035430908203125, 0.02777099609375, 0.090972900390625, 0.1541748046875, 0.217376708984375, 0.28057861328125, 0.343780517578125, 0.406982421875, 0.470184326171875, 0.53338623046875, 0.596588134765625, 0.6597900390625, 0.722991943359375, 0.78619384765625, 0.849395751953125, 0.91259765625, 0.975799560546875, 1.03900146484375, 1.102203369140625, 1.1654052734375, 1.228607177734375, 1.29180908203125, 1.355010986328125, 1.418212890625, 1.481414794921875, 1.54461669921875, 1.607818603515625, 1.6710205078125, 1.734222412109375, 1.79742431640625, 1.860626220703125, 1.923828125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 8.0, 9.0, 2.0, 5.0, 7.0, 15.0, 14.0, 19.0, 18.0, 23.0, 25.0, 36.0, 32.0, 48.0, 62.0, 60.0, 65.0, 71.0, 81.0, 59.0, 67.0, 44.0, 37.0, 30.0, 30.0, 21.0, 17.0, 19.0, 12.0, 15.0, 6.0, 7.0, 5.0, 8.0, 4.0, 8.0, 1.0, 2.0, 3.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.97705078125, -0.9403915405273438, -0.9037322998046875, -0.8670730590820312, -0.830413818359375, -0.7937545776367188, -0.7570953369140625, -0.7204360961914062, -0.68377685546875, -0.6471176147460938, -0.6104583740234375, -0.5737991333007812, -0.537139892578125, -0.5004806518554688, -0.4638214111328125, -0.42716217041015625, -0.3905029296875, -0.35384368896484375, -0.3171844482421875, -0.28052520751953125, -0.243865966796875, -0.20720672607421875, -0.1705474853515625, -0.13388824462890625, -0.09722900390625, -0.06056976318359375, -0.0239105224609375, 0.01274871826171875, 0.049407958984375, 0.08606719970703125, 0.1227264404296875, 0.15938568115234375, 0.196044921875, 0.23270416259765625, 0.2693634033203125, 0.30602264404296875, 0.342681884765625, 0.37934112548828125, 0.4160003662109375, 0.45265960693359375, 0.48931884765625, 0.5259780883789062, 0.5626373291015625, 0.5992965698242188, 0.635955810546875, 0.6726150512695312, 0.7092742919921875, 0.7459335327148438, 0.7825927734375, 0.8192520141601562, 0.8559112548828125, 0.8925704956054688, 0.929229736328125, 0.9658889770507812, 1.0025482177734375, 1.0392074584960938, 1.07586669921875, 1.1125259399414062, 1.1491851806640625, 1.1858444213867188, 1.222503662109375, 1.2591629028320312, 1.2958221435546875, 1.3324813842773438, 1.369140625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 5.0, 20.0, 18.0, 25.0, 70.0, 104.0, 272.0, 232.0, 104.0, 52.0, 35.0, 21.0, 17.0, 9.0, 5.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-51.20669937133789, -49.92448425292969, -48.642269134521484, -47.36005401611328, -46.07783889770508, -44.795623779296875, -43.51340866088867, -42.23119354248047, -40.948978424072266, -39.66676330566406, -38.38454818725586, -37.102333068847656, -35.82011795043945, -34.53790283203125, -33.25568771362305, -31.973472595214844, -30.691259384155273, -29.40904426574707, -28.126829147338867, -26.844614028930664, -25.56239891052246, -24.280183792114258, -22.997970581054688, -21.715755462646484, -20.43354034423828, -19.151325225830078, -17.869110107421875, -16.586894989013672, -15.304679870605469, -14.022464752197266, -12.740250587463379, -11.458035469055176, -10.175817489624023, -8.89360237121582, -7.611387252807617, -6.329172611236572, -5.046957492828369, -3.764742374420166, -2.482527732849121, -1.200312614440918, 0.08190250396728516, 1.3641175031661987, 2.6463325023651123, 3.9285473823547363, 5.2107625007629395, 6.492977619171143, 7.7751922607421875, 9.05740737915039, 10.339622497558594, 11.621837615966797, 12.904052734375, 14.186267852783203, 15.468482971191406, 16.75069808959961, 18.032913208007812, 19.315128326416016, 20.59734344482422, 21.879558563232422, 23.161773681640625, 24.443988800048828, 25.72620391845703, 27.008419036865234, 28.290634155273438, 29.57284927368164, 30.85506248474121]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 1.0, 2.0, 4.0, 6.0, 8.0, 7.0, 9.0, 11.0, 8.0, 13.0, 14.0, 23.0, 24.0, 24.0, 28.0, 28.0, 37.0, 49.0, 76.0, 126.0, 132.0, 65.0, 43.0, 28.0, 36.0, 23.0, 30.0, 22.0, 19.0, 17.0, 13.0, 21.0, 9.0, 9.0, 9.0, 10.0, 7.0, 4.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.73331642150879, -24.840646743774414, -23.947975158691406, -23.05530548095703, -22.162633895874023, -21.26996421813965, -20.37729263305664, -19.484622955322266, -18.59195327758789, -17.699283599853516, -16.806612014770508, -15.913942337036133, -15.021270751953125, -14.12860107421875, -13.235930442810059, -12.343259811401367, -11.45058822631836, -10.557917594909668, -9.665246963500977, -8.772577285766602, -7.879906177520752, -6.9872355461120605, -6.094565391540527, -5.201894760131836, -4.3092241287231445, -3.416553497314453, -2.523883104324341, -1.6312127113342285, -0.7385420799255371, 0.1541285514831543, 1.0467987060546875, 1.939469337463379, 2.8321380615234375, 3.724808692932129, 4.61747932434082, 5.5101494789123535, 6.402820110321045, 7.295490741729736, 8.18816089630127, 9.080831527709961, 9.973502159118652, 10.866172790527344, 11.758843421936035, 12.651514053344727, 13.544183731079102, 14.43685531616211, 15.329524993896484, 16.22219467163086, 17.114866256713867, 18.007535934448242, 18.90020751953125, 19.792877197265625, 20.685548782348633, 21.578218460083008, 22.470890045166016, 23.36355972290039, 24.256229400634766, 25.14889907836914, 26.04157066345215, 26.934240341186523, 27.82691192626953, 28.719581604003906, 29.61225128173828, 30.50492286682129, 31.397594451904297]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 4.0, 5.0, 6.0, 9.0, 11.0, 9.0, 14.0, 27.0, 32.0, 43.0, 66.0, 75.0, 109.0, 182.0, 261.0, 469.0, 759.0, 1295.0, 2523.0, 4895.0, 10547.0, 26719.0, 93146.0, 445703.0, 1781671.0, 1390467.0, 317576.0, 73327.0, 25343.0, 9511.0, 4332.0, 2131.0, 1175.0, 731.0, 432.0, 255.0, 151.0, 116.0, 56.0, 41.0, 28.0, 15.0, 7.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0], "bins": [-3.765625, -3.6688232421875, -3.572021484375, -3.4752197265625, -3.37841796875, -3.2816162109375, -3.184814453125, -3.0880126953125, -2.9912109375, -2.8944091796875, -2.797607421875, -2.7008056640625, -2.60400390625, -2.5072021484375, -2.410400390625, -2.3135986328125, -2.216796875, -2.1199951171875, -2.023193359375, -1.9263916015625, -1.82958984375, -1.7327880859375, -1.635986328125, -1.5391845703125, -1.4423828125, -1.3455810546875, -1.248779296875, -1.1519775390625, -1.05517578125, -0.9583740234375, -0.861572265625, -0.7647705078125, -0.66796875, -0.5711669921875, -0.474365234375, -0.3775634765625, -0.28076171875, -0.1839599609375, -0.087158203125, 0.0096435546875, 0.1064453125, 0.2032470703125, 0.300048828125, 0.3968505859375, 0.49365234375, 0.5904541015625, 0.687255859375, 0.7840576171875, 0.880859375, 0.9776611328125, 1.074462890625, 1.1712646484375, 1.26806640625, 1.3648681640625, 1.461669921875, 1.5584716796875, 1.6552734375, 1.7520751953125, 1.848876953125, 1.9456787109375, 2.04248046875, 2.1392822265625, 2.236083984375, 2.3328857421875, 2.4296875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 0.0, 4.0, 1.0, 7.0, 9.0, 11.0, 13.0, 12.0, 29.0, 31.0, 36.0, 36.0, 31.0, 41.0, 34.0, 70.0, 52.0, 46.0, 64.0, 57.0, 70.0, 55.0, 47.0, 53.0, 35.0, 44.0, 27.0, 12.0, 12.0, 17.0, 14.0, 8.0, 9.0, 5.0, 6.0, 7.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.958984375, -2.88543701171875, -2.8118896484375, -2.73834228515625, -2.664794921875, -2.59124755859375, -2.5177001953125, -2.44415283203125, -2.37060546875, -2.29705810546875, -2.2235107421875, -2.14996337890625, -2.076416015625, -2.00286865234375, -1.9293212890625, -1.85577392578125, -1.7822265625, -1.70867919921875, -1.6351318359375, -1.56158447265625, -1.488037109375, -1.41448974609375, -1.3409423828125, -1.26739501953125, -1.19384765625, -1.12030029296875, -1.0467529296875, -0.97320556640625, -0.899658203125, -0.82611083984375, -0.7525634765625, -0.67901611328125, -0.60546875, -0.53192138671875, -0.4583740234375, -0.38482666015625, -0.311279296875, -0.23773193359375, -0.1641845703125, -0.09063720703125, -0.01708984375, 0.05645751953125, 0.1300048828125, 0.20355224609375, 0.277099609375, 0.35064697265625, 0.4241943359375, 0.49774169921875, 0.5712890625, 0.64483642578125, 0.7183837890625, 0.79193115234375, 0.865478515625, 0.93902587890625, 1.0125732421875, 1.08612060546875, 1.15966796875, 1.23321533203125, 1.3067626953125, 1.38031005859375, 1.453857421875, 1.52740478515625, 1.6009521484375, 1.67449951171875, 1.748046875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 8.0, 12.0, 13.0, 38.0, 85.0, 212.0, 560.0, 2919.0, 2737201.0, 1450188.0, 2287.0, 462.0, 167.0, 62.0, 32.0, 16.0, 9.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.171875, -30.016845703125, -28.86181640625, -27.706787109375, -26.5517578125, -25.396728515625, -24.24169921875, -23.086669921875, -21.931640625, -20.776611328125, -19.62158203125, -18.466552734375, -17.3115234375, -16.156494140625, -15.00146484375, -13.846435546875, -12.69140625, -11.536376953125, -10.38134765625, -9.226318359375, -8.0712890625, -6.916259765625, -5.76123046875, -4.606201171875, -3.451171875, -2.296142578125, -1.14111328125, 0.013916015625, 1.1689453125, 2.323974609375, 3.47900390625, 4.634033203125, 5.7890625, 6.944091796875, 8.09912109375, 9.254150390625, 10.4091796875, 11.564208984375, 12.71923828125, 13.874267578125, 15.029296875, 16.184326171875, 17.33935546875, 18.494384765625, 19.6494140625, 20.804443359375, 21.95947265625, 23.114501953125, 24.26953125, 25.424560546875, 26.57958984375, 27.734619140625, 28.8896484375, 30.044677734375, 31.19970703125, 32.354736328125, 33.509765625, 34.664794921875, 35.81982421875, 36.974853515625, 38.1298828125, 39.284912109375, 40.43994140625, 41.594970703125, 42.75]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 11.0, 6.0, 18.0, 18.0, 41.0, 59.0, 106.0, 210.0, 419.0, 1060.0, 1225.0, 490.0, 221.0, 98.0, 44.0, 32.0, 10.0, 8.0, 4.0, 0.0, 2.0, 1.0, 1.0], "bins": [-23.875, -23.40771484375, -22.9404296875, -22.47314453125, -22.005859375, -21.53857421875, -21.0712890625, -20.60400390625, -20.13671875, -19.66943359375, -19.2021484375, -18.73486328125, -18.267578125, -17.80029296875, -17.3330078125, -16.86572265625, -16.3984375, -15.93115234375, -15.4638671875, -14.99658203125, -14.529296875, -14.06201171875, -13.5947265625, -13.12744140625, -12.66015625, -12.19287109375, -11.7255859375, -11.25830078125, -10.791015625, -10.32373046875, -9.8564453125, -9.38916015625, -8.921875, -8.45458984375, -7.9873046875, -7.52001953125, -7.052734375, -6.58544921875, -6.1181640625, -5.65087890625, -5.18359375, -4.71630859375, -4.2490234375, -3.78173828125, -3.314453125, -2.84716796875, -2.3798828125, -1.91259765625, -1.4453125, -0.97802734375, -0.5107421875, -0.04345703125, 0.423828125, 0.89111328125, 1.3583984375, 1.82568359375, 2.29296875, 2.76025390625, 3.2275390625, 3.69482421875, 4.162109375, 4.62939453125, 5.0966796875, 5.56396484375, 6.03125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 0.0, 0.0, 4.0, 8.0, 9.0, 20.0, 35.0, 110.0, 415.0, 319.0, 64.0, 13.0, 9.0, 3.0, 2.0, 2.0], "bins": [-436.5189208984375, -428.8507080078125, -421.1825256347656, -413.5143127441406, -405.84613037109375, -398.17791748046875, -390.5097351074219, -382.8415222167969, -375.17333984375, -367.505126953125, -359.8369445800781, -352.1687316894531, -344.50054931640625, -336.83233642578125, -329.1641540527344, -321.4959411621094, -313.8277282714844, -306.1595153808594, -298.4913330078125, -290.8231201171875, -283.1549377441406, -275.4867248535156, -267.81854248046875, -260.15032958984375, -252.4821319580078, -244.81393432617188, -237.14573669433594, -229.4775390625, -221.809326171875, -214.14114379882812, -206.47293090820312, -198.8047332763672, -191.13653564453125, -183.4683380126953, -175.80014038085938, -168.13194274902344, -160.4637451171875, -152.7955322265625, -145.12733459472656, -137.45913696289062, -129.7909393310547, -122.12274169921875, -114.45454406738281, -106.78633880615234, -99.1181411743164, -91.44994354248047, -83.78173828125, -76.11354064941406, -68.44534301757812, -60.77714538574219, -53.108943939208984, -45.44074249267578, -37.772544860839844, -30.104347229003906, -22.436145782470703, -14.7679443359375, -7.099750518798828, 0.5684490203857422, 8.236648559570312, 15.904848098754883, 23.573047637939453, 31.24124526977539, 38.909446716308594, 46.5776481628418, 54.245845794677734]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 10.0, 5.0, 15.0, 21.0, 28.0, 38.0, 50.0, 61.0, 91.0, 112.0, 102.0, 78.0, 92.0, 78.0, 69.0, 41.0, 30.0, 22.0, 15.0, 11.0, 5.0, 4.0, 5.0, 2.0, 4.0, 6.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-98.37156677246094, -95.3665542602539, -92.36154174804688, -89.35652160644531, -86.35150909423828, -83.34649658203125, -80.34148406982422, -77.33647155761719, -74.33145141601562, -71.3264389038086, -68.32142639160156, -65.31640625, -62.31139373779297, -59.30638122558594, -56.301368713378906, -53.296356201171875, -50.291343688964844, -47.28633117675781, -44.281314849853516, -41.276302337646484, -38.27128601074219, -35.266273498535156, -32.261260986328125, -29.25624656677246, -26.251232147216797, -23.246217727661133, -20.24120330810547, -17.236190795898438, -14.231176376342773, -11.22616195678711, -8.221149444580078, -5.216135025024414, -2.21112060546875, 0.7938933372497559, 3.7989072799682617, 6.803920745849609, 9.808935165405273, 12.813949584960938, 15.818962097167969, 18.823976516723633, 21.828990936279297, 24.83400535583496, 27.839019775390625, 30.844032287597656, 33.84904479980469, 36.854061126708984, 39.859073638916016, 42.86408996582031, 45.869102478027344, 48.874114990234375, 51.87913131713867, 54.8841438293457, 57.88916015625, 60.89417266845703, 63.89918518066406, 66.9041976928711, 69.90921020507812, 72.91422271728516, 75.91923522949219, 78.92425537109375, 81.92926788330078, 84.93428039550781, 87.93929290771484, 90.94430541992188, 93.94932556152344]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 8.0, 9.0, 6.0, 16.0, 18.0, 32.0, 30.0, 50.0, 62.0, 74.0, 138.0, 228.0, 348.0, 539.0, 1108.0, 1879.0, 3695.0, 8358.0, 21610.0, 75463.0, 561141.0, 290655.0, 52467.0, 16995.0, 6764.0, 3003.0, 1586.0, 894.0, 517.0, 278.0, 182.0, 96.0, 76.0, 73.0, 39.0, 33.0, 26.0, 15.0, 15.0, 7.0, 8.0, 4.0, 3.0, 3.0, 2.0, 5.0, 3.0, 3.0, 0.0, 1.0], "bins": [-5.8828125, -5.714111328125, -5.54541015625, -5.376708984375, -5.2080078125, -5.039306640625, -4.87060546875, -4.701904296875, -4.533203125, -4.364501953125, -4.19580078125, -4.027099609375, -3.8583984375, -3.689697265625, -3.52099609375, -3.352294921875, -3.18359375, -3.014892578125, -2.84619140625, -2.677490234375, -2.5087890625, -2.340087890625, -2.17138671875, -2.002685546875, -1.833984375, -1.665283203125, -1.49658203125, -1.327880859375, -1.1591796875, -0.990478515625, -0.82177734375, -0.653076171875, -0.484375, -0.315673828125, -0.14697265625, 0.021728515625, 0.1904296875, 0.359130859375, 0.52783203125, 0.696533203125, 0.865234375, 1.033935546875, 1.20263671875, 1.371337890625, 1.5400390625, 1.708740234375, 1.87744140625, 2.046142578125, 2.21484375, 2.383544921875, 2.55224609375, 2.720947265625, 2.8896484375, 3.058349609375, 3.22705078125, 3.395751953125, 3.564453125, 3.733154296875, 3.90185546875, 4.070556640625, 4.2392578125, 4.407958984375, 4.57666015625, 4.745361328125, 4.9140625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 7.0, 11.0, 4.0, 25.0, 31.0, 25.0, 44.0, 51.0, 47.0, 63.0, 59.0, 89.0, 80.0, 76.0, 70.0, 63.0, 55.0, 40.0, 27.0, 34.0, 22.0, 23.0, 16.0, 10.0, 6.0, 3.0, 4.0, 7.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.69140625, -4.562591552734375, -4.43377685546875, -4.304962158203125, -4.1761474609375, -4.047332763671875, -3.91851806640625, -3.789703369140625, -3.660888671875, -3.532073974609375, -3.40325927734375, -3.274444580078125, -3.1456298828125, -3.016815185546875, -2.88800048828125, -2.759185791015625, -2.63037109375, -2.501556396484375, -2.37274169921875, -2.243927001953125, -2.1151123046875, -1.986297607421875, -1.85748291015625, -1.728668212890625, -1.599853515625, -1.471038818359375, -1.34222412109375, -1.213409423828125, -1.0845947265625, -0.955780029296875, -0.82696533203125, -0.698150634765625, -0.5693359375, -0.440521240234375, -0.31170654296875, -0.182891845703125, -0.0540771484375, 0.074737548828125, 0.20355224609375, 0.332366943359375, 0.461181640625, 0.589996337890625, 0.71881103515625, 0.847625732421875, 0.9764404296875, 1.105255126953125, 1.23406982421875, 1.362884521484375, 1.49169921875, 1.620513916015625, 1.74932861328125, 1.878143310546875, 2.0069580078125, 2.135772705078125, 2.26458740234375, 2.393402099609375, 2.522216796875, 2.651031494140625, 2.77984619140625, 2.908660888671875, 3.0374755859375, 3.166290283203125, 3.29510498046875, 3.423919677734375, 3.552734375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 7.0, 6.0, 6.0, 15.0, 12.0, 11.0, 16.0, 23.0, 35.0, 41.0, 70.0, 76.0, 152.0, 220.0, 370.0, 735.0, 1715.0, 4887.0, 20328.0, 214109.0, 770958.0, 25208.0, 5747.0, 1923.0, 805.0, 352.0, 250.0, 157.0, 95.0, 62.0, 37.0, 30.0, 21.0, 16.0, 12.0, 6.0, 10.0, 5.0, 7.0, 2.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.9453125, -6.71429443359375, -6.4832763671875, -6.25225830078125, -6.021240234375, -5.79022216796875, -5.5592041015625, -5.32818603515625, -5.09716796875, -4.86614990234375, -4.6351318359375, -4.40411376953125, -4.173095703125, -3.94207763671875, -3.7110595703125, -3.48004150390625, -3.2490234375, -3.01800537109375, -2.7869873046875, -2.55596923828125, -2.324951171875, -2.09393310546875, -1.8629150390625, -1.63189697265625, -1.40087890625, -1.16986083984375, -0.9388427734375, -0.70782470703125, -0.476806640625, -0.24578857421875, -0.0147705078125, 0.21624755859375, 0.447265625, 0.67828369140625, 0.9093017578125, 1.14031982421875, 1.371337890625, 1.60235595703125, 1.8333740234375, 2.06439208984375, 2.29541015625, 2.52642822265625, 2.7574462890625, 2.98846435546875, 3.219482421875, 3.45050048828125, 3.6815185546875, 3.91253662109375, 4.1435546875, 4.37457275390625, 4.6055908203125, 4.83660888671875, 5.067626953125, 5.29864501953125, 5.5296630859375, 5.76068115234375, 5.99169921875, 6.22271728515625, 6.4537353515625, 6.68475341796875, 6.915771484375, 7.14678955078125, 7.3778076171875, 7.60882568359375, 7.83984375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 8.0, 6.0, 6.0, 6.0, 11.0, 14.0, 11.0, 13.0, 17.0, 28.0, 26.0, 39.0, 27.0, 38.0, 51.0, 63.0, 74.0, 74.0, 79.0, 68.0, 65.0, 50.0, 39.0, 34.0, 28.0, 19.0, 15.0, 13.0, 15.0, 12.0, 9.0, 9.0, 9.0, 7.0, 9.0, 5.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 3.0], "bins": [-15.59375, -15.19287109375, -14.7919921875, -14.39111328125, -13.990234375, -13.58935546875, -13.1884765625, -12.78759765625, -12.38671875, -11.98583984375, -11.5849609375, -11.18408203125, -10.783203125, -10.38232421875, -9.9814453125, -9.58056640625, -9.1796875, -8.77880859375, -8.3779296875, -7.97705078125, -7.576171875, -7.17529296875, -6.7744140625, -6.37353515625, -5.97265625, -5.57177734375, -5.1708984375, -4.77001953125, -4.369140625, -3.96826171875, -3.5673828125, -3.16650390625, -2.765625, -2.36474609375, -1.9638671875, -1.56298828125, -1.162109375, -0.76123046875, -0.3603515625, 0.04052734375, 0.44140625, 0.84228515625, 1.2431640625, 1.64404296875, 2.044921875, 2.44580078125, 2.8466796875, 3.24755859375, 3.6484375, 4.04931640625, 4.4501953125, 4.85107421875, 5.251953125, 5.65283203125, 6.0537109375, 6.45458984375, 6.85546875, 7.25634765625, 7.6572265625, 8.05810546875, 8.458984375, 8.85986328125, 9.2607421875, 9.66162109375, 10.0625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 5.0, 7.0, 2.0, 2.0, 6.0, 6.0, 12.0, 14.0, 20.0, 27.0, 27.0, 36.0, 109.0, 198.0, 419.0, 1041.0, 3484.0, 17329.0, 928194.0, 86503.0, 7755.0, 1998.0, 714.0, 276.0, 148.0, 88.0, 35.0, 23.0, 28.0, 11.0, 10.0, 9.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.68359375, -2.599151611328125, -2.51470947265625, -2.430267333984375, -2.3458251953125, -2.261383056640625, -2.17694091796875, -2.092498779296875, -2.008056640625, -1.923614501953125, -1.83917236328125, -1.754730224609375, -1.6702880859375, -1.585845947265625, -1.50140380859375, -1.416961669921875, -1.33251953125, -1.248077392578125, -1.16363525390625, -1.079193115234375, -0.9947509765625, -0.910308837890625, -0.82586669921875, -0.741424560546875, -0.656982421875, -0.572540283203125, -0.48809814453125, -0.403656005859375, -0.3192138671875, -0.234771728515625, -0.15032958984375, -0.065887451171875, 0.0185546875, 0.102996826171875, 0.18743896484375, 0.271881103515625, 0.3563232421875, 0.440765380859375, 0.52520751953125, 0.609649658203125, 0.694091796875, 0.778533935546875, 0.86297607421875, 0.947418212890625, 1.0318603515625, 1.116302490234375, 1.20074462890625, 1.285186767578125, 1.36962890625, 1.454071044921875, 1.53851318359375, 1.622955322265625, 1.7073974609375, 1.791839599609375, 1.87628173828125, 1.960723876953125, 2.045166015625, 2.129608154296875, 2.21405029296875, 2.298492431640625, 2.3829345703125, 2.467376708984375, 2.55181884765625, 2.636260986328125, 2.720703125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 4.0, 4.0, 2.0, 5.0, 16.0, 16.0, 12.0, 21.0, 35.0, 25.0, 56.0, 62.0, 112.0, 176.0, 125.0, 79.0, 61.0, 45.0, 25.0, 24.0, 19.0, 9.0, 6.0, 8.0, 8.0, 3.0, 6.0, 7.0, 3.0, 7.0, 4.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.0005207061767578125, -0.000505201518535614, -0.0004896968603134155, -0.00047419220209121704, -0.00045868754386901855, -0.00044318288564682007, -0.0004276782274246216, -0.0004121735692024231, -0.0003966689109802246, -0.0003811642527580261, -0.00036565959453582764, -0.00035015493631362915, -0.00033465027809143066, -0.0003191456198692322, -0.0003036409616470337, -0.0002881363034248352, -0.0002726316452026367, -0.00025712698698043823, -0.00024162232875823975, -0.00022611767053604126, -0.00021061301231384277, -0.0001951083540916443, -0.0001796036958694458, -0.00016409903764724731, -0.00014859437942504883, -0.00013308972120285034, -0.00011758506298065186, -0.00010208040475845337, -8.657574653625488e-05, -7.10710883140564e-05, -5.556643009185791e-05, -4.0061771869659424e-05, -2.4557113647460938e-05, -9.052455425262451e-06, 6.452202796936035e-06, 2.195686101913452e-05, 3.746151924133301e-05, 5.2966177463531494e-05, 6.847083568572998e-05, 8.397549390792847e-05, 9.948015213012695e-05, 0.00011498481035232544, 0.00013048946857452393, 0.0001459941267967224, 0.0001614987850189209, 0.00017700344324111938, 0.00019250810146331787, 0.00020801275968551636, 0.00022351741790771484, 0.00023902207612991333, 0.0002545267343521118, 0.0002700313925743103, 0.0002855360507965088, 0.0003010407090187073, 0.00031654536724090576, 0.00033205002546310425, 0.00034755468368530273, 0.0003630593419075012, 0.0003785640001296997, 0.0003940686583518982, 0.0004095733165740967, 0.00042507797479629517, 0.00044058263301849365, 0.00045608729124069214, 0.0004715919494628906]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 5.0, 2.0, 5.0, 3.0, 13.0, 12.0, 14.0, 24.0, 37.0, 51.0, 109.0, 182.0, 358.0, 699.0, 1771.0, 5024.0, 20381.0, 161342.0, 809149.0, 36967.0, 7862.0, 2488.0, 962.0, 480.0, 256.0, 124.0, 65.0, 55.0, 25.0, 14.0, 17.0, 9.0, 13.0, 7.0, 10.0, 6.0, 2.0, 4.0, 4.0, 0.0, 4.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.099609375, -1.060577392578125, -1.02154541015625, -0.982513427734375, -0.9434814453125, -0.904449462890625, -0.86541748046875, -0.826385498046875, -0.787353515625, -0.748321533203125, -0.70928955078125, -0.670257568359375, -0.6312255859375, -0.592193603515625, -0.55316162109375, -0.514129638671875, -0.47509765625, -0.436065673828125, -0.39703369140625, -0.358001708984375, -0.3189697265625, -0.279937744140625, -0.24090576171875, -0.201873779296875, -0.162841796875, -0.123809814453125, -0.08477783203125, -0.045745849609375, -0.0067138671875, 0.032318115234375, 0.07135009765625, 0.110382080078125, 0.1494140625, 0.188446044921875, 0.22747802734375, 0.266510009765625, 0.3055419921875, 0.344573974609375, 0.38360595703125, 0.422637939453125, 0.461669921875, 0.500701904296875, 0.53973388671875, 0.578765869140625, 0.6177978515625, 0.656829833984375, 0.69586181640625, 0.734893798828125, 0.77392578125, 0.812957763671875, 0.85198974609375, 0.891021728515625, 0.9300537109375, 0.969085693359375, 1.00811767578125, 1.047149658203125, 1.086181640625, 1.125213623046875, 1.16424560546875, 1.203277587890625, 1.2423095703125, 1.281341552734375, 1.32037353515625, 1.359405517578125, 1.3984375]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 5.0, 7.0, 8.0, 3.0, 4.0, 7.0, 21.0, 21.0, 39.0, 53.0, 83.0, 122.0, 190.0, 163.0, 84.0, 63.0, 40.0, 10.0, 19.0, 10.0, 10.0, 6.0, 5.0, 5.0, 6.0, 7.0, 3.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.16796875, -2.103302001953125, -2.03863525390625, -1.973968505859375, -1.9093017578125, -1.844635009765625, -1.77996826171875, -1.715301513671875, -1.650634765625, -1.585968017578125, -1.52130126953125, -1.456634521484375, -1.3919677734375, -1.327301025390625, -1.26263427734375, -1.197967529296875, -1.13330078125, -1.068634033203125, -1.00396728515625, -0.939300537109375, -0.8746337890625, -0.809967041015625, -0.74530029296875, -0.680633544921875, -0.615966796875, -0.551300048828125, -0.48663330078125, -0.421966552734375, -0.3572998046875, -0.292633056640625, -0.22796630859375, -0.163299560546875, -0.0986328125, -0.033966064453125, 0.03070068359375, 0.095367431640625, 0.1600341796875, 0.224700927734375, 0.28936767578125, 0.354034423828125, 0.418701171875, 0.483367919921875, 0.54803466796875, 0.612701416015625, 0.6773681640625, 0.742034912109375, 0.80670166015625, 0.871368408203125, 0.93603515625, 1.000701904296875, 1.06536865234375, 1.130035400390625, 1.1947021484375, 1.259368896484375, 1.32403564453125, 1.388702392578125, 1.453369140625, 1.518035888671875, 1.58270263671875, 1.647369384765625, 1.7120361328125, 1.776702880859375, 1.84136962890625, 1.906036376953125, 1.970703125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 13.0, 31.0, 94.0, 591.0, 178.0, 63.0, 17.0, 15.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-115.619384765625, -111.98573303222656, -108.35208892822266, -104.71843719482422, -101.08479309082031, -97.45114135742188, -93.81749725341797, -90.18384552001953, -86.55020141601562, -82.91654968261719, -79.28290557861328, -75.64925384521484, -72.01560974121094, -68.3819580078125, -64.7483139038086, -61.114662170410156, -57.481014251708984, -53.84736633300781, -50.21371841430664, -46.58007049560547, -42.9464225769043, -39.312774658203125, -35.67912292480469, -32.04547882080078, -28.411828994750977, -24.778181076049805, -21.144533157348633, -17.510883331298828, -13.877236366271973, -10.243587493896484, -6.6099395751953125, -2.9762916564941406, 0.6573562622070312, 4.291004180908203, 7.924652576446533, 11.558300971984863, 15.191948890686035, 18.825597763061523, 22.459245681762695, 26.092893600463867, 29.72654151916504, 33.360191345214844, 36.993839263916016, 40.62748718261719, 44.26113510131836, 47.89478302001953, 51.5284309387207, 55.162078857421875, 58.79572677612305, 62.42937469482422, 66.06302642822266, 69.69667053222656, 73.330322265625, 76.9639663696289, 80.59761810302734, 84.23126220703125, 87.86491394042969, 91.49856567382812, 95.13220977783203, 98.76586151123047, 102.39950561523438, 106.03315734863281, 109.66680145263672, 113.30045318603516, 116.93409729003906]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 6.0, 10.0, 5.0, 9.0, 9.0, 9.0, 18.0, 17.0, 24.0, 20.0, 23.0, 40.0, 50.0, 234.0, 239.0, 40.0, 36.0, 30.0, 32.0, 23.0, 21.0, 24.0, 15.0, 12.0, 12.0, 10.0, 9.0, 9.0, 5.0, 2.0, 3.0, 6.0, 0.0, 2.0, 0.0, 1.0], "bins": [-61.98535919189453, -60.50719451904297, -59.029029846191406, -57.550865173339844, -56.07270050048828, -54.59453582763672, -53.116371154785156, -51.638206481933594, -50.16004180908203, -48.68187713623047, -47.203712463378906, -45.725547790527344, -44.24738311767578, -42.76921844482422, -41.291053771972656, -39.812889099121094, -38.33472442626953, -36.85655975341797, -35.378395080566406, -33.900230407714844, -32.42206573486328, -30.94390106201172, -29.465736389160156, -27.987571716308594, -26.50940704345703, -25.03124237060547, -23.553077697753906, -22.074913024902344, -20.59674835205078, -19.11858367919922, -17.640419006347656, -16.162254333496094, -14.684089660644531, -13.205924987792969, -11.727760314941406, -10.249595642089844, -8.771430969238281, -7.293266296386719, -5.815101623535156, -4.336936950683594, -2.8587722778320312, -1.3806076049804688, 0.09755706787109375, 1.5757217407226562, 3.0538864135742188, 4.532051086425781, 6.010215759277344, 7.488380432128906, 8.966545104980469, 10.444709777832031, 11.922874450683594, 13.401039123535156, 14.879203796386719, 16.35736846923828, 17.835533142089844, 19.313697814941406, 20.79186248779297, 22.27002716064453, 23.748191833496094, 25.226356506347656, 26.70452117919922, 28.18268585205078, 29.660850524902344, 31.139015197753906, 32.61717987060547]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 4.0, 3.0, 3.0, 13.0, 12.0, 11.0, 17.0, 22.0, 31.0, 23.0, 34.0, 29.0, 77.0, 264.0, 142.0, 59.0, 48.0, 38.0, 29.0, 25.0, 24.0, 16.0, 18.0, 11.0, 9.0, 8.0, 8.0, 4.0, 8.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-3.685546875, -3.582550048828125, -3.47955322265625, -3.376556396484375, -3.2735595703125, -3.170562744140625, -3.06756591796875, -2.964569091796875, -2.861572265625, -2.758575439453125, -2.65557861328125, -2.552581787109375, -2.4495849609375, -2.346588134765625, -2.24359130859375, -2.140594482421875, -2.03759765625, -1.934600830078125, -1.83160400390625, -1.728607177734375, -1.6256103515625, -1.522613525390625, -1.41961669921875, -1.316619873046875, -1.213623046875, -1.110626220703125, -1.00762939453125, -0.904632568359375, -0.8016357421875, -0.698638916015625, -0.59564208984375, -0.492645263671875, -0.3896484375, -0.286651611328125, -0.18365478515625, -0.080657958984375, 0.0223388671875, 0.125335693359375, 0.22833251953125, 0.331329345703125, 0.434326171875, 0.537322998046875, 0.64031982421875, 0.743316650390625, 0.8463134765625, 0.949310302734375, 1.05230712890625, 1.155303955078125, 1.25830078125, 1.361297607421875, 1.46429443359375, 1.567291259765625, 1.6702880859375, 1.773284912109375, 1.87628173828125, 1.979278564453125, 2.082275390625, 2.185272216796875, 2.28826904296875, 2.391265869140625, 2.4942626953125, 2.597259521484375, 2.70025634765625, 2.803253173828125, 2.90625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 5.0, 0.0, 2.0, 14.0, 8.0, 18.0, 25.0, 31.0, 59.0, 167.0, 675.0, 6428.0, 8370906.0, 8975.0, 843.0, 189.0, 75.0, 61.0, 15.0, 23.0, 16.0, 7.0, 7.0, 11.0, 1.0, 1.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0], "bins": [-49.537994384765625, -47.8031005859375, -46.068206787109375, -44.33331298828125, -42.598419189453125, -40.863525390625, -39.128631591796875, -37.39373779296875, -35.658843994140625, -33.9239501953125, -32.189056396484375, -30.45416259765625, -28.719268798828125, -26.984375, -25.249479293823242, -23.514585494995117, -21.77968978881836, -20.044795989990234, -18.30990219116211, -16.575008392333984, -14.840113639831543, -13.105219841003418, -11.370325088500977, -9.635431289672852, -7.900537490844727, -6.165643692016602, -4.430749416351318, -2.695855140686035, -0.9609613418579102, 0.7739324569702148, 2.5088272094726562, 4.243721008300781, 5.978614807128906, 7.713508605957031, 9.448402404785156, 11.183297157287598, 12.918190956115723, 14.653084754943848, 16.38797950744629, 18.122873306274414, 19.85776710510254, 21.592660903930664, 23.32755470275879, 25.062450408935547, 26.797344207763672, 28.532238006591797, 30.267131805419922, 32.00202560424805, 33.73691940307617, 35.4718132019043, 37.20670700073242, 38.94160079956055, 40.67649459838867, 42.4113883972168, 44.14628601074219, 45.88117980957031, 47.61607360839844, 49.35096740722656, 51.08586120605469, 52.82075500488281, 54.55564880371094, 56.29054260253906, 58.02543640136719, 59.76033020019531, 61.49522399902344]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 2.0, 2.0, 3.0, 6.0, 3.0, 4.0, 5.0, 2.0, 5.0, 3.0, 7.0, 4.0, 7.0, 8.0, 4.0, 4.0, 4.0, 4.0, 5.0, 3.0, 1.0, 1.0, 3.0, 3.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.089269638061523, -18.179800033569336, -17.27033233642578, -16.360862731933594, -15.451395034790039, -14.541925430297852, -13.63245677947998, -12.72298812866211, -11.813519477844238, -10.904050827026367, -9.994582176208496, -9.085113525390625, -8.175643920898438, -7.266175746917725, -6.356706619262695, -5.447237968444824, -4.537769317626953, -3.628300666809082, -2.718831777572632, -1.8093628883361816, -0.8998942375183105, 0.009574413299560547, 0.9190435409545898, 1.828512191772461, 2.737980842590332, 3.647449493408203, 4.556918144226074, 5.4663872718811035, 6.375855922698975, 7.285324573516846, 8.194793701171875, 9.104262351989746, 10.013729095458984, 10.923197746276855, 11.832666397094727, 12.742136001586914, 13.651603698730469, 14.561073303222656, 15.470541954040527, 16.3800106048584, 17.289478302001953, 18.19894790649414, 19.108415603637695, 20.017885208129883, 20.927352905273438, 21.836822509765625, 22.746292114257812, 23.655759811401367, 24.565229415893555, 25.474699020385742, 26.384166717529297, 27.293636322021484, 28.20310401916504, 29.112573623657227, 30.02204132080078, 30.93151092529297, 31.840980529785156, 32.750450134277344, 33.65991973876953, 34.56938552856445, 35.47885513305664, 36.38832473754883, 37.297794342041016, 38.20726013183594, 39.116729736328125]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 15.0, 15.0, 34.0, 39.0, 104.0, 177.0, 384.0, 995.0, 3634.0, 21365.0, 203011.0, 262535.0, 25760.0, 4131.0, 1122.0, 452.0, 201.0, 116.0, 59.0, 41.0, 25.0, 10.0, 11.0, 9.0, 6.0, 4.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.125, -36.7666015625, -35.408203125, -34.0498046875, -32.69140625, -31.3330078125, -29.974609375, -28.6162109375, -27.2578125, -25.8994140625, -24.541015625, -23.1826171875, -21.82421875, -20.4658203125, -19.107421875, -17.7490234375, -16.390625, -15.0322265625, -13.673828125, -12.3154296875, -10.95703125, -9.5986328125, -8.240234375, -6.8818359375, -5.5234375, -4.1650390625, -2.806640625, -1.4482421875, -0.08984375, 1.2685546875, 2.626953125, 3.9853515625, 5.34375, 6.7021484375, 8.060546875, 9.4189453125, 10.77734375, 12.1357421875, 13.494140625, 14.8525390625, 16.2109375, 17.5693359375, 18.927734375, 20.2861328125, 21.64453125, 23.0029296875, 24.361328125, 25.7197265625, 27.078125, 28.4365234375, 29.794921875, 31.1533203125, 32.51171875, 33.8701171875, 35.228515625, 36.5869140625, 37.9453125, 39.3037109375, 40.662109375, 42.0205078125, 43.37890625, 44.7373046875, 46.095703125, 47.4541015625, 48.8125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 0.0, 3.0, 3.0, 9.0, 10.0, 18.0, 18.0, 25.0, 42.0, 43.0, 55.0, 69.0, 81.0, 109.0, 100.0, 80.0, 85.0, 64.0, 54.0, 32.0, 30.0, 21.0, 13.0, 8.0, 3.0, 9.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-5.05859375, -4.91949462890625, -4.7803955078125, -4.64129638671875, -4.502197265625, -4.36309814453125, -4.2239990234375, -4.08489990234375, -3.94580078125, -3.80670166015625, -3.6676025390625, -3.52850341796875, -3.389404296875, -3.25030517578125, -3.1112060546875, -2.97210693359375, -2.8330078125, -2.69390869140625, -2.5548095703125, -2.41571044921875, -2.276611328125, -2.13751220703125, -1.9984130859375, -1.85931396484375, -1.72021484375, -1.58111572265625, -1.4420166015625, -1.30291748046875, -1.163818359375, -1.02471923828125, -0.8856201171875, -0.74652099609375, -0.607421875, -0.46832275390625, -0.3292236328125, -0.19012451171875, -0.051025390625, 0.08807373046875, 0.2271728515625, 0.36627197265625, 0.50537109375, 0.64447021484375, 0.7835693359375, 0.92266845703125, 1.061767578125, 1.20086669921875, 1.3399658203125, 1.47906494140625, 1.6181640625, 1.75726318359375, 1.8963623046875, 2.03546142578125, 2.174560546875, 2.31365966796875, 2.4527587890625, 2.59185791015625, 2.73095703125, 2.87005615234375, 3.0091552734375, 3.14825439453125, 3.287353515625, 3.42645263671875, 3.5655517578125, 3.70465087890625, 3.84375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 6.0, 2.0, 9.0, 11.0, 26.0, 52.0, 132.0, 125.0, 63.0, 34.0, 5.0, 10.0, 3.0, 5.0, 2.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.15226745605469, -43.020484924316406, -41.88870620727539, -40.756927490234375, -39.625144958496094, -38.49336242675781, -37.3615837097168, -36.22980499267578, -35.0980224609375, -33.96623992919922, -32.8344612121582, -31.702680587768555, -30.570899963378906, -29.439119338989258, -28.30733871459961, -27.17555809020996, -26.043777465820312, -24.911996841430664, -23.780216217041016, -22.648435592651367, -21.51665496826172, -20.38487434387207, -19.253093719482422, -18.121313095092773, -16.989532470703125, -15.857751846313477, -14.725971221923828, -13.59419059753418, -12.462409973144531, -11.330629348754883, -10.198848724365234, -9.067068099975586, -7.935285568237305, -6.803504943847656, -5.671724319458008, -4.539943695068359, -3.408163070678711, -2.2763824462890625, -1.144601821899414, -0.012821197509765625, 1.1189594268798828, 2.2507400512695312, 3.3825206756591797, 4.514301300048828, 5.646081924438477, 6.777862548828125, 7.909643173217773, 9.041423797607422, 10.17320442199707, 11.304985046386719, 12.436765670776367, 13.568546295166016, 14.700326919555664, 15.832107543945312, 16.96388816833496, 18.09566879272461, 19.227449417114258, 20.359230041503906, 21.491010665893555, 22.622791290283203, 23.75457191467285, 24.8863525390625, 26.01813316345215, 27.149913787841797, 28.281694412231445]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 3.0, 6.0, 4.0, 7.0, 22.0, 35.0, 75.0, 137.0, 88.0, 40.0, 16.0, 11.0, 7.0, 3.0, 5.0, 7.0, 2.0, 7.0, 0.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.07525634765625, -25.367338180541992, -24.659420013427734, -23.951501846313477, -23.24358367919922, -22.535667419433594, -21.827749252319336, -21.119831085205078, -20.41191291809082, -19.703994750976562, -18.996076583862305, -18.288158416748047, -17.580242156982422, -16.872323989868164, -16.164405822753906, -15.456487655639648, -14.74856948852539, -14.040651321411133, -13.332733154296875, -12.624815940856934, -11.916897773742676, -11.208979606628418, -10.501062393188477, -9.793144226074219, -9.085226058959961, -8.377307891845703, -7.6693902015686035, -6.961472511291504, -6.253554344177246, -5.545636177062988, -4.837718486785889, -4.129800796508789, -3.421884536743164, -2.7139666080474854, -2.0060486793518066, -1.298130750656128, -0.5902128219604492, 0.11770510673522949, 0.8256230354309082, 1.5335407257080078, 2.2414588928222656, 2.9493768215179443, 3.657294750213623, 4.365212440490723, 5.0731306076049805, 5.781048774719238, 6.488966464996338, 7.1968841552734375, 7.904802322387695, 8.612720489501953, 9.320638656616211, 10.028555870056152, 10.73647403717041, 11.444392204284668, 12.15230941772461, 12.860227584838867, 13.568145751953125, 14.276063919067383, 14.98398208618164, 15.691899299621582, 16.399818420410156, 17.10773468017578, 17.81565284729004, 18.523571014404297, 19.231489181518555]}, "eval/loss": 4.305517673492432, "eval/wer": 1.9549980166600556, "eval/runtime": 784.9234, "eval/samples_per_second": 3.366, "eval/steps_per_second": 0.282} \ No newline at end of file