diff --git "a/wandb/run-20220302_000300-2ebwk6gp/files/wandb-summary.json" "b/wandb/run-20220302_000300-2ebwk6gp/files/wandb-summary.json" new file mode 100644--- /dev/null +++ "b/wandb/run-20220302_000300-2ebwk6gp/files/wandb-summary.json" @@ -0,0 +1 @@ +{"train/loss": 4.8067, "train/learning_rate": 9.92e-05, "train/epoch": 0.42, "train/global_step": 500, "_runtime": 2790, "_timestamp": 1646182171, "_step": 500, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 5.0, 9.0, 16.0, 20.0, 36.0, 74.0, 142.0, 342.0, 148.0, 80.0, 51.0, 38.0, 11.0, 7.0, 8.0, 6.0, 4.0, 5.0, 2.0, 1.0, 1.0], "bins": [-412.4659423828125, -404.3079528808594, -396.1499938964844, -387.99200439453125, -379.8340148925781, -371.676025390625, -363.51806640625, -355.3600769042969, -347.20208740234375, -339.0440979003906, -330.8861389160156, -322.7281494140625, -314.5701599121094, -306.41217041015625, -298.25421142578125, -290.0962219238281, -281.9382629394531, -273.7802734375, -265.622314453125, -257.4643249511719, -249.30633544921875, -241.1483612060547, -232.99038696289062, -224.8323974609375, -216.67442321777344, -208.51644897460938, -200.35845947265625, -192.2004852294922, -184.04251098632812, -175.884521484375, -167.72654724121094, -159.56857299804688, -151.41058349609375, -143.2526092529297, -135.09461975097656, -126.9366455078125, -118.7786636352539, -110.62068176269531, -102.46270751953125, -94.30472564697266, -86.14674377441406, -77.98876190185547, -69.83078002929688, -61.67280578613281, -53.51482391357422, -45.356842041015625, -37.1988639831543, -29.04088592529297, -20.882904052734375, -12.724924087524414, -4.566944122314453, 3.591035842895508, 11.749015808105469, 19.906997680664062, 28.06497573852539, 36.22295379638672, 44.38093566894531, 52.538917541503906, 60.696895599365234, 68.85487365722656, 77.01285552978516, 85.17083740234375, 93.32881164550781, 101.4867935180664, 109.644775390625]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 4.0, 2.0, 3.0, 5.0, 9.0, 6.0, 14.0, 8.0, 12.0, 11.0, 16.0, 13.0, 24.0, 17.0, 27.0, 29.0, 37.0, 44.0, 47.0, 61.0, 62.0, 56.0, 57.0, 48.0, 49.0, 56.0, 38.0, 47.0, 44.0, 25.0, 21.0, 16.0, 21.0, 10.0, 10.0, 6.0, 10.0, 5.0, 9.0, 10.0, 7.0, 3.0, 2.0, 4.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-280.0460205078125, -271.1632385253906, -262.28045654296875, -253.39767456054688, -244.514892578125, -235.63211059570312, -226.7493438720703, -217.86656188964844, -208.98377990722656, -200.1009979248047, -191.2182159423828, -182.33543395996094, -173.45266723632812, -164.56988525390625, -155.68710327148438, -146.8043212890625, -137.92153930664062, -129.03875732421875, -120.15597534179688, -111.27320098876953, -102.39041900634766, -93.50763702392578, -84.62486267089844, -75.74208068847656, -66.85929870605469, -57.97651672363281, -49.0937385559082, -40.210960388183594, -31.32817840576172, -22.445396423339844, -13.562618255615234, -4.679840087890625, 4.202972412109375, 13.085752487182617, 21.96853256225586, 30.8513126373291, 39.734092712402344, 48.61687469482422, 57.49965286254883, 66.38243103027344, 75.26521301269531, 84.14799499511719, 93.03077697753906, 101.9135513305664, 110.79633331298828, 119.67911529541016, 128.5618896484375, 137.44467163085938, 146.32745361328125, 155.21023559570312, 164.093017578125, 172.97579956054688, 181.85858154296875, 190.74136352539062, 199.62413024902344, 208.5069122314453, 217.3896942138672, 226.27247619628906, 235.15525817871094, 244.0380401611328, 252.92080688476562, 261.8035888671875, 270.6863708496094, 279.56915283203125, 288.4519348144531]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 4.0, 7.0, 4.0, 12.0, 12.0, 16.0, 10.0, 24.0, 22.0, 33.0, 31.0, 48.0, 48.0, 68.0, 75.0, 86.0, 73.0, 57.0, 73.0, 64.0, 55.0, 45.0, 23.0, 25.0, 16.0, 11.0, 13.0, 10.0, 17.0, 10.0, 6.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-23.21875, -22.638671875, -22.05859375, -21.478515625, -20.8984375, -20.318359375, -19.73828125, -19.158203125, -18.578125, -17.998046875, -17.41796875, -16.837890625, -16.2578125, -15.677734375, -15.09765625, -14.517578125, -13.9375, -13.357421875, -12.77734375, -12.197265625, -11.6171875, -11.037109375, -10.45703125, -9.876953125, -9.296875, -8.716796875, -8.13671875, -7.556640625, -6.9765625, -6.396484375, -5.81640625, -5.236328125, -4.65625, -4.076171875, -3.49609375, -2.916015625, -2.3359375, -1.755859375, -1.17578125, -0.595703125, -0.015625, 0.564453125, 1.14453125, 1.724609375, 2.3046875, 2.884765625, 3.46484375, 4.044921875, 4.625, 5.205078125, 5.78515625, 6.365234375, 6.9453125, 7.525390625, 8.10546875, 8.685546875, 9.265625, 9.845703125, 10.42578125, 11.005859375, 11.5859375, 12.166015625, 12.74609375, 13.326171875, 13.90625]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 6.0, 2.0, 6.0, 10.0, 9.0, 7.0, 13.0, 14.0, 32.0, 34.0, 52.0, 73.0, 87.0, 131.0, 212.0, 374.0, 611.0, 930.0, 1633.0, 2808.0, 5113.0, 9959.0, 22721.0, 68432.0, 2844560.0, 1138653.0, 58512.0, 20115.0, 8731.0, 4430.0, 2482.0, 1417.0, 831.0, 505.0, 287.0, 183.0, 115.0, 69.0, 52.0, 30.0, 12.0, 9.0, 13.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0], "bins": [-92.875, -90.54833984375, -88.2216796875, -85.89501953125, -83.568359375, -81.24169921875, -78.9150390625, -76.58837890625, -74.26171875, -71.93505859375, -69.6083984375, -67.28173828125, -64.955078125, -62.62841796875, -60.3017578125, -57.97509765625, -55.6484375, -53.32177734375, -50.9951171875, -48.66845703125, -46.341796875, -44.01513671875, -41.6884765625, -39.36181640625, -37.03515625, -34.70849609375, -32.3818359375, -30.05517578125, -27.728515625, -25.40185546875, -23.0751953125, -20.74853515625, -18.421875, -16.09521484375, -13.7685546875, -11.44189453125, -9.115234375, -6.78857421875, -4.4619140625, -2.13525390625, 0.19140625, 2.51806640625, 4.8447265625, 7.17138671875, 9.498046875, 11.82470703125, 14.1513671875, 16.47802734375, 18.8046875, 21.13134765625, 23.4580078125, 25.78466796875, 28.111328125, 30.43798828125, 32.7646484375, 35.09130859375, 37.41796875, 39.74462890625, 42.0712890625, 44.39794921875, 46.724609375, 49.05126953125, 51.3779296875, 53.70458984375, 56.03125]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 9.0, 3.0, 11.0, 12.0, 6.0, 8.0, 14.0, 11.0, 17.0, 32.0, 33.0, 46.0, 41.0, 60.0, 64.0, 85.0, 150.0, 328.0, 780.0, 1135.0, 500.0, 219.0, 106.0, 70.0, 61.0, 47.0, 39.0, 37.0, 20.0, 25.0, 23.0, 9.0, 10.0, 13.0, 10.0, 5.0, 6.0, 5.0, 3.0, 9.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-59.28125, -57.44580078125, -55.6103515625, -53.77490234375, -51.939453125, -50.10400390625, -48.2685546875, -46.43310546875, -44.59765625, -42.76220703125, -40.9267578125, -39.09130859375, -37.255859375, -35.42041015625, -33.5849609375, -31.74951171875, -29.9140625, -28.07861328125, -26.2431640625, -24.40771484375, -22.572265625, -20.73681640625, -18.9013671875, -17.06591796875, -15.23046875, -13.39501953125, -11.5595703125, -9.72412109375, -7.888671875, -6.05322265625, -4.2177734375, -2.38232421875, -0.546875, 1.28857421875, 3.1240234375, 4.95947265625, 6.794921875, 8.63037109375, 10.4658203125, 12.30126953125, 14.13671875, 15.97216796875, 17.8076171875, 19.64306640625, 21.478515625, 23.31396484375, 25.1494140625, 26.98486328125, 28.8203125, 30.65576171875, 32.4912109375, 34.32666015625, 36.162109375, 37.99755859375, 39.8330078125, 41.66845703125, 43.50390625, 45.33935546875, 47.1748046875, 49.01025390625, 50.845703125, 52.68115234375, 54.5166015625, 56.35205078125, 58.1875]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 2.0, 1.0, 4.0, 3.0, 4.0, 6.0, 8.0, 11.0, 9.0, 21.0, 11.0, 24.0, 30.0, 34.0, 26.0, 35.0, 54.0, 64.0, 93.0, 148.0, 241.0, 452.0, 1090.0, 2693.0, 8453.0, 29725.0, 155251.0, 3728229.0, 215283.0, 36396.0, 9951.0, 3345.0, 1228.0, 514.0, 240.0, 143.0, 101.0, 76.0, 50.0, 33.0, 43.0, 27.0, 18.0, 22.0, 21.0, 16.0, 23.0, 8.0, 9.0, 5.0, 4.0, 4.0, 4.0, 4.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-171.0, -165.583984375, -160.16796875, -154.751953125, -149.3359375, -143.919921875, -138.50390625, -133.087890625, -127.671875, -122.255859375, -116.83984375, -111.423828125, -106.0078125, -100.591796875, -95.17578125, -89.759765625, -84.34375, -78.927734375, -73.51171875, -68.095703125, -62.6796875, -57.263671875, -51.84765625, -46.431640625, -41.015625, -35.599609375, -30.18359375, -24.767578125, -19.3515625, -13.935546875, -8.51953125, -3.103515625, 2.3125, 7.728515625, 13.14453125, 18.560546875, 23.9765625, 29.392578125, 34.80859375, 40.224609375, 45.640625, 51.056640625, 56.47265625, 61.888671875, 67.3046875, 72.720703125, 78.13671875, 83.552734375, 88.96875, 94.384765625, 99.80078125, 105.216796875, 110.6328125, 116.048828125, 121.46484375, 126.880859375, 132.296875, 137.712890625, 143.12890625, 148.544921875, 153.9609375, 159.376953125, 164.79296875, 170.208984375, 175.625]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 9.0, 8.0, 13.0, 16.0, 20.0, 34.0, 50.0, 105.0, 191.0, 240.0, 119.0, 66.0, 59.0, 24.0, 12.0, 17.0, 9.0, 9.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-125.90673828125, -118.60746002197266, -111.30818176269531, -104.00889587402344, -96.7096176147461, -89.41033935546875, -82.1110610961914, -74.81178283691406, -67.51249694824219, -60.213218688964844, -52.913936614990234, -45.61465835571289, -38.31537628173828, -31.016098022460938, -23.716819763183594, -16.417537689208984, -9.118263244628906, -1.818983554840088, 5.4802961349487305, 12.77957534790039, 20.078855514526367, 27.378135681152344, 34.67741394042969, 41.9766960144043, 49.27597427368164, 56.575252532958984, 63.874534606933594, 71.17381286621094, 78.47309112548828, 85.77236938476562, 93.0716552734375, 100.37093353271484, 107.67021179199219, 114.96949005126953, 122.26876831054688, 129.56805419921875, 136.86732482910156, 144.16661071777344, 151.46588134765625, 158.76516723632812, 166.064453125, 173.36373901367188, 180.6630096435547, 187.96229553222656, 195.26156616210938, 202.56085205078125, 209.86013793945312, 217.15940856933594, 224.45867919921875, 231.75796508789062, 239.05723571777344, 246.3565216064453, 253.65579223632812, 260.955078125, 268.2543640136719, 275.55364990234375, 282.8529357910156, 290.1522216796875, 297.4515075683594, 304.7507629394531, 312.050048828125, 319.3493347167969, 326.64862060546875, 333.9479064941406, 341.2471618652344]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 6.0, 9.0, 8.0, 9.0, 9.0, 8.0, 11.0, 16.0, 29.0, 25.0, 24.0, 27.0, 23.0, 37.0, 26.0, 44.0, 44.0, 43.0, 43.0, 52.0, 46.0, 39.0, 47.0, 40.0, 26.0, 40.0, 35.0, 28.0, 37.0, 28.0, 34.0, 21.0, 11.0, 20.0, 11.0, 10.0, 10.0, 14.0, 6.0, 6.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-201.2471466064453, -194.98915100097656, -188.73114013671875, -182.47314453125, -176.21514892578125, -169.95713806152344, -163.6991424560547, -157.44113159179688, -151.18313598632812, -144.92514038085938, -138.66712951660156, -132.4091339111328, -126.15113067626953, -119.89312744140625, -113.6351318359375, -107.37712860107422, -101.11913299560547, -94.86112976074219, -88.60313415527344, -82.34513092041016, -76.08712768554688, -69.82913208007812, -63.571128845214844, -57.31312561035156, -51.05512619018555, -44.79712677001953, -38.53912353515625, -32.281124114990234, -26.023122787475586, -19.765121459960938, -13.507122039794922, -7.249118804931641, -0.991119384765625, 5.266881465911865, 11.524882316589355, 17.782882690429688, 24.040884017944336, 30.298885345458984, 36.556884765625, 42.81488800048828, 49.0728874206543, 55.33088684082031, 61.588890075683594, 67.84689331054688, 74.10488891601562, 80.3628921508789, 86.62089538574219, 92.87889099121094, 99.13689422607422, 105.3948974609375, 111.65289306640625, 117.91089630126953, 124.16889953613281, 130.42689514160156, 136.68490600585938, 142.94290161132812, 149.20089721679688, 155.45889282226562, 161.71690368652344, 167.9748992919922, 174.23289489746094, 180.49090576171875, 186.7489013671875, 193.00689697265625, 199.26490783691406]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 1.0, 2.0, 8.0, 6.0, 4.0, 6.0, 11.0, 17.0, 15.0, 26.0, 33.0, 31.0, 34.0, 35.0, 45.0, 59.0, 75.0, 70.0, 64.0, 81.0, 48.0, 50.0, 53.0, 46.0, 26.0, 26.0, 20.0, 28.0, 16.0, 16.0, 13.0, 13.0, 9.0, 9.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-23.203125, -22.6290283203125, -22.054931640625, -21.4808349609375, -20.90673828125, -20.3326416015625, -19.758544921875, -19.1844482421875, -18.6103515625, -18.0362548828125, -17.462158203125, -16.8880615234375, -16.31396484375, -15.7398681640625, -15.165771484375, -14.5916748046875, -14.017578125, -13.4434814453125, -12.869384765625, -12.2952880859375, -11.72119140625, -11.1470947265625, -10.572998046875, -9.9989013671875, -9.4248046875, -8.8507080078125, -8.276611328125, -7.7025146484375, -7.12841796875, -6.5543212890625, -5.980224609375, -5.4061279296875, -4.83203125, -4.2579345703125, -3.683837890625, -3.1097412109375, -2.53564453125, -1.9615478515625, -1.387451171875, -0.8133544921875, -0.2392578125, 0.3348388671875, 0.908935546875, 1.4830322265625, 2.05712890625, 2.6312255859375, 3.205322265625, 3.7794189453125, 4.353515625, 4.9276123046875, 5.501708984375, 6.0758056640625, 6.64990234375, 7.2239990234375, 7.798095703125, 8.3721923828125, 8.9462890625, 9.5203857421875, 10.094482421875, 10.6685791015625, 11.24267578125, 11.8167724609375, 12.390869140625, 12.9649658203125, 13.5390625]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 4.0, 4.0, 8.0, 10.0, 11.0, 15.0, 29.0, 32.0, 48.0, 77.0, 146.0, 278.0, 482.0, 986.0, 1836.0, 3659.0, 7567.0, 15823.0, 35311.0, 90968.0, 302783.0, 390622.0, 117781.0, 43274.0, 18753.0, 9055.0, 4372.0, 2231.0, 1115.0, 533.0, 320.0, 158.0, 99.0, 60.0, 36.0, 25.0, 15.0, 5.0, 10.0, 10.0, 6.0, 6.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9140625, -0.8776702880859375, -0.841278076171875, -0.8048858642578125, -0.76849365234375, -0.7321014404296875, -0.695709228515625, -0.6593170166015625, -0.6229248046875, -0.5865325927734375, -0.550140380859375, -0.5137481689453125, -0.47735595703125, -0.4409637451171875, -0.404571533203125, -0.3681793212890625, -0.331787109375, -0.2953948974609375, -0.259002685546875, -0.2226104736328125, -0.18621826171875, -0.1498260498046875, -0.113433837890625, -0.0770416259765625, -0.0406494140625, -0.0042572021484375, 0.032135009765625, 0.0685272216796875, 0.10491943359375, 0.1413116455078125, 0.177703857421875, 0.2140960693359375, 0.25048828125, 0.2868804931640625, 0.323272705078125, 0.3596649169921875, 0.39605712890625, 0.4324493408203125, 0.468841552734375, 0.5052337646484375, 0.5416259765625, 0.5780181884765625, 0.614410400390625, 0.6508026123046875, 0.68719482421875, 0.7235870361328125, 0.759979248046875, 0.7963714599609375, 0.832763671875, 0.8691558837890625, 0.905548095703125, 0.9419403076171875, 0.97833251953125, 1.0147247314453125, 1.051116943359375, 1.0875091552734375, 1.1239013671875, 1.1602935791015625, 1.196685791015625, 1.2330780029296875, 1.26947021484375, 1.3058624267578125, 1.342254638671875, 1.3786468505859375, 1.4150390625]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 3.0, 4.0, 7.0, 9.0, 7.0, 9.0, 15.0, 17.0, 7.0, 21.0, 26.0, 17.0, 27.0, 27.0, 36.0, 30.0, 38.0, 34.0, 43.0, 45.0, 47.0, 44.0, 1062.0, 36.0, 30.0, 32.0, 41.0, 24.0, 38.0, 31.0, 20.0, 31.0, 25.0, 21.0, 21.0, 26.0, 5.0, 12.0, 17.0, 10.0, 7.0, 5.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-8.609375, -8.340576171875, -8.07177734375, -7.802978515625, -7.5341796875, -7.265380859375, -6.99658203125, -6.727783203125, -6.458984375, -6.190185546875, -5.92138671875, -5.652587890625, -5.3837890625, -5.114990234375, -4.84619140625, -4.577392578125, -4.30859375, -4.039794921875, -3.77099609375, -3.502197265625, -3.2333984375, -2.964599609375, -2.69580078125, -2.427001953125, -2.158203125, -1.889404296875, -1.62060546875, -1.351806640625, -1.0830078125, -0.814208984375, -0.54541015625, -0.276611328125, -0.0078125, 0.260986328125, 0.52978515625, 0.798583984375, 1.0673828125, 1.336181640625, 1.60498046875, 1.873779296875, 2.142578125, 2.411376953125, 2.68017578125, 2.948974609375, 3.2177734375, 3.486572265625, 3.75537109375, 4.024169921875, 4.29296875, 4.561767578125, 4.83056640625, 5.099365234375, 5.3681640625, 5.636962890625, 5.90576171875, 6.174560546875, 6.443359375, 6.712158203125, 6.98095703125, 7.249755859375, 7.5185546875, 7.787353515625, 8.05615234375, 8.324951171875, 8.59375]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 9.0, 6.0, 8.0, 17.0, 15.0, 30.0, 55.0, 58.0, 93.0, 148.0, 193.0, 250.0, 351.0, 507.0, 724.0, 1014.0, 1416.0, 1956.0, 2931.0, 4078.0, 5789.0, 8300.0, 11923.0, 16859.0, 25351.0, 38396.0, 59914.0, 99510.0, 177281.0, 1271767.0, 137788.0, 79461.0, 48913.0, 31960.0, 21346.0, 14647.0, 10107.0, 7077.0, 4983.0, 3521.0, 2392.0, 1774.0, 1273.0, 867.0, 600.0, 407.0, 295.0, 230.0, 163.0, 125.0, 94.0, 56.0, 30.0, 27.0, 16.0, 15.0, 20.0, 5.0, 4.0, 0.0, 2.0], "bins": [-0.525390625, -0.5091171264648438, -0.4928436279296875, -0.47657012939453125, -0.460296630859375, -0.44402313232421875, -0.4277496337890625, -0.41147613525390625, -0.39520263671875, -0.37892913818359375, -0.3626556396484375, -0.34638214111328125, -0.330108642578125, -0.31383514404296875, -0.2975616455078125, -0.28128814697265625, -0.2650146484375, -0.24874114990234375, -0.2324676513671875, -0.21619415283203125, -0.199920654296875, -0.18364715576171875, -0.1673736572265625, -0.15110015869140625, -0.13482666015625, -0.11855316162109375, -0.1022796630859375, -0.08600616455078125, -0.069732666015625, -0.05345916748046875, -0.0371856689453125, -0.02091217041015625, -0.004638671875, 0.01163482666015625, 0.0279083251953125, 0.04418182373046875, 0.060455322265625, 0.07672882080078125, 0.0930023193359375, 0.10927581787109375, 0.12554931640625, 0.14182281494140625, 0.1580963134765625, 0.17436981201171875, 0.190643310546875, 0.20691680908203125, 0.2231903076171875, 0.23946380615234375, 0.2557373046875, 0.27201080322265625, 0.2882843017578125, 0.30455780029296875, 0.320831298828125, 0.33710479736328125, 0.3533782958984375, 0.36965179443359375, 0.38592529296875, 0.40219879150390625, 0.4184722900390625, 0.43474578857421875, 0.451019287109375, 0.46729278564453125, 0.4835662841796875, 0.49983978271484375, 0.51611328125]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 5.0, 0.0, 10.0, 10.0, 6.0, 4.0, 7.0, 10.0, 17.0, 23.0, 19.0, 24.0, 18.0, 24.0, 34.0, 41.0, 34.0, 41.0, 49.0, 51.0, 37.0, 37.0, 43.0, 49.0, 39.0, 49.0, 47.0, 35.0, 41.0, 26.0, 27.0, 16.0, 20.0, 18.0, 13.0, 10.0, 12.0, 8.0, 8.0, 5.0, 6.0, 7.0, 4.0, 8.0, 6.0, 0.0, 4.0, 0.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.0017871856689453125, -0.001730591058731079, -0.0016739964485168457, -0.0016174018383026123, -0.001560807228088379, -0.0015042126178741455, -0.0014476180076599121, -0.0013910233974456787, -0.0013344287872314453, -0.001277834177017212, -0.0012212395668029785, -0.0011646449565887451, -0.0011080503463745117, -0.0010514557361602783, -0.000994861125946045, -0.0009382665157318115, -0.0008816719055175781, -0.0008250772953033447, -0.0007684826850891113, -0.0007118880748748779, -0.0006552934646606445, -0.0005986988544464111, -0.0005421042442321777, -0.00048550963401794434, -0.00042891502380371094, -0.00037232041358947754, -0.00031572580337524414, -0.00025913119316101074, -0.00020253658294677734, -0.00014594197273254395, -8.934736251831055e-05, -3.275275230407715e-05, 2.384185791015625e-05, 8.043646812438965e-05, 0.00013703107833862305, 0.00019362568855285645, 0.00025022029876708984, 0.00030681490898132324, 0.00036340951919555664, 0.00042000412940979004, 0.00047659873962402344, 0.0005331933498382568, 0.0005897879600524902, 0.0006463825702667236, 0.000702977180480957, 0.0007595717906951904, 0.0008161664009094238, 0.0008727610111236572, 0.0009293556213378906, 0.000985950231552124, 0.0010425448417663574, 0.0010991394519805908, 0.0011557340621948242, 0.0012123286724090576, 0.001268923282623291, 0.0013255178928375244, 0.0013821125030517578, 0.0014387071132659912, 0.0014953017234802246, 0.001551896333694458, 0.0016084909439086914, 0.0016650855541229248, 0.0017216801643371582, 0.0017782747745513916, 0.001834869384765625]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 3.0, 5.0, 2.0, 1.0, 6.0, 9.0, 6.0, 6.0, 4.0, 12.0, 20.0, 17.0, 21.0, 14.0, 24.0, 33.0, 34.0, 38.0, 55.0, 77.0, 62.0, 69.0, 78.0, 92.0, 117.0, 140.0, 222.0, 341.0, 895.0, 11178.0, 898856.0, 131620.0, 2613.0, 560.0, 268.0, 157.0, 155.0, 114.0, 106.0, 76.0, 67.0, 52.0, 47.0, 35.0, 53.0, 19.0, 26.0, 20.0, 20.0, 25.0, 13.0, 17.0, 13.0, 16.0, 11.0, 4.0, 7.0, 8.0, 4.0, 1.0, 4.0, 3.0, 2.0], "bins": [-0.0301361083984375, -0.029187679290771484, -0.02823925018310547, -0.027290821075439453, -0.026342391967773438, -0.025393962860107422, -0.024445533752441406, -0.02349710464477539, -0.022548675537109375, -0.02160024642944336, -0.020651817321777344, -0.019703388214111328, -0.018754959106445312, -0.017806529998779297, -0.01685810089111328, -0.015909671783447266, -0.01496124267578125, -0.014012813568115234, -0.013064384460449219, -0.012115955352783203, -0.011167526245117188, -0.010219097137451172, -0.009270668029785156, -0.00832223892211914, -0.007373809814453125, -0.006425380706787109, -0.005476951599121094, -0.004528522491455078, -0.0035800933837890625, -0.002631664276123047, -0.0016832351684570312, -0.0007348060607910156, 0.000213623046875, 0.0011620521545410156, 0.0021104812622070312, 0.003058910369873047, 0.0040073394775390625, 0.004955768585205078, 0.005904197692871094, 0.006852626800537109, 0.007801055908203125, 0.00874948501586914, 0.009697914123535156, 0.010646343231201172, 0.011594772338867188, 0.012543201446533203, 0.013491630554199219, 0.014440059661865234, 0.01538848876953125, 0.016336917877197266, 0.01728534698486328, 0.018233776092529297, 0.019182205200195312, 0.020130634307861328, 0.021079063415527344, 0.02202749252319336, 0.022975921630859375, 0.02392435073852539, 0.024872779846191406, 0.025821208953857422, 0.026769638061523438, 0.027718067169189453, 0.02866649627685547, 0.029614925384521484, 0.0305633544921875]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 13.0, 102.0, 803.0, 88.0, 10.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.016998164355754852, -0.016654565930366516, -0.01631096936762333, -0.015967370942234993, -0.015623772516846657, -0.015280175022780895, -0.014936577528715134, -0.014592979103326797, -0.014249381609261036, -0.013905784115195274, -0.013562185689806938, -0.013218588195741177, -0.01287498977035284, -0.012531392276287079, -0.012187793850898743, -0.011844196356832981, -0.01150059886276722, -0.011157001368701458, -0.010813402943313122, -0.01046980544924736, -0.010126207023859024, -0.009782609529793262, -0.009439012035727501, -0.009095413610339165, -0.008751815184950829, -0.008408217690885067, -0.00806461926549673, -0.007721021771430969, -0.00737742381170392, -0.0070338258519768715, -0.006690227892249823, -0.006346629932522774, -0.006003032438457012, -0.005659434478729963, -0.005315836519002914, -0.004972239024937153, -0.004628641065210104, -0.004285043105483055, -0.003941445145756006, -0.003597847418859601, -0.003254249459132552, -0.0029106514994055033, -0.002567053772509098, -0.002223455812782049, -0.0018798579694703221, -0.001536260126158595, -0.0011926621664315462, -0.000849064439535141, -0.0005054664798080921, -0.00016186860739253461, 0.0001817292650230229, 0.0005253271665424109, 0.0008689250098541379, 0.001212522853165865, 0.0015561208128929138, 0.001899718539789319, 0.002243316499516368, 0.002586914459243417, 0.002930512186139822, 0.003274110145866871, 0.0036177081055939198, 0.003961306065320969, 0.00430490355938673, 0.004648501519113779, 0.004992099478840828]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 1.0, 3.0, 2.0, 2.0, 6.0, 7.0, 15.0, 10.0, 15.0, 17.0, 15.0, 16.0, 25.0, 25.0, 27.0, 29.0, 25.0, 31.0, 42.0, 35.0, 46.0, 37.0, 37.0, 33.0, 32.0, 42.0, 51.0, 37.0, 34.0, 46.0, 29.0, 26.0, 33.0, 24.0, 19.0, 17.0, 14.0, 14.0, 15.0, 11.0, 13.0, 15.0, 5.0, 8.0, 4.0, 6.0, 3.0, 5.0, 3.0, 2.0, 3.0, 0.0, 2.0], "bins": [-0.001232743263244629, -0.0011970698833465576, -0.0011613965034484863, -0.001125723123550415, -0.0010900497436523438, -0.0010543763637542725, -0.0010187029838562012, -0.0009830296039581299, -0.0009473562240600586, -0.0009116828441619873, -0.000876009464263916, -0.0008403360843658447, -0.0008046627044677734, -0.0007689893245697021, -0.0007333159446716309, -0.0006976425647735596, -0.0006619691848754883, -0.000626295804977417, -0.0005906224250793457, -0.0005549490451812744, -0.0005192756652832031, -0.00048360228538513184, -0.00044792890548706055, -0.00041225552558898926, -0.00037658214569091797, -0.0003409087657928467, -0.0003052353858947754, -0.0002695620059967041, -0.0002338886260986328, -0.00019821524620056152, -0.00016254186630249023, -0.00012686848640441895, -9.119510650634766e-05, -5.552172660827637e-05, -1.9848346710205078e-05, 1.582503318786621e-05, 5.14984130859375e-05, 8.717179298400879e-05, 0.00012284517288208008, 0.00015851855278015137, 0.00019419193267822266, 0.00022986531257629395, 0.00026553869247436523, 0.0003012120723724365, 0.0003368854522705078, 0.0003725588321685791, 0.0004082322120666504, 0.0004439055919647217, 0.00047957897186279297, 0.0005152523517608643, 0.0005509257316589355, 0.0005865991115570068, 0.0006222724914550781, 0.0006579458713531494, 0.0006936192512512207, 0.000729292631149292, 0.0007649660110473633, 0.0008006393909454346, 0.0008363127708435059, 0.0008719861507415771, 0.0009076595306396484, 0.0009433329105377197, 0.000979006290435791, 0.0010146796703338623, 0.0010503530502319336]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 1.0, 2.0, 8.0, 6.0, 4.0, 6.0, 11.0, 17.0, 15.0, 26.0, 33.0, 31.0, 34.0, 35.0, 45.0, 59.0, 75.0, 70.0, 64.0, 81.0, 48.0, 50.0, 53.0, 46.0, 26.0, 26.0, 20.0, 28.0, 16.0, 16.0, 13.0, 13.0, 9.0, 9.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-23.203125, -22.6290283203125, -22.054931640625, -21.4808349609375, -20.90673828125, -20.3326416015625, -19.758544921875, -19.1844482421875, -18.6103515625, -18.0362548828125, -17.462158203125, -16.8880615234375, -16.31396484375, -15.7398681640625, -15.165771484375, -14.5916748046875, -14.017578125, -13.4434814453125, -12.869384765625, -12.2952880859375, -11.72119140625, -11.1470947265625, -10.572998046875, -9.9989013671875, -9.4248046875, -8.8507080078125, -8.276611328125, -7.7025146484375, -7.12841796875, -6.5543212890625, -5.980224609375, -5.4061279296875, -4.83203125, -4.2579345703125, -3.683837890625, -3.1097412109375, -2.53564453125, -1.9615478515625, -1.387451171875, -0.8133544921875, -0.2392578125, 0.3348388671875, 0.908935546875, 1.4830322265625, 2.05712890625, 2.6312255859375, 3.205322265625, 3.7794189453125, 4.353515625, 4.9276123046875, 5.501708984375, 6.0758056640625, 6.64990234375, 7.2239990234375, 7.798095703125, 8.3721923828125, 8.9462890625, 9.5203857421875, 10.094482421875, 10.6685791015625, 11.24267578125, 11.8167724609375, 12.390869140625, 12.9649658203125, 13.5390625]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 5.0, 12.0, 18.0, 26.0, 48.0, 52.0, 120.0, 166.0, 250.0, 389.0, 705.0, 1297.0, 2091.0, 3753.0, 7717.0, 20928.0, 109099.0, 789731.0, 79444.0, 17472.0, 7041.0, 3454.0, 1843.0, 1088.0, 682.0, 416.0, 269.0, 166.0, 98.0, 66.0, 39.0, 21.0, 16.0, 9.0, 9.0, 3.0, 6.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-71.375, -69.3603515625, -67.345703125, -65.3310546875, -63.31640625, -61.3017578125, -59.287109375, -57.2724609375, -55.2578125, -53.2431640625, -51.228515625, -49.2138671875, -47.19921875, -45.1845703125, -43.169921875, -41.1552734375, -39.140625, -37.1259765625, -35.111328125, -33.0966796875, -31.08203125, -29.0673828125, -27.052734375, -25.0380859375, -23.0234375, -21.0087890625, -18.994140625, -16.9794921875, -14.96484375, -12.9501953125, -10.935546875, -8.9208984375, -6.90625, -4.8916015625, -2.876953125, -0.8623046875, 1.15234375, 3.1669921875, 5.181640625, 7.1962890625, 9.2109375, 11.2255859375, 13.240234375, 15.2548828125, 17.26953125, 19.2841796875, 21.298828125, 23.3134765625, 25.328125, 27.3427734375, 29.357421875, 31.3720703125, 33.38671875, 35.4013671875, 37.416015625, 39.4306640625, 41.4453125, 43.4599609375, 45.474609375, 47.4892578125, 49.50390625, 51.5185546875, 53.533203125, 55.5478515625, 57.5625]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 4.0, 6.0, 8.0, 7.0, 9.0, 11.0, 11.0, 16.0, 23.0, 23.0, 21.0, 25.0, 34.0, 38.0, 36.0, 43.0, 45.0, 43.0, 65.0, 88.0, 1866.0, 145.0, 72.0, 48.0, 53.0, 41.0, 38.0, 33.0, 29.0, 24.0, 23.0, 19.0, 14.0, 17.0, 9.0, 11.0, 15.0, 6.0, 7.0, 6.0, 1.0, 5.0, 6.0, 1.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-49.34375, -47.8779296875, -46.412109375, -44.9462890625, -43.48046875, -42.0146484375, -40.548828125, -39.0830078125, -37.6171875, -36.1513671875, -34.685546875, -33.2197265625, -31.75390625, -30.2880859375, -28.822265625, -27.3564453125, -25.890625, -24.4248046875, -22.958984375, -21.4931640625, -20.02734375, -18.5615234375, -17.095703125, -15.6298828125, -14.1640625, -12.6982421875, -11.232421875, -9.7666015625, -8.30078125, -6.8349609375, -5.369140625, -3.9033203125, -2.4375, -0.9716796875, 0.494140625, 1.9599609375, 3.42578125, 4.8916015625, 6.357421875, 7.8232421875, 9.2890625, 10.7548828125, 12.220703125, 13.6865234375, 15.15234375, 16.6181640625, 18.083984375, 19.5498046875, 21.015625, 22.4814453125, 23.947265625, 25.4130859375, 26.87890625, 28.3447265625, 29.810546875, 31.2763671875, 32.7421875, 34.2080078125, 35.673828125, 37.1396484375, 38.60546875, 40.0712890625, 41.537109375, 43.0029296875, 44.46875]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 3.0, 4.0, 6.0, 1.0, 4.0, 6.0, 6.0, 7.0, 16.0, 6.0, 10.0, 16.0, 16.0, 19.0, 23.0, 23.0, 40.0, 48.0, 59.0, 94.0, 206.0, 520.0, 3208.0, 3032694.0, 106368.0, 1388.0, 376.0, 157.0, 82.0, 57.0, 38.0, 34.0, 30.0, 25.0, 18.0, 19.0, 20.0, 8.0, 15.0, 7.0, 11.0, 8.0, 1.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-212.625, -205.728515625, -198.83203125, -191.935546875, -185.0390625, -178.142578125, -171.24609375, -164.349609375, -157.453125, -150.556640625, -143.66015625, -136.763671875, -129.8671875, -122.970703125, -116.07421875, -109.177734375, -102.28125, -95.384765625, -88.48828125, -81.591796875, -74.6953125, -67.798828125, -60.90234375, -54.005859375, -47.109375, -40.212890625, -33.31640625, -26.419921875, -19.5234375, -12.626953125, -5.73046875, 1.166015625, 8.0625, 14.958984375, 21.85546875, 28.751953125, 35.6484375, 42.544921875, 49.44140625, 56.337890625, 63.234375, 70.130859375, 77.02734375, 83.923828125, 90.8203125, 97.716796875, 104.61328125, 111.509765625, 118.40625, 125.302734375, 132.19921875, 139.095703125, 145.9921875, 152.888671875, 159.78515625, 166.681640625, 173.578125, 180.474609375, 187.37109375, 194.267578125, 201.1640625, 208.060546875, 214.95703125, 221.853515625, 228.75]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 67.0, 556.0, 364.0, 23.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-247.14572143554688, -237.601806640625, -228.05789184570312, -218.51397705078125, -208.97006225585938, -199.4261474609375, -189.88223266601562, -180.33831787109375, -170.79440307617188, -161.25048828125, -151.70657348632812, -142.16265869140625, -132.61874389648438, -123.0748291015625, -113.5309066772461, -103.98699188232422, -94.44306945800781, -84.89915466308594, -75.35523986816406, -65.81132507324219, -56.26740646362305, -46.72349166870117, -37.17957305908203, -27.635658264160156, -18.09174346923828, -8.54782772064209, 0.9960880279541016, 10.54000473022461, 20.083919525146484, 29.62783432006836, 39.1717529296875, 48.715667724609375, 58.25958251953125, 67.80349731445312, 77.347412109375, 86.89132690429688, 96.43524169921875, 105.97915649414062, 115.52307891845703, 125.0669937133789, 134.61090087890625, 144.15481567382812, 153.69873046875, 163.24264526367188, 172.78656005859375, 182.33047485351562, 191.8743896484375, 201.41830444335938, 210.9622344970703, 220.5061492919922, 230.05006408691406, 239.59397888183594, 249.1378936767578, 258.68182373046875, 268.2257385253906, 277.7696533203125, 287.3135681152344, 296.85748291015625, 306.4013977050781, 315.9453125, 325.4892272949219, 335.03314208984375, 344.5770568847656, 354.1209716796875, 363.6648864746094]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 5.0, 3.0, 5.0, 5.0, 6.0, 9.0, 8.0, 19.0, 13.0, 16.0, 21.0, 16.0, 18.0, 32.0, 36.0, 29.0, 32.0, 44.0, 46.0, 45.0, 34.0, 35.0, 33.0, 45.0, 51.0, 40.0, 36.0, 33.0, 42.0, 29.0, 33.0, 16.0, 24.0, 26.0, 21.0, 22.0, 19.0, 11.0, 8.0, 8.0, 7.0, 6.0, 5.0, 2.0, 5.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0], "bins": [-162.52908325195312, -157.9332733154297, -153.33746337890625, -148.74163818359375, -144.1458282470703, -139.55001831054688, -134.95420837402344, -130.3583984375, -125.7625732421875, -121.16676330566406, -116.5709457397461, -111.97513580322266, -107.37931823730469, -102.78350830078125, -98.18769836425781, -93.59188079833984, -88.9960708618164, -84.40026092529297, -79.804443359375, -75.20863342285156, -70.6128158569336, -66.01700592041016, -61.42119216918945, -56.82537841796875, -52.22956466674805, -47.633750915527344, -43.03793716430664, -38.44212341308594, -33.8463134765625, -29.250497817993164, -24.654685974121094, -20.05887222290039, -15.463058471679688, -10.867244720458984, -6.271431922912598, -1.675619125366211, 2.920194625854492, 7.516008377075195, 12.111820220947266, 16.70763397216797, 21.303447723388672, 25.899261474609375, 30.495075225830078, 35.09088897705078, 39.68669891357422, 44.28251647949219, 48.878326416015625, 53.47414016723633, 58.06995391845703, 62.665767669677734, 67.26158142089844, 71.85739135742188, 76.45320892333984, 81.04901885986328, 85.64483642578125, 90.24064636230469, 94.83645629882812, 99.43226623535156, 104.02808380126953, 108.62389373779297, 113.21971130371094, 117.81552124023438, 122.41133117675781, 127.00714874267578, 131.60296630859375]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 6.0, 4.0, 2.0, 6.0, 10.0, 10.0, 17.0, 23.0, 30.0, 34.0, 30.0, 33.0, 34.0, 54.0, 64.0, 68.0, 83.0, 67.0, 58.0, 66.0, 55.0, 35.0, 34.0, 33.0, 29.0, 17.0, 20.0, 21.0, 10.0, 19.0, 10.0, 4.0, 14.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-24.65625, -24.040283203125, -23.42431640625, -22.808349609375, -22.1923828125, -21.576416015625, -20.96044921875, -20.344482421875, -19.728515625, -19.112548828125, -18.49658203125, -17.880615234375, -17.2646484375, -16.648681640625, -16.03271484375, -15.416748046875, -14.80078125, -14.184814453125, -13.56884765625, -12.952880859375, -12.3369140625, -11.720947265625, -11.10498046875, -10.489013671875, -9.873046875, -9.257080078125, -8.64111328125, -8.025146484375, -7.4091796875, -6.793212890625, -6.17724609375, -5.561279296875, -4.9453125, -4.329345703125, -3.71337890625, -3.097412109375, -2.4814453125, -1.865478515625, -1.24951171875, -0.633544921875, -0.017578125, 0.598388671875, 1.21435546875, 1.830322265625, 2.4462890625, 3.062255859375, 3.67822265625, 4.294189453125, 4.91015625, 5.526123046875, 6.14208984375, 6.758056640625, 7.3740234375, 7.989990234375, 8.60595703125, 9.221923828125, 9.837890625, 10.453857421875, 11.06982421875, 11.685791015625, 12.3017578125, 12.917724609375, 13.53369140625, 14.149658203125, 14.765625]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 6.0, 1.0, 7.0, 4.0, 7.0, 6.0, 13.0, 24.0, 9.0, 29.0, 41.0, 57.0, 81.0, 104.0, 183.0, 246.0, 366.0, 570.0, 850.0, 1403.0, 2181.0, 3745.0, 6359.0, 11639.0, 22950.0, 53076.0, 655125.0, 3283281.0, 85628.0, 30613.0, 15263.0, 8198.0, 4792.0, 2820.0, 1695.0, 1097.0, 668.0, 430.0, 268.0, 185.0, 99.0, 67.0, 41.0, 25.0, 15.0, 4.0, 4.0, 5.0, 0.0, 3.0, 2.0], "bins": [-92.375, -90.076171875, -87.77734375, -85.478515625, -83.1796875, -80.880859375, -78.58203125, -76.283203125, -73.984375, -71.685546875, -69.38671875, -67.087890625, -64.7890625, -62.490234375, -60.19140625, -57.892578125, -55.59375, -53.294921875, -50.99609375, -48.697265625, -46.3984375, -44.099609375, -41.80078125, -39.501953125, -37.203125, -34.904296875, -32.60546875, -30.306640625, -28.0078125, -25.708984375, -23.41015625, -21.111328125, -18.8125, -16.513671875, -14.21484375, -11.916015625, -9.6171875, -7.318359375, -5.01953125, -2.720703125, -0.421875, 1.876953125, 4.17578125, 6.474609375, 8.7734375, 11.072265625, 13.37109375, 15.669921875, 17.96875, 20.267578125, 22.56640625, 24.865234375, 27.1640625, 29.462890625, 31.76171875, 34.060546875, 36.359375, 38.658203125, 40.95703125, 43.255859375, 45.5546875, 47.853515625, 50.15234375, 52.451171875, 54.75]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 1.0, 2.0, 4.0, 8.0, 11.0, 8.0, 18.0, 15.0, 10.0, 18.0, 14.0, 19.0, 22.0, 53.0, 44.0, 38.0, 59.0, 96.0, 224.0, 619.0, 1329.0, 747.0, 282.0, 107.0, 62.0, 44.0, 31.0, 25.0, 28.0, 24.0, 16.0, 16.0, 18.0, 22.0, 9.0, 4.0, 6.0, 2.0, 9.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-59.6875, -57.734375, -55.78125, -53.828125, -51.875, -49.921875, -47.96875, -46.015625, -44.0625, -42.109375, -40.15625, -38.203125, -36.25, -34.296875, -32.34375, -30.390625, -28.4375, -26.484375, -24.53125, -22.578125, -20.625, -18.671875, -16.71875, -14.765625, -12.8125, -10.859375, -8.90625, -6.953125, -5.0, -3.046875, -1.09375, 0.859375, 2.8125, 4.765625, 6.71875, 8.671875, 10.625, 12.578125, 14.53125, 16.484375, 18.4375, 20.390625, 22.34375, 24.296875, 26.25, 28.203125, 30.15625, 32.109375, 34.0625, 36.015625, 37.96875, 39.921875, 41.875, 43.828125, 45.78125, 47.734375, 49.6875, 51.640625, 53.59375, 55.546875, 57.5, 59.453125, 61.40625, 63.359375, 65.3125]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 4.0, 4.0, 3.0, 7.0, 13.0, 22.0, 33.0, 41.0, 61.0, 93.0, 140.0, 209.0, 242.0, 386.0, 585.0, 892.0, 1273.0, 1981.0, 2894.0, 4466.0, 6745.0, 10643.0, 16930.0, 29238.0, 52183.0, 120434.0, 1713136.0, 1976618.0, 124885.0, 52937.0, 29000.0, 17250.0, 10761.0, 6916.0, 4497.0, 2831.0, 1935.0, 1232.0, 832.0, 629.0, 412.0, 265.0, 190.0, 131.0, 93.0, 58.0, 54.0, 33.0, 26.0, 10.0, 10.0, 11.0, 6.0, 6.0, 2.0, 1.0, 1.0], "bins": [-85.0625, -82.5615234375, -80.060546875, -77.5595703125, -75.05859375, -72.5576171875, -70.056640625, -67.5556640625, -65.0546875, -62.5537109375, -60.052734375, -57.5517578125, -55.05078125, -52.5498046875, -50.048828125, -47.5478515625, -45.046875, -42.5458984375, -40.044921875, -37.5439453125, -35.04296875, -32.5419921875, -30.041015625, -27.5400390625, -25.0390625, -22.5380859375, -20.037109375, -17.5361328125, -15.03515625, -12.5341796875, -10.033203125, -7.5322265625, -5.03125, -2.5302734375, -0.029296875, 2.4716796875, 4.97265625, 7.4736328125, 9.974609375, 12.4755859375, 14.9765625, 17.4775390625, 19.978515625, 22.4794921875, 24.98046875, 27.4814453125, 29.982421875, 32.4833984375, 34.984375, 37.4853515625, 39.986328125, 42.4873046875, 44.98828125, 47.4892578125, 49.990234375, 52.4912109375, 54.9921875, 57.4931640625, 59.994140625, 62.4951171875, 64.99609375, 67.4970703125, 69.998046875, 72.4990234375, 75.0]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 7.0, 24.0, 60.0, 191.0, 534.0, 129.0, 46.0, 18.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1674.283935546875, -1642.9210205078125, -1611.55810546875, -1580.1951904296875, -1548.832275390625, -1517.469482421875, -1486.1065673828125, -1454.74365234375, -1423.3807373046875, -1392.017822265625, -1360.6549072265625, -1329.2919921875, -1297.92919921875, -1266.5662841796875, -1235.203369140625, -1203.8404541015625, -1172.4775390625, -1141.1146240234375, -1109.751708984375, -1078.3887939453125, -1047.02587890625, -1015.6630249023438, -984.3001708984375, -952.937255859375, -921.5743408203125, -890.21142578125, -858.8485107421875, -827.4856567382812, -796.1227416992188, -764.7598266601562, -733.39697265625, -702.0340576171875, -670.6712036132812, -639.3082885742188, -607.9454345703125, -576.58251953125, -545.2196044921875, -513.856689453125, -482.4938049316406, -451.13092041015625, -419.76800537109375, -388.40509033203125, -357.0422058105469, -325.6793212890625, -294.31640625, -262.9534912109375, -231.59060668945312, -200.2277069091797, -168.86480712890625, -137.5019073486328, -106.13900756835938, -74.77610778808594, -43.4132080078125, -12.050308227539062, 19.312591552734375, 50.67549133300781, 82.03839111328125, 113.40129089355469, 144.76419067382812, 176.12709045410156, 207.489990234375, 238.85289001464844, 270.2157897949219, 301.57867431640625, 332.94158935546875]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 3.0, 12.0, 5.0, 9.0, 10.0, 15.0, 9.0, 12.0, 19.0, 16.0, 26.0, 19.0, 30.0, 37.0, 31.0, 17.0, 27.0, 44.0, 30.0, 43.0, 34.0, 42.0, 39.0, 39.0, 35.0, 45.0, 35.0, 30.0, 41.0, 26.0, 22.0, 39.0, 31.0, 24.0, 16.0, 15.0, 17.0, 12.0, 10.0, 7.0, 6.0, 1.0, 5.0, 7.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-189.21368408203125, -183.88751220703125, -178.5613555908203, -173.2351837158203, -167.90902709960938, -162.58285522460938, -157.25669860839844, -151.93052673339844, -146.6043701171875, -141.2781982421875, -135.95204162597656, -130.62586975097656, -125.29971313476562, -119.97354125976562, -114.64737701416016, -109.32121276855469, -103.99504089355469, -98.66887664794922, -93.34271240234375, -88.01654815673828, -82.69038391113281, -77.36421203613281, -72.03804779052734, -66.71188354492188, -61.385719299316406, -56.05955505371094, -50.73339080810547, -45.407222747802734, -40.081058502197266, -34.7548942565918, -29.428728103637695, -24.102561950683594, -18.776397705078125, -13.45023250579834, -8.124067306518555, -2.7979021072387695, 2.5282630920410156, 7.854427337646484, 13.180593490600586, 18.506759643554688, 23.832923889160156, 29.159088134765625, 34.485252380371094, 39.81142044067383, 45.1375846862793, 50.463748931884766, 55.7899169921875, 61.11608123779297, 66.44224548339844, 71.7684097290039, 77.09457397460938, 82.42073822021484, 87.74690246582031, 93.07307434082031, 98.39923858642578, 103.72540283203125, 109.05156707763672, 114.37773132324219, 119.70389556884766, 125.03005981445312, 130.35623168945312, 135.68238830566406, 141.00856018066406, 146.334716796875, 151.660888671875]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 5.0, 5.0, 8.0, 7.0, 12.0, 10.0, 9.0, 21.0, 22.0, 29.0, 20.0, 32.0, 33.0, 38.0, 52.0, 47.0, 57.0, 51.0, 54.0, 47.0, 44.0, 57.0, 45.0, 38.0, 30.0, 34.0, 31.0, 26.0, 29.0, 17.0, 20.0, 12.0, 12.0, 15.0, 6.0, 6.0, 4.0, 7.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-20.234375, -19.6695556640625, -19.104736328125, -18.5399169921875, -17.97509765625, -17.4102783203125, -16.845458984375, -16.2806396484375, -15.7158203125, -15.1510009765625, -14.586181640625, -14.0213623046875, -13.45654296875, -12.8917236328125, -12.326904296875, -11.7620849609375, -11.197265625, -10.6324462890625, -10.067626953125, -9.5028076171875, -8.93798828125, -8.3731689453125, -7.808349609375, -7.2435302734375, -6.6787109375, -6.1138916015625, -5.549072265625, -4.9842529296875, -4.41943359375, -3.8546142578125, -3.289794921875, -2.7249755859375, -2.16015625, -1.5953369140625, -1.030517578125, -0.4656982421875, 0.09912109375, 0.6639404296875, 1.228759765625, 1.7935791015625, 2.3583984375, 2.9232177734375, 3.488037109375, 4.0528564453125, 4.61767578125, 5.1824951171875, 5.747314453125, 6.3121337890625, 6.876953125, 7.4417724609375, 8.006591796875, 8.5714111328125, 9.13623046875, 9.7010498046875, 10.265869140625, 10.8306884765625, 11.3955078125, 11.9603271484375, 12.525146484375, 13.0899658203125, 13.65478515625, 14.2196044921875, 14.784423828125, 15.3492431640625, 15.9140625]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 7.0, 13.0, 9.0, 16.0, 30.0, 40.0, 59.0, 77.0, 132.0, 178.0, 299.0, 452.0, 685.0, 1057.0, 1683.0, 2711.0, 4335.0, 7001.0, 11553.0, 19648.0, 34971.0, 67303.0, 151632.0, 331257.0, 215428.0, 92072.0, 44584.0, 24368.0, 14293.0, 8433.0, 5246.0, 3307.0, 2069.0, 1256.0, 798.0, 511.0, 322.0, 234.0, 161.0, 106.0, 57.0, 63.0, 29.0, 25.0, 13.0, 9.0, 8.0, 10.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.970703125, -0.9410171508789062, -0.9113311767578125, -0.8816452026367188, -0.851959228515625, -0.8222732543945312, -0.7925872802734375, -0.7629013061523438, -0.73321533203125, -0.7035293579101562, -0.6738433837890625, -0.6441574096679688, -0.614471435546875, -0.5847854614257812, -0.5550994873046875, -0.5254135131835938, -0.4957275390625, -0.46604156494140625, -0.4363555908203125, -0.40666961669921875, -0.376983642578125, -0.34729766845703125, -0.3176116943359375, -0.28792572021484375, -0.25823974609375, -0.22855377197265625, -0.1988677978515625, -0.16918182373046875, -0.139495849609375, -0.10980987548828125, -0.0801239013671875, -0.05043792724609375, -0.020751953125, 0.00893402099609375, 0.0386199951171875, 0.06830596923828125, 0.097991943359375, 0.12767791748046875, 0.1573638916015625, 0.18704986572265625, 0.21673583984375, 0.24642181396484375, 0.2761077880859375, 0.30579376220703125, 0.335479736328125, 0.36516571044921875, 0.3948516845703125, 0.42453765869140625, 0.4542236328125, 0.48390960693359375, 0.5135955810546875, 0.5432815551757812, 0.572967529296875, 0.6026535034179688, 0.6323394775390625, 0.6620254516601562, 0.69171142578125, 0.7213973999023438, 0.7510833740234375, 0.7807693481445312, 0.810455322265625, 0.8401412963867188, 0.8698272705078125, 0.8995132446289062, 0.92919921875]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 7.0, 9.0, 9.0, 16.0, 8.0, 22.0, 17.0, 26.0, 22.0, 26.0, 25.0, 39.0, 27.0, 47.0, 40.0, 57.0, 42.0, 47.0, 1073.0, 50.0, 44.0, 34.0, 31.0, 41.0, 38.0, 31.0, 38.0, 24.0, 23.0, 26.0, 14.0, 24.0, 13.0, 10.0, 10.0, 7.0, 7.0, 2.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.890625, -9.5299072265625, -9.169189453125, -8.8084716796875, -8.44775390625, -8.0870361328125, -7.726318359375, -7.3656005859375, -7.0048828125, -6.6441650390625, -6.283447265625, -5.9227294921875, -5.56201171875, -5.2012939453125, -4.840576171875, -4.4798583984375, -4.119140625, -3.7584228515625, -3.397705078125, -3.0369873046875, -2.67626953125, -2.3155517578125, -1.954833984375, -1.5941162109375, -1.2333984375, -0.8726806640625, -0.511962890625, -0.1512451171875, 0.20947265625, 0.5701904296875, 0.930908203125, 1.2916259765625, 1.65234375, 2.0130615234375, 2.373779296875, 2.7344970703125, 3.09521484375, 3.4559326171875, 3.816650390625, 4.1773681640625, 4.5380859375, 4.8988037109375, 5.259521484375, 5.6202392578125, 5.98095703125, 6.3416748046875, 6.702392578125, 7.0631103515625, 7.423828125, 7.7845458984375, 8.145263671875, 8.5059814453125, 8.86669921875, 9.2274169921875, 9.588134765625, 9.9488525390625, 10.3095703125, 10.6702880859375, 11.031005859375, 11.3917236328125, 11.75244140625, 12.1131591796875, 12.473876953125, 12.8345947265625, 13.1953125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 6.0, 7.0, 11.0, 6.0, 14.0, 23.0, 31.0, 58.0, 62.0, 102.0, 171.0, 275.0, 434.0, 703.0, 1053.0, 1740.0, 2788.0, 4264.0, 6452.0, 10065.0, 15544.0, 24556.0, 39759.0, 67017.0, 124043.0, 1283977.0, 240293.0, 111925.0, 61504.0, 36599.0, 22827.0, 14365.0, 9412.0, 6172.0, 3908.0, 2561.0, 1641.0, 1018.0, 636.0, 400.0, 250.0, 161.0, 103.0, 67.0, 38.0, 32.0, 14.0, 19.0, 9.0, 9.0, 6.0, 5.0, 2.0, 5.0, 0.0, 0.0, 1.0], "bins": [-0.75830078125, -0.7352676391601562, -0.7122344970703125, -0.6892013549804688, -0.666168212890625, -0.6431350708007812, -0.6201019287109375, -0.5970687866210938, -0.57403564453125, -0.5510025024414062, -0.5279693603515625, -0.5049362182617188, -0.481903076171875, -0.45886993408203125, -0.4358367919921875, -0.41280364990234375, -0.3897705078125, -0.36673736572265625, -0.3437042236328125, -0.32067108154296875, -0.297637939453125, -0.27460479736328125, -0.2515716552734375, -0.22853851318359375, -0.20550537109375, -0.18247222900390625, -0.1594390869140625, -0.13640594482421875, -0.113372802734375, -0.09033966064453125, -0.0673065185546875, -0.04427337646484375, -0.021240234375, 0.00179290771484375, 0.0248260498046875, 0.04785919189453125, 0.070892333984375, 0.09392547607421875, 0.1169586181640625, 0.13999176025390625, 0.16302490234375, 0.18605804443359375, 0.2090911865234375, 0.23212432861328125, 0.255157470703125, 0.27819061279296875, 0.3012237548828125, 0.32425689697265625, 0.3472900390625, 0.37032318115234375, 0.3933563232421875, 0.41638946533203125, 0.439422607421875, 0.46245574951171875, 0.4854888916015625, 0.5085220336914062, 0.53155517578125, 0.5545883178710938, 0.5776214599609375, 0.6006546020507812, 0.623687744140625, 0.6467208862304688, 0.6697540283203125, 0.6927871704101562, 0.7158203125]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 3.0, 1.0, 3.0, 4.0, 6.0, 9.0, 6.0, 6.0, 8.0, 18.0, 31.0, 22.0, 33.0, 30.0, 51.0, 49.0, 51.0, 38.0, 63.0, 60.0, 58.0, 49.0, 53.0, 38.0, 44.0, 53.0, 52.0, 27.0, 30.0, 29.0, 15.0, 10.0, 13.0, 12.0, 6.0, 9.0, 3.0, 4.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002773284912109375, -0.0026823580265045166, -0.002591431140899658, -0.0025005042552948, -0.0024095773696899414, -0.002318650484085083, -0.0022277235984802246, -0.002136796712875366, -0.002045869827270508, -0.0019549429416656494, -0.001864016056060791, -0.0017730891704559326, -0.0016821622848510742, -0.0015912353992462158, -0.0015003085136413574, -0.001409381628036499, -0.0013184547424316406, -0.0012275278568267822, -0.0011366009712219238, -0.0010456740856170654, -0.000954747200012207, -0.0008638203144073486, -0.0007728934288024902, -0.0006819665431976318, -0.0005910396575927734, -0.000500112771987915, -0.00040918588638305664, -0.00031825900077819824, -0.00022733211517333984, -0.00013640522956848145, -4.547834396362305e-05, 4.544854164123535e-05, 0.00013637542724609375, 0.00022730231285095215, 0.00031822919845581055, 0.00040915608406066895, 0.0005000829696655273, 0.0005910098552703857, 0.0006819367408752441, 0.0007728636264801025, 0.0008637905120849609, 0.0009547173976898193, 0.0010456442832946777, 0.0011365711688995361, 0.0012274980545043945, 0.001318424940109253, 0.0014093518257141113, 0.0015002787113189697, 0.0015912055969238281, 0.0016821324825286865, 0.001773059368133545, 0.0018639862537384033, 0.0019549131393432617, 0.00204584002494812, 0.0021367669105529785, 0.002227693796157837, 0.0023186206817626953, 0.0024095475673675537, 0.002500474452972412, 0.0025914013385772705, 0.002682328224182129, 0.0027732551097869873, 0.0028641819953918457, 0.002955108880996704, 0.0030460357666015625]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 1.0, 0.0, 3.0, 6.0, 4.0, 12.0, 20.0, 9.0, 30.0, 29.0, 26.0, 62.0, 85.0, 98.0, 158.0, 215.0, 330.0, 961.0, 23502.0, 1000249.0, 20712.0, 930.0, 355.0, 231.0, 145.0, 101.0, 76.0, 64.0, 27.0, 38.0, 34.0, 17.0, 8.0, 3.0, 6.0, 1.0, 13.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.0777587890625, -0.07573843002319336, -0.07371807098388672, -0.07169771194458008, -0.06967735290527344, -0.0676569938659668, -0.06563663482666016, -0.06361627578735352, -0.061595916748046875, -0.059575557708740234, -0.057555198669433594, -0.05553483963012695, -0.05351448059082031, -0.05149412155151367, -0.04947376251220703, -0.04745340347290039, -0.04543304443359375, -0.04341268539428711, -0.04139232635498047, -0.03937196731567383, -0.03735160827636719, -0.03533124923706055, -0.033310890197753906, -0.031290531158447266, -0.029270172119140625, -0.027249813079833984, -0.025229454040527344, -0.023209095001220703, -0.021188735961914062, -0.019168376922607422, -0.01714801788330078, -0.01512765884399414, -0.0131072998046875, -0.01108694076538086, -0.009066581726074219, -0.007046222686767578, -0.0050258636474609375, -0.003005504608154297, -0.0009851455688476562, 0.0010352134704589844, 0.003055572509765625, 0.005075931549072266, 0.007096290588378906, 0.009116649627685547, 0.011137008666992188, 0.013157367706298828, 0.015177726745605469, 0.01719808578491211, 0.01921844482421875, 0.02123880386352539, 0.02325916290283203, 0.025279521942138672, 0.027299880981445312, 0.029320240020751953, 0.031340599060058594, 0.033360958099365234, 0.035381317138671875, 0.037401676177978516, 0.039422035217285156, 0.0414423942565918, 0.04346275329589844, 0.04548311233520508, 0.04750347137451172, 0.04952383041381836, 0.051544189453125]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 8.0, 387.0, 592.0, 29.0, 1.0], "bins": [-0.04468172416090965, -0.04395001381635666, -0.043218307197093964, -0.04248659685254097, -0.041754886507987976, -0.04102317616343498, -0.04029146581888199, -0.03955975919961929, -0.0388280488550663, -0.038096338510513306, -0.03736463189125061, -0.03663292154669762, -0.03590121120214462, -0.03516950085759163, -0.034437790513038635, -0.03370608389377594, -0.032974373549222946, -0.03224266320466995, -0.03151095658540726, -0.030779246240854263, -0.03004753589630127, -0.029315825551748276, -0.02858411706984043, -0.027852408587932587, -0.027120698243379593, -0.0263889878988266, -0.025657279416918755, -0.02492557093501091, -0.024193860590457916, -0.023462150245904922, -0.022730441763997078, -0.021998733282089233, -0.02126702107489109, -0.020535312592983246, -0.019803602248430252, -0.01907189190387726, -0.018340183421969414, -0.01760847494006157, -0.016876764595508575, -0.01614505425095558, -0.015413345769047737, -0.014681636355817318, -0.013949926942586899, -0.01321821752935648, -0.01248650811612606, -0.011754798702895641, -0.011023089289665222, -0.010291379876434803, -0.009559670463204384, -0.008827961049973965, -0.008096251636743546, -0.007364542223513126, -0.006632832810282707, -0.005901123397052288, -0.005169413983821869, -0.00443770457059145, -0.0037059953901916742, -0.002974285976961255, -0.002242576563730836, -0.0015108671505004168, -0.0007791577372699976, -4.744832403957844e-05, 0.0006842610891908407, 0.0014159705024212599, 0.002147679915651679]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 9.0, 1.0, 4.0, 6.0, 10.0, 10.0, 18.0, 15.0, 16.0, 17.0, 23.0, 32.0, 37.0, 32.0, 34.0, 28.0, 34.0, 40.0, 53.0, 42.0, 28.0, 37.0, 48.0, 42.0, 30.0, 47.0, 44.0, 34.0, 36.0, 34.0, 20.0, 13.0, 18.0, 17.0, 12.0, 20.0, 14.0, 13.0, 13.0, 4.0, 4.0, 6.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0015085339546203613, -0.0014608250930905342, -0.001413116231560707, -0.00136540737003088, -0.0013176985085010529, -0.0012699896469712257, -0.0012222807854413986, -0.0011745719239115715, -0.0011268630623817444, -0.0010791542008519173, -0.0010314453393220901, -0.000983736477792263, -0.0009360276162624359, -0.0008883187547326088, -0.0008406098932027817, -0.0007929010316729546, -0.0007451921701431274, -0.0006974833086133003, -0.0006497744470834732, -0.0006020655855536461, -0.000554356724023819, -0.0005066478624939919, -0.00045893900096416473, -0.0004112301394343376, -0.0003635212779045105, -0.0003158124163746834, -0.00026810355484485626, -0.00022039469331502914, -0.00017268583178520203, -0.0001249769702553749, -7.726810872554779e-05, -2.9559247195720673e-05, 1.8149614334106445e-05, 6.585847586393356e-05, 0.00011356733739376068, 0.0001612761989235878, 0.00020898506045341492, 0.00025669392198324203, 0.00030440278351306915, 0.00035211164504289627, 0.0003998205065727234, 0.0004475293681025505, 0.0004952382296323776, 0.0005429470911622047, 0.0005906559526920319, 0.000638364814221859, 0.0006860736757516861, 0.0007337825372815132, 0.0007814913988113403, 0.0008292002603411674, 0.0008769091218709946, 0.0009246179834008217, 0.0009723268449306488, 0.001020035706460476, 0.001067744567990303, 0.0011154534295201302, 0.0011631622910499573, 0.0012108711525797844, 0.0012585800141096115, 0.0013062888756394386, 0.0013539977371692657, 0.0014017065986990929, 0.00144941546022892, 0.001497124321758747, 0.0015448331832885742]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 5.0, 5.0, 8.0, 7.0, 12.0, 10.0, 9.0, 21.0, 22.0, 29.0, 20.0, 32.0, 33.0, 38.0, 52.0, 47.0, 57.0, 51.0, 54.0, 47.0, 44.0, 57.0, 45.0, 38.0, 30.0, 34.0, 31.0, 26.0, 29.0, 17.0, 20.0, 12.0, 12.0, 15.0, 6.0, 6.0, 4.0, 7.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-20.234375, -19.6695556640625, -19.104736328125, -18.5399169921875, -17.97509765625, -17.4102783203125, -16.845458984375, -16.2806396484375, -15.7158203125, -15.1510009765625, -14.586181640625, -14.0213623046875, -13.45654296875, -12.8917236328125, -12.326904296875, -11.7620849609375, -11.197265625, -10.6324462890625, -10.067626953125, -9.5028076171875, -8.93798828125, -8.3731689453125, -7.808349609375, -7.2435302734375, -6.6787109375, -6.1138916015625, -5.549072265625, -4.9842529296875, -4.41943359375, -3.8546142578125, -3.289794921875, -2.7249755859375, -2.16015625, -1.5953369140625, -1.030517578125, -0.4656982421875, 0.09912109375, 0.6639404296875, 1.228759765625, 1.7935791015625, 2.3583984375, 2.9232177734375, 3.488037109375, 4.0528564453125, 4.61767578125, 5.1824951171875, 5.747314453125, 6.3121337890625, 6.876953125, 7.4417724609375, 8.006591796875, 8.5714111328125, 9.13623046875, 9.7010498046875, 10.265869140625, 10.8306884765625, 11.3955078125, 11.9603271484375, 12.525146484375, 13.0899658203125, 13.65478515625, 14.2196044921875, 14.784423828125, 15.3492431640625, 15.9140625]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 0.0, 3.0, 5.0, 6.0, 13.0, 11.0, 17.0, 24.0, 44.0, 47.0, 71.0, 119.0, 157.0, 228.0, 353.0, 523.0, 809.0, 1341.0, 2367.0, 4309.0, 9355.0, 25477.0, 101787.0, 661113.0, 178840.0, 36654.0, 12319.0, 5421.0, 2760.0, 1540.0, 978.0, 623.0, 411.0, 252.0, 193.0, 113.0, 79.0, 69.0, 39.0, 25.0, 18.0, 14.0, 9.0, 8.0, 8.0, 1.0, 3.0, 6.0, 2.0, 1.0, 0.0, 1.0], "bins": [-22.890625, -22.24853515625, -21.6064453125, -20.96435546875, -20.322265625, -19.68017578125, -19.0380859375, -18.39599609375, -17.75390625, -17.11181640625, -16.4697265625, -15.82763671875, -15.185546875, -14.54345703125, -13.9013671875, -13.25927734375, -12.6171875, -11.97509765625, -11.3330078125, -10.69091796875, -10.048828125, -9.40673828125, -8.7646484375, -8.12255859375, -7.48046875, -6.83837890625, -6.1962890625, -5.55419921875, -4.912109375, -4.27001953125, -3.6279296875, -2.98583984375, -2.34375, -1.70166015625, -1.0595703125, -0.41748046875, 0.224609375, 0.86669921875, 1.5087890625, 2.15087890625, 2.79296875, 3.43505859375, 4.0771484375, 4.71923828125, 5.361328125, 6.00341796875, 6.6455078125, 7.28759765625, 7.9296875, 8.57177734375, 9.2138671875, 9.85595703125, 10.498046875, 11.14013671875, 11.7822265625, 12.42431640625, 13.06640625, 13.70849609375, 14.3505859375, 14.99267578125, 15.634765625, 16.27685546875, 16.9189453125, 17.56103515625, 18.203125]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 3.0, 4.0, 2.0, 2.0, 3.0, 3.0, 13.0, 6.0, 6.0, 16.0, 10.0, 16.0, 19.0, 12.0, 15.0, 30.0, 43.0, 35.0, 28.0, 49.0, 48.0, 48.0, 37.0, 55.0, 1755.0, 254.0, 54.0, 51.0, 31.0, 47.0, 45.0, 34.0, 43.0, 37.0, 26.0, 26.0, 21.0, 22.0, 9.0, 17.0, 13.0, 17.0, 11.0, 12.0, 3.0, 4.0, 4.0, 6.0, 4.0, 4.0, 0.0, 1.0, 1.0, 2.0], "bins": [-61.1875, -59.43603515625, -57.6845703125, -55.93310546875, -54.181640625, -52.43017578125, -50.6787109375, -48.92724609375, -47.17578125, -45.42431640625, -43.6728515625, -41.92138671875, -40.169921875, -38.41845703125, -36.6669921875, -34.91552734375, -33.1640625, -31.41259765625, -29.6611328125, -27.90966796875, -26.158203125, -24.40673828125, -22.6552734375, -20.90380859375, -19.15234375, -17.40087890625, -15.6494140625, -13.89794921875, -12.146484375, -10.39501953125, -8.6435546875, -6.89208984375, -5.140625, -3.38916015625, -1.6376953125, 0.11376953125, 1.865234375, 3.61669921875, 5.3681640625, 7.11962890625, 8.87109375, 10.62255859375, 12.3740234375, 14.12548828125, 15.876953125, 17.62841796875, 19.3798828125, 21.13134765625, 22.8828125, 24.63427734375, 26.3857421875, 28.13720703125, 29.888671875, 31.64013671875, 33.3916015625, 35.14306640625, 36.89453125, 38.64599609375, 40.3974609375, 42.14892578125, 43.900390625, 45.65185546875, 47.4033203125, 49.15478515625, 50.90625]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 9.0, 6.0, 11.0, 15.0, 20.0, 30.0, 27.0, 38.0, 60.0, 91.0, 132.0, 199.0, 400.0, 945.0, 2811.0, 12094.0, 153460.0, 2949834.0, 18988.0, 4142.0, 1219.0, 475.0, 238.0, 149.0, 96.0, 53.0, 43.0, 29.0, 23.0, 20.0, 13.0, 12.0, 3.0, 2.0, 5.0, 5.0, 5.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-181.625, -176.3046875, -170.984375, -165.6640625, -160.34375, -155.0234375, -149.703125, -144.3828125, -139.0625, -133.7421875, -128.421875, -123.1015625, -117.78125, -112.4609375, -107.140625, -101.8203125, -96.5, -91.1796875, -85.859375, -80.5390625, -75.21875, -69.8984375, -64.578125, -59.2578125, -53.9375, -48.6171875, -43.296875, -37.9765625, -32.65625, -27.3359375, -22.015625, -16.6953125, -11.375, -6.0546875, -0.734375, 4.5859375, 9.90625, 15.2265625, 20.546875, 25.8671875, 31.1875, 36.5078125, 41.828125, 47.1484375, 52.46875, 57.7890625, 63.109375, 68.4296875, 73.75, 79.0703125, 84.390625, 89.7109375, 95.03125, 100.3515625, 105.671875, 110.9921875, 116.3125, 121.6328125, 126.953125, 132.2734375, 137.59375, 142.9140625, 148.234375, 153.5546875, 158.875]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [12.0, 187.0, 778.0, 40.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.22724151611328, -38.65522766113281, -8.083213806152344, 22.488800048828125, 53.060813903808594, 83.6328353881836, 114.20484161376953, 144.77685546875, 175.348876953125, 205.9208984375, 236.49290466308594, 267.0649108886719, 297.6369323730469, 328.2089538574219, 358.78094482421875, 389.35296630859375, 419.92498779296875, 450.49700927734375, 481.06903076171875, 511.6410217285156, 542.2130126953125, 572.7850341796875, 603.3570556640625, 633.9290771484375, 664.5010986328125, 695.0731201171875, 725.6451416015625, 756.2171630859375, 786.7891845703125, 817.3612060546875, 847.9331665039062, 878.5051879882812, 909.0771484375, 939.649169921875, 970.22119140625, 1000.793212890625, 1031.365234375, 1061.937255859375, 1092.50927734375, 1123.081298828125, 1153.6533203125, 1184.225341796875, 1214.79736328125, 1245.369384765625, 1275.94140625, 1306.513427734375, 1337.08544921875, 1367.657470703125, 1398.2293701171875, 1428.8013916015625, 1459.3734130859375, 1489.9454345703125, 1520.5174560546875, 1551.0894775390625, 1581.6614990234375, 1612.2333984375, 1642.805419921875, 1673.37744140625, 1703.949462890625, 1734.521484375, 1765.093505859375, 1795.66552734375, 1826.237548828125, 1856.8095703125, 1887.381591796875]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 6.0, 8.0, 10.0, 9.0, 11.0, 9.0, 18.0, 16.0, 20.0, 20.0, 25.0, 31.0, 26.0, 34.0, 32.0, 43.0, 24.0, 37.0, 33.0, 38.0, 29.0, 40.0, 35.0, 32.0, 29.0, 32.0, 37.0, 33.0, 32.0, 38.0, 34.0, 33.0, 24.0, 17.0, 16.0, 10.0, 16.0, 17.0, 4.0, 11.0, 10.0, 6.0, 4.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-176.732421875, -171.211669921875, -165.69091796875, -160.17015075683594, -154.64939880371094, -149.12864685058594, -143.60787963867188, -138.08712768554688, -132.56637573242188, -127.04562377929688, -121.52486419677734, -116.00410461425781, -110.48335266113281, -104.96260070800781, -99.44184112548828, -93.92108154296875, -88.40032958984375, -82.87957763671875, -77.35881805419922, -71.83805847167969, -66.31730651855469, -60.79655075073242, -55.275794982910156, -49.75503921508789, -44.234283447265625, -38.71352767944336, -33.192771911621094, -27.672016143798828, -22.151260375976562, -16.630504608154297, -11.109748840332031, -5.588993072509766, -0.0682373046875, 5.452518463134766, 10.973274230957031, 16.494029998779297, 22.014785766601562, 27.535541534423828, 33.056297302246094, 38.57705307006836, 44.097808837890625, 49.61856460571289, 55.139320373535156, 60.66007614135742, 66.18083190917969, 71.70158386230469, 77.22234344482422, 82.74310302734375, 88.26385498046875, 93.78460693359375, 99.30536651611328, 104.82612609863281, 110.34687805175781, 115.86763000488281, 121.38838958740234, 126.90914916992188, 132.42990112304688, 137.95065307617188, 143.47140502929688, 148.99217224121094, 154.51292419433594, 160.03367614746094, 165.554443359375, 171.0751953125, 176.595947265625]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 9.0, 6.0, 10.0, 8.0, 14.0, 13.0, 18.0, 18.0, 25.0, 31.0, 22.0, 38.0, 50.0, 46.0, 50.0, 57.0, 48.0, 52.0, 48.0, 60.0, 46.0, 46.0, 44.0, 34.0, 28.0, 23.0, 35.0, 30.0, 15.0, 17.0, 16.0, 7.0, 10.0, 5.0, 7.0, 5.0, 6.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.59375, -20.987548828125, -20.38134765625, -19.775146484375, -19.1689453125, -18.562744140625, -17.95654296875, -17.350341796875, -16.744140625, -16.137939453125, -15.53173828125, -14.925537109375, -14.3193359375, -13.713134765625, -13.10693359375, -12.500732421875, -11.89453125, -11.288330078125, -10.68212890625, -10.075927734375, -9.4697265625, -8.863525390625, -8.25732421875, -7.651123046875, -7.044921875, -6.438720703125, -5.83251953125, -5.226318359375, -4.6201171875, -4.013916015625, -3.40771484375, -2.801513671875, -2.1953125, -1.589111328125, -0.98291015625, -0.376708984375, 0.2294921875, 0.835693359375, 1.44189453125, 2.048095703125, 2.654296875, 3.260498046875, 3.86669921875, 4.472900390625, 5.0791015625, 5.685302734375, 6.29150390625, 6.897705078125, 7.50390625, 8.110107421875, 8.71630859375, 9.322509765625, 9.9287109375, 10.534912109375, 11.14111328125, 11.747314453125, 12.353515625, 12.959716796875, 13.56591796875, 14.172119140625, 14.7783203125, 15.384521484375, 15.99072265625, 16.596923828125, 17.203125]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 4.0, 10.0, 10.0, 9.0, 14.0, 21.0, 27.0, 41.0, 66.0, 97.0, 140.0, 234.0, 394.0, 754.0, 1295.0, 2561.0, 5169.0, 12360.0, 35462.0, 2517678.0, 1562068.0, 33889.0, 11639.0, 4972.0, 2476.0, 1187.0, 737.0, 362.0, 208.0, 148.0, 91.0, 47.0, 47.0, 24.0, 14.0, 8.0, 6.0, 3.0, 3.0, 8.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-118.0, -114.7197265625, -111.439453125, -108.1591796875, -104.87890625, -101.5986328125, -98.318359375, -95.0380859375, -91.7578125, -88.4775390625, -85.197265625, -81.9169921875, -78.63671875, -75.3564453125, -72.076171875, -68.7958984375, -65.515625, -62.2353515625, -58.955078125, -55.6748046875, -52.39453125, -49.1142578125, -45.833984375, -42.5537109375, -39.2734375, -35.9931640625, -32.712890625, -29.4326171875, -26.15234375, -22.8720703125, -19.591796875, -16.3115234375, -13.03125, -9.7509765625, -6.470703125, -3.1904296875, 0.08984375, 3.3701171875, 6.650390625, 9.9306640625, 13.2109375, 16.4912109375, 19.771484375, 23.0517578125, 26.33203125, 29.6123046875, 32.892578125, 36.1728515625, 39.453125, 42.7333984375, 46.013671875, 49.2939453125, 52.57421875, 55.8544921875, 59.134765625, 62.4150390625, 65.6953125, 68.9755859375, 72.255859375, 75.5361328125, 78.81640625, 82.0966796875, 85.376953125, 88.6572265625, 91.9375]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 5.0, 0.0, 4.0, 6.0, 9.0, 17.0, 10.0, 7.0, 13.0, 17.0, 21.0, 26.0, 26.0, 41.0, 67.0, 154.0, 417.0, 1333.0, 1170.0, 368.0, 108.0, 55.0, 38.0, 33.0, 28.0, 20.0, 16.0, 15.0, 10.0, 6.0, 7.0, 8.0, 6.0, 7.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-67.4375, -65.10546875, -62.7734375, -60.44140625, -58.109375, -55.77734375, -53.4453125, -51.11328125, -48.78125, -46.44921875, -44.1171875, -41.78515625, -39.453125, -37.12109375, -34.7890625, -32.45703125, -30.125, -27.79296875, -25.4609375, -23.12890625, -20.796875, -18.46484375, -16.1328125, -13.80078125, -11.46875, -9.13671875, -6.8046875, -4.47265625, -2.140625, 0.19140625, 2.5234375, 4.85546875, 7.1875, 9.51953125, 11.8515625, 14.18359375, 16.515625, 18.84765625, 21.1796875, 23.51171875, 25.84375, 28.17578125, 30.5078125, 32.83984375, 35.171875, 37.50390625, 39.8359375, 42.16796875, 44.5, 46.83203125, 49.1640625, 51.49609375, 53.828125, 56.16015625, 58.4921875, 60.82421875, 63.15625, 65.48828125, 67.8203125, 70.15234375, 72.484375, 74.81640625, 77.1484375, 79.48046875, 81.8125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 4.0, 3.0, 5.0, 8.0, 5.0, 13.0, 18.0, 29.0, 41.0, 60.0, 86.0, 112.0, 160.0, 238.0, 356.0, 435.0, 687.0, 1057.0, 1679.0, 2587.0, 3975.0, 6574.0, 11113.0, 19682.0, 39225.0, 108633.0, 2953856.0, 887357.0, 79907.0, 32965.0, 17355.0, 9819.0, 5957.0, 3603.0, 2207.0, 1480.0, 924.0, 622.0, 457.0, 294.0, 191.0, 136.0, 87.0, 79.0, 45.0, 42.0, 32.0, 27.0, 19.0, 11.0, 9.0, 9.0, 7.0, 3.0, 2.0, 4.0, 0.0, 2.0], "bins": [-95.1875, -92.29296875, -89.3984375, -86.50390625, -83.609375, -80.71484375, -77.8203125, -74.92578125, -72.03125, -69.13671875, -66.2421875, -63.34765625, -60.453125, -57.55859375, -54.6640625, -51.76953125, -48.875, -45.98046875, -43.0859375, -40.19140625, -37.296875, -34.40234375, -31.5078125, -28.61328125, -25.71875, -22.82421875, -19.9296875, -17.03515625, -14.140625, -11.24609375, -8.3515625, -5.45703125, -2.5625, 0.33203125, 3.2265625, 6.12109375, 9.015625, 11.91015625, 14.8046875, 17.69921875, 20.59375, 23.48828125, 26.3828125, 29.27734375, 32.171875, 35.06640625, 37.9609375, 40.85546875, 43.75, 46.64453125, 49.5390625, 52.43359375, 55.328125, 58.22265625, 61.1171875, 64.01171875, 66.90625, 69.80078125, 72.6953125, 75.58984375, 78.484375, 81.37890625, 84.2734375, 87.16796875, 90.0625]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 6.0, 10.0, 8.0, 20.0, 37.0, 71.0, 93.0, 244.0, 250.0, 106.0, 71.0, 36.0, 19.0, 9.0, 6.0, 8.0, 4.0, 3.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-276.7287902832031, -262.95281982421875, -249.17681884765625, -235.40084838867188, -221.62484741210938, -207.848876953125, -194.07289123535156, -180.29690551757812, -166.5209197998047, -152.74493408203125, -138.9689483642578, -125.1929702758789, -111.41698455810547, -97.64099884033203, -83.86502075195312, -70.08903503417969, -56.31304931640625, -42.53706359863281, -28.76108169555664, -14.985099792480469, -1.2091140747070312, 12.566871643066406, 26.342849731445312, 40.11883544921875, 53.89482116699219, 67.67080688476562, 81.44679260253906, 95.22277069091797, 108.9987564086914, 122.77474212646484, 136.55072021484375, 150.3267059326172, 164.10272216796875, 177.8787078857422, 191.65469360351562, 205.4306640625, 219.2066650390625, 232.98263549804688, 246.7586212158203, 260.53460693359375, 274.31060791015625, 288.0865783691406, 301.8625793457031, 315.6385498046875, 329.41455078125, 343.1905212402344, 356.96649169921875, 370.74249267578125, 384.5184631347656, 398.29443359375, 412.0704345703125, 425.8464050292969, 439.6224060058594, 453.39837646484375, 467.17437744140625, 480.9503479003906, 494.726318359375, 508.5022888183594, 522.2782592773438, 536.0542602539062, 549.8302612304688, 563.6062622070312, 577.3822021484375, 591.158203125, 604.9342041015625]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 2.0, 5.0, 4.0, 7.0, 10.0, 11.0, 9.0, 11.0, 13.0, 14.0, 21.0, 27.0, 40.0, 24.0, 28.0, 35.0, 33.0, 38.0, 38.0, 42.0, 42.0, 47.0, 46.0, 45.0, 46.0, 32.0, 43.0, 27.0, 34.0, 25.0, 24.0, 27.0, 26.0, 19.0, 24.0, 19.0, 11.0, 10.0, 19.0, 5.0, 3.0, 4.0, 9.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-181.99717712402344, -176.496826171875, -170.99647521972656, -165.49612426757812, -159.9957733154297, -154.49542236328125, -148.99505615234375, -143.49472045898438, -137.99435424804688, -132.49400329589844, -126.99365234375, -121.49330139160156, -115.99295043945312, -110.49259948730469, -104.99224090576172, -99.49188995361328, -93.99154663085938, -88.49119567871094, -82.9908447265625, -77.49049377441406, -71.99014282226562, -66.48979187011719, -60.98943328857422, -55.48908233642578, -49.988731384277344, -44.488380432128906, -38.98802947998047, -33.487674713134766, -27.987323760986328, -22.48697280883789, -16.986618041992188, -11.48626708984375, -5.985931396484375, -0.4855794906616211, 5.014772415161133, 10.515125274658203, 16.01547622680664, 21.515827178955078, 27.01618194580078, 32.51653289794922, 38.016883850097656, 43.517234802246094, 49.01758575439453, 54.517940521240234, 60.01829147338867, 65.51864624023438, 71.01899719238281, 76.51934814453125, 82.01969909667969, 87.52005004882812, 93.02040100097656, 98.520751953125, 104.02110290527344, 109.52145385742188, 115.02181243896484, 120.52216339111328, 126.02251434326172, 131.5228729248047, 137.02322387695312, 142.52357482910156, 148.02392578125, 153.52427673339844, 159.02462768554688, 164.5249786376953, 170.02532958984375]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 3.0, 5.0, 2.0, 11.0, 7.0, 12.0, 10.0, 16.0, 9.0, 18.0, 23.0, 31.0, 26.0, 39.0, 34.0, 38.0, 40.0, 50.0, 50.0, 41.0, 42.0, 54.0, 60.0, 47.0, 26.0, 43.0, 24.0, 35.0, 25.0, 25.0, 29.0, 24.0, 18.0, 12.0, 19.0, 8.0, 11.0, 8.0, 9.0, 1.0, 2.0, 4.0, 7.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-19.890625, -19.3154296875, -18.740234375, -18.1650390625, -17.58984375, -17.0146484375, -16.439453125, -15.8642578125, -15.2890625, -14.7138671875, -14.138671875, -13.5634765625, -12.98828125, -12.4130859375, -11.837890625, -11.2626953125, -10.6875, -10.1123046875, -9.537109375, -8.9619140625, -8.38671875, -7.8115234375, -7.236328125, -6.6611328125, -6.0859375, -5.5107421875, -4.935546875, -4.3603515625, -3.78515625, -3.2099609375, -2.634765625, -2.0595703125, -1.484375, -0.9091796875, -0.333984375, 0.2412109375, 0.81640625, 1.3916015625, 1.966796875, 2.5419921875, 3.1171875, 3.6923828125, 4.267578125, 4.8427734375, 5.41796875, 5.9931640625, 6.568359375, 7.1435546875, 7.71875, 8.2939453125, 8.869140625, 9.4443359375, 10.01953125, 10.5947265625, 11.169921875, 11.7451171875, 12.3203125, 12.8955078125, 13.470703125, 14.0458984375, 14.62109375, 15.1962890625, 15.771484375, 16.3466796875, 16.921875]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 3.0, 18.0, 22.0, 26.0, 54.0, 65.0, 91.0, 145.0, 232.0, 313.0, 495.0, 700.0, 1087.0, 1548.0, 2395.0, 3713.0, 5612.0, 9082.0, 14475.0, 23921.0, 41916.0, 77279.0, 161972.0, 301917.0, 193403.0, 89581.0, 47337.0, 26969.0, 16218.0, 9925.0, 6142.0, 3991.0, 2665.0, 1712.0, 1154.0, 787.0, 496.0, 344.0, 238.0, 150.0, 121.0, 80.0, 47.0, 42.0, 28.0, 11.0, 12.0, 9.0, 4.0, 3.0, 5.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.92919921875, -0.9007034301757812, -0.8722076416015625, -0.8437118530273438, -0.815216064453125, -0.7867202758789062, -0.7582244873046875, -0.7297286987304688, -0.70123291015625, -0.6727371215820312, -0.6442413330078125, -0.6157455444335938, -0.587249755859375, -0.5587539672851562, -0.5302581787109375, -0.5017623901367188, -0.4732666015625, -0.44477081298828125, -0.4162750244140625, -0.38777923583984375, -0.359283447265625, -0.33078765869140625, -0.3022918701171875, -0.27379608154296875, -0.24530029296875, -0.21680450439453125, -0.1883087158203125, -0.15981292724609375, -0.131317138671875, -0.10282135009765625, -0.0743255615234375, -0.04582977294921875, -0.017333984375, 0.01116180419921875, 0.0396575927734375, 0.06815338134765625, 0.096649169921875, 0.12514495849609375, 0.1536407470703125, 0.18213653564453125, 0.21063232421875, 0.23912811279296875, 0.2676239013671875, 0.29611968994140625, 0.324615478515625, 0.35311126708984375, 0.3816070556640625, 0.41010284423828125, 0.4385986328125, 0.46709442138671875, 0.4955902099609375, 0.5240859985351562, 0.552581787109375, 0.5810775756835938, 0.6095733642578125, 0.6380691528320312, 0.66656494140625, 0.6950607299804688, 0.7235565185546875, 0.7520523071289062, 0.780548095703125, 0.8090438842773438, 0.8375396728515625, 0.8660354614257812, 0.89453125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 2.0, 4.0, 7.0, 4.0, 7.0, 6.0, 11.0, 13.0, 18.0, 16.0, 26.0, 17.0, 23.0, 24.0, 50.0, 28.0, 31.0, 34.0, 35.0, 29.0, 33.0, 39.0, 1071.0, 36.0, 40.0, 41.0, 34.0, 33.0, 36.0, 32.0, 38.0, 27.0, 29.0, 23.0, 23.0, 21.0, 15.0, 14.0, 9.0, 4.0, 10.0, 12.0, 4.0, 7.0, 6.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-10.2578125, -9.933837890625, -9.60986328125, -9.285888671875, -8.9619140625, -8.637939453125, -8.31396484375, -7.989990234375, -7.666015625, -7.342041015625, -7.01806640625, -6.694091796875, -6.3701171875, -6.046142578125, -5.72216796875, -5.398193359375, -5.07421875, -4.750244140625, -4.42626953125, -4.102294921875, -3.7783203125, -3.454345703125, -3.13037109375, -2.806396484375, -2.482421875, -2.158447265625, -1.83447265625, -1.510498046875, -1.1865234375, -0.862548828125, -0.53857421875, -0.214599609375, 0.109375, 0.433349609375, 0.75732421875, 1.081298828125, 1.4052734375, 1.729248046875, 2.05322265625, 2.377197265625, 2.701171875, 3.025146484375, 3.34912109375, 3.673095703125, 3.9970703125, 4.321044921875, 4.64501953125, 4.968994140625, 5.29296875, 5.616943359375, 5.94091796875, 6.264892578125, 6.5888671875, 6.912841796875, 7.23681640625, 7.560791015625, 7.884765625, 8.208740234375, 8.53271484375, 8.856689453125, 9.1806640625, 9.504638671875, 9.82861328125, 10.152587890625, 10.4765625]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [5.0, 3.0, 6.0, 9.0, 15.0, 10.0, 24.0, 19.0, 44.0, 67.0, 104.0, 158.0, 171.0, 271.0, 342.0, 485.0, 726.0, 948.0, 1389.0, 1833.0, 2563.0, 3682.0, 5106.0, 6997.0, 10235.0, 14593.0, 21067.0, 31115.0, 46949.0, 72699.0, 119143.0, 1206601.0, 228935.0, 111091.0, 68378.0, 44141.0, 29724.0, 20043.0, 13853.0, 9694.0, 6826.0, 4797.0, 3459.0, 2500.0, 1776.0, 1278.0, 902.0, 730.0, 469.0, 353.0, 248.0, 160.0, 124.0, 81.0, 76.0, 40.0, 33.0, 25.0, 15.0, 9.0, 4.0, 6.0, 1.0, 2.0], "bins": [-0.5966796875, -0.5779953002929688, -0.5593109130859375, -0.5406265258789062, -0.521942138671875, -0.5032577514648438, -0.4845733642578125, -0.46588897705078125, -0.44720458984375, -0.42852020263671875, -0.4098358154296875, -0.39115142822265625, -0.372467041015625, -0.35378265380859375, -0.3350982666015625, -0.31641387939453125, -0.2977294921875, -0.27904510498046875, -0.2603607177734375, -0.24167633056640625, -0.222991943359375, -0.20430755615234375, -0.1856231689453125, -0.16693878173828125, -0.14825439453125, -0.12957000732421875, -0.1108856201171875, -0.09220123291015625, -0.073516845703125, -0.05483245849609375, -0.0361480712890625, -0.01746368408203125, 0.001220703125, 0.01990509033203125, 0.0385894775390625, 0.05727386474609375, 0.075958251953125, 0.09464263916015625, 0.1133270263671875, 0.13201141357421875, 0.15069580078125, 0.16938018798828125, 0.1880645751953125, 0.20674896240234375, 0.225433349609375, 0.24411773681640625, 0.2628021240234375, 0.28148651123046875, 0.3001708984375, 0.31885528564453125, 0.3375396728515625, 0.35622406005859375, 0.374908447265625, 0.39359283447265625, 0.4122772216796875, 0.43096160888671875, 0.44964599609375, 0.46833038330078125, 0.4870147705078125, 0.5056991577148438, 0.524383544921875, 0.5430679321289062, 0.5617523193359375, 0.5804367065429688, 0.59912109375]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 4.0, 4.0, 5.0, 8.0, 10.0, 7.0, 14.0, 19.0, 15.0, 17.0, 28.0, 25.0, 34.0, 37.0, 43.0, 52.0, 59.0, 51.0, 44.0, 62.0, 51.0, 58.0, 48.0, 44.0, 42.0, 44.0, 33.0, 23.0, 22.0, 20.0, 13.0, 13.0, 12.0, 6.0, 16.0, 5.0, 6.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0024890899658203125, -0.0024011433124542236, -0.0023131966590881348, -0.002225250005722046, -0.002137303352355957, -0.002049356698989868, -0.0019614100456237793, -0.0018734633922576904, -0.0017855167388916016, -0.0016975700855255127, -0.0016096234321594238, -0.001521676778793335, -0.001433730125427246, -0.0013457834720611572, -0.0012578368186950684, -0.0011698901653289795, -0.0010819435119628906, -0.0009939968585968018, -0.0009060502052307129, -0.000818103551864624, -0.0007301568984985352, -0.0006422102451324463, -0.0005542635917663574, -0.00046631693840026855, -0.0003783702850341797, -0.0002904236316680908, -0.00020247697830200195, -0.00011453032493591309, -2.658367156982422e-05, 6.136298179626465e-05, 0.00014930963516235352, 0.00023725628852844238, 0.00032520294189453125, 0.0004131495952606201, 0.000501096248626709, 0.0005890429019927979, 0.0006769895553588867, 0.0007649362087249756, 0.0008528828620910645, 0.0009408295154571533, 0.0010287761688232422, 0.001116722822189331, 0.00120466947555542, 0.0012926161289215088, 0.0013805627822875977, 0.0014685094356536865, 0.0015564560890197754, 0.0016444027423858643, 0.0017323493957519531, 0.001820296049118042, 0.0019082427024841309, 0.0019961893558502197, 0.0020841360092163086, 0.0021720826625823975, 0.0022600293159484863, 0.002347975969314575, 0.002435922622680664, 0.002523869276046753, 0.002611815929412842, 0.0026997625827789307, 0.0027877092361450195, 0.0028756558895111084, 0.0029636025428771973, 0.003051549196243286, 0.003139495849609375]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 3.0, 3.0, 4.0, 3.0, 10.0, 10.0, 21.0, 23.0, 18.0, 35.0, 40.0, 64.0, 86.0, 76.0, 117.0, 156.0, 218.0, 376.0, 1117.0, 12674.0, 534965.0, 484375.0, 11746.0, 1118.0, 353.0, 229.0, 182.0, 121.0, 96.0, 76.0, 42.0, 54.0, 31.0, 16.0, 16.0, 24.0, 18.0, 13.0, 11.0, 3.0, 4.0, 8.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.052032470703125, -0.050586700439453125, -0.04914093017578125, -0.047695159912109375, -0.0462493896484375, -0.044803619384765625, -0.04335784912109375, -0.041912078857421875, -0.04046630859375, -0.039020538330078125, -0.03757476806640625, -0.036128997802734375, -0.0346832275390625, -0.033237457275390625, -0.03179168701171875, -0.030345916748046875, -0.028900146484375, -0.027454376220703125, -0.02600860595703125, -0.024562835693359375, -0.0231170654296875, -0.021671295166015625, -0.02022552490234375, -0.018779754638671875, -0.017333984375, -0.015888214111328125, -0.01444244384765625, -0.012996673583984375, -0.0115509033203125, -0.010105133056640625, -0.00865936279296875, -0.007213592529296875, -0.005767822265625, -0.004322052001953125, -0.00287628173828125, -0.001430511474609375, 1.52587890625e-05, 0.001461029052734375, 0.00290679931640625, 0.004352569580078125, 0.00579833984375, 0.007244110107421875, 0.00868988037109375, 0.010135650634765625, 0.0115814208984375, 0.013027191162109375, 0.01447296142578125, 0.015918731689453125, 0.017364501953125, 0.018810272216796875, 0.02025604248046875, 0.021701812744140625, 0.0231475830078125, 0.024593353271484375, 0.02603912353515625, 0.027484893798828125, 0.0289306640625, 0.030376434326171875, 0.03182220458984375, 0.033267974853515625, 0.0347137451171875, 0.036159515380859375, 0.03760528564453125, 0.039051055908203125, 0.040496826171875]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 13.0, 41.0, 157.0, 527.0, 204.0, 54.0, 16.0, 4.0, 1.0], "bins": [-0.020976660773158073, -0.020618431270122528, -0.020260199904441833, -0.019901970401406288, -0.019543740898370743, -0.019185509532690048, -0.018827280029654503, -0.018469050526618958, -0.018110821023583412, -0.017752591520547867, -0.017394360154867172, -0.017036130651831627, -0.01667790114879608, -0.016319669783115387, -0.01596144028007984, -0.015603210777044296, -0.015244979411363602, -0.014886748977005482, -0.014528519473969936, -0.014170289039611816, -0.013812059536576271, -0.013453829102218151, -0.013095598667860031, -0.012737369164824486, -0.01237913966178894, -0.01202090922743082, -0.011662679724395275, -0.011304449290037155, -0.01094621978700161, -0.01058798935264349, -0.01022975891828537, -0.009871529415249825, -0.009513298980891705, -0.009155068546533585, -0.00879683904349804, -0.00843860860913992, -0.008080379106104374, -0.007722148671746254, -0.007363918703049421, -0.007005688734352589, -0.006647458299994469, -0.006289228331297636, -0.005930998362600803, -0.005572767928242683, -0.005214537959545851, -0.004856307990849018, -0.0044980780221521854, -0.004139848053455353, -0.003781617619097233, -0.0034233876504004, -0.003065157448872924, -0.002706927480176091, -0.002348697278648615, -0.0019904673099517822, -0.0016322373412549496, -0.0012740071397274733, -0.0009157772874459624, -0.0005575472023338079, -0.00019931717542931437, 0.0001589128514751792, 0.0005171429365873337, 0.0008753730216994882, 0.0012336029903963208, 0.0015918331919237971, 0.0019500631606206298]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 5.0, 1.0, 9.0, 8.0, 5.0, 4.0, 12.0, 8.0, 17.0, 23.0, 20.0, 19.0, 19.0, 27.0, 17.0, 28.0, 34.0, 36.0, 37.0, 30.0, 38.0, 36.0, 44.0, 38.0, 40.0, 45.0, 34.0, 32.0, 38.0, 33.0, 34.0, 22.0, 26.0, 23.0, 18.0, 18.0, 23.0, 21.0, 18.0, 13.0, 10.0, 7.0, 5.0, 9.0, 6.0, 9.0, 0.0, 3.0, 6.0, 4.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.0015026330947875977, -0.0014580637216567993, -0.001413494348526001, -0.0013689249753952026, -0.0013243556022644043, -0.001279786229133606, -0.0012352168560028076, -0.0011906474828720093, -0.001146078109741211, -0.0011015087366104126, -0.0010569393634796143, -0.001012369990348816, -0.0009678006172180176, -0.0009232312440872192, -0.0008786618709564209, -0.0008340924978256226, -0.0007895231246948242, -0.0007449537515640259, -0.0007003843784332275, -0.0006558150053024292, -0.0006112456321716309, -0.0005666762590408325, -0.0005221068859100342, -0.00047753751277923584, -0.0004329681396484375, -0.00038839876651763916, -0.0003438293933868408, -0.0002992600202560425, -0.00025469064712524414, -0.0002101212739944458, -0.00016555190086364746, -0.00012098252773284912, -7.641315460205078e-05, -3.184378147125244e-05, 1.2725591659545898e-05, 5.729496479034424e-05, 0.00010186433792114258, 0.00014643371105194092, 0.00019100308418273926, 0.0002355724573135376, 0.00028014183044433594, 0.0003247112035751343, 0.0003692805767059326, 0.00041384994983673096, 0.0004584193229675293, 0.0005029886960983276, 0.000547558069229126, 0.0005921274423599243, 0.0006366968154907227, 0.000681266188621521, 0.0007258355617523193, 0.0007704049348831177, 0.000814974308013916, 0.0008595436811447144, 0.0009041130542755127, 0.000948682427406311, 0.0009932518005371094, 0.0010378211736679077, 0.001082390546798706, 0.0011269599199295044, 0.0011715292930603027, 0.001216098666191101, 0.0012606680393218994, 0.0013052374124526978, 0.001349806785583496]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 3.0, 5.0, 2.0, 11.0, 7.0, 12.0, 10.0, 16.0, 9.0, 18.0, 23.0, 31.0, 26.0, 39.0, 34.0, 38.0, 40.0, 50.0, 50.0, 41.0, 42.0, 54.0, 60.0, 47.0, 26.0, 43.0, 24.0, 35.0, 25.0, 25.0, 29.0, 24.0, 18.0, 12.0, 19.0, 8.0, 11.0, 8.0, 9.0, 1.0, 2.0, 4.0, 7.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-19.890625, -19.3154296875, -18.740234375, -18.1650390625, -17.58984375, -17.0146484375, -16.439453125, -15.8642578125, -15.2890625, -14.7138671875, -14.138671875, -13.5634765625, -12.98828125, -12.4130859375, -11.837890625, -11.2626953125, -10.6875, -10.1123046875, -9.537109375, -8.9619140625, -8.38671875, -7.8115234375, -7.236328125, -6.6611328125, -6.0859375, -5.5107421875, -4.935546875, -4.3603515625, -3.78515625, -3.2099609375, -2.634765625, -2.0595703125, -1.484375, -0.9091796875, -0.333984375, 0.2412109375, 0.81640625, 1.3916015625, 1.966796875, 2.5419921875, 3.1171875, 3.6923828125, 4.267578125, 4.8427734375, 5.41796875, 5.9931640625, 6.568359375, 7.1435546875, 7.71875, 8.2939453125, 8.869140625, 9.4443359375, 10.01953125, 10.5947265625, 11.169921875, 11.7451171875, 12.3203125, 12.8955078125, 13.470703125, 14.0458984375, 14.62109375, 15.1962890625, 15.771484375, 16.3466796875, 16.921875]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 7.0, 6.0, 11.0, 16.0, 21.0, 27.0, 37.0, 48.0, 69.0, 101.0, 162.0, 183.0, 258.0, 399.0, 601.0, 922.0, 1533.0, 2549.0, 4570.0, 8604.0, 17594.0, 40294.0, 107310.0, 447846.0, 275244.0, 77736.0, 31252.0, 14269.0, 7135.0, 3743.0, 2134.0, 1311.0, 804.0, 530.0, 349.0, 235.0, 176.0, 133.0, 91.0, 66.0, 48.0, 31.0, 25.0, 32.0, 14.0, 9.0, 9.0, 3.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.9453125, -9.633056640625, -9.32080078125, -9.008544921875, -8.6962890625, -8.384033203125, -8.07177734375, -7.759521484375, -7.447265625, -7.135009765625, -6.82275390625, -6.510498046875, -6.1982421875, -5.885986328125, -5.57373046875, -5.261474609375, -4.94921875, -4.636962890625, -4.32470703125, -4.012451171875, -3.7001953125, -3.387939453125, -3.07568359375, -2.763427734375, -2.451171875, -2.138916015625, -1.82666015625, -1.514404296875, -1.2021484375, -0.889892578125, -0.57763671875, -0.265380859375, 0.046875, 0.359130859375, 0.67138671875, 0.983642578125, 1.2958984375, 1.608154296875, 1.92041015625, 2.232666015625, 2.544921875, 2.857177734375, 3.16943359375, 3.481689453125, 3.7939453125, 4.106201171875, 4.41845703125, 4.730712890625, 5.04296875, 5.355224609375, 5.66748046875, 5.979736328125, 6.2919921875, 6.604248046875, 6.91650390625, 7.228759765625, 7.541015625, 7.853271484375, 8.16552734375, 8.477783203125, 8.7900390625, 9.102294921875, 9.41455078125, 9.726806640625, 10.0390625]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 9.0, 3.0, 2.0, 4.0, 9.0, 5.0, 11.0, 15.0, 14.0, 14.0, 21.0, 25.0, 16.0, 25.0, 27.0, 38.0, 33.0, 46.0, 40.0, 53.0, 53.0, 61.0, 154.0, 1867.0, 64.0, 44.0, 45.0, 39.0, 37.0, 36.0, 37.0, 39.0, 28.0, 20.0, 23.0, 16.0, 14.0, 16.0, 8.0, 9.0, 4.0, 8.0, 5.0, 3.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-60.03125, -58.103515625, -56.17578125, -54.248046875, -52.3203125, -50.392578125, -48.46484375, -46.537109375, -44.609375, -42.681640625, -40.75390625, -38.826171875, -36.8984375, -34.970703125, -33.04296875, -31.115234375, -29.1875, -27.259765625, -25.33203125, -23.404296875, -21.4765625, -19.548828125, -17.62109375, -15.693359375, -13.765625, -11.837890625, -9.91015625, -7.982421875, -6.0546875, -4.126953125, -2.19921875, -0.271484375, 1.65625, 3.583984375, 5.51171875, 7.439453125, 9.3671875, 11.294921875, 13.22265625, 15.150390625, 17.078125, 19.005859375, 20.93359375, 22.861328125, 24.7890625, 26.716796875, 28.64453125, 30.572265625, 32.5, 34.427734375, 36.35546875, 38.283203125, 40.2109375, 42.138671875, 44.06640625, 45.994140625, 47.921875, 49.849609375, 51.77734375, 53.705078125, 55.6328125, 57.560546875, 59.48828125, 61.416015625, 63.34375]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 5.0, 9.0, 4.0, 15.0, 21.0, 29.0, 57.0, 92.0, 167.0, 409.0, 1114.0, 3520.0, 12675.0, 3043126.0, 73038.0, 7821.0, 2182.0, 784.0, 283.0, 125.0, 83.0, 32.0, 29.0, 21.0, 14.0, 9.0, 13.0, 11.0, 6.0, 4.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-167.375, -161.56640625, -155.7578125, -149.94921875, -144.140625, -138.33203125, -132.5234375, -126.71484375, -120.90625, -115.09765625, -109.2890625, -103.48046875, -97.671875, -91.86328125, -86.0546875, -80.24609375, -74.4375, -68.62890625, -62.8203125, -57.01171875, -51.203125, -45.39453125, -39.5859375, -33.77734375, -27.96875, -22.16015625, -16.3515625, -10.54296875, -4.734375, 1.07421875, 6.8828125, 12.69140625, 18.5, 24.30859375, 30.1171875, 35.92578125, 41.734375, 47.54296875, 53.3515625, 59.16015625, 64.96875, 70.77734375, 76.5859375, 82.39453125, 88.203125, 94.01171875, 99.8203125, 105.62890625, 111.4375, 117.24609375, 123.0546875, 128.86328125, 134.671875, 140.48046875, 146.2890625, 152.09765625, 157.90625, 163.71484375, 169.5234375, 175.33203125, 181.140625, 186.94921875, 192.7578125, 198.56640625, 204.375]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 16.0, 970.0, 34.0], "bins": [-3499.896240234375, -3443.91357421875, -3387.930908203125, -3331.9482421875, -3275.965576171875, -3219.98291015625, -3164.00048828125, -3108.017578125, -3052.03515625, -2996.052490234375, -2940.06982421875, -2884.087158203125, -2828.1044921875, -2772.121826171875, -2716.13916015625, -2660.15673828125, -2604.173828125, -2548.191162109375, -2492.20849609375, -2436.225830078125, -2380.2431640625, -2324.260498046875, -2268.27783203125, -2212.29541015625, -2156.312744140625, -2100.330078125, -2044.347412109375, -1988.36474609375, -1932.3822021484375, -1876.3995361328125, -1820.4168701171875, -1764.4342041015625, -1708.4515380859375, -1652.4688720703125, -1596.4862060546875, -1540.503662109375, -1484.52099609375, -1428.538330078125, -1372.5556640625, -1316.572998046875, -1260.59033203125, -1204.607666015625, -1148.625, -1092.642333984375, -1036.6597900390625, -980.6771240234375, -924.6944580078125, -868.7117919921875, -812.7291870117188, -756.7465209960938, -700.763916015625, -644.78125, -588.798583984375, -532.81591796875, -476.83331298828125, -420.85064697265625, -364.8680419921875, -308.8854064941406, -252.90274047851562, -196.92010498046875, -140.9374542236328, -84.95480346679688, -28.97216796875, 27.010498046875, 82.9931411743164]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 4.0, 6.0, 3.0, 9.0, 11.0, 11.0, 10.0, 19.0, 15.0, 15.0, 19.0, 20.0, 17.0, 26.0, 34.0, 32.0, 35.0, 45.0, 41.0, 42.0, 48.0, 41.0, 35.0, 40.0, 37.0, 44.0, 37.0, 28.0, 22.0, 32.0, 26.0, 34.0, 21.0, 31.0, 15.0, 27.0, 13.0, 14.0, 11.0, 4.0, 7.0, 4.0, 11.0, 2.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-220.40110778808594, -213.7253875732422, -207.04966735839844, -200.3739471435547, -193.69822692871094, -187.0225067138672, -180.34677124023438, -173.67105102539062, -166.99533081054688, -160.31961059570312, -153.64389038085938, -146.96817016601562, -140.29244995117188, -133.61672973632812, -126.94100189208984, -120.2652816772461, -113.58956909179688, -106.91384887695312, -100.23812866210938, -93.56240844726562, -86.88668823242188, -80.21096801757812, -73.53524017333984, -66.8595199584961, -60.183799743652344, -53.508079528808594, -46.832359313964844, -40.15663528442383, -33.48091506958008, -26.805194854736328, -20.129470825195312, -13.453750610351562, -6.778045654296875, -0.1023244857788086, 6.573396682739258, 13.24911880493164, 19.92483901977539, 26.60055923461914, 33.276283264160156, 39.952003479003906, 46.627723693847656, 53.303443908691406, 59.979164123535156, 66.65489196777344, 73.33061218261719, 80.00633239746094, 86.68205261230469, 93.35777282714844, 100.03349304199219, 106.70921325683594, 113.38493347167969, 120.06065368652344, 126.73637390136719, 133.41209411621094, 140.08782958984375, 146.7635498046875, 153.43927001953125, 160.114990234375, 166.79071044921875, 173.4664306640625, 180.14215087890625, 186.81787109375, 193.49359130859375, 200.1693115234375, 206.84503173828125]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 1.0, 2.0, 5.0, 3.0, 2.0, 7.0, 4.0, 8.0, 8.0, 11.0, 16.0, 13.0, 10.0, 16.0, 28.0, 29.0, 27.0, 40.0, 41.0, 39.0, 40.0, 38.0, 51.0, 52.0, 46.0, 53.0, 47.0, 42.0, 39.0, 37.0, 28.0, 33.0, 29.0, 16.0, 29.0, 32.0, 13.0, 10.0, 9.0, 12.0, 13.0, 6.0, 9.0, 5.0, 1.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0], "bins": [-21.3125, -20.725341796875, -20.13818359375, -19.551025390625, -18.9638671875, -18.376708984375, -17.78955078125, -17.202392578125, -16.615234375, -16.028076171875, -15.44091796875, -14.853759765625, -14.2666015625, -13.679443359375, -13.09228515625, -12.505126953125, -11.91796875, -11.330810546875, -10.74365234375, -10.156494140625, -9.5693359375, -8.982177734375, -8.39501953125, -7.807861328125, -7.220703125, -6.633544921875, -6.04638671875, -5.459228515625, -4.8720703125, -4.284912109375, -3.69775390625, -3.110595703125, -2.5234375, -1.936279296875, -1.34912109375, -0.761962890625, -0.1748046875, 0.412353515625, 0.99951171875, 1.586669921875, 2.173828125, 2.760986328125, 3.34814453125, 3.935302734375, 4.5224609375, 5.109619140625, 5.69677734375, 6.283935546875, 6.87109375, 7.458251953125, 8.04541015625, 8.632568359375, 9.2197265625, 9.806884765625, 10.39404296875, 10.981201171875, 11.568359375, 12.155517578125, 12.74267578125, 13.329833984375, 13.9169921875, 14.504150390625, 15.09130859375, 15.678466796875, 16.265625]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 4.0, 5.0, 11.0, 17.0, 12.0, 22.0, 19.0, 47.0, 55.0, 69.0, 103.0, 135.0, 174.0, 277.0, 375.0, 542.0, 779.0, 1071.0, 1654.0, 2557.0, 3871.0, 6406.0, 11118.0, 21404.0, 87938.0, 3270350.0, 705252.0, 39485.0, 16059.0, 8844.0, 5352.0, 3339.0, 2152.0, 1477.0, 964.0, 682.0, 521.0, 343.0, 231.0, 166.0, 113.0, 92.0, 66.0, 41.0, 24.0, 21.0, 19.0, 15.0, 6.0, 5.0, 3.0, 2.0, 4.0], "bins": [-71.8125, -69.861328125, -67.91015625, -65.958984375, -64.0078125, -62.056640625, -60.10546875, -58.154296875, -56.203125, -54.251953125, -52.30078125, -50.349609375, -48.3984375, -46.447265625, -44.49609375, -42.544921875, -40.59375, -38.642578125, -36.69140625, -34.740234375, -32.7890625, -30.837890625, -28.88671875, -26.935546875, -24.984375, -23.033203125, -21.08203125, -19.130859375, -17.1796875, -15.228515625, -13.27734375, -11.326171875, -9.375, -7.423828125, -5.47265625, -3.521484375, -1.5703125, 0.380859375, 2.33203125, 4.283203125, 6.234375, 8.185546875, 10.13671875, 12.087890625, 14.0390625, 15.990234375, 17.94140625, 19.892578125, 21.84375, 23.794921875, 25.74609375, 27.697265625, 29.6484375, 31.599609375, 33.55078125, 35.501953125, 37.453125, 39.404296875, 41.35546875, 43.306640625, 45.2578125, 47.208984375, 49.16015625, 51.111328125, 53.0625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 8.0, 6.0, 8.0, 10.0, 18.0, 18.0, 34.0, 26.0, 44.0, 62.0, 148.0, 546.0, 1935.0, 802.0, 162.0, 67.0, 50.0, 23.0, 21.0, 16.0, 12.0, 12.0, 16.0, 9.0, 10.0, 8.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.6875, -72.73046875, -69.7734375, -66.81640625, -63.859375, -60.90234375, -57.9453125, -54.98828125, -52.03125, -49.07421875, -46.1171875, -43.16015625, -40.203125, -37.24609375, -34.2890625, -31.33203125, -28.375, -25.41796875, -22.4609375, -19.50390625, -16.546875, -13.58984375, -10.6328125, -7.67578125, -4.71875, -1.76171875, 1.1953125, 4.15234375, 7.109375, 10.06640625, 13.0234375, 15.98046875, 18.9375, 21.89453125, 24.8515625, 27.80859375, 30.765625, 33.72265625, 36.6796875, 39.63671875, 42.59375, 45.55078125, 48.5078125, 51.46484375, 54.421875, 57.37890625, 60.3359375, 63.29296875, 66.25, 69.20703125, 72.1640625, 75.12109375, 78.078125, 81.03515625, 83.9921875, 86.94921875, 89.90625, 92.86328125, 95.8203125, 98.77734375, 101.734375, 104.69140625, 107.6484375, 110.60546875, 113.5625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 1.0, 0.0, 4.0, 4.0, 8.0, 10.0, 16.0, 32.0, 39.0, 55.0, 96.0, 171.0, 296.0, 697.0, 1630.0, 4104.0, 11374.0, 32198.0, 150688.0, 3838907.0, 110372.0, 27130.0, 9814.0, 3790.0, 1535.0, 613.0, 304.0, 144.0, 89.0, 44.0, 37.0, 29.0, 17.0, 17.0, 8.0, 10.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-208.0, -202.587890625, -197.17578125, -191.763671875, -186.3515625, -180.939453125, -175.52734375, -170.115234375, -164.703125, -159.291015625, -153.87890625, -148.466796875, -143.0546875, -137.642578125, -132.23046875, -126.818359375, -121.40625, -115.994140625, -110.58203125, -105.169921875, -99.7578125, -94.345703125, -88.93359375, -83.521484375, -78.109375, -72.697265625, -67.28515625, -61.873046875, -56.4609375, -51.048828125, -45.63671875, -40.224609375, -34.8125, -29.400390625, -23.98828125, -18.576171875, -13.1640625, -7.751953125, -2.33984375, 3.072265625, 8.484375, 13.896484375, 19.30859375, 24.720703125, 30.1328125, 35.544921875, 40.95703125, 46.369140625, 51.78125, 57.193359375, 62.60546875, 68.017578125, 73.4296875, 78.841796875, 84.25390625, 89.666015625, 95.078125, 100.490234375, 105.90234375, 111.314453125, 116.7265625, 122.138671875, 127.55078125, 132.962890625, 138.375]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 1.0, 12.0, 4.0, 12.0, 11.0, 21.0, 35.0, 54.0, 70.0, 151.0, 242.0, 150.0, 78.0, 42.0, 38.0, 22.0, 20.0, 12.0, 11.0, 5.0, 0.0, 6.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-408.8102722167969, -398.4637756347656, -388.1172790527344, -377.77081298828125, -367.42431640625, -357.07781982421875, -346.7313232421875, -336.38482666015625, -326.0383605957031, -315.6918640136719, -305.3453674316406, -294.9989013671875, -284.65240478515625, -274.305908203125, -263.95941162109375, -253.61293029785156, -243.2664337158203, -232.91993713378906, -222.57345581054688, -212.22695922851562, -201.88047790527344, -191.5339813232422, -181.1875, -170.84100341796875, -160.4945068359375, -150.14801025390625, -139.80152893066406, -129.4550323486328, -119.10855102539062, -108.76205444335938, -98.41556549072266, -88.06907653808594, -77.72257995605469, -67.37609100341797, -57.02960205078125, -46.683109283447266, -36.33662033081055, -25.990131378173828, -15.643638610839844, -5.297149658203125, 5.049339294433594, 15.395829200744629, 25.742319107055664, 36.088809967041016, 46.435298919677734, 56.78178787231445, 67.12828063964844, 77.47476959228516, 87.82125854492188, 98.1677474975586, 108.51423645019531, 118.86073303222656, 129.20721435546875, 139.5537109375, 149.90020751953125, 160.24668884277344, 170.59317016601562, 180.93966674804688, 191.28614807128906, 201.6326446533203, 211.9791259765625, 222.32562255859375, 232.672119140625, 243.0186004638672, 253.36509704589844]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 3.0, 7.0, 4.0, 4.0, 7.0, 9.0, 11.0, 10.0, 14.0, 11.0, 24.0, 11.0, 22.0, 23.0, 31.0, 33.0, 40.0, 36.0, 40.0, 52.0, 45.0, 31.0, 37.0, 43.0, 37.0, 44.0, 45.0, 42.0, 35.0, 38.0, 38.0, 24.0, 25.0, 19.0, 13.0, 17.0, 16.0, 11.0, 15.0, 9.0, 8.0, 7.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-174.0596923828125, -168.74830627441406, -163.43692016601562, -158.12551879882812, -152.8141326904297, -147.50274658203125, -142.1913604736328, -136.87997436523438, -131.56857299804688, -126.25718688964844, -120.94579315185547, -115.63440704345703, -110.32301330566406, -105.01162719726562, -99.70024108886719, -94.38885498046875, -89.07746887207031, -83.76608276367188, -78.4546890258789, -73.14330291748047, -67.8319091796875, -62.52052307128906, -57.209136962890625, -51.89774703979492, -46.58635711669922, -41.274967193603516, -35.96357727050781, -30.652191162109375, -25.340801239013672, -20.02941131591797, -14.718023300170898, -9.406635284423828, -4.095245361328125, 1.2161436080932617, 6.527532577514648, 11.838921546936035, 17.150310516357422, 22.461700439453125, 27.773088455200195, 33.084476470947266, 38.39586639404297, 43.70725631713867, 49.018646240234375, 54.33003234863281, 59.641422271728516, 64.95281219482422, 70.26419830322266, 75.57559204101562, 80.88697814941406, 86.1983642578125, 91.50975799560547, 96.8211441040039, 102.13253784179688, 107.44392395019531, 112.75531005859375, 118.06669616699219, 123.37808990478516, 128.68948364257812, 134.00086975097656, 139.312255859375, 144.62364196777344, 149.93502807617188, 155.24642944335938, 160.5578155517578, 165.86920166015625]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 5.0, 4.0, 6.0, 5.0, 4.0, 20.0, 11.0, 15.0, 13.0, 16.0, 28.0, 31.0, 28.0, 24.0, 42.0, 35.0, 50.0, 44.0, 48.0, 58.0, 53.0, 48.0, 37.0, 46.0, 45.0, 43.0, 40.0, 27.0, 35.0, 31.0, 18.0, 15.0, 17.0, 6.0, 9.0, 7.0, 12.0, 9.0, 7.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.75, -20.103271484375, -19.45654296875, -18.809814453125, -18.1630859375, -17.516357421875, -16.86962890625, -16.222900390625, -15.576171875, -14.929443359375, -14.28271484375, -13.635986328125, -12.9892578125, -12.342529296875, -11.69580078125, -11.049072265625, -10.40234375, -9.755615234375, -9.10888671875, -8.462158203125, -7.8154296875, -7.168701171875, -6.52197265625, -5.875244140625, -5.228515625, -4.581787109375, -3.93505859375, -3.288330078125, -2.6416015625, -1.994873046875, -1.34814453125, -0.701416015625, -0.0546875, 0.592041015625, 1.23876953125, 1.885498046875, 2.5322265625, 3.178955078125, 3.82568359375, 4.472412109375, 5.119140625, 5.765869140625, 6.41259765625, 7.059326171875, 7.7060546875, 8.352783203125, 8.99951171875, 9.646240234375, 10.29296875, 10.939697265625, 11.58642578125, 12.233154296875, 12.8798828125, 13.526611328125, 14.17333984375, 14.820068359375, 15.466796875, 16.113525390625, 16.76025390625, 17.406982421875, 18.0537109375, 18.700439453125, 19.34716796875, 19.993896484375, 20.640625]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 10.0, 5.0, 7.0, 11.0, 13.0, 22.0, 26.0, 39.0, 61.0, 99.0, 124.0, 186.0, 242.0, 345.0, 551.0, 745.0, 1152.0, 1713.0, 2464.0, 3959.0, 6021.0, 9312.0, 15027.0, 24916.0, 42390.0, 76121.0, 148355.0, 274903.0, 202377.0, 100710.0, 54149.0, 31111.0, 18653.0, 11557.0, 7334.0, 4617.0, 3011.0, 1968.0, 1375.0, 883.0, 590.0, 425.0, 305.0, 197.0, 152.0, 100.0, 76.0, 47.0, 30.0, 26.0, 17.0, 7.0, 13.0, 3.0, 8.0, 3.0, 3.0, 2.0, 2.0, 1.0], "bins": [-0.90234375, -0.8738937377929688, -0.8454437255859375, -0.8169937133789062, -0.788543701171875, -0.7600936889648438, -0.7316436767578125, -0.7031936645507812, -0.67474365234375, -0.6462936401367188, -0.6178436279296875, -0.5893936157226562, -0.560943603515625, -0.5324935913085938, -0.5040435791015625, -0.47559356689453125, -0.4471435546875, -0.41869354248046875, -0.3902435302734375, -0.36179351806640625, -0.333343505859375, -0.30489349365234375, -0.2764434814453125, -0.24799346923828125, -0.21954345703125, -0.19109344482421875, -0.1626434326171875, -0.13419342041015625, -0.105743408203125, -0.07729339599609375, -0.0488433837890625, -0.02039337158203125, 0.008056640625, 0.03650665283203125, 0.0649566650390625, 0.09340667724609375, 0.121856689453125, 0.15030670166015625, 0.1787567138671875, 0.20720672607421875, 0.23565673828125, 0.26410675048828125, 0.2925567626953125, 0.32100677490234375, 0.349456787109375, 0.37790679931640625, 0.4063568115234375, 0.43480682373046875, 0.4632568359375, 0.49170684814453125, 0.5201568603515625, 0.5486068725585938, 0.577056884765625, 0.6055068969726562, 0.6339569091796875, 0.6624069213867188, 0.69085693359375, 0.7193069458007812, 0.7477569580078125, 0.7762069702148438, 0.804656982421875, 0.8331069946289062, 0.8615570068359375, 0.8900070190429688, 0.91845703125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 0.0, 2.0, 9.0, 8.0, 8.0, 12.0, 9.0, 10.0, 15.0, 18.0, 22.0, 12.0, 31.0, 34.0, 25.0, 32.0, 43.0, 35.0, 35.0, 48.0, 41.0, 33.0, 1070.0, 45.0, 38.0, 51.0, 27.0, 31.0, 31.0, 33.0, 38.0, 27.0, 20.0, 18.0, 17.0, 17.0, 9.0, 6.0, 13.0, 16.0, 7.0, 8.0, 8.0, 2.0, 7.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.359375, -10.9884033203125, -10.617431640625, -10.2464599609375, -9.87548828125, -9.5045166015625, -9.133544921875, -8.7625732421875, -8.3916015625, -8.0206298828125, -7.649658203125, -7.2786865234375, -6.90771484375, -6.5367431640625, -6.165771484375, -5.7947998046875, -5.423828125, -5.0528564453125, -4.681884765625, -4.3109130859375, -3.93994140625, -3.5689697265625, -3.197998046875, -2.8270263671875, -2.4560546875, -2.0850830078125, -1.714111328125, -1.3431396484375, -0.97216796875, -0.6011962890625, -0.230224609375, 0.1407470703125, 0.51171875, 0.8826904296875, 1.253662109375, 1.6246337890625, 1.99560546875, 2.3665771484375, 2.737548828125, 3.1085205078125, 3.4794921875, 3.8504638671875, 4.221435546875, 4.5924072265625, 4.96337890625, 5.3343505859375, 5.705322265625, 6.0762939453125, 6.447265625, 6.8182373046875, 7.189208984375, 7.5601806640625, 7.93115234375, 8.3021240234375, 8.673095703125, 9.0440673828125, 9.4150390625, 9.7860107421875, 10.156982421875, 10.5279541015625, 10.89892578125, 11.2698974609375, 11.640869140625, 12.0118408203125, 12.3828125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 4.0, 14.0, 17.0, 34.0, 37.0, 68.0, 87.0, 139.0, 185.0, 275.0, 406.0, 565.0, 848.0, 1138.0, 1657.0, 2343.0, 3197.0, 4458.0, 6348.0, 8870.0, 13132.0, 19308.0, 28858.0, 44294.0, 70852.0, 124277.0, 1259095.0, 207284.0, 109669.0, 63999.0, 40627.0, 26593.0, 17697.0, 12115.0, 8347.0, 5917.0, 4148.0, 3016.0, 2084.0, 1572.0, 1100.0, 736.0, 548.0, 365.0, 274.0, 180.0, 122.0, 69.0, 68.0, 33.0, 22.0, 16.0, 7.0, 12.0, 3.0, 6.0, 1.0, 1.0], "bins": [-0.73486328125, -0.7125244140625, -0.690185546875, -0.6678466796875, -0.6455078125, -0.6231689453125, -0.600830078125, -0.5784912109375, -0.55615234375, -0.5338134765625, -0.511474609375, -0.4891357421875, -0.466796875, -0.4444580078125, -0.422119140625, -0.3997802734375, -0.37744140625, -0.3551025390625, -0.332763671875, -0.3104248046875, -0.2880859375, -0.2657470703125, -0.243408203125, -0.2210693359375, -0.19873046875, -0.1763916015625, -0.154052734375, -0.1317138671875, -0.109375, -0.0870361328125, -0.064697265625, -0.0423583984375, -0.02001953125, 0.0023193359375, 0.024658203125, 0.0469970703125, 0.0693359375, 0.0916748046875, 0.114013671875, 0.1363525390625, 0.15869140625, 0.1810302734375, 0.203369140625, 0.2257080078125, 0.248046875, 0.2703857421875, 0.292724609375, 0.3150634765625, 0.33740234375, 0.3597412109375, 0.382080078125, 0.4044189453125, 0.4267578125, 0.4490966796875, 0.471435546875, 0.4937744140625, 0.51611328125, 0.5384521484375, 0.560791015625, 0.5831298828125, 0.60546875, 0.6278076171875, 0.650146484375, 0.6724853515625, 0.69482421875]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 5.0, 4.0, 7.0, 7.0, 7.0, 8.0, 11.0, 19.0, 15.0, 21.0, 30.0, 32.0, 34.0, 34.0, 40.0, 56.0, 60.0, 52.0, 62.0, 55.0, 51.0, 53.0, 50.0, 47.0, 46.0, 40.0, 31.0, 25.0, 17.0, 21.0, 13.0, 12.0, 10.0, 4.0, 5.0, 6.0, 9.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003070831298828125, -0.0029622912406921387, -0.0028537511825561523, -0.002745211124420166, -0.0026366710662841797, -0.0025281310081481934, -0.002419590950012207, -0.0023110508918762207, -0.0022025108337402344, -0.002093970775604248, -0.0019854307174682617, -0.0018768906593322754, -0.001768350601196289, -0.0016598105430603027, -0.0015512704849243164, -0.00144273042678833, -0.0013341903686523438, -0.0012256503105163574, -0.001117110252380371, -0.0010085701942443848, -0.0009000301361083984, -0.0007914900779724121, -0.0006829500198364258, -0.0005744099617004395, -0.0004658699035644531, -0.0003573298454284668, -0.00024878978729248047, -0.00014024972915649414, -3.170967102050781e-05, 7.683038711547852e-05, 0.00018537044525146484, 0.00029391050338745117, 0.0004024505615234375, 0.0005109906196594238, 0.0006195306777954102, 0.0007280707359313965, 0.0008366107940673828, 0.0009451508522033691, 0.0010536909103393555, 0.0011622309684753418, 0.0012707710266113281, 0.0013793110847473145, 0.0014878511428833008, 0.0015963912010192871, 0.0017049312591552734, 0.0018134713172912598, 0.001922011375427246, 0.0020305514335632324, 0.0021390914916992188, 0.002247631549835205, 0.0023561716079711914, 0.0024647116661071777, 0.002573251724243164, 0.0026817917823791504, 0.0027903318405151367, 0.002898871898651123, 0.0030074119567871094, 0.0031159520149230957, 0.003224492073059082, 0.0033330321311950684, 0.0034415721893310547, 0.003550112247467041, 0.0036586523056030273, 0.0037671923637390137, 0.003875732421875]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 3.0, 3.0, 5.0, 13.0, 10.0, 16.0, 19.0, 14.0, 20.0, 35.0, 39.0, 53.0, 71.0, 86.0, 92.0, 150.0, 234.0, 380.0, 967.0, 9066.0, 298852.0, 716523.0, 19168.0, 1356.0, 395.0, 239.0, 177.0, 120.0, 88.0, 89.0, 63.0, 43.0, 40.0, 27.0, 21.0, 17.0, 10.0, 10.0, 11.0, 9.0, 7.0, 6.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.053741455078125, -0.05216646194458008, -0.050591468811035156, -0.049016475677490234, -0.04744148254394531, -0.04586648941040039, -0.04429149627685547, -0.04271650314331055, -0.041141510009765625, -0.0395665168762207, -0.03799152374267578, -0.03641653060913086, -0.03484153747558594, -0.033266544342041016, -0.031691551208496094, -0.030116558074951172, -0.02854156494140625, -0.026966571807861328, -0.025391578674316406, -0.023816585540771484, -0.022241592407226562, -0.02066659927368164, -0.01909160614013672, -0.017516613006591797, -0.015941619873046875, -0.014366626739501953, -0.012791633605957031, -0.01121664047241211, -0.009641647338867188, -0.008066654205322266, -0.006491661071777344, -0.004916667938232422, -0.0033416748046875, -0.0017666816711425781, -0.00019168853759765625, 0.0013833045959472656, 0.0029582977294921875, 0.004533290863037109, 0.006108283996582031, 0.007683277130126953, 0.009258270263671875, 0.010833263397216797, 0.012408256530761719, 0.01398324966430664, 0.015558242797851562, 0.017133235931396484, 0.018708229064941406, 0.020283222198486328, 0.02185821533203125, 0.023433208465576172, 0.025008201599121094, 0.026583194732666016, 0.028158187866210938, 0.02973318099975586, 0.03130817413330078, 0.0328831672668457, 0.034458160400390625, 0.03603315353393555, 0.03760814666748047, 0.03918313980102539, 0.04075813293457031, 0.042333126068115234, 0.043908119201660156, 0.04548311233520508, 0.04705810546875]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 7.0, 43.0, 445.0, 437.0, 70.0, 9.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.026122938841581345, -0.025485867634415627, -0.02484879456460476, -0.02421172335743904, -0.023574650287628174, -0.022937579080462456, -0.022300507873296738, -0.02166343480348587, -0.021026363596320152, -0.020389292389154434, -0.019752219319343567, -0.01911514811217785, -0.01847807504236698, -0.017841003835201263, -0.017203930765390396, -0.016566859558224678, -0.01592978835105896, -0.015292716212570667, -0.014655644074082375, -0.014018572866916656, -0.013381500728428364, -0.012744428589940071, -0.012107356451451778, -0.011470284312963486, -0.010833211243152618, -0.010196139104664326, -0.009559066966176033, -0.008921995759010315, -0.008284923620522022, -0.0076478514820337296, -0.007010779343545437, -0.0063737076707184315, -0.0057366350665688515, -0.005099562928080559, -0.004462491255253553, -0.0038254191167652607, -0.0031883472111076117, -0.0025512753054499626, -0.00191420316696167, -0.0012771314941346645, -0.0006400593556463718, -2.9873917810618877e-06, 0.0006340845720842481, 0.001271156594157219, 0.001908228499814868, 0.002545300405472517, 0.0031823725439608097, 0.003819444216787815, 0.004456516355276108, 0.0050935884937644005, 0.005730660166591406, 0.0063677323050796986, 0.007004803977906704, 0.007641876116394997, 0.00827894825488329, 0.008916020393371582, 0.0095530916005373, 0.010190163739025593, 0.010827235877513885, 0.011464307084679604, 0.012101379223167896, 0.012738451361656189, 0.013375523500144482, 0.014012595638632774, 0.014649667777121067]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 6.0, 5.0, 6.0, 3.0, 14.0, 11.0, 9.0, 13.0, 19.0, 22.0, 18.0, 18.0, 22.0, 21.0, 33.0, 30.0, 39.0, 47.0, 45.0, 43.0, 37.0, 42.0, 42.0, 33.0, 45.0, 50.0, 40.0, 43.0, 35.0, 37.0, 24.0, 26.0, 18.0, 24.0, 26.0, 15.0, 13.0, 10.0, 4.0, 7.0, 5.0, 7.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0024372339248657227, -0.002367524430155754, -0.0022978149354457855, -0.002228105440735817, -0.0021583959460258484, -0.00208868645131588, -0.0020189769566059113, -0.0019492674618959427, -0.0018795579671859741, -0.0018098484724760056, -0.001740138977766037, -0.0016704294830560684, -0.0016007199883460999, -0.0015310104936361313, -0.0014613009989261627, -0.0013915915042161942, -0.0013218820095062256, -0.001252172514796257, -0.0011824630200862885, -0.0011127535253763199, -0.0010430440306663513, -0.0009733345359563828, -0.0009036250412464142, -0.0008339155465364456, -0.000764206051826477, -0.0006944965571165085, -0.0006247870624065399, -0.0005550775676965714, -0.0004853680729866028, -0.0004156585782766342, -0.00034594908356666565, -0.0002762395888566971, -0.00020653009414672852, -0.00013682059943675995, -6.711110472679138e-05, 2.598389983177185e-06, 7.230788469314575e-05, 0.00014201737940311432, 0.00021172687411308289, 0.00028143636882305145, 0.00035114586353302, 0.0004208553582429886, 0.0004905648529529572, 0.0005602743476629257, 0.0006299838423728943, 0.0006996933370828629, 0.0007694028317928314, 0.0008391123265028, 0.0009088218212127686, 0.0009785313159227371, 0.0010482408106327057, 0.0011179503053426743, 0.0011876598000526428, 0.0012573692947626114, 0.00132707878947258, 0.0013967882841825485, 0.001466497778892517, 0.0015362072736024857, 0.0016059167683124542, 0.0016756262630224228, 0.0017453357577323914, 0.00181504525244236, 0.0018847547471523285, 0.001954464241862297, 0.0020241737365722656]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 5.0, 4.0, 6.0, 5.0, 4.0, 20.0, 11.0, 15.0, 13.0, 16.0, 28.0, 31.0, 28.0, 24.0, 42.0, 35.0, 50.0, 44.0, 48.0, 58.0, 53.0, 48.0, 37.0, 46.0, 45.0, 43.0, 40.0, 27.0, 35.0, 31.0, 18.0, 15.0, 17.0, 6.0, 9.0, 7.0, 12.0, 9.0, 7.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.75, -20.103271484375, -19.45654296875, -18.809814453125, -18.1630859375, -17.516357421875, -16.86962890625, -16.222900390625, -15.576171875, -14.929443359375, -14.28271484375, -13.635986328125, -12.9892578125, -12.342529296875, -11.69580078125, -11.049072265625, -10.40234375, -9.755615234375, -9.10888671875, -8.462158203125, -7.8154296875, -7.168701171875, -6.52197265625, -5.875244140625, -5.228515625, -4.581787109375, -3.93505859375, -3.288330078125, -2.6416015625, -1.994873046875, -1.34814453125, -0.701416015625, -0.0546875, 0.592041015625, 1.23876953125, 1.885498046875, 2.5322265625, 3.178955078125, 3.82568359375, 4.472412109375, 5.119140625, 5.765869140625, 6.41259765625, 7.059326171875, 7.7060546875, 8.352783203125, 8.99951171875, 9.646240234375, 10.29296875, 10.939697265625, 11.58642578125, 12.233154296875, 12.8798828125, 13.526611328125, 14.17333984375, 14.820068359375, 15.466796875, 16.113525390625, 16.76025390625, 17.406982421875, 18.0537109375, 18.700439453125, 19.34716796875, 19.993896484375, 20.640625]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 8.0, 7.0, 8.0, 13.0, 16.0, 17.0, 38.0, 55.0, 57.0, 85.0, 124.0, 186.0, 323.0, 436.0, 619.0, 792.0, 1302.0, 1990.0, 3341.0, 6201.0, 12680.0, 34174.0, 144960.0, 643027.0, 137692.0, 32546.0, 12140.0, 6144.0, 3411.0, 2093.0, 1315.0, 832.0, 598.0, 426.0, 306.0, 174.0, 121.0, 63.0, 75.0, 55.0, 35.0, 26.0, 18.0, 12.0, 8.0, 2.0, 5.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.640625, -14.18994140625, -13.7392578125, -13.28857421875, -12.837890625, -12.38720703125, -11.9365234375, -11.48583984375, -11.03515625, -10.58447265625, -10.1337890625, -9.68310546875, -9.232421875, -8.78173828125, -8.3310546875, -7.88037109375, -7.4296875, -6.97900390625, -6.5283203125, -6.07763671875, -5.626953125, -5.17626953125, -4.7255859375, -4.27490234375, -3.82421875, -3.37353515625, -2.9228515625, -2.47216796875, -2.021484375, -1.57080078125, -1.1201171875, -0.66943359375, -0.21875, 0.23193359375, 0.6826171875, 1.13330078125, 1.583984375, 2.03466796875, 2.4853515625, 2.93603515625, 3.38671875, 3.83740234375, 4.2880859375, 4.73876953125, 5.189453125, 5.64013671875, 6.0908203125, 6.54150390625, 6.9921875, 7.44287109375, 7.8935546875, 8.34423828125, 8.794921875, 9.24560546875, 9.6962890625, 10.14697265625, 10.59765625, 11.04833984375, 11.4990234375, 11.94970703125, 12.400390625, 12.85107421875, 13.3017578125, 13.75244140625, 14.203125]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 2.0, 7.0, 7.0, 8.0, 6.0, 10.0, 11.0, 18.0, 18.0, 12.0, 18.0, 16.0, 27.0, 27.0, 24.0, 35.0, 30.0, 25.0, 25.0, 45.0, 41.0, 35.0, 77.0, 1910.0, 123.0, 51.0, 31.0, 38.0, 38.0, 34.0, 41.0, 29.0, 26.0, 22.0, 30.0, 21.0, 18.0, 24.0, 11.0, 11.0, 16.0, 12.0, 5.0, 3.0, 5.0, 4.0, 5.0, 4.0, 5.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0], "bins": [-53.4375, -51.697265625, -49.95703125, -48.216796875, -46.4765625, -44.736328125, -42.99609375, -41.255859375, -39.515625, -37.775390625, -36.03515625, -34.294921875, -32.5546875, -30.814453125, -29.07421875, -27.333984375, -25.59375, -23.853515625, -22.11328125, -20.373046875, -18.6328125, -16.892578125, -15.15234375, -13.412109375, -11.671875, -9.931640625, -8.19140625, -6.451171875, -4.7109375, -2.970703125, -1.23046875, 0.509765625, 2.25, 3.990234375, 5.73046875, 7.470703125, 9.2109375, 10.951171875, 12.69140625, 14.431640625, 16.171875, 17.912109375, 19.65234375, 21.392578125, 23.1328125, 24.873046875, 26.61328125, 28.353515625, 30.09375, 31.833984375, 33.57421875, 35.314453125, 37.0546875, 38.794921875, 40.53515625, 42.275390625, 44.015625, 45.755859375, 47.49609375, 49.236328125, 50.9765625, 52.716796875, 54.45703125, 56.197265625, 57.9375]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 3.0, 5.0, 5.0, 7.0, 5.0, 8.0, 7.0, 19.0, 26.0, 23.0, 48.0, 54.0, 81.0, 137.0, 182.0, 396.0, 813.0, 2969.0, 23509.0, 3080609.0, 31451.0, 3413.0, 915.0, 400.0, 216.0, 124.0, 82.0, 53.0, 35.0, 28.0, 23.0, 25.0, 13.0, 14.0, 7.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-95.3125, -91.0849609375, -86.857421875, -82.6298828125, -78.40234375, -74.1748046875, -69.947265625, -65.7197265625, -61.4921875, -57.2646484375, -53.037109375, -48.8095703125, -44.58203125, -40.3544921875, -36.126953125, -31.8994140625, -27.671875, -23.4443359375, -19.216796875, -14.9892578125, -10.76171875, -6.5341796875, -2.306640625, 1.9208984375, 6.1484375, 10.3759765625, 14.603515625, 18.8310546875, 23.05859375, 27.2861328125, 31.513671875, 35.7412109375, 39.96875, 44.1962890625, 48.423828125, 52.6513671875, 56.87890625, 61.1064453125, 65.333984375, 69.5615234375, 73.7890625, 78.0166015625, 82.244140625, 86.4716796875, 90.69921875, 94.9267578125, 99.154296875, 103.3818359375, 107.609375, 111.8369140625, 116.064453125, 120.2919921875, 124.51953125, 128.7470703125, 132.974609375, 137.2021484375, 141.4296875, 145.6572265625, 149.884765625, 154.1123046875, 158.33984375, 162.5673828125, 166.794921875, 171.0224609375, 175.25]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 307.0, 694.0, 17.0], "bins": [-1668.79833984375, -1641.927490234375, -1615.056640625, -1588.185791015625, -1561.31494140625, -1534.444091796875, -1507.5732421875, -1480.7022705078125, -1453.8314208984375, -1426.9605712890625, -1400.0897216796875, -1373.2188720703125, -1346.3480224609375, -1319.47705078125, -1292.606201171875, -1265.7353515625, -1238.864501953125, -1211.99365234375, -1185.122802734375, -1158.251953125, -1131.381103515625, -1104.51025390625, -1077.639404296875, -1050.7684326171875, -1023.897705078125, -997.02685546875, -970.156005859375, -943.28515625, -916.4142456054688, -889.5433959960938, -862.6725463867188, -835.8016967773438, -808.9307861328125, -782.0599365234375, -755.1890869140625, -728.3182373046875, -701.4473266601562, -674.5764770507812, -647.7056274414062, -620.8347778320312, -593.9639282226562, -567.0930786132812, -540.2222290039062, -513.351318359375, -486.48046875, -459.609619140625, -432.73876953125, -405.867919921875, -378.9970397949219, -352.1261901855469, -325.25531005859375, -298.38446044921875, -271.51361083984375, -244.64273071289062, -217.77188110351562, -190.90101623535156, -164.0301513671875, -137.15928649902344, -110.2884292602539, -83.41757202148438, -56.54670715332031, -29.67584228515625, -2.80499267578125, 24.065872192382812, 50.93674087524414]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 7.0, 10.0, 8.0, 7.0, 6.0, 9.0, 19.0, 18.0, 22.0, 21.0, 27.0, 24.0, 35.0, 34.0, 34.0, 37.0, 51.0, 45.0, 42.0, 45.0, 50.0, 48.0, 60.0, 35.0, 36.0, 34.0, 29.0, 28.0, 29.0, 28.0, 21.0, 14.0, 20.0, 13.0, 7.0, 10.0, 10.0, 2.0, 6.0, 5.0, 6.0, 5.0, 2.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-194.66770935058594, -188.0906219482422, -181.51353454589844, -174.9364471435547, -168.35935974121094, -161.78228759765625, -155.2052001953125, -148.62811279296875, -142.051025390625, -135.47393798828125, -128.8968505859375, -122.31976318359375, -115.74268341064453, -109.16559600830078, -102.58850860595703, -96.01142883300781, -89.43433380126953, -82.85724639892578, -76.28015899658203, -69.70307922363281, -63.12599182128906, -56.54890441894531, -49.97181701660156, -43.39473342895508, -36.81764602661133, -30.24056053161621, -23.663475036621094, -17.086387634277344, -10.509302139282227, -3.9322166442871094, 2.6448707580566406, 9.221954345703125, 15.799041748046875, 22.376127243041992, 28.95321273803711, 35.53030014038086, 42.107383728027344, 48.684471130371094, 55.261558532714844, 61.83864212036133, 68.41572570800781, 74.99281311035156, 81.56990051269531, 88.14698791503906, 94.72406768798828, 101.30115509033203, 107.87824249267578, 114.455322265625, 121.03241729736328, 127.60950469970703, 134.18658447265625, 140.763671875, 147.34075927734375, 153.9178466796875, 160.49493408203125, 167.072021484375, 173.64910888671875, 180.2261962890625, 186.80328369140625, 193.38037109375, 199.95745849609375, 206.5345458984375, 213.11163330078125, 219.68870544433594, 226.2657928466797]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 7.0, 6.0, 3.0, 5.0, 10.0, 15.0, 11.0, 19.0, 14.0, 13.0, 22.0, 24.0, 40.0, 33.0, 36.0, 35.0, 44.0, 56.0, 61.0, 56.0, 45.0, 53.0, 44.0, 38.0, 40.0, 42.0, 38.0, 24.0, 39.0, 25.0, 21.0, 17.0, 9.0, 12.0, 12.0, 9.0, 6.0, 6.0, 8.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.9375, -21.270751953125, -20.60400390625, -19.937255859375, -19.2705078125, -18.603759765625, -17.93701171875, -17.270263671875, -16.603515625, -15.936767578125, -15.27001953125, -14.603271484375, -13.9365234375, -13.269775390625, -12.60302734375, -11.936279296875, -11.26953125, -10.602783203125, -9.93603515625, -9.269287109375, -8.6025390625, -7.935791015625, -7.26904296875, -6.602294921875, -5.935546875, -5.268798828125, -4.60205078125, -3.935302734375, -3.2685546875, -2.601806640625, -1.93505859375, -1.268310546875, -0.6015625, 0.065185546875, 0.73193359375, 1.398681640625, 2.0654296875, 2.732177734375, 3.39892578125, 4.065673828125, 4.732421875, 5.399169921875, 6.06591796875, 6.732666015625, 7.3994140625, 8.066162109375, 8.73291015625, 9.399658203125, 10.06640625, 10.733154296875, 11.39990234375, 12.066650390625, 12.7333984375, 13.400146484375, 14.06689453125, 14.733642578125, 15.400390625, 16.067138671875, 16.73388671875, 17.400634765625, 18.0673828125, 18.734130859375, 19.40087890625, 20.067626953125, 20.734375]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 6.0, 8.0, 13.0, 13.0, 18.0, 32.0, 49.0, 48.0, 81.0, 129.0, 157.0, 214.0, 351.0, 441.0, 674.0, 943.0, 1403.0, 2136.0, 3312.0, 5407.0, 8909.0, 16474.0, 41704.0, 917798.0, 3059854.0, 85520.0, 20752.0, 10674.0, 6078.0, 3735.0, 2460.0, 1499.0, 1034.0, 643.0, 486.0, 353.0, 251.0, 198.0, 130.0, 92.0, 73.0, 41.0, 26.0, 27.0, 15.0, 11.0, 4.0, 3.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.9375, -63.88671875, -61.8359375, -59.78515625, -57.734375, -55.68359375, -53.6328125, -51.58203125, -49.53125, -47.48046875, -45.4296875, -43.37890625, -41.328125, -39.27734375, -37.2265625, -35.17578125, -33.125, -31.07421875, -29.0234375, -26.97265625, -24.921875, -22.87109375, -20.8203125, -18.76953125, -16.71875, -14.66796875, -12.6171875, -10.56640625, -8.515625, -6.46484375, -4.4140625, -2.36328125, -0.3125, 1.73828125, 3.7890625, 5.83984375, 7.890625, 9.94140625, 11.9921875, 14.04296875, 16.09375, 18.14453125, 20.1953125, 22.24609375, 24.296875, 26.34765625, 28.3984375, 30.44921875, 32.5, 34.55078125, 36.6015625, 38.65234375, 40.703125, 42.75390625, 44.8046875, 46.85546875, 48.90625, 50.95703125, 53.0078125, 55.05859375, 57.109375, 59.16015625, 61.2109375, 63.26171875, 65.3125]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 3.0, 4.0, 5.0, 10.0, 4.0, 12.0, 11.0, 16.0, 21.0, 25.0, 32.0, 43.0, 93.0, 184.0, 498.0, 1606.0, 949.0, 252.0, 86.0, 46.0, 34.0, 31.0, 31.0, 19.0, 16.0, 9.0, 8.0, 7.0, 10.0, 2.0, 4.0, 1.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.0625, -70.4248046875, -67.787109375, -65.1494140625, -62.51171875, -59.8740234375, -57.236328125, -54.5986328125, -51.9609375, -49.3232421875, -46.685546875, -44.0478515625, -41.41015625, -38.7724609375, -36.134765625, -33.4970703125, -30.859375, -28.2216796875, -25.583984375, -22.9462890625, -20.30859375, -17.6708984375, -15.033203125, -12.3955078125, -9.7578125, -7.1201171875, -4.482421875, -1.8447265625, 0.79296875, 3.4306640625, 6.068359375, 8.7060546875, 11.34375, 13.9814453125, 16.619140625, 19.2568359375, 21.89453125, 24.5322265625, 27.169921875, 29.8076171875, 32.4453125, 35.0830078125, 37.720703125, 40.3583984375, 42.99609375, 45.6337890625, 48.271484375, 50.9091796875, 53.546875, 56.1845703125, 58.822265625, 61.4599609375, 64.09765625, 66.7353515625, 69.373046875, 72.0107421875, 74.6484375, 77.2861328125, 79.923828125, 82.5615234375, 85.19921875, 87.8369140625, 90.474609375, 93.1123046875, 95.75]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 10.0, 9.0, 21.0, 20.0, 41.0, 49.0, 66.0, 114.0, 202.0, 335.0, 559.0, 940.0, 1765.0, 3336.0, 6334.0, 12999.0, 30339.0, 93751.0, 3062780.0, 863104.0, 68902.0, 25475.0, 11163.0, 5473.0, 2830.0, 1549.0, 849.0, 512.0, 284.0, 147.0, 117.0, 64.0, 52.0, 32.0, 15.0, 14.0, 13.0, 8.0, 11.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-107.3125, -103.8388671875, -100.365234375, -96.8916015625, -93.41796875, -89.9443359375, -86.470703125, -82.9970703125, -79.5234375, -76.0498046875, -72.576171875, -69.1025390625, -65.62890625, -62.1552734375, -58.681640625, -55.2080078125, -51.734375, -48.2607421875, -44.787109375, -41.3134765625, -37.83984375, -34.3662109375, -30.892578125, -27.4189453125, -23.9453125, -20.4716796875, -16.998046875, -13.5244140625, -10.05078125, -6.5771484375, -3.103515625, 0.3701171875, 3.84375, 7.3173828125, 10.791015625, 14.2646484375, 17.73828125, 21.2119140625, 24.685546875, 28.1591796875, 31.6328125, 35.1064453125, 38.580078125, 42.0537109375, 45.52734375, 49.0009765625, 52.474609375, 55.9482421875, 59.421875, 62.8955078125, 66.369140625, 69.8427734375, 73.31640625, 76.7900390625, 80.263671875, 83.7373046875, 87.2109375, 90.6845703125, 94.158203125, 97.6318359375, 101.10546875, 104.5791015625, 108.052734375, 111.5263671875, 115.0]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 5.0, 8.0, 8.0, 6.0, 13.0, 22.0, 29.0, 40.0, 65.0, 97.0, 177.0, 211.0, 95.0, 67.0, 49.0, 30.0, 20.0, 17.0, 8.0, 11.0, 6.0, 6.0, 9.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-368.1773681640625, -359.00347900390625, -349.82958984375, -340.6557312011719, -331.4818420410156, -322.3079528808594, -313.1340637207031, -303.9601745605469, -294.78631591796875, -285.6124267578125, -276.43853759765625, -267.2646789550781, -258.0907897949219, -248.91690063476562, -239.74301147460938, -230.56912231445312, -221.39523315429688, -212.22134399414062, -203.04747009277344, -193.8735809326172, -184.69970703125, -175.52581787109375, -166.3519287109375, -157.17803955078125, -148.00416564941406, -138.8302764892578, -129.65640258789062, -120.48251342773438, -111.30863189697266, -102.13475036621094, -92.96086120605469, -83.78697967529297, -74.61306762695312, -65.4391860961914, -56.26530075073242, -47.09141540527344, -37.91753387451172, -28.74365234375, -19.569766998291016, -10.395881652832031, -1.2220001220703125, 7.951883316040039, 17.12576675415039, 26.299650192260742, 35.473533630371094, 44.64741516113281, 53.8213005065918, 62.99518585205078, 72.1690673828125, 81.34294891357422, 90.51683044433594, 99.69071960449219, 108.8646011352539, 118.03848266601562, 127.21237182617188, 136.38626098632812, 145.5601348876953, 154.73402404785156, 163.90789794921875, 173.081787109375, 182.25567626953125, 191.42955017089844, 200.6034393310547, 209.77731323242188, 218.95120239257812]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [5.0, 1.0, 1.0, 3.0, 3.0, 0.0, 3.0, 8.0, 7.0, 5.0, 10.0, 8.0, 9.0, 15.0, 13.0, 12.0, 12.0, 29.0, 29.0, 25.0, 26.0, 30.0, 27.0, 43.0, 38.0, 35.0, 45.0, 35.0, 51.0, 47.0, 48.0, 38.0, 36.0, 32.0, 26.0, 39.0, 25.0, 19.0, 23.0, 22.0, 25.0, 17.0, 11.0, 14.0, 14.0, 10.0, 14.0, 8.0, 7.0, 2.0, 2.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-144.2861785888672, -139.2480010986328, -134.20982360839844, -129.17164611816406, -124.13346862792969, -119.09529113769531, -114.05711364746094, -109.01893615722656, -103.98075866699219, -98.94258117675781, -93.90440368652344, -88.86622619628906, -83.82804870605469, -78.78987121582031, -73.75169372558594, -68.71351623535156, -63.675331115722656, -58.63715362548828, -53.598976135253906, -48.56079864501953, -43.522621154785156, -38.48444366455078, -33.44626235961914, -28.408084869384766, -23.36990737915039, -18.331729888916016, -13.293551445007324, -8.255373001098633, -3.217195510864258, 1.8209819793701172, 6.859161376953125, 11.8973388671875, 16.935516357421875, 21.97369384765625, 27.011871337890625, 32.050048828125, 37.088226318359375, 42.12640380859375, 47.16458511352539, 52.202762603759766, 57.24094009399414, 62.279117584228516, 67.31729888916016, 72.35547637939453, 77.3936538696289, 82.43183135986328, 87.47000885009766, 92.50818634033203, 97.5463638305664, 102.58454132080078, 107.62271881103516, 112.66089630126953, 117.6990737915039, 122.73725128173828, 127.77543640136719, 132.81361389160156, 137.85179138183594, 142.8899688720703, 147.9281463623047, 152.96632385253906, 158.00450134277344, 163.0426788330078, 168.0808563232422, 173.11903381347656, 178.15721130371094]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 3.0, 6.0, 8.0, 9.0, 10.0, 11.0, 16.0, 24.0, 17.0, 12.0, 21.0, 27.0, 33.0, 45.0, 38.0, 45.0, 55.0, 51.0, 49.0, 48.0, 48.0, 50.0, 49.0, 48.0, 30.0, 59.0, 32.0, 23.0, 19.0, 24.0, 26.0, 14.0, 9.0, 9.0, 6.0, 9.0, 6.0, 4.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-23.84375, -23.14794921875, -22.4521484375, -21.75634765625, -21.060546875, -20.36474609375, -19.6689453125, -18.97314453125, -18.27734375, -17.58154296875, -16.8857421875, -16.18994140625, -15.494140625, -14.79833984375, -14.1025390625, -13.40673828125, -12.7109375, -12.01513671875, -11.3193359375, -10.62353515625, -9.927734375, -9.23193359375, -8.5361328125, -7.84033203125, -7.14453125, -6.44873046875, -5.7529296875, -5.05712890625, -4.361328125, -3.66552734375, -2.9697265625, -2.27392578125, -1.578125, -0.88232421875, -0.1865234375, 0.50927734375, 1.205078125, 1.90087890625, 2.5966796875, 3.29248046875, 3.98828125, 4.68408203125, 5.3798828125, 6.07568359375, 6.771484375, 7.46728515625, 8.1630859375, 8.85888671875, 9.5546875, 10.25048828125, 10.9462890625, 11.64208984375, 12.337890625, 13.03369140625, 13.7294921875, 14.42529296875, 15.12109375, 15.81689453125, 16.5126953125, 17.20849609375, 17.904296875, 18.60009765625, 19.2958984375, 19.99169921875, 20.6875]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 4.0, 5.0, 5.0, 11.0, 14.0, 11.0, 20.0, 34.0, 56.0, 76.0, 114.0, 160.0, 221.0, 330.0, 493.0, 751.0, 1124.0, 1656.0, 2532.0, 3729.0, 5515.0, 8564.0, 13363.0, 21693.0, 37104.0, 66091.0, 127740.0, 247233.0, 235443.0, 119253.0, 62188.0, 34860.0, 20715.0, 12960.0, 8359.0, 5434.0, 3540.0, 2408.0, 1553.0, 1041.0, 640.0, 478.0, 353.0, 223.0, 146.0, 98.0, 79.0, 46.0, 36.0, 19.0, 18.0, 13.0, 8.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.94873046875, -0.919036865234375, -0.88934326171875, -0.859649658203125, -0.8299560546875, -0.800262451171875, -0.77056884765625, -0.740875244140625, -0.711181640625, -0.681488037109375, -0.65179443359375, -0.622100830078125, -0.5924072265625, -0.562713623046875, -0.53302001953125, -0.503326416015625, -0.4736328125, -0.443939208984375, -0.41424560546875, -0.384552001953125, -0.3548583984375, -0.325164794921875, -0.29547119140625, -0.265777587890625, -0.236083984375, -0.206390380859375, -0.17669677734375, -0.147003173828125, -0.1173095703125, -0.087615966796875, -0.05792236328125, -0.028228759765625, 0.00146484375, 0.031158447265625, 0.06085205078125, 0.090545654296875, 0.1202392578125, 0.149932861328125, 0.17962646484375, 0.209320068359375, 0.239013671875, 0.268707275390625, 0.29840087890625, 0.328094482421875, 0.3577880859375, 0.387481689453125, 0.41717529296875, 0.446868896484375, 0.4765625, 0.506256103515625, 0.53594970703125, 0.565643310546875, 0.5953369140625, 0.625030517578125, 0.65472412109375, 0.684417724609375, 0.714111328125, 0.743804931640625, 0.77349853515625, 0.803192138671875, 0.8328857421875, 0.862579345703125, 0.89227294921875, 0.921966552734375, 0.95166015625]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 4.0, 1.0, 2.0, 5.0, 5.0, 3.0, 8.0, 7.0, 13.0, 12.0, 10.0, 7.0, 18.0, 20.0, 23.0, 24.0, 23.0, 31.0, 30.0, 26.0, 36.0, 40.0, 37.0, 38.0, 36.0, 32.0, 1071.0, 45.0, 48.0, 30.0, 44.0, 21.0, 31.0, 42.0, 22.0, 26.0, 25.0, 21.0, 18.0, 18.0, 14.0, 16.0, 14.0, 9.0, 6.0, 7.0, 4.0, 2.0, 6.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.2109375, -9.8609619140625, -9.510986328125, -9.1610107421875, -8.81103515625, -8.4610595703125, -8.111083984375, -7.7611083984375, -7.4111328125, -7.0611572265625, -6.711181640625, -6.3612060546875, -6.01123046875, -5.6612548828125, -5.311279296875, -4.9613037109375, -4.611328125, -4.2613525390625, -3.911376953125, -3.5614013671875, -3.21142578125, -2.8614501953125, -2.511474609375, -2.1614990234375, -1.8115234375, -1.4615478515625, -1.111572265625, -0.7615966796875, -0.41162109375, -0.0616455078125, 0.288330078125, 0.6383056640625, 0.98828125, 1.3382568359375, 1.688232421875, 2.0382080078125, 2.38818359375, 2.7381591796875, 3.088134765625, 3.4381103515625, 3.7880859375, 4.1380615234375, 4.488037109375, 4.8380126953125, 5.18798828125, 5.5379638671875, 5.887939453125, 6.2379150390625, 6.587890625, 6.9378662109375, 7.287841796875, 7.6378173828125, 7.98779296875, 8.3377685546875, 8.687744140625, 9.0377197265625, 9.3876953125, 9.7376708984375, 10.087646484375, 10.4376220703125, 10.78759765625, 11.1375732421875, 11.487548828125, 11.8375244140625, 12.1875]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 8.0, 8.0, 25.0, 37.0, 52.0, 74.0, 106.0, 160.0, 245.0, 400.0, 526.0, 767.0, 1123.0, 1661.0, 2431.0, 3380.0, 5062.0, 7194.0, 10509.0, 15735.0, 23383.0, 36193.0, 57590.0, 97386.0, 176709.0, 1283480.0, 145924.0, 81806.0, 49417.0, 31117.0, 20712.0, 13921.0, 9371.0, 6431.0, 4409.0, 3039.0, 2126.0, 1422.0, 1058.0, 724.0, 454.0, 303.0, 234.0, 155.0, 97.0, 59.0, 40.0, 24.0, 14.0, 18.0, 7.0, 5.0, 4.0, 1.0, 2.0, 2.0], "bins": [-0.75927734375, -0.7365036010742188, -0.7137298583984375, -0.6909561157226562, -0.668182373046875, -0.6454086303710938, -0.6226348876953125, -0.5998611450195312, -0.57708740234375, -0.5543136596679688, -0.5315399169921875, -0.5087661743164062, -0.485992431640625, -0.46321868896484375, -0.4404449462890625, -0.41767120361328125, -0.3948974609375, -0.37212371826171875, -0.3493499755859375, -0.32657623291015625, -0.303802490234375, -0.28102874755859375, -0.2582550048828125, -0.23548126220703125, -0.21270751953125, -0.18993377685546875, -0.1671600341796875, -0.14438629150390625, -0.121612548828125, -0.09883880615234375, -0.0760650634765625, -0.05329132080078125, -0.030517578125, -0.00774383544921875, 0.0150299072265625, 0.03780364990234375, 0.060577392578125, 0.08335113525390625, 0.1061248779296875, 0.12889862060546875, 0.15167236328125, 0.17444610595703125, 0.1972198486328125, 0.21999359130859375, 0.242767333984375, 0.26554107666015625, 0.2883148193359375, 0.31108856201171875, 0.3338623046875, 0.35663604736328125, 0.3794097900390625, 0.40218353271484375, 0.424957275390625, 0.44773101806640625, 0.4705047607421875, 0.49327850341796875, 0.51605224609375, 0.5388259887695312, 0.5615997314453125, 0.5843734741210938, 0.607147216796875, 0.6299209594726562, 0.6526947021484375, 0.6754684448242188, 0.6982421875]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 1.0, 4.0, 6.0, 9.0, 11.0, 17.0, 16.0, 15.0, 24.0, 26.0, 39.0, 38.0, 47.0, 44.0, 55.0, 72.0, 69.0, 69.0, 73.0, 61.0, 49.0, 44.0, 47.0, 29.0, 42.0, 17.0, 19.0, 11.0, 11.0, 11.0, 6.0, 5.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0041656494140625, -0.004054933786392212, -0.003944218158721924, -0.0038335025310516357, -0.0037227869033813477, -0.0036120712757110596, -0.0035013556480407715, -0.0033906400203704834, -0.0032799243927001953, -0.0031692087650299072, -0.003058493137359619, -0.002947777509689331, -0.002837061882019043, -0.002726346254348755, -0.002615630626678467, -0.0025049149990081787, -0.0023941993713378906, -0.0022834837436676025, -0.0021727681159973145, -0.0020620524883270264, -0.0019513368606567383, -0.0018406212329864502, -0.0017299056053161621, -0.001619189977645874, -0.001508474349975586, -0.0013977587223052979, -0.0012870430946350098, -0.0011763274669647217, -0.0010656118392944336, -0.0009548962116241455, -0.0008441805839538574, -0.0007334649562835693, -0.0006227493286132812, -0.0005120337009429932, -0.0004013180732727051, -0.000290602445602417, -0.0001798868179321289, -6.917119026184082e-05, 4.1544437408447266e-05, 0.00015226006507873535, 0.00026297569274902344, 0.0003736913204193115, 0.0004844069480895996, 0.0005951225757598877, 0.0007058382034301758, 0.0008165538311004639, 0.000927269458770752, 0.00103798508644104, 0.0011487007141113281, 0.0012594163417816162, 0.0013701319694519043, 0.0014808475971221924, 0.0015915632247924805, 0.0017022788524627686, 0.0018129944801330566, 0.0019237101078033447, 0.002034425735473633, 0.002145141363143921, 0.002255856990814209, 0.002366572618484497, 0.002477288246154785, 0.0025880038738250732, 0.0026987195014953613, 0.0028094351291656494, 0.0029201507568359375]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 7.0, 13.0, 12.0, 12.0, 20.0, 35.0, 43.0, 54.0, 78.0, 112.0, 157.0, 214.0, 340.0, 673.0, 4853.0, 240217.0, 784873.0, 14566.0, 988.0, 399.0, 245.0, 183.0, 141.0, 81.0, 62.0, 52.0, 35.0, 24.0, 14.0, 8.0, 8.0, 5.0, 9.0, 3.0, 6.0, 5.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.055999755859375, -0.05425834655761719, -0.052516937255859375, -0.05077552795410156, -0.04903411865234375, -0.04729270935058594, -0.045551300048828125, -0.04380989074707031, -0.0420684814453125, -0.04032707214355469, -0.038585662841796875, -0.03684425354003906, -0.03510284423828125, -0.03336143493652344, -0.031620025634765625, -0.029878616333007812, -0.02813720703125, -0.026395797729492188, -0.024654388427734375, -0.022912979125976562, -0.02117156982421875, -0.019430160522460938, -0.017688751220703125, -0.015947341918945312, -0.0142059326171875, -0.012464523315429688, -0.010723114013671875, -0.008981704711914062, -0.00724029541015625, -0.0054988861083984375, -0.003757476806640625, -0.0020160675048828125, -0.000274658203125, 0.0014667510986328125, 0.003208160400390625, 0.0049495697021484375, 0.00669097900390625, 0.008432388305664062, 0.010173797607421875, 0.011915206909179688, 0.0136566162109375, 0.015398025512695312, 0.017139434814453125, 0.018880844116210938, 0.02062225341796875, 0.022363662719726562, 0.024105072021484375, 0.025846481323242188, 0.027587890625, 0.029329299926757812, 0.031070709228515625, 0.03281211853027344, 0.03455352783203125, 0.03629493713378906, 0.038036346435546875, 0.03977775573730469, 0.0415191650390625, 0.04326057434082031, 0.045001983642578125, 0.04674339294433594, 0.04848480224609375, 0.05022621154785156, 0.051967620849609375, 0.05370903015136719, 0.055450439453125]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 11.0, 43.0, 236.0, 524.0, 151.0, 29.0, 15.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.015575243160128593, -0.015108834952116013, -0.014642426744103432, -0.014176017604768276, -0.013709609396755695, -0.013243201188743114, -0.012776792049407959, -0.012310383841395378, -0.011843975633382797, -0.011377567425370216, -0.010911159217357635, -0.01044475007802248, -0.0099783418700099, -0.009511933661997318, -0.009045524522662163, -0.008579116314649582, -0.008112708106637001, -0.00764629989862442, -0.007179891224950552, -0.006713482551276684, -0.006247074343264103, -0.005780666135251522, -0.005314257461577654, -0.004847848787903786, -0.004381440579891205, -0.003915032371878624, -0.0034486236982047558, -0.0029822152573615313, -0.0025158068165183067, -0.002049398375675082, -0.0015829899348318577, -0.0011165814939886332, -0.0006501730531454086, -0.0001837646123021841, 0.0002826438285410404, 0.000749052269384265, 0.0012154607102274895, 0.001681869151070714, 0.0021482775919139385, 0.002614686032757163, 0.0030810944736003876, 0.003547502914443612, 0.004013911355286837, 0.004480320028960705, 0.004946728236973286, 0.0054131364449858665, 0.005879545118659735, 0.006345953792333603, 0.006812362000346184, 0.007278770208358765, 0.007745178882032633, 0.008211587555706501, 0.008677995763719082, 0.009144403971731663, 0.009610813111066818, 0.010077221319079399, 0.01054362952709198, 0.01101003773510456, 0.011476445943117142, 0.011942855082452297, 0.012409263290464878, 0.012875671498477459, 0.013342080637812614, 0.013808488845825195, 0.014274897053837776]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 1.0, 4.0, 9.0, 17.0, 10.0, 16.0, 25.0, 12.0, 24.0, 21.0, 31.0, 43.0, 29.0, 34.0, 31.0, 41.0, 50.0, 44.0, 35.0, 44.0, 32.0, 38.0, 51.0, 40.0, 45.0, 37.0, 32.0, 32.0, 28.0, 19.0, 17.0, 14.0, 16.0, 13.0, 8.0, 8.0, 8.0, 3.0, 9.0, 9.0, 7.0, 4.0, 1.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0021110177040100098, -0.0020444775000214577, -0.0019779372960329056, -0.0019113970920443535, -0.0018448568880558014, -0.0017783166840672493, -0.0017117764800786972, -0.0016452362760901451, -0.001578696072101593, -0.001512155868113041, -0.0014456156641244888, -0.0013790754601359367, -0.0013125352561473846, -0.0012459950521588326, -0.0011794548481702805, -0.0011129146441817284, -0.0010463744401931763, -0.0009798342362046242, -0.0009132940322160721, -0.00084675382822752, -0.0007802136242389679, -0.0007136734202504158, -0.0006471332162618637, -0.0005805930122733116, -0.0005140528082847595, -0.00044751260429620743, -0.00038097240030765533, -0.00031443219631910324, -0.00024789199233055115, -0.00018135178834199905, -0.00011481158435344696, -4.827138036489487e-05, 1.8268823623657227e-05, 8.480902761220932e-05, 0.00015134923160076141, 0.0002178894355893135, 0.0002844296395778656, 0.0003509698435664177, 0.0004175100475549698, 0.0004840502515435219, 0.000550590455532074, 0.0006171306595206261, 0.0006836708635091782, 0.0007502110674977303, 0.0008167512714862823, 0.0008832914754748344, 0.0009498316794633865, 0.0010163718834519386, 0.0010829120874404907, 0.0011494522914290428, 0.001215992495417595, 0.001282532699406147, 0.001349072903394699, 0.0014156131073832512, 0.0014821533113718033, 0.0015486935153603554, 0.0016152337193489075, 0.0016817739233374596, 0.0017483141273260117, 0.0018148543313145638, 0.0018813945353031158, 0.001947934739291668, 0.00201447494328022, 0.002081015147268772, 0.0021475553512573242]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 3.0, 6.0, 8.0, 9.0, 10.0, 11.0, 16.0, 24.0, 17.0, 12.0, 21.0, 27.0, 33.0, 45.0, 38.0, 45.0, 55.0, 51.0, 49.0, 48.0, 48.0, 50.0, 49.0, 48.0, 30.0, 59.0, 32.0, 23.0, 19.0, 24.0, 26.0, 14.0, 9.0, 9.0, 6.0, 9.0, 6.0, 4.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-23.84375, -23.14794921875, -22.4521484375, -21.75634765625, -21.060546875, -20.36474609375, -19.6689453125, -18.97314453125, -18.27734375, -17.58154296875, -16.8857421875, -16.18994140625, -15.494140625, -14.79833984375, -14.1025390625, -13.40673828125, -12.7109375, -12.01513671875, -11.3193359375, -10.62353515625, -9.927734375, -9.23193359375, -8.5361328125, -7.84033203125, -7.14453125, -6.44873046875, -5.7529296875, -5.05712890625, -4.361328125, -3.66552734375, -2.9697265625, -2.27392578125, -1.578125, -0.88232421875, -0.1865234375, 0.50927734375, 1.205078125, 1.90087890625, 2.5966796875, 3.29248046875, 3.98828125, 4.68408203125, 5.3798828125, 6.07568359375, 6.771484375, 7.46728515625, 8.1630859375, 8.85888671875, 9.5546875, 10.25048828125, 10.9462890625, 11.64208984375, 12.337890625, 13.03369140625, 13.7294921875, 14.42529296875, 15.12109375, 15.81689453125, 16.5126953125, 17.20849609375, 17.904296875, 18.60009765625, 19.2958984375, 19.99169921875, 20.6875]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 4.0, 7.0, 6.0, 13.0, 11.0, 20.0, 21.0, 46.0, 47.0, 64.0, 77.0, 123.0, 161.0, 224.0, 302.0, 435.0, 598.0, 858.0, 1292.0, 2105.0, 3706.0, 6972.0, 15230.0, 41269.0, 158384.0, 597550.0, 148758.0, 38766.0, 14850.0, 6774.0, 3550.0, 2093.0, 1274.0, 850.0, 598.0, 428.0, 296.0, 199.0, 162.0, 116.0, 90.0, 58.0, 39.0, 31.0, 35.0, 20.0, 12.0, 9.0, 4.0, 7.0, 6.0, 4.0, 3.0, 0.0, 3.0, 2.0], "bins": [-14.328125, -13.900146484375, -13.47216796875, -13.044189453125, -12.6162109375, -12.188232421875, -11.76025390625, -11.332275390625, -10.904296875, -10.476318359375, -10.04833984375, -9.620361328125, -9.1923828125, -8.764404296875, -8.33642578125, -7.908447265625, -7.48046875, -7.052490234375, -6.62451171875, -6.196533203125, -5.7685546875, -5.340576171875, -4.91259765625, -4.484619140625, -4.056640625, -3.628662109375, -3.20068359375, -2.772705078125, -2.3447265625, -1.916748046875, -1.48876953125, -1.060791015625, -0.6328125, -0.204833984375, 0.22314453125, 0.651123046875, 1.0791015625, 1.507080078125, 1.93505859375, 2.363037109375, 2.791015625, 3.218994140625, 3.64697265625, 4.074951171875, 4.5029296875, 4.930908203125, 5.35888671875, 5.786865234375, 6.21484375, 6.642822265625, 7.07080078125, 7.498779296875, 7.9267578125, 8.354736328125, 8.78271484375, 9.210693359375, 9.638671875, 10.066650390625, 10.49462890625, 10.922607421875, 11.3505859375, 11.778564453125, 12.20654296875, 12.634521484375, 13.0625]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 6.0, 6.0, 8.0, 6.0, 2.0, 10.0, 19.0, 17.0, 18.0, 13.0, 21.0, 35.0, 19.0, 32.0, 38.0, 42.0, 38.0, 54.0, 62.0, 150.0, 1869.0, 122.0, 75.0, 61.0, 36.0, 39.0, 35.0, 23.0, 23.0, 20.0, 22.0, 20.0, 20.0, 17.0, 23.0, 14.0, 12.0, 6.0, 9.0, 3.0, 3.0, 3.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.5625, -64.294921875, -62.02734375, -59.759765625, -57.4921875, -55.224609375, -52.95703125, -50.689453125, -48.421875, -46.154296875, -43.88671875, -41.619140625, -39.3515625, -37.083984375, -34.81640625, -32.548828125, -30.28125, -28.013671875, -25.74609375, -23.478515625, -21.2109375, -18.943359375, -16.67578125, -14.408203125, -12.140625, -9.873046875, -7.60546875, -5.337890625, -3.0703125, -0.802734375, 1.46484375, 3.732421875, 6.0, 8.267578125, 10.53515625, 12.802734375, 15.0703125, 17.337890625, 19.60546875, 21.873046875, 24.140625, 26.408203125, 28.67578125, 30.943359375, 33.2109375, 35.478515625, 37.74609375, 40.013671875, 42.28125, 44.548828125, 46.81640625, 49.083984375, 51.3515625, 53.619140625, 55.88671875, 58.154296875, 60.421875, 62.689453125, 64.95703125, 67.224609375, 69.4921875, 71.759765625, 74.02734375, 76.294921875, 78.5625]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 7.0, 4.0, 7.0, 14.0, 17.0, 22.0, 17.0, 23.0, 28.0, 24.0, 24.0, 39.0, 59.0, 101.0, 138.0, 240.0, 419.0, 1085.0, 13589.0, 3077902.0, 48799.0, 1818.0, 488.0, 277.0, 151.0, 105.0, 71.0, 45.0, 38.0, 34.0, 19.0, 14.0, 20.0, 11.0, 15.0, 8.0, 2.0, 7.0, 7.0, 6.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-125.3125, -121.6953125, -118.078125, -114.4609375, -110.84375, -107.2265625, -103.609375, -99.9921875, -96.375, -92.7578125, -89.140625, -85.5234375, -81.90625, -78.2890625, -74.671875, -71.0546875, -67.4375, -63.8203125, -60.203125, -56.5859375, -52.96875, -49.3515625, -45.734375, -42.1171875, -38.5, -34.8828125, -31.265625, -27.6484375, -24.03125, -20.4140625, -16.796875, -13.1796875, -9.5625, -5.9453125, -2.328125, 1.2890625, 4.90625, 8.5234375, 12.140625, 15.7578125, 19.375, 22.9921875, 26.609375, 30.2265625, 33.84375, 37.4609375, 41.078125, 44.6953125, 48.3125, 51.9296875, 55.546875, 59.1640625, 62.78125, 66.3984375, 70.015625, 73.6328125, 77.25, 80.8671875, 84.484375, 88.1015625, 91.71875, 95.3359375, 98.953125, 102.5703125, 106.1875]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 9.0, 92.0, 698.0, 201.0, 16.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-498.83734130859375, -487.66375732421875, -476.49017333984375, -465.3165588378906, -454.1429748535156, -442.9693908691406, -431.7957763671875, -420.6221923828125, -409.4486083984375, -398.2750244140625, -387.1014404296875, -375.9278259277344, -364.7542419433594, -353.5806579589844, -342.40704345703125, -331.23345947265625, -320.05987548828125, -308.88629150390625, -297.71270751953125, -286.5390930175781, -275.3655090332031, -264.1919250488281, -253.01832580566406, -241.8447265625, -230.671142578125, -219.49755859375, -208.32395935058594, -197.15036010742188, -185.97677612304688, -174.80319213867188, -163.6295928955078, -152.45599365234375, -141.28244018554688, -130.10885620117188, -118.93525695800781, -107.76166534423828, -96.58807373046875, -85.41448211669922, -74.24089050292969, -63.067298889160156, -51.893707275390625, -40.720115661621094, -29.546524047851562, -18.37293243408203, -7.1993408203125, 3.9742507934570312, 15.147842407226562, 26.321434020996094, 37.495025634765625, 48.668617248535156, 59.84220886230469, 71.01580047607422, 82.18939208984375, 93.36298370361328, 104.53657531738281, 115.71016693115234, 126.88375854492188, 138.05734252929688, 149.23094177246094, 160.404541015625, 171.578125, 182.751708984375, 193.92530822753906, 205.09890747070312, 216.27249145507812]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 7.0, 11.0, 8.0, 10.0, 13.0, 15.0, 17.0, 20.0, 25.0, 34.0, 26.0, 30.0, 41.0, 43.0, 44.0, 39.0, 49.0, 46.0, 35.0, 47.0, 42.0, 45.0, 32.0, 29.0, 30.0, 40.0, 33.0, 23.0, 29.0, 18.0, 14.0, 23.0, 18.0, 16.0, 14.0, 8.0, 7.0, 4.0, 4.0, 5.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-216.22706604003906, -209.43746948242188, -202.6478729248047, -195.8582763671875, -189.06869506835938, -182.2790985107422, -175.489501953125, -168.6999053955078, -161.91030883789062, -155.12071228027344, -148.33111572265625, -141.54153442382812, -134.75193786621094, -127.96234130859375, -121.17274475097656, -114.38314819335938, -107.59355926513672, -100.80396270751953, -94.01437377929688, -87.22477722167969, -80.4351806640625, -73.64558410644531, -66.85599517822266, -60.06639862060547, -53.27680587768555, -46.487213134765625, -39.69761657714844, -32.908023834228516, -26.11842918395996, -19.328834533691406, -12.539241790771484, -5.749645233154297, 1.039947509765625, 7.8295416831970215, 14.619135856628418, 21.408729553222656, 28.19832420349121, 34.987918853759766, 41.77751159667969, 48.567108154296875, 55.3567008972168, 62.14629364013672, 68.9358901977539, 75.72547912597656, 82.51507568359375, 89.30467224121094, 96.09426879882812, 102.88386535644531, 109.67345428466797, 116.46305084228516, 123.25263977050781, 130.042236328125, 136.8318328857422, 143.62142944335938, 150.4110107421875, 157.20062255859375, 163.99020385742188, 170.77980041503906, 177.56939697265625, 184.35897827148438, 191.14857482910156, 197.93817138671875, 204.72776794433594, 211.51736450195312, 218.3069610595703]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 5.0, 11.0, 6.0, 7.0, 9.0, 16.0, 18.0, 19.0, 16.0, 17.0, 21.0, 28.0, 38.0, 35.0, 37.0, 42.0, 60.0, 48.0, 43.0, 53.0, 45.0, 46.0, 56.0, 40.0, 35.0, 45.0, 33.0, 31.0, 16.0, 25.0, 22.0, 22.0, 6.0, 12.0, 7.0, 10.0, 5.0, 4.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-23.375, -22.692626953125, -22.01025390625, -21.327880859375, -20.6455078125, -19.963134765625, -19.28076171875, -18.598388671875, -17.916015625, -17.233642578125, -16.55126953125, -15.868896484375, -15.1865234375, -14.504150390625, -13.82177734375, -13.139404296875, -12.45703125, -11.774658203125, -11.09228515625, -10.409912109375, -9.7275390625, -9.045166015625, -8.36279296875, -7.680419921875, -6.998046875, -6.315673828125, -5.63330078125, -4.950927734375, -4.2685546875, -3.586181640625, -2.90380859375, -2.221435546875, -1.5390625, -0.856689453125, -0.17431640625, 0.508056640625, 1.1904296875, 1.872802734375, 2.55517578125, 3.237548828125, 3.919921875, 4.602294921875, 5.28466796875, 5.967041015625, 6.6494140625, 7.331787109375, 8.01416015625, 8.696533203125, 9.37890625, 10.061279296875, 10.74365234375, 11.426025390625, 12.1083984375, 12.790771484375, 13.47314453125, 14.155517578125, 14.837890625, 15.520263671875, 16.20263671875, 16.885009765625, 17.5673828125, 18.249755859375, 18.93212890625, 19.614501953125, 20.296875]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 8.0, 10.0, 11.0, 18.0, 25.0, 38.0, 58.0, 81.0, 88.0, 173.0, 262.0, 345.0, 573.0, 872.0, 1305.0, 2124.0, 3373.0, 5435.0, 9796.0, 17769.0, 44683.0, 631207.0, 3268150.0, 148280.0, 27810.0, 13367.0, 7246.0, 4211.0, 2545.0, 1568.0, 986.0, 613.0, 434.0, 256.0, 177.0, 125.0, 67.0, 63.0, 45.0, 24.0, 21.0, 14.0, 13.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-65.25, -63.28857421875, -61.3271484375, -59.36572265625, -57.404296875, -55.44287109375, -53.4814453125, -51.52001953125, -49.55859375, -47.59716796875, -45.6357421875, -43.67431640625, -41.712890625, -39.75146484375, -37.7900390625, -35.82861328125, -33.8671875, -31.90576171875, -29.9443359375, -27.98291015625, -26.021484375, -24.06005859375, -22.0986328125, -20.13720703125, -18.17578125, -16.21435546875, -14.2529296875, -12.29150390625, -10.330078125, -8.36865234375, -6.4072265625, -4.44580078125, -2.484375, -0.52294921875, 1.4384765625, 3.39990234375, 5.361328125, 7.32275390625, 9.2841796875, 11.24560546875, 13.20703125, 15.16845703125, 17.1298828125, 19.09130859375, 21.052734375, 23.01416015625, 24.9755859375, 26.93701171875, 28.8984375, 30.85986328125, 32.8212890625, 34.78271484375, 36.744140625, 38.70556640625, 40.6669921875, 42.62841796875, 44.58984375, 46.55126953125, 48.5126953125, 50.47412109375, 52.435546875, 54.39697265625, 56.3583984375, 58.31982421875, 60.28125]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 5.0, 5.0, 9.0, 8.0, 7.0, 10.0, 16.0, 17.0, 34.0, 52.0, 54.0, 79.0, 178.0, 738.0, 1675.0, 727.0, 203.0, 76.0, 59.0, 33.0, 22.0, 20.0, 19.0, 8.0, 5.0, 7.0, 3.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-79.125, -76.13671875, -73.1484375, -70.16015625, -67.171875, -64.18359375, -61.1953125, -58.20703125, -55.21875, -52.23046875, -49.2421875, -46.25390625, -43.265625, -40.27734375, -37.2890625, -34.30078125, -31.3125, -28.32421875, -25.3359375, -22.34765625, -19.359375, -16.37109375, -13.3828125, -10.39453125, -7.40625, -4.41796875, -1.4296875, 1.55859375, 4.546875, 7.53515625, 10.5234375, 13.51171875, 16.5, 19.48828125, 22.4765625, 25.46484375, 28.453125, 31.44140625, 34.4296875, 37.41796875, 40.40625, 43.39453125, 46.3828125, 49.37109375, 52.359375, 55.34765625, 58.3359375, 61.32421875, 64.3125, 67.30078125, 70.2890625, 73.27734375, 76.265625, 79.25390625, 82.2421875, 85.23046875, 88.21875, 91.20703125, 94.1953125, 97.18359375, 100.171875, 103.16015625, 106.1484375, 109.13671875, 112.125]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 7.0, 7.0, 10.0, 17.0, 24.0, 33.0, 66.0, 96.0, 148.0, 257.0, 503.0, 917.0, 1734.0, 3686.0, 8205.0, 21613.0, 76096.0, 3030056.0, 959128.0, 59923.0, 18013.0, 7128.0, 3226.0, 1504.0, 838.0, 432.0, 235.0, 146.0, 77.0, 50.0, 40.0, 21.0, 15.0, 10.0, 14.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-144.125, -139.8759765625, -135.626953125, -131.3779296875, -127.12890625, -122.8798828125, -118.630859375, -114.3818359375, -110.1328125, -105.8837890625, -101.634765625, -97.3857421875, -93.13671875, -88.8876953125, -84.638671875, -80.3896484375, -76.140625, -71.8916015625, -67.642578125, -63.3935546875, -59.14453125, -54.8955078125, -50.646484375, -46.3974609375, -42.1484375, -37.8994140625, -33.650390625, -29.4013671875, -25.15234375, -20.9033203125, -16.654296875, -12.4052734375, -8.15625, -3.9072265625, 0.341796875, 4.5908203125, 8.83984375, 13.0888671875, 17.337890625, 21.5869140625, 25.8359375, 30.0849609375, 34.333984375, 38.5830078125, 42.83203125, 47.0810546875, 51.330078125, 55.5791015625, 59.828125, 64.0771484375, 68.326171875, 72.5751953125, 76.82421875, 81.0732421875, 85.322265625, 89.5712890625, 93.8203125, 98.0693359375, 102.318359375, 106.5673828125, 110.81640625, 115.0654296875, 119.314453125, 123.5634765625, 127.8125]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 16.0, 12.0, 32.0, 64.0, 169.0, 423.0, 174.0, 57.0, 31.0, 11.0, 8.0, 5.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-641.5611572265625, -619.0591430664062, -596.5571899414062, -574.05517578125, -551.55322265625, -529.0512084960938, -506.5492248535156, -484.0472412109375, -461.5452575683594, -439.04327392578125, -416.5412902832031, -394.039306640625, -371.53729248046875, -349.03533935546875, -326.5333251953125, -304.0313415527344, -281.52935791015625, -259.0273742675781, -236.525390625, -214.0233917236328, -191.5214080810547, -169.01942443847656, -146.51742553710938, -124.01544189453125, -101.51345825195312, -79.011474609375, -56.509483337402344, -34.00749206542969, -11.505508422851562, 10.996475219726562, 33.49847412109375, 56.000457763671875, 78.50238037109375, 101.00436401367188, 123.50635528564453, 146.0083465576172, 168.5103302001953, 191.01231384277344, 213.51431274414062, 236.01629638671875, 258.5182800292969, 281.020263671875, 303.5222473144531, 326.02423095703125, 348.5262451171875, 371.0281982421875, 393.53021240234375, 416.0321960449219, 438.5341796875, 461.0361633300781, 483.53814697265625, 506.0401611328125, 528.5421142578125, 551.0441284179688, 573.546142578125, 596.048095703125, 618.550048828125, 641.0520629882812, 663.5540161132812, 686.0560302734375, 708.5579833984375, 731.0599975585938, 753.56201171875, 776.06396484375, 798.5659790039062]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 1.0, 6.0, 4.0, 9.0, 10.0, 11.0, 11.0, 15.0, 23.0, 31.0, 26.0, 27.0, 33.0, 33.0, 38.0, 53.0, 44.0, 51.0, 48.0, 32.0, 59.0, 48.0, 44.0, 36.0, 31.0, 41.0, 34.0, 22.0, 29.0, 25.0, 24.0, 17.0, 11.0, 15.0, 15.0, 12.0, 9.0, 8.0, 5.0, 3.0, 4.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-183.6816864013672, -177.49147033691406, -171.30123901367188, -165.11102294921875, -158.92079162597656, -152.73057556152344, -146.54034423828125, -140.35012817382812, -134.159912109375, -127.96968841552734, -121.77946472167969, -115.58924865722656, -109.39901733398438, -103.20880126953125, -97.0185775756836, -90.82835388183594, -84.63812255859375, -78.4478988647461, -72.25767517089844, -66.06745910644531, -59.87723159790039, -53.687007904052734, -47.496788024902344, -41.30656433105469, -35.11634063720703, -28.926116943359375, -22.73589515686035, -16.545673370361328, -10.355449676513672, -4.165225982666016, 2.024993896484375, 8.215217590332031, 14.40545654296875, 20.595680236816406, 26.78590202331543, 32.97612380981445, 39.16634750366211, 45.356571197509766, 51.546791076660156, 57.73701477050781, 63.92723846435547, 70.11746215820312, 76.30768585205078, 82.49790954589844, 88.68812561035156, 94.87835693359375, 101.06857299804688, 107.25879669189453, 113.44902038574219, 119.63924407958984, 125.8294677734375, 132.01968383789062, 138.2099151611328, 144.40013122558594, 150.59036254882812, 156.78057861328125, 162.97079467773438, 169.1610107421875, 175.3512420654297, 181.5414581298828, 187.731689453125, 193.92190551757812, 200.11212158203125, 206.30235290527344, 212.49258422851562]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 5.0, 3.0, 6.0, 7.0, 9.0, 10.0, 13.0, 14.0, 21.0, 21.0, 17.0, 26.0, 24.0, 31.0, 33.0, 25.0, 39.0, 43.0, 50.0, 54.0, 49.0, 46.0, 57.0, 40.0, 40.0, 35.0, 36.0, 28.0, 32.0, 37.0, 27.0, 19.0, 20.0, 22.0, 15.0, 10.0, 12.0, 7.0, 6.0, 5.0, 5.0, 0.0, 5.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.796875, -21.135498046875, -20.47412109375, -19.812744140625, -19.1513671875, -18.489990234375, -17.82861328125, -17.167236328125, -16.505859375, -15.844482421875, -15.18310546875, -14.521728515625, -13.8603515625, -13.198974609375, -12.53759765625, -11.876220703125, -11.21484375, -10.553466796875, -9.89208984375, -9.230712890625, -8.5693359375, -7.907958984375, -7.24658203125, -6.585205078125, -5.923828125, -5.262451171875, -4.60107421875, -3.939697265625, -3.2783203125, -2.616943359375, -1.95556640625, -1.294189453125, -0.6328125, 0.028564453125, 0.68994140625, 1.351318359375, 2.0126953125, 2.674072265625, 3.33544921875, 3.996826171875, 4.658203125, 5.319580078125, 5.98095703125, 6.642333984375, 7.3037109375, 7.965087890625, 8.62646484375, 9.287841796875, 9.94921875, 10.610595703125, 11.27197265625, 11.933349609375, 12.5947265625, 13.256103515625, 13.91748046875, 14.578857421875, 15.240234375, 15.901611328125, 16.56298828125, 17.224365234375, 17.8857421875, 18.547119140625, 19.20849609375, 19.869873046875, 20.53125]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 7.0, 7.0, 10.0, 26.0, 20.0, 49.0, 57.0, 91.0, 119.0, 181.0, 258.0, 480.0, 617.0, 962.0, 1647.0, 2613.0, 4071.0, 6841.0, 11517.0, 19838.0, 35394.0, 66014.0, 135851.0, 282736.0, 239671.0, 111181.0, 55066.0, 29999.0, 17178.0, 10171.0, 6061.0, 3686.0, 2187.0, 1416.0, 869.0, 559.0, 355.0, 250.0, 167.0, 108.0, 63.0, 53.0, 28.0, 27.0, 21.0, 14.0, 8.0, 5.0, 5.0, 5.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0498046875, -1.0157928466796875, -0.981781005859375, -0.9477691650390625, -0.91375732421875, -0.8797454833984375, -0.845733642578125, -0.8117218017578125, -0.7777099609375, -0.7436981201171875, -0.709686279296875, -0.6756744384765625, -0.64166259765625, -0.6076507568359375, -0.573638916015625, -0.5396270751953125, -0.505615234375, -0.4716033935546875, -0.437591552734375, -0.4035797119140625, -0.36956787109375, -0.3355560302734375, -0.301544189453125, -0.2675323486328125, -0.2335205078125, -0.1995086669921875, -0.165496826171875, -0.1314849853515625, -0.09747314453125, -0.0634613037109375, -0.029449462890625, 0.0045623779296875, 0.03857421875, 0.0725860595703125, 0.106597900390625, 0.1406097412109375, 0.17462158203125, 0.2086334228515625, 0.242645263671875, 0.2766571044921875, 0.3106689453125, 0.3446807861328125, 0.378692626953125, 0.4127044677734375, 0.44671630859375, 0.4807281494140625, 0.514739990234375, 0.5487518310546875, 0.582763671875, 0.6167755126953125, 0.650787353515625, 0.6847991943359375, 0.71881103515625, 0.7528228759765625, 0.786834716796875, 0.8208465576171875, 0.8548583984375, 0.8888702392578125, 0.922882080078125, 0.9568939208984375, 0.99090576171875, 1.0249176025390625, 1.058929443359375, 1.0929412841796875, 1.126953125]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 9.0, 8.0, 6.0, 7.0, 6.0, 12.0, 14.0, 16.0, 19.0, 17.0, 18.0, 21.0, 30.0, 26.0, 25.0, 20.0, 31.0, 37.0, 39.0, 31.0, 37.0, 30.0, 1064.0, 41.0, 50.0, 38.0, 30.0, 29.0, 35.0, 33.0, 32.0, 22.0, 26.0, 22.0, 14.0, 25.0, 16.0, 7.0, 10.0, 15.0, 15.0, 10.0, 11.0, 6.0, 3.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-11.7734375, -11.4246826171875, -11.075927734375, -10.7271728515625, -10.37841796875, -10.0296630859375, -9.680908203125, -9.3321533203125, -8.9833984375, -8.6346435546875, -8.285888671875, -7.9371337890625, -7.58837890625, -7.2396240234375, -6.890869140625, -6.5421142578125, -6.193359375, -5.8446044921875, -5.495849609375, -5.1470947265625, -4.79833984375, -4.4495849609375, -4.100830078125, -3.7520751953125, -3.4033203125, -3.0545654296875, -2.705810546875, -2.3570556640625, -2.00830078125, -1.6595458984375, -1.310791015625, -0.9620361328125, -0.61328125, -0.2645263671875, 0.084228515625, 0.4329833984375, 0.78173828125, 1.1304931640625, 1.479248046875, 1.8280029296875, 2.1767578125, 2.5255126953125, 2.874267578125, 3.2230224609375, 3.57177734375, 3.9205322265625, 4.269287109375, 4.6180419921875, 4.966796875, 5.3155517578125, 5.664306640625, 6.0130615234375, 6.36181640625, 6.7105712890625, 7.059326171875, 7.4080810546875, 7.7568359375, 8.1055908203125, 8.454345703125, 8.8031005859375, 9.15185546875, 9.5006103515625, 9.849365234375, 10.1981201171875, 10.546875]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 2.0, 11.0, 12.0, 18.0, 34.0, 46.0, 71.0, 96.0, 159.0, 237.0, 345.0, 458.0, 682.0, 935.0, 1321.0, 1913.0, 2570.0, 3538.0, 4901.0, 6741.0, 9337.0, 13102.0, 18382.0, 26788.0, 39120.0, 59116.0, 95894.0, 163946.0, 1255091.0, 139907.0, 82531.0, 52285.0, 34842.0, 23898.0, 16568.0, 11854.0, 8465.0, 6123.0, 4459.0, 3295.0, 2323.0, 1693.0, 1230.0, 859.0, 626.0, 424.0, 285.0, 207.0, 147.0, 90.0, 54.0, 45.0, 28.0, 12.0, 10.0, 7.0, 5.0, 3.0, 2.0, 2.0, 2.0], "bins": [-0.6611328125, -0.640045166015625, -0.61895751953125, -0.597869873046875, -0.5767822265625, -0.555694580078125, -0.53460693359375, -0.513519287109375, -0.492431640625, -0.471343994140625, -0.45025634765625, -0.429168701171875, -0.4080810546875, -0.386993408203125, -0.36590576171875, -0.344818115234375, -0.32373046875, -0.302642822265625, -0.28155517578125, -0.260467529296875, -0.2393798828125, -0.218292236328125, -0.19720458984375, -0.176116943359375, -0.155029296875, -0.133941650390625, -0.11285400390625, -0.091766357421875, -0.0706787109375, -0.049591064453125, -0.02850341796875, -0.007415771484375, 0.013671875, 0.034759521484375, 0.05584716796875, 0.076934814453125, 0.0980224609375, 0.119110107421875, 0.14019775390625, 0.161285400390625, 0.182373046875, 0.203460693359375, 0.22454833984375, 0.245635986328125, 0.2667236328125, 0.287811279296875, 0.30889892578125, 0.329986572265625, 0.35107421875, 0.372161865234375, 0.39324951171875, 0.414337158203125, 0.4354248046875, 0.456512451171875, 0.47760009765625, 0.498687744140625, 0.519775390625, 0.540863037109375, 0.56195068359375, 0.583038330078125, 0.6041259765625, 0.625213623046875, 0.64630126953125, 0.667388916015625, 0.6884765625]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 4.0, 3.0, 3.0, 2.0, 4.0, 7.0, 7.0, 11.0, 11.0, 11.0, 7.0, 19.0, 25.0, 25.0, 17.0, 33.0, 18.0, 30.0, 38.0, 38.0, 45.0, 34.0, 39.0, 54.0, 46.0, 53.0, 34.0, 37.0, 31.0, 49.0, 42.0, 25.0, 31.0, 24.0, 28.0, 20.0, 24.0, 13.0, 9.0, 7.0, 8.0, 8.0, 6.0, 3.0, 4.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.002750396728515625, -0.002663552761077881, -0.0025767087936401367, -0.0024898648262023926, -0.0024030208587646484, -0.0023161768913269043, -0.00222933292388916, -0.002142488956451416, -0.002055644989013672, -0.0019688010215759277, -0.0018819570541381836, -0.0017951130867004395, -0.0017082691192626953, -0.0016214251518249512, -0.001534581184387207, -0.0014477372169494629, -0.0013608932495117188, -0.0012740492820739746, -0.0011872053146362305, -0.0011003613471984863, -0.0010135173797607422, -0.000926673412322998, -0.0008398294448852539, -0.0007529854774475098, -0.0006661415100097656, -0.0005792975425720215, -0.0004924535751342773, -0.0004056096076965332, -0.00031876564025878906, -0.00023192167282104492, -0.00014507770538330078, -5.823373794555664e-05, 2.86102294921875e-05, 0.00011545419692993164, 0.00020229816436767578, 0.0002891421318054199, 0.00037598609924316406, 0.0004628300666809082, 0.0005496740341186523, 0.0006365180015563965, 0.0007233619689941406, 0.0008102059364318848, 0.0008970499038696289, 0.000983893871307373, 0.0010707378387451172, 0.0011575818061828613, 0.0012444257736206055, 0.0013312697410583496, 0.0014181137084960938, 0.0015049576759338379, 0.001591801643371582, 0.0016786456108093262, 0.0017654895782470703, 0.0018523335456848145, 0.0019391775131225586, 0.0020260214805603027, 0.002112865447998047, 0.002199709415435791, 0.002286553382873535, 0.0023733973503112793, 0.0024602413177490234, 0.0025470852851867676, 0.0026339292526245117, 0.002720773220062256, 0.0028076171875]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 5.0, 3.0, 6.0, 12.0, 9.0, 16.0, 17.0, 25.0, 23.0, 44.0, 54.0, 53.0, 62.0, 85.0, 124.0, 204.0, 310.0, 518.0, 2552.0, 27832.0, 666074.0, 331560.0, 15730.0, 1837.0, 481.0, 257.0, 169.0, 114.0, 75.0, 64.0, 49.0, 42.0, 35.0, 23.0, 18.0, 15.0, 16.0, 7.0, 10.0, 3.0, 4.0, 4.0, 4.0, 5.0, 2.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.051849365234375, -0.05027294158935547, -0.04869651794433594, -0.047120094299316406, -0.045543670654296875, -0.043967247009277344, -0.04239082336425781, -0.04081439971923828, -0.03923797607421875, -0.03766155242919922, -0.03608512878417969, -0.034508705139160156, -0.032932281494140625, -0.031355857849121094, -0.029779434204101562, -0.02820301055908203, -0.0266265869140625, -0.02505016326904297, -0.023473739624023438, -0.021897315979003906, -0.020320892333984375, -0.018744468688964844, -0.017168045043945312, -0.015591621398925781, -0.01401519775390625, -0.012438774108886719, -0.010862350463867188, -0.009285926818847656, -0.007709503173828125, -0.006133079528808594, -0.0045566558837890625, -0.0029802322387695312, -0.00140380859375, 0.00017261505126953125, 0.0017490386962890625, 0.0033254623413085938, 0.004901885986328125, 0.006478309631347656, 0.008054733276367188, 0.009631156921386719, 0.01120758056640625, 0.012784004211425781, 0.014360427856445312, 0.015936851501464844, 0.017513275146484375, 0.019089698791503906, 0.020666122436523438, 0.02224254608154297, 0.0238189697265625, 0.02539539337158203, 0.026971817016601562, 0.028548240661621094, 0.030124664306640625, 0.031701087951660156, 0.03327751159667969, 0.03485393524169922, 0.03643035888671875, 0.03800678253173828, 0.03958320617675781, 0.041159629821777344, 0.042736053466796875, 0.044312477111816406, 0.04588890075683594, 0.04746532440185547, 0.049041748046875]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 16.0, 30.0, 98.0, 250.0, 306.0, 156.0, 65.0, 35.0, 24.0, 13.0, 9.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.004133736249059439, -0.0037919438909739256, -0.003450151300057769, -0.0031083589419722557, -0.002766566351056099, -0.002424773992970586, -0.0020829816348850727, -0.001741189043968916, -0.0013993966858834028, -0.0010576042113825679, -0.0007158117950893939, -0.0003740193787962198, -3.2226904295384884e-05, 0.00030956557020545006, 0.0006513579282909632, 0.00099315051920712, 0.001334942877292633, 0.001676735351793468, 0.002018527826294303, 0.002360320184379816, 0.002702112775295973, 0.003043905133381486, 0.003385697491466999, 0.003727490082383156, 0.004069282673299313, 0.004411075264215469, 0.004752867389470339, 0.005094659980386496, 0.005436452571302652, 0.005778244696557522, 0.006120037287473679, 0.006461829878389835, 0.0068036215379834175, 0.007145414128899574, 0.007487206254154444, 0.007828999310731888, 0.00817079097032547, 0.008512583561241627, 0.008854376152157784, 0.00919616874307394, 0.009537961333990097, 0.009879753924906254, 0.01022154651582241, 0.010563338175415993, 0.01090513076633215, 0.011246923357248306, 0.011588715948164463, 0.01193050853908062, 0.012272300198674202, 0.012614092789590359, 0.012955885380506516, 0.013297677040100098, 0.013639469631016254, 0.013981262221932411, 0.014323054812848568, 0.014664847403764725, 0.015006639994680882, 0.015348432585597038, 0.01569022424519062, 0.016032017767429352, 0.016373809427022934, 0.016715602949261665, 0.017057394608855247, 0.01739918813109398, 0.01774097979068756]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 7.0, 2.0, 3.0, 4.0, 9.0, 9.0, 13.0, 12.0, 13.0, 11.0, 16.0, 26.0, 27.0, 22.0, 31.0, 27.0, 38.0, 46.0, 52.0, 43.0, 51.0, 41.0, 48.0, 41.0, 41.0, 46.0, 36.0, 34.0, 36.0, 33.0, 29.0, 23.0, 27.0, 18.0, 27.0, 14.0, 16.0, 7.0, 11.0, 8.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.002096116542816162, -0.0020323926582932472, -0.0019686687737703323, -0.0019049448892474174, -0.0018412210047245026, -0.0017774971202015877, -0.0017137732356786728, -0.001650049351155758, -0.001586325466632843, -0.0015226015821099281, -0.0014588776975870132, -0.0013951538130640984, -0.0013314299285411835, -0.0012677060440182686, -0.0012039821594953537, -0.0011402582749724388, -0.001076534390449524, -0.001012810505926609, -0.0009490866214036942, -0.0008853627368807793, -0.0008216388523578644, -0.0007579149678349495, -0.0006941910833120346, -0.0006304671987891197, -0.0005667433142662048, -0.00050301942974329, -0.00043929554522037506, -0.0003755716606974602, -0.0003118477761745453, -0.0002481238916516304, -0.00018440000712871552, -0.00012067612260580063, -5.695223808288574e-05, 6.771646440029144e-06, 7.049553096294403e-05, 0.00013421941548585892, 0.0001979433000087738, 0.0002616671845316887, 0.0003253910690546036, 0.00038911495357751846, 0.00045283883810043335, 0.0005165627226233482, 0.0005802866071462631, 0.000644010491669178, 0.0007077343761920929, 0.0007714582607150078, 0.0008351821452379227, 0.0008989060297608376, 0.0009626299142837524, 0.0010263537988066673, 0.0010900776833295822, 0.001153801567852497, 0.001217525452375412, 0.0012812493368983269, 0.0013449732214212418, 0.0014086971059441566, 0.0014724209904670715, 0.0015361448749899864, 0.0015998687595129013, 0.0016635926440358162, 0.001727316528558731, 0.001791040413081646, 0.0018547642976045609, 0.0019184881821274757, 0.0019822120666503906]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 5.0, 3.0, 6.0, 7.0, 9.0, 10.0, 13.0, 14.0, 21.0, 21.0, 17.0, 26.0, 24.0, 31.0, 33.0, 25.0, 39.0, 43.0, 50.0, 54.0, 49.0, 46.0, 57.0, 40.0, 40.0, 35.0, 36.0, 28.0, 32.0, 37.0, 27.0, 19.0, 20.0, 22.0, 15.0, 10.0, 12.0, 7.0, 6.0, 5.0, 5.0, 0.0, 5.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.796875, -21.135498046875, -20.47412109375, -19.812744140625, -19.1513671875, -18.489990234375, -17.82861328125, -17.167236328125, -16.505859375, -15.844482421875, -15.18310546875, -14.521728515625, -13.8603515625, -13.198974609375, -12.53759765625, -11.876220703125, -11.21484375, -10.553466796875, -9.89208984375, -9.230712890625, -8.5693359375, -7.907958984375, -7.24658203125, -6.585205078125, -5.923828125, -5.262451171875, -4.60107421875, -3.939697265625, -3.2783203125, -2.616943359375, -1.95556640625, -1.294189453125, -0.6328125, 0.028564453125, 0.68994140625, 1.351318359375, 2.0126953125, 2.674072265625, 3.33544921875, 3.996826171875, 4.658203125, 5.319580078125, 5.98095703125, 6.642333984375, 7.3037109375, 7.965087890625, 8.62646484375, 9.287841796875, 9.94921875, 10.610595703125, 11.27197265625, 11.933349609375, 12.5947265625, 13.256103515625, 13.91748046875, 14.578857421875, 15.240234375, 15.901611328125, 16.56298828125, 17.224365234375, 17.8857421875, 18.547119140625, 19.20849609375, 19.869873046875, 20.53125]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 4.0, 2.0, 4.0, 3.0, 7.0, 7.0, 16.0, 11.0, 25.0, 23.0, 31.0, 47.0, 82.0, 87.0, 142.0, 228.0, 335.0, 538.0, 849.0, 1608.0, 3469.0, 9822.0, 48825.0, 878050.0, 83218.0, 12436.0, 4148.0, 1870.0, 970.0, 594.0, 353.0, 231.0, 152.0, 104.0, 70.0, 54.0, 43.0, 29.0, 20.0, 14.0, 13.0, 11.0, 3.0, 5.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-46.5625, -45.0888671875, -43.615234375, -42.1416015625, -40.66796875, -39.1943359375, -37.720703125, -36.2470703125, -34.7734375, -33.2998046875, -31.826171875, -30.3525390625, -28.87890625, -27.4052734375, -25.931640625, -24.4580078125, -22.984375, -21.5107421875, -20.037109375, -18.5634765625, -17.08984375, -15.6162109375, -14.142578125, -12.6689453125, -11.1953125, -9.7216796875, -8.248046875, -6.7744140625, -5.30078125, -3.8271484375, -2.353515625, -0.8798828125, 0.59375, 2.0673828125, 3.541015625, 5.0146484375, 6.48828125, 7.9619140625, 9.435546875, 10.9091796875, 12.3828125, 13.8564453125, 15.330078125, 16.8037109375, 18.27734375, 19.7509765625, 21.224609375, 22.6982421875, 24.171875, 25.6455078125, 27.119140625, 28.5927734375, 30.06640625, 31.5400390625, 33.013671875, 34.4873046875, 35.9609375, 37.4345703125, 38.908203125, 40.3818359375, 41.85546875, 43.3291015625, 44.802734375, 46.2763671875, 47.75]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 6.0, 5.0, 7.0, 10.0, 9.0, 15.0, 17.0, 19.0, 15.0, 22.0, 26.0, 43.0, 19.0, 36.0, 37.0, 48.0, 56.0, 57.0, 76.0, 130.0, 1775.0, 119.0, 62.0, 56.0, 38.0, 53.0, 43.0, 35.0, 30.0, 29.0, 25.0, 16.0, 27.0, 14.0, 12.0, 11.0, 16.0, 8.0, 6.0, 4.0, 3.0, 4.0, 2.0, 2.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-62.3125, -60.2685546875, -58.224609375, -56.1806640625, -54.13671875, -52.0927734375, -50.048828125, -48.0048828125, -45.9609375, -43.9169921875, -41.873046875, -39.8291015625, -37.78515625, -35.7412109375, -33.697265625, -31.6533203125, -29.609375, -27.5654296875, -25.521484375, -23.4775390625, -21.43359375, -19.3896484375, -17.345703125, -15.3017578125, -13.2578125, -11.2138671875, -9.169921875, -7.1259765625, -5.08203125, -3.0380859375, -0.994140625, 1.0498046875, 3.09375, 5.1376953125, 7.181640625, 9.2255859375, 11.26953125, 13.3134765625, 15.357421875, 17.4013671875, 19.4453125, 21.4892578125, 23.533203125, 25.5771484375, 27.62109375, 29.6650390625, 31.708984375, 33.7529296875, 35.796875, 37.8408203125, 39.884765625, 41.9287109375, 43.97265625, 46.0166015625, 48.060546875, 50.1044921875, 52.1484375, 54.1923828125, 56.236328125, 58.2802734375, 60.32421875, 62.3681640625, 64.412109375, 66.4560546875, 68.5]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 5.0, 5.0, 10.0, 11.0, 27.0, 50.0, 77.0, 137.0, 222.0, 579.0, 2422.0, 56608.0, 3074877.0, 8880.0, 1025.0, 350.0, 173.0, 96.0, 53.0, 40.0, 18.0, 20.0, 7.0, 6.0, 5.0, 4.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-355.0, -346.79296875, -338.5859375, -330.37890625, -322.171875, -313.96484375, -305.7578125, -297.55078125, -289.34375, -281.13671875, -272.9296875, -264.72265625, -256.515625, -248.30859375, -240.1015625, -231.89453125, -223.6875, -215.48046875, -207.2734375, -199.06640625, -190.859375, -182.65234375, -174.4453125, -166.23828125, -158.03125, -149.82421875, -141.6171875, -133.41015625, -125.203125, -116.99609375, -108.7890625, -100.58203125, -92.375, -84.16796875, -75.9609375, -67.75390625, -59.546875, -51.33984375, -43.1328125, -34.92578125, -26.71875, -18.51171875, -10.3046875, -2.09765625, 6.109375, 14.31640625, 22.5234375, 30.73046875, 38.9375, 47.14453125, 55.3515625, 63.55859375, 71.765625, 79.97265625, 88.1796875, 96.38671875, 104.59375, 112.80078125, 121.0078125, 129.21484375, 137.421875, 145.62890625, 153.8359375, 162.04296875, 170.25]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 37.0, 503.0, 428.0, 44.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1105.7313232421875, -1086.3189697265625, -1066.90673828125, -1047.494384765625, -1028.08203125, -1008.6697387695312, -989.2574462890625, -969.8450927734375, -950.4328002929688, -931.0205078125, -911.608154296875, -892.1958618164062, -872.7835083007812, -853.3712158203125, -833.9588623046875, -814.5465698242188, -795.13427734375, -775.7219848632812, -756.3096313476562, -736.8973388671875, -717.4849853515625, -698.0726928710938, -678.660400390625, -659.248046875, -639.835693359375, -620.4234008789062, -601.0110473632812, -581.5987548828125, -562.1864013671875, -542.7741088867188, -523.36181640625, -503.949462890625, -484.5372314453125, -465.1249084472656, -445.71258544921875, -426.30029296875, -406.8879699707031, -387.47564697265625, -368.0633239746094, -348.6510009765625, -329.2386779785156, -309.82635498046875, -290.4140319824219, -271.001708984375, -251.58941650390625, -232.17709350585938, -212.7647705078125, -193.3524627685547, -173.9401397705078, -154.52781677246094, -135.11550903320312, -115.70318603515625, -96.2908706665039, -76.87855529785156, -57.46623229980469, -38.053924560546875, -18.6416015625, 0.7707157135009766, 20.183032989501953, 39.59535217285156, 59.007667541503906, 78.41998291015625, 97.83230590820312, 117.24461364746094, 136.6569366455078]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 8.0, 13.0, 5.0, 9.0, 15.0, 14.0, 26.0, 23.0, 25.0, 20.0, 38.0, 29.0, 29.0, 31.0, 30.0, 39.0, 48.0, 56.0, 50.0, 47.0, 43.0, 50.0, 44.0, 42.0, 44.0, 29.0, 41.0, 26.0, 23.0, 14.0, 22.0, 20.0, 13.0, 6.0, 9.0, 5.0, 3.0, 8.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-239.0789794921875, -232.3161163330078, -225.5532684326172, -218.7904052734375, -212.0275421142578, -205.26467895507812, -198.5018310546875, -191.7389678955078, -184.97610473632812, -178.21324157714844, -171.4503936767578, -164.68753051757812, -157.92466735839844, -151.16180419921875, -144.39895629882812, -137.63609313964844, -130.8732452392578, -124.11038970947266, -117.34752655029297, -110.58467102050781, -103.82180786132812, -97.05895233154297, -90.29609680175781, -83.53323364257812, -76.77037811279297, -70.00752258300781, -63.244659423828125, -56.48180389404297, -49.71894454956055, -42.956085205078125, -36.19322967529297, -29.430370330810547, -22.667510986328125, -15.90465259552002, -9.141794204711914, -2.378936767578125, 4.383922576904297, 11.146781921386719, 17.909637451171875, 24.672496795654297, 31.43535614013672, 38.19821548461914, 44.96107482910156, 51.72393035888672, 58.48678970336914, 65.24964904785156, 72.01250457763672, 78.77536010742188, 85.53822326660156, 92.30107879638672, 99.0639419555664, 105.82679748535156, 112.58966064453125, 119.3525161743164, 126.11537170410156, 132.87823486328125, 139.64108276367188, 146.40394592285156, 153.1667938232422, 159.92965698242188, 166.69252014160156, 173.45538330078125, 180.21823120117188, 186.98109436035156, 193.74395751953125]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 4.0, 11.0, 8.0, 11.0, 11.0, 14.0, 21.0, 21.0, 23.0, 19.0, 25.0, 21.0, 42.0, 33.0, 26.0, 38.0, 46.0, 49.0, 41.0, 59.0, 52.0, 48.0, 42.0, 40.0, 31.0, 37.0, 42.0, 27.0, 23.0, 21.0, 17.0, 16.0, 13.0, 18.0, 14.0, 11.0, 7.0, 2.0, 6.0, 6.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-21.703125, -21.0322265625, -20.361328125, -19.6904296875, -19.01953125, -18.3486328125, -17.677734375, -17.0068359375, -16.3359375, -15.6650390625, -14.994140625, -14.3232421875, -13.65234375, -12.9814453125, -12.310546875, -11.6396484375, -10.96875, -10.2978515625, -9.626953125, -8.9560546875, -8.28515625, -7.6142578125, -6.943359375, -6.2724609375, -5.6015625, -4.9306640625, -4.259765625, -3.5888671875, -2.91796875, -2.2470703125, -1.576171875, -0.9052734375, -0.234375, 0.4365234375, 1.107421875, 1.7783203125, 2.44921875, 3.1201171875, 3.791015625, 4.4619140625, 5.1328125, 5.8037109375, 6.474609375, 7.1455078125, 7.81640625, 8.4873046875, 9.158203125, 9.8291015625, 10.5, 11.1708984375, 11.841796875, 12.5126953125, 13.18359375, 13.8544921875, 14.525390625, 15.1962890625, 15.8671875, 16.5380859375, 17.208984375, 17.8798828125, 18.55078125, 19.2216796875, 19.892578125, 20.5634765625, 21.234375]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 3.0, 8.0, 6.0, 17.0, 15.0, 14.0, 44.0, 37.0, 59.0, 83.0, 147.0, 223.0, 388.0, 651.0, 1246.0, 2424.0, 4557.0, 9792.0, 24248.0, 247275.0, 3705066.0, 159029.0, 21310.0, 8898.0, 4033.0, 2098.0, 1114.0, 567.0, 304.0, 197.0, 124.0, 116.0, 55.0, 45.0, 27.0, 12.0, 12.0, 10.0, 6.0, 11.0, 10.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-78.0625, -75.498046875, -72.93359375, -70.369140625, -67.8046875, -65.240234375, -62.67578125, -60.111328125, -57.546875, -54.982421875, -52.41796875, -49.853515625, -47.2890625, -44.724609375, -42.16015625, -39.595703125, -37.03125, -34.466796875, -31.90234375, -29.337890625, -26.7734375, -24.208984375, -21.64453125, -19.080078125, -16.515625, -13.951171875, -11.38671875, -8.822265625, -6.2578125, -3.693359375, -1.12890625, 1.435546875, 4.0, 6.564453125, 9.12890625, 11.693359375, 14.2578125, 16.822265625, 19.38671875, 21.951171875, 24.515625, 27.080078125, 29.64453125, 32.208984375, 34.7734375, 37.337890625, 39.90234375, 42.466796875, 45.03125, 47.595703125, 50.16015625, 52.724609375, 55.2890625, 57.853515625, 60.41796875, 62.982421875, 65.546875, 68.111328125, 70.67578125, 73.240234375, 75.8046875, 78.369140625, 80.93359375, 83.498046875, 86.0625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 5.0, 9.0, 9.0, 9.0, 12.0, 19.0, 39.0, 21.0, 61.0, 102.0, 355.0, 1181.0, 1507.0, 410.0, 118.0, 63.0, 36.0, 34.0, 22.0, 19.0, 12.0, 5.0, 7.0, 5.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-109.1875, -106.076171875, -102.96484375, -99.853515625, -96.7421875, -93.630859375, -90.51953125, -87.408203125, -84.296875, -81.185546875, -78.07421875, -74.962890625, -71.8515625, -68.740234375, -65.62890625, -62.517578125, -59.40625, -56.294921875, -53.18359375, -50.072265625, -46.9609375, -43.849609375, -40.73828125, -37.626953125, -34.515625, -31.404296875, -28.29296875, -25.181640625, -22.0703125, -18.958984375, -15.84765625, -12.736328125, -9.625, -6.513671875, -3.40234375, -0.291015625, 2.8203125, 5.931640625, 9.04296875, 12.154296875, 15.265625, 18.376953125, 21.48828125, 24.599609375, 27.7109375, 30.822265625, 33.93359375, 37.044921875, 40.15625, 43.267578125, 46.37890625, 49.490234375, 52.6015625, 55.712890625, 58.82421875, 61.935546875, 65.046875, 68.158203125, 71.26953125, 74.380859375, 77.4921875, 80.603515625, 83.71484375, 86.826171875, 89.9375]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 12.0, 7.0, 9.0, 15.0, 24.0, 44.0, 47.0, 72.0, 115.0, 211.0, 272.0, 505.0, 849.0, 1572.0, 2987.0, 6223.0, 14412.0, 41137.0, 242944.0, 3706924.0, 123189.0, 30585.0, 11346.0, 5069.0, 2517.0, 1345.0, 723.0, 415.0, 268.0, 140.0, 103.0, 75.0, 38.0, 34.0, 25.0, 8.0, 11.0, 7.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-126.5625, -122.76953125, -118.9765625, -115.18359375, -111.390625, -107.59765625, -103.8046875, -100.01171875, -96.21875, -92.42578125, -88.6328125, -84.83984375, -81.046875, -77.25390625, -73.4609375, -69.66796875, -65.875, -62.08203125, -58.2890625, -54.49609375, -50.703125, -46.91015625, -43.1171875, -39.32421875, -35.53125, -31.73828125, -27.9453125, -24.15234375, -20.359375, -16.56640625, -12.7734375, -8.98046875, -5.1875, -1.39453125, 2.3984375, 6.19140625, 9.984375, 13.77734375, 17.5703125, 21.36328125, 25.15625, 28.94921875, 32.7421875, 36.53515625, 40.328125, 44.12109375, 47.9140625, 51.70703125, 55.5, 59.29296875, 63.0859375, 66.87890625, 70.671875, 74.46484375, 78.2578125, 82.05078125, 85.84375, 89.63671875, 93.4296875, 97.22265625, 101.015625, 104.80859375, 108.6015625, 112.39453125, 116.1875]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 2.0, 6.0, 4.0, 16.0, 27.0, 34.0, 37.0, 69.0, 143.0, 254.0, 160.0, 100.0, 53.0, 25.0, 27.0, 13.0, 11.0, 8.0, 5.0, 10.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-385.98712158203125, -374.1722717285156, -362.357421875, -350.5425720214844, -338.72772216796875, -326.9128723144531, -315.0980224609375, -303.28314208984375, -291.46832275390625, -279.6534729003906, -267.838623046875, -256.0237731933594, -244.20892333984375, -232.39407348632812, -220.57920837402344, -208.7643585205078, -196.94949340820312, -185.1346435546875, -173.31979370117188, -161.50494384765625, -149.69009399414062, -137.875244140625, -126.06037902832031, -114.24552917480469, -102.43067932128906, -90.61582946777344, -78.80097961425781, -66.98612213134766, -55.17127227783203, -43.356422424316406, -31.54156494140625, -19.726715087890625, -7.911834716796875, 3.903017044067383, 15.71786880493164, 27.53272247314453, 39.347572326660156, 51.16242218017578, 62.97727966308594, 74.79212951660156, 86.60697937011719, 98.42182922363281, 110.23667907714844, 122.0515365600586, 133.86639404296875, 145.68124389648438, 157.49609375, 169.31094360351562, 181.12579345703125, 192.94064331054688, 204.7554931640625, 216.57034301757812, 228.38519287109375, 240.20004272460938, 252.01490783691406, 263.82977294921875, 275.64459228515625, 287.4594421386719, 299.2742919921875, 311.0891418457031, 322.90399169921875, 334.7188415527344, 346.53369140625, 358.34857177734375, 370.1634216308594]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 3.0, 3.0, 6.0, 9.0, 3.0, 7.0, 8.0, 12.0, 9.0, 14.0, 16.0, 11.0, 21.0, 15.0, 21.0, 23.0, 28.0, 24.0, 44.0, 36.0, 31.0, 38.0, 37.0, 34.0, 51.0, 37.0, 42.0, 22.0, 44.0, 38.0, 32.0, 30.0, 31.0, 25.0, 26.0, 34.0, 19.0, 16.0, 19.0, 13.0, 16.0, 14.0, 9.0, 11.0, 9.0, 4.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-156.39993286132812, -151.50070190429688, -146.6014862060547, -141.70225524902344, -136.80303955078125, -131.90380859375, -127.00457763671875, -122.10535430908203, -117.20613098144531, -112.3069076538086, -107.40768432617188, -102.50845336914062, -97.6092300415039, -92.71000671386719, -87.81077575683594, -82.91155242919922, -78.0123291015625, -73.11310577392578, -68.21388244628906, -63.31465148925781, -58.415428161621094, -53.516204833984375, -48.61697769165039, -43.717750549316406, -38.81852722167969, -33.91930389404297, -29.020076751708984, -24.120851516723633, -19.22162628173828, -14.32240104675293, -9.423175811767578, -4.523948669433594, 0.3752593994140625, 5.274484634399414, 10.173709869384766, 15.072935104370117, 19.97216033935547, 24.87138557434082, 29.770610809326172, 34.669837951660156, 39.569061279296875, 44.468284606933594, 49.36751174926758, 54.26673889160156, 59.16596221923828, 64.065185546875, 68.96441650390625, 73.86363983154297, 78.76286315917969, 83.6620864868164, 88.56130981445312, 93.46054077148438, 98.3597640991211, 103.25898742675781, 108.15821838378906, 113.05744171142578, 117.9566650390625, 122.85588836669922, 127.75511169433594, 132.6543426513672, 137.55355834960938, 142.45278930664062, 147.35202026367188, 152.25125122070312, 157.1504669189453]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 6.0, 13.0, 9.0, 11.0, 8.0, 15.0, 16.0, 24.0, 21.0, 24.0, 27.0, 36.0, 29.0, 29.0, 36.0, 34.0, 44.0, 41.0, 52.0, 45.0, 48.0, 51.0, 38.0, 42.0, 39.0, 37.0, 33.0, 35.0, 32.0, 22.0, 16.0, 15.0, 11.0, 10.0, 14.0, 8.0, 10.0, 4.0, 3.0, 5.0, 4.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-22.640625, -21.959716796875, -21.27880859375, -20.597900390625, -19.9169921875, -19.236083984375, -18.55517578125, -17.874267578125, -17.193359375, -16.512451171875, -15.83154296875, -15.150634765625, -14.4697265625, -13.788818359375, -13.10791015625, -12.427001953125, -11.74609375, -11.065185546875, -10.38427734375, -9.703369140625, -9.0224609375, -8.341552734375, -7.66064453125, -6.979736328125, -6.298828125, -5.617919921875, -4.93701171875, -4.256103515625, -3.5751953125, -2.894287109375, -2.21337890625, -1.532470703125, -0.8515625, -0.170654296875, 0.51025390625, 1.191162109375, 1.8720703125, 2.552978515625, 3.23388671875, 3.914794921875, 4.595703125, 5.276611328125, 5.95751953125, 6.638427734375, 7.3193359375, 8.000244140625, 8.68115234375, 9.362060546875, 10.04296875, 10.723876953125, 11.40478515625, 12.085693359375, 12.7666015625, 13.447509765625, 14.12841796875, 14.809326171875, 15.490234375, 16.171142578125, 16.85205078125, 17.532958984375, 18.2138671875, 18.894775390625, 19.57568359375, 20.256591796875, 20.9375]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 3.0, 3.0, 5.0, 6.0, 9.0, 18.0, 20.0, 31.0, 44.0, 74.0, 78.0, 113.0, 188.0, 256.0, 364.0, 543.0, 803.0, 1104.0, 1591.0, 2370.0, 3310.0, 4767.0, 7199.0, 10689.0, 16557.0, 26224.0, 42710.0, 72432.0, 127791.0, 226672.0, 209347.0, 116501.0, 66716.0, 38902.0, 24262.0, 15303.0, 10148.0, 6627.0, 4606.0, 3093.0, 2154.0, 1485.0, 1071.0, 714.0, 507.0, 354.0, 227.0, 175.0, 129.0, 71.0, 57.0, 54.0, 35.0, 21.0, 11.0, 12.0, 5.0, 3.0, 2.0, 0.0, 3.0, 1.0], "bins": [-0.9423828125, -0.9128570556640625, -0.883331298828125, -0.8538055419921875, -0.82427978515625, -0.7947540283203125, -0.765228271484375, -0.7357025146484375, -0.7061767578125, -0.6766510009765625, -0.647125244140625, -0.6175994873046875, -0.58807373046875, -0.5585479736328125, -0.529022216796875, -0.4994964599609375, -0.469970703125, -0.4404449462890625, -0.410919189453125, -0.3813934326171875, -0.35186767578125, -0.3223419189453125, -0.292816162109375, -0.2632904052734375, -0.2337646484375, -0.2042388916015625, -0.174713134765625, -0.1451873779296875, -0.11566162109375, -0.0861358642578125, -0.056610107421875, -0.0270843505859375, 0.00244140625, 0.0319671630859375, 0.061492919921875, 0.0910186767578125, 0.12054443359375, 0.1500701904296875, 0.179595947265625, 0.2091217041015625, 0.2386474609375, 0.2681732177734375, 0.297698974609375, 0.3272247314453125, 0.35675048828125, 0.3862762451171875, 0.415802001953125, 0.4453277587890625, 0.474853515625, 0.5043792724609375, 0.533905029296875, 0.5634307861328125, 0.59295654296875, 0.6224822998046875, 0.652008056640625, 0.6815338134765625, 0.7110595703125, 0.7405853271484375, 0.770111083984375, 0.7996368408203125, 0.82916259765625, 0.8586883544921875, 0.888214111328125, 0.9177398681640625, 0.947265625]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 8.0, 7.0, 3.0, 6.0, 4.0, 11.0, 12.0, 12.0, 13.0, 15.0, 19.0, 31.0, 24.0, 29.0, 26.0, 34.0, 28.0, 33.0, 33.0, 40.0, 38.0, 41.0, 32.0, 1061.0, 34.0, 39.0, 40.0, 33.0, 34.0, 30.0, 31.0, 22.0, 29.0, 18.0, 24.0, 19.0, 20.0, 21.0, 17.0, 12.0, 7.0, 13.0, 9.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-11.046875, -10.6693115234375, -10.291748046875, -9.9141845703125, -9.53662109375, -9.1590576171875, -8.781494140625, -8.4039306640625, -8.0263671875, -7.6488037109375, -7.271240234375, -6.8936767578125, -6.51611328125, -6.1385498046875, -5.760986328125, -5.3834228515625, -5.005859375, -4.6282958984375, -4.250732421875, -3.8731689453125, -3.49560546875, -3.1180419921875, -2.740478515625, -2.3629150390625, -1.9853515625, -1.6077880859375, -1.230224609375, -0.8526611328125, -0.47509765625, -0.0975341796875, 0.280029296875, 0.6575927734375, 1.03515625, 1.4127197265625, 1.790283203125, 2.1678466796875, 2.54541015625, 2.9229736328125, 3.300537109375, 3.6781005859375, 4.0556640625, 4.4332275390625, 4.810791015625, 5.1883544921875, 5.56591796875, 5.9434814453125, 6.321044921875, 6.6986083984375, 7.076171875, 7.4537353515625, 7.831298828125, 8.2088623046875, 8.58642578125, 8.9639892578125, 9.341552734375, 9.7191162109375, 10.0966796875, 10.4742431640625, 10.851806640625, 11.2293701171875, 11.60693359375, 11.9844970703125, 12.362060546875, 12.7396240234375, 13.1171875]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 4.0, 4.0, 8.0, 4.0, 4.0, 14.0, 15.0, 23.0, 39.0, 47.0, 70.0, 98.0, 151.0, 226.0, 295.0, 396.0, 608.0, 770.0, 1125.0, 1582.0, 2273.0, 3174.0, 4578.0, 6586.0, 9200.0, 13276.0, 18864.0, 28304.0, 42104.0, 66645.0, 109073.0, 187192.0, 1249909.0, 126112.0, 75599.0, 47626.0, 31210.0, 21180.0, 14452.0, 10121.0, 7145.0, 5044.0, 3480.0, 2485.0, 1841.0, 1173.0, 887.0, 613.0, 429.0, 314.0, 224.0, 181.0, 120.0, 75.0, 49.0, 40.0, 30.0, 21.0, 15.0, 12.0, 7.0, 1.0, 2.0], "bins": [-0.771484375, -0.748199462890625, -0.72491455078125, -0.701629638671875, -0.6783447265625, -0.655059814453125, -0.63177490234375, -0.608489990234375, -0.585205078125, -0.561920166015625, -0.53863525390625, -0.515350341796875, -0.4920654296875, -0.468780517578125, -0.44549560546875, -0.422210693359375, -0.39892578125, -0.375640869140625, -0.35235595703125, -0.329071044921875, -0.3057861328125, -0.282501220703125, -0.25921630859375, -0.235931396484375, -0.212646484375, -0.189361572265625, -0.16607666015625, -0.142791748046875, -0.1195068359375, -0.096221923828125, -0.07293701171875, -0.049652099609375, -0.0263671875, -0.003082275390625, 0.02020263671875, 0.043487548828125, 0.0667724609375, 0.090057373046875, 0.11334228515625, 0.136627197265625, 0.159912109375, 0.183197021484375, 0.20648193359375, 0.229766845703125, 0.2530517578125, 0.276336669921875, 0.29962158203125, 0.322906494140625, 0.34619140625, 0.369476318359375, 0.39276123046875, 0.416046142578125, 0.4393310546875, 0.462615966796875, 0.48590087890625, 0.509185791015625, 0.532470703125, 0.555755615234375, 0.57904052734375, 0.602325439453125, 0.6256103515625, 0.648895263671875, 0.67218017578125, 0.695465087890625, 0.71875]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 0.0, 9.0, 5.0, 7.0, 10.0, 14.0, 18.0, 22.0, 26.0, 30.0, 33.0, 49.0, 39.0, 50.0, 63.0, 62.0, 66.0, 65.0, 59.0, 62.0, 60.0, 36.0, 48.0, 30.0, 29.0, 27.0, 22.0, 11.0, 8.0, 8.0, 12.0, 6.0, 4.0, 8.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004283905029296875, -0.00415194034576416, -0.004019975662231445, -0.0038880109786987305, -0.0037560462951660156, -0.0036240816116333008, -0.003492116928100586, -0.003360152244567871, -0.0032281875610351562, -0.0030962228775024414, -0.0029642581939697266, -0.0028322935104370117, -0.002700328826904297, -0.002568364143371582, -0.002436399459838867, -0.0023044347763061523, -0.0021724700927734375, -0.0020405054092407227, -0.0019085407257080078, -0.001776576042175293, -0.0016446113586425781, -0.0015126466751098633, -0.0013806819915771484, -0.0012487173080444336, -0.0011167526245117188, -0.000984787940979004, -0.0008528232574462891, -0.0007208585739135742, -0.0005888938903808594, -0.00045692920684814453, -0.0003249645233154297, -0.00019299983978271484, -6.103515625e-05, 7.092952728271484e-05, 0.0002028942108154297, 0.00033485889434814453, 0.0004668235778808594, 0.0005987882614135742, 0.0007307529449462891, 0.0008627176284790039, 0.0009946823120117188, 0.0011266469955444336, 0.0012586116790771484, 0.0013905763626098633, 0.0015225410461425781, 0.001654505729675293, 0.0017864704132080078, 0.0019184350967407227, 0.0020503997802734375, 0.0021823644638061523, 0.002314329147338867, 0.002446293830871582, 0.002578258514404297, 0.0027102231979370117, 0.0028421878814697266, 0.0029741525650024414, 0.0031061172485351562, 0.003238081932067871, 0.003370046615600586, 0.0035020112991333008, 0.0036339759826660156, 0.0037659406661987305, 0.0038979053497314453, 0.00402987003326416, 0.004161834716796875]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 7.0, 11.0, 12.0, 7.0, 20.0, 16.0, 25.0, 36.0, 26.0, 53.0, 76.0, 108.0, 201.0, 265.0, 473.0, 1718.0, 70479.0, 946752.0, 26016.0, 1082.0, 393.0, 252.0, 140.0, 122.0, 65.0, 64.0, 39.0, 27.0, 22.0, 16.0, 7.0, 6.0, 4.0, 8.0, 4.0, 5.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06793212890625, -0.06569671630859375, -0.0634613037109375, -0.06122589111328125, -0.058990478515625, -0.05675506591796875, -0.0545196533203125, -0.05228424072265625, -0.050048828125, -0.04781341552734375, -0.0455780029296875, -0.04334259033203125, -0.041107177734375, -0.03887176513671875, -0.0366363525390625, -0.03440093994140625, -0.03216552734375, -0.02993011474609375, -0.0276947021484375, -0.02545928955078125, -0.023223876953125, -0.02098846435546875, -0.0187530517578125, -0.01651763916015625, -0.0142822265625, -0.01204681396484375, -0.0098114013671875, -0.00757598876953125, -0.005340576171875, -0.00310516357421875, -0.0008697509765625, 0.00136566162109375, 0.00360107421875, 0.00583648681640625, 0.0080718994140625, 0.01030731201171875, 0.012542724609375, 0.01477813720703125, 0.0170135498046875, 0.01924896240234375, 0.021484375, 0.02371978759765625, 0.0259552001953125, 0.02819061279296875, 0.030426025390625, 0.03266143798828125, 0.0348968505859375, 0.03713226318359375, 0.03936767578125, 0.04160308837890625, 0.0438385009765625, 0.04607391357421875, 0.048309326171875, 0.05054473876953125, 0.0527801513671875, 0.05501556396484375, 0.0572509765625, 0.05948638916015625, 0.0617218017578125, 0.06395721435546875, 0.066192626953125, 0.06842803955078125, 0.0706634521484375, 0.07289886474609375, 0.07513427734375]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 184.0, 761.0, 64.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03840736299753189, -0.037218060344457626, -0.03602875769138336, -0.0348394550383091, -0.03365015238523483, -0.03246085345745087, -0.0312715508043766, -0.030082248151302338, -0.028892945498228073, -0.02770364284515381, -0.026514340192079544, -0.02532503940165043, -0.024135736748576164, -0.0229464340955019, -0.021757133305072784, -0.02056783065199852, -0.019378527998924255, -0.01818922534584999, -0.016999922692775726, -0.01581062190234661, -0.014621319249272346, -0.013432016596198082, -0.012242714874446392, -0.011053413152694702, -0.009864110499620438, -0.008674807846546173, -0.007485506124794483, -0.006296203937381506, -0.005106901749968529, -0.0039175995625555515, -0.0027282973751425743, -0.0015389956533908844, -0.0003496892750263214, 0.0008396129123866558, 0.002028915099799633, 0.0032182172872126102, 0.0044075194746255875, 0.005596821662038565, 0.006786123849451542, 0.007975425571203232, 0.009164728224277496, 0.01035403087735176, 0.01154333259910345, 0.01273263432085514, 0.013921936973929405, 0.01511123962700367, 0.016300540417432785, 0.01748984307050705, 0.018679145723581314, 0.01986844837665558, 0.021057751029729843, 0.02224705182015896, 0.023436354473233223, 0.024625657126307487, 0.025814957916736603, 0.027004260569810867, 0.028193563222885132, 0.029382865875959396, 0.03057216852903366, 0.031761471182107925, 0.03295077383518219, 0.034140072762966156, 0.03532937541604042, 0.036518678069114685, 0.03770798072218895]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 2.0, 3.0, 7.0, 12.0, 9.0, 10.0, 10.0, 16.0, 21.0, 35.0, 23.0, 22.0, 27.0, 26.0, 31.0, 32.0, 49.0, 28.0, 40.0, 52.0, 40.0, 50.0, 40.0, 58.0, 45.0, 37.0, 29.0, 37.0, 30.0, 36.0, 21.0, 25.0, 20.0, 21.0, 18.0, 15.0, 6.0, 4.0, 8.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0027756094932556152, -0.0026910006999969482, -0.0026063919067382812, -0.0025217831134796143, -0.0024371743202209473, -0.0023525655269622803, -0.0022679567337036133, -0.0021833479404449463, -0.0020987391471862793, -0.0020141303539276123, -0.0019295215606689453, -0.0018449127674102783, -0.0017603039741516113, -0.0016756951808929443, -0.0015910863876342773, -0.0015064775943756104, -0.0014218688011169434, -0.0013372600078582764, -0.0012526512145996094, -0.0011680424213409424, -0.0010834336280822754, -0.0009988248348236084, -0.0009142160415649414, -0.0008296072483062744, -0.0007449984550476074, -0.0006603896617889404, -0.0005757808685302734, -0.0004911720752716064, -0.00040656328201293945, -0.00032195448875427246, -0.00023734569549560547, -0.00015273690223693848, -6.812810897827148e-05, 1.6480684280395508e-05, 0.0001010894775390625, 0.0001856982707977295, 0.0002703070640563965, 0.0003549158573150635, 0.00043952465057373047, 0.0005241334438323975, 0.0006087422370910645, 0.0006933510303497314, 0.0007779598236083984, 0.0008625686168670654, 0.0009471774101257324, 0.0010317862033843994, 0.0011163949966430664, 0.0012010037899017334, 0.0012856125831604004, 0.0013702213764190674, 0.0014548301696777344, 0.0015394389629364014, 0.0016240477561950684, 0.0017086565494537354, 0.0017932653427124023, 0.0018778741359710693, 0.0019624829292297363, 0.0020470917224884033, 0.0021317005157470703, 0.0022163093090057373, 0.0023009181022644043, 0.0023855268955230713, 0.0024701356887817383, 0.0025547444820404053, 0.0026393532752990723]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 6.0, 13.0, 9.0, 11.0, 8.0, 15.0, 16.0, 24.0, 21.0, 24.0, 27.0, 36.0, 29.0, 29.0, 36.0, 34.0, 44.0, 41.0, 52.0, 45.0, 48.0, 51.0, 38.0, 42.0, 39.0, 37.0, 33.0, 35.0, 32.0, 22.0, 16.0, 15.0, 11.0, 10.0, 14.0, 8.0, 10.0, 4.0, 3.0, 5.0, 4.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-22.640625, -21.959716796875, -21.27880859375, -20.597900390625, -19.9169921875, -19.236083984375, -18.55517578125, -17.874267578125, -17.193359375, -16.512451171875, -15.83154296875, -15.150634765625, -14.4697265625, -13.788818359375, -13.10791015625, -12.427001953125, -11.74609375, -11.065185546875, -10.38427734375, -9.703369140625, -9.0224609375, -8.341552734375, -7.66064453125, -6.979736328125, -6.298828125, -5.617919921875, -4.93701171875, -4.256103515625, -3.5751953125, -2.894287109375, -2.21337890625, -1.532470703125, -0.8515625, -0.170654296875, 0.51025390625, 1.191162109375, 1.8720703125, 2.552978515625, 3.23388671875, 3.914794921875, 4.595703125, 5.276611328125, 5.95751953125, 6.638427734375, 7.3193359375, 8.000244140625, 8.68115234375, 9.362060546875, 10.04296875, 10.723876953125, 11.40478515625, 12.085693359375, 12.7666015625, 13.447509765625, 14.12841796875, 14.809326171875, 15.490234375, 16.171142578125, 16.85205078125, 17.532958984375, 18.2138671875, 18.894775390625, 19.57568359375, 20.256591796875, 20.9375]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 2.0, 3.0, 2.0, 5.0, 9.0, 11.0, 19.0, 29.0, 32.0, 39.0, 72.0, 86.0, 135.0, 165.0, 266.0, 426.0, 559.0, 790.0, 1273.0, 2045.0, 3235.0, 5761.0, 12266.0, 40816.0, 708726.0, 226213.0, 23639.0, 9415.0, 4750.0, 2646.0, 1645.0, 1065.0, 773.0, 493.0, 337.0, 280.0, 152.0, 113.0, 64.0, 58.0, 44.0, 32.0, 25.0, 16.0, 8.0, 7.0, 6.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0], "bins": [-38.59375, -37.41796875, -36.2421875, -35.06640625, -33.890625, -32.71484375, -31.5390625, -30.36328125, -29.1875, -28.01171875, -26.8359375, -25.66015625, -24.484375, -23.30859375, -22.1328125, -20.95703125, -19.78125, -18.60546875, -17.4296875, -16.25390625, -15.078125, -13.90234375, -12.7265625, -11.55078125, -10.375, -9.19921875, -8.0234375, -6.84765625, -5.671875, -4.49609375, -3.3203125, -2.14453125, -0.96875, 0.20703125, 1.3828125, 2.55859375, 3.734375, 4.91015625, 6.0859375, 7.26171875, 8.4375, 9.61328125, 10.7890625, 11.96484375, 13.140625, 14.31640625, 15.4921875, 16.66796875, 17.84375, 19.01953125, 20.1953125, 21.37109375, 22.546875, 23.72265625, 24.8984375, 26.07421875, 27.25, 28.42578125, 29.6015625, 30.77734375, 31.953125, 33.12890625, 34.3046875, 35.48046875, 36.65625]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 4.0, 7.0, 3.0, 7.0, 4.0, 2.0, 10.0, 11.0, 18.0, 20.0, 23.0, 31.0, 33.0, 35.0, 39.0, 50.0, 49.0, 54.0, 52.0, 88.0, 1738.0, 241.0, 85.0, 74.0, 51.0, 50.0, 43.0, 36.0, 39.0, 21.0, 31.0, 22.0, 18.0, 20.0, 9.0, 7.0, 8.0, 7.0, 3.0, 3.0, 2.0, 0.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.8125, -74.240234375, -71.66796875, -69.095703125, -66.5234375, -63.951171875, -61.37890625, -58.806640625, -56.234375, -53.662109375, -51.08984375, -48.517578125, -45.9453125, -43.373046875, -40.80078125, -38.228515625, -35.65625, -33.083984375, -30.51171875, -27.939453125, -25.3671875, -22.794921875, -20.22265625, -17.650390625, -15.078125, -12.505859375, -9.93359375, -7.361328125, -4.7890625, -2.216796875, 0.35546875, 2.927734375, 5.5, 8.072265625, 10.64453125, 13.216796875, 15.7890625, 18.361328125, 20.93359375, 23.505859375, 26.078125, 28.650390625, 31.22265625, 33.794921875, 36.3671875, 38.939453125, 41.51171875, 44.083984375, 46.65625, 49.228515625, 51.80078125, 54.373046875, 56.9453125, 59.517578125, 62.08984375, 64.662109375, 67.234375, 69.806640625, 72.37890625, 74.951171875, 77.5234375, 80.095703125, 82.66796875, 85.240234375, 87.8125]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 3.0, 5.0, 9.0, 13.0, 19.0, 15.0, 37.0, 54.0, 70.0, 90.0, 185.0, 485.0, 1861.0, 16555.0, 3076125.0, 45541.0, 3317.0, 679.0, 264.0, 113.0, 77.0, 52.0, 38.0, 24.0, 13.0, 12.0, 10.0, 11.0, 5.0, 8.0, 4.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-211.625, -203.685546875, -195.74609375, -187.806640625, -179.8671875, -171.927734375, -163.98828125, -156.048828125, -148.109375, -140.169921875, -132.23046875, -124.291015625, -116.3515625, -108.412109375, -100.47265625, -92.533203125, -84.59375, -76.654296875, -68.71484375, -60.775390625, -52.8359375, -44.896484375, -36.95703125, -29.017578125, -21.078125, -13.138671875, -5.19921875, 2.740234375, 10.6796875, 18.619140625, 26.55859375, 34.498046875, 42.4375, 50.376953125, 58.31640625, 66.255859375, 74.1953125, 82.134765625, 90.07421875, 98.013671875, 105.953125, 113.892578125, 121.83203125, 129.771484375, 137.7109375, 145.650390625, 153.58984375, 161.529296875, 169.46875, 177.408203125, 185.34765625, 193.287109375, 201.2265625, 209.166015625, 217.10546875, 225.044921875, 232.984375, 240.923828125, 248.86328125, 256.802734375, 264.7421875, 272.681640625, 280.62109375, 288.560546875, 296.5]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 29.0, 381.0, 542.0, 59.0, 7.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1419.4779052734375, -1394.1719970703125, -1368.8662109375, -1343.560302734375, -1318.2545166015625, -1292.9486083984375, -1267.642822265625, -1242.3369140625, -1217.031005859375, -1191.72509765625, -1166.4193115234375, -1141.1134033203125, -1115.8076171875, -1090.501708984375, -1065.19580078125, -1039.8900146484375, -1014.5841674804688, -989.2783203125, -963.9724731445312, -938.6666259765625, -913.3607177734375, -888.0548706054688, -862.7490234375, -837.4431762695312, -812.1373291015625, -786.8314819335938, -761.525634765625, -736.2197265625, -710.9138793945312, -685.6080322265625, -660.3021850585938, -634.996337890625, -609.6904296875, -584.3845825195312, -559.0787353515625, -533.7728271484375, -508.46697998046875, -483.1611328125, -457.85528564453125, -432.5494384765625, -407.24359130859375, -381.937744140625, -356.6318664550781, -331.3260192871094, -306.0201416015625, -280.71429443359375, -255.408447265625, -230.1025848388672, -204.7967071533203, -179.4908447265625, -154.18499755859375, -128.87913513183594, -103.57327270507812, -78.26741027832031, -52.96156311035156, -27.65570068359375, -2.3498382568359375, 22.95602035522461, 48.261878967285156, 73.56773376464844, 98.87359619140625, 124.17945861816406, 149.4853057861328, 174.79116821289062, 200.09703063964844]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 1.0, 3.0, 2.0, 5.0, 5.0, 8.0, 6.0, 9.0, 9.0, 11.0, 14.0, 18.0, 9.0, 21.0, 22.0, 20.0, 24.0, 37.0, 31.0, 38.0, 47.0, 33.0, 39.0, 46.0, 46.0, 39.0, 38.0, 47.0, 33.0, 33.0, 38.0, 35.0, 39.0, 27.0, 19.0, 16.0, 27.0, 20.0, 15.0, 17.0, 11.0, 12.0, 10.0, 8.0, 10.0, 2.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-165.22840881347656, -159.32656860351562, -153.42474365234375, -147.5229034423828, -141.62106323242188, -135.71922302246094, -129.8173828125, -123.91555786132812, -118.01371765136719, -112.11187744140625, -106.21004486083984, -100.30821228027344, -94.4063720703125, -88.50453186035156, -82.60269927978516, -76.70086669921875, -70.79902648925781, -64.89718627929688, -58.99535369873047, -53.0935173034668, -47.191680908203125, -41.28984451293945, -35.38800811767578, -29.48617172241211, -23.584335327148438, -17.682498931884766, -11.780662536621094, -5.878826141357422, 0.02301025390625, 5.924846649169922, 11.826683044433594, 17.728519439697266, 23.630340576171875, 29.532176971435547, 35.43401336669922, 41.33584976196289, 47.23768615722656, 53.139522552490234, 59.041358947753906, 64.94319152832031, 70.84503173828125, 76.74687194824219, 82.6487045288086, 88.550537109375, 94.45237731933594, 100.35421752929688, 106.25605010986328, 112.15788269042969, 118.05972290039062, 123.96156311035156, 129.8634033203125, 135.76522827148438, 141.6670684814453, 147.56890869140625, 153.47073364257812, 159.37257385253906, 165.2744140625, 171.17625427246094, 177.07809448242188, 182.97991943359375, 188.8817596435547, 194.78359985351562, 200.6854248046875, 206.58726501464844, 212.48910522460938]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 4.0, 5.0, 9.0, 3.0, 13.0, 9.0, 14.0, 14.0, 11.0, 27.0, 19.0, 30.0, 27.0, 29.0, 34.0, 33.0, 44.0, 26.0, 32.0, 33.0, 41.0, 36.0, 51.0, 42.0, 39.0, 43.0, 50.0, 37.0, 32.0, 30.0, 15.0, 24.0, 37.0, 12.0, 15.0, 11.0, 16.0, 7.0, 9.0, 16.0, 3.0, 3.0, 5.0, 7.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-22.71875, -22.04248046875, -21.3662109375, -20.68994140625, -20.013671875, -19.33740234375, -18.6611328125, -17.98486328125, -17.30859375, -16.63232421875, -15.9560546875, -15.27978515625, -14.603515625, -13.92724609375, -13.2509765625, -12.57470703125, -11.8984375, -11.22216796875, -10.5458984375, -9.86962890625, -9.193359375, -8.51708984375, -7.8408203125, -7.16455078125, -6.48828125, -5.81201171875, -5.1357421875, -4.45947265625, -3.783203125, -3.10693359375, -2.4306640625, -1.75439453125, -1.078125, -0.40185546875, 0.2744140625, 0.95068359375, 1.626953125, 2.30322265625, 2.9794921875, 3.65576171875, 4.33203125, 5.00830078125, 5.6845703125, 6.36083984375, 7.037109375, 7.71337890625, 8.3896484375, 9.06591796875, 9.7421875, 10.41845703125, 11.0947265625, 11.77099609375, 12.447265625, 13.12353515625, 13.7998046875, 14.47607421875, 15.15234375, 15.82861328125, 16.5048828125, 17.18115234375, 17.857421875, 18.53369140625, 19.2099609375, 19.88623046875, 20.5625]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 8.0, 8.0, 7.0, 11.0, 8.0, 17.0, 29.0, 43.0, 55.0, 65.0, 75.0, 123.0, 194.0, 245.0, 353.0, 549.0, 876.0, 1248.0, 2088.0, 3330.0, 6036.0, 10655.0, 22832.0, 288712.0, 3513319.0, 294603.0, 23791.0, 10349.0, 5652.0, 3275.0, 1994.0, 1170.0, 805.0, 529.0, 346.0, 236.0, 175.0, 130.0, 98.0, 67.0, 44.0, 32.0, 27.0, 24.0, 19.0, 8.0, 3.0, 6.0, 4.0, 4.0, 5.0, 4.0, 2.0, 2.0], "bins": [-75.5625, -73.3720703125, -71.181640625, -68.9912109375, -66.80078125, -64.6103515625, -62.419921875, -60.2294921875, -58.0390625, -55.8486328125, -53.658203125, -51.4677734375, -49.27734375, -47.0869140625, -44.896484375, -42.7060546875, -40.515625, -38.3251953125, -36.134765625, -33.9443359375, -31.75390625, -29.5634765625, -27.373046875, -25.1826171875, -22.9921875, -20.8017578125, -18.611328125, -16.4208984375, -14.23046875, -12.0400390625, -9.849609375, -7.6591796875, -5.46875, -3.2783203125, -1.087890625, 1.1025390625, 3.29296875, 5.4833984375, 7.673828125, 9.8642578125, 12.0546875, 14.2451171875, 16.435546875, 18.6259765625, 20.81640625, 23.0068359375, 25.197265625, 27.3876953125, 29.578125, 31.7685546875, 33.958984375, 36.1494140625, 38.33984375, 40.5302734375, 42.720703125, 44.9111328125, 47.1015625, 49.2919921875, 51.482421875, 53.6728515625, 55.86328125, 58.0537109375, 60.244140625, 62.4345703125, 64.625]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 4.0, 1.0, 6.0, 4.0, 10.0, 7.0, 12.0, 13.0, 25.0, 28.0, 29.0, 46.0, 76.0, 171.0, 543.0, 1441.0, 1048.0, 312.0, 106.0, 57.0, 27.0, 25.0, 14.0, 16.0, 10.0, 7.0, 11.0, 3.0, 3.0, 6.0, 8.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-92.9375, -90.185546875, -87.43359375, -84.681640625, -81.9296875, -79.177734375, -76.42578125, -73.673828125, -70.921875, -68.169921875, -65.41796875, -62.666015625, -59.9140625, -57.162109375, -54.41015625, -51.658203125, -48.90625, -46.154296875, -43.40234375, -40.650390625, -37.8984375, -35.146484375, -32.39453125, -29.642578125, -26.890625, -24.138671875, -21.38671875, -18.634765625, -15.8828125, -13.130859375, -10.37890625, -7.626953125, -4.875, -2.123046875, 0.62890625, 3.380859375, 6.1328125, 8.884765625, 11.63671875, 14.388671875, 17.140625, 19.892578125, 22.64453125, 25.396484375, 28.1484375, 30.900390625, 33.65234375, 36.404296875, 39.15625, 41.908203125, 44.66015625, 47.412109375, 50.1640625, 52.916015625, 55.66796875, 58.419921875, 61.171875, 63.923828125, 66.67578125, 69.427734375, 72.1796875, 74.931640625, 77.68359375, 80.435546875, 83.1875]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 9.0, 7.0, 7.0, 5.0, 20.0, 24.0, 35.0, 89.0, 175.0, 339.0, 797.0, 2397.0, 7768.0, 35755.0, 3476308.0, 635450.0, 25602.0, 6122.0, 2001.0, 720.0, 305.0, 158.0, 81.0, 41.0, 17.0, 14.0, 10.0, 7.0, 8.0, 3.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-209.125, -202.1328125, -195.140625, -188.1484375, -181.15625, -174.1640625, -167.171875, -160.1796875, -153.1875, -146.1953125, -139.203125, -132.2109375, -125.21875, -118.2265625, -111.234375, -104.2421875, -97.25, -90.2578125, -83.265625, -76.2734375, -69.28125, -62.2890625, -55.296875, -48.3046875, -41.3125, -34.3203125, -27.328125, -20.3359375, -13.34375, -6.3515625, 0.640625, 7.6328125, 14.625, 21.6171875, 28.609375, 35.6015625, 42.59375, 49.5859375, 56.578125, 63.5703125, 70.5625, 77.5546875, 84.546875, 91.5390625, 98.53125, 105.5234375, 112.515625, 119.5078125, 126.5, 133.4921875, 140.484375, 147.4765625, 154.46875, 161.4609375, 168.453125, 175.4453125, 182.4375, 189.4296875, 196.421875, 203.4140625, 210.40625, 217.3984375, 224.390625, 231.3828125, 238.375]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 4.0, 3.0, 7.0, 3.0, 8.0, 17.0, 12.0, 12.0, 35.0, 43.0, 59.0, 89.0, 108.0, 175.0, 147.0, 86.0, 49.0, 41.0, 29.0, 24.0, 13.0, 11.0, 6.0, 5.0, 7.0, 6.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-314.72857666015625, -305.9132080078125, -297.0978088378906, -288.2824401855469, -279.4670715332031, -270.65167236328125, -261.8363037109375, -253.02093505859375, -244.20555114746094, -235.39016723632812, -226.57479858398438, -217.75941467285156, -208.94403076171875, -200.128662109375, -191.3132781982422, -182.49789428710938, -173.68252563476562, -164.8671417236328, -156.05177307128906, -147.23638916015625, -138.4210205078125, -129.6056365966797, -120.79025268554688, -111.9748764038086, -103.15950012207031, -94.34412384033203, -85.52874755859375, -76.71336364746094, -67.89798736572266, -59.082611083984375, -50.26723098754883, -41.45185089111328, -32.636505126953125, -23.82112693786621, -15.005748748779297, -6.190370559692383, 2.6250076293945312, 11.440383911132812, 20.25576400756836, 29.071144104003906, 37.88652038574219, 46.70189666748047, 55.517276763916016, 64.33265686035156, 73.14803314208984, 81.96340942382812, 90.77879333496094, 99.59416961669922, 108.4095458984375, 117.22492218017578, 126.04029846191406, 134.85568237304688, 143.67105102539062, 152.48643493652344, 161.30181884765625, 170.1171875, 178.9325714111328, 187.74795532226562, 196.56332397460938, 205.3787078857422, 214.194091796875, 223.00946044921875, 231.82484436035156, 240.64022827148438, 249.45559692382812]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 9.0, 7.0, 8.0, 10.0, 11.0, 11.0, 15.0, 11.0, 23.0, 20.0, 21.0, 28.0, 26.0, 34.0, 25.0, 26.0, 38.0, 33.0, 36.0, 39.0, 46.0, 38.0, 32.0, 27.0, 32.0, 48.0, 39.0, 34.0, 25.0, 30.0, 27.0, 17.0, 33.0, 28.0, 17.0, 23.0, 11.0, 14.0, 10.0, 7.0, 13.0, 7.0, 5.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-165.3268280029297, -159.85072326660156, -154.37461853027344, -148.8985137939453, -143.4224090576172, -137.94630432128906, -132.47019958496094, -126.99409484863281, -121.51799011230469, -116.04188537597656, -110.56578063964844, -105.08967590332031, -99.61357116699219, -94.13746643066406, -88.66136169433594, -83.18525695800781, -77.70915222167969, -72.23304748535156, -66.75694274902344, -61.28083801269531, -55.80473327636719, -50.32862854003906, -44.85252380371094, -39.37641906738281, -33.90031433105469, -28.424209594726562, -22.948104858398438, -17.472000122070312, -11.995895385742188, -6.5197906494140625, -1.0436859130859375, 4.4324188232421875, 9.908523559570312, 15.384628295898438, 20.860733032226562, 26.336837768554688, 31.812942504882812, 37.28904724121094, 42.76515197753906, 48.24125671386719, 53.71736145019531, 59.19346618652344, 64.66957092285156, 70.14567565917969, 75.62178039550781, 81.09788513183594, 86.57398986816406, 92.05009460449219, 97.52619934082031, 103.00230407714844, 108.47840881347656, 113.95451354980469, 119.43061828613281, 124.90672302246094, 130.38282775878906, 135.8589324951172, 141.3350372314453, 146.81114196777344, 152.28724670410156, 157.7633514404297, 163.2394561767578, 168.71556091308594, 174.19166564941406, 179.6677703857422, 185.1438751220703]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 6.0, 2.0, 6.0, 3.0, 10.0, 13.0, 12.0, 18.0, 16.0, 20.0, 21.0, 16.0, 24.0, 24.0, 37.0, 27.0, 40.0, 30.0, 35.0, 45.0, 39.0, 45.0, 38.0, 51.0, 41.0, 46.0, 35.0, 26.0, 34.0, 36.0, 34.0, 23.0, 23.0, 22.0, 20.0, 15.0, 18.0, 8.0, 14.0, 6.0, 3.0, 8.0, 6.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0], "bins": [-24.5625, -23.861572265625, -23.16064453125, -22.459716796875, -21.7587890625, -21.057861328125, -20.35693359375, -19.656005859375, -18.955078125, -18.254150390625, -17.55322265625, -16.852294921875, -16.1513671875, -15.450439453125, -14.74951171875, -14.048583984375, -13.34765625, -12.646728515625, -11.94580078125, -11.244873046875, -10.5439453125, -9.843017578125, -9.14208984375, -8.441162109375, -7.740234375, -7.039306640625, -6.33837890625, -5.637451171875, -4.9365234375, -4.235595703125, -3.53466796875, -2.833740234375, -2.1328125, -1.431884765625, -0.73095703125, -0.030029296875, 0.6708984375, 1.371826171875, 2.07275390625, 2.773681640625, 3.474609375, 4.175537109375, 4.87646484375, 5.577392578125, 6.2783203125, 6.979248046875, 7.68017578125, 8.381103515625, 9.08203125, 9.782958984375, 10.48388671875, 11.184814453125, 11.8857421875, 12.586669921875, 13.28759765625, 13.988525390625, 14.689453125, 15.390380859375, 16.09130859375, 16.792236328125, 17.4931640625, 18.194091796875, 18.89501953125, 19.595947265625, 20.296875]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 2.0, 1.0, 7.0, 16.0, 15.0, 21.0, 35.0, 43.0, 59.0, 104.0, 148.0, 211.0, 280.0, 463.0, 669.0, 949.0, 1418.0, 2082.0, 3190.0, 4572.0, 7086.0, 10650.0, 16193.0, 25402.0, 40588.0, 67823.0, 119891.0, 216746.0, 220539.0, 123168.0, 69836.0, 41360.0, 25898.0, 16620.0, 10757.0, 7214.0, 4763.0, 3195.0, 2089.0, 1475.0, 969.0, 644.0, 405.0, 334.0, 205.0, 126.0, 98.0, 67.0, 49.0, 37.0, 19.0, 13.0, 10.0, 6.0, 2.0, 2.0, 0.0, 4.0], "bins": [-1.1591796875, -1.1251068115234375, -1.091033935546875, -1.0569610595703125, -1.02288818359375, -0.9888153076171875, -0.954742431640625, -0.9206695556640625, -0.8865966796875, -0.8525238037109375, -0.818450927734375, -0.7843780517578125, -0.75030517578125, -0.7162322998046875, -0.682159423828125, -0.6480865478515625, -0.614013671875, -0.5799407958984375, -0.545867919921875, -0.5117950439453125, -0.47772216796875, -0.4436492919921875, -0.409576416015625, -0.3755035400390625, -0.3414306640625, -0.3073577880859375, -0.273284912109375, -0.2392120361328125, -0.20513916015625, -0.1710662841796875, -0.136993408203125, -0.1029205322265625, -0.06884765625, -0.0347747802734375, -0.000701904296875, 0.0333709716796875, 0.06744384765625, 0.1015167236328125, 0.135589599609375, 0.1696624755859375, 0.2037353515625, 0.2378082275390625, 0.271881103515625, 0.3059539794921875, 0.34002685546875, 0.3740997314453125, 0.408172607421875, 0.4422454833984375, 0.476318359375, 0.5103912353515625, 0.544464111328125, 0.5785369873046875, 0.61260986328125, 0.6466827392578125, 0.680755615234375, 0.7148284912109375, 0.7489013671875, 0.7829742431640625, 0.817047119140625, 0.8511199951171875, 0.88519287109375, 0.9192657470703125, 0.953338623046875, 0.9874114990234375, 1.021484375]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 10.0, 9.0, 12.0, 13.0, 14.0, 14.0, 17.0, 23.0, 24.0, 17.0, 22.0, 25.0, 24.0, 33.0, 40.0, 34.0, 50.0, 44.0, 46.0, 1066.0, 49.0, 38.0, 42.0, 33.0, 36.0, 38.0, 34.0, 34.0, 22.0, 24.0, 20.0, 19.0, 24.0, 11.0, 13.0, 17.0, 11.0, 7.0, 5.0, 1.0, 6.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.21875, -13.7652587890625, -13.311767578125, -12.8582763671875, -12.40478515625, -11.9512939453125, -11.497802734375, -11.0443115234375, -10.5908203125, -10.1373291015625, -9.683837890625, -9.2303466796875, -8.77685546875, -8.3233642578125, -7.869873046875, -7.4163818359375, -6.962890625, -6.5093994140625, -6.055908203125, -5.6024169921875, -5.14892578125, -4.6954345703125, -4.241943359375, -3.7884521484375, -3.3349609375, -2.8814697265625, -2.427978515625, -1.9744873046875, -1.52099609375, -1.0675048828125, -0.614013671875, -0.1605224609375, 0.29296875, 0.7464599609375, 1.199951171875, 1.6534423828125, 2.10693359375, 2.5604248046875, 3.013916015625, 3.4674072265625, 3.9208984375, 4.3743896484375, 4.827880859375, 5.2813720703125, 5.73486328125, 6.1883544921875, 6.641845703125, 7.0953369140625, 7.548828125, 8.0023193359375, 8.455810546875, 8.9093017578125, 9.36279296875, 9.8162841796875, 10.269775390625, 10.7232666015625, 11.1767578125, 11.6302490234375, 12.083740234375, 12.5372314453125, 12.99072265625, 13.4442138671875, 13.897705078125, 14.3511962890625, 14.8046875]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 5.0, 9.0, 14.0, 12.0, 27.0, 33.0, 31.0, 66.0, 79.0, 119.0, 173.0, 241.0, 356.0, 614.0, 770.0, 1051.0, 1666.0, 2482.0, 3561.0, 4951.0, 7153.0, 10249.0, 14289.0, 21341.0, 31892.0, 49215.0, 80445.0, 141262.0, 1273089.0, 175777.0, 99584.0, 59217.0, 37338.0, 24903.0, 16711.0, 11425.0, 8245.0, 5690.0, 4057.0, 2864.0, 1934.0, 1326.0, 913.0, 594.0, 413.0, 273.0, 205.0, 144.0, 122.0, 73.0, 50.0, 29.0, 16.0, 13.0, 11.0, 8.0, 4.0, 7.0, 1.0, 4.0], "bins": [-0.87353515625, -0.8468170166015625, -0.820098876953125, -0.7933807373046875, -0.76666259765625, -0.7399444580078125, -0.713226318359375, -0.6865081787109375, -0.6597900390625, -0.6330718994140625, -0.606353759765625, -0.5796356201171875, -0.55291748046875, -0.5261993408203125, -0.499481201171875, -0.4727630615234375, -0.446044921875, -0.4193267822265625, -0.392608642578125, -0.3658905029296875, -0.33917236328125, -0.3124542236328125, -0.285736083984375, -0.2590179443359375, -0.2322998046875, -0.2055816650390625, -0.178863525390625, -0.1521453857421875, -0.12542724609375, -0.0987091064453125, -0.071990966796875, -0.0452728271484375, -0.0185546875, 0.0081634521484375, 0.034881591796875, 0.0615997314453125, 0.08831787109375, 0.1150360107421875, 0.141754150390625, 0.1684722900390625, 0.1951904296875, 0.2219085693359375, 0.248626708984375, 0.2753448486328125, 0.30206298828125, 0.3287811279296875, 0.355499267578125, 0.3822174072265625, 0.408935546875, 0.4356536865234375, 0.462371826171875, 0.4890899658203125, 0.51580810546875, 0.5425262451171875, 0.569244384765625, 0.5959625244140625, 0.6226806640625, 0.6493988037109375, 0.676116943359375, 0.7028350830078125, 0.72955322265625, 0.7562713623046875, 0.782989501953125, 0.8097076416015625, 0.83642578125]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 6.0, 3.0, 8.0, 9.0, 8.0, 15.0, 15.0, 27.0, 17.0, 38.0, 47.0, 46.0, 48.0, 47.0, 68.0, 62.0, 68.0, 69.0, 44.0, 64.0, 60.0, 45.0, 36.0, 25.0, 27.0, 20.0, 18.0, 12.0, 7.0, 7.0, 18.0, 4.0, 10.0, 2.0, 5.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003726959228515625, -0.003591299057006836, -0.003455638885498047, -0.003319978713989258, -0.0031843185424804688, -0.0030486583709716797, -0.0029129981994628906, -0.0027773380279541016, -0.0026416778564453125, -0.0025060176849365234, -0.0023703575134277344, -0.0022346973419189453, -0.0020990371704101562, -0.001963376998901367, -0.0018277168273925781, -0.001692056655883789, -0.001556396484375, -0.001420736312866211, -0.0012850761413574219, -0.0011494159698486328, -0.0010137557983398438, -0.0008780956268310547, -0.0007424354553222656, -0.0006067752838134766, -0.0004711151123046875, -0.00033545494079589844, -0.00019979476928710938, -6.413459777832031e-05, 7.152557373046875e-05, 0.0002071857452392578, 0.0003428459167480469, 0.00047850608825683594, 0.000614166259765625, 0.0007498264312744141, 0.0008854866027832031, 0.0010211467742919922, 0.0011568069458007812, 0.0012924671173095703, 0.0014281272888183594, 0.0015637874603271484, 0.0016994476318359375, 0.0018351078033447266, 0.0019707679748535156, 0.0021064281463623047, 0.0022420883178710938, 0.002377748489379883, 0.002513408660888672, 0.002649068832397461, 0.00278472900390625, 0.002920389175415039, 0.003056049346923828, 0.003191709518432617, 0.0033273696899414062, 0.0034630298614501953, 0.0035986900329589844, 0.0037343502044677734, 0.0038700103759765625, 0.0040056705474853516, 0.004141330718994141, 0.00427699089050293, 0.004412651062011719, 0.004548311233520508, 0.004683971405029297, 0.004819631576538086, 0.004955291748046875]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 6.0, 5.0, 6.0, 7.0, 10.0, 11.0, 12.0, 17.0, 18.0, 18.0, 30.0, 46.0, 51.0, 79.0, 121.0, 186.0, 394.0, 2132.0, 76691.0, 939136.0, 27411.0, 1244.0, 346.0, 190.0, 132.0, 73.0, 52.0, 40.0, 18.0, 28.0, 11.0, 11.0, 9.0, 9.0, 4.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0887451171875, -0.08630561828613281, -0.08386611938476562, -0.08142662048339844, -0.07898712158203125, -0.07654762268066406, -0.07410812377929688, -0.07166862487792969, -0.0692291259765625, -0.06678962707519531, -0.06435012817382812, -0.06191062927246094, -0.05947113037109375, -0.05703163146972656, -0.054592132568359375, -0.05215263366699219, -0.049713134765625, -0.04727363586425781, -0.044834136962890625, -0.04239463806152344, -0.03995513916015625, -0.03751564025878906, -0.035076141357421875, -0.03263664245605469, -0.0301971435546875, -0.027757644653320312, -0.025318145751953125, -0.022878646850585938, -0.02043914794921875, -0.017999649047851562, -0.015560150146484375, -0.013120651245117188, -0.01068115234375, -0.008241653442382812, -0.005802154541015625, -0.0033626556396484375, -0.00092315673828125, 0.0015163421630859375, 0.003955841064453125, 0.0063953399658203125, 0.0088348388671875, 0.011274337768554688, 0.013713836669921875, 0.016153335571289062, 0.01859283447265625, 0.021032333374023438, 0.023471832275390625, 0.025911331176757812, 0.028350830078125, 0.030790328979492188, 0.033229827880859375, 0.03566932678222656, 0.03810882568359375, 0.04054832458496094, 0.042987823486328125, 0.04542732238769531, 0.0478668212890625, 0.05030632019042969, 0.052745819091796875, 0.05518531799316406, 0.05762481689453125, 0.06006431579589844, 0.06250381469726562, 0.06494331359863281, 0.0673828125]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 4.0, 2.0, 7.0, 13.0, 17.0, 16.0, 18.0, 37.0, 50.0, 67.0, 82.0, 102.0, 118.0, 118.0, 91.0, 70.0, 48.0, 33.0, 27.0, 25.0, 12.0, 7.0, 9.0, 12.0, 4.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003312567714601755, -0.003192593576386571, -0.0030726194381713867, -0.002952645532786846, -0.002832671394571662, -0.0027126972563564777, -0.0025927231181412935, -0.0024727489799261093, -0.0023527750745415688, -0.0022328009363263845, -0.0021128267981112003, -0.0019928528927266598, -0.0018728787545114756, -0.0017529046162962914, -0.0016329304780811071, -0.001512956339865923, -0.0013929822016507387, -0.0012730080634355545, -0.0011530340416356921, -0.001033059903420508, -0.0009130858234129846, -0.0007931117434054613, -0.0006731376051902771, -0.0005531635251827538, -0.0004331894451752305, -0.0003132153651677072, -0.00019324125605635345, -7.32671469449997e-05, 4.6706933062523603e-05, 0.0001666810130700469, 0.0002866551512852311, 0.0004066292312927544, 0.0005266033113002777, 0.000646577391307801, 0.0007665514713153243, 0.0008865256095305085, 0.001006499631330371, 0.0011264737695455551, 0.0012464479077607393, 0.0013664220459759235, 0.001486396067775786, 0.0016063702059909701, 0.0017263442277908325, 0.0018463183660060167, 0.001966292504221201, 0.0020862664096057415, 0.0022062407806515694, 0.00232621468603611, 0.002446188824251294, 0.0025661629624664783, 0.0026861371006816626, 0.0028061112388968468, 0.0029260851442813873, 0.0030460592824965715, 0.0031660334207117558, 0.00328600755892694, 0.003405981697142124, 0.0035259558353573084, 0.0036459299735724926, 0.003765903878957033, 0.0038858780171722174, 0.004005852155387402, 0.004125826060771942, 0.00424580043181777, 0.0043657743372023106]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 3.0, 6.0, 9.0, 6.0, 16.0, 16.0, 11.0, 18.0, 30.0, 24.0, 26.0, 25.0, 32.0, 35.0, 34.0, 35.0, 32.0, 42.0, 39.0, 39.0, 38.0, 37.0, 43.0, 46.0, 45.0, 30.0, 35.0, 40.0, 27.0, 16.0, 25.0, 22.0, 26.0, 18.0, 18.0, 5.0, 10.0, 7.0, 7.0, 9.0, 7.0, 1.0, 6.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002184927463531494, -0.002119190990924835, -0.0020534545183181763, -0.0019877180457115173, -0.0019219815731048584, -0.0018562451004981995, -0.0017905086278915405, -0.0017247721552848816, -0.0016590356826782227, -0.0015932992100715637, -0.0015275627374649048, -0.0014618262648582458, -0.001396089792251587, -0.001330353319644928, -0.001264616847038269, -0.00119888037443161, -0.0011331439018249512, -0.0010674074292182922, -0.0010016709566116333, -0.0009359344840049744, -0.0008701980113983154, -0.0008044615387916565, -0.0007387250661849976, -0.0006729885935783386, -0.0006072521209716797, -0.0005415156483650208, -0.0004757791757583618, -0.0004100427031517029, -0.00034430623054504395, -0.000278569757938385, -0.00021283328533172607, -0.00014709681272506714, -8.13603401184082e-05, -1.5623867511749268e-05, 5.011260509490967e-05, 0.0001158490777015686, 0.00018158555030822754, 0.0002473220229148865, 0.0003130584955215454, 0.00037879496812820435, 0.0004445314407348633, 0.0005102679133415222, 0.0005760043859481812, 0.0006417408585548401, 0.000707477331161499, 0.000773213803768158, 0.0008389502763748169, 0.0009046867489814758, 0.0009704232215881348, 0.0010361596941947937, 0.0011018961668014526, 0.0011676326394081116, 0.0012333691120147705, 0.0012991055846214294, 0.0013648420572280884, 0.0014305785298347473, 0.0014963150024414062, 0.0015620514750480652, 0.0016277879476547241, 0.001693524420261383, 0.001759260892868042, 0.001824997365474701, 0.0018907338380813599, 0.001956470310688019, 0.0020222067832946777]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 6.0, 2.0, 6.0, 3.0, 10.0, 13.0, 12.0, 18.0, 16.0, 20.0, 21.0, 16.0, 24.0, 24.0, 37.0, 27.0, 40.0, 30.0, 35.0, 45.0, 39.0, 45.0, 38.0, 51.0, 41.0, 46.0, 35.0, 26.0, 34.0, 36.0, 34.0, 23.0, 23.0, 22.0, 20.0, 15.0, 18.0, 8.0, 14.0, 6.0, 3.0, 8.0, 6.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0], "bins": [-24.5625, -23.861572265625, -23.16064453125, -22.459716796875, -21.7587890625, -21.057861328125, -20.35693359375, -19.656005859375, -18.955078125, -18.254150390625, -17.55322265625, -16.852294921875, -16.1513671875, -15.450439453125, -14.74951171875, -14.048583984375, -13.34765625, -12.646728515625, -11.94580078125, -11.244873046875, -10.5439453125, -9.843017578125, -9.14208984375, -8.441162109375, -7.740234375, -7.039306640625, -6.33837890625, -5.637451171875, -4.9365234375, -4.235595703125, -3.53466796875, -2.833740234375, -2.1328125, -1.431884765625, -0.73095703125, -0.030029296875, 0.6708984375, 1.371826171875, 2.07275390625, 2.773681640625, 3.474609375, 4.175537109375, 4.87646484375, 5.577392578125, 6.2783203125, 6.979248046875, 7.68017578125, 8.381103515625, 9.08203125, 9.782958984375, 10.48388671875, 11.184814453125, 11.8857421875, 12.586669921875, 13.28759765625, 13.988525390625, 14.689453125, 15.390380859375, 16.09130859375, 16.792236328125, 17.4931640625, 18.194091796875, 18.89501953125, 19.595947265625, 20.296875]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 6.0, 11.0, 6.0, 14.0, 22.0, 22.0, 36.0, 50.0, 70.0, 104.0, 133.0, 211.0, 278.0, 385.0, 564.0, 784.0, 1095.0, 1584.0, 2614.0, 4522.0, 9308.0, 23532.0, 83585.0, 550163.0, 281691.0, 52681.0, 16858.0, 7378.0, 3793.0, 2210.0, 1478.0, 1027.0, 698.0, 479.0, 332.0, 242.0, 166.0, 115.0, 89.0, 55.0, 52.0, 31.0, 32.0, 13.0, 11.0, 11.0, 7.0, 4.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.8125, -16.315673828125, -15.81884765625, -15.322021484375, -14.8251953125, -14.328369140625, -13.83154296875, -13.334716796875, -12.837890625, -12.341064453125, -11.84423828125, -11.347412109375, -10.8505859375, -10.353759765625, -9.85693359375, -9.360107421875, -8.86328125, -8.366455078125, -7.86962890625, -7.372802734375, -6.8759765625, -6.379150390625, -5.88232421875, -5.385498046875, -4.888671875, -4.391845703125, -3.89501953125, -3.398193359375, -2.9013671875, -2.404541015625, -1.90771484375, -1.410888671875, -0.9140625, -0.417236328125, 0.07958984375, 0.576416015625, 1.0732421875, 1.570068359375, 2.06689453125, 2.563720703125, 3.060546875, 3.557373046875, 4.05419921875, 4.551025390625, 5.0478515625, 5.544677734375, 6.04150390625, 6.538330078125, 7.03515625, 7.531982421875, 8.02880859375, 8.525634765625, 9.0224609375, 9.519287109375, 10.01611328125, 10.512939453125, 11.009765625, 11.506591796875, 12.00341796875, 12.500244140625, 12.9970703125, 13.493896484375, 13.99072265625, 14.487548828125, 14.984375]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 1.0, 6.0, 6.0, 8.0, 10.0, 8.0, 23.0, 16.0, 13.0, 27.0, 18.0, 34.0, 32.0, 38.0, 37.0, 28.0, 47.0, 47.0, 74.0, 219.0, 1831.0, 102.0, 48.0, 57.0, 31.0, 36.0, 34.0, 38.0, 23.0, 35.0, 13.0, 16.0, 18.0, 19.0, 17.0, 16.0, 9.0, 6.0, 4.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-93.5, -90.84375, -88.1875, -85.53125, -82.875, -80.21875, -77.5625, -74.90625, -72.25, -69.59375, -66.9375, -64.28125, -61.625, -58.96875, -56.3125, -53.65625, -51.0, -48.34375, -45.6875, -43.03125, -40.375, -37.71875, -35.0625, -32.40625, -29.75, -27.09375, -24.4375, -21.78125, -19.125, -16.46875, -13.8125, -11.15625, -8.5, -5.84375, -3.1875, -0.53125, 2.125, 4.78125, 7.4375, 10.09375, 12.75, 15.40625, 18.0625, 20.71875, 23.375, 26.03125, 28.6875, 31.34375, 34.0, 36.65625, 39.3125, 41.96875, 44.625, 47.28125, 49.9375, 52.59375, 55.25, 57.90625, 60.5625, 63.21875, 65.875, 68.53125, 71.1875, 73.84375, 76.5]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 5.0, 5.0, 3.0, 6.0, 16.0, 19.0, 32.0, 26.0, 26.0, 43.0, 70.0, 117.0, 148.0, 231.0, 443.0, 1453.0, 61870.0, 3075614.0, 4102.0, 615.0, 268.0, 165.0, 129.0, 80.0, 61.0, 44.0, 23.0, 30.0, 18.0, 13.0, 10.0, 11.0, 3.0, 7.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-210.25, -204.27734375, -198.3046875, -192.33203125, -186.359375, -180.38671875, -174.4140625, -168.44140625, -162.46875, -156.49609375, -150.5234375, -144.55078125, -138.578125, -132.60546875, -126.6328125, -120.66015625, -114.6875, -108.71484375, -102.7421875, -96.76953125, -90.796875, -84.82421875, -78.8515625, -72.87890625, -66.90625, -60.93359375, -54.9609375, -48.98828125, -43.015625, -37.04296875, -31.0703125, -25.09765625, -19.125, -13.15234375, -7.1796875, -1.20703125, 4.765625, 10.73828125, 16.7109375, 22.68359375, 28.65625, 34.62890625, 40.6015625, 46.57421875, 52.546875, 58.51953125, 64.4921875, 70.46484375, 76.4375, 82.41015625, 88.3828125, 94.35546875, 100.328125, 106.30078125, 112.2734375, 118.24609375, 124.21875, 130.19140625, 136.1640625, 142.13671875, 148.109375, 154.08203125, 160.0546875, 166.02734375, 172.0]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 14.0, 30.0, 96.0, 257.0, 345.0, 178.0, 64.0, 22.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-206.8077850341797, -201.80271911621094, -196.79766845703125, -191.7926025390625, -186.78753662109375, -181.782470703125, -176.7774200439453, -171.77235412597656, -166.76730346679688, -161.76223754882812, -156.75718688964844, -151.7521209716797, -146.74705505371094, -141.74200439453125, -136.7369384765625, -131.73187255859375, -126.726806640625, -121.72174835205078, -116.71668243408203, -111.71162414550781, -106.70655822753906, -101.70149993896484, -96.69644165039062, -91.69137573242188, -86.68631744384766, -81.68125915527344, -76.67619323730469, -71.67113494873047, -66.66607666015625, -61.6610107421875, -56.65595245361328, -51.6508903503418, -46.64582061767578, -41.6407585144043, -36.63569641113281, -31.630638122558594, -26.62557601928711, -21.620513916015625, -16.615453720092773, -11.610393524169922, -6.6053314208984375, -1.6002702713012695, 3.4047908782958984, 8.409852027893066, 13.414913177490234, 18.41997528076172, 23.42503547668457, 28.430095672607422, 33.435157775878906, 38.44021987915039, 43.445281982421875, 48.450340270996094, 53.45540237426758, 58.46046447753906, 63.46552276611328, 68.4705810546875, 73.47564697265625, 78.48070526123047, 83.48577117919922, 88.49082946777344, 93.49589538574219, 98.5009536743164, 103.50601196289062, 108.51107788085938, 113.5161361694336]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 4.0, 4.0, 4.0, 11.0, 4.0, 14.0, 11.0, 7.0, 12.0, 11.0, 23.0, 23.0, 21.0, 29.0, 37.0, 32.0, 39.0, 35.0, 46.0, 27.0, 40.0, 48.0, 43.0, 44.0, 39.0, 45.0, 36.0, 45.0, 47.0, 30.0, 26.0, 26.0, 20.0, 25.0, 16.0, 20.0, 11.0, 7.0, 10.0, 8.0, 11.0, 6.0, 6.0, 1.0, 1.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-230.90023803710938, -223.32843017578125, -215.75662231445312, -208.184814453125, -200.61300659179688, -193.04119873046875, -185.46939086914062, -177.8975830078125, -170.32577514648438, -162.75396728515625, -155.18215942382812, -147.6103515625, -140.03854370117188, -132.46673583984375, -124.89492797851562, -117.3231201171875, -109.75131225585938, -102.17950439453125, -94.60769653320312, -87.035888671875, -79.46408081054688, -71.89227294921875, -64.32046508789062, -56.7486572265625, -49.176849365234375, -41.60504150390625, -34.033233642578125, -26.46142578125, -18.889617919921875, -11.31781005859375, -3.746002197265625, 3.8258056640625, 11.397628784179688, 18.969436645507812, 26.541244506835938, 34.11305236816406, 41.68486022949219, 49.25666809082031, 56.82847595214844, 64.40028381347656, 71.97209167480469, 79.54389953613281, 87.11570739746094, 94.68751525878906, 102.25932312011719, 109.83113098144531, 117.40293884277344, 124.97474670410156, 132.5465545654297, 140.1183624267578, 147.69017028808594, 155.26197814941406, 162.8337860107422, 170.4055938720703, 177.97740173339844, 185.54920959472656, 193.1210174560547, 200.6928253173828, 208.26463317871094, 215.83644104003906, 223.4082489013672, 230.9800567626953, 238.55186462402344, 246.12367248535156, 253.6954803466797]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 7.0, 1.0, 6.0, 15.0, 8.0, 14.0, 23.0, 19.0, 13.0, 19.0, 22.0, 22.0, 28.0, 39.0, 32.0, 32.0, 37.0, 32.0, 44.0, 46.0, 40.0, 34.0, 50.0, 44.0, 43.0, 47.0, 23.0, 32.0, 38.0, 19.0, 24.0, 23.0, 25.0, 17.0, 19.0, 11.0, 14.0, 4.0, 10.0, 3.0, 4.0, 6.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 5.0], "bins": [-25.703125, -24.981201171875, -24.25927734375, -23.537353515625, -22.8154296875, -22.093505859375, -21.37158203125, -20.649658203125, -19.927734375, -19.205810546875, -18.48388671875, -17.761962890625, -17.0400390625, -16.318115234375, -15.59619140625, -14.874267578125, -14.15234375, -13.430419921875, -12.70849609375, -11.986572265625, -11.2646484375, -10.542724609375, -9.82080078125, -9.098876953125, -8.376953125, -7.655029296875, -6.93310546875, -6.211181640625, -5.4892578125, -4.767333984375, -4.04541015625, -3.323486328125, -2.6015625, -1.879638671875, -1.15771484375, -0.435791015625, 0.2861328125, 1.008056640625, 1.72998046875, 2.451904296875, 3.173828125, 3.895751953125, 4.61767578125, 5.339599609375, 6.0615234375, 6.783447265625, 7.50537109375, 8.227294921875, 8.94921875, 9.671142578125, 10.39306640625, 11.114990234375, 11.8369140625, 12.558837890625, 13.28076171875, 14.002685546875, 14.724609375, 15.446533203125, 16.16845703125, 16.890380859375, 17.6123046875, 18.334228515625, 19.05615234375, 19.778076171875, 20.5]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 2.0, 7.0, 6.0, 8.0, 15.0, 19.0, 17.0, 28.0, 40.0, 44.0, 88.0, 101.0, 138.0, 199.0, 279.0, 394.0, 550.0, 732.0, 1080.0, 1582.0, 2584.0, 4430.0, 8155.0, 16076.0, 107642.0, 2871617.0, 1096990.0, 51566.0, 13100.0, 6531.0, 3663.0, 2142.0, 1360.0, 955.0, 610.0, 456.0, 283.0, 208.0, 154.0, 114.0, 85.0, 60.0, 45.0, 38.0, 24.0, 23.0, 14.0, 12.0, 6.0, 7.0, 2.0, 3.0, 4.0, 0.0, 2.0, 1.0], "bins": [-69.25, -67.2041015625, -65.158203125, -63.1123046875, -61.06640625, -59.0205078125, -56.974609375, -54.9287109375, -52.8828125, -50.8369140625, -48.791015625, -46.7451171875, -44.69921875, -42.6533203125, -40.607421875, -38.5615234375, -36.515625, -34.4697265625, -32.423828125, -30.3779296875, -28.33203125, -26.2861328125, -24.240234375, -22.1943359375, -20.1484375, -18.1025390625, -16.056640625, -14.0107421875, -11.96484375, -9.9189453125, -7.873046875, -5.8271484375, -3.78125, -1.7353515625, 0.310546875, 2.3564453125, 4.40234375, 6.4482421875, 8.494140625, 10.5400390625, 12.5859375, 14.6318359375, 16.677734375, 18.7236328125, 20.76953125, 22.8154296875, 24.861328125, 26.9072265625, 28.953125, 30.9990234375, 33.044921875, 35.0908203125, 37.13671875, 39.1826171875, 41.228515625, 43.2744140625, 45.3203125, 47.3662109375, 49.412109375, 51.4580078125, 53.50390625, 55.5498046875, 57.595703125, 59.6416015625, 61.6875]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 6.0, 2.0, 6.0, 10.0, 7.0, 8.0, 19.0, 19.0, 13.0, 26.0, 18.0, 39.0, 74.0, 134.0, 334.0, 771.0, 1172.0, 734.0, 298.0, 116.0, 73.0, 42.0, 40.0, 22.0, 11.0, 14.0, 9.0, 9.0, 15.0, 11.0, 8.0, 2.0, 6.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.0625, -73.00341796875, -70.9443359375, -68.88525390625, -66.826171875, -64.76708984375, -62.7080078125, -60.64892578125, -58.58984375, -56.53076171875, -54.4716796875, -52.41259765625, -50.353515625, -48.29443359375, -46.2353515625, -44.17626953125, -42.1171875, -40.05810546875, -37.9990234375, -35.93994140625, -33.880859375, -31.82177734375, -29.7626953125, -27.70361328125, -25.64453125, -23.58544921875, -21.5263671875, -19.46728515625, -17.408203125, -15.34912109375, -13.2900390625, -11.23095703125, -9.171875, -7.11279296875, -5.0537109375, -2.99462890625, -0.935546875, 1.12353515625, 3.1826171875, 5.24169921875, 7.30078125, 9.35986328125, 11.4189453125, 13.47802734375, 15.537109375, 17.59619140625, 19.6552734375, 21.71435546875, 23.7734375, 25.83251953125, 27.8916015625, 29.95068359375, 32.009765625, 34.06884765625, 36.1279296875, 38.18701171875, 40.24609375, 42.30517578125, 44.3642578125, 46.42333984375, 48.482421875, 50.54150390625, 52.6005859375, 54.65966796875, 56.71875]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 7.0, 6.0, 15.0, 11.0, 19.0, 47.0, 52.0, 75.0, 88.0, 199.0, 285.0, 545.0, 997.0, 2023.0, 4536.0, 10389.0, 28581.0, 132445.0, 3703272.0, 250016.0, 37333.0, 12967.0, 5289.0, 2486.0, 1176.0, 586.0, 332.0, 162.0, 141.0, 49.0, 46.0, 41.0, 19.0, 17.0, 10.0, 1.0, 7.0, 5.0, 2.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-93.8125, -90.4150390625, -87.017578125, -83.6201171875, -80.22265625, -76.8251953125, -73.427734375, -70.0302734375, -66.6328125, -63.2353515625, -59.837890625, -56.4404296875, -53.04296875, -49.6455078125, -46.248046875, -42.8505859375, -39.453125, -36.0556640625, -32.658203125, -29.2607421875, -25.86328125, -22.4658203125, -19.068359375, -15.6708984375, -12.2734375, -8.8759765625, -5.478515625, -2.0810546875, 1.31640625, 4.7138671875, 8.111328125, 11.5087890625, 14.90625, 18.3037109375, 21.701171875, 25.0986328125, 28.49609375, 31.8935546875, 35.291015625, 38.6884765625, 42.0859375, 45.4833984375, 48.880859375, 52.2783203125, 55.67578125, 59.0732421875, 62.470703125, 65.8681640625, 69.265625, 72.6630859375, 76.060546875, 79.4580078125, 82.85546875, 86.2529296875, 89.650390625, 93.0478515625, 96.4453125, 99.8427734375, 103.240234375, 106.6376953125, 110.03515625, 113.4326171875, 116.830078125, 120.2275390625, 123.625]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 8.0, 7.0, 7.0, 8.0, 15.0, 22.0, 37.0, 63.0, 96.0, 196.0, 225.0, 127.0, 93.0, 43.0, 23.0, 13.0, 5.0, 6.0, 10.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-241.8699493408203, -231.9002685546875, -221.93060302734375, -211.96092224121094, -201.99124145507812, -192.02157592773438, -182.05189514160156, -172.08221435546875, -162.112548828125, -152.1428680419922, -142.17320251464844, -132.20352172851562, -122.23384094238281, -112.26416778564453, -102.29449462890625, -92.32481384277344, -82.35513305664062, -72.38545989990234, -62.41577911376953, -52.44610595703125, -42.4764289855957, -32.506752014160156, -22.537078857421875, -12.567398071289062, -2.5977249145507812, 7.371951103210449, 17.34162712097168, 27.311302185058594, 37.28097915649414, 47.25065612792969, 57.22032928466797, 67.19001007080078, 77.15966796875, 87.12934112548828, 97.0990219116211, 107.06869506835938, 117.03837585449219, 127.00804901123047, 136.97772216796875, 146.94740295410156, 156.91708374023438, 166.8867645263672, 176.85643005371094, 186.82611083984375, 196.79579162597656, 206.76547241210938, 216.73513793945312, 226.70481872558594, 236.6744842529297, 246.6441650390625, 256.61383056640625, 266.58349609375, 276.5531921386719, 286.5228576660156, 296.4925537109375, 306.46221923828125, 316.431884765625, 326.40155029296875, 336.3712463378906, 346.3409118652344, 356.3105773925781, 366.2802734375, 376.24993896484375, 386.2196044921875, 396.1893005371094]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 4.0, 10.0, 5.0, 9.0, 3.0, 7.0, 16.0, 9.0, 21.0, 19.0, 19.0, 30.0, 20.0, 25.0, 30.0, 40.0, 38.0, 30.0, 35.0, 44.0, 46.0, 36.0, 46.0, 45.0, 35.0, 41.0, 45.0, 44.0, 44.0, 21.0, 23.0, 17.0, 22.0, 15.0, 20.0, 15.0, 13.0, 14.0, 7.0, 9.0, 12.0, 8.0, 5.0, 4.0, 0.0, 6.0, 0.0, 2.0, 1.0, 1.0], "bins": [-172.6673583984375, -167.89022827148438, -163.1131134033203, -158.3359832763672, -153.55885314941406, -148.78173828125, -144.00460815429688, -139.22747802734375, -134.45034790039062, -129.6732177734375, -124.8960952758789, -120.11897277832031, -115.34184265136719, -110.5647201538086, -105.78759765625, -101.01046752929688, -96.23335266113281, -91.45623016357422, -86.6791000366211, -81.9019775390625, -77.12484741210938, -72.34772491455078, -67.57060241699219, -62.79347610473633, -58.01634979248047, -53.23922348022461, -48.46209716796875, -43.684974670410156, -38.9078483581543, -34.13072204589844, -29.35359764099121, -24.576473236083984, -19.799346923828125, -15.022221565246582, -10.245096206665039, -5.467970848083496, -0.6908454895019531, 4.086280822753906, 8.863405227661133, 13.64052963256836, 18.41765594482422, 23.194782257080078, 27.971906661987305, 32.74903106689453, 37.52615737915039, 42.30328369140625, 47.080406188964844, 51.8575325012207, 56.63465881347656, 61.41178512573242, 66.18891143798828, 70.96603393554688, 75.7431640625, 80.5202865600586, 85.29740905761719, 90.07453918457031, 94.8516616821289, 99.6287841796875, 104.40591430664062, 109.18303680419922, 113.96015930175781, 118.73728942871094, 123.51441192626953, 128.29153442382812, 133.06866455078125]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 4.0, 6.0, 8.0, 9.0, 11.0, 7.0, 15.0, 11.0, 21.0, 16.0, 27.0, 22.0, 25.0, 24.0, 36.0, 27.0, 38.0, 46.0, 31.0, 38.0, 35.0, 38.0, 45.0, 42.0, 47.0, 46.0, 43.0, 31.0, 33.0, 30.0, 31.0, 22.0, 21.0, 20.0, 21.0, 14.0, 10.0, 14.0, 10.0, 4.0, 7.0, 5.0, 4.0, 2.0, 1.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-22.75, -22.0517578125, -21.353515625, -20.6552734375, -19.95703125, -19.2587890625, -18.560546875, -17.8623046875, -17.1640625, -16.4658203125, -15.767578125, -15.0693359375, -14.37109375, -13.6728515625, -12.974609375, -12.2763671875, -11.578125, -10.8798828125, -10.181640625, -9.4833984375, -8.78515625, -8.0869140625, -7.388671875, -6.6904296875, -5.9921875, -5.2939453125, -4.595703125, -3.8974609375, -3.19921875, -2.5009765625, -1.802734375, -1.1044921875, -0.40625, 0.2919921875, 0.990234375, 1.6884765625, 2.38671875, 3.0849609375, 3.783203125, 4.4814453125, 5.1796875, 5.8779296875, 6.576171875, 7.2744140625, 7.97265625, 8.6708984375, 9.369140625, 10.0673828125, 10.765625, 11.4638671875, 12.162109375, 12.8603515625, 13.55859375, 14.2568359375, 14.955078125, 15.6533203125, 16.3515625, 17.0498046875, 17.748046875, 18.4462890625, 19.14453125, 19.8427734375, 20.541015625, 21.2392578125, 21.9375]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 6.0, 9.0, 8.0, 18.0, 18.0, 40.0, 46.0, 68.0, 118.0, 144.0, 216.0, 337.0, 496.0, 703.0, 1073.0, 1590.0, 2401.0, 3744.0, 5741.0, 9121.0, 14297.0, 23457.0, 38361.0, 66288.0, 118587.0, 209825.0, 229935.0, 134067.0, 74685.0, 43008.0, 25807.0, 15791.0, 10097.0, 6352.0, 4092.0, 2633.0, 1727.0, 1237.0, 767.0, 510.0, 382.0, 244.0, 157.0, 117.0, 83.0, 45.0, 38.0, 29.0, 12.0, 15.0, 8.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0], "bins": [-1.1259765625, -1.0919647216796875, -1.057952880859375, -1.0239410400390625, -0.98992919921875, -0.9559173583984375, -0.921905517578125, -0.8878936767578125, -0.8538818359375, -0.8198699951171875, -0.785858154296875, -0.7518463134765625, -0.71783447265625, -0.6838226318359375, -0.649810791015625, -0.6157989501953125, -0.581787109375, -0.5477752685546875, -0.513763427734375, -0.4797515869140625, -0.44573974609375, -0.4117279052734375, -0.377716064453125, -0.3437042236328125, -0.3096923828125, -0.2756805419921875, -0.241668701171875, -0.2076568603515625, -0.17364501953125, -0.1396331787109375, -0.105621337890625, -0.0716094970703125, -0.03759765625, -0.0035858154296875, 0.030426025390625, 0.0644378662109375, 0.09844970703125, 0.1324615478515625, 0.166473388671875, 0.2004852294921875, 0.2344970703125, 0.2685089111328125, 0.302520751953125, 0.3365325927734375, 0.37054443359375, 0.4045562744140625, 0.438568115234375, 0.4725799560546875, 0.506591796875, 0.5406036376953125, 0.574615478515625, 0.6086273193359375, 0.64263916015625, 0.6766510009765625, 0.710662841796875, 0.7446746826171875, 0.7786865234375, 0.8126983642578125, 0.846710205078125, 0.8807220458984375, 0.91473388671875, 0.9487457275390625, 0.982757568359375, 1.0167694091796875, 1.05078125]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 2.0, 3.0, 2.0, 2.0, 7.0, 9.0, 11.0, 9.0, 12.0, 16.0, 20.0, 17.0, 25.0, 36.0, 27.0, 20.0, 25.0, 41.0, 29.0, 31.0, 42.0, 44.0, 47.0, 1076.0, 43.0, 41.0, 36.0, 38.0, 33.0, 42.0, 30.0, 24.0, 24.0, 24.0, 26.0, 16.0, 16.0, 19.0, 10.0, 13.0, 11.0, 13.0, 4.0, 6.0, 6.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.3671875, -13.9031982421875, -13.439208984375, -12.9752197265625, -12.51123046875, -12.0472412109375, -11.583251953125, -11.1192626953125, -10.6552734375, -10.1912841796875, -9.727294921875, -9.2633056640625, -8.79931640625, -8.3353271484375, -7.871337890625, -7.4073486328125, -6.943359375, -6.4793701171875, -6.015380859375, -5.5513916015625, -5.08740234375, -4.6234130859375, -4.159423828125, -3.6954345703125, -3.2314453125, -2.7674560546875, -2.303466796875, -1.8394775390625, -1.37548828125, -0.9114990234375, -0.447509765625, 0.0164794921875, 0.48046875, 0.9444580078125, 1.408447265625, 1.8724365234375, 2.33642578125, 2.8004150390625, 3.264404296875, 3.7283935546875, 4.1923828125, 4.6563720703125, 5.120361328125, 5.5843505859375, 6.04833984375, 6.5123291015625, 6.976318359375, 7.4403076171875, 7.904296875, 8.3682861328125, 8.832275390625, 9.2962646484375, 9.76025390625, 10.2242431640625, 10.688232421875, 11.1522216796875, 11.6162109375, 12.0802001953125, 12.544189453125, 13.0081787109375, 13.47216796875, 13.9361572265625, 14.400146484375, 14.8641357421875, 15.328125]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 10.0, 10.0, 19.0, 33.0, 45.0, 76.0, 105.0, 155.0, 243.0, 364.0, 505.0, 793.0, 1125.0, 1634.0, 2397.0, 3444.0, 4932.0, 7236.0, 10369.0, 15147.0, 21752.0, 33017.0, 51416.0, 84440.0, 150369.0, 1278106.0, 168074.0, 93569.0, 56396.0, 36015.0, 23567.0, 15893.0, 11053.0, 7682.0, 5328.0, 3746.0, 2544.0, 1822.0, 1212.0, 785.0, 563.0, 391.0, 253.0, 153.0, 121.0, 66.0, 51.0, 41.0, 28.0, 13.0, 14.0, 5.0, 3.0, 1.0, 2.0, 3.0, 2.0], "bins": [-0.9169921875, -0.88885498046875, -0.8607177734375, -0.83258056640625, -0.804443359375, -0.77630615234375, -0.7481689453125, -0.72003173828125, -0.69189453125, -0.66375732421875, -0.6356201171875, -0.60748291015625, -0.579345703125, -0.55120849609375, -0.5230712890625, -0.49493408203125, -0.466796875, -0.43865966796875, -0.4105224609375, -0.38238525390625, -0.354248046875, -0.32611083984375, -0.2979736328125, -0.26983642578125, -0.24169921875, -0.21356201171875, -0.1854248046875, -0.15728759765625, -0.129150390625, -0.10101318359375, -0.0728759765625, -0.04473876953125, -0.0166015625, 0.01153564453125, 0.0396728515625, 0.06781005859375, 0.095947265625, 0.12408447265625, 0.1522216796875, 0.18035888671875, 0.20849609375, 0.23663330078125, 0.2647705078125, 0.29290771484375, 0.321044921875, 0.34918212890625, 0.3773193359375, 0.40545654296875, 0.43359375, 0.46173095703125, 0.4898681640625, 0.51800537109375, 0.546142578125, 0.57427978515625, 0.6024169921875, 0.63055419921875, 0.65869140625, 0.68682861328125, 0.7149658203125, 0.74310302734375, 0.771240234375, 0.79937744140625, 0.8275146484375, 0.85565185546875, 0.8837890625]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 5.0, 4.0, 7.0, 12.0, 12.0, 14.0, 26.0, 31.0, 26.0, 48.0, 60.0, 61.0, 76.0, 78.0, 78.0, 53.0, 65.0, 67.0, 57.0, 46.0, 40.0, 37.0, 22.0, 10.0, 16.0, 18.0, 8.0, 9.0, 9.0, 7.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.005794525146484375, -0.005633056163787842, -0.005471587181091309, -0.005310118198394775, -0.005148649215698242, -0.004987180233001709, -0.004825711250305176, -0.004664242267608643, -0.004502773284912109, -0.004341304302215576, -0.004179835319519043, -0.00401836633682251, -0.0038568973541259766, -0.0036954283714294434, -0.00353395938873291, -0.003372490406036377, -0.0032110214233398438, -0.0030495524406433105, -0.0028880834579467773, -0.002726614475250244, -0.002565145492553711, -0.0024036765098571777, -0.0022422075271606445, -0.0020807385444641113, -0.0019192695617675781, -0.001757800579071045, -0.0015963315963745117, -0.0014348626136779785, -0.0012733936309814453, -0.0011119246482849121, -0.0009504556655883789, -0.0007889866828918457, -0.0006275177001953125, -0.0004660487174987793, -0.0003045797348022461, -0.0001431107521057129, 1.8358230590820312e-05, 0.00017982721328735352, 0.0003412961959838867, 0.0005027651786804199, 0.0006642341613769531, 0.0008257031440734863, 0.0009871721267700195, 0.0011486411094665527, 0.001310110092163086, 0.0014715790748596191, 0.0016330480575561523, 0.0017945170402526855, 0.0019559860229492188, 0.002117455005645752, 0.002278923988342285, 0.0024403929710388184, 0.0026018619537353516, 0.0027633309364318848, 0.002924799919128418, 0.003086268901824951, 0.0032477378845214844, 0.0034092068672180176, 0.0035706758499145508, 0.003732144832611084, 0.003893613815307617, 0.00405508279800415, 0.004216551780700684, 0.004378020763397217, 0.00453948974609375]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 2.0, 4.0, 7.0, 11.0, 19.0, 21.0, 19.0, 23.0, 35.0, 49.0, 72.0, 96.0, 160.0, 260.0, 773.0, 12765.0, 919352.0, 111488.0, 2319.0, 408.0, 233.0, 124.0, 78.0, 79.0, 43.0, 25.0, 24.0, 22.0, 9.0, 12.0, 7.0, 8.0, 2.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08160400390625, -0.078948974609375, -0.0762939453125, -0.073638916015625, -0.07098388671875, -0.068328857421875, -0.065673828125, -0.063018798828125, -0.06036376953125, -0.057708740234375, -0.0550537109375, -0.052398681640625, -0.04974365234375, -0.047088623046875, -0.04443359375, -0.041778564453125, -0.03912353515625, -0.036468505859375, -0.0338134765625, -0.031158447265625, -0.02850341796875, -0.025848388671875, -0.023193359375, -0.020538330078125, -0.01788330078125, -0.015228271484375, -0.0125732421875, -0.009918212890625, -0.00726318359375, -0.004608154296875, -0.001953125, 0.000701904296875, 0.00335693359375, 0.006011962890625, 0.0086669921875, 0.011322021484375, 0.01397705078125, 0.016632080078125, 0.019287109375, 0.021942138671875, 0.02459716796875, 0.027252197265625, 0.0299072265625, 0.032562255859375, 0.03521728515625, 0.037872314453125, 0.04052734375, 0.043182373046875, 0.04583740234375, 0.048492431640625, 0.0511474609375, 0.053802490234375, 0.05645751953125, 0.059112548828125, 0.061767578125, 0.064422607421875, 0.06707763671875, 0.069732666015625, 0.0723876953125, 0.075042724609375, 0.07769775390625, 0.080352783203125, 0.0830078125, 0.085662841796875, 0.08831787109375]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 12.0, 46.0, 175.0, 426.0, 249.0, 78.0, 14.0, 8.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.008297149091959, -0.007826501503586769, -0.007355854846537113, -0.00688520772382617, -0.006414560601115227, -0.005943913012742996, -0.00547326635569334, -0.00500261876732111, -0.004531972110271454, -0.004061324987560511, -0.0035906778648495674, -0.003120030742138624, -0.002649383619427681, -0.002178736263886094, -0.0017080891411751509, -0.0012374420184642076, -0.0007667946629226208, -0.0002961475111078471, 0.00017449964070692658, 0.0006451468216255307, 0.001115793944336474, 0.001586441183462739, 0.002057088306173682, 0.0025277354288846254, 0.0029983825515955687, 0.003469029674306512, 0.003939677029848099, 0.004410324152559042, 0.004880971275269985, 0.005351618397980928, 0.005822265520691872, 0.006292912643402815, 0.006763559766113758, 0.007234206888824701, 0.0077048540115356445, 0.008175501599907875, 0.008646148256957531, 0.009116795845329762, 0.009587442502379417, 0.010058090090751648, 0.010528736747801304, 0.010999384336173534, 0.01147003099322319, 0.01194067858159542, 0.012411325238645077, 0.012881972827017307, 0.013352619484066963, 0.013823267072439194, 0.014293914660811424, 0.014764562249183655, 0.01523520890623331, 0.015705855563282967, 0.016176503151655197, 0.016647150740027428, 0.017117798328399658, 0.01758844405412674, 0.01805909164249897, 0.0185297392308712, 0.01900038681924343, 0.019471032544970512, 0.019941680133342743, 0.020412327721714973, 0.020882975310087204, 0.021353621035814285, 0.021824268624186516]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 9.0, 0.0, 3.0, 3.0, 4.0, 6.0, 8.0, 7.0, 4.0, 9.0, 12.0, 14.0, 12.0, 20.0, 22.0, 19.0, 21.0, 23.0, 34.0, 31.0, 42.0, 39.0, 30.0, 47.0, 50.0, 34.0, 27.0, 34.0, 38.0, 41.0, 34.0, 27.0, 43.0, 33.0, 32.0, 30.0, 23.0, 22.0, 27.0, 16.0, 15.0, 8.0, 15.0, 7.0, 10.0, 11.0, 5.0, 1.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 4.0, 2.0], "bins": [-0.002365589141845703, -0.00229695625603199, -0.002228323370218277, -0.002159690484404564, -0.002091057598590851, -0.0020224247127771378, -0.0019537918269634247, -0.0018851589411497116, -0.0018165260553359985, -0.0017478931695222855, -0.0016792602837085724, -0.0016106273978948593, -0.0015419945120811462, -0.0014733616262674332, -0.00140472874045372, -0.001336095854640007, -0.001267462968826294, -0.0011988300830125809, -0.0011301971971988678, -0.0010615643113851547, -0.0009929314255714417, -0.0009242985397577286, -0.0008556656539440155, -0.0007870327681303024, -0.0007183998823165894, -0.0006497669965028763, -0.0005811341106891632, -0.0005125012248754501, -0.00044386833906173706, -0.000375235453248024, -0.0003066025674343109, -0.00023796968162059784, -0.00016933679580688477, -0.00010070390999317169, -3.207102417945862e-05, 3.6561861634254456e-05, 0.00010519474744796753, 0.0001738276332616806, 0.00024246051907539368, 0.00031109340488910675, 0.0003797262907028198, 0.0004483591765165329, 0.000516992062330246, 0.000585624948143959, 0.0006542578339576721, 0.0007228907197713852, 0.0007915236055850983, 0.0008601564913988113, 0.0009287893772125244, 0.0009974222630262375, 0.0010660551488399506, 0.0011346880346536636, 0.0012033209204673767, 0.0012719538062810898, 0.0013405866920948029, 0.001409219577908516, 0.001477852463722229, 0.001546485349535942, 0.0016151182353496552, 0.0016837511211633682, 0.0017523840069770813, 0.0018210168927907944, 0.0018896497786045074, 0.0019582826644182205, 0.0020269155502319336]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 4.0, 6.0, 8.0, 9.0, 11.0, 7.0, 15.0, 11.0, 21.0, 16.0, 27.0, 22.0, 25.0, 24.0, 36.0, 27.0, 38.0, 46.0, 31.0, 38.0, 35.0, 38.0, 45.0, 42.0, 47.0, 46.0, 43.0, 31.0, 33.0, 30.0, 31.0, 22.0, 21.0, 20.0, 21.0, 14.0, 10.0, 14.0, 10.0, 4.0, 7.0, 5.0, 4.0, 2.0, 1.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-22.75, -22.0517578125, -21.353515625, -20.6552734375, -19.95703125, -19.2587890625, -18.560546875, -17.8623046875, -17.1640625, -16.4658203125, -15.767578125, -15.0693359375, -14.37109375, -13.6728515625, -12.974609375, -12.2763671875, -11.578125, -10.8798828125, -10.181640625, -9.4833984375, -8.78515625, -8.0869140625, -7.388671875, -6.6904296875, -5.9921875, -5.2939453125, -4.595703125, -3.8974609375, -3.19921875, -2.5009765625, -1.802734375, -1.1044921875, -0.40625, 0.2919921875, 0.990234375, 1.6884765625, 2.38671875, 3.0849609375, 3.783203125, 4.4814453125, 5.1796875, 5.8779296875, 6.576171875, 7.2744140625, 7.97265625, 8.6708984375, 9.369140625, 10.0673828125, 10.765625, 11.4638671875, 12.162109375, 12.8603515625, 13.55859375, 14.2568359375, 14.955078125, 15.6533203125, 16.3515625, 17.0498046875, 17.748046875, 18.4462890625, 19.14453125, 19.8427734375, 20.541015625, 21.2392578125, 21.9375]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 1.0, 5.0, 4.0, 6.0, 10.0, 11.0, 13.0, 20.0, 21.0, 32.0, 43.0, 71.0, 97.0, 117.0, 213.0, 335.0, 534.0, 939.0, 1600.0, 3276.0, 7390.0, 22385.0, 135605.0, 749149.0, 95001.0, 18477.0, 6458.0, 2909.0, 1538.0, 877.0, 488.0, 303.0, 195.0, 141.0, 80.0, 44.0, 49.0, 34.0, 22.0, 14.0, 18.0, 8.0, 4.0, 5.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-38.90625, -37.7421875, -36.578125, -35.4140625, -34.25, -33.0859375, -31.921875, -30.7578125, -29.59375, -28.4296875, -27.265625, -26.1015625, -24.9375, -23.7734375, -22.609375, -21.4453125, -20.28125, -19.1171875, -17.953125, -16.7890625, -15.625, -14.4609375, -13.296875, -12.1328125, -10.96875, -9.8046875, -8.640625, -7.4765625, -6.3125, -5.1484375, -3.984375, -2.8203125, -1.65625, -0.4921875, 0.671875, 1.8359375, 3.0, 4.1640625, 5.328125, 6.4921875, 7.65625, 8.8203125, 9.984375, 11.1484375, 12.3125, 13.4765625, 14.640625, 15.8046875, 16.96875, 18.1328125, 19.296875, 20.4609375, 21.625, 22.7890625, 23.953125, 25.1171875, 26.28125, 27.4453125, 28.609375, 29.7734375, 30.9375, 32.1015625, 33.265625, 34.4296875, 35.59375]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 1.0, 2.0, 5.0, 8.0, 7.0, 15.0, 16.0, 8.0, 12.0, 13.0, 15.0, 22.0, 21.0, 46.0, 40.0, 39.0, 67.0, 60.0, 64.0, 102.0, 178.0, 1719.0, 129.0, 75.0, 54.0, 55.0, 37.0, 38.0, 38.0, 25.0, 23.0, 19.0, 21.0, 18.0, 13.0, 13.0, 12.0, 6.0, 4.0, 1.0, 2.0, 0.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-90.0, -87.1259765625, -84.251953125, -81.3779296875, -78.50390625, -75.6298828125, -72.755859375, -69.8818359375, -67.0078125, -64.1337890625, -61.259765625, -58.3857421875, -55.51171875, -52.6376953125, -49.763671875, -46.8896484375, -44.015625, -41.1416015625, -38.267578125, -35.3935546875, -32.51953125, -29.6455078125, -26.771484375, -23.8974609375, -21.0234375, -18.1494140625, -15.275390625, -12.4013671875, -9.52734375, -6.6533203125, -3.779296875, -0.9052734375, 1.96875, 4.8427734375, 7.716796875, 10.5908203125, 13.46484375, 16.3388671875, 19.212890625, 22.0869140625, 24.9609375, 27.8349609375, 30.708984375, 33.5830078125, 36.45703125, 39.3310546875, 42.205078125, 45.0791015625, 47.953125, 50.8271484375, 53.701171875, 56.5751953125, 59.44921875, 62.3232421875, 65.197265625, 68.0712890625, 70.9453125, 73.8193359375, 76.693359375, 79.5673828125, 82.44140625, 85.3154296875, 88.189453125, 91.0634765625, 93.9375]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 7.0, 6.0, 8.0, 12.0, 22.0, 29.0, 39.0, 66.0, 77.0, 126.0, 227.0, 439.0, 1515.0, 24387.0, 3108477.0, 8236.0, 1056.0, 398.0, 189.0, 138.0, 75.0, 46.0, 31.0, 26.0, 21.0, 15.0, 17.0, 5.0, 2.0, 6.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-248.875, -239.064453125, -229.25390625, -219.443359375, -209.6328125, -199.822265625, -190.01171875, -180.201171875, -170.390625, -160.580078125, -150.76953125, -140.958984375, -131.1484375, -121.337890625, -111.52734375, -101.716796875, -91.90625, -82.095703125, -72.28515625, -62.474609375, -52.6640625, -42.853515625, -33.04296875, -23.232421875, -13.421875, -3.611328125, 6.19921875, 16.009765625, 25.8203125, 35.630859375, 45.44140625, 55.251953125, 65.0625, 74.873046875, 84.68359375, 94.494140625, 104.3046875, 114.115234375, 123.92578125, 133.736328125, 143.546875, 153.357421875, 163.16796875, 172.978515625, 182.7890625, 192.599609375, 202.41015625, 212.220703125, 222.03125, 231.841796875, 241.65234375, 251.462890625, 261.2734375, 271.083984375, 280.89453125, 290.705078125, 300.515625, 310.326171875, 320.13671875, 329.947265625, 339.7578125, 349.568359375, 359.37890625, 369.189453125, 379.0]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 8.0, 8.0, 12.0, 39.0, 70.0, 157.0, 269.0, 219.0, 123.0, 59.0, 24.0, 12.0, 8.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-88.35208892822266, -83.11502075195312, -77.8779525756836, -72.64088439941406, -67.40380859375, -62.16674041748047, -56.92967224121094, -51.69260025024414, -46.45553207397461, -41.21846389770508, -35.98139190673828, -30.74432373046875, -25.507253646850586, -20.270183563232422, -15.03311538696289, -9.796043395996094, -4.5589752197265625, 0.6780943870544434, 5.915163993835449, 11.152233123779297, 16.38930320739746, 21.626373291015625, 26.863441467285156, 32.10051345825195, 37.337581634521484, 42.574649810791016, 47.81172180175781, 53.048789978027344, 58.285858154296875, 63.52293014526367, 68.75999450683594, 73.9970703125, 79.234130859375, 84.47119903564453, 89.70826721191406, 94.94534301757812, 100.18241119384766, 105.41947937011719, 110.65654754638672, 115.89361572265625, 121.13069152832031, 126.36775970458984, 131.60482788085938, 136.84190368652344, 142.07896423339844, 147.3160400390625, 152.5531005859375, 157.79017639160156, 163.02725219726562, 168.2643280029297, 173.5013885498047, 178.73846435546875, 183.97552490234375, 189.2126007080078, 194.44967651367188, 199.68673706054688, 204.92379760742188, 210.16087341308594, 215.39793395996094, 220.635009765625, 225.8720703125, 231.10914611816406, 236.34622192382812, 241.58328247070312, 246.8203582763672]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 8.0, 6.0, 9.0, 3.0, 11.0, 17.0, 10.0, 18.0, 16.0, 18.0, 21.0, 10.0, 25.0, 20.0, 31.0, 28.0, 35.0, 39.0, 39.0, 51.0, 36.0, 44.0, 36.0, 41.0, 43.0, 39.0, 45.0, 36.0, 36.0, 29.0, 33.0, 23.0, 16.0, 25.0, 19.0, 19.0, 18.0, 14.0, 13.0, 9.0, 5.0, 5.0, 3.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-184.27944946289062, -178.48728942871094, -172.6951446533203, -166.90298461914062, -161.11082458496094, -155.3186798095703, -149.52651977539062, -143.734375, -137.9422149658203, -132.15005493164062, -126.35790252685547, -120.56575012207031, -114.77359771728516, -108.9814453125, -103.18928527832031, -97.39713287353516, -91.60497283935547, -85.81282043457031, -80.02066040039062, -74.22850799560547, -68.43635559082031, -62.64419937133789, -56.85204315185547, -51.05989074707031, -45.26773452758789, -39.47557830810547, -33.68342590332031, -27.89126968383789, -22.0991153717041, -16.306961059570312, -10.51480484008789, -4.722652435302734, 1.0695037841796875, 6.861658573150635, 12.653813362121582, 18.445968627929688, 24.238122940063477, 30.030277252197266, 35.82243347167969, 41.614585876464844, 47.406742095947266, 53.19889831542969, 58.991050720214844, 64.783203125, 70.57536315917969, 76.36751556396484, 82.15966796875, 87.95182800292969, 93.74398040771484, 99.5361328125, 105.32829284667969, 111.12044525146484, 116.91259765625, 122.70475769042969, 128.49691772460938, 134.2890625, 140.0812225341797, 145.87338256835938, 151.66552734375, 157.4576873779297, 163.24984741210938, 169.0419921875, 174.8341522216797, 180.62631225585938, 186.41845703125]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 5.0, 5.0, 2.0, 9.0, 10.0, 17.0, 4.0, 13.0, 14.0, 14.0, 26.0, 15.0, 16.0, 33.0, 22.0, 30.0, 37.0, 38.0, 41.0, 31.0, 34.0, 36.0, 39.0, 49.0, 47.0, 44.0, 34.0, 37.0, 36.0, 34.0, 37.0, 23.0, 25.0, 19.0, 14.0, 21.0, 19.0, 16.0, 15.0, 11.0, 9.0, 3.0, 9.0, 6.0, 1.0, 0.0, 1.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-23.3125, -22.601806640625, -21.89111328125, -21.180419921875, -20.4697265625, -19.759033203125, -19.04833984375, -18.337646484375, -17.626953125, -16.916259765625, -16.20556640625, -15.494873046875, -14.7841796875, -14.073486328125, -13.36279296875, -12.652099609375, -11.94140625, -11.230712890625, -10.52001953125, -9.809326171875, -9.0986328125, -8.387939453125, -7.67724609375, -6.966552734375, -6.255859375, -5.545166015625, -4.83447265625, -4.123779296875, -3.4130859375, -2.702392578125, -1.99169921875, -1.281005859375, -0.5703125, 0.140380859375, 0.85107421875, 1.561767578125, 2.2724609375, 2.983154296875, 3.69384765625, 4.404541015625, 5.115234375, 5.825927734375, 6.53662109375, 7.247314453125, 7.9580078125, 8.668701171875, 9.37939453125, 10.090087890625, 10.80078125, 11.511474609375, 12.22216796875, 12.932861328125, 13.6435546875, 14.354248046875, 15.06494140625, 15.775634765625, 16.486328125, 17.197021484375, 17.90771484375, 18.618408203125, 19.3291015625, 20.039794921875, 20.75048828125, 21.461181640625, 22.171875]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 6.0, 8.0, 6.0, 9.0, 18.0, 23.0, 24.0, 33.0, 37.0, 37.0, 81.0, 113.0, 176.0, 274.0, 378.0, 519.0, 900.0, 1453.0, 2549.0, 4656.0, 9643.0, 25315.0, 558615.0, 3422234.0, 135125.0, 16635.0, 6917.0, 3468.0, 1935.0, 1095.0, 683.0, 424.0, 260.0, 187.0, 113.0, 84.0, 64.0, 43.0, 42.0, 25.0, 19.0, 14.0, 12.0, 10.0, 2.0, 1.0, 4.0, 7.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-79.6875, -77.220703125, -74.75390625, -72.287109375, -69.8203125, -67.353515625, -64.88671875, -62.419921875, -59.953125, -57.486328125, -55.01953125, -52.552734375, -50.0859375, -47.619140625, -45.15234375, -42.685546875, -40.21875, -37.751953125, -35.28515625, -32.818359375, -30.3515625, -27.884765625, -25.41796875, -22.951171875, -20.484375, -18.017578125, -15.55078125, -13.083984375, -10.6171875, -8.150390625, -5.68359375, -3.216796875, -0.75, 1.716796875, 4.18359375, 6.650390625, 9.1171875, 11.583984375, 14.05078125, 16.517578125, 18.984375, 21.451171875, 23.91796875, 26.384765625, 28.8515625, 31.318359375, 33.78515625, 36.251953125, 38.71875, 41.185546875, 43.65234375, 46.119140625, 48.5859375, 51.052734375, 53.51953125, 55.986328125, 58.453125, 60.919921875, 63.38671875, 65.853515625, 68.3203125, 70.787109375, 73.25390625, 75.720703125, 78.1875]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 5.0, 5.0, 5.0, 6.0, 13.0, 13.0, 14.0, 20.0, 17.0, 43.0, 36.0, 87.0, 179.0, 495.0, 1086.0, 1154.0, 437.0, 181.0, 88.0, 35.0, 30.0, 28.0, 25.0, 13.0, 17.0, 7.0, 6.0, 12.0, 3.0, 9.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-79.5625, -77.2236328125, -74.884765625, -72.5458984375, -70.20703125, -67.8681640625, -65.529296875, -63.1904296875, -60.8515625, -58.5126953125, -56.173828125, -53.8349609375, -51.49609375, -49.1572265625, -46.818359375, -44.4794921875, -42.140625, -39.8017578125, -37.462890625, -35.1240234375, -32.78515625, -30.4462890625, -28.107421875, -25.7685546875, -23.4296875, -21.0908203125, -18.751953125, -16.4130859375, -14.07421875, -11.7353515625, -9.396484375, -7.0576171875, -4.71875, -2.3798828125, -0.041015625, 2.2978515625, 4.63671875, 6.9755859375, 9.314453125, 11.6533203125, 13.9921875, 16.3310546875, 18.669921875, 21.0087890625, 23.34765625, 25.6865234375, 28.025390625, 30.3642578125, 32.703125, 35.0419921875, 37.380859375, 39.7197265625, 42.05859375, 44.3974609375, 46.736328125, 49.0751953125, 51.4140625, 53.7529296875, 56.091796875, 58.4306640625, 60.76953125, 63.1083984375, 65.447265625, 67.7861328125, 70.125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 3.0, 3.0, 10.0, 9.0, 12.0, 17.0, 26.0, 33.0, 69.0, 82.0, 161.0, 289.0, 580.0, 1509.0, 4069.0, 13027.0, 55027.0, 3359384.0, 706603.0, 37737.0, 9992.0, 3302.0, 1246.0, 508.0, 228.0, 135.0, 88.0, 42.0, 29.0, 28.0, 13.0, 7.0, 5.0, 7.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-137.75, -133.140625, -128.53125, -123.921875, -119.3125, -114.703125, -110.09375, -105.484375, -100.875, -96.265625, -91.65625, -87.046875, -82.4375, -77.828125, -73.21875, -68.609375, -64.0, -59.390625, -54.78125, -50.171875, -45.5625, -40.953125, -36.34375, -31.734375, -27.125, -22.515625, -17.90625, -13.296875, -8.6875, -4.078125, 0.53125, 5.140625, 9.75, 14.359375, 18.96875, 23.578125, 28.1875, 32.796875, 37.40625, 42.015625, 46.625, 51.234375, 55.84375, 60.453125, 65.0625, 69.671875, 74.28125, 78.890625, 83.5, 88.109375, 92.71875, 97.328125, 101.9375, 106.546875, 111.15625, 115.765625, 120.375, 124.984375, 129.59375, 134.203125, 138.8125, 143.421875, 148.03125, 152.640625, 157.25]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 1.0, 4.0, 3.0, 2.0, 6.0, 17.0, 9.0, 9.0, 28.0, 42.0, 62.0, 125.0, 182.0, 189.0, 113.0, 73.0, 53.0, 26.0, 18.0, 15.0, 11.0, 5.0, 10.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-148.41448974609375, -139.1709442138672, -129.92739868164062, -120.6838607788086, -111.44031524658203, -102.19676971435547, -92.95323181152344, -83.70968627929688, -74.46614074707031, -65.22259521484375, -55.97905349731445, -46.735511779785156, -37.491966247558594, -28.24842071533203, -19.004878997802734, -9.761337280273438, -0.517791748046875, 8.725751876831055, 17.969295501708984, 27.212839126586914, 36.456382751464844, 45.699928283691406, 54.9434700012207, 64.18701171875, 73.43055725097656, 82.67410278320312, 91.91764831542969, 101.16118621826172, 110.40473175048828, 119.64827728271484, 128.89181518554688, 138.13536071777344, 147.37893676757812, 156.6224822998047, 165.86602783203125, 175.1095733642578, 184.35311889648438, 193.59664916992188, 202.84019470214844, 212.083740234375, 221.32728576660156, 230.57083129882812, 239.8143768310547, 249.05792236328125, 258.30145263671875, 267.5450134277344, 276.7885437011719, 286.0321044921875, 295.275634765625, 304.5191650390625, 313.7627258300781, 323.0062561035156, 332.24981689453125, 341.49334716796875, 350.7369079589844, 359.9804382324219, 369.2239990234375, 378.467529296875, 387.7110900878906, 396.9546203613281, 406.19818115234375, 415.44171142578125, 424.6852722167969, 433.9288024902344, 443.1723327636719]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 0.0, 3.0, 4.0, 2.0, 10.0, 13.0, 6.0, 6.0, 13.0, 12.0, 18.0, 17.0, 32.0, 19.0, 31.0, 29.0, 29.0, 25.0, 40.0, 25.0, 36.0, 32.0, 45.0, 43.0, 28.0, 27.0, 34.0, 40.0, 33.0, 30.0, 37.0, 28.0, 34.0, 24.0, 24.0, 16.0, 18.0, 23.0, 23.0, 13.0, 13.0, 11.0, 10.0, 13.0, 8.0, 8.0, 8.0, 3.0, 4.0, 6.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-149.5488739013672, -145.10719299316406, -140.66549682617188, -136.22381591796875, -131.78211975097656, -127.34043884277344, -122.89875030517578, -118.45706176757812, -114.01537322998047, -109.57368469238281, -105.13199615478516, -100.6903076171875, -96.24862670898438, -91.80693054199219, -87.36524963378906, -82.9235610961914, -78.48187255859375, -74.0401840209961, -69.59849548339844, -65.15680694580078, -60.71512222290039, -56.273433685302734, -51.831748962402344, -47.39006042480469, -42.94837188720703, -38.506683349609375, -34.06499481201172, -29.623310089111328, -25.181621551513672, -20.739933013916016, -16.298246383666992, -11.856559753417969, -7.41485595703125, -2.97316837310791, 1.4685192108154297, 5.9102067947387695, 10.35189437866211, 14.793582916259766, 19.23526954650879, 23.676956176757812, 28.11864471435547, 32.560333251953125, 37.00202178955078, 41.44370651245117, 45.88539505004883, 50.327083587646484, 54.768768310546875, 59.21045684814453, 63.65214538574219, 68.09383392333984, 72.5355224609375, 76.97721099853516, 81.41889953613281, 85.86058044433594, 90.3022689819336, 94.74395751953125, 99.1856460571289, 103.62733459472656, 108.06902313232422, 112.51071166992188, 116.952392578125, 121.39408874511719, 125.83576965332031, 130.2774658203125, 134.71914672851562]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 8.0, 7.0, 9.0, 9.0, 17.0, 14.0, 20.0, 15.0, 22.0, 22.0, 25.0, 35.0, 30.0, 25.0, 38.0, 36.0, 47.0, 35.0, 32.0, 62.0, 43.0, 45.0, 46.0, 33.0, 49.0, 36.0, 34.0, 35.0, 26.0, 27.0, 21.0, 21.0, 16.0, 14.0, 13.0, 6.0, 6.0, 9.0, 4.0, 4.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-22.671875, -21.929443359375, -21.18701171875, -20.444580078125, -19.7021484375, -18.959716796875, -18.21728515625, -17.474853515625, -16.732421875, -15.989990234375, -15.24755859375, -14.505126953125, -13.7626953125, -13.020263671875, -12.27783203125, -11.535400390625, -10.79296875, -10.050537109375, -9.30810546875, -8.565673828125, -7.8232421875, -7.080810546875, -6.33837890625, -5.595947265625, -4.853515625, -4.111083984375, -3.36865234375, -2.626220703125, -1.8837890625, -1.141357421875, -0.39892578125, 0.343505859375, 1.0859375, 1.828369140625, 2.57080078125, 3.313232421875, 4.0556640625, 4.798095703125, 5.54052734375, 6.282958984375, 7.025390625, 7.767822265625, 8.51025390625, 9.252685546875, 9.9951171875, 10.737548828125, 11.47998046875, 12.222412109375, 12.96484375, 13.707275390625, 14.44970703125, 15.192138671875, 15.9345703125, 16.677001953125, 17.41943359375, 18.161865234375, 18.904296875, 19.646728515625, 20.38916015625, 21.131591796875, 21.8740234375, 22.616455078125, 23.35888671875, 24.101318359375, 24.84375]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 4.0, 7.0, 15.0, 10.0, 18.0, 40.0, 45.0, 67.0, 107.0, 133.0, 170.0, 272.0, 391.0, 609.0, 945.0, 1353.0, 2031.0, 3016.0, 4694.0, 7000.0, 10896.0, 17308.0, 27318.0, 45237.0, 75592.0, 133611.0, 222504.0, 201665.0, 117143.0, 67223.0, 39958.0, 24675.0, 15454.0, 9976.0, 6544.0, 4074.0, 2726.0, 1800.0, 1303.0, 823.0, 562.0, 388.0, 289.0, 151.0, 115.0, 83.0, 58.0, 45.0, 46.0, 20.0, 18.0, 10.0, 6.0, 5.0, 5.0, 3.0, 2.0], "bins": [-1.1494140625, -1.1154937744140625, -1.081573486328125, -1.0476531982421875, -1.01373291015625, -0.9798126220703125, -0.945892333984375, -0.9119720458984375, -0.8780517578125, -0.8441314697265625, -0.810211181640625, -0.7762908935546875, -0.74237060546875, -0.7084503173828125, -0.674530029296875, -0.6406097412109375, -0.606689453125, -0.5727691650390625, -0.538848876953125, -0.5049285888671875, -0.47100830078125, -0.4370880126953125, -0.403167724609375, -0.3692474365234375, -0.3353271484375, -0.3014068603515625, -0.267486572265625, -0.2335662841796875, -0.19964599609375, -0.1657257080078125, -0.131805419921875, -0.0978851318359375, -0.06396484375, -0.0300445556640625, 0.003875732421875, 0.0377960205078125, 0.07171630859375, 0.1056365966796875, 0.139556884765625, 0.1734771728515625, 0.2073974609375, 0.2413177490234375, 0.275238037109375, 0.3091583251953125, 0.34307861328125, 0.3769989013671875, 0.410919189453125, 0.4448394775390625, 0.478759765625, 0.5126800537109375, 0.546600341796875, 0.5805206298828125, 0.61444091796875, 0.6483612060546875, 0.682281494140625, 0.7162017822265625, 0.7501220703125, 0.7840423583984375, 0.817962646484375, 0.8518829345703125, 0.88580322265625, 0.9197235107421875, 0.953643798828125, 0.9875640869140625, 1.021484375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 6.0, 5.0, 8.0, 8.0, 8.0, 15.0, 15.0, 16.0, 19.0, 22.0, 27.0, 32.0, 32.0, 31.0, 55.0, 51.0, 51.0, 52.0, 35.0, 1073.0, 55.0, 43.0, 47.0, 28.0, 36.0, 31.0, 37.0, 25.0, 31.0, 19.0, 19.0, 14.0, 21.0, 16.0, 11.0, 7.0, 6.0, 4.0, 7.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0], "bins": [-18.796875, -18.2950439453125, -17.793212890625, -17.2913818359375, -16.78955078125, -16.2877197265625, -15.785888671875, -15.2840576171875, -14.7822265625, -14.2803955078125, -13.778564453125, -13.2767333984375, -12.77490234375, -12.2730712890625, -11.771240234375, -11.2694091796875, -10.767578125, -10.2657470703125, -9.763916015625, -9.2620849609375, -8.76025390625, -8.2584228515625, -7.756591796875, -7.2547607421875, -6.7529296875, -6.2510986328125, -5.749267578125, -5.2474365234375, -4.74560546875, -4.2437744140625, -3.741943359375, -3.2401123046875, -2.73828125, -2.2364501953125, -1.734619140625, -1.2327880859375, -0.73095703125, -0.2291259765625, 0.272705078125, 0.7745361328125, 1.2763671875, 1.7781982421875, 2.280029296875, 2.7818603515625, 3.28369140625, 3.7855224609375, 4.287353515625, 4.7891845703125, 5.291015625, 5.7928466796875, 6.294677734375, 6.7965087890625, 7.29833984375, 7.8001708984375, 8.302001953125, 8.8038330078125, 9.3056640625, 9.8074951171875, 10.309326171875, 10.8111572265625, 11.31298828125, 11.8148193359375, 12.316650390625, 12.8184814453125, 13.3203125]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 3.0, 11.0, 11.0, 20.0, 35.0, 37.0, 67.0, 82.0, 149.0, 204.0, 320.0, 493.0, 734.0, 1118.0, 1643.0, 2530.0, 3899.0, 5814.0, 8718.0, 13920.0, 21844.0, 36409.0, 62708.0, 117720.0, 253413.0, 1267008.0, 127291.0, 67418.0, 38545.0, 23094.0, 14563.0, 9414.0, 6091.0, 3921.0, 2687.0, 1710.0, 1174.0, 832.0, 474.0, 331.0, 243.0, 165.0, 88.0, 61.0, 40.0, 27.0, 20.0, 12.0, 8.0, 4.0, 6.0, 5.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-1.0283203125, -0.995208740234375, -0.96209716796875, -0.928985595703125, -0.8958740234375, -0.862762451171875, -0.82965087890625, -0.796539306640625, -0.763427734375, -0.730316162109375, -0.69720458984375, -0.664093017578125, -0.6309814453125, -0.597869873046875, -0.56475830078125, -0.531646728515625, -0.49853515625, -0.465423583984375, -0.43231201171875, -0.399200439453125, -0.3660888671875, -0.332977294921875, -0.29986572265625, -0.266754150390625, -0.233642578125, -0.200531005859375, -0.16741943359375, -0.134307861328125, -0.1011962890625, -0.068084716796875, -0.03497314453125, -0.001861572265625, 0.03125, 0.064361572265625, 0.09747314453125, 0.130584716796875, 0.1636962890625, 0.196807861328125, 0.22991943359375, 0.263031005859375, 0.296142578125, 0.329254150390625, 0.36236572265625, 0.395477294921875, 0.4285888671875, 0.461700439453125, 0.49481201171875, 0.527923583984375, 0.56103515625, 0.594146728515625, 0.62725830078125, 0.660369873046875, 0.6934814453125, 0.726593017578125, 0.75970458984375, 0.792816162109375, 0.825927734375, 0.859039306640625, 0.89215087890625, 0.925262451171875, 0.9583740234375, 0.991485595703125, 1.02459716796875, 1.057708740234375, 1.0908203125]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 4.0, 5.0, 6.0, 6.0, 6.0, 11.0, 14.0, 17.0, 25.0, 28.0, 39.0, 39.0, 43.0, 49.0, 49.0, 42.0, 60.0, 50.0, 42.0, 61.0, 48.0, 55.0, 50.0, 46.0, 41.0, 35.0, 17.0, 19.0, 14.0, 20.0, 13.0, 17.0, 9.0, 4.0, 6.0, 8.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.004486083984375, -0.004356026649475098, -0.004225969314575195, -0.004095911979675293, -0.003965854644775391, -0.0038357973098754883, -0.003705739974975586, -0.0035756826400756836, -0.0034456253051757812, -0.003315567970275879, -0.0031855106353759766, -0.0030554533004760742, -0.002925395965576172, -0.0027953386306762695, -0.002665281295776367, -0.002535223960876465, -0.0024051666259765625, -0.00227510929107666, -0.002145051956176758, -0.0020149946212768555, -0.0018849372863769531, -0.0017548799514770508, -0.0016248226165771484, -0.001494765281677246, -0.0013647079467773438, -0.0012346506118774414, -0.001104593276977539, -0.0009745359420776367, -0.0008444786071777344, -0.000714421272277832, -0.0005843639373779297, -0.00045430660247802734, -0.000324249267578125, -0.00019419193267822266, -6.413459777832031e-05, 6.592273712158203e-05, 0.00019598007202148438, 0.0003260374069213867, 0.00045609474182128906, 0.0005861520767211914, 0.0007162094116210938, 0.0008462667465209961, 0.0009763240814208984, 0.0011063814163208008, 0.0012364387512207031, 0.0013664960861206055, 0.0014965534210205078, 0.0016266107559204102, 0.0017566680908203125, 0.0018867254257202148, 0.002016782760620117, 0.0021468400955200195, 0.002276897430419922, 0.0024069547653198242, 0.0025370121002197266, 0.002667069435119629, 0.0027971267700195312, 0.0029271841049194336, 0.003057241439819336, 0.0031872987747192383, 0.0033173561096191406, 0.003447413444519043, 0.0035774707794189453, 0.0037075281143188477, 0.00383758544921875]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 5.0, 1.0, 3.0, 6.0, 13.0, 16.0, 19.0, 12.0, 26.0, 30.0, 43.0, 47.0, 93.0, 108.0, 165.0, 309.0, 1347.0, 39224.0, 972675.0, 32292.0, 1165.0, 322.0, 192.0, 112.0, 78.0, 59.0, 53.0, 37.0, 24.0, 17.0, 18.0, 12.0, 9.0, 9.0, 2.0, 7.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.081298828125, -0.07871627807617188, -0.07613372802734375, -0.07355117797851562, -0.0709686279296875, -0.06838607788085938, -0.06580352783203125, -0.06322097778320312, -0.060638427734375, -0.058055877685546875, -0.05547332763671875, -0.052890777587890625, -0.0503082275390625, -0.047725677490234375, -0.04514312744140625, -0.042560577392578125, -0.03997802734375, -0.037395477294921875, -0.03481292724609375, -0.032230377197265625, -0.0296478271484375, -0.027065277099609375, -0.02448272705078125, -0.021900177001953125, -0.019317626953125, -0.016735076904296875, -0.01415252685546875, -0.011569976806640625, -0.0089874267578125, -0.006404876708984375, -0.00382232666015625, -0.001239776611328125, 0.0013427734375, 0.003925323486328125, 0.00650787353515625, 0.009090423583984375, 0.0116729736328125, 0.014255523681640625, 0.01683807373046875, 0.019420623779296875, 0.022003173828125, 0.024585723876953125, 0.02716827392578125, 0.029750823974609375, 0.0323333740234375, 0.034915924072265625, 0.03749847412109375, 0.040081024169921875, 0.04266357421875, 0.045246124267578125, 0.04782867431640625, 0.050411224365234375, 0.0529937744140625, 0.055576324462890625, 0.05815887451171875, 0.060741424560546875, 0.063323974609375, 0.06590652465820312, 0.06848907470703125, 0.07107162475585938, 0.0736541748046875, 0.07623672485351562, 0.07881927490234375, 0.08140182495117188, 0.083984375]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 10.0, 72.0, 440.0, 382.0, 87.0, 15.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.014348218217492104, -0.013694781810045242, -0.013041345402598381, -0.01238790899515152, -0.011734472587704659, -0.011081036180257797, -0.010427598841488361, -0.0097741624340415, -0.009120726026594639, -0.008467289619147778, -0.007813853211700916, -0.007160416338592768, -0.0065069799311459064, -0.005853543523699045, -0.005200106650590897, -0.004546670243144035, -0.003893233835697174, -0.003239797428250313, -0.002586360787972808, -0.001932924147695303, -0.0012794877402484417, -0.0006260513328015804, 2.7385540306568146e-05, 0.0006808219477534294, 0.0013342583552002907, 0.001987694762647152, 0.002641131402924657, 0.003294568043202162, 0.003948004450649023, 0.004601440858095884, 0.005254877731204033, 0.005908314138650894, 0.006561752408742905, 0.007215188816189766, 0.007868625223636627, 0.008522061631083488, 0.00917549803853035, 0.009828934445977211, 0.010482371784746647, 0.011135808192193508, 0.01178924459964037, 0.01244268100708723, 0.013096117414534092, 0.013749554753303528, 0.014402991160750389, 0.01505642756819725, 0.01570986397564411, 0.016363300383090973, 0.017016736790537834, 0.017670173197984695, 0.018323609605431557, 0.018977046012878418, 0.01963048242032528, 0.02028391882777214, 0.02093735709786415, 0.021590791642665863, 0.022244229912757874, 0.022897666320204735, 0.023551102727651596, 0.024204539135098457, 0.02485797554254532, 0.02551141194999218, 0.02616484835743904, 0.02681828662753105, 0.027471721172332764]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 8.0, 5.0, 10.0, 9.0, 15.0, 9.0, 23.0, 15.0, 16.0, 26.0, 33.0, 23.0, 28.0, 29.0, 26.0, 40.0, 42.0, 38.0, 46.0, 31.0, 43.0, 32.0, 47.0, 37.0, 38.0, 30.0, 42.0, 27.0, 29.0, 31.0, 24.0, 24.0, 24.0, 22.0, 17.0, 13.0, 12.0, 11.0, 14.0, 5.0, 1.0, 6.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.002149343490600586, -0.0020791543647646904, -0.002008965238928795, -0.0019387761130928993, -0.0018685869872570038, -0.0017983978614211082, -0.0017282087355852127, -0.0016580196097493172, -0.0015878304839134216, -0.001517641358077526, -0.0014474522322416306, -0.001377263106405735, -0.0013070739805698395, -0.001236884854733944, -0.0011666957288980484, -0.0010965066030621529, -0.0010263174772262573, -0.0009561283513903618, -0.0008859392255544662, -0.0008157500997185707, -0.0007455609738826752, -0.0006753718480467796, -0.0006051827222108841, -0.0005349935963749886, -0.000464804470539093, -0.0003946153447031975, -0.00032442621886730194, -0.0002542370930314064, -0.00018404796719551086, -0.00011385884135961533, -4.366971552371979e-05, 2.651941031217575e-05, 9.670853614807129e-05, 0.00016689766198396683, 0.00023708678781986237, 0.0003072759136557579, 0.00037746503949165344, 0.000447654165327549, 0.0005178432911634445, 0.0005880324169993401, 0.0006582215428352356, 0.0007284106686711311, 0.0007985997945070267, 0.0008687889203429222, 0.0009389780461788177, 0.0010091671720147133, 0.0010793562978506088, 0.0011495454236865044, 0.0012197345495224, 0.0012899236753582954, 0.001360112801194191, 0.0014303019270300865, 0.001500491052865982, 0.0015706801787018776, 0.0016408693045377731, 0.0017110584303736687, 0.0017812475562095642, 0.0018514366820454597, 0.0019216258078813553, 0.001991814933717251, 0.0020620040595531464, 0.002132193185389042, 0.0022023823112249374, 0.002272571437060833, 0.0023427605628967285]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 8.0, 7.0, 9.0, 9.0, 17.0, 14.0, 20.0, 15.0, 22.0, 22.0, 25.0, 35.0, 30.0, 25.0, 38.0, 36.0, 47.0, 35.0, 32.0, 62.0, 43.0, 45.0, 46.0, 33.0, 49.0, 36.0, 34.0, 35.0, 26.0, 27.0, 21.0, 21.0, 16.0, 14.0, 13.0, 6.0, 6.0, 9.0, 4.0, 4.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-22.671875, -21.929443359375, -21.18701171875, -20.444580078125, -19.7021484375, -18.959716796875, -18.21728515625, -17.474853515625, -16.732421875, -15.989990234375, -15.24755859375, -14.505126953125, -13.7626953125, -13.020263671875, -12.27783203125, -11.535400390625, -10.79296875, -10.050537109375, -9.30810546875, -8.565673828125, -7.8232421875, -7.080810546875, -6.33837890625, -5.595947265625, -4.853515625, -4.111083984375, -3.36865234375, -2.626220703125, -1.8837890625, -1.141357421875, -0.39892578125, 0.343505859375, 1.0859375, 1.828369140625, 2.57080078125, 3.313232421875, 4.0556640625, 4.798095703125, 5.54052734375, 6.282958984375, 7.025390625, 7.767822265625, 8.51025390625, 9.252685546875, 9.9951171875, 10.737548828125, 11.47998046875, 12.222412109375, 12.96484375, 13.707275390625, 14.44970703125, 15.192138671875, 15.9345703125, 16.677001953125, 17.41943359375, 18.161865234375, 18.904296875, 19.646728515625, 20.38916015625, 21.131591796875, 21.8740234375, 22.616455078125, 23.35888671875, 24.101318359375, 24.84375]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 12.0, 9.0, 12.0, 6.0, 24.0, 28.0, 45.0, 56.0, 88.0, 120.0, 187.0, 289.0, 416.0, 599.0, 1005.0, 1588.0, 2712.0, 4909.0, 9430.0, 23553.0, 103341.0, 679998.0, 164657.0, 30620.0, 11143.0, 5457.0, 3186.0, 1837.0, 1120.0, 690.0, 433.0, 315.0, 222.0, 114.0, 91.0, 63.0, 57.0, 34.0, 28.0, 12.0, 15.0, 10.0, 6.0, 9.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0], "bins": [-32.09375, -31.138916015625, -30.18408203125, -29.229248046875, -28.2744140625, -27.319580078125, -26.36474609375, -25.409912109375, -24.455078125, -23.500244140625, -22.54541015625, -21.590576171875, -20.6357421875, -19.680908203125, -18.72607421875, -17.771240234375, -16.81640625, -15.861572265625, -14.90673828125, -13.951904296875, -12.9970703125, -12.042236328125, -11.08740234375, -10.132568359375, -9.177734375, -8.222900390625, -7.26806640625, -6.313232421875, -5.3583984375, -4.403564453125, -3.44873046875, -2.493896484375, -1.5390625, -0.584228515625, 0.37060546875, 1.325439453125, 2.2802734375, 3.235107421875, 4.18994140625, 5.144775390625, 6.099609375, 7.054443359375, 8.00927734375, 8.964111328125, 9.9189453125, 10.873779296875, 11.82861328125, 12.783447265625, 13.73828125, 14.693115234375, 15.64794921875, 16.602783203125, 17.5576171875, 18.512451171875, 19.46728515625, 20.422119140625, 21.376953125, 22.331787109375, 23.28662109375, 24.241455078125, 25.1962890625, 26.151123046875, 27.10595703125, 28.060791015625, 29.015625]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 3.0, 5.0, 7.0, 9.0, 10.0, 23.0, 11.0, 13.0, 20.0, 30.0, 36.0, 47.0, 35.0, 45.0, 63.0, 56.0, 77.0, 279.0, 1726.0, 94.0, 74.0, 52.0, 48.0, 37.0, 39.0, 33.0, 32.0, 28.0, 22.0, 19.0, 14.0, 15.0, 9.0, 8.0, 5.0, 3.0, 8.0, 1.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 3.0], "bins": [-87.25, -84.6953125, -82.140625, -79.5859375, -77.03125, -74.4765625, -71.921875, -69.3671875, -66.8125, -64.2578125, -61.703125, -59.1484375, -56.59375, -54.0390625, -51.484375, -48.9296875, -46.375, -43.8203125, -41.265625, -38.7109375, -36.15625, -33.6015625, -31.046875, -28.4921875, -25.9375, -23.3828125, -20.828125, -18.2734375, -15.71875, -13.1640625, -10.609375, -8.0546875, -5.5, -2.9453125, -0.390625, 2.1640625, 4.71875, 7.2734375, 9.828125, 12.3828125, 14.9375, 17.4921875, 20.046875, 22.6015625, 25.15625, 27.7109375, 30.265625, 32.8203125, 35.375, 37.9296875, 40.484375, 43.0390625, 45.59375, 48.1484375, 50.703125, 53.2578125, 55.8125, 58.3671875, 60.921875, 63.4765625, 66.03125, 68.5859375, 71.140625, 73.6953125, 76.25]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 6.0, 8.0, 6.0, 15.0, 17.0, 27.0, 43.0, 65.0, 102.0, 137.0, 295.0, 980.0, 22992.0, 3114994.0, 4917.0, 585.0, 196.0, 116.0, 72.0, 45.0, 32.0, 17.0, 12.0, 10.0, 5.0, 2.0, 2.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-308.5, -297.98046875, -287.4609375, -276.94140625, -266.421875, -255.90234375, -245.3828125, -234.86328125, -224.34375, -213.82421875, -203.3046875, -192.78515625, -182.265625, -171.74609375, -161.2265625, -150.70703125, -140.1875, -129.66796875, -119.1484375, -108.62890625, -98.109375, -87.58984375, -77.0703125, -66.55078125, -56.03125, -45.51171875, -34.9921875, -24.47265625, -13.953125, -3.43359375, 7.0859375, 17.60546875, 28.125, 38.64453125, 49.1640625, 59.68359375, 70.203125, 80.72265625, 91.2421875, 101.76171875, 112.28125, 122.80078125, 133.3203125, 143.83984375, 154.359375, 164.87890625, 175.3984375, 185.91796875, 196.4375, 206.95703125, 217.4765625, 227.99609375, 238.515625, 249.03515625, 259.5546875, 270.07421875, 280.59375, 291.11328125, 301.6328125, 312.15234375, 322.671875, 333.19140625, 343.7109375, 354.23046875, 364.75]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 5.0, 8.0, 6.0, 10.0, 31.0, 50.0, 92.0, 138.0, 248.0, 216.0, 103.0, 56.0, 19.0, 15.0, 11.0, 4.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.34490203857422, -58.84526062011719, -53.345619201660156, -47.84598159790039, -42.34634017944336, -36.84669876098633, -31.347061157226562, -25.84741973876953, -20.3477783203125, -14.848137855529785, -9.34849739074707, -3.848857879638672, 1.6507835388183594, 7.150424957275391, 12.650062561035156, 18.149703979492188, 23.64934539794922, 29.14898681640625, 34.64862823486328, 40.14826583862305, 45.64790725708008, 51.14754867553711, 56.647186279296875, 62.146827697753906, 67.64646911621094, 73.14611053466797, 78.645751953125, 84.1453857421875, 89.64503479003906, 95.14466857910156, 100.6443099975586, 106.14395141601562, 111.64358520507812, 117.14322662353516, 122.64286804199219, 128.1425018310547, 133.64215087890625, 139.14178466796875, 144.64141845703125, 150.1410675048828, 155.64071655273438, 161.14035034179688, 166.63999938964844, 172.13963317871094, 177.6392822265625, 183.138916015625, 188.6385498046875, 194.13819885253906, 199.63783264160156, 205.13746643066406, 210.63711547851562, 216.13674926757812, 221.6363983154297, 227.1360321044922, 232.63568115234375, 238.13531494140625, 243.63494873046875, 249.13458251953125, 254.6342315673828, 260.1338806152344, 265.6335144042969, 271.1331481933594, 276.6327819824219, 282.1324462890625, 287.632080078125]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 7.0, 6.0, 8.0, 9.0, 8.0, 9.0, 12.0, 7.0, 11.0, 18.0, 18.0, 22.0, 25.0, 24.0, 20.0, 14.0, 25.0, 29.0, 32.0, 36.0, 33.0, 33.0, 33.0, 48.0, 48.0, 41.0, 29.0, 44.0, 40.0, 27.0, 41.0, 40.0, 33.0, 33.0, 27.0, 14.0, 25.0, 16.0, 12.0, 6.0, 8.0, 9.0, 5.0, 10.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 2.0, 2.0], "bins": [-224.2779998779297, -218.01217651367188, -211.746337890625, -205.4805145263672, -199.21469116210938, -192.9488525390625, -186.6830291748047, -180.41720581054688, -174.1513671875, -167.8855438232422, -161.6197052001953, -155.3538818359375, -149.0880584716797, -142.8222198486328, -136.556396484375, -130.29055786132812, -124.02474212646484, -117.7589111328125, -111.49308776855469, -105.22725677490234, -98.96142578125, -92.69560241699219, -86.42977142333984, -80.1639404296875, -73.89811706542969, -67.63228607177734, -61.366458892822266, -55.10063171386719, -48.834800720214844, -42.568973541259766, -36.30314636230469, -30.037315368652344, -23.771484375, -17.50565528869629, -11.239827156066895, -4.9739990234375, 1.291830062866211, 7.557659149169922, 13.823486328125, 20.089317321777344, 26.355144500732422, 32.6209716796875, 38.886802673339844, 45.15262985229492, 51.41845703125, 57.684288024902344, 63.95011520385742, 70.2159423828125, 76.48177337646484, 82.74760437011719, 89.013427734375, 95.27925872802734, 101.54508972167969, 107.8109130859375, 114.07674407958984, 120.34257507324219, 126.6083984375, 132.8742218017578, 139.1400604248047, 145.4058837890625, 151.6717071533203, 157.9375457763672, 164.203369140625, 170.46920776367188, 176.7350311279297]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 3.0, 9.0, 12.0, 11.0, 7.0, 19.0, 16.0, 20.0, 17.0, 15.0, 27.0, 33.0, 24.0, 36.0, 38.0, 48.0, 34.0, 42.0, 37.0, 43.0, 55.0, 40.0, 38.0, 45.0, 38.0, 46.0, 32.0, 28.0, 35.0, 25.0, 22.0, 26.0, 9.0, 18.0, 16.0, 5.0, 9.0, 5.0, 3.0, 2.0, 6.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-25.46875, -24.66552734375, -23.8623046875, -23.05908203125, -22.255859375, -21.45263671875, -20.6494140625, -19.84619140625, -19.04296875, -18.23974609375, -17.4365234375, -16.63330078125, -15.830078125, -15.02685546875, -14.2236328125, -13.42041015625, -12.6171875, -11.81396484375, -11.0107421875, -10.20751953125, -9.404296875, -8.60107421875, -7.7978515625, -6.99462890625, -6.19140625, -5.38818359375, -4.5849609375, -3.78173828125, -2.978515625, -2.17529296875, -1.3720703125, -0.56884765625, 0.234375, 1.03759765625, 1.8408203125, 2.64404296875, 3.447265625, 4.25048828125, 5.0537109375, 5.85693359375, 6.66015625, 7.46337890625, 8.2666015625, 9.06982421875, 9.873046875, 10.67626953125, 11.4794921875, 12.28271484375, 13.0859375, 13.88916015625, 14.6923828125, 15.49560546875, 16.298828125, 17.10205078125, 17.9052734375, 18.70849609375, 19.51171875, 20.31494140625, 21.1181640625, 21.92138671875, 22.724609375, 23.52783203125, 24.3310546875, 25.13427734375, 25.9375]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 6.0, 5.0, 16.0, 20.0, 19.0, 14.0, 35.0, 33.0, 55.0, 66.0, 88.0, 139.0, 227.0, 325.0, 530.0, 1042.0, 2168.0, 4836.0, 11022.0, 53803.0, 2614181.0, 1452386.0, 35847.0, 9371.0, 3878.0, 1826.0, 913.0, 494.0, 282.0, 198.0, 129.0, 90.0, 57.0, 47.0, 32.0, 28.0, 17.0, 15.0, 17.0, 7.0, 4.0, 9.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-82.1875, -79.529296875, -76.87109375, -74.212890625, -71.5546875, -68.896484375, -66.23828125, -63.580078125, -60.921875, -58.263671875, -55.60546875, -52.947265625, -50.2890625, -47.630859375, -44.97265625, -42.314453125, -39.65625, -36.998046875, -34.33984375, -31.681640625, -29.0234375, -26.365234375, -23.70703125, -21.048828125, -18.390625, -15.732421875, -13.07421875, -10.416015625, -7.7578125, -5.099609375, -2.44140625, 0.216796875, 2.875, 5.533203125, 8.19140625, 10.849609375, 13.5078125, 16.166015625, 18.82421875, 21.482421875, 24.140625, 26.798828125, 29.45703125, 32.115234375, 34.7734375, 37.431640625, 40.08984375, 42.748046875, 45.40625, 48.064453125, 50.72265625, 53.380859375, 56.0390625, 58.697265625, 61.35546875, 64.013671875, 66.671875, 69.330078125, 71.98828125, 74.646484375, 77.3046875, 79.962890625, 82.62109375, 85.279296875, 87.9375]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 0.0, 3.0, 4.0, 0.0, 3.0, 1.0, 0.0, 5.0, 6.0, 5.0, 6.0, 12.0, 10.0, 10.0, 25.0, 16.0, 25.0, 30.0, 37.0, 61.0, 94.0, 172.0, 334.0, 605.0, 986.0, 725.0, 380.0, 174.0, 85.0, 66.0, 38.0, 35.0, 28.0, 20.0, 16.0, 14.0, 8.0, 12.0, 7.0, 4.0, 7.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-50.0, -48.25048828125, -46.5009765625, -44.75146484375, -43.001953125, -41.25244140625, -39.5029296875, -37.75341796875, -36.00390625, -34.25439453125, -32.5048828125, -30.75537109375, -29.005859375, -27.25634765625, -25.5068359375, -23.75732421875, -22.0078125, -20.25830078125, -18.5087890625, -16.75927734375, -15.009765625, -13.26025390625, -11.5107421875, -9.76123046875, -8.01171875, -6.26220703125, -4.5126953125, -2.76318359375, -1.013671875, 0.73583984375, 2.4853515625, 4.23486328125, 5.984375, 7.73388671875, 9.4833984375, 11.23291015625, 12.982421875, 14.73193359375, 16.4814453125, 18.23095703125, 19.98046875, 21.72998046875, 23.4794921875, 25.22900390625, 26.978515625, 28.72802734375, 30.4775390625, 32.22705078125, 33.9765625, 35.72607421875, 37.4755859375, 39.22509765625, 40.974609375, 42.72412109375, 44.4736328125, 46.22314453125, 47.97265625, 49.72216796875, 51.4716796875, 53.22119140625, 54.970703125, 56.72021484375, 58.4697265625, 60.21923828125, 61.96875]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 4.0, 6.0, 11.0, 8.0, 13.0, 16.0, 23.0, 32.0, 52.0, 96.0, 201.0, 474.0, 1481.0, 5490.0, 28805.0, 1324035.0, 2791166.0, 33466.0, 6173.0, 1651.0, 562.0, 229.0, 91.0, 51.0, 33.0, 31.0, 13.0, 14.0, 11.0, 9.0, 7.0, 8.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-205.25, -199.5546875, -193.859375, -188.1640625, -182.46875, -176.7734375, -171.078125, -165.3828125, -159.6875, -153.9921875, -148.296875, -142.6015625, -136.90625, -131.2109375, -125.515625, -119.8203125, -114.125, -108.4296875, -102.734375, -97.0390625, -91.34375, -85.6484375, -79.953125, -74.2578125, -68.5625, -62.8671875, -57.171875, -51.4765625, -45.78125, -40.0859375, -34.390625, -28.6953125, -23.0, -17.3046875, -11.609375, -5.9140625, -0.21875, 5.4765625, 11.171875, 16.8671875, 22.5625, 28.2578125, 33.953125, 39.6484375, 45.34375, 51.0390625, 56.734375, 62.4296875, 68.125, 73.8203125, 79.515625, 85.2109375, 90.90625, 96.6015625, 102.296875, 107.9921875, 113.6875, 119.3828125, 125.078125, 130.7734375, 136.46875, 142.1640625, 147.859375, 153.5546875, 159.25]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 8.0, 19.0, 36.0, 125.0, 357.0, 326.0, 92.0, 27.0, 11.0, 8.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-317.2574462890625, -295.9310607910156, -274.60467529296875, -253.2782745361328, -231.95188903808594, -210.62550354003906, -189.29910278320312, -167.97271728515625, -146.64633178710938, -125.3199462890625, -103.9935531616211, -82.66716003417969, -61.34077453613281, -40.01438903808594, -18.68799591064453, 2.638397216796875, 23.96478271484375, 45.29117202758789, 66.61756134033203, 87.94395446777344, 109.27033996582031, 130.5967254638672, 151.92312622070312, 173.24951171875, 194.57589721679688, 215.90228271484375, 237.22866821289062, 258.5550537109375, 279.8814697265625, 301.20782470703125, 322.53424072265625, 343.8606262207031, 365.18701171875, 386.5133972167969, 407.83978271484375, 429.1661682128906, 450.4925537109375, 471.8189697265625, 493.1453552246094, 514.4717407226562, 535.798095703125, 557.12451171875, 578.4508666992188, 599.7772827148438, 621.1036376953125, 642.4300537109375, 663.7564086914062, 685.0828247070312, 706.4092407226562, 727.7356567382812, 749.06201171875, 770.388427734375, 791.7147827148438, 813.0411987304688, 834.3675537109375, 855.6939697265625, 877.0203857421875, 898.3468017578125, 919.6731567382812, 940.9995727539062, 962.325927734375, 983.65234375, 1004.9786987304688, 1026.30517578125, 1047.6314697265625]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 9.0, 7.0, 4.0, 8.0, 5.0, 7.0, 10.0, 13.0, 12.0, 21.0, 19.0, 17.0, 27.0, 23.0, 24.0, 23.0, 33.0, 26.0, 31.0, 25.0, 32.0, 25.0, 39.0, 43.0, 40.0, 40.0, 47.0, 41.0, 40.0, 25.0, 27.0, 29.0, 26.0, 25.0, 26.0, 23.0, 23.0, 13.0, 12.0, 13.0, 8.0, 17.0, 9.0, 8.0, 2.0, 6.0, 9.0, 6.0, 5.0, 2.0, 0.0, 2.0, 2.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-119.8083724975586, -115.5762939453125, -111.3442153930664, -107.11213684082031, -102.88005828857422, -98.64797973632812, -94.41590881347656, -90.18382263183594, -85.95175170898438, -81.71967315673828, -77.48759460449219, -73.2555160522461, -69.0234375, -64.7913589477539, -60.55928421020508, -56.327205657958984, -52.095123291015625, -47.86304473876953, -43.63096618652344, -39.398887634277344, -35.16680908203125, -30.93473243713379, -26.702655792236328, -22.470577239990234, -18.23849868774414, -14.006420135498047, -9.77434253692627, -5.542264938354492, -1.3101863861083984, 2.9218921661376953, 7.153968811035156, 11.38604736328125, 15.618133544921875, 19.85021209716797, 24.082290649414062, 28.314367294311523, 32.54644775390625, 36.778526306152344, 41.01060104370117, 45.242679595947266, 49.47475814819336, 53.70683670043945, 57.93891525268555, 62.170989990234375, 66.40306854248047, 70.63514709472656, 74.86722564697266, 79.09930419921875, 83.33138275146484, 87.56346130371094, 91.79553985595703, 96.02761840820312, 100.25969696044922, 104.49177551269531, 108.72384643554688, 112.9559326171875, 117.18800354003906, 121.42008209228516, 125.65216064453125, 129.8842315673828, 134.11631774902344, 138.348388671875, 142.58047485351562, 146.8125457763672, 151.0446319580078]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 8.0, 10.0, 7.0, 7.0, 15.0, 14.0, 21.0, 22.0, 21.0, 20.0, 41.0, 29.0, 31.0, 33.0, 32.0, 52.0, 50.0, 43.0, 65.0, 55.0, 46.0, 41.0, 44.0, 40.0, 35.0, 41.0, 36.0, 18.0, 32.0, 19.0, 19.0, 13.0, 8.0, 8.0, 6.0, 6.0, 5.0, 3.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.234375, -23.384033203125, -22.53369140625, -21.683349609375, -20.8330078125, -19.982666015625, -19.13232421875, -18.281982421875, -17.431640625, -16.581298828125, -15.73095703125, -14.880615234375, -14.0302734375, -13.179931640625, -12.32958984375, -11.479248046875, -10.62890625, -9.778564453125, -8.92822265625, -8.077880859375, -7.2275390625, -6.377197265625, -5.52685546875, -4.676513671875, -3.826171875, -2.975830078125, -2.12548828125, -1.275146484375, -0.4248046875, 0.425537109375, 1.27587890625, 2.126220703125, 2.9765625, 3.826904296875, 4.67724609375, 5.527587890625, 6.3779296875, 7.228271484375, 8.07861328125, 8.928955078125, 9.779296875, 10.629638671875, 11.47998046875, 12.330322265625, 13.1806640625, 14.031005859375, 14.88134765625, 15.731689453125, 16.58203125, 17.432373046875, 18.28271484375, 19.133056640625, 19.9833984375, 20.833740234375, 21.68408203125, 22.534423828125, 23.384765625, 24.235107421875, 25.08544921875, 25.935791015625, 26.7861328125, 27.636474609375, 28.48681640625, 29.337158203125, 30.1875]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 6.0, 18.0, 18.0, 20.0, 28.0, 55.0, 96.0, 108.0, 222.0, 316.0, 498.0, 822.0, 1324.0, 2176.0, 3583.0, 6306.0, 10997.0, 20429.0, 39454.0, 80230.0, 173485.0, 320301.0, 200144.0, 90844.0, 44695.0, 22978.0, 12338.0, 6972.0, 4016.0, 2320.0, 1412.0, 870.0, 515.0, 326.0, 242.0, 123.0, 89.0, 62.0, 35.0, 32.0, 24.0, 8.0, 4.0, 4.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.54296875, -1.4956207275390625, -1.448272705078125, -1.4009246826171875, -1.35357666015625, -1.3062286376953125, -1.258880615234375, -1.2115325927734375, -1.1641845703125, -1.1168365478515625, -1.069488525390625, -1.0221405029296875, -0.97479248046875, -0.9274444580078125, -0.880096435546875, -0.8327484130859375, -0.785400390625, -0.7380523681640625, -0.690704345703125, -0.6433563232421875, -0.59600830078125, -0.5486602783203125, -0.501312255859375, -0.4539642333984375, -0.4066162109375, -0.3592681884765625, -0.311920166015625, -0.2645721435546875, -0.21722412109375, -0.1698760986328125, -0.122528076171875, -0.0751800537109375, -0.02783203125, 0.0195159912109375, 0.066864013671875, 0.1142120361328125, 0.16156005859375, 0.2089080810546875, 0.256256103515625, 0.3036041259765625, 0.3509521484375, 0.3983001708984375, 0.445648193359375, 0.4929962158203125, 0.54034423828125, 0.5876922607421875, 0.635040283203125, 0.6823883056640625, 0.729736328125, 0.7770843505859375, 0.824432373046875, 0.8717803955078125, 0.91912841796875, 0.9664764404296875, 1.013824462890625, 1.0611724853515625, 1.1085205078125, 1.1558685302734375, 1.203216552734375, 1.2505645751953125, 1.29791259765625, 1.3452606201171875, 1.392608642578125, 1.4399566650390625, 1.4873046875]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 2.0, 4.0, 3.0, 7.0, 4.0, 8.0, 10.0, 13.0, 5.0, 11.0, 19.0, 27.0, 31.0, 27.0, 37.0, 25.0, 46.0, 45.0, 40.0, 41.0, 50.0, 35.0, 1070.0, 48.0, 41.0, 43.0, 36.0, 43.0, 31.0, 38.0, 26.0, 30.0, 29.0, 21.0, 12.0, 16.0, 10.0, 14.0, 7.0, 9.0, 2.0, 3.0, 3.0, 4.0, 1.0, 0.0, 4.0, 2.0, 0.0, 2.0], "bins": [-19.375, -18.843017578125, -18.31103515625, -17.779052734375, -17.2470703125, -16.715087890625, -16.18310546875, -15.651123046875, -15.119140625, -14.587158203125, -14.05517578125, -13.523193359375, -12.9912109375, -12.459228515625, -11.92724609375, -11.395263671875, -10.86328125, -10.331298828125, -9.79931640625, -9.267333984375, -8.7353515625, -8.203369140625, -7.67138671875, -7.139404296875, -6.607421875, -6.075439453125, -5.54345703125, -5.011474609375, -4.4794921875, -3.947509765625, -3.41552734375, -2.883544921875, -2.3515625, -1.819580078125, -1.28759765625, -0.755615234375, -0.2236328125, 0.308349609375, 0.84033203125, 1.372314453125, 1.904296875, 2.436279296875, 2.96826171875, 3.500244140625, 4.0322265625, 4.564208984375, 5.09619140625, 5.628173828125, 6.16015625, 6.692138671875, 7.22412109375, 7.756103515625, 8.2880859375, 8.820068359375, 9.35205078125, 9.884033203125, 10.416015625, 10.947998046875, 11.47998046875, 12.011962890625, 12.5439453125, 13.075927734375, 13.60791015625, 14.139892578125, 14.671875]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 5.0, 14.0, 16.0, 22.0, 33.0, 40.0, 68.0, 98.0, 153.0, 246.0, 383.0, 497.0, 715.0, 1075.0, 1577.0, 2392.0, 3434.0, 5229.0, 8080.0, 12744.0, 20119.0, 32511.0, 54576.0, 95883.0, 177710.0, 1297028.0, 162030.0, 86696.0, 50471.0, 30145.0, 18678.0, 11796.0, 7645.0, 4923.0, 3244.0, 2219.0, 1417.0, 1016.0, 701.0, 515.0, 334.0, 210.0, 151.0, 101.0, 70.0, 44.0, 25.0, 22.0, 16.0, 8.0, 5.0, 2.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0], "bins": [-1.083984375, -1.0494842529296875, -1.014984130859375, -0.9804840087890625, -0.94598388671875, -0.9114837646484375, -0.876983642578125, -0.8424835205078125, -0.8079833984375, -0.7734832763671875, -0.738983154296875, -0.7044830322265625, -0.66998291015625, -0.6354827880859375, -0.600982666015625, -0.5664825439453125, -0.531982421875, -0.4974822998046875, -0.462982177734375, -0.4284820556640625, -0.39398193359375, -0.3594818115234375, -0.324981689453125, -0.2904815673828125, -0.2559814453125, -0.2214813232421875, -0.186981201171875, -0.1524810791015625, -0.11798095703125, -0.0834808349609375, -0.048980712890625, -0.0144805908203125, 0.02001953125, 0.0545196533203125, 0.089019775390625, 0.1235198974609375, 0.15802001953125, 0.1925201416015625, 0.227020263671875, 0.2615203857421875, 0.2960205078125, 0.3305206298828125, 0.365020751953125, 0.3995208740234375, 0.43402099609375, 0.4685211181640625, 0.503021240234375, 0.5375213623046875, 0.572021484375, 0.6065216064453125, 0.641021728515625, 0.6755218505859375, 0.71002197265625, 0.7445220947265625, 0.779022216796875, 0.8135223388671875, 0.8480224609375, 0.8825225830078125, 0.917022705078125, 0.9515228271484375, 0.98602294921875, 1.0205230712890625, 1.055023193359375, 1.0895233154296875, 1.1240234375]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 5.0, 3.0, 2.0, 7.0, 5.0, 8.0, 8.0, 9.0, 19.0, 24.0, 25.0, 29.0, 37.0, 46.0, 44.0, 52.0, 61.0, 48.0, 56.0, 63.0, 49.0, 73.0, 57.0, 49.0, 48.0, 27.0, 24.0, 19.0, 18.0, 20.0, 15.0, 7.0, 14.0, 7.0, 3.0, 8.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00559234619140625, -0.00543135404586792, -0.00527036190032959, -0.00510936975479126, -0.00494837760925293, -0.0047873854637146, -0.0046263933181762695, -0.0044654011726379395, -0.004304409027099609, -0.004143416881561279, -0.003982424736022949, -0.003821432590484619, -0.003660440444946289, -0.003499448299407959, -0.003338456153869629, -0.003177464008331299, -0.0030164718627929688, -0.0028554797172546387, -0.0026944875717163086, -0.0025334954261779785, -0.0023725032806396484, -0.0022115111351013184, -0.0020505189895629883, -0.0018895268440246582, -0.0017285346984863281, -0.001567542552947998, -0.001406550407409668, -0.0012455582618713379, -0.0010845661163330078, -0.0009235739707946777, -0.0007625818252563477, -0.0006015896797180176, -0.0004405975341796875, -0.0002796053886413574, -0.00011861324310302734, 4.2378902435302734e-05, 0.0002033710479736328, 0.0003643631935119629, 0.000525355339050293, 0.000686347484588623, 0.0008473396301269531, 0.0010083317756652832, 0.0011693239212036133, 0.0013303160667419434, 0.0014913082122802734, 0.0016523003578186035, 0.0018132925033569336, 0.0019742846488952637, 0.0021352767944335938, 0.002296268939971924, 0.002457261085510254, 0.002618253231048584, 0.002779245376586914, 0.002940237522125244, 0.0031012296676635742, 0.0032622218132019043, 0.0034232139587402344, 0.0035842061042785645, 0.0037451982498168945, 0.0039061903953552246, 0.004067182540893555, 0.004228174686431885, 0.004389166831970215, 0.004550158977508545, 0.004711151123046875]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 5.0, 6.0, 14.0, 8.0, 15.0, 18.0, 13.0, 25.0, 32.0, 47.0, 67.0, 92.0, 144.0, 253.0, 565.0, 15519.0, 1010788.0, 19626.0, 588.0, 252.0, 150.0, 76.0, 68.0, 41.0, 25.0, 36.0, 18.0, 10.0, 13.0, 9.0, 2.0, 5.0, 5.0, 7.0, 3.0, 3.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1038818359375, -0.10036277770996094, -0.09684371948242188, -0.09332466125488281, -0.08980560302734375, -0.08628654479980469, -0.08276748657226562, -0.07924842834472656, -0.0757293701171875, -0.07221031188964844, -0.06869125366210938, -0.06517219543457031, -0.06165313720703125, -0.05813407897949219, -0.054615020751953125, -0.05109596252441406, -0.047576904296875, -0.04405784606933594, -0.040538787841796875, -0.03701972961425781, -0.03350067138671875, -0.029981613159179688, -0.026462554931640625, -0.022943496704101562, -0.0194244384765625, -0.015905380249023438, -0.012386322021484375, -0.008867263793945312, -0.00534820556640625, -0.0018291473388671875, 0.001689910888671875, 0.0052089691162109375, 0.00872802734375, 0.012247085571289062, 0.015766143798828125, 0.019285202026367188, 0.02280426025390625, 0.026323318481445312, 0.029842376708984375, 0.03336143493652344, 0.0368804931640625, 0.04039955139160156, 0.043918609619140625, 0.04743766784667969, 0.05095672607421875, 0.05447578430175781, 0.057994842529296875, 0.06151390075683594, 0.065032958984375, 0.06855201721191406, 0.07207107543945312, 0.07559013366699219, 0.07910919189453125, 0.08262825012207031, 0.08614730834960938, 0.08966636657714844, 0.0931854248046875, 0.09670448303222656, 0.10022354125976562, 0.10374259948730469, 0.10726165771484375, 0.11078071594238281, 0.11429977416992188, 0.11781883239746094, 0.121337890625]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 15.0, 202.0, 601.0, 166.0, 24.0, 5.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00406833877786994, -0.0033215638250112534, -0.0025747891049832106, -0.0018280143849551678, -0.0010812394320964813, -0.0003344644792377949, 0.00041231000795960426, 0.0011590849608182907, 0.0019058599136769772, 0.0026526348665356636, 0.0033994095865637064, 0.004146184306591749, 0.004892959259450436, 0.005639734212309122, 0.006386508699506521, 0.007133283652365208, 0.007880058139562607, 0.008626832626760006, 0.00937360804527998, 0.010120382532477379, 0.010867157950997353, 0.011613932438194752, 0.012360706925392151, 0.013107482343912125, 0.013854257762432098, 0.014601032249629498, 0.015347807668149471, 0.01609458215534687, 0.016841357573866844, 0.01758813112974167, 0.018334906548261642, 0.019081681966781616, 0.01982845738530159, 0.020575232803821564, 0.021322006359696388, 0.022068781778216362, 0.022815557196736336, 0.02356233075261116, 0.024309106171131134, 0.025055881589651108, 0.02580265700817108, 0.026549432426691055, 0.02729620598256588, 0.028042981401085854, 0.028789756819605827, 0.029536530375480652, 0.030283305794000626, 0.0310300812125206, 0.031776852905750275, 0.03252362832427025, 0.03327040374279022, 0.0340171754360199, 0.03476395085453987, 0.035510726273059845, 0.03625750169157982, 0.03700427711009979, 0.037751052528619766, 0.03849782794713974, 0.039244603365659714, 0.03999137878417969, 0.04073815047740936, 0.04148492589592934, 0.04223170131444931, 0.042978476732969284, 0.04372525215148926]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 11.0, 6.0, 13.0, 9.0, 15.0, 17.0, 22.0, 24.0, 27.0, 21.0, 29.0, 35.0, 26.0, 25.0, 33.0, 31.0, 57.0, 44.0, 35.0, 44.0, 44.0, 43.0, 47.0, 42.0, 37.0, 27.0, 30.0, 19.0, 30.0, 17.0, 18.0, 17.0, 24.0, 11.0, 14.0, 11.0, 10.0, 3.0, 6.0, 7.0, 4.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.002600252628326416, -0.0025182142853736877, -0.0024361759424209595, -0.002354137599468231, -0.002272099256515503, -0.0021900609135627747, -0.0021080225706100464, -0.002025984227657318, -0.0019439458847045898, -0.0018619075417518616, -0.0017798691987991333, -0.001697830855846405, -0.0016157925128936768, -0.0015337541699409485, -0.0014517158269882202, -0.001369677484035492, -0.0012876391410827637, -0.0012056007981300354, -0.0011235624551773071, -0.0010415241122245789, -0.0009594857692718506, -0.0008774474263191223, -0.000795409083366394, -0.0007133707404136658, -0.0006313323974609375, -0.0005492940545082092, -0.00046725571155548096, -0.0003852173686027527, -0.0003031790256500244, -0.00022114068269729614, -0.00013910233974456787, -5.70639967918396e-05, 2.4974346160888672e-05, 0.00010701268911361694, 0.00018905103206634521, 0.0002710893750190735, 0.00035312771797180176, 0.00043516606092453003, 0.0005172044038772583, 0.0005992427468299866, 0.0006812810897827148, 0.0007633194327354431, 0.0008453577756881714, 0.0009273961186408997, 0.001009434461593628, 0.0010914728045463562, 0.0011735111474990845, 0.0012555494904518127, 0.001337587833404541, 0.0014196261763572693, 0.0015016645193099976, 0.0015837028622627258, 0.001665741205215454, 0.0017477795481681824, 0.0018298178911209106, 0.001911856234073639, 0.001993894577026367, 0.0020759329199790955, 0.0021579712629318237, 0.002240009605884552, 0.0023220479488372803, 0.0024040862917900085, 0.002486124634742737, 0.002568162977695465, 0.0026502013206481934]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 8.0, 10.0, 7.0, 7.0, 16.0, 14.0, 20.0, 23.0, 20.0, 21.0, 41.0, 29.0, 30.0, 33.0, 34.0, 52.0, 48.0, 43.0, 65.0, 56.0, 45.0, 41.0, 44.0, 40.0, 35.0, 42.0, 35.0, 18.0, 33.0, 18.0, 19.0, 13.0, 8.0, 8.0, 6.0, 6.0, 5.0, 3.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.21875, -23.36865234375, -22.5185546875, -21.66845703125, -20.818359375, -19.96826171875, -19.1181640625, -18.26806640625, -17.41796875, -16.56787109375, -15.7177734375, -14.86767578125, -14.017578125, -13.16748046875, -12.3173828125, -11.46728515625, -10.6171875, -9.76708984375, -8.9169921875, -8.06689453125, -7.216796875, -6.36669921875, -5.5166015625, -4.66650390625, -3.81640625, -2.96630859375, -2.1162109375, -1.26611328125, -0.416015625, 0.43408203125, 1.2841796875, 2.13427734375, 2.984375, 3.83447265625, 4.6845703125, 5.53466796875, 6.384765625, 7.23486328125, 8.0849609375, 8.93505859375, 9.78515625, 10.63525390625, 11.4853515625, 12.33544921875, 13.185546875, 14.03564453125, 14.8857421875, 15.73583984375, 16.5859375, 17.43603515625, 18.2861328125, 19.13623046875, 19.986328125, 20.83642578125, 21.6865234375, 22.53662109375, 23.38671875, 24.23681640625, 25.0869140625, 25.93701171875, 26.787109375, 27.63720703125, 28.4873046875, 29.33740234375, 30.1875]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 8.0, 5.0, 9.0, 10.0, 22.0, 39.0, 42.0, 67.0, 94.0, 129.0, 192.0, 318.0, 464.0, 748.0, 1124.0, 1955.0, 3517.0, 7279.0, 27914.0, 456038.0, 503001.0, 29210.0, 7501.0, 3491.0, 2034.0, 1174.0, 755.0, 454.0, 298.0, 242.0, 133.0, 86.0, 63.0, 36.0, 35.0, 20.0, 12.0, 13.0, 3.0, 6.0, 4.0, 4.0, 6.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.375, -38.14501953125, -36.9150390625, -35.68505859375, -34.455078125, -33.22509765625, -31.9951171875, -30.76513671875, -29.53515625, -28.30517578125, -27.0751953125, -25.84521484375, -24.615234375, -23.38525390625, -22.1552734375, -20.92529296875, -19.6953125, -18.46533203125, -17.2353515625, -16.00537109375, -14.775390625, -13.54541015625, -12.3154296875, -11.08544921875, -9.85546875, -8.62548828125, -7.3955078125, -6.16552734375, -4.935546875, -3.70556640625, -2.4755859375, -1.24560546875, -0.015625, 1.21435546875, 2.4443359375, 3.67431640625, 4.904296875, 6.13427734375, 7.3642578125, 8.59423828125, 9.82421875, 11.05419921875, 12.2841796875, 13.51416015625, 14.744140625, 15.97412109375, 17.2041015625, 18.43408203125, 19.6640625, 20.89404296875, 22.1240234375, 23.35400390625, 24.583984375, 25.81396484375, 27.0439453125, 28.27392578125, 29.50390625, 30.73388671875, 31.9638671875, 33.19384765625, 34.423828125, 35.65380859375, 36.8837890625, 38.11376953125, 39.34375]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 8.0, 6.0, 10.0, 6.0, 8.0, 13.0, 18.0, 20.0, 32.0, 36.0, 30.0, 30.0, 46.0, 51.0, 51.0, 77.0, 91.0, 1796.0, 215.0, 66.0, 72.0, 60.0, 33.0, 44.0, 40.0, 26.0, 28.0, 25.0, 20.0, 20.0, 9.0, 11.0, 16.0, 8.0, 7.0, 6.0, 6.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-89.125, -86.318359375, -83.51171875, -80.705078125, -77.8984375, -75.091796875, -72.28515625, -69.478515625, -66.671875, -63.865234375, -61.05859375, -58.251953125, -55.4453125, -52.638671875, -49.83203125, -47.025390625, -44.21875, -41.412109375, -38.60546875, -35.798828125, -32.9921875, -30.185546875, -27.37890625, -24.572265625, -21.765625, -18.958984375, -16.15234375, -13.345703125, -10.5390625, -7.732421875, -4.92578125, -2.119140625, 0.6875, 3.494140625, 6.30078125, 9.107421875, 11.9140625, 14.720703125, 17.52734375, 20.333984375, 23.140625, 25.947265625, 28.75390625, 31.560546875, 34.3671875, 37.173828125, 39.98046875, 42.787109375, 45.59375, 48.400390625, 51.20703125, 54.013671875, 56.8203125, 59.626953125, 62.43359375, 65.240234375, 68.046875, 70.853515625, 73.66015625, 76.466796875, 79.2734375, 82.080078125, 84.88671875, 87.693359375, 90.5]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 1.0, 2.0, 5.0, 9.0, 6.0, 8.0, 11.0, 13.0, 24.0, 36.0, 38.0, 43.0, 61.0, 88.0, 128.0, 167.0, 263.0, 454.0, 1994.0, 113710.0, 3022741.0, 4343.0, 582.0, 281.0, 179.0, 141.0, 101.0, 75.0, 56.0, 30.0, 28.0, 28.0, 10.0, 13.0, 7.0, 6.0, 6.0, 4.0, 5.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0], "bins": [-290.75, -283.322265625, -275.89453125, -268.466796875, -261.0390625, -253.611328125, -246.18359375, -238.755859375, -231.328125, -223.900390625, -216.47265625, -209.044921875, -201.6171875, -194.189453125, -186.76171875, -179.333984375, -171.90625, -164.478515625, -157.05078125, -149.623046875, -142.1953125, -134.767578125, -127.33984375, -119.912109375, -112.484375, -105.056640625, -97.62890625, -90.201171875, -82.7734375, -75.345703125, -67.91796875, -60.490234375, -53.0625, -45.634765625, -38.20703125, -30.779296875, -23.3515625, -15.923828125, -8.49609375, -1.068359375, 6.359375, 13.787109375, 21.21484375, 28.642578125, 36.0703125, 43.498046875, 50.92578125, 58.353515625, 65.78125, 73.208984375, 80.63671875, 88.064453125, 95.4921875, 102.919921875, 110.34765625, 117.775390625, 125.203125, 132.630859375, 140.05859375, 147.486328125, 154.9140625, 162.341796875, 169.76953125, 177.197265625, 184.625]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 10.0, 26.0, 47.0, 90.0, 194.0, 232.0, 208.0, 115.0, 59.0, 19.0, 7.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-191.43386840820312, -187.41830444335938, -183.40272521972656, -179.3871612548828, -175.37159729003906, -171.35601806640625, -167.3404541015625, -163.32489013671875, -159.309326171875, -155.29376220703125, -151.27818298339844, -147.2626190185547, -143.24705505371094, -139.23147583007812, -135.21591186523438, -131.20034790039062, -127.18476867675781, -123.16919708251953, -119.15363311767578, -115.1380615234375, -111.12249755859375, -107.10692596435547, -103.09135437011719, -99.07579040527344, -95.06021881103516, -91.04464721679688, -87.02908325195312, -83.01351165771484, -78.99794006347656, -74.98237609863281, -70.96680450439453, -66.95123291015625, -62.93565368652344, -58.92008590698242, -54.904518127441406, -50.888946533203125, -46.87337875366211, -42.857810974121094, -38.84223937988281, -34.8266716003418, -30.81110382080078, -26.795536041259766, -22.779966354370117, -18.76439666748047, -14.748828887939453, -10.733261108398438, -6.717691421508789, -2.7021217346191406, 1.313446044921875, 5.329014778137207, 9.344583511352539, 13.360152244567871, 17.375720977783203, 21.39128875732422, 25.406858444213867, 29.422428131103516, 33.43799591064453, 37.45356369018555, 41.46913146972656, 45.484703063964844, 49.50027084350586, 53.515838623046875, 57.531410217285156, 61.54697799682617, 65.56254577636719]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 5.0, 6.0, 3.0, 2.0, 4.0, 6.0, 9.0, 14.0, 5.0, 18.0, 13.0, 12.0, 12.0, 23.0, 17.0, 16.0, 16.0, 31.0, 31.0, 32.0, 34.0, 31.0, 40.0, 30.0, 37.0, 38.0, 34.0, 35.0, 39.0, 46.0, 35.0, 26.0, 38.0, 29.0, 29.0, 30.0, 31.0, 24.0, 23.0, 23.0, 12.0, 12.0, 12.0, 10.0, 6.0, 9.0, 5.0, 6.0, 3.0, 3.0, 5.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-173.79222106933594, -168.29708862304688, -162.80194091796875, -157.3068084716797, -151.81167602539062, -146.31654357910156, -140.8214111328125, -135.32626342773438, -129.8311309814453, -124.33599853515625, -118.84085845947266, -113.34571838378906, -107.8505859375, -102.35545349121094, -96.86031341552734, -91.36517333984375, -85.87004089355469, -80.37490844726562, -74.87976837158203, -69.38462829589844, -63.889495849609375, -58.39435958862305, -52.89922332763672, -47.40408706665039, -41.90895080566406, -36.413814544677734, -30.918678283691406, -25.423542022705078, -19.92840576171875, -14.433269500732422, -8.938133239746094, -3.4429969787597656, 2.0521240234375, 7.547260284423828, 13.042396545410156, 18.537532806396484, 24.032669067382812, 29.52780532836914, 35.02294158935547, 40.5180778503418, 46.013214111328125, 51.50835037231445, 57.00348663330078, 62.49862289428711, 67.99375915527344, 73.4888916015625, 78.9840316772461, 84.47917175292969, 89.97430419921875, 95.46943664550781, 100.9645767211914, 106.459716796875, 111.95484924316406, 117.44998168945312, 122.94512176513672, 128.4402618408203, 133.93539428710938, 139.43052673339844, 144.9256591796875, 150.42080688476562, 155.9159393310547, 161.41107177734375, 166.90621948242188, 172.40135192871094, 177.896484375]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 5.0, 6.0, 8.0, 13.0, 12.0, 18.0, 12.0, 22.0, 23.0, 19.0, 30.0, 33.0, 38.0, 43.0, 37.0, 40.0, 55.0, 54.0, 66.0, 55.0, 48.0, 44.0, 36.0, 49.0, 44.0, 33.0, 28.0, 31.0, 24.0, 15.0, 17.0, 13.0, 12.0, 5.0, 3.0, 3.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.46875, -25.53662109375, -24.6044921875, -23.67236328125, -22.740234375, -21.80810546875, -20.8759765625, -19.94384765625, -19.01171875, -18.07958984375, -17.1474609375, -16.21533203125, -15.283203125, -14.35107421875, -13.4189453125, -12.48681640625, -11.5546875, -10.62255859375, -9.6904296875, -8.75830078125, -7.826171875, -6.89404296875, -5.9619140625, -5.02978515625, -4.09765625, -3.16552734375, -2.2333984375, -1.30126953125, -0.369140625, 0.56298828125, 1.4951171875, 2.42724609375, 3.359375, 4.29150390625, 5.2236328125, 6.15576171875, 7.087890625, 8.02001953125, 8.9521484375, 9.88427734375, 10.81640625, 11.74853515625, 12.6806640625, 13.61279296875, 14.544921875, 15.47705078125, 16.4091796875, 17.34130859375, 18.2734375, 19.20556640625, 20.1376953125, 21.06982421875, 22.001953125, 22.93408203125, 23.8662109375, 24.79833984375, 25.73046875, 26.66259765625, 27.5947265625, 28.52685546875, 29.458984375, 30.39111328125, 31.3232421875, 32.25537109375, 33.1875]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 5.0, 3.0, 1.0, 3.0, 9.0, 11.0, 11.0, 12.0, 27.0, 25.0, 38.0, 32.0, 84.0, 121.0, 151.0, 180.0, 285.0, 540.0, 755.0, 1392.0, 2533.0, 5353.0, 12125.0, 44598.0, 959723.0, 2992231.0, 141810.0, 17173.0, 6999.0, 3420.0, 1791.0, 1017.0, 581.0, 397.0, 267.0, 164.0, 102.0, 78.0, 67.0, 37.0, 27.0, 26.0, 29.0, 14.0, 17.0, 8.0, 3.0, 6.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-59.71875, -57.60205078125, -55.4853515625, -53.36865234375, -51.251953125, -49.13525390625, -47.0185546875, -44.90185546875, -42.78515625, -40.66845703125, -38.5517578125, -36.43505859375, -34.318359375, -32.20166015625, -30.0849609375, -27.96826171875, -25.8515625, -23.73486328125, -21.6181640625, -19.50146484375, -17.384765625, -15.26806640625, -13.1513671875, -11.03466796875, -8.91796875, -6.80126953125, -4.6845703125, -2.56787109375, -0.451171875, 1.66552734375, 3.7822265625, 5.89892578125, 8.015625, 10.13232421875, 12.2490234375, 14.36572265625, 16.482421875, 18.59912109375, 20.7158203125, 22.83251953125, 24.94921875, 27.06591796875, 29.1826171875, 31.29931640625, 33.416015625, 35.53271484375, 37.6494140625, 39.76611328125, 41.8828125, 43.99951171875, 46.1162109375, 48.23291015625, 50.349609375, 52.46630859375, 54.5830078125, 56.69970703125, 58.81640625, 60.93310546875, 63.0498046875, 65.16650390625, 67.283203125, 69.39990234375, 71.5166015625, 73.63330078125, 75.75]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 6.0, 6.0, 9.0, 10.0, 8.0, 13.0, 19.0, 31.0, 48.0, 72.0, 127.0, 265.0, 587.0, 1120.0, 853.0, 434.0, 187.0, 78.0, 58.0, 43.0, 26.0, 21.0, 14.0, 8.0, 7.0, 7.0, 9.0, 3.0, 1.0, 6.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.59375, -53.51611328125, -51.4384765625, -49.36083984375, -47.283203125, -45.20556640625, -43.1279296875, -41.05029296875, -38.97265625, -36.89501953125, -34.8173828125, -32.73974609375, -30.662109375, -28.58447265625, -26.5068359375, -24.42919921875, -22.3515625, -20.27392578125, -18.1962890625, -16.11865234375, -14.041015625, -11.96337890625, -9.8857421875, -7.80810546875, -5.73046875, -3.65283203125, -1.5751953125, 0.50244140625, 2.580078125, 4.65771484375, 6.7353515625, 8.81298828125, 10.890625, 12.96826171875, 15.0458984375, 17.12353515625, 19.201171875, 21.27880859375, 23.3564453125, 25.43408203125, 27.51171875, 29.58935546875, 31.6669921875, 33.74462890625, 35.822265625, 37.89990234375, 39.9775390625, 42.05517578125, 44.1328125, 46.21044921875, 48.2880859375, 50.36572265625, 52.443359375, 54.52099609375, 56.5986328125, 58.67626953125, 60.75390625, 62.83154296875, 64.9091796875, 66.98681640625, 69.064453125, 71.14208984375, 73.2197265625, 75.29736328125, 77.375]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 7.0, 11.0, 10.0, 11.0, 17.0, 26.0, 43.0, 81.0, 132.0, 249.0, 738.0, 2732.0, 15443.0, 807929.0, 3340128.0, 21820.0, 3375.0, 867.0, 318.0, 136.0, 76.0, 50.0, 21.0, 13.0, 14.0, 11.0, 11.0, 6.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-236.5, -230.12109375, -223.7421875, -217.36328125, -210.984375, -204.60546875, -198.2265625, -191.84765625, -185.46875, -179.08984375, -172.7109375, -166.33203125, -159.953125, -153.57421875, -147.1953125, -140.81640625, -134.4375, -128.05859375, -121.6796875, -115.30078125, -108.921875, -102.54296875, -96.1640625, -89.78515625, -83.40625, -77.02734375, -70.6484375, -64.26953125, -57.890625, -51.51171875, -45.1328125, -38.75390625, -32.375, -25.99609375, -19.6171875, -13.23828125, -6.859375, -0.48046875, 5.8984375, 12.27734375, 18.65625, 25.03515625, 31.4140625, 37.79296875, 44.171875, 50.55078125, 56.9296875, 63.30859375, 69.6875, 76.06640625, 82.4453125, 88.82421875, 95.203125, 101.58203125, 107.9609375, 114.33984375, 120.71875, 127.09765625, 133.4765625, 139.85546875, 146.234375, 152.61328125, 158.9921875, 165.37109375, 171.75]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 3.0, 4.0, 10.0, 9.0, 5.0, 13.0, 9.0, 17.0, 19.0, 42.0, 34.0, 46.0, 87.0, 79.0, 106.0, 95.0, 86.0, 64.0, 59.0, 44.0, 38.0, 33.0, 16.0, 13.0, 17.0, 12.0, 8.0, 5.0, 8.0, 7.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-117.79104614257812, -113.89295959472656, -109.994873046875, -106.09678649902344, -102.19869995117188, -98.30061340332031, -94.40252685546875, -90.50444030761719, -86.60635375976562, -82.70826721191406, -78.8101806640625, -74.91209411621094, -71.01400756835938, -67.11592102050781, -63.21783447265625, -59.31974792480469, -55.42166519165039, -51.52357864379883, -47.625492095947266, -43.7274055480957, -39.82931900024414, -35.931236267089844, -32.03314971923828, -28.135061264038086, -24.236974716186523, -20.33888816833496, -16.4408016204834, -12.542716026306152, -8.64462947845459, -4.746543884277344, -0.8484573364257812, 3.0496292114257812, 6.947715759277344, 10.845802307128906, 14.743888854980469, 18.64197540283203, 22.540061950683594, 26.438146591186523, 30.336233139038086, 34.23432159423828, 38.132408142089844, 42.030494689941406, 45.92858123779297, 49.82666778564453, 53.724754333496094, 57.622840881347656, 61.52092742919922, 65.41901397705078, 69.31709289550781, 73.21517944335938, 77.11326599121094, 81.0113525390625, 84.90943908691406, 88.80752563476562, 92.70561218261719, 96.60369873046875, 100.50178527832031, 104.39987182617188, 108.29795837402344, 112.196044921875, 116.09413146972656, 119.99221801757812, 123.89030456542969, 127.78839111328125, 131.6864776611328]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 2.0, 7.0, 8.0, 4.0, 1.0, 8.0, 4.0, 12.0, 17.0, 12.0, 13.0, 21.0, 18.0, 19.0, 22.0, 21.0, 29.0, 26.0, 34.0, 37.0, 27.0, 36.0, 34.0, 31.0, 32.0, 40.0, 33.0, 26.0, 30.0, 31.0, 50.0, 31.0, 31.0, 26.0, 25.0, 18.0, 18.0, 19.0, 23.0, 28.0, 24.0, 18.0, 10.0, 6.0, 11.0, 9.0, 9.0, 7.0, 4.0, 3.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-109.8528823852539, -106.22437286376953, -102.59586334228516, -98.96735382080078, -95.3388442993164, -91.71033477783203, -88.08183288574219, -84.45332336425781, -80.82481384277344, -77.19630432128906, -73.56779479980469, -69.93928527832031, -66.31077575683594, -62.68226623535156, -59.05376052856445, -55.42525100708008, -51.79673767089844, -48.16822814941406, -44.53971862792969, -40.91120910644531, -37.28269958496094, -33.65419006347656, -30.025684356689453, -26.397174835205078, -22.768665313720703, -19.140155792236328, -15.51164722442627, -11.883138656616211, -8.254629135131836, -4.626119613647461, -0.9976119995117188, 2.6308975219726562, 6.2594146728515625, 9.887924194335938, 13.516432762145996, 17.144941329956055, 20.77345085144043, 24.401960372924805, 28.030467987060547, 31.658977508544922, 35.2874870300293, 38.91599655151367, 42.54450607299805, 46.173011779785156, 49.80152130126953, 53.430030822753906, 57.05854034423828, 60.687049865722656, 64.31555938720703, 67.9440689086914, 71.57257843017578, 75.20108795166016, 78.82959747314453, 82.4581069946289, 86.08660888671875, 89.71511840820312, 93.3436279296875, 96.97213745117188, 100.60064697265625, 104.22915649414062, 107.857666015625, 111.48617553710938, 115.11468505859375, 118.74319458007812, 122.3717041015625]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 4.0, 6.0, 4.0, 12.0, 9.0, 13.0, 11.0, 15.0, 20.0, 21.0, 21.0, 24.0, 28.0, 27.0, 30.0, 30.0, 37.0, 46.0, 42.0, 49.0, 44.0, 49.0, 53.0, 45.0, 48.0, 36.0, 43.0, 35.0, 22.0, 33.0, 29.0, 21.0, 22.0, 12.0, 11.0, 8.0, 12.0, 4.0, 7.0, 7.0, 4.0, 4.0, 6.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.40625, -21.6298828125, -20.853515625, -20.0771484375, -19.30078125, -18.5244140625, -17.748046875, -16.9716796875, -16.1953125, -15.4189453125, -14.642578125, -13.8662109375, -13.08984375, -12.3134765625, -11.537109375, -10.7607421875, -9.984375, -9.2080078125, -8.431640625, -7.6552734375, -6.87890625, -6.1025390625, -5.326171875, -4.5498046875, -3.7734375, -2.9970703125, -2.220703125, -1.4443359375, -0.66796875, 0.1083984375, 0.884765625, 1.6611328125, 2.4375, 3.2138671875, 3.990234375, 4.7666015625, 5.54296875, 6.3193359375, 7.095703125, 7.8720703125, 8.6484375, 9.4248046875, 10.201171875, 10.9775390625, 11.75390625, 12.5302734375, 13.306640625, 14.0830078125, 14.859375, 15.6357421875, 16.412109375, 17.1884765625, 17.96484375, 18.7412109375, 19.517578125, 20.2939453125, 21.0703125, 21.8466796875, 22.623046875, 23.3994140625, 24.17578125, 24.9521484375, 25.728515625, 26.5048828125, 27.28125]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 4.0, 7.0, 10.0, 21.0, 27.0, 36.0, 69.0, 93.0, 137.0, 216.0, 327.0, 423.0, 685.0, 1095.0, 1614.0, 2463.0, 3920.0, 6189.0, 9925.0, 16158.0, 27052.0, 46040.0, 82163.0, 154382.0, 254706.0, 195557.0, 103829.0, 57121.0, 32507.0, 19286.0, 11733.0, 7326.0, 4729.0, 2961.0, 1947.0, 1285.0, 877.0, 557.0, 361.0, 257.0, 150.0, 103.0, 79.0, 49.0, 23.0, 24.0, 14.0, 10.0, 4.0, 5.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1416015625, -1.104400634765625, -1.06719970703125, -1.029998779296875, -0.9927978515625, -0.955596923828125, -0.91839599609375, -0.881195068359375, -0.843994140625, -0.806793212890625, -0.76959228515625, -0.732391357421875, -0.6951904296875, -0.657989501953125, -0.62078857421875, -0.583587646484375, -0.54638671875, -0.509185791015625, -0.47198486328125, -0.434783935546875, -0.3975830078125, -0.360382080078125, -0.32318115234375, -0.285980224609375, -0.248779296875, -0.211578369140625, -0.17437744140625, -0.137176513671875, -0.0999755859375, -0.062774658203125, -0.02557373046875, 0.011627197265625, 0.048828125, 0.086029052734375, 0.12322998046875, 0.160430908203125, 0.1976318359375, 0.234832763671875, 0.27203369140625, 0.309234619140625, 0.346435546875, 0.383636474609375, 0.42083740234375, 0.458038330078125, 0.4952392578125, 0.532440185546875, 0.56964111328125, 0.606842041015625, 0.64404296875, 0.681243896484375, 0.71844482421875, 0.755645751953125, 0.7928466796875, 0.830047607421875, 0.86724853515625, 0.904449462890625, 0.941650390625, 0.978851318359375, 1.01605224609375, 1.053253173828125, 1.0904541015625, 1.127655029296875, 1.16485595703125, 1.202056884765625, 1.2392578125]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 6.0, 11.0, 8.0, 8.0, 13.0, 23.0, 18.0, 15.0, 23.0, 18.0, 28.0, 26.0, 33.0, 31.0, 36.0, 34.0, 42.0, 48.0, 46.0, 1064.0, 37.0, 37.0, 36.0, 38.0, 40.0, 38.0, 33.0, 33.0, 30.0, 25.0, 23.0, 16.0, 17.0, 17.0, 17.0, 11.0, 6.0, 8.0, 3.0, 3.0, 7.0, 6.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.78125, -14.322265625, -13.86328125, -13.404296875, -12.9453125, -12.486328125, -12.02734375, -11.568359375, -11.109375, -10.650390625, -10.19140625, -9.732421875, -9.2734375, -8.814453125, -8.35546875, -7.896484375, -7.4375, -6.978515625, -6.51953125, -6.060546875, -5.6015625, -5.142578125, -4.68359375, -4.224609375, -3.765625, -3.306640625, -2.84765625, -2.388671875, -1.9296875, -1.470703125, -1.01171875, -0.552734375, -0.09375, 0.365234375, 0.82421875, 1.283203125, 1.7421875, 2.201171875, 2.66015625, 3.119140625, 3.578125, 4.037109375, 4.49609375, 4.955078125, 5.4140625, 5.873046875, 6.33203125, 6.791015625, 7.25, 7.708984375, 8.16796875, 8.626953125, 9.0859375, 9.544921875, 10.00390625, 10.462890625, 10.921875, 11.380859375, 11.83984375, 12.298828125, 12.7578125, 13.216796875, 13.67578125, 14.134765625, 14.59375]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 6.0, 15.0, 10.0, 23.0, 28.0, 48.0, 91.0, 94.0, 116.0, 139.0, 244.0, 354.0, 486.0, 646.0, 912.0, 1205.0, 1756.0, 2516.0, 3603.0, 5046.0, 7123.0, 10030.0, 14713.0, 21393.0, 32197.0, 49692.0, 80094.0, 134422.0, 1254787.0, 177852.0, 105967.0, 64289.0, 40538.0, 26905.0, 17950.0, 12380.0, 8708.0, 5916.0, 4365.0, 2999.0, 2123.0, 1513.0, 1097.0, 763.0, 557.0, 430.0, 285.0, 187.0, 175.0, 116.0, 73.0, 49.0, 41.0, 22.0, 13.0, 11.0, 10.0, 5.0, 6.0, 9.0], "bins": [-0.89501953125, -0.8677139282226562, -0.8404083251953125, -0.8131027221679688, -0.785797119140625, -0.7584915161132812, -0.7311859130859375, -0.7038803100585938, -0.67657470703125, -0.6492691040039062, -0.6219635009765625, -0.5946578979492188, -0.567352294921875, -0.5400466918945312, -0.5127410888671875, -0.48543548583984375, -0.4581298828125, -0.43082427978515625, -0.4035186767578125, -0.37621307373046875, -0.348907470703125, -0.32160186767578125, -0.2942962646484375, -0.26699066162109375, -0.23968505859375, -0.21237945556640625, -0.1850738525390625, -0.15776824951171875, -0.130462646484375, -0.10315704345703125, -0.0758514404296875, -0.04854583740234375, -0.021240234375, 0.00606536865234375, 0.0333709716796875, 0.06067657470703125, 0.087982177734375, 0.11528778076171875, 0.1425933837890625, 0.16989898681640625, 0.19720458984375, 0.22451019287109375, 0.2518157958984375, 0.27912139892578125, 0.306427001953125, 0.33373260498046875, 0.3610382080078125, 0.38834381103515625, 0.4156494140625, 0.44295501708984375, 0.4702606201171875, 0.49756622314453125, 0.524871826171875, 0.5521774291992188, 0.5794830322265625, 0.6067886352539062, 0.63409423828125, 0.6613998413085938, 0.6887054443359375, 0.7160110473632812, 0.743316650390625, 0.7706222534179688, 0.7979278564453125, 0.8252334594726562, 0.8525390625]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 1.0, 4.0, 1.0, 4.0, 5.0, 7.0, 12.0, 12.0, 11.0, 24.0, 13.0, 21.0, 33.0, 23.0, 34.0, 34.0, 30.0, 42.0, 53.0, 48.0, 46.0, 63.0, 49.0, 57.0, 35.0, 44.0, 35.0, 35.0, 28.0, 36.0, 33.0, 34.0, 15.0, 14.0, 12.0, 8.0, 10.0, 10.0, 5.0, 5.0, 6.0, 1.0, 5.0, 4.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004241943359375, -0.004106760025024414, -0.003971576690673828, -0.003836393356323242, -0.0037012100219726562, -0.0035660266876220703, -0.0034308433532714844, -0.0032956600189208984, -0.0031604766845703125, -0.0030252933502197266, -0.0028901100158691406, -0.0027549266815185547, -0.0026197433471679688, -0.002484560012817383, -0.002349376678466797, -0.002214193344116211, -0.002079010009765625, -0.001943826675415039, -0.0018086433410644531, -0.0016734600067138672, -0.0015382766723632812, -0.0014030933380126953, -0.0012679100036621094, -0.0011327266693115234, -0.0009975433349609375, -0.0008623600006103516, -0.0007271766662597656, -0.0005919933319091797, -0.00045680999755859375, -0.0003216266632080078, -0.00018644332885742188, -5.125999450683594e-05, 8.392333984375e-05, 0.00021910667419433594, 0.0003542900085449219, 0.0004894733428955078, 0.0006246566772460938, 0.0007598400115966797, 0.0008950233459472656, 0.0010302066802978516, 0.0011653900146484375, 0.0013005733489990234, 0.0014357566833496094, 0.0015709400177001953, 0.0017061233520507812, 0.0018413066864013672, 0.001976490020751953, 0.002111673355102539, 0.002246856689453125, 0.002382040023803711, 0.002517223358154297, 0.002652406692504883, 0.0027875900268554688, 0.0029227733612060547, 0.0030579566955566406, 0.0031931400299072266, 0.0033283233642578125, 0.0034635066986083984, 0.0035986900329589844, 0.0037338733673095703, 0.0038690567016601562, 0.004004240036010742, 0.004139423370361328, 0.004274606704711914, 0.0044097900390625]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 4.0, 3.0, 5.0, 5.0, 3.0, 7.0, 14.0, 11.0, 11.0, 13.0, 17.0, 29.0, 39.0, 46.0, 43.0, 64.0, 90.0, 110.0, 164.0, 336.0, 1209.0, 57666.0, 967072.0, 19913.0, 817.0, 280.0, 141.0, 106.0, 75.0, 51.0, 47.0, 37.0, 29.0, 21.0, 19.0, 17.0, 10.0, 12.0, 8.0, 4.0, 2.0, 5.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08831787109375, -0.08550453186035156, -0.08269119262695312, -0.07987785339355469, -0.07706451416015625, -0.07425117492675781, -0.07143783569335938, -0.06862449645996094, -0.0658111572265625, -0.06299781799316406, -0.060184478759765625, -0.05737113952636719, -0.05455780029296875, -0.05174446105957031, -0.048931121826171875, -0.04611778259277344, -0.043304443359375, -0.04049110412597656, -0.037677764892578125, -0.03486442565917969, -0.03205108642578125, -0.029237747192382812, -0.026424407958984375, -0.023611068725585938, -0.0207977294921875, -0.017984390258789062, -0.015171051025390625, -0.012357711791992188, -0.00954437255859375, -0.0067310333251953125, -0.003917694091796875, -0.0011043548583984375, 0.001708984375, 0.0045223236083984375, 0.007335662841796875, 0.010149002075195312, 0.01296234130859375, 0.015775680541992188, 0.018589019775390625, 0.021402359008789062, 0.0242156982421875, 0.027029037475585938, 0.029842376708984375, 0.03265571594238281, 0.03546905517578125, 0.03828239440917969, 0.041095733642578125, 0.04390907287597656, 0.046722412109375, 0.04953575134277344, 0.052349090576171875, 0.05516242980957031, 0.05797576904296875, 0.06078910827636719, 0.06360244750976562, 0.06641578674316406, 0.0692291259765625, 0.07204246520996094, 0.07485580444335938, 0.07766914367675781, 0.08048248291015625, 0.08329582214355469, 0.08610916137695312, 0.08892250061035156, 0.09173583984375]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 4.0, 10.0, 12.0, 18.0, 41.0, 68.0, 60.0, 121.0, 142.0, 162.0, 124.0, 99.0, 59.0, 29.0, 22.0, 11.0, 12.0, 6.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0022897045128047466, -0.0021149171516299248, -0.0019401300232857466, -0.0017653426621109247, -0.0015905554173514247, -0.0014157681725919247, -0.0012409808114171028, -0.0010661935666576028, -0.0008914063218981028, -0.0007166190771386027, -0.0005418317741714418, -0.00036704447120428085, -0.00019225722644478083, -1.74699816852808e-05, 0.00015731737948954105, 0.0003321046242490411, 0.0005068918690085411, 0.0006816791137680411, 0.0008564664167352021, 0.001031253719702363, 0.001206040964461863, 0.001380828209221363, 0.001555615570396185, 0.001730402815155685, 0.001905190059915185, 0.002079977421090007, 0.002254764549434185, 0.002429551910609007, 0.0026043392717838287, 0.002779126400128007, 0.002953913761302829, 0.003128700889647007, 0.003303488716483116, 0.003478276077657938, 0.003653063206002116, 0.003827850567176938, 0.004002637695521116, 0.004177425056695938, 0.00435221241787076, 0.004526999779045582, 0.004701786674559116, 0.004876574035733938, 0.00505136139690876, 0.005226148292422295, 0.0054009356535971165, 0.005575723014771938, 0.00575051037594676, 0.005925297737121582, 0.006100085098296404, 0.006274872459471226, 0.006449659820646048, 0.0066244471818208694, 0.006799234077334404, 0.006974021438509226, 0.007148808799684048, 0.0073235961608588696, 0.007498383522033691, 0.007673170883208513, 0.007847958244383335, 0.00802274513989687, 0.008197532966732979, 0.008372319862246513, 0.008547106757760048, 0.008721894584596157, 0.008896681480109692]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 3.0, 4.0, 7.0, 2.0, 11.0, 8.0, 15.0, 10.0, 13.0, 14.0, 28.0, 15.0, 32.0, 30.0, 40.0, 32.0, 31.0, 26.0, 36.0, 38.0, 44.0, 38.0, 41.0, 42.0, 36.0, 40.0, 40.0, 37.0, 26.0, 34.0, 22.0, 27.0, 28.0, 28.0, 25.0, 24.0, 15.0, 12.0, 16.0, 8.0, 6.0, 5.0, 6.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0025544166564941406, -0.0024745389819145203, -0.0023946613073349, -0.0023147836327552795, -0.002234905958175659, -0.002155028283596039, -0.0020751506090164185, -0.001995272934436798, -0.0019153952598571777, -0.0018355175852775574, -0.001755639910697937, -0.0016757622361183167, -0.0015958845615386963, -0.001516006886959076, -0.0014361292123794556, -0.0013562515377998352, -0.0012763738632202148, -0.0011964961886405945, -0.0011166185140609741, -0.0010367408394813538, -0.0009568631649017334, -0.000876985490322113, -0.0007971078157424927, -0.0007172301411628723, -0.000637352466583252, -0.0005574747920036316, -0.00047759711742401123, -0.00039771944284439087, -0.0003178417682647705, -0.00023796409368515015, -0.00015808641910552979, -7.820874452590942e-05, 1.6689300537109375e-06, 8.15466046333313e-05, 0.00016142427921295166, 0.00024130195379257202, 0.0003211796283721924, 0.00040105730295181274, 0.0004809349775314331, 0.0005608126521110535, 0.0006406903266906738, 0.0007205680012702942, 0.0008004456758499146, 0.0008803233504295349, 0.0009602010250091553, 0.0010400786995887756, 0.001119956374168396, 0.0011998340487480164, 0.0012797117233276367, 0.001359589397907257, 0.0014394670724868774, 0.0015193447470664978, 0.0015992224216461182, 0.0016791000962257385, 0.0017589777708053589, 0.0018388554453849792, 0.0019187331199645996, 0.00199861079454422, 0.0020784884691238403, 0.0021583661437034607, 0.002238243818283081, 0.0023181214928627014, 0.0023979991674423218, 0.002477876842021942, 0.0025577545166015625]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 4.0, 6.0, 4.0, 12.0, 9.0, 13.0, 11.0, 15.0, 20.0, 21.0, 21.0, 24.0, 28.0, 27.0, 30.0, 30.0, 37.0, 46.0, 42.0, 49.0, 44.0, 49.0, 53.0, 45.0, 48.0, 36.0, 43.0, 35.0, 22.0, 33.0, 29.0, 21.0, 22.0, 12.0, 11.0, 8.0, 12.0, 4.0, 7.0, 7.0, 4.0, 4.0, 6.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.40625, -21.6298828125, -20.853515625, -20.0771484375, -19.30078125, -18.5244140625, -17.748046875, -16.9716796875, -16.1953125, -15.4189453125, -14.642578125, -13.8662109375, -13.08984375, -12.3134765625, -11.537109375, -10.7607421875, -9.984375, -9.2080078125, -8.431640625, -7.6552734375, -6.87890625, -6.1025390625, -5.326171875, -4.5498046875, -3.7734375, -2.9970703125, -2.220703125, -1.4443359375, -0.66796875, 0.1083984375, 0.884765625, 1.6611328125, 2.4375, 3.2138671875, 3.990234375, 4.7666015625, 5.54296875, 6.3193359375, 7.095703125, 7.8720703125, 8.6484375, 9.4248046875, 10.201171875, 10.9775390625, 11.75390625, 12.5302734375, 13.306640625, 14.0830078125, 14.859375, 15.6357421875, 16.412109375, 17.1884765625, 17.96484375, 18.7412109375, 19.517578125, 20.2939453125, 21.0703125, 21.8466796875, 22.623046875, 23.3994140625, 24.17578125, 24.9521484375, 25.728515625, 26.5048828125, 27.28125]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 7.0, 6.0, 11.0, 13.0, 25.0, 17.0, 36.0, 37.0, 62.0, 90.0, 108.0, 148.0, 168.0, 252.0, 342.0, 457.0, 571.0, 769.0, 1063.0, 1496.0, 2501.0, 4654.0, 10659.0, 38832.0, 337601.0, 567645.0, 53691.0, 13081.0, 5374.0, 2681.0, 1708.0, 1223.0, 784.0, 627.0, 483.0, 322.0, 278.0, 188.0, 141.0, 107.0, 75.0, 64.0, 58.0, 24.0, 25.0, 19.0, 13.0, 14.0, 2.0, 6.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-25.25, -24.43798828125, -23.6259765625, -22.81396484375, -22.001953125, -21.18994140625, -20.3779296875, -19.56591796875, -18.75390625, -17.94189453125, -17.1298828125, -16.31787109375, -15.505859375, -14.69384765625, -13.8818359375, -13.06982421875, -12.2578125, -11.44580078125, -10.6337890625, -9.82177734375, -9.009765625, -8.19775390625, -7.3857421875, -6.57373046875, -5.76171875, -4.94970703125, -4.1376953125, -3.32568359375, -2.513671875, -1.70166015625, -0.8896484375, -0.07763671875, 0.734375, 1.54638671875, 2.3583984375, 3.17041015625, 3.982421875, 4.79443359375, 5.6064453125, 6.41845703125, 7.23046875, 8.04248046875, 8.8544921875, 9.66650390625, 10.478515625, 11.29052734375, 12.1025390625, 12.91455078125, 13.7265625, 14.53857421875, 15.3505859375, 16.16259765625, 16.974609375, 17.78662109375, 18.5986328125, 19.41064453125, 20.22265625, 21.03466796875, 21.8466796875, 22.65869140625, 23.470703125, 24.28271484375, 25.0947265625, 25.90673828125, 26.71875]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 3.0, 9.0, 6.0, 6.0, 8.0, 6.0, 11.0, 14.0, 13.0, 27.0, 18.0, 31.0, 25.0, 21.0, 23.0, 38.0, 25.0, 36.0, 37.0, 44.0, 44.0, 152.0, 1814.0, 185.0, 39.0, 41.0, 44.0, 34.0, 29.0, 28.0, 35.0, 30.0, 23.0, 22.0, 23.0, 16.0, 12.0, 14.0, 10.0, 6.0, 11.0, 8.0, 5.0, 7.0, 2.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-63.53125, -61.52001953125, -59.5087890625, -57.49755859375, -55.486328125, -53.47509765625, -51.4638671875, -49.45263671875, -47.44140625, -45.43017578125, -43.4189453125, -41.40771484375, -39.396484375, -37.38525390625, -35.3740234375, -33.36279296875, -31.3515625, -29.34033203125, -27.3291015625, -25.31787109375, -23.306640625, -21.29541015625, -19.2841796875, -17.27294921875, -15.26171875, -13.25048828125, -11.2392578125, -9.22802734375, -7.216796875, -5.20556640625, -3.1943359375, -1.18310546875, 0.828125, 2.83935546875, 4.8505859375, 6.86181640625, 8.873046875, 10.88427734375, 12.8955078125, 14.90673828125, 16.91796875, 18.92919921875, 20.9404296875, 22.95166015625, 24.962890625, 26.97412109375, 28.9853515625, 30.99658203125, 33.0078125, 35.01904296875, 37.0302734375, 39.04150390625, 41.052734375, 43.06396484375, 45.0751953125, 47.08642578125, 49.09765625, 51.10888671875, 53.1201171875, 55.13134765625, 57.142578125, 59.15380859375, 61.1650390625, 63.17626953125, 65.1875]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 8.0, 3.0, 8.0, 9.0, 20.0, 23.0, 27.0, 38.0, 71.0, 107.0, 143.0, 232.0, 541.0, 3212.0, 3122161.0, 17284.0, 906.0, 322.0, 205.0, 104.0, 82.0, 62.0, 49.0, 25.0, 18.0, 11.0, 13.0, 3.0, 4.0, 5.0, 3.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-218.25, -210.375, -202.5, -194.625, -186.75, -178.875, -171.0, -163.125, -155.25, -147.375, -139.5, -131.625, -123.75, -115.875, -108.0, -100.125, -92.25, -84.375, -76.5, -68.625, -60.75, -52.875, -45.0, -37.125, -29.25, -21.375, -13.5, -5.625, 2.25, 10.125, 18.0, 25.875, 33.75, 41.625, 49.5, 57.375, 65.25, 73.125, 81.0, 88.875, 96.75, 104.625, 112.5, 120.375, 128.25, 136.125, 144.0, 151.875, 159.75, 167.625, 175.5, 183.375, 191.25, 199.125, 207.0, 214.875, 222.75, 230.625, 238.5, 246.375, 254.25, 262.125, 270.0, 277.875, 285.75]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 3.0, 10.0, 12.0, 34.0, 40.0, 82.0, 117.0, 175.0, 182.0, 156.0, 94.0, 53.0, 21.0, 10.0, 10.0, 3.0, 2.0, 7.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.06866455078125, -102.8968734741211, -100.72508239746094, -98.55329895019531, -96.38150787353516, -94.209716796875, -92.03792572021484, -89.86613464355469, -87.69435119628906, -85.5225601196289, -83.35076904296875, -81.17898559570312, -79.00719451904297, -76.83540344238281, -74.66361236572266, -72.4918212890625, -70.32003021240234, -68.14823913574219, -65.97644805908203, -63.80466079711914, -61.63287353515625, -59.461082458496094, -57.28929138183594, -55.11750030517578, -52.94571304321289, -50.773921966552734, -48.602134704589844, -46.43034362792969, -44.25855255126953, -42.08676528930664, -39.914974212646484, -37.743186950683594, -35.57139205932617, -33.399600982666016, -31.227813720703125, -29.05602264404297, -26.884233474731445, -24.712444305419922, -22.540653228759766, -20.368864059448242, -18.19707489013672, -16.025285720825195, -13.853495597839355, -11.681705474853516, -9.509916305541992, -7.338127136230469, -5.166337013244629, -2.994546890258789, -0.8227577209472656, 1.349031925201416, 3.5208215713500977, 5.692611217498779, 7.864400863647461, 10.036190032958984, 12.207980155944824, 14.379770278930664, 16.551559448242188, 18.72334861755371, 20.895137786865234, 23.06692886352539, 25.238718032836914, 27.410507202148438, 29.582298278808594, 31.754087448120117, 33.92587661743164]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 2.0, 2.0, 5.0, 5.0, 10.0, 6.0, 10.0, 10.0, 6.0, 10.0, 8.0, 14.0, 13.0, 18.0, 16.0, 20.0, 24.0, 24.0, 20.0, 36.0, 23.0, 44.0, 40.0, 37.0, 37.0, 26.0, 33.0, 38.0, 31.0, 36.0, 36.0, 40.0, 21.0, 27.0, 28.0, 21.0, 21.0, 36.0, 29.0, 23.0, 16.0, 18.0, 6.0, 15.0, 13.0, 9.0, 12.0, 5.0, 7.0, 3.0, 7.0, 4.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-143.6927490234375, -139.14691162109375, -134.60105895996094, -130.0552215576172, -125.50936889648438, -120.9635238647461, -116.41767883300781, -111.87184143066406, -107.32598876953125, -102.78014373779297, -98.23429870605469, -93.6884536743164, -89.14260864257812, -84.59676361083984, -80.05091857910156, -75.50508117675781, -70.95923614501953, -66.41339111328125, -61.86754608154297, -57.32170104980469, -52.775856018066406, -48.230010986328125, -43.68416976928711, -39.13832473754883, -34.59247970581055, -30.046634674072266, -25.500789642333984, -20.954946517944336, -16.409101486206055, -11.863256454467773, -7.317413330078125, -2.7715682983398438, 1.7742767333984375, 6.3201212882995605, 10.865965843200684, 15.411809921264648, 19.95765495300293, 24.50349998474121, 29.04934310913086, 33.59518814086914, 38.14103317260742, 42.6868782043457, 47.232723236083984, 51.778564453125, 56.32440948486328, 60.87025451660156, 65.41609954833984, 69.96194458007812, 74.5077896118164, 79.05363464355469, 83.59947967529297, 88.14532470703125, 92.69116973876953, 97.23701477050781, 101.78285217285156, 106.32870483398438, 110.87454223632812, 115.4203872680664, 119.96623229980469, 124.51207733154297, 129.05792236328125, 133.603759765625, 138.1496124267578, 142.69544982910156, 147.24130249023438]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 2.0, 4.0, 1.0, 8.0, 7.0, 9.0, 13.0, 15.0, 16.0, 14.0, 25.0, 21.0, 16.0, 29.0, 28.0, 31.0, 33.0, 38.0, 45.0, 44.0, 42.0, 53.0, 48.0, 46.0, 50.0, 48.0, 37.0, 43.0, 34.0, 27.0, 39.0, 27.0, 16.0, 20.0, 11.0, 14.0, 9.0, 9.0, 10.0, 9.0, 5.0, 4.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.546875, -23.729736328125, -22.91259765625, -22.095458984375, -21.2783203125, -20.461181640625, -19.64404296875, -18.826904296875, -18.009765625, -17.192626953125, -16.37548828125, -15.558349609375, -14.7412109375, -13.924072265625, -13.10693359375, -12.289794921875, -11.47265625, -10.655517578125, -9.83837890625, -9.021240234375, -8.2041015625, -7.386962890625, -6.56982421875, -5.752685546875, -4.935546875, -4.118408203125, -3.30126953125, -2.484130859375, -1.6669921875, -0.849853515625, -0.03271484375, 0.784423828125, 1.6015625, 2.418701171875, 3.23583984375, 4.052978515625, 4.8701171875, 5.687255859375, 6.50439453125, 7.321533203125, 8.138671875, 8.955810546875, 9.77294921875, 10.590087890625, 11.4072265625, 12.224365234375, 13.04150390625, 13.858642578125, 14.67578125, 15.492919921875, 16.31005859375, 17.127197265625, 17.9443359375, 18.761474609375, 19.57861328125, 20.395751953125, 21.212890625, 22.030029296875, 22.84716796875, 23.664306640625, 24.4814453125, 25.298583984375, 26.11572265625, 26.932861328125, 27.75]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 5.0, 6.0, 10.0, 12.0, 15.0, 33.0, 35.0, 39.0, 54.0, 84.0, 101.0, 128.0, 181.0, 226.0, 282.0, 410.0, 555.0, 789.0, 1315.0, 2345.0, 4846.0, 13457.0, 150392.0, 3064574.0, 901514.0, 36210.0, 7825.0, 3363.0, 1840.0, 1047.0, 699.0, 469.0, 365.0, 252.0, 189.0, 141.0, 103.0, 96.0, 71.0, 48.0, 37.0, 34.0, 26.0, 19.0, 9.0, 11.0, 10.0, 5.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-61.40625, -59.34326171875, -57.2802734375, -55.21728515625, -53.154296875, -51.09130859375, -49.0283203125, -46.96533203125, -44.90234375, -42.83935546875, -40.7763671875, -38.71337890625, -36.650390625, -34.58740234375, -32.5244140625, -30.46142578125, -28.3984375, -26.33544921875, -24.2724609375, -22.20947265625, -20.146484375, -18.08349609375, -16.0205078125, -13.95751953125, -11.89453125, -9.83154296875, -7.7685546875, -5.70556640625, -3.642578125, -1.57958984375, 0.4833984375, 2.54638671875, 4.609375, 6.67236328125, 8.7353515625, 10.79833984375, 12.861328125, 14.92431640625, 16.9873046875, 19.05029296875, 21.11328125, 23.17626953125, 25.2392578125, 27.30224609375, 29.365234375, 31.42822265625, 33.4912109375, 35.55419921875, 37.6171875, 39.68017578125, 41.7431640625, 43.80615234375, 45.869140625, 47.93212890625, 49.9951171875, 52.05810546875, 54.12109375, 56.18408203125, 58.2470703125, 60.31005859375, 62.373046875, 64.43603515625, 66.4990234375, 68.56201171875, 70.625]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 0.0, 3.0, 5.0, 5.0, 5.0, 13.0, 21.0, 16.0, 31.0, 28.0, 36.0, 59.0, 118.0, 209.0, 421.0, 820.0, 929.0, 622.0, 310.0, 111.0, 90.0, 63.0, 39.0, 30.0, 30.0, 14.0, 12.0, 10.0, 5.0, 5.0, 4.0, 1.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.125, -54.3828125, -52.640625, -50.8984375, -49.15625, -47.4140625, -45.671875, -43.9296875, -42.1875, -40.4453125, -38.703125, -36.9609375, -35.21875, -33.4765625, -31.734375, -29.9921875, -28.25, -26.5078125, -24.765625, -23.0234375, -21.28125, -19.5390625, -17.796875, -16.0546875, -14.3125, -12.5703125, -10.828125, -9.0859375, -7.34375, -5.6015625, -3.859375, -2.1171875, -0.375, 1.3671875, 3.109375, 4.8515625, 6.59375, 8.3359375, 10.078125, 11.8203125, 13.5625, 15.3046875, 17.046875, 18.7890625, 20.53125, 22.2734375, 24.015625, 25.7578125, 27.5, 29.2421875, 30.984375, 32.7265625, 34.46875, 36.2109375, 37.953125, 39.6953125, 41.4375, 43.1796875, 44.921875, 46.6640625, 48.40625, 50.1484375, 51.890625, 53.6328125, 55.375]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 1.0, 6.0, 6.0, 8.0, 14.0, 19.0, 38.0, 29.0, 61.0, 95.0, 217.0, 552.0, 2765.0, 35211.0, 4079623.0, 70456.0, 3937.0, 716.0, 239.0, 93.0, 47.0, 41.0, 28.0, 19.0, 16.0, 13.0, 9.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-241.5, -233.85546875, -226.2109375, -218.56640625, -210.921875, -203.27734375, -195.6328125, -187.98828125, -180.34375, -172.69921875, -165.0546875, -157.41015625, -149.765625, -142.12109375, -134.4765625, -126.83203125, -119.1875, -111.54296875, -103.8984375, -96.25390625, -88.609375, -80.96484375, -73.3203125, -65.67578125, -58.03125, -50.38671875, -42.7421875, -35.09765625, -27.453125, -19.80859375, -12.1640625, -4.51953125, 3.125, 10.76953125, 18.4140625, 26.05859375, 33.703125, 41.34765625, 48.9921875, 56.63671875, 64.28125, 71.92578125, 79.5703125, 87.21484375, 94.859375, 102.50390625, 110.1484375, 117.79296875, 125.4375, 133.08203125, 140.7265625, 148.37109375, 156.015625, 163.66015625, 171.3046875, 178.94921875, 186.59375, 194.23828125, 201.8828125, 209.52734375, 217.171875, 224.81640625, 232.4609375, 240.10546875, 247.75]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 7.0, 7.0, 9.0, 12.0, 34.0, 32.0, 69.0, 109.0, 150.0, 186.0, 153.0, 95.0, 58.0, 33.0, 24.0, 15.0, 10.0, 2.0, 2.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-317.0658264160156, -309.921630859375, -302.77740478515625, -295.6332092285156, -288.489013671875, -281.34478759765625, -274.2005920410156, -267.0563659667969, -259.91217041015625, -252.76795959472656, -245.62374877929688, -238.47955322265625, -231.33534240722656, -224.19113159179688, -217.04693603515625, -209.90272521972656, -202.75851440429688, -195.6143035888672, -188.4700927734375, -181.32589721679688, -174.1816864013672, -167.0374755859375, -159.89328002929688, -152.7490692138672, -145.6048583984375, -138.4606475830078, -131.31643676757812, -124.1722412109375, -117.02803039550781, -109.88381958007812, -102.73961639404297, -95.59541320800781, -88.45121765136719, -81.3070068359375, -74.16280364990234, -67.01860046386719, -59.8743896484375, -52.73018264770508, -45.585975646972656, -38.441768646240234, -31.297561645507812, -24.15335464477539, -17.00914764404297, -9.864940643310547, -2.720733642578125, 4.423473358154297, 11.567680358886719, 18.71188735961914, 25.856094360351562, 33.000301361083984, 40.144508361816406, 47.28871536254883, 54.43292236328125, 61.57712936401367, 68.7213363647461, 75.86553955078125, 83.00975036621094, 90.15396118164062, 97.29816436767578, 104.44236755371094, 111.58657836914062, 118.73078918457031, 125.87499237060547, 133.01919555664062, 140.1634063720703]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 5.0, 4.0, 4.0, 6.0, 6.0, 2.0, 7.0, 6.0, 11.0, 12.0, 17.0, 7.0, 8.0, 25.0, 19.0, 28.0, 32.0, 24.0, 30.0, 26.0, 30.0, 44.0, 27.0, 26.0, 32.0, 45.0, 29.0, 46.0, 35.0, 35.0, 40.0, 37.0, 38.0, 33.0, 35.0, 25.0, 24.0, 26.0, 17.0, 19.0, 11.0, 15.0, 9.0, 11.0, 9.0, 9.0, 5.0, 9.0, 3.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-113.650634765625, -109.86417388916016, -106.07772064208984, -102.291259765625, -98.50480651855469, -94.71834564208984, -90.931884765625, -87.14543151855469, -83.35897064208984, -79.572509765625, -75.78605651855469, -71.99959564208984, -68.213134765625, -64.42668151855469, -60.640220642089844, -56.853763580322266, -53.06730651855469, -49.28084945678711, -45.49439239501953, -41.70793151855469, -37.92147445678711, -34.13501739501953, -30.34855842590332, -26.56209945678711, -22.77564239501953, -18.989185333251953, -15.202726364135742, -11.416268348693848, -7.629810333251953, -3.843353271484375, -0.05689430236816406, 3.729564666748047, 7.516021728515625, 11.30247974395752, 15.088937759399414, 18.875396728515625, 22.661853790283203, 26.44831085205078, 30.234769821166992, 34.0212287902832, 37.80768585205078, 41.59414291381836, 45.38059997558594, 49.16706085205078, 52.95351791381836, 56.73997497558594, 60.52643585205078, 64.31289672851562, 68.09934997558594, 71.88581085205078, 75.6722640991211, 79.45872497558594, 83.24517822265625, 87.0316390991211, 90.81809997558594, 94.60455322265625, 98.3910140991211, 102.17747497558594, 105.96392822265625, 109.7503890991211, 113.53684997558594, 117.32330322265625, 121.1097640991211, 124.89622497558594, 128.68267822265625]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 7.0, 6.0, 8.0, 14.0, 12.0, 14.0, 17.0, 26.0, 21.0, 20.0, 29.0, 27.0, 38.0, 32.0, 31.0, 30.0, 31.0, 53.0, 59.0, 50.0, 37.0, 45.0, 41.0, 35.0, 42.0, 44.0, 22.0, 33.0, 23.0, 25.0, 22.0, 18.0, 15.0, 11.0, 8.0, 12.0, 9.0, 5.0, 5.0, 5.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.75, -21.00830078125, -20.2666015625, -19.52490234375, -18.783203125, -18.04150390625, -17.2998046875, -16.55810546875, -15.81640625, -15.07470703125, -14.3330078125, -13.59130859375, -12.849609375, -12.10791015625, -11.3662109375, -10.62451171875, -9.8828125, -9.14111328125, -8.3994140625, -7.65771484375, -6.916015625, -6.17431640625, -5.4326171875, -4.69091796875, -3.94921875, -3.20751953125, -2.4658203125, -1.72412109375, -0.982421875, -0.24072265625, 0.5009765625, 1.24267578125, 1.984375, 2.72607421875, 3.4677734375, 4.20947265625, 4.951171875, 5.69287109375, 6.4345703125, 7.17626953125, 7.91796875, 8.65966796875, 9.4013671875, 10.14306640625, 10.884765625, 11.62646484375, 12.3681640625, 13.10986328125, 13.8515625, 14.59326171875, 15.3349609375, 16.07666015625, 16.818359375, 17.56005859375, 18.3017578125, 19.04345703125, 19.78515625, 20.52685546875, 21.2685546875, 22.01025390625, 22.751953125, 23.49365234375, 24.2353515625, 24.97705078125, 25.71875]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 1.0, 6.0, 3.0, 9.0, 20.0, 13.0, 27.0, 34.0, 58.0, 79.0, 114.0, 146.0, 256.0, 345.0, 550.0, 802.0, 1147.0, 1896.0, 2939.0, 4677.0, 7565.0, 12388.0, 20919.0, 35277.0, 61128.0, 109030.0, 198492.0, 249281.0, 146322.0, 80429.0, 45990.0, 26679.0, 15928.0, 9538.0, 5898.0, 3687.0, 2410.0, 1512.0, 971.0, 664.0, 415.0, 284.0, 202.0, 120.0, 97.0, 62.0, 61.0, 30.0, 14.0, 17.0, 10.0, 9.0, 7.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.109375, -1.07269287109375, -1.0360107421875, -0.99932861328125, -0.962646484375, -0.92596435546875, -0.8892822265625, -0.85260009765625, -0.81591796875, -0.77923583984375, -0.7425537109375, -0.70587158203125, -0.669189453125, -0.63250732421875, -0.5958251953125, -0.55914306640625, -0.5224609375, -0.48577880859375, -0.4490966796875, -0.41241455078125, -0.375732421875, -0.33905029296875, -0.3023681640625, -0.26568603515625, -0.22900390625, -0.19232177734375, -0.1556396484375, -0.11895751953125, -0.082275390625, -0.04559326171875, -0.0089111328125, 0.02777099609375, 0.064453125, 0.10113525390625, 0.1378173828125, 0.17449951171875, 0.211181640625, 0.24786376953125, 0.2845458984375, 0.32122802734375, 0.35791015625, 0.39459228515625, 0.4312744140625, 0.46795654296875, 0.504638671875, 0.54132080078125, 0.5780029296875, 0.61468505859375, 0.6513671875, 0.68804931640625, 0.7247314453125, 0.76141357421875, 0.798095703125, 0.83477783203125, 0.8714599609375, 0.90814208984375, 0.94482421875, 0.98150634765625, 1.0181884765625, 1.05487060546875, 1.091552734375, 1.12823486328125, 1.1649169921875, 1.20159912109375, 1.23828125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 3.0, 6.0, 4.0, 10.0, 7.0, 6.0, 14.0, 9.0, 20.0, 14.0, 24.0, 24.0, 15.0, 24.0, 29.0, 36.0, 38.0, 43.0, 35.0, 36.0, 31.0, 43.0, 38.0, 1059.0, 36.0, 35.0, 35.0, 38.0, 26.0, 33.0, 32.0, 31.0, 25.0, 25.0, 14.0, 16.0, 17.0, 15.0, 19.0, 10.0, 11.0, 11.0, 5.0, 4.0, 7.0, 5.0, 3.0, 3.0, 2.0, 0.0, 2.0, 4.0, 1.0], "bins": [-14.7578125, -14.32470703125, -13.8916015625, -13.45849609375, -13.025390625, -12.59228515625, -12.1591796875, -11.72607421875, -11.29296875, -10.85986328125, -10.4267578125, -9.99365234375, -9.560546875, -9.12744140625, -8.6943359375, -8.26123046875, -7.828125, -7.39501953125, -6.9619140625, -6.52880859375, -6.095703125, -5.66259765625, -5.2294921875, -4.79638671875, -4.36328125, -3.93017578125, -3.4970703125, -3.06396484375, -2.630859375, -2.19775390625, -1.7646484375, -1.33154296875, -0.8984375, -0.46533203125, -0.0322265625, 0.40087890625, 0.833984375, 1.26708984375, 1.7001953125, 2.13330078125, 2.56640625, 2.99951171875, 3.4326171875, 3.86572265625, 4.298828125, 4.73193359375, 5.1650390625, 5.59814453125, 6.03125, 6.46435546875, 6.8974609375, 7.33056640625, 7.763671875, 8.19677734375, 8.6298828125, 9.06298828125, 9.49609375, 9.92919921875, 10.3623046875, 10.79541015625, 11.228515625, 11.66162109375, 12.0947265625, 12.52783203125, 12.9609375]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 4.0, 6.0, 15.0, 17.0, 26.0, 51.0, 56.0, 81.0, 143.0, 201.0, 290.0, 370.0, 574.0, 813.0, 1113.0, 1639.0, 2293.0, 3194.0, 4434.0, 6367.0, 8901.0, 12792.0, 18806.0, 27627.0, 41961.0, 65765.0, 107252.0, 175485.0, 1247418.0, 133429.0, 80263.0, 50375.0, 33118.0, 22013.0, 14866.0, 10412.0, 7311.0, 5141.0, 3623.0, 2605.0, 1880.0, 1322.0, 931.0, 661.0, 488.0, 301.0, 222.0, 180.0, 98.0, 85.0, 45.0, 32.0, 15.0, 17.0, 7.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.83740234375, -0.8105697631835938, -0.7837371826171875, -0.7569046020507812, -0.730072021484375, -0.7032394409179688, -0.6764068603515625, -0.6495742797851562, -0.62274169921875, -0.5959091186523438, -0.5690765380859375, -0.5422439575195312, -0.515411376953125, -0.48857879638671875, -0.4617462158203125, -0.43491363525390625, -0.4080810546875, -0.38124847412109375, -0.3544158935546875, -0.32758331298828125, -0.300750732421875, -0.27391815185546875, -0.2470855712890625, -0.22025299072265625, -0.19342041015625, -0.16658782958984375, -0.1397552490234375, -0.11292266845703125, -0.086090087890625, -0.05925750732421875, -0.0324249267578125, -0.00559234619140625, 0.021240234375, 0.04807281494140625, 0.0749053955078125, 0.10173797607421875, 0.128570556640625, 0.15540313720703125, 0.1822357177734375, 0.20906829833984375, 0.23590087890625, 0.26273345947265625, 0.2895660400390625, 0.31639862060546875, 0.343231201171875, 0.37006378173828125, 0.3968963623046875, 0.42372894287109375, 0.4505615234375, 0.47739410400390625, 0.5042266845703125, 0.5310592651367188, 0.557891845703125, 0.5847244262695312, 0.6115570068359375, 0.6383895874023438, 0.66522216796875, 0.6920547485351562, 0.7188873291015625, 0.7457199096679688, 0.772552490234375, 0.7993850708007812, 0.8262176513671875, 0.8530502319335938, 0.8798828125]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 6.0, 3.0, 3.0, 5.0, 10.0, 9.0, 15.0, 26.0, 27.0, 37.0, 32.0, 52.0, 51.0, 52.0, 72.0, 66.0, 63.0, 61.0, 64.0, 53.0, 47.0, 48.0, 39.0, 31.0, 26.0, 16.0, 22.0, 14.0, 10.0, 13.0, 8.0, 7.0, 6.0, 2.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00482940673828125, -0.00467228889465332, -0.004515171051025391, -0.004358053207397461, -0.004200935363769531, -0.0040438175201416016, -0.003886699676513672, -0.003729581832885742, -0.0035724639892578125, -0.003415346145629883, -0.003258228302001953, -0.0031011104583740234, -0.0029439926147460938, -0.002786874771118164, -0.0026297569274902344, -0.0024726390838623047, -0.002315521240234375, -0.0021584033966064453, -0.0020012855529785156, -0.001844167709350586, -0.0016870498657226562, -0.0015299320220947266, -0.0013728141784667969, -0.0012156963348388672, -0.0010585784912109375, -0.0009014606475830078, -0.0007443428039550781, -0.0005872249603271484, -0.00043010711669921875, -0.00027298927307128906, -0.00011587142944335938, 4.124641418457031e-05, 0.0001983642578125, 0.0003554821014404297, 0.0005125999450683594, 0.0006697177886962891, 0.0008268356323242188, 0.0009839534759521484, 0.0011410713195800781, 0.0012981891632080078, 0.0014553070068359375, 0.0016124248504638672, 0.0017695426940917969, 0.0019266605377197266, 0.0020837783813476562, 0.002240896224975586, 0.0023980140686035156, 0.0025551319122314453, 0.002712249755859375, 0.0028693675994873047, 0.0030264854431152344, 0.003183603286743164, 0.0033407211303710938, 0.0034978389739990234, 0.003654956817626953, 0.003812074661254883, 0.0039691925048828125, 0.004126310348510742, 0.004283428192138672, 0.0044405460357666016, 0.004597663879394531, 0.004754781723022461, 0.004911899566650391, 0.00506901741027832, 0.00522613525390625]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 8.0, 5.0, 6.0, 9.0, 14.0, 17.0, 15.0, 18.0, 38.0, 40.0, 58.0, 95.0, 138.0, 207.0, 558.0, 19565.0, 1017260.0, 9416.0, 451.0, 205.0, 133.0, 84.0, 71.0, 36.0, 35.0, 22.0, 21.0, 9.0, 11.0, 2.0, 2.0, 5.0, 1.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11767578125, -0.11404800415039062, -0.11042022705078125, -0.10679244995117188, -0.1031646728515625, -0.09953689575195312, -0.09590911865234375, -0.09228134155273438, -0.088653564453125, -0.08502578735351562, -0.08139801025390625, -0.07777023315429688, -0.0741424560546875, -0.07051467895507812, -0.06688690185546875, -0.06325912475585938, -0.05963134765625, -0.056003570556640625, -0.05237579345703125, -0.048748016357421875, -0.0451202392578125, -0.041492462158203125, -0.03786468505859375, -0.034236907958984375, -0.030609130859375, -0.026981353759765625, -0.02335357666015625, -0.019725799560546875, -0.0160980224609375, -0.012470245361328125, -0.00884246826171875, -0.005214691162109375, -0.0015869140625, 0.002040863037109375, 0.00566864013671875, 0.009296417236328125, 0.0129241943359375, 0.016551971435546875, 0.02017974853515625, 0.023807525634765625, 0.027435302734375, 0.031063079833984375, 0.03469085693359375, 0.038318634033203125, 0.0419464111328125, 0.045574188232421875, 0.04920196533203125, 0.052829742431640625, 0.05645751953125, 0.060085296630859375, 0.06371307373046875, 0.06734085083007812, 0.0709686279296875, 0.07459640502929688, 0.07822418212890625, 0.08185195922851562, 0.085479736328125, 0.08910751342773438, 0.09273529052734375, 0.09636306762695312, 0.0999908447265625, 0.10361862182617188, 0.10724639892578125, 0.11087417602539062, 0.114501953125]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 7.0, 41.0, 122.0, 374.0, 341.0, 89.0, 33.0, 8.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002465706318616867, -0.002048881258815527, -0.0016320561990141869, -0.0012152311392128468, -0.0007984060794115067, -0.00038158101961016655, 3.5244040191173553e-05, 0.00045206909999251366, 0.0008688941597938538, 0.0012857192195951939, 0.001702544279396534, 0.002119369339197874, 0.002536194398999214, 0.0029530194588005543, 0.0033698445186018944, 0.0037866695784032345, 0.004203494638204575, 0.004620319698005915, 0.005037144757807255, 0.005453969817608595, 0.005870794877409935, 0.006287619937211275, 0.006704444997012615, 0.007121270056813955, 0.007538095116615295, 0.007954919710755348, 0.008371745236217976, 0.008788570761680603, 0.009205395355820656, 0.009622219949960709, 0.010039045475423336, 0.010455871000885963, 0.010872695595026016, 0.011289520189166069, 0.011706345714628696, 0.012123171240091324, 0.012539995834231377, 0.01295682042837143, 0.013373645953834057, 0.013790471479296684, 0.014207296073436737, 0.01462412066757679, 0.015040946193039417, 0.015457771718502045, 0.015874596312642097, 0.01629142090678215, 0.016708247363567352, 0.017125071957707405, 0.017541896551847458, 0.01795872114598751, 0.018375545740127563, 0.018792372196912766, 0.01920919679105282, 0.01962602138519287, 0.020042847841978073, 0.020459672436118126, 0.02087649703025818, 0.02129332162439823, 0.021710146218538284, 0.022126972675323486, 0.02254379726946354, 0.022960621863603592, 0.023377448320388794, 0.023794272914528847, 0.0242110975086689]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 3.0, 5.0, 2.0, 2.0, 2.0, 14.0, 15.0, 12.0, 22.0, 16.0, 24.0, 22.0, 18.0, 21.0, 29.0, 32.0, 41.0, 35.0, 31.0, 47.0, 39.0, 32.0, 39.0, 37.0, 45.0, 38.0, 32.0, 43.0, 40.0, 31.0, 35.0, 24.0, 35.0, 31.0, 20.0, 15.0, 12.0, 13.0, 13.0, 13.0, 7.0, 8.0, 10.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020807981491088867, -0.002001827582716942, -0.001922857016324997, -0.001843886449933052, -0.0017649158835411072, -0.0016859453171491623, -0.0016069747507572174, -0.0015280041843652725, -0.0014490336179733276, -0.0013700630515813828, -0.0012910924851894379, -0.001212121918797493, -0.001133151352405548, -0.0010541807860136032, -0.0009752102196216583, -0.0008962396532297134, -0.0008172690868377686, -0.0007382985204458237, -0.0006593279540538788, -0.0005803573876619339, -0.000501386821269989, -0.00042241625487804413, -0.00034344568848609924, -0.00026447512209415436, -0.00018550455570220947, -0.00010653398931026459, -2.7563422918319702e-05, 5.140714347362518e-05, 0.00013037770986557007, 0.00020934827625751495, 0.00028831884264945984, 0.0003672894090414047, 0.0004462599754333496, 0.0005252305418252945, 0.0006042011082172394, 0.0006831716746091843, 0.0007621422410011292, 0.000841112807393074, 0.0009200833737850189, 0.0009990539401769638, 0.0010780245065689087, 0.0011569950729608536, 0.0012359656393527985, 0.0013149362057447433, 0.0013939067721366882, 0.0014728773385286331, 0.001551847904920578, 0.0016308184713125229, 0.0017097890377044678, 0.0017887596040964127, 0.0018677301704883575, 0.0019467007368803024, 0.0020256713032722473, 0.002104641869664192, 0.002183612436056137, 0.002262583002448082, 0.002341553568840027, 0.0024205241352319717, 0.0024994947016239166, 0.0025784652680158615, 0.0026574358344078064, 0.0027364064007997513, 0.002815376967191696, 0.002894347533583641, 0.002973318099975586]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 7.0, 6.0, 8.0, 14.0, 12.0, 14.0, 17.0, 26.0, 21.0, 20.0, 29.0, 27.0, 38.0, 32.0, 31.0, 30.0, 31.0, 53.0, 59.0, 50.0, 37.0, 45.0, 41.0, 35.0, 42.0, 44.0, 22.0, 33.0, 23.0, 25.0, 22.0, 18.0, 15.0, 11.0, 8.0, 12.0, 9.0, 5.0, 5.0, 5.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.75, -21.00830078125, -20.2666015625, -19.52490234375, -18.783203125, -18.04150390625, -17.2998046875, -16.55810546875, -15.81640625, -15.07470703125, -14.3330078125, -13.59130859375, -12.849609375, -12.10791015625, -11.3662109375, -10.62451171875, -9.8828125, -9.14111328125, -8.3994140625, -7.65771484375, -6.916015625, -6.17431640625, -5.4326171875, -4.69091796875, -3.94921875, -3.20751953125, -2.4658203125, -1.72412109375, -0.982421875, -0.24072265625, 0.5009765625, 1.24267578125, 1.984375, 2.72607421875, 3.4677734375, 4.20947265625, 4.951171875, 5.69287109375, 6.4345703125, 7.17626953125, 7.91796875, 8.65966796875, 9.4013671875, 10.14306640625, 10.884765625, 11.62646484375, 12.3681640625, 13.10986328125, 13.8515625, 14.59326171875, 15.3349609375, 16.07666015625, 16.818359375, 17.56005859375, 18.3017578125, 19.04345703125, 19.78515625, 20.52685546875, 21.2685546875, 22.01025390625, 22.751953125, 23.49365234375, 24.2353515625, 24.97705078125, 25.71875]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 7.0, 6.0, 5.0, 7.0, 9.0, 15.0, 24.0, 32.0, 39.0, 44.0, 64.0, 86.0, 163.0, 260.0, 395.0, 665.0, 1083.0, 1878.0, 3339.0, 6003.0, 11175.0, 22995.0, 51030.0, 135751.0, 441683.0, 228411.0, 77738.0, 32039.0, 15430.0, 7923.0, 4144.0, 2502.0, 1435.0, 789.0, 466.0, 307.0, 195.0, 137.0, 83.0, 57.0, 42.0, 32.0, 24.0, 20.0, 12.0, 5.0, 4.0, 3.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-15.0, -14.5416259765625, -14.083251953125, -13.6248779296875, -13.16650390625, -12.7081298828125, -12.249755859375, -11.7913818359375, -11.3330078125, -10.8746337890625, -10.416259765625, -9.9578857421875, -9.49951171875, -9.0411376953125, -8.582763671875, -8.1243896484375, -7.666015625, -7.2076416015625, -6.749267578125, -6.2908935546875, -5.83251953125, -5.3741455078125, -4.915771484375, -4.4573974609375, -3.9990234375, -3.5406494140625, -3.082275390625, -2.6239013671875, -2.16552734375, -1.7071533203125, -1.248779296875, -0.7904052734375, -0.33203125, 0.1263427734375, 0.584716796875, 1.0430908203125, 1.50146484375, 1.9598388671875, 2.418212890625, 2.8765869140625, 3.3349609375, 3.7933349609375, 4.251708984375, 4.7100830078125, 5.16845703125, 5.6268310546875, 6.085205078125, 6.5435791015625, 7.001953125, 7.4603271484375, 7.918701171875, 8.3770751953125, 8.83544921875, 9.2938232421875, 9.752197265625, 10.2105712890625, 10.6689453125, 11.1273193359375, 11.585693359375, 12.0440673828125, 12.50244140625, 12.9608154296875, 13.419189453125, 13.8775634765625, 14.3359375]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 3.0, 0.0, 3.0, 2.0, 4.0, 9.0, 2.0, 9.0, 13.0, 14.0, 16.0, 17.0, 24.0, 19.0, 23.0, 37.0, 38.0, 34.0, 44.0, 44.0, 53.0, 94.0, 267.0, 1676.0, 151.0, 72.0, 65.0, 47.0, 44.0, 32.0, 23.0, 32.0, 25.0, 24.0, 14.0, 19.0, 17.0, 8.0, 8.0, 6.0, 10.0, 10.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.4375, -69.962890625, -67.48828125, -65.013671875, -62.5390625, -60.064453125, -57.58984375, -55.115234375, -52.640625, -50.166015625, -47.69140625, -45.216796875, -42.7421875, -40.267578125, -37.79296875, -35.318359375, -32.84375, -30.369140625, -27.89453125, -25.419921875, -22.9453125, -20.470703125, -17.99609375, -15.521484375, -13.046875, -10.572265625, -8.09765625, -5.623046875, -3.1484375, -0.673828125, 1.80078125, 4.275390625, 6.75, 9.224609375, 11.69921875, 14.173828125, 16.6484375, 19.123046875, 21.59765625, 24.072265625, 26.546875, 29.021484375, 31.49609375, 33.970703125, 36.4453125, 38.919921875, 41.39453125, 43.869140625, 46.34375, 48.818359375, 51.29296875, 53.767578125, 56.2421875, 58.716796875, 61.19140625, 63.666015625, 66.140625, 68.615234375, 71.08984375, 73.564453125, 76.0390625, 78.513671875, 80.98828125, 83.462890625, 85.9375]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 7.0, 10.0, 8.0, 10.0, 15.0, 17.0, 22.0, 26.0, 38.0, 53.0, 69.0, 72.0, 97.0, 161.0, 215.0, 301.0, 721.0, 5537.0, 3091720.0, 44087.0, 1181.0, 400.0, 240.0, 177.0, 122.0, 107.0, 66.0, 46.0, 40.0, 29.0, 29.0, 22.0, 22.0, 10.0, 8.0, 3.0, 6.0, 5.0, 2.0, 3.0, 2.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-202.625, -196.78515625, -190.9453125, -185.10546875, -179.265625, -173.42578125, -167.5859375, -161.74609375, -155.90625, -150.06640625, -144.2265625, -138.38671875, -132.546875, -126.70703125, -120.8671875, -115.02734375, -109.1875, -103.34765625, -97.5078125, -91.66796875, -85.828125, -79.98828125, -74.1484375, -68.30859375, -62.46875, -56.62890625, -50.7890625, -44.94921875, -39.109375, -33.26953125, -27.4296875, -21.58984375, -15.75, -9.91015625, -4.0703125, 1.76953125, 7.609375, 13.44921875, 19.2890625, 25.12890625, 30.96875, 36.80859375, 42.6484375, 48.48828125, 54.328125, 60.16796875, 66.0078125, 71.84765625, 77.6875, 83.52734375, 89.3671875, 95.20703125, 101.046875, 106.88671875, 112.7265625, 118.56640625, 124.40625, 130.24609375, 136.0859375, 141.92578125, 147.765625, 153.60546875, 159.4453125, 165.28515625, 171.125]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 9.0, 39.0, 83.0, 226.0, 346.0, 197.0, 78.0, 26.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.1983871459961, -76.55054473876953, -71.9027099609375, -67.25486755371094, -62.607025146484375, -57.95918273925781, -53.311344146728516, -48.66350555419922, -44.015663146972656, -39.367820739746094, -34.7199821472168, -30.072141647338867, -25.424301147460938, -20.776460647583008, -16.128620147705078, -11.480781555175781, -6.832939147949219, -2.185098648071289, 2.4627418518066406, 7.11058235168457, 11.7584228515625, 16.40626335144043, 21.05410385131836, 25.701942443847656, 30.34978485107422, 34.99762725830078, 39.64546585083008, 44.293304443359375, 48.94114685058594, 53.5889892578125, 58.2368278503418, 62.884666442871094, 67.53250122070312, 72.18034362792969, 76.82818603515625, 81.47602081298828, 86.12386322021484, 90.7717056274414, 95.41954040527344, 100.0673828125, 104.71522521972656, 109.36306762695312, 114.01091003417969, 118.65874481201172, 123.30658721923828, 127.95442962646484, 132.60226440429688, 137.25010681152344, 141.89794921875, 146.54579162597656, 151.19363403320312, 155.8414764404297, 160.48931884765625, 165.13714599609375, 169.7849884033203, 174.43283081054688, 179.08067321777344, 183.728515625, 188.37635803222656, 193.02420043945312, 197.67202758789062, 202.3198699951172, 206.96771240234375, 211.6155548095703, 216.26339721679688]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 2.0, 5.0, 10.0, 4.0, 9.0, 12.0, 13.0, 15.0, 24.0, 30.0, 22.0, 28.0, 36.0, 33.0, 30.0, 26.0, 28.0, 46.0, 34.0, 28.0, 45.0, 39.0, 43.0, 33.0, 49.0, 34.0, 40.0, 33.0, 47.0, 27.0, 24.0, 21.0, 20.0, 22.0, 20.0, 13.0, 11.0, 9.0, 8.0, 7.0, 7.0, 5.0, 5.0, 2.0, 6.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-169.39132690429688, -163.98867797851562, -158.5860137939453, -153.18336486816406, -147.78070068359375, -142.3780517578125, -136.97540283203125, -131.57273864746094, -126.17008209228516, -120.76742553710938, -115.3647689819336, -109.96211242675781, -104.55946350097656, -99.15679931640625, -93.754150390625, -88.35149383544922, -82.94883728027344, -77.54618072509766, -72.14352416992188, -66.74087524414062, -61.33821487426758, -55.9355583190918, -50.53290557861328, -45.1302490234375, -39.72759246826172, -34.32493591308594, -28.92228126525879, -23.51962661743164, -18.11697006225586, -12.714313507080078, -7.3116607666015625, -1.9090042114257812, 3.49365234375, 8.896307945251465, 14.29896354675293, 19.701618194580078, 25.10427474975586, 30.50693130493164, 35.909584045410156, 41.31224060058594, 46.71489715576172, 52.1175537109375, 57.52021026611328, 62.9228630065918, 68.32551574707031, 73.72817993164062, 79.13082885742188, 84.53348541259766, 89.93614196777344, 95.33879852294922, 100.741455078125, 106.14410400390625, 111.54676818847656, 116.94941711425781, 122.3520736694336, 127.75473022460938, 133.15737915039062, 138.56002807617188, 143.9626922607422, 149.36534118652344, 154.76800537109375, 160.170654296875, 165.57330322265625, 170.97596740722656, 176.37863159179688]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 4.0, 2.0, 3.0, 8.0, 7.0, 9.0, 8.0, 14.0, 13.0, 19.0, 13.0, 28.0, 29.0, 23.0, 30.0, 28.0, 31.0, 31.0, 38.0, 49.0, 44.0, 43.0, 43.0, 51.0, 45.0, 40.0, 40.0, 49.0, 25.0, 36.0, 38.0, 32.0, 21.0, 18.0, 17.0, 16.0, 12.0, 5.0, 8.0, 7.0, 14.0, 5.0, 3.0, 3.0, 2.0, 0.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.125, -21.3486328125, -20.572265625, -19.7958984375, -19.01953125, -18.2431640625, -17.466796875, -16.6904296875, -15.9140625, -15.1376953125, -14.361328125, -13.5849609375, -12.80859375, -12.0322265625, -11.255859375, -10.4794921875, -9.703125, -8.9267578125, -8.150390625, -7.3740234375, -6.59765625, -5.8212890625, -5.044921875, -4.2685546875, -3.4921875, -2.7158203125, -1.939453125, -1.1630859375, -0.38671875, 0.3896484375, 1.166015625, 1.9423828125, 2.71875, 3.4951171875, 4.271484375, 5.0478515625, 5.82421875, 6.6005859375, 7.376953125, 8.1533203125, 8.9296875, 9.7060546875, 10.482421875, 11.2587890625, 12.03515625, 12.8115234375, 13.587890625, 14.3642578125, 15.140625, 15.9169921875, 16.693359375, 17.4697265625, 18.24609375, 19.0224609375, 19.798828125, 20.5751953125, 21.3515625, 22.1279296875, 22.904296875, 23.6806640625, 24.45703125, 25.2333984375, 26.009765625, 26.7861328125, 27.5625]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 3.0, 11.0, 10.0, 9.0, 32.0, 23.0, 31.0, 51.0, 61.0, 82.0, 161.0, 168.0, 266.0, 411.0, 667.0, 1240.0, 2538.0, 6582.0, 38016.0, 1952327.0, 2139182.0, 39595.0, 6799.0, 2649.0, 1284.0, 705.0, 420.0, 286.0, 208.0, 121.0, 87.0, 67.0, 53.0, 36.0, 30.0, 22.0, 14.0, 12.0, 8.0, 4.0, 3.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.9375, -66.4765625, -64.015625, -61.5546875, -59.09375, -56.6328125, -54.171875, -51.7109375, -49.25, -46.7890625, -44.328125, -41.8671875, -39.40625, -36.9453125, -34.484375, -32.0234375, -29.5625, -27.1015625, -24.640625, -22.1796875, -19.71875, -17.2578125, -14.796875, -12.3359375, -9.875, -7.4140625, -4.953125, -2.4921875, -0.03125, 2.4296875, 4.890625, 7.3515625, 9.8125, 12.2734375, 14.734375, 17.1953125, 19.65625, 22.1171875, 24.578125, 27.0390625, 29.5, 31.9609375, 34.421875, 36.8828125, 39.34375, 41.8046875, 44.265625, 46.7265625, 49.1875, 51.6484375, 54.109375, 56.5703125, 59.03125, 61.4921875, 63.953125, 66.4140625, 68.875, 71.3359375, 73.796875, 76.2578125, 78.71875, 81.1796875, 83.640625, 86.1015625, 88.5625]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 3.0, 1.0, 7.0, 11.0, 5.0, 5.0, 13.0, 12.0, 16.0, 28.0, 43.0, 43.0, 59.0, 106.0, 219.0, 398.0, 711.0, 908.0, 632.0, 333.0, 190.0, 102.0, 60.0, 38.0, 30.0, 28.0, 23.0, 17.0, 8.0, 7.0, 1.0, 2.0, 0.0, 6.0, 4.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.09375, -32.634765625, -31.17578125, -29.716796875, -28.2578125, -26.798828125, -25.33984375, -23.880859375, -22.421875, -20.962890625, -19.50390625, -18.044921875, -16.5859375, -15.126953125, -13.66796875, -12.208984375, -10.75, -9.291015625, -7.83203125, -6.373046875, -4.9140625, -3.455078125, -1.99609375, -0.537109375, 0.921875, 2.380859375, 3.83984375, 5.298828125, 6.7578125, 8.216796875, 9.67578125, 11.134765625, 12.59375, 14.052734375, 15.51171875, 16.970703125, 18.4296875, 19.888671875, 21.34765625, 22.806640625, 24.265625, 25.724609375, 27.18359375, 28.642578125, 30.1015625, 31.560546875, 33.01953125, 34.478515625, 35.9375, 37.396484375, 38.85546875, 40.314453125, 41.7734375, 43.232421875, 44.69140625, 46.150390625, 47.609375, 49.068359375, 50.52734375, 51.986328125, 53.4453125, 54.904296875, 56.36328125, 57.822265625, 59.28125]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 7.0, 2.0, 3.0, 1.0, 5.0, 7.0, 15.0, 23.0, 30.0, 44.0, 64.0, 80.0, 166.0, 425.0, 1153.0, 7433.0, 190521.0, 3967838.0, 22695.0, 2634.0, 564.0, 234.0, 105.0, 74.0, 48.0, 26.0, 22.0, 19.0, 9.0, 4.0, 10.0, 8.0, 4.0, 2.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-243.125, -236.765625, -230.40625, -224.046875, -217.6875, -211.328125, -204.96875, -198.609375, -192.25, -185.890625, -179.53125, -173.171875, -166.8125, -160.453125, -154.09375, -147.734375, -141.375, -135.015625, -128.65625, -122.296875, -115.9375, -109.578125, -103.21875, -96.859375, -90.5, -84.140625, -77.78125, -71.421875, -65.0625, -58.703125, -52.34375, -45.984375, -39.625, -33.265625, -26.90625, -20.546875, -14.1875, -7.828125, -1.46875, 4.890625, 11.25, 17.609375, 23.96875, 30.328125, 36.6875, 43.046875, 49.40625, 55.765625, 62.125, 68.484375, 74.84375, 81.203125, 87.5625, 93.921875, 100.28125, 106.640625, 113.0, 119.359375, 125.71875, 132.078125, 138.4375, 144.796875, 151.15625, 157.515625, 163.875]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 8.0, 11.0, 27.0, 57.0, 138.0, 237.0, 274.0, 142.0, 56.0, 31.0, 15.0, 8.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-447.4386901855469, -437.7483825683594, -428.0580749511719, -418.3677978515625, -408.677490234375, -398.9871826171875, -389.296875, -379.6065673828125, -369.916259765625, -360.2259521484375, -350.53564453125, -340.8453674316406, -331.1550598144531, -321.4647521972656, -311.7744445800781, -302.0841369628906, -292.39385986328125, -282.70355224609375, -273.01324462890625, -263.3229675292969, -253.63265991210938, -243.94235229492188, -234.25204467773438, -224.56173706054688, -214.87144470214844, -205.18113708496094, -195.4908447265625, -185.800537109375, -176.1102294921875, -166.41993713378906, -156.72962951660156, -147.03933715820312, -137.3489990234375, -127.65869903564453, -117.96839904785156, -108.27809143066406, -98.5877914428711, -88.89749145507812, -79.20718383789062, -69.51688385009766, -59.82658386230469, -50.13628387451172, -40.445980072021484, -30.755678176879883, -21.06537628173828, -11.375076293945312, -1.6847724914550781, 8.005531311035156, 17.695831298828125, 27.386133193969727, 37.07643508911133, 46.76673889160156, 56.45703887939453, 66.1473388671875, 75.837646484375, 85.52794647216797, 95.21824645996094, 104.9085464477539, 114.59884643554688, 124.28915405273438, 133.97946166992188, 143.6697540283203, 153.3600616455078, 163.05035400390625, 172.74066162109375]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 5.0, 4.0, 3.0, 7.0, 7.0, 12.0, 8.0, 16.0, 13.0, 17.0, 15.0, 30.0, 24.0, 32.0, 27.0, 40.0, 32.0, 28.0, 38.0, 38.0, 45.0, 52.0, 44.0, 38.0, 50.0, 26.0, 34.0, 39.0, 24.0, 36.0, 31.0, 34.0, 11.0, 35.0, 21.0, 12.0, 13.0, 12.0, 11.0, 8.0, 6.0, 9.0, 6.0, 4.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-109.64241790771484, -106.25418090820312, -102.8659439086914, -99.47770690917969, -96.0894775390625, -92.70124053955078, -89.31300354003906, -85.92476654052734, -82.53652954101562, -79.1482925415039, -75.76005554199219, -72.371826171875, -68.98358917236328, -65.59535217285156, -62.207115173339844, -58.818878173828125, -55.43064880371094, -52.04241180419922, -48.654178619384766, -45.26594161987305, -41.877708435058594, -38.489471435546875, -35.101234436035156, -31.71299934387207, -28.324764251708984, -24.9365291595459, -21.548294067382812, -18.160057067871094, -14.771821975708008, -11.383586883544922, -7.995349884033203, -4.607114791870117, -1.2188873291015625, 2.1693482398986816, 5.557583808898926, 8.945819854736328, 12.334054946899414, 15.7222900390625, 19.11052703857422, 22.498762130737305, 25.88699722290039, 29.275232315063477, 32.66346740722656, 36.05170440673828, 39.43994140625, 42.82817459106445, 46.21641159057617, 49.604644775390625, 52.992881774902344, 56.38111877441406, 59.769351959228516, 63.157588958740234, 66.54582214355469, 69.9340591430664, 73.32229614257812, 76.71053314208984, 80.09877014160156, 83.48700714111328, 86.875244140625, 90.26347351074219, 93.6517105102539, 97.03994750976562, 100.42818450927734, 103.81642150878906, 107.20465087890625]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 0.0, 3.0, 2.0, 4.0, 6.0, 4.0, 6.0, 6.0, 6.0, 13.0, 15.0, 11.0, 15.0, 19.0, 24.0, 19.0, 28.0, 28.0, 31.0, 39.0, 39.0, 38.0, 34.0, 36.0, 50.0, 42.0, 58.0, 43.0, 44.0, 37.0, 27.0, 24.0, 29.0, 38.0, 25.0, 25.0, 20.0, 28.0, 15.0, 18.0, 14.0, 9.0, 4.0, 7.0, 6.0, 6.0, 5.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.75, -20.02392578125, -19.2978515625, -18.57177734375, -17.845703125, -17.11962890625, -16.3935546875, -15.66748046875, -14.94140625, -14.21533203125, -13.4892578125, -12.76318359375, -12.037109375, -11.31103515625, -10.5849609375, -9.85888671875, -9.1328125, -8.40673828125, -7.6806640625, -6.95458984375, -6.228515625, -5.50244140625, -4.7763671875, -4.05029296875, -3.32421875, -2.59814453125, -1.8720703125, -1.14599609375, -0.419921875, 0.30615234375, 1.0322265625, 1.75830078125, 2.484375, 3.21044921875, 3.9365234375, 4.66259765625, 5.388671875, 6.11474609375, 6.8408203125, 7.56689453125, 8.29296875, 9.01904296875, 9.7451171875, 10.47119140625, 11.197265625, 11.92333984375, 12.6494140625, 13.37548828125, 14.1015625, 14.82763671875, 15.5537109375, 16.27978515625, 17.005859375, 17.73193359375, 18.4580078125, 19.18408203125, 19.91015625, 20.63623046875, 21.3623046875, 22.08837890625, 22.814453125, 23.54052734375, 24.2666015625, 24.99267578125, 25.71875]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 3.0, 2.0, 7.0, 9.0, 10.0, 16.0, 31.0, 37.0, 38.0, 77.0, 99.0, 145.0, 197.0, 327.0, 476.0, 696.0, 1076.0, 1524.0, 2487.0, 3885.0, 5886.0, 9667.0, 16078.0, 26742.0, 47253.0, 85168.0, 162242.0, 265408.0, 188772.0, 98732.0, 53480.0, 30237.0, 17993.0, 10832.0, 6728.0, 4145.0, 2788.0, 1730.0, 1182.0, 760.0, 513.0, 342.0, 244.0, 150.0, 98.0, 74.0, 59.0, 43.0, 25.0, 17.0, 12.0, 6.0, 10.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.1513671875, -1.11248779296875, -1.0736083984375, -1.03472900390625, -0.995849609375, -0.95697021484375, -0.9180908203125, -0.87921142578125, -0.84033203125, -0.80145263671875, -0.7625732421875, -0.72369384765625, -0.684814453125, -0.64593505859375, -0.6070556640625, -0.56817626953125, -0.529296875, -0.49041748046875, -0.4515380859375, -0.41265869140625, -0.373779296875, -0.33489990234375, -0.2960205078125, -0.25714111328125, -0.21826171875, -0.17938232421875, -0.1405029296875, -0.10162353515625, -0.062744140625, -0.02386474609375, 0.0150146484375, 0.05389404296875, 0.0927734375, 0.13165283203125, 0.1705322265625, 0.20941162109375, 0.248291015625, 0.28717041015625, 0.3260498046875, 0.36492919921875, 0.40380859375, 0.44268798828125, 0.4815673828125, 0.52044677734375, 0.559326171875, 0.59820556640625, 0.6370849609375, 0.67596435546875, 0.71484375, 0.75372314453125, 0.7926025390625, 0.83148193359375, 0.870361328125, 0.90924072265625, 0.9481201171875, 0.98699951171875, 1.02587890625, 1.06475830078125, 1.1036376953125, 1.14251708984375, 1.181396484375, 1.22027587890625, 1.2591552734375, 1.29803466796875, 1.3369140625]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 2.0, 3.0, 6.0, 3.0, 8.0, 10.0, 9.0, 12.0, 11.0, 24.0, 19.0, 19.0, 27.0, 14.0, 30.0, 26.0, 27.0, 32.0, 20.0, 40.0, 31.0, 33.0, 43.0, 29.0, 1059.0, 33.0, 29.0, 42.0, 31.0, 37.0, 27.0, 26.0, 26.0, 32.0, 15.0, 27.0, 24.0, 21.0, 18.0, 17.0, 10.0, 19.0, 11.0, 9.0, 9.0, 10.0, 4.0, 2.0, 9.0, 3.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0], "bins": [-13.515625, -13.1043701171875, -12.693115234375, -12.2818603515625, -11.87060546875, -11.4593505859375, -11.048095703125, -10.6368408203125, -10.2255859375, -9.8143310546875, -9.403076171875, -8.9918212890625, -8.58056640625, -8.1693115234375, -7.758056640625, -7.3468017578125, -6.935546875, -6.5242919921875, -6.113037109375, -5.7017822265625, -5.29052734375, -4.8792724609375, -4.468017578125, -4.0567626953125, -3.6455078125, -3.2342529296875, -2.822998046875, -2.4117431640625, -2.00048828125, -1.5892333984375, -1.177978515625, -0.7667236328125, -0.35546875, 0.0557861328125, 0.467041015625, 0.8782958984375, 1.28955078125, 1.7008056640625, 2.112060546875, 2.5233154296875, 2.9345703125, 3.3458251953125, 3.757080078125, 4.1683349609375, 4.57958984375, 4.9908447265625, 5.402099609375, 5.8133544921875, 6.224609375, 6.6358642578125, 7.047119140625, 7.4583740234375, 7.86962890625, 8.2808837890625, 8.692138671875, 9.1033935546875, 9.5146484375, 9.9259033203125, 10.337158203125, 10.7484130859375, 11.15966796875, 11.5709228515625, 11.982177734375, 12.3934326171875, 12.8046875]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 7.0, 14.0, 21.0, 28.0, 42.0, 58.0, 90.0, 124.0, 200.0, 280.0, 374.0, 548.0, 817.0, 1126.0, 1481.0, 2118.0, 2954.0, 4053.0, 5421.0, 7665.0, 10535.0, 14534.0, 20195.0, 28110.0, 40869.0, 60163.0, 92199.0, 143186.0, 1228637.0, 140974.0, 91064.0, 59136.0, 40444.0, 27835.0, 20117.0, 14371.0, 10152.0, 7431.0, 5600.0, 4056.0, 2834.0, 2087.0, 1498.0, 1108.0, 766.0, 574.0, 390.0, 283.0, 179.0, 129.0, 84.0, 62.0, 48.0, 28.0, 18.0, 11.0, 4.0, 6.0, 5.0, 1.0, 1.0], "bins": [-0.7568359375, -0.7327957153320312, -0.7087554931640625, -0.6847152709960938, -0.660675048828125, -0.6366348266601562, -0.6125946044921875, -0.5885543823242188, -0.56451416015625, -0.5404739379882812, -0.5164337158203125, -0.49239349365234375, -0.468353271484375, -0.44431304931640625, -0.4202728271484375, -0.39623260498046875, -0.3721923828125, -0.34815216064453125, -0.3241119384765625, -0.30007171630859375, -0.276031494140625, -0.25199127197265625, -0.2279510498046875, -0.20391082763671875, -0.17987060546875, -0.15583038330078125, -0.1317901611328125, -0.10774993896484375, -0.083709716796875, -0.05966949462890625, -0.0356292724609375, -0.01158905029296875, 0.012451171875, 0.03649139404296875, 0.0605316162109375, 0.08457183837890625, 0.108612060546875, 0.13265228271484375, 0.1566925048828125, 0.18073272705078125, 0.20477294921875, 0.22881317138671875, 0.2528533935546875, 0.27689361572265625, 0.300933837890625, 0.32497406005859375, 0.3490142822265625, 0.37305450439453125, 0.3970947265625, 0.42113494873046875, 0.4451751708984375, 0.46921539306640625, 0.493255615234375, 0.5172958374023438, 0.5413360595703125, 0.5653762817382812, 0.58941650390625, 0.6134567260742188, 0.6374969482421875, 0.6615371704101562, 0.685577392578125, 0.7096176147460938, 0.7336578369140625, 0.7576980590820312, 0.78173828125]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 7.0, 4.0, 5.0, 7.0, 13.0, 8.0, 7.0, 21.0, 15.0, 19.0, 31.0, 29.0, 35.0, 34.0, 37.0, 43.0, 46.0, 64.0, 54.0, 45.0, 65.0, 48.0, 46.0, 46.0, 35.0, 29.0, 34.0, 25.0, 30.0, 17.0, 13.0, 17.0, 11.0, 9.0, 10.0, 8.0, 8.0, 9.0, 4.0, 2.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.003765106201171875, -0.003645479679107666, -0.003525853157043457, -0.003406226634979248, -0.003286600112915039, -0.00316697359085083, -0.003047347068786621, -0.002927720546722412, -0.002808094024658203, -0.002688467502593994, -0.002568840980529785, -0.002449214458465576, -0.002329587936401367, -0.002209961414337158, -0.0020903348922729492, -0.0019707083702087402, -0.0018510818481445312, -0.0017314553260803223, -0.0016118288040161133, -0.0014922022819519043, -0.0013725757598876953, -0.0012529492378234863, -0.0011333227157592773, -0.0010136961936950684, -0.0008940696716308594, -0.0007744431495666504, -0.0006548166275024414, -0.0005351901054382324, -0.00041556358337402344, -0.00029593706130981445, -0.00017631053924560547, -5.6684017181396484e-05, 6.29425048828125e-05, 0.00018256902694702148, 0.00030219554901123047, 0.00042182207107543945, 0.0005414485931396484, 0.0006610751152038574, 0.0007807016372680664, 0.0009003281593322754, 0.0010199546813964844, 0.0011395812034606934, 0.0012592077255249023, 0.0013788342475891113, 0.0014984607696533203, 0.0016180872917175293, 0.0017377138137817383, 0.0018573403358459473, 0.0019769668579101562, 0.0020965933799743652, 0.0022162199020385742, 0.002335846424102783, 0.002455472946166992, 0.002575099468231201, 0.00269472599029541, 0.002814352512359619, 0.002933979034423828, 0.003053605556488037, 0.003173232078552246, 0.003292858600616455, 0.003412485122680664, 0.003532111644744873, 0.003651738166809082, 0.003771364688873291, 0.0038909912109375]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 4.0, 3.0, 10.0, 10.0, 7.0, 15.0, 7.0, 21.0, 16.0, 19.0, 25.0, 42.0, 58.0, 55.0, 59.0, 91.0, 149.0, 212.0, 520.0, 5961.0, 915115.0, 123807.0, 1313.0, 317.0, 171.0, 121.0, 97.0, 76.0, 51.0, 41.0, 36.0, 23.0, 21.0, 20.0, 9.0, 12.0, 6.0, 4.0, 11.0, 5.0, 8.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.08203125, -0.07952880859375, -0.0770263671875, -0.07452392578125, -0.072021484375, -0.06951904296875, -0.0670166015625, -0.06451416015625, -0.06201171875, -0.05950927734375, -0.0570068359375, -0.05450439453125, -0.052001953125, -0.04949951171875, -0.0469970703125, -0.04449462890625, -0.0419921875, -0.03948974609375, -0.0369873046875, -0.03448486328125, -0.031982421875, -0.02947998046875, -0.0269775390625, -0.02447509765625, -0.02197265625, -0.01947021484375, -0.0169677734375, -0.01446533203125, -0.011962890625, -0.00946044921875, -0.0069580078125, -0.00445556640625, -0.001953125, 0.00054931640625, 0.0030517578125, 0.00555419921875, 0.008056640625, 0.01055908203125, 0.0130615234375, 0.01556396484375, 0.01806640625, 0.02056884765625, 0.0230712890625, 0.02557373046875, 0.028076171875, 0.03057861328125, 0.0330810546875, 0.03558349609375, 0.0380859375, 0.04058837890625, 0.0430908203125, 0.04559326171875, 0.048095703125, 0.05059814453125, 0.0531005859375, 0.05560302734375, 0.05810546875, 0.06060791015625, 0.0631103515625, 0.06561279296875, 0.068115234375, 0.07061767578125, 0.0731201171875, 0.07562255859375, 0.078125]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 58.0, 716.0, 224.0, 17.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.043926455080509186, -0.04316602647304535, -0.042405594140291214, -0.04164516553282738, -0.04088473320007324, -0.040124304592609406, -0.03936387598514557, -0.038603443652391434, -0.0378430150449276, -0.03708258643746376, -0.036322154104709625, -0.03556172549724579, -0.03480129316449165, -0.03404086455702782, -0.03328043222427368, -0.032520003616809845, -0.03175957128405571, -0.030999140813946724, -0.030238710343837738, -0.0294782817363739, -0.028717851266264915, -0.02795742079615593, -0.027196990326046944, -0.026436559855937958, -0.02567613124847412, -0.024915700778365135, -0.02415527030825615, -0.023394841700792313, -0.022634411230683327, -0.02187398076057434, -0.021113550290465355, -0.02035311982035637, -0.019592689350247383, -0.018832258880138397, -0.01807182841002941, -0.017311397939920425, -0.01655096933245659, -0.015790538862347603, -0.015030108392238617, -0.014269677922129631, -0.013509247452020645, -0.01274881698191166, -0.011988387443125248, -0.011227956973016262, -0.010467526502907276, -0.009707096964120865, -0.008946666494011879, -0.008186236023902893, -0.0074258060194551945, -0.006665376015007496, -0.00590494554489851, -0.005144515540450811, -0.004384085536003113, -0.003623655065894127, -0.0028632250614464283, -0.0021027945913374424, -0.0013423645868897438, -0.0005819344078190625, 0.00017849577125161886, 0.0009389258921146393, 0.0016993561293929815, 0.0024597863666713238, 0.0032202163711190224, 0.003980646841228008, 0.004741076845675707]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 15.0, 10.0, 13.0, 14.0, 12.0, 12.0, 16.0, 23.0, 31.0, 35.0, 32.0, 37.0, 38.0, 32.0, 38.0, 35.0, 40.0, 35.0, 49.0, 60.0, 42.0, 36.0, 36.0, 35.0, 34.0, 33.0, 28.0, 25.0, 23.0, 15.0, 24.0, 12.0, 13.0, 14.0, 12.0, 8.0, 5.0, 9.0, 8.0, 2.0, 1.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.002417266368865967, -0.0023432783782482147, -0.0022692903876304626, -0.0021953023970127106, -0.0021213144063949585, -0.0020473264157772064, -0.0019733384251594543, -0.0018993504345417023, -0.0018253624439239502, -0.0017513744533061981, -0.001677386462688446, -0.001603398472070694, -0.001529410481452942, -0.0014554224908351898, -0.0013814345002174377, -0.0013074465095996857, -0.0012334585189819336, -0.0011594705283641815, -0.0010854825377464294, -0.0010114945471286774, -0.0009375065565109253, -0.0008635185658931732, -0.0007895305752754211, -0.0007155425846576691, -0.000641554594039917, -0.0005675666034221649, -0.0004935786128044128, -0.00041959062218666077, -0.0003456026315689087, -0.0002716146409511566, -0.00019762665033340454, -0.00012363865971565247, -4.965066909790039e-05, 2.4337321519851685e-05, 9.832531213760376e-05, 0.00017231330275535583, 0.0002463012933731079, 0.00032028928399086, 0.00039427727460861206, 0.00046826526522636414, 0.0005422532558441162, 0.0006162412464618683, 0.0006902292370796204, 0.0007642172276973724, 0.0008382052183151245, 0.0009121932089328766, 0.0009861811995506287, 0.0010601691901683807, 0.0011341571807861328, 0.0012081451714038849, 0.001282133162021637, 0.001356121152639389, 0.0014301091432571411, 0.0015040971338748932, 0.0015780851244926453, 0.0016520731151103973, 0.0017260611057281494, 0.0018000490963459015, 0.0018740370869636536, 0.0019480250775814056, 0.0020220130681991577, 0.00209600105881691, 0.002169989049434662, 0.002243977040052414, 0.002317965030670166]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 0.0, 3.0, 2.0, 4.0, 6.0, 4.0, 6.0, 6.0, 6.0, 13.0, 15.0, 11.0, 15.0, 19.0, 24.0, 19.0, 28.0, 28.0, 31.0, 39.0, 39.0, 38.0, 34.0, 36.0, 50.0, 42.0, 58.0, 43.0, 44.0, 37.0, 27.0, 24.0, 29.0, 38.0, 25.0, 25.0, 20.0, 28.0, 15.0, 18.0, 14.0, 9.0, 4.0, 7.0, 6.0, 6.0, 5.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.75, -20.02392578125, -19.2978515625, -18.57177734375, -17.845703125, -17.11962890625, -16.3935546875, -15.66748046875, -14.94140625, -14.21533203125, -13.4892578125, -12.76318359375, -12.037109375, -11.31103515625, -10.5849609375, -9.85888671875, -9.1328125, -8.40673828125, -7.6806640625, -6.95458984375, -6.228515625, -5.50244140625, -4.7763671875, -4.05029296875, -3.32421875, -2.59814453125, -1.8720703125, -1.14599609375, -0.419921875, 0.30615234375, 1.0322265625, 1.75830078125, 2.484375, 3.21044921875, 3.9365234375, 4.66259765625, 5.388671875, 6.11474609375, 6.8408203125, 7.56689453125, 8.29296875, 9.01904296875, 9.7451171875, 10.47119140625, 11.197265625, 11.92333984375, 12.6494140625, 13.37548828125, 14.1015625, 14.82763671875, 15.5537109375, 16.27978515625, 17.005859375, 17.73193359375, 18.4580078125, 19.18408203125, 19.91015625, 20.63623046875, 21.3623046875, 22.08837890625, 22.814453125, 23.54052734375, 24.2666015625, 24.99267578125, 25.71875]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 2.0, 8.0, 5.0, 5.0, 11.0, 11.0, 18.0, 15.0, 21.0, 28.0, 35.0, 46.0, 52.0, 76.0, 100.0, 134.0, 220.0, 387.0, 687.0, 1344.0, 3133.0, 8332.0, 25668.0, 98114.0, 589222.0, 246768.0, 49794.0, 14673.0, 5208.0, 1993.0, 958.0, 522.0, 274.0, 180.0, 133.0, 89.0, 67.0, 61.0, 35.0, 26.0, 22.0, 19.0, 19.0, 9.0, 13.0, 6.0, 4.0, 3.0, 4.0, 6.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.171875, -22.3662109375, -21.560546875, -20.7548828125, -19.94921875, -19.1435546875, -18.337890625, -17.5322265625, -16.7265625, -15.9208984375, -15.115234375, -14.3095703125, -13.50390625, -12.6982421875, -11.892578125, -11.0869140625, -10.28125, -9.4755859375, -8.669921875, -7.8642578125, -7.05859375, -6.2529296875, -5.447265625, -4.6416015625, -3.8359375, -3.0302734375, -2.224609375, -1.4189453125, -0.61328125, 0.1923828125, 0.998046875, 1.8037109375, 2.609375, 3.4150390625, 4.220703125, 5.0263671875, 5.83203125, 6.6376953125, 7.443359375, 8.2490234375, 9.0546875, 9.8603515625, 10.666015625, 11.4716796875, 12.27734375, 13.0830078125, 13.888671875, 14.6943359375, 15.5, 16.3056640625, 17.111328125, 17.9169921875, 18.72265625, 19.5283203125, 20.333984375, 21.1396484375, 21.9453125, 22.7509765625, 23.556640625, 24.3623046875, 25.16796875, 25.9736328125, 26.779296875, 27.5849609375, 28.390625]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 1.0, 3.0, 5.0, 5.0, 3.0, 3.0, 7.0, 7.0, 13.0, 10.0, 13.0, 16.0, 20.0, 22.0, 24.0, 28.0, 41.0, 36.0, 34.0, 27.0, 37.0, 39.0, 73.0, 123.0, 1737.0, 231.0, 86.0, 42.0, 50.0, 28.0, 34.0, 36.0, 23.0, 40.0, 20.0, 23.0, 20.0, 21.0, 15.0, 9.0, 10.0, 7.0, 7.0, 4.0, 5.0, 5.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-62.9375, -61.009765625, -59.08203125, -57.154296875, -55.2265625, -53.298828125, -51.37109375, -49.443359375, -47.515625, -45.587890625, -43.66015625, -41.732421875, -39.8046875, -37.876953125, -35.94921875, -34.021484375, -32.09375, -30.166015625, -28.23828125, -26.310546875, -24.3828125, -22.455078125, -20.52734375, -18.599609375, -16.671875, -14.744140625, -12.81640625, -10.888671875, -8.9609375, -7.033203125, -5.10546875, -3.177734375, -1.25, 0.677734375, 2.60546875, 4.533203125, 6.4609375, 8.388671875, 10.31640625, 12.244140625, 14.171875, 16.099609375, 18.02734375, 19.955078125, 21.8828125, 23.810546875, 25.73828125, 27.666015625, 29.59375, 31.521484375, 33.44921875, 35.376953125, 37.3046875, 39.232421875, 41.16015625, 43.087890625, 45.015625, 46.943359375, 48.87109375, 50.798828125, 52.7265625, 54.654296875, 56.58203125, 58.509765625, 60.4375]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 0.0, 4.0, 1.0, 5.0, 8.0, 7.0, 9.0, 10.0, 22.0, 14.0, 33.0, 41.0, 51.0, 66.0, 93.0, 98.0, 144.0, 217.0, 388.0, 1046.0, 26141.0, 3107368.0, 8081.0, 707.0, 317.0, 195.0, 164.0, 127.0, 66.0, 69.0, 62.0, 27.0, 33.0, 19.0, 21.0, 14.0, 9.0, 7.0, 13.0, 1.0, 2.0, 7.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-156.375, -151.392578125, -146.41015625, -141.427734375, -136.4453125, -131.462890625, -126.48046875, -121.498046875, -116.515625, -111.533203125, -106.55078125, -101.568359375, -96.5859375, -91.603515625, -86.62109375, -81.638671875, -76.65625, -71.673828125, -66.69140625, -61.708984375, -56.7265625, -51.744140625, -46.76171875, -41.779296875, -36.796875, -31.814453125, -26.83203125, -21.849609375, -16.8671875, -11.884765625, -6.90234375, -1.919921875, 3.0625, 8.044921875, 13.02734375, 18.009765625, 22.9921875, 27.974609375, 32.95703125, 37.939453125, 42.921875, 47.904296875, 52.88671875, 57.869140625, 62.8515625, 67.833984375, 72.81640625, 77.798828125, 82.78125, 87.763671875, 92.74609375, 97.728515625, 102.7109375, 107.693359375, 112.67578125, 117.658203125, 122.640625, 127.623046875, 132.60546875, 137.587890625, 142.5703125, 147.552734375, 152.53515625, 157.517578125, 162.5]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 9.0, 12.0, 22.0, 36.0, 66.0, 113.0, 183.0, 191.0, 167.0, 112.0, 56.0, 24.0, 14.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-101.19904327392578, -98.8675537109375, -96.53605651855469, -94.2045669555664, -91.8730697631836, -89.54158020019531, -87.2100830078125, -84.87859344482422, -82.54710388183594, -80.21561431884766, -77.88411712646484, -75.55262756347656, -73.22113037109375, -70.88964080810547, -68.55815124511719, -66.22665405273438, -63.89516067504883, -61.56366729736328, -59.232173919677734, -56.90068054199219, -54.569190979003906, -52.23769760131836, -49.90620422363281, -47.57471466064453, -45.24321746826172, -42.91172409057617, -40.580230712890625, -38.248741149902344, -35.9172477722168, -33.58575439453125, -31.254261016845703, -28.92276954650879, -26.59127426147461, -24.259780883789062, -21.92828941345215, -19.5967960357666, -17.265304565429688, -14.93381118774414, -12.602317810058594, -10.27082633972168, -7.939332962036133, -5.607840538024902, -3.2763476371765137, -0.944854736328125, 1.3866376876831055, 3.718130111694336, 6.049623489379883, 8.381114959716797, 10.712608337402344, 13.044100761413574, 15.375593185424805, 17.70708656311035, 20.038578033447266, 22.370071411132812, 24.70156478881836, 27.033056259155273, 29.36454963684082, 31.696043014526367, 34.02753448486328, 36.35902786254883, 38.690521240234375, 41.022010803222656, 43.35350799560547, 45.68499755859375, 48.0164909362793]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 5.0, 3.0, 8.0, 6.0, 4.0, 12.0, 15.0, 25.0, 16.0, 24.0, 25.0, 22.0, 29.0, 30.0, 29.0, 36.0, 41.0, 47.0, 53.0, 48.0, 40.0, 48.0, 35.0, 37.0, 34.0, 36.0, 21.0, 46.0, 41.0, 22.0, 22.0, 19.0, 19.0, 17.0, 18.0, 16.0, 13.0, 8.0, 14.0, 8.0, 2.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-175.55494689941406, -170.40106201171875, -165.24716186523438, -160.09326171875, -154.9393768310547, -149.78549194335938, -144.631591796875, -139.47769165039062, -134.3238067626953, -129.169921875, -124.01602172851562, -118.86212921142578, -113.70823669433594, -108.5543441772461, -103.40045166015625, -98.2465591430664, -93.09266662597656, -87.93877410888672, -82.78488159179688, -77.63098907470703, -72.47709655761719, -67.32320404052734, -62.1693115234375, -57.015419006347656, -51.86152648925781, -46.70763397216797, -41.553741455078125, -36.39984893798828, -31.245956420898438, -26.092063903808594, -20.93817138671875, -15.784278869628906, -10.630386352539062, -5.476493835449219, -0.322601318359375, 4.831291198730469, 9.985183715820312, 15.139076232910156, 20.29296875, 25.446861267089844, 30.600753784179688, 35.75464630126953, 40.908538818359375, 46.06243133544922, 51.21632385253906, 56.370216369628906, 61.52410888671875, 66.6780014038086, 71.83189392089844, 76.98578643798828, 82.13967895507812, 87.29357147216797, 92.44746398925781, 97.60135650634766, 102.7552490234375, 107.90914154052734, 113.06303405761719, 118.21692657470703, 123.37081909179688, 128.52471923828125, 133.67860412597656, 138.83248901367188, 143.98638916015625, 149.14028930664062, 154.29417419433594]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 4.0, 6.0, 5.0, 7.0, 2.0, 10.0, 7.0, 16.0, 13.0, 16.0, 16.0, 24.0, 14.0, 33.0, 19.0, 35.0, 41.0, 39.0, 35.0, 43.0, 51.0, 46.0, 45.0, 49.0, 35.0, 42.0, 33.0, 41.0, 40.0, 28.0, 29.0, 20.0, 34.0, 18.0, 16.0, 22.0, 14.0, 18.0, 8.0, 6.0, 5.0, 5.0, 4.0, 5.0, 3.0, 0.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.796875, -22.02685546875, -21.2568359375, -20.48681640625, -19.716796875, -18.94677734375, -18.1767578125, -17.40673828125, -16.63671875, -15.86669921875, -15.0966796875, -14.32666015625, -13.556640625, -12.78662109375, -12.0166015625, -11.24658203125, -10.4765625, -9.70654296875, -8.9365234375, -8.16650390625, -7.396484375, -6.62646484375, -5.8564453125, -5.08642578125, -4.31640625, -3.54638671875, -2.7763671875, -2.00634765625, -1.236328125, -0.46630859375, 0.3037109375, 1.07373046875, 1.84375, 2.61376953125, 3.3837890625, 4.15380859375, 4.923828125, 5.69384765625, 6.4638671875, 7.23388671875, 8.00390625, 8.77392578125, 9.5439453125, 10.31396484375, 11.083984375, 11.85400390625, 12.6240234375, 13.39404296875, 14.1640625, 14.93408203125, 15.7041015625, 16.47412109375, 17.244140625, 18.01416015625, 18.7841796875, 19.55419921875, 20.32421875, 21.09423828125, 21.8642578125, 22.63427734375, 23.404296875, 24.17431640625, 24.9443359375, 25.71435546875, 26.484375]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 7.0, 6.0, 5.0, 10.0, 7.0, 20.0, 20.0, 19.0, 34.0, 39.0, 52.0, 71.0, 85.0, 170.0, 274.0, 477.0, 1065.0, 2764.0, 10552.0, 304313.0, 3736005.0, 125767.0, 7934.0, 2334.0, 986.0, 467.0, 253.0, 161.0, 84.0, 67.0, 57.0, 44.0, 27.0, 30.0, 19.0, 13.0, 8.0, 8.0, 5.0, 7.0, 4.0, 5.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-79.625, -76.9169921875, -74.208984375, -71.5009765625, -68.79296875, -66.0849609375, -63.376953125, -60.6689453125, -57.9609375, -55.2529296875, -52.544921875, -49.8369140625, -47.12890625, -44.4208984375, -41.712890625, -39.0048828125, -36.296875, -33.5888671875, -30.880859375, -28.1728515625, -25.46484375, -22.7568359375, -20.048828125, -17.3408203125, -14.6328125, -11.9248046875, -9.216796875, -6.5087890625, -3.80078125, -1.0927734375, 1.615234375, 4.3232421875, 7.03125, 9.7392578125, 12.447265625, 15.1552734375, 17.86328125, 20.5712890625, 23.279296875, 25.9873046875, 28.6953125, 31.4033203125, 34.111328125, 36.8193359375, 39.52734375, 42.2353515625, 44.943359375, 47.6513671875, 50.359375, 53.0673828125, 55.775390625, 58.4833984375, 61.19140625, 63.8994140625, 66.607421875, 69.3154296875, 72.0234375, 74.7314453125, 77.439453125, 80.1474609375, 82.85546875, 85.5634765625, 88.271484375, 90.9794921875, 93.6875]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 3.0, 2.0, 11.0, 6.0, 6.0, 8.0, 9.0, 22.0, 28.0, 26.0, 57.0, 115.0, 211.0, 390.0, 847.0, 1030.0, 619.0, 310.0, 122.0, 92.0, 44.0, 26.0, 21.0, 23.0, 15.0, 8.0, 8.0, 3.0, 4.0, 5.0, 5.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-72.0, -70.255859375, -68.51171875, -66.767578125, -65.0234375, -63.279296875, -61.53515625, -59.791015625, -58.046875, -56.302734375, -54.55859375, -52.814453125, -51.0703125, -49.326171875, -47.58203125, -45.837890625, -44.09375, -42.349609375, -40.60546875, -38.861328125, -37.1171875, -35.373046875, -33.62890625, -31.884765625, -30.140625, -28.396484375, -26.65234375, -24.908203125, -23.1640625, -21.419921875, -19.67578125, -17.931640625, -16.1875, -14.443359375, -12.69921875, -10.955078125, -9.2109375, -7.466796875, -5.72265625, -3.978515625, -2.234375, -0.490234375, 1.25390625, 2.998046875, 4.7421875, 6.486328125, 8.23046875, 9.974609375, 11.71875, 13.462890625, 15.20703125, 16.951171875, 18.6953125, 20.439453125, 22.18359375, 23.927734375, 25.671875, 27.416015625, 29.16015625, 30.904296875, 32.6484375, 34.392578125, 36.13671875, 37.880859375, 39.625]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 6.0, 4.0, 6.0, 2.0, 8.0, 11.0, 13.0, 16.0, 28.0, 41.0, 80.0, 143.0, 252.0, 720.0, 4355.0, 157686.0, 4015854.0, 12919.0, 1335.0, 397.0, 189.0, 77.0, 46.0, 23.0, 25.0, 14.0, 6.0, 7.0, 7.0, 8.0, 1.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-196.25, -187.79296875, -179.3359375, -170.87890625, -162.421875, -153.96484375, -145.5078125, -137.05078125, -128.59375, -120.13671875, -111.6796875, -103.22265625, -94.765625, -86.30859375, -77.8515625, -69.39453125, -60.9375, -52.48046875, -44.0234375, -35.56640625, -27.109375, -18.65234375, -10.1953125, -1.73828125, 6.71875, 15.17578125, 23.6328125, 32.08984375, 40.546875, 49.00390625, 57.4609375, 65.91796875, 74.375, 82.83203125, 91.2890625, 99.74609375, 108.203125, 116.66015625, 125.1171875, 133.57421875, 142.03125, 150.48828125, 158.9453125, 167.40234375, 175.859375, 184.31640625, 192.7734375, 201.23046875, 209.6875, 218.14453125, 226.6015625, 235.05859375, 243.515625, 251.97265625, 260.4296875, 268.88671875, 277.34375, 285.80078125, 294.2578125, 302.71484375, 311.171875, 319.62890625, 328.0859375, 336.54296875, 345.0]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 9.0, 18.0, 47.0, 99.0, 272.0, 319.0, 149.0, 50.0, 28.0, 7.0, 11.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-116.67606353759766, -105.22722625732422, -93.77838897705078, -82.32955932617188, -70.88072204589844, -59.431880950927734, -47.98304748535156, -36.534210205078125, -25.085372924804688, -13.636536598205566, -2.1877002716064453, 9.26113510131836, 20.709972381591797, 32.158809661865234, 43.607643127441406, 55.056480407714844, 66.50531768798828, 77.95415496826172, 89.40299224853516, 100.85182189941406, 112.3006591796875, 123.74949645996094, 135.19833374023438, 146.6471710205078, 158.09600830078125, 169.5448455810547, 180.99368286132812, 192.44252014160156, 203.891357421875, 215.34019470214844, 226.78903198242188, 238.23785400390625, 249.68667602539062, 261.135498046875, 272.5843505859375, 284.0331726074219, 295.4820251464844, 306.93084716796875, 318.37969970703125, 329.8285217285156, 341.2773742675781, 352.7261962890625, 364.175048828125, 375.6238708496094, 387.0727233886719, 398.52154541015625, 409.97039794921875, 421.4192199707031, 432.8680419921875, 444.3168640136719, 455.7657165527344, 467.21453857421875, 478.66339111328125, 490.1122131347656, 501.5610656738281, 513.0098876953125, 524.458740234375, 535.9075927734375, 547.3563842773438, 558.8052368164062, 570.2540893554688, 581.7029418945312, 593.1517333984375, 604.6005859375, 616.0494384765625]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 6.0, 4.0, 7.0, 14.0, 7.0, 10.0, 17.0, 14.0, 13.0, 19.0, 16.0, 24.0, 29.0, 29.0, 33.0, 37.0, 35.0, 40.0, 36.0, 36.0, 30.0, 29.0, 36.0, 46.0, 37.0, 45.0, 39.0, 32.0, 32.0, 34.0, 24.0, 34.0, 25.0, 21.0, 17.0, 15.0, 11.0, 19.0, 12.0, 10.0, 7.0, 7.0, 6.0, 6.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-123.71678161621094, -120.2337417602539, -116.75070190429688, -113.26766204833984, -109.78462219238281, -106.30157470703125, -102.81854248046875, -99.33549499511719, -95.85245513916016, -92.36941528320312, -88.8863754272461, -85.40333557128906, -81.92029571533203, -78.437255859375, -74.95420837402344, -71.4711685180664, -67.98812866210938, -64.50508880615234, -61.02204895019531, -57.53900909423828, -54.055965423583984, -50.57292556762695, -47.08988571166992, -43.606842041015625, -40.123809814453125, -36.640769958496094, -33.15773010253906, -29.6746883392334, -26.191646575927734, -22.708606719970703, -19.225566864013672, -15.742525100708008, -12.259483337402344, -8.776442527770996, -5.293402194976807, -1.8103618621826172, 1.6726789474487305, 5.155719757080078, 8.63875961303711, 12.121801376342773, 15.604841232299805, 19.087881088256836, 22.5709228515625, 26.05396270751953, 29.537002563476562, 33.020042419433594, 36.503082275390625, 39.98612594604492, 43.46916580200195, 46.952205657958984, 50.435245513916016, 53.91828918457031, 57.401329040527344, 60.884368896484375, 64.3674087524414, 67.85044860839844, 71.33348846435547, 74.8165283203125, 78.29956817626953, 81.78260803222656, 85.2656478881836, 88.74868774414062, 92.23173522949219, 95.71477508544922, 99.19781494140625]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 11.0, 8.0, 7.0, 7.0, 14.0, 11.0, 19.0, 23.0, 10.0, 16.0, 28.0, 37.0, 29.0, 43.0, 38.0, 27.0, 36.0, 53.0, 46.0, 38.0, 39.0, 42.0, 42.0, 38.0, 44.0, 36.0, 31.0, 29.0, 27.0, 23.0, 25.0, 23.0, 25.0, 11.0, 17.0, 8.0, 12.0, 7.0, 3.0, 6.0, 2.0, 3.0, 2.0, 1.0, 4.0, 2.0, 4.0, 0.0, 0.0, 0.0, 3.0], "bins": [-25.234375, -24.470947265625, -23.70751953125, -22.944091796875, -22.1806640625, -21.417236328125, -20.65380859375, -19.890380859375, -19.126953125, -18.363525390625, -17.60009765625, -16.836669921875, -16.0732421875, -15.309814453125, -14.54638671875, -13.782958984375, -13.01953125, -12.256103515625, -11.49267578125, -10.729248046875, -9.9658203125, -9.202392578125, -8.43896484375, -7.675537109375, -6.912109375, -6.148681640625, -5.38525390625, -4.621826171875, -3.8583984375, -3.094970703125, -2.33154296875, -1.568115234375, -0.8046875, -0.041259765625, 0.72216796875, 1.485595703125, 2.2490234375, 3.012451171875, 3.77587890625, 4.539306640625, 5.302734375, 6.066162109375, 6.82958984375, 7.593017578125, 8.3564453125, 9.119873046875, 9.88330078125, 10.646728515625, 11.41015625, 12.173583984375, 12.93701171875, 13.700439453125, 14.4638671875, 15.227294921875, 15.99072265625, 16.754150390625, 17.517578125, 18.281005859375, 19.04443359375, 19.807861328125, 20.5712890625, 21.334716796875, 22.09814453125, 22.861572265625, 23.625]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 9.0, 12.0, 16.0, 28.0, 37.0, 59.0, 72.0, 112.0, 156.0, 228.0, 330.0, 469.0, 684.0, 1041.0, 1419.0, 2082.0, 3021.0, 4607.0, 6762.0, 10314.0, 15848.0, 24395.0, 38287.0, 61443.0, 100068.0, 168147.0, 215668.0, 149730.0, 89831.0, 54813.0, 34180.0, 21844.0, 14232.0, 9347.0, 6213.0, 4176.0, 2741.0, 1911.0, 1285.0, 879.0, 584.0, 432.0, 309.0, 211.0, 163.0, 118.0, 76.0, 52.0, 39.0, 27.0, 22.0, 8.0, 10.0, 5.0, 6.0, 4.0, 1.0, 2.0], "bins": [-1.1171875, -1.0826873779296875, -1.048187255859375, -1.0136871337890625, -0.97918701171875, -0.9446868896484375, -0.910186767578125, -0.8756866455078125, -0.8411865234375, -0.8066864013671875, -0.772186279296875, -0.7376861572265625, -0.70318603515625, -0.6686859130859375, -0.634185791015625, -0.5996856689453125, -0.565185546875, -0.5306854248046875, -0.496185302734375, -0.4616851806640625, -0.42718505859375, -0.3926849365234375, -0.358184814453125, -0.3236846923828125, -0.2891845703125, -0.2546844482421875, -0.220184326171875, -0.1856842041015625, -0.15118408203125, -0.1166839599609375, -0.082183837890625, -0.0476837158203125, -0.01318359375, 0.0213165283203125, 0.055816650390625, 0.0903167724609375, 0.12481689453125, 0.1593170166015625, 0.193817138671875, 0.2283172607421875, 0.2628173828125, 0.2973175048828125, 0.331817626953125, 0.3663177490234375, 0.40081787109375, 0.4353179931640625, 0.469818115234375, 0.5043182373046875, 0.538818359375, 0.5733184814453125, 0.607818603515625, 0.6423187255859375, 0.67681884765625, 0.7113189697265625, 0.745819091796875, 0.7803192138671875, 0.8148193359375, 0.8493194580078125, 0.883819580078125, 0.9183197021484375, 0.95281982421875, 0.9873199462890625, 1.021820068359375, 1.0563201904296875, 1.0908203125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 9.0, 6.0, 6.0, 5.0, 4.0, 11.0, 12.0, 13.0, 15.0, 16.0, 24.0, 18.0, 23.0, 23.0, 26.0, 30.0, 36.0, 38.0, 45.0, 44.0, 39.0, 51.0, 1066.0, 41.0, 38.0, 38.0, 27.0, 44.0, 35.0, 18.0, 20.0, 27.0, 32.0, 19.0, 14.0, 20.0, 19.0, 14.0, 10.0, 13.0, 4.0, 8.0, 6.0, 4.0, 8.0, 1.0, 7.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-15.03125, -14.556640625, -14.08203125, -13.607421875, -13.1328125, -12.658203125, -12.18359375, -11.708984375, -11.234375, -10.759765625, -10.28515625, -9.810546875, -9.3359375, -8.861328125, -8.38671875, -7.912109375, -7.4375, -6.962890625, -6.48828125, -6.013671875, -5.5390625, -5.064453125, -4.58984375, -4.115234375, -3.640625, -3.166015625, -2.69140625, -2.216796875, -1.7421875, -1.267578125, -0.79296875, -0.318359375, 0.15625, 0.630859375, 1.10546875, 1.580078125, 2.0546875, 2.529296875, 3.00390625, 3.478515625, 3.953125, 4.427734375, 4.90234375, 5.376953125, 5.8515625, 6.326171875, 6.80078125, 7.275390625, 7.75, 8.224609375, 8.69921875, 9.173828125, 9.6484375, 10.123046875, 10.59765625, 11.072265625, 11.546875, 12.021484375, 12.49609375, 12.970703125, 13.4453125, 13.919921875, 14.39453125, 14.869140625, 15.34375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 3.0, 6.0, 6.0, 13.0, 18.0, 20.0, 41.0, 83.0, 90.0, 128.0, 182.0, 272.0, 382.0, 529.0, 742.0, 1035.0, 1417.0, 1942.0, 2738.0, 3824.0, 5263.0, 7365.0, 10245.0, 14647.0, 21097.0, 31263.0, 47816.0, 76874.0, 126228.0, 1229350.0, 192514.0, 113530.0, 68809.0, 43502.0, 28498.0, 19228.0, 13644.0, 9632.0, 6676.0, 4949.0, 3502.0, 2593.0, 1750.0, 1383.0, 970.0, 699.0, 505.0, 351.0, 252.0, 188.0, 105.0, 73.0, 64.0, 41.0, 25.0, 18.0, 10.0, 5.0, 6.0, 2.0, 2.0], "bins": [-0.9111328125, -0.8834304809570312, -0.8557281494140625, -0.8280258178710938, -0.800323486328125, -0.7726211547851562, -0.7449188232421875, -0.7172164916992188, -0.68951416015625, -0.6618118286132812, -0.6341094970703125, -0.6064071655273438, -0.578704833984375, -0.5510025024414062, -0.5233001708984375, -0.49559783935546875, -0.4678955078125, -0.44019317626953125, -0.4124908447265625, -0.38478851318359375, -0.357086181640625, -0.32938385009765625, -0.3016815185546875, -0.27397918701171875, -0.24627685546875, -0.21857452392578125, -0.1908721923828125, -0.16316986083984375, -0.135467529296875, -0.10776519775390625, -0.0800628662109375, -0.05236053466796875, -0.024658203125, 0.00304412841796875, 0.0307464599609375, 0.05844879150390625, 0.086151123046875, 0.11385345458984375, 0.1415557861328125, 0.16925811767578125, 0.19696044921875, 0.22466278076171875, 0.2523651123046875, 0.28006744384765625, 0.307769775390625, 0.33547210693359375, 0.3631744384765625, 0.39087677001953125, 0.4185791015625, 0.44628143310546875, 0.4739837646484375, 0.5016860961914062, 0.529388427734375, 0.5570907592773438, 0.5847930908203125, 0.6124954223632812, 0.64019775390625, 0.6679000854492188, 0.6956024169921875, 0.7233047485351562, 0.751007080078125, 0.7787094116210938, 0.8064117431640625, 0.8341140747070312, 0.86181640625]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 4.0, 3.0, 2.0, 7.0, 7.0, 7.0, 13.0, 11.0, 22.0, 10.0, 14.0, 19.0, 25.0, 32.0, 42.0, 45.0, 71.0, 67.0, 66.0, 66.0, 54.0, 68.0, 61.0, 58.0, 48.0, 34.0, 25.0, 23.0, 21.0, 10.0, 21.0, 15.0, 6.0, 3.0, 9.0, 6.0, 0.0, 4.0, 2.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007076263427734375, -0.006861269474029541, -0.006646275520324707, -0.006431281566619873, -0.006216287612915039, -0.006001293659210205, -0.005786299705505371, -0.005571305751800537, -0.005356311798095703, -0.005141317844390869, -0.004926323890686035, -0.004711329936981201, -0.004496335983276367, -0.004281342029571533, -0.004066348075866699, -0.0038513541221618652, -0.0036363601684570312, -0.0034213662147521973, -0.0032063722610473633, -0.0029913783073425293, -0.0027763843536376953, -0.0025613903999328613, -0.0023463964462280273, -0.0021314024925231934, -0.0019164085388183594, -0.0017014145851135254, -0.0014864206314086914, -0.0012714266777038574, -0.0010564327239990234, -0.0008414387702941895, -0.0006264448165893555, -0.0004114508628845215, -0.0001964569091796875, 1.8537044525146484e-05, 0.00023353099822998047, 0.00044852495193481445, 0.0006635189056396484, 0.0008785128593444824, 0.0010935068130493164, 0.0013085007667541504, 0.0015234947204589844, 0.0017384886741638184, 0.0019534826278686523, 0.0021684765815734863, 0.0023834705352783203, 0.0025984644889831543, 0.0028134584426879883, 0.0030284523963928223, 0.0032434463500976562, 0.0034584403038024902, 0.0036734342575073242, 0.003888428211212158, 0.004103422164916992, 0.004318416118621826, 0.00453341007232666, 0.004748404026031494, 0.004963397979736328, 0.005178391933441162, 0.005393385887145996, 0.00560837984085083, 0.005823373794555664, 0.006038367748260498, 0.006253361701965332, 0.006468355655670166, 0.006683349609375]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 3.0, 8.0, 7.0, 3.0, 12.0, 13.0, 19.0, 27.0, 35.0, 40.0, 60.0, 79.0, 122.0, 234.0, 592.0, 21523.0, 1020840.0, 3827.0, 447.0, 219.0, 98.0, 73.0, 73.0, 45.0, 34.0, 19.0, 15.0, 18.0, 17.0, 10.0, 7.0, 10.0, 3.0, 4.0, 4.0, 1.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1536865234375, -0.1487865447998047, -0.14388656616210938, -0.13898658752441406, -0.13408660888671875, -0.12918663024902344, -0.12428665161132812, -0.11938667297363281, -0.1144866943359375, -0.10958671569824219, -0.10468673706054688, -0.09978675842285156, -0.09488677978515625, -0.08998680114746094, -0.08508682250976562, -0.08018684387207031, -0.075286865234375, -0.07038688659667969, -0.06548690795898438, -0.06058692932128906, -0.05568695068359375, -0.05078697204589844, -0.045886993408203125, -0.04098701477050781, -0.0360870361328125, -0.031187057495117188, -0.026287078857421875, -0.021387100219726562, -0.01648712158203125, -0.011587142944335938, -0.006687164306640625, -0.0017871856689453125, 0.00311279296875, 0.008012771606445312, 0.012912750244140625, 0.017812728881835938, 0.02271270751953125, 0.027612686157226562, 0.032512664794921875, 0.03741264343261719, 0.0423126220703125, 0.04721260070800781, 0.052112579345703125, 0.05701255798339844, 0.06191253662109375, 0.06681251525878906, 0.07171249389648438, 0.07661247253417969, 0.081512451171875, 0.08641242980957031, 0.09131240844726562, 0.09621238708496094, 0.10111236572265625, 0.10601234436035156, 0.11091232299804688, 0.11581230163574219, 0.1207122802734375, 0.1256122589111328, 0.13051223754882812, 0.13541221618652344, 0.14031219482421875, 0.14521217346191406, 0.15011215209960938, 0.1550121307373047, 0.159912109375]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 16.0, 987.0, 17.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1968686878681183, -0.19332051277160645, -0.1897723376750946, -0.18622416257858276, -0.18267600238323212, -0.17912782728672028, -0.17557965219020844, -0.1720314770936966, -0.16848330199718475, -0.1649351269006729, -0.16138695180416107, -0.15783877670764923, -0.15429061651229858, -0.15074244141578674, -0.1471942663192749, -0.14364609122276306, -0.14009791612625122, -0.13654974102973938, -0.13300156593322754, -0.1294533908367157, -0.12590523064136505, -0.12235705554485321, -0.11880888044834137, -0.11526070535182953, -0.11171253770589828, -0.10816436260938644, -0.1046161949634552, -0.10106801986694336, -0.09751984477043152, -0.09397166967391968, -0.09042350202798843, -0.08687532693147659, -0.08332715183496475, -0.07977897673845291, -0.07623080909252167, -0.07268263399600983, -0.06913445889949799, -0.06558628380298615, -0.0620381161570549, -0.05848994106054306, -0.05494176968932152, -0.051393598318099976, -0.047845423221588135, -0.04429725185036659, -0.04074907675385475, -0.03720090538263321, -0.03365273028612137, -0.030104558914899826, -0.026556385681033134, -0.023008212447166443, -0.01946003921329975, -0.01591186597943306, -0.012363693676888943, -0.008815521374344826, -0.005267348140478134, -0.0017191749066114426, 0.001828998327255249, 0.005377171561121941, 0.008925344794988632, 0.01247351709753275, 0.016021691262722015, 0.019569862633943558, 0.02311803586781025, 0.02666620910167694, 0.030214382335543633]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 4.0, 9.0, 8.0, 8.0, 14.0, 24.0, 17.0, 31.0, 33.0, 35.0, 48.0, 50.0, 41.0, 42.0, 51.0, 52.0, 52.0, 62.0, 57.0, 51.0, 56.0, 40.0, 31.0, 39.0, 36.0, 24.0, 25.0, 15.0, 12.0, 15.0, 8.0, 5.0, 4.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004563271999359131, -0.004379077814519405, -0.00419488362967968, -0.004010689444839954, -0.003826495260000229, -0.0036423010751605034, -0.003458106890320778, -0.0032739127054810524, -0.003089718520641327, -0.0029055243358016014, -0.002721330150961876, -0.0025371359661221504, -0.002352941781282425, -0.0021687475964426994, -0.001984553411602974, -0.0018003592267632484, -0.001616165041923523, -0.0014319708570837975, -0.001247776672244072, -0.0010635824874043465, -0.000879388302564621, -0.0006951941177248955, -0.00051099993288517, -0.0003268057480454445, -0.000142611563205719, 4.15826216340065e-05, 0.000225776806473732, 0.0004099709913134575, 0.000594165176153183, 0.0007783593609929085, 0.000962553545832634, 0.0011467477306723595, 0.001330941915512085, 0.0015151361003518105, 0.001699330285191536, 0.0018835244700312614, 0.002067718654870987, 0.0022519128397107124, 0.002436107024550438, 0.0026203012093901634, 0.002804495394229889, 0.0029886895790696144, 0.00317288376390934, 0.0033570779487490654, 0.003541272133588791, 0.0037254663184285164, 0.003909660503268242, 0.004093854688107967, 0.004278048872947693, 0.004462243057787418, 0.004646437242627144, 0.004830631427466869, 0.005014825612306595, 0.00519901979714632, 0.005383213981986046, 0.005567408166825771, 0.005751602351665497, 0.005935796536505222, 0.006119990721344948, 0.006304184906184673, 0.006488379091024399, 0.006672573275864124, 0.00685676746070385, 0.007040961645543575, 0.007225155830383301]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 11.0, 8.0, 7.0, 7.0, 14.0, 11.0, 19.0, 23.0, 10.0, 16.0, 28.0, 37.0, 29.0, 43.0, 38.0, 27.0, 36.0, 53.0, 46.0, 38.0, 39.0, 42.0, 42.0, 38.0, 44.0, 36.0, 31.0, 29.0, 27.0, 23.0, 25.0, 23.0, 25.0, 11.0, 17.0, 8.0, 12.0, 7.0, 3.0, 6.0, 2.0, 3.0, 2.0, 1.0, 4.0, 2.0, 4.0, 0.0, 0.0, 0.0, 3.0], "bins": [-25.234375, -24.470947265625, -23.70751953125, -22.944091796875, -22.1806640625, -21.417236328125, -20.65380859375, -19.890380859375, -19.126953125, -18.363525390625, -17.60009765625, -16.836669921875, -16.0732421875, -15.309814453125, -14.54638671875, -13.782958984375, -13.01953125, -12.256103515625, -11.49267578125, -10.729248046875, -9.9658203125, -9.202392578125, -8.43896484375, -7.675537109375, -6.912109375, -6.148681640625, -5.38525390625, -4.621826171875, -3.8583984375, -3.094970703125, -2.33154296875, -1.568115234375, -0.8046875, -0.041259765625, 0.72216796875, 1.485595703125, 2.2490234375, 3.012451171875, 3.77587890625, 4.539306640625, 5.302734375, 6.066162109375, 6.82958984375, 7.593017578125, 8.3564453125, 9.119873046875, 9.88330078125, 10.646728515625, 11.41015625, 12.173583984375, 12.93701171875, 13.700439453125, 14.4638671875, 15.227294921875, 15.99072265625, 16.754150390625, 17.517578125, 18.281005859375, 19.04443359375, 19.807861328125, 20.5712890625, 21.334716796875, 22.09814453125, 22.861572265625, 23.625]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 15.0, 11.0, 6.0, 14.0, 21.0, 18.0, 37.0, 46.0, 41.0, 71.0, 107.0, 160.0, 226.0, 431.0, 728.0, 1190.0, 2474.0, 6099.0, 25561.0, 401187.0, 567800.0, 29817.0, 6594.0, 2612.0, 1281.0, 744.0, 443.0, 245.0, 176.0, 107.0, 72.0, 55.0, 45.0, 23.0, 25.0, 12.0, 16.0, 12.0, 8.0, 7.0, 3.0, 5.0, 2.0, 2.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 3.0], "bins": [-45.21875, -43.85009765625, -42.4814453125, -41.11279296875, -39.744140625, -38.37548828125, -37.0068359375, -35.63818359375, -34.26953125, -32.90087890625, -31.5322265625, -30.16357421875, -28.794921875, -27.42626953125, -26.0576171875, -24.68896484375, -23.3203125, -21.95166015625, -20.5830078125, -19.21435546875, -17.845703125, -16.47705078125, -15.1083984375, -13.73974609375, -12.37109375, -11.00244140625, -9.6337890625, -8.26513671875, -6.896484375, -5.52783203125, -4.1591796875, -2.79052734375, -1.421875, -0.05322265625, 1.3154296875, 2.68408203125, 4.052734375, 5.42138671875, 6.7900390625, 8.15869140625, 9.52734375, 10.89599609375, 12.2646484375, 13.63330078125, 15.001953125, 16.37060546875, 17.7392578125, 19.10791015625, 20.4765625, 21.84521484375, 23.2138671875, 24.58251953125, 25.951171875, 27.31982421875, 28.6884765625, 30.05712890625, 31.42578125, 32.79443359375, 34.1630859375, 35.53173828125, 36.900390625, 38.26904296875, 39.6376953125, 41.00634765625, 42.375]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 3.0, 0.0, 2.0, 9.0, 8.0, 12.0, 9.0, 4.0, 17.0, 13.0, 20.0, 17.0, 19.0, 37.0, 43.0, 38.0, 48.0, 42.0, 55.0, 94.0, 158.0, 1822.0, 132.0, 57.0, 60.0, 51.0, 59.0, 34.0, 31.0, 28.0, 23.0, 16.0, 26.0, 17.0, 12.0, 8.0, 8.0, 7.0, 3.0, 6.0, 2.0, 3.0, 2.0, 0.0, 2.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.59375, -57.14306640625, -54.6923828125, -52.24169921875, -49.791015625, -47.34033203125, -44.8896484375, -42.43896484375, -39.98828125, -37.53759765625, -35.0869140625, -32.63623046875, -30.185546875, -27.73486328125, -25.2841796875, -22.83349609375, -20.3828125, -17.93212890625, -15.4814453125, -13.03076171875, -10.580078125, -8.12939453125, -5.6787109375, -3.22802734375, -0.77734375, 1.67333984375, 4.1240234375, 6.57470703125, 9.025390625, 11.47607421875, 13.9267578125, 16.37744140625, 18.828125, 21.27880859375, 23.7294921875, 26.18017578125, 28.630859375, 31.08154296875, 33.5322265625, 35.98291015625, 38.43359375, 40.88427734375, 43.3349609375, 45.78564453125, 48.236328125, 50.68701171875, 53.1376953125, 55.58837890625, 58.0390625, 60.48974609375, 62.9404296875, 65.39111328125, 67.841796875, 70.29248046875, 72.7431640625, 75.19384765625, 77.64453125, 80.09521484375, 82.5458984375, 84.99658203125, 87.447265625, 89.89794921875, 92.3486328125, 94.79931640625, 97.25]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 0.0, 3.0, 2.0, 3.0, 4.0, 3.0, 6.0, 8.0, 12.0, 9.0, 21.0, 30.0, 24.0, 27.0, 41.0, 41.0, 87.0, 134.0, 200.0, 426.0, 1347.0, 64992.0, 3074270.0, 2688.0, 573.0, 245.0, 147.0, 98.0, 61.0, 51.0, 16.0, 29.0, 22.0, 17.0, 17.0, 8.0, 5.0, 14.0, 6.0, 11.0, 4.0, 1.0, 5.0, 2.0, 1.0, 1.0, 2.0], "bins": [-290.5, -283.083984375, -275.66796875, -268.251953125, -260.8359375, -253.419921875, -246.00390625, -238.587890625, -231.171875, -223.755859375, -216.33984375, -208.923828125, -201.5078125, -194.091796875, -186.67578125, -179.259765625, -171.84375, -164.427734375, -157.01171875, -149.595703125, -142.1796875, -134.763671875, -127.34765625, -119.931640625, -112.515625, -105.099609375, -97.68359375, -90.267578125, -82.8515625, -75.435546875, -68.01953125, -60.603515625, -53.1875, -45.771484375, -38.35546875, -30.939453125, -23.5234375, -16.107421875, -8.69140625, -1.275390625, 6.140625, 13.556640625, 20.97265625, 28.388671875, 35.8046875, 43.220703125, 50.63671875, 58.052734375, 65.46875, 72.884765625, 80.30078125, 87.716796875, 95.1328125, 102.548828125, 109.96484375, 117.380859375, 124.796875, 132.212890625, 139.62890625, 147.044921875, 154.4609375, 161.876953125, 169.29296875, 176.708984375, 184.125]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 19.0, 66.0, 259.0, 366.0, 219.0, 54.0, 17.0, 7.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-262.3897705078125, -257.3829040527344, -252.3760528564453, -247.36920166015625, -242.3623504638672, -237.35549926757812, -232.3486328125, -227.34178161621094, -222.33493041992188, -217.3280792236328, -212.3212127685547, -207.31436157226562, -202.30751037597656, -197.3006591796875, -192.29379272460938, -187.2869415283203, -182.2800750732422, -177.27322387695312, -172.266357421875, -167.25950622558594, -162.25265502929688, -157.24578857421875, -152.2389373779297, -147.23208618164062, -142.2252197265625, -137.21836853027344, -132.2115020751953, -127.20465087890625, -122.19779968261719, -117.1909408569336, -112.18408203125, -107.17723083496094, -102.17037963867188, -97.16352081298828, -92.15666961669922, -87.14981079101562, -82.14295959472656, -77.13610076904297, -72.12924194335938, -67.12239074707031, -62.11552810668945, -57.108673095703125, -52.10181427001953, -47.0949592590332, -42.088104248046875, -37.08124923706055, -32.07439422607422, -27.067535400390625, -22.060680389404297, -17.05382537841797, -12.046968460083008, -7.040112495422363, -2.0332565307617188, 2.9735984802246094, 7.98045539855957, 12.987312316894531, 17.99416732788086, 23.001022338867188, 28.00787925720215, 33.01473617553711, 38.02159118652344, 43.028446197509766, 48.035301208496094, 53.04216003417969, 58.049015045166016]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [2.0, 4.0, 0.0, 1.0, 3.0, 2.0, 3.0, 5.0, 3.0, 6.0, 11.0, 8.0, 19.0, 20.0, 22.0, 20.0, 17.0, 17.0, 22.0, 38.0, 37.0, 33.0, 34.0, 33.0, 49.0, 43.0, 39.0, 34.0, 41.0, 47.0, 40.0, 36.0, 43.0, 36.0, 27.0, 33.0, 23.0, 26.0, 27.0, 17.0, 14.0, 15.0, 7.0, 13.0, 7.0, 6.0, 7.0, 6.0, 6.0, 5.0, 3.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-168.46751403808594, -162.49844360351562, -156.52935791015625, -150.56027221679688, -144.59120178222656, -138.62213134765625, -132.65304565429688, -126.68396759033203, -120.71488952636719, -114.74581146240234, -108.7767333984375, -102.80765533447266, -96.83857727050781, -90.86949920654297, -84.90042114257812, -78.93134307861328, -72.96226501464844, -66.9931869506836, -61.02410888671875, -55.055030822753906, -49.08595275878906, -43.11687469482422, -37.147796630859375, -31.17871856689453, -25.209640502929688, -19.240562438964844, -13.271484375, -7.302406311035156, -1.3333282470703125, 4.635749816894531, 10.604827880859375, 16.57390594482422, 22.542999267578125, 28.51207733154297, 34.48115539550781, 40.450233459472656, 46.4193115234375, 52.388389587402344, 58.35746765136719, 64.32654571533203, 70.29562377929688, 76.26470184326172, 82.23377990722656, 88.2028579711914, 94.17193603515625, 100.1410140991211, 106.11009216308594, 112.07917022705078, 118.04824829101562, 124.01732635498047, 129.9864044189453, 135.95547485351562, 141.924560546875, 147.89364624023438, 153.8627166748047, 159.831787109375, 165.80087280273438, 171.76995849609375, 177.73902893066406, 183.70809936523438, 189.67718505859375, 195.64627075195312, 201.61534118652344, 207.58441162109375, 213.55349731445312]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 8.0, 5.0, 9.0, 6.0, 8.0, 8.0, 16.0, 12.0, 20.0, 15.0, 17.0, 24.0, 24.0, 34.0, 39.0, 38.0, 32.0, 44.0, 39.0, 43.0, 42.0, 45.0, 38.0, 34.0, 36.0, 40.0, 53.0, 28.0, 39.0, 25.0, 26.0, 26.0, 18.0, 27.0, 14.0, 14.0, 12.0, 13.0, 8.0, 4.0, 5.0, 3.0, 4.0, 3.0, 5.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-25.453125, -24.671630859375, -23.89013671875, -23.108642578125, -22.3271484375, -21.545654296875, -20.76416015625, -19.982666015625, -19.201171875, -18.419677734375, -17.63818359375, -16.856689453125, -16.0751953125, -15.293701171875, -14.51220703125, -13.730712890625, -12.94921875, -12.167724609375, -11.38623046875, -10.604736328125, -9.8232421875, -9.041748046875, -8.26025390625, -7.478759765625, -6.697265625, -5.915771484375, -5.13427734375, -4.352783203125, -3.5712890625, -2.789794921875, -2.00830078125, -1.226806640625, -0.4453125, 0.336181640625, 1.11767578125, 1.899169921875, 2.6806640625, 3.462158203125, 4.24365234375, 5.025146484375, 5.806640625, 6.588134765625, 7.36962890625, 8.151123046875, 8.9326171875, 9.714111328125, 10.49560546875, 11.277099609375, 12.05859375, 12.840087890625, 13.62158203125, 14.403076171875, 15.1845703125, 15.966064453125, 16.74755859375, 17.529052734375, 18.310546875, 19.092041015625, 19.87353515625, 20.655029296875, 21.4365234375, 22.218017578125, 22.99951171875, 23.781005859375, 24.5625]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 2.0, 3.0, 5.0, 13.0, 12.0, 17.0, 15.0, 27.0, 29.0, 49.0, 74.0, 97.0, 125.0, 165.0, 234.0, 373.0, 520.0, 857.0, 1527.0, 3031.0, 7190.0, 48787.0, 746124.0, 2984310.0, 365694.0, 22955.0, 5584.0, 2599.0, 1326.0, 806.0, 512.0, 335.0, 248.0, 154.0, 120.0, 91.0, 88.0, 47.0, 35.0, 22.0, 19.0, 14.0, 12.0, 13.0, 11.0, 4.0, 3.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-54.71875, -53.0283203125, -51.337890625, -49.6474609375, -47.95703125, -46.2666015625, -44.576171875, -42.8857421875, -41.1953125, -39.5048828125, -37.814453125, -36.1240234375, -34.43359375, -32.7431640625, -31.052734375, -29.3623046875, -27.671875, -25.9814453125, -24.291015625, -22.6005859375, -20.91015625, -19.2197265625, -17.529296875, -15.8388671875, -14.1484375, -12.4580078125, -10.767578125, -9.0771484375, -7.38671875, -5.6962890625, -4.005859375, -2.3154296875, -0.625, 1.0654296875, 2.755859375, 4.4462890625, 6.13671875, 7.8271484375, 9.517578125, 11.2080078125, 12.8984375, 14.5888671875, 16.279296875, 17.9697265625, 19.66015625, 21.3505859375, 23.041015625, 24.7314453125, 26.421875, 28.1123046875, 29.802734375, 31.4931640625, 33.18359375, 34.8740234375, 36.564453125, 38.2548828125, 39.9453125, 41.6357421875, 43.326171875, 45.0166015625, 46.70703125, 48.3974609375, 50.087890625, 51.7783203125, 53.46875]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 2.0, 4.0, 10.0, 10.0, 15.0, 34.0, 40.0, 49.0, 66.0, 132.0, 258.0, 487.0, 807.0, 852.0, 518.0, 299.0, 173.0, 80.0, 56.0, 37.0, 35.0, 32.0, 10.0, 17.0, 11.0, 8.0, 6.0, 5.0, 5.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.21875, -47.63671875, -46.0546875, -44.47265625, -42.890625, -41.30859375, -39.7265625, -38.14453125, -36.5625, -34.98046875, -33.3984375, -31.81640625, -30.234375, -28.65234375, -27.0703125, -25.48828125, -23.90625, -22.32421875, -20.7421875, -19.16015625, -17.578125, -15.99609375, -14.4140625, -12.83203125, -11.25, -9.66796875, -8.0859375, -6.50390625, -4.921875, -3.33984375, -1.7578125, -0.17578125, 1.40625, 2.98828125, 4.5703125, 6.15234375, 7.734375, 9.31640625, 10.8984375, 12.48046875, 14.0625, 15.64453125, 17.2265625, 18.80859375, 20.390625, 21.97265625, 23.5546875, 25.13671875, 26.71875, 28.30078125, 29.8828125, 31.46484375, 33.046875, 34.62890625, 36.2109375, 37.79296875, 39.375, 40.95703125, 42.5390625, 44.12109375, 45.703125, 47.28515625, 48.8671875, 50.44921875, 52.03125]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 6.0, 5.0, 1.0, 9.0, 4.0, 17.0, 11.0, 13.0, 21.0, 35.0, 59.0, 91.0, 140.0, 317.0, 795.0, 2780.0, 21223.0, 3834255.0, 322411.0, 9322.0, 1698.0, 562.0, 190.0, 133.0, 59.0, 52.0, 26.0, 13.0, 15.0, 5.0, 6.0, 3.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-186.625, -180.939453125, -175.25390625, -169.568359375, -163.8828125, -158.197265625, -152.51171875, -146.826171875, -141.140625, -135.455078125, -129.76953125, -124.083984375, -118.3984375, -112.712890625, -107.02734375, -101.341796875, -95.65625, -89.970703125, -84.28515625, -78.599609375, -72.9140625, -67.228515625, -61.54296875, -55.857421875, -50.171875, -44.486328125, -38.80078125, -33.115234375, -27.4296875, -21.744140625, -16.05859375, -10.373046875, -4.6875, 0.998046875, 6.68359375, 12.369140625, 18.0546875, 23.740234375, 29.42578125, 35.111328125, 40.796875, 46.482421875, 52.16796875, 57.853515625, 63.5390625, 69.224609375, 74.91015625, 80.595703125, 86.28125, 91.966796875, 97.65234375, 103.337890625, 109.0234375, 114.708984375, 120.39453125, 126.080078125, 131.765625, 137.451171875, 143.13671875, 148.822265625, 154.5078125, 160.193359375, 165.87890625, 171.564453125, 177.25]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 7.0, 21.0, 123.0, 420.0, 335.0, 85.0, 17.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-671.45751953125, -655.0128173828125, -638.5680541992188, -622.1233520507812, -605.6786499023438, -589.2339477539062, -572.7891845703125, -556.344482421875, -539.8997802734375, -523.455078125, -507.0103454589844, -490.56561279296875, -474.12091064453125, -457.6761779785156, -441.2314453125, -424.7867431640625, -408.3420104980469, -391.89727783203125, -375.45257568359375, -359.0078430175781, -342.5631408691406, -326.118408203125, -309.6737060546875, -293.2289733886719, -276.78424072265625, -260.3395080566406, -243.89480590820312, -227.4500732421875, -211.00537109375, -194.56063842773438, -178.1159210205078, -161.67120361328125, -145.22647094726562, -128.78175354003906, -112.3370361328125, -95.8923110961914, -79.44759368896484, -63.00287628173828, -46.55815124511719, -30.113433837890625, -13.668716430664062, 2.776002883911133, 19.220722198486328, 35.665443420410156, 52.11016082763672, 68.55487823486328, 84.99960327148438, 101.44432067871094, 117.8890380859375, 134.33375549316406, 150.77847290039062, 167.22320556640625, 183.66790771484375, 200.11264038085938, 216.55735778808594, 233.0020751953125, 249.44679260253906, 265.8915100097656, 282.33624267578125, 298.78094482421875, 315.2256774902344, 331.6703796386719, 348.1151123046875, 364.559814453125, 381.0045471191406]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 8.0, 4.0, 12.0, 5.0, 11.0, 18.0, 17.0, 21.0, 18.0, 24.0, 24.0, 30.0, 30.0, 28.0, 37.0, 38.0, 44.0, 33.0, 30.0, 51.0, 38.0, 46.0, 40.0, 43.0, 39.0, 34.0, 30.0, 33.0, 28.0, 29.0, 27.0, 18.0, 19.0, 14.0, 17.0, 14.0, 13.0, 6.0, 5.0, 4.0, 9.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-127.73908996582031, -124.02251434326172, -120.30593872070312, -116.58936309814453, -112.87278747558594, -109.15620422363281, -105.43963623046875, -101.72305297851562, -98.00647735595703, -94.28990173339844, -90.57332611083984, -86.85675048828125, -83.14017486572266, -79.42359924316406, -75.70701599121094, -71.99044036865234, -68.27386474609375, -64.55728912353516, -60.84071350097656, -57.12413787841797, -53.40755844116211, -49.690982818603516, -45.97440719604492, -42.25782775878906, -38.541259765625, -34.824684143066406, -31.10810661315918, -27.391530990600586, -23.67495346069336, -19.958377838134766, -16.241802215576172, -12.525224685668945, -8.808647155761719, -5.092070579528809, -1.3754944801330566, 2.3410816192626953, 6.0576581954956055, 9.774234771728516, 13.49081039428711, 17.207387924194336, 20.92396354675293, 24.640539169311523, 28.35711669921875, 32.073692321777344, 35.79026794433594, 39.50684356689453, 43.223419189453125, 46.939998626708984, 50.65657424926758, 54.37314987182617, 58.089725494384766, 61.806304931640625, 65.52288055419922, 69.23945617675781, 72.9560317993164, 76.672607421875, 80.3891830444336, 84.10575866699219, 87.82233428955078, 91.53890991210938, 95.25548553466797, 98.97206115722656, 102.68864440917969, 106.40522003173828, 110.12179565429688]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 6.0, 1.0, 2.0, 8.0, 5.0, 14.0, 7.0, 16.0, 12.0, 12.0, 15.0, 21.0, 17.0, 26.0, 30.0, 37.0, 36.0, 36.0, 27.0, 46.0, 48.0, 35.0, 46.0, 35.0, 58.0, 39.0, 36.0, 38.0, 36.0, 28.0, 34.0, 27.0, 27.0, 28.0, 23.0, 12.0, 20.0, 9.0, 8.0, 11.0, 6.0, 8.0, 5.0, 4.0, 5.0, 0.0, 7.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-25.65625, -24.90234375, -24.1484375, -23.39453125, -22.640625, -21.88671875, -21.1328125, -20.37890625, -19.625, -18.87109375, -18.1171875, -17.36328125, -16.609375, -15.85546875, -15.1015625, -14.34765625, -13.59375, -12.83984375, -12.0859375, -11.33203125, -10.578125, -9.82421875, -9.0703125, -8.31640625, -7.5625, -6.80859375, -6.0546875, -5.30078125, -4.546875, -3.79296875, -3.0390625, -2.28515625, -1.53125, -0.77734375, -0.0234375, 0.73046875, 1.484375, 2.23828125, 2.9921875, 3.74609375, 4.5, 5.25390625, 6.0078125, 6.76171875, 7.515625, 8.26953125, 9.0234375, 9.77734375, 10.53125, 11.28515625, 12.0390625, 12.79296875, 13.546875, 14.30078125, 15.0546875, 15.80859375, 16.5625, 17.31640625, 18.0703125, 18.82421875, 19.578125, 20.33203125, 21.0859375, 21.83984375, 22.59375]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 7.0, 12.0, 11.0, 20.0, 45.0, 54.0, 101.0, 131.0, 236.0, 327.0, 515.0, 850.0, 1348.0, 2048.0, 3301.0, 5173.0, 8273.0, 13853.0, 22706.0, 38835.0, 68331.0, 128413.0, 236255.0, 232152.0, 123512.0, 66561.0, 37743.0, 22305.0, 13381.0, 8274.0, 5036.0, 3073.0, 2077.0, 1254.0, 836.0, 550.0, 354.0, 214.0, 144.0, 95.0, 54.0, 40.0, 20.0, 11.0, 11.0, 5.0, 2.0, 3.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.193359375, -1.1535491943359375, -1.113739013671875, -1.0739288330078125, -1.03411865234375, -0.9943084716796875, -0.954498291015625, -0.9146881103515625, -0.8748779296875, -0.8350677490234375, -0.795257568359375, -0.7554473876953125, -0.71563720703125, -0.6758270263671875, -0.636016845703125, -0.5962066650390625, -0.556396484375, -0.5165863037109375, -0.476776123046875, -0.4369659423828125, -0.39715576171875, -0.3573455810546875, -0.317535400390625, -0.2777252197265625, -0.2379150390625, -0.1981048583984375, -0.158294677734375, -0.1184844970703125, -0.07867431640625, -0.0388641357421875, 0.000946044921875, 0.0407562255859375, 0.08056640625, 0.1203765869140625, 0.160186767578125, 0.1999969482421875, 0.23980712890625, 0.2796173095703125, 0.319427490234375, 0.3592376708984375, 0.3990478515625, 0.4388580322265625, 0.478668212890625, 0.5184783935546875, 0.55828857421875, 0.5980987548828125, 0.637908935546875, 0.6777191162109375, 0.717529296875, 0.7573394775390625, 0.797149658203125, 0.8369598388671875, 0.87677001953125, 0.9165802001953125, 0.956390380859375, 0.9962005615234375, 1.0360107421875, 1.0758209228515625, 1.115631103515625, 1.1554412841796875, 1.19525146484375, 1.2350616455078125, 1.274871826171875, 1.3146820068359375, 1.3544921875]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 3.0, 4.0, 9.0, 5.0, 10.0, 4.0, 8.0, 10.0, 9.0, 14.0, 22.0, 17.0, 24.0, 17.0, 26.0, 32.0, 17.0, 28.0, 32.0, 35.0, 29.0, 45.0, 43.0, 46.0, 1061.0, 32.0, 32.0, 46.0, 36.0, 38.0, 32.0, 23.0, 28.0, 21.0, 36.0, 18.0, 28.0, 19.0, 21.0, 9.0, 8.0, 14.0, 9.0, 6.0, 6.0, 7.0, 3.0, 1.0, 3.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0], "bins": [-14.703125, -14.2491455078125, -13.795166015625, -13.3411865234375, -12.88720703125, -12.4332275390625, -11.979248046875, -11.5252685546875, -11.0712890625, -10.6173095703125, -10.163330078125, -9.7093505859375, -9.25537109375, -8.8013916015625, -8.347412109375, -7.8934326171875, -7.439453125, -6.9854736328125, -6.531494140625, -6.0775146484375, -5.62353515625, -5.1695556640625, -4.715576171875, -4.2615966796875, -3.8076171875, -3.3536376953125, -2.899658203125, -2.4456787109375, -1.99169921875, -1.5377197265625, -1.083740234375, -0.6297607421875, -0.17578125, 0.2781982421875, 0.732177734375, 1.1861572265625, 1.64013671875, 2.0941162109375, 2.548095703125, 3.0020751953125, 3.4560546875, 3.9100341796875, 4.364013671875, 4.8179931640625, 5.27197265625, 5.7259521484375, 6.179931640625, 6.6339111328125, 7.087890625, 7.5418701171875, 7.995849609375, 8.4498291015625, 8.90380859375, 9.3577880859375, 9.811767578125, 10.2657470703125, 10.7197265625, 11.1737060546875, 11.627685546875, 12.0816650390625, 12.53564453125, 12.9896240234375, 13.443603515625, 13.8975830078125, 14.3515625]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 6.0, 8.0, 13.0, 16.0, 24.0, 31.0, 63.0, 70.0, 97.0, 171.0, 246.0, 356.0, 483.0, 682.0, 946.0, 1299.0, 1828.0, 2514.0, 3494.0, 5041.0, 7046.0, 9973.0, 14172.0, 20359.0, 29997.0, 44877.0, 70762.0, 114099.0, 190704.0, 1222728.0, 124388.0, 76529.0, 48474.0, 32183.0, 21633.0, 15171.0, 10684.0, 7411.0, 5305.0, 3838.0, 2675.0, 1962.0, 1345.0, 1066.0, 724.0, 506.0, 333.0, 249.0, 187.0, 125.0, 85.0, 72.0, 38.0, 18.0, 16.0, 11.0, 5.0, 4.0, 3.0, 1.0, 2.0], "bins": [-0.87744140625, -0.85009765625, -0.82275390625, -0.79541015625, -0.76806640625, -0.74072265625, -0.71337890625, -0.68603515625, -0.65869140625, -0.63134765625, -0.60400390625, -0.57666015625, -0.54931640625, -0.52197265625, -0.49462890625, -0.46728515625, -0.43994140625, -0.41259765625, -0.38525390625, -0.35791015625, -0.33056640625, -0.30322265625, -0.27587890625, -0.24853515625, -0.22119140625, -0.19384765625, -0.16650390625, -0.13916015625, -0.11181640625, -0.08447265625, -0.05712890625, -0.02978515625, -0.00244140625, 0.02490234375, 0.05224609375, 0.07958984375, 0.10693359375, 0.13427734375, 0.16162109375, 0.18896484375, 0.21630859375, 0.24365234375, 0.27099609375, 0.29833984375, 0.32568359375, 0.35302734375, 0.38037109375, 0.40771484375, 0.43505859375, 0.46240234375, 0.48974609375, 0.51708984375, 0.54443359375, 0.57177734375, 0.59912109375, 0.62646484375, 0.65380859375, 0.68115234375, 0.70849609375, 0.73583984375, 0.76318359375, 0.79052734375, 0.81787109375, 0.84521484375, 0.87255859375]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 5.0, 8.0, 9.0, 15.0, 14.0, 14.0, 19.0, 22.0, 20.0, 30.0, 34.0, 51.0, 62.0, 59.0, 60.0, 67.0, 61.0, 54.0, 72.0, 44.0, 50.0, 46.0, 33.0, 32.0, 24.0, 19.0, 16.0, 13.0, 11.0, 9.0, 11.0, 8.0, 2.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.006046295166015625, -0.005880534648895264, -0.005714774131774902, -0.005549013614654541, -0.00538325309753418, -0.005217492580413818, -0.005051732063293457, -0.004885971546173096, -0.004720211029052734, -0.004554450511932373, -0.004388689994812012, -0.00422292947769165, -0.004057168960571289, -0.0038914084434509277, -0.0037256479263305664, -0.003559887409210205, -0.0033941268920898438, -0.0032283663749694824, -0.003062605857849121, -0.0028968453407287598, -0.0027310848236083984, -0.002565324306488037, -0.0023995637893676758, -0.0022338032722473145, -0.002068042755126953, -0.0019022822380065918, -0.0017365217208862305, -0.0015707612037658691, -0.0014050006866455078, -0.0012392401695251465, -0.0010734796524047852, -0.0009077191352844238, -0.0007419586181640625, -0.0005761981010437012, -0.00041043758392333984, -0.0002446770668029785, -7.891654968261719e-05, 8.684396743774414e-05, 0.00025260448455810547, 0.0004183650016784668, 0.0005841255187988281, 0.0007498860359191895, 0.0009156465530395508, 0.0010814070701599121, 0.0012471675872802734, 0.0014129281044006348, 0.001578688621520996, 0.0017444491386413574, 0.0019102096557617188, 0.00207597017288208, 0.0022417306900024414, 0.0024074912071228027, 0.002573251724243164, 0.0027390122413635254, 0.0029047727584838867, 0.003070533275604248, 0.0032362937927246094, 0.0034020543098449707, 0.003567814826965332, 0.0037335753440856934, 0.0038993358612060547, 0.004065096378326416, 0.004230856895446777, 0.004396617412567139, 0.0045623779296875]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 6.0, 3.0, 3.0, 3.0, 14.0, 12.0, 19.0, 14.0, 17.0, 34.0, 39.0, 47.0, 60.0, 78.0, 117.0, 198.0, 376.0, 2373.0, 807577.0, 235267.0, 1316.0, 325.0, 184.0, 110.0, 101.0, 59.0, 44.0, 44.0, 32.0, 13.0, 19.0, 10.0, 13.0, 11.0, 9.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09063720703125, -0.08713817596435547, -0.08363914489746094, -0.0801401138305664, -0.07664108276367188, -0.07314205169677734, -0.06964302062988281, -0.06614398956298828, -0.06264495849609375, -0.05914592742919922, -0.05564689636230469, -0.052147865295410156, -0.048648834228515625, -0.045149803161621094, -0.04165077209472656, -0.03815174102783203, -0.0346527099609375, -0.03115367889404297, -0.027654647827148438, -0.024155616760253906, -0.020656585693359375, -0.017157554626464844, -0.013658523559570312, -0.010159492492675781, -0.00666046142578125, -0.0031614303588867188, 0.0003376007080078125, 0.0038366317749023438, 0.007335662841796875, 0.010834693908691406, 0.014333724975585938, 0.01783275604248047, 0.021331787109375, 0.02483081817626953, 0.028329849243164062, 0.031828880310058594, 0.035327911376953125, 0.038826942443847656, 0.04232597351074219, 0.04582500457763672, 0.04932403564453125, 0.05282306671142578, 0.05632209777832031, 0.059821128845214844, 0.06332015991210938, 0.0668191909790039, 0.07031822204589844, 0.07381725311279297, 0.0773162841796875, 0.08081531524658203, 0.08431434631347656, 0.0878133773803711, 0.09131240844726562, 0.09481143951416016, 0.09831047058105469, 0.10180950164794922, 0.10530853271484375, 0.10880756378173828, 0.11230659484863281, 0.11580562591552734, 0.11930465698242188, 0.1228036880493164, 0.12630271911621094, 0.12980175018310547, 0.13330078125]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 32.0, 919.0, 64.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09649784862995148, -0.09479185193777084, -0.09308585524559021, -0.09137985855340958, -0.08967385441064835, -0.08796785771846771, -0.08626186102628708, -0.08455586433410645, -0.08284986764192581, -0.08114387094974518, -0.07943787425756454, -0.07773187756538391, -0.07602587342262268, -0.07431987673044205, -0.07261388003826141, -0.07090788334608078, -0.06920188665390015, -0.06749588996171951, -0.06578989326953888, -0.06408389657735825, -0.062377896159887314, -0.06067189574241638, -0.05896589905023575, -0.057259902358055115, -0.05555390194058418, -0.05384790524840355, -0.05214190483093262, -0.050435908138751984, -0.04872991144657135, -0.04702391475439072, -0.045317914336919785, -0.04361191764473915, -0.04190591722726822, -0.040199920535087585, -0.03849392011761665, -0.03678792342543602, -0.035081926733255386, -0.033375926315784454, -0.03166992962360382, -0.029963932931423187, -0.028257936239242554, -0.02655193768441677, -0.024845940992236137, -0.023139942437410355, -0.02143394574522972, -0.01972794719040394, -0.018021948635578156, -0.016315951943397522, -0.014609955251216888, -0.01290395762771368, -0.011197960004210472, -0.00949196144938469, -0.0077859642915427685, -0.006079966202378273, -0.004373968578875065, -0.0026679709553718567, -0.0009619733318686485, 0.0007440244080498815, 0.0024500221479684114, 0.004156020004302263, 0.005862017627805471, 0.007568015716969967, 0.009274013340473175, 0.010980010963976383, 0.012686008587479591]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 6.0, 12.0, 11.0, 12.0, 19.0, 15.0, 23.0, 23.0, 17.0, 32.0, 31.0, 44.0, 38.0, 45.0, 48.0, 41.0, 33.0, 42.0, 50.0, 45.0, 46.0, 41.0, 37.0, 28.0, 43.0, 28.0, 31.0, 32.0, 19.0, 27.0, 15.0, 12.0, 6.0, 9.0, 11.0, 9.0, 7.0, 5.0, 4.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.003112494945526123, -0.0030047884210944176, -0.002897081896662712, -0.0027893753722310066, -0.002681668847799301, -0.0025739623233675957, -0.00246625579893589, -0.0023585492745041847, -0.0022508427500724792, -0.0021431362256407738, -0.0020354297012090683, -0.0019277231767773628, -0.0018200166523456573, -0.0017123101279139519, -0.0016046036034822464, -0.001496897079050541, -0.0013891905546188354, -0.00128148403018713, -0.0011737775057554245, -0.001066070981323719, -0.0009583644568920135, -0.0008506579324603081, -0.0007429514080286026, -0.0006352448835968971, -0.0005275383591651917, -0.0004198318347334862, -0.0003121253103017807, -0.00020441878587007523, -9.671226143836975e-05, 1.0994262993335724e-05, 0.0001187007874250412, 0.00022640731185674667, 0.00033411383628845215, 0.0004418203607201576, 0.0005495268851518631, 0.0006572334095835686, 0.000764939934015274, 0.0008726464584469795, 0.000980352982878685, 0.0010880595073103905, 0.001195766031742096, 0.0013034725561738014, 0.001411179080605507, 0.0015188856050372124, 0.0016265921294689178, 0.0017342986539006233, 0.0018420051783323288, 0.0019497117027640343, 0.0020574182271957397, 0.0021651247516274452, 0.0022728312760591507, 0.002380537800490856, 0.0024882443249225616, 0.002595950849354267, 0.0027036573737859726, 0.002811363898217678, 0.0029190704226493835, 0.003026776947081089, 0.0031344834715127945, 0.0032421899959445, 0.0033498965203762054, 0.003457603044807911, 0.0035653095692396164, 0.003673016093671322, 0.0037807226181030273]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 6.0, 1.0, 2.0, 8.0, 5.0, 14.0, 7.0, 16.0, 12.0, 12.0, 15.0, 21.0, 17.0, 26.0, 30.0, 37.0, 36.0, 36.0, 27.0, 46.0, 48.0, 35.0, 46.0, 35.0, 58.0, 39.0, 36.0, 38.0, 36.0, 28.0, 34.0, 27.0, 27.0, 28.0, 23.0, 12.0, 20.0, 9.0, 8.0, 11.0, 6.0, 8.0, 5.0, 4.0, 5.0, 0.0, 7.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-25.65625, -24.90234375, -24.1484375, -23.39453125, -22.640625, -21.88671875, -21.1328125, -20.37890625, -19.625, -18.87109375, -18.1171875, -17.36328125, -16.609375, -15.85546875, -15.1015625, -14.34765625, -13.59375, -12.83984375, -12.0859375, -11.33203125, -10.578125, -9.82421875, -9.0703125, -8.31640625, -7.5625, -6.80859375, -6.0546875, -5.30078125, -4.546875, -3.79296875, -3.0390625, -2.28515625, -1.53125, -0.77734375, -0.0234375, 0.73046875, 1.484375, 2.23828125, 2.9921875, 3.74609375, 4.5, 5.25390625, 6.0078125, 6.76171875, 7.515625, 8.26953125, 9.0234375, 9.77734375, 10.53125, 11.28515625, 12.0390625, 12.79296875, 13.546875, 14.30078125, 15.0546875, 15.80859375, 16.5625, 17.31640625, 18.0703125, 18.82421875, 19.578125, 20.33203125, 21.0859375, 21.83984375, 22.59375]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 6.0, 3.0, 3.0, 7.0, 7.0, 16.0, 19.0, 30.0, 30.0, 50.0, 72.0, 132.0, 224.0, 361.0, 613.0, 1054.0, 1918.0, 3361.0, 6187.0, 13114.0, 31033.0, 95137.0, 427449.0, 337354.0, 78735.0, 27169.0, 11600.0, 5654.0, 3082.0, 1641.0, 1010.0, 573.0, 361.0, 218.0, 112.0, 74.0, 50.0, 32.0, 18.0, 10.0, 10.0, 5.0, 6.0, 9.0, 3.0, 2.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-30.296875, -29.40380859375, -28.5107421875, -27.61767578125, -26.724609375, -25.83154296875, -24.9384765625, -24.04541015625, -23.15234375, -22.25927734375, -21.3662109375, -20.47314453125, -19.580078125, -18.68701171875, -17.7939453125, -16.90087890625, -16.0078125, -15.11474609375, -14.2216796875, -13.32861328125, -12.435546875, -11.54248046875, -10.6494140625, -9.75634765625, -8.86328125, -7.97021484375, -7.0771484375, -6.18408203125, -5.291015625, -4.39794921875, -3.5048828125, -2.61181640625, -1.71875, -0.82568359375, 0.0673828125, 0.96044921875, 1.853515625, 2.74658203125, 3.6396484375, 4.53271484375, 5.42578125, 6.31884765625, 7.2119140625, 8.10498046875, 8.998046875, 9.89111328125, 10.7841796875, 11.67724609375, 12.5703125, 13.46337890625, 14.3564453125, 15.24951171875, 16.142578125, 17.03564453125, 17.9287109375, 18.82177734375, 19.71484375, 20.60791015625, 21.5009765625, 22.39404296875, 23.287109375, 24.18017578125, 25.0732421875, 25.96630859375, 26.859375]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 5.0, 8.0, 3.0, 5.0, 10.0, 11.0, 5.0, 11.0, 16.0, 7.0, 35.0, 23.0, 29.0, 25.0, 30.0, 45.0, 29.0, 38.0, 51.0, 72.0, 101.0, 234.0, 1485.0, 235.0, 104.0, 75.0, 59.0, 47.0, 35.0, 35.0, 34.0, 24.0, 21.0, 14.0, 17.0, 18.0, 10.0, 11.0, 5.0, 4.0, 11.0, 4.0, 6.0, 5.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-59.09375, -57.02783203125, -54.9619140625, -52.89599609375, -50.830078125, -48.76416015625, -46.6982421875, -44.63232421875, -42.56640625, -40.50048828125, -38.4345703125, -36.36865234375, -34.302734375, -32.23681640625, -30.1708984375, -28.10498046875, -26.0390625, -23.97314453125, -21.9072265625, -19.84130859375, -17.775390625, -15.70947265625, -13.6435546875, -11.57763671875, -9.51171875, -7.44580078125, -5.3798828125, -3.31396484375, -1.248046875, 0.81787109375, 2.8837890625, 4.94970703125, 7.015625, 9.08154296875, 11.1474609375, 13.21337890625, 15.279296875, 17.34521484375, 19.4111328125, 21.47705078125, 23.54296875, 25.60888671875, 27.6748046875, 29.74072265625, 31.806640625, 33.87255859375, 35.9384765625, 38.00439453125, 40.0703125, 42.13623046875, 44.2021484375, 46.26806640625, 48.333984375, 50.39990234375, 52.4658203125, 54.53173828125, 56.59765625, 58.66357421875, 60.7294921875, 62.79541015625, 64.861328125, 66.92724609375, 68.9931640625, 71.05908203125, 73.125]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 7.0, 6.0, 7.0, 5.0, 11.0, 7.0, 13.0, 30.0, 16.0, 23.0, 39.0, 50.0, 43.0, 76.0, 66.0, 133.0, 181.0, 255.0, 581.0, 1563.0, 13302.0, 1097754.0, 2011575.0, 16500.0, 1764.0, 590.0, 310.0, 170.0, 123.0, 107.0, 84.0, 57.0, 50.0, 52.0, 25.0, 28.0, 14.0, 14.0, 14.0, 10.0, 12.0, 8.0, 12.0, 7.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 3.0], "bins": [-115.8125, -112.5068359375, -109.201171875, -105.8955078125, -102.58984375, -99.2841796875, -95.978515625, -92.6728515625, -89.3671875, -86.0615234375, -82.755859375, -79.4501953125, -76.14453125, -72.8388671875, -69.533203125, -66.2275390625, -62.921875, -59.6162109375, -56.310546875, -53.0048828125, -49.69921875, -46.3935546875, -43.087890625, -39.7822265625, -36.4765625, -33.1708984375, -29.865234375, -26.5595703125, -23.25390625, -19.9482421875, -16.642578125, -13.3369140625, -10.03125, -6.7255859375, -3.419921875, -0.1142578125, 3.19140625, 6.4970703125, 9.802734375, 13.1083984375, 16.4140625, 19.7197265625, 23.025390625, 26.3310546875, 29.63671875, 32.9423828125, 36.248046875, 39.5537109375, 42.859375, 46.1650390625, 49.470703125, 52.7763671875, 56.08203125, 59.3876953125, 62.693359375, 65.9990234375, 69.3046875, 72.6103515625, 75.916015625, 79.2216796875, 82.52734375, 85.8330078125, 89.138671875, 92.4443359375, 95.75]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 38.0, 477.0, 460.0, 39.0, 3.0, 1.0, 0.0, 1.0], "bins": [-943.0515747070312, -926.796142578125, -910.5406494140625, -894.2852172851562, -878.02978515625, -861.7742919921875, -845.5188598632812, -829.263427734375, -813.0079345703125, -796.7525024414062, -780.4970092773438, -764.2415771484375, -747.9861450195312, -731.730712890625, -715.4752197265625, -699.2197875976562, -682.96435546875, -666.7089233398438, -650.4534301757812, -634.197998046875, -617.9425659179688, -601.6871337890625, -585.431640625, -569.1762084960938, -552.9207763671875, -536.6653442382812, -520.4098510742188, -504.1544189453125, -487.89898681640625, -471.6435241699219, -455.3880615234375, -439.13262939453125, -422.8771057128906, -406.62164306640625, -390.3662109375, -374.1107482910156, -357.85528564453125, -341.599853515625, -325.3443908691406, -309.08892822265625, -292.83349609375, -276.5780334472656, -260.3226013183594, -244.067138671875, -227.8116912841797, -211.55624389648438, -195.30078125, -179.0453338623047, -162.78988647460938, -146.53443908691406, -130.27899169921875, -114.02352905273438, -97.76808166503906, -81.51263427734375, -65.2571792602539, -49.00172424316406, -32.74628448486328, -16.490833282470703, -0.235382080078125, 16.020069122314453, 32.27552032470703, 48.530967712402344, 64.78642272949219, 81.04187774658203, 97.29732513427734]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 1.0, 3.0, 4.0, 9.0, 13.0, 13.0, 11.0, 24.0, 15.0, 23.0, 20.0, 31.0, 20.0, 27.0, 40.0, 31.0, 27.0, 50.0, 40.0, 57.0, 40.0, 38.0, 41.0, 34.0, 50.0, 38.0, 41.0, 30.0, 27.0, 20.0, 22.0, 26.0, 27.0, 16.0, 12.0, 14.0, 13.0, 5.0, 9.0, 11.0, 7.0, 8.0, 0.0, 2.0, 3.0, 1.0, 1.0, 5.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 3.0], "bins": [-159.0382080078125, -153.84970092773438, -148.6611785888672, -143.47267150878906, -138.28416442871094, -133.09564208984375, -127.90713500976562, -122.7186279296875, -117.53011322021484, -112.34159851074219, -107.15309143066406, -101.9645767211914, -96.77606201171875, -91.58755493164062, -86.39904022216797, -81.21052551269531, -76.02201843261719, -70.83350372314453, -65.6449966430664, -60.45648193359375, -55.26797103881836, -50.07946014404297, -44.89094543457031, -39.70243453979492, -34.51392364501953, -29.32541275024414, -24.136899948120117, -18.948387145996094, -13.759876251220703, -8.571365356445312, -3.382852554321289, 1.8056602478027344, 6.9941864013671875, 12.182698249816895, 17.3712100982666, 22.559722900390625, 27.748233795166016, 32.936744689941406, 38.12525939941406, 43.31377029418945, 48.502281188964844, 53.690792083740234, 58.879302978515625, 64.06781768798828, 69.25633239746094, 74.44483947753906, 79.63335418701172, 84.82186889648438, 90.0103759765625, 95.19889068603516, 100.38739776611328, 105.57591247558594, 110.76441955566406, 115.95293426513672, 121.14144897460938, 126.3299560546875, 131.51846313476562, 136.70697021484375, 141.89549255371094, 147.08399963378906, 152.2725067138672, 157.46102905273438, 162.6495361328125, 167.83804321289062, 173.0265655517578]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 3.0, 7.0, 8.0, 7.0, 9.0, 11.0, 10.0, 10.0, 23.0, 12.0, 24.0, 25.0, 24.0, 34.0, 27.0, 36.0, 36.0, 41.0, 39.0, 43.0, 40.0, 53.0, 36.0, 43.0, 41.0, 37.0, 28.0, 41.0, 27.0, 32.0, 25.0, 16.0, 23.0, 24.0, 13.0, 20.0, 14.0, 10.0, 4.0, 9.0, 8.0, 5.0, 4.0, 5.0, 7.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-23.96875, -23.233642578125, -22.49853515625, -21.763427734375, -21.0283203125, -20.293212890625, -19.55810546875, -18.822998046875, -18.087890625, -17.352783203125, -16.61767578125, -15.882568359375, -15.1474609375, -14.412353515625, -13.67724609375, -12.942138671875, -12.20703125, -11.471923828125, -10.73681640625, -10.001708984375, -9.2666015625, -8.531494140625, -7.79638671875, -7.061279296875, -6.326171875, -5.591064453125, -4.85595703125, -4.120849609375, -3.3857421875, -2.650634765625, -1.91552734375, -1.180419921875, -0.4453125, 0.289794921875, 1.02490234375, 1.760009765625, 2.4951171875, 3.230224609375, 3.96533203125, 4.700439453125, 5.435546875, 6.170654296875, 6.90576171875, 7.640869140625, 8.3759765625, 9.111083984375, 9.84619140625, 10.581298828125, 11.31640625, 12.051513671875, 12.78662109375, 13.521728515625, 14.2568359375, 14.991943359375, 15.72705078125, 16.462158203125, 17.197265625, 17.932373046875, 18.66748046875, 19.402587890625, 20.1376953125, 20.872802734375, 21.60791015625, 22.343017578125, 23.078125]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 5.0, 2.0, 5.0, 5.0, 8.0, 9.0, 5.0, 11.0, 17.0, 16.0, 15.0, 23.0, 32.0, 49.0, 91.0, 91.0, 197.0, 320.0, 720.0, 1438.0, 3694.0, 13791.0, 429486.0, 3587113.0, 142784.0, 8824.0, 2906.0, 1196.0, 570.0, 305.0, 201.0, 96.0, 61.0, 49.0, 36.0, 16.0, 20.0, 13.0, 13.0, 14.0, 6.0, 8.0, 6.0, 6.0, 5.0, 2.0, 3.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0], "bins": [-82.1875, -79.7958984375, -77.404296875, -75.0126953125, -72.62109375, -70.2294921875, -67.837890625, -65.4462890625, -63.0546875, -60.6630859375, -58.271484375, -55.8798828125, -53.48828125, -51.0966796875, -48.705078125, -46.3134765625, -43.921875, -41.5302734375, -39.138671875, -36.7470703125, -34.35546875, -31.9638671875, -29.572265625, -27.1806640625, -24.7890625, -22.3974609375, -20.005859375, -17.6142578125, -15.22265625, -12.8310546875, -10.439453125, -8.0478515625, -5.65625, -3.2646484375, -0.873046875, 1.5185546875, 3.91015625, 6.3017578125, 8.693359375, 11.0849609375, 13.4765625, 15.8681640625, 18.259765625, 20.6513671875, 23.04296875, 25.4345703125, 27.826171875, 30.2177734375, 32.609375, 35.0009765625, 37.392578125, 39.7841796875, 42.17578125, 44.5673828125, 46.958984375, 49.3505859375, 51.7421875, 54.1337890625, 56.525390625, 58.9169921875, 61.30859375, 63.7001953125, 66.091796875, 68.4833984375, 70.875]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 0.0, 2.0, 4.0, 6.0, 4.0, 11.0, 13.0, 27.0, 36.0, 47.0, 82.0, 137.0, 301.0, 641.0, 1006.0, 856.0, 402.0, 196.0, 137.0, 62.0, 28.0, 23.0, 23.0, 9.0, 6.0, 3.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-62.03125, -60.34423828125, -58.6572265625, -56.97021484375, -55.283203125, -53.59619140625, -51.9091796875, -50.22216796875, -48.53515625, -46.84814453125, -45.1611328125, -43.47412109375, -41.787109375, -40.10009765625, -38.4130859375, -36.72607421875, -35.0390625, -33.35205078125, -31.6650390625, -29.97802734375, -28.291015625, -26.60400390625, -24.9169921875, -23.22998046875, -21.54296875, -19.85595703125, -18.1689453125, -16.48193359375, -14.794921875, -13.10791015625, -11.4208984375, -9.73388671875, -8.046875, -6.35986328125, -4.6728515625, -2.98583984375, -1.298828125, 0.38818359375, 2.0751953125, 3.76220703125, 5.44921875, 7.13623046875, 8.8232421875, 10.51025390625, 12.197265625, 13.88427734375, 15.5712890625, 17.25830078125, 18.9453125, 20.63232421875, 22.3193359375, 24.00634765625, 25.693359375, 27.38037109375, 29.0673828125, 30.75439453125, 32.44140625, 34.12841796875, 35.8154296875, 37.50244140625, 39.189453125, 40.87646484375, 42.5634765625, 44.25048828125, 45.9375]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 0.0, 7.0, 4.0, 8.0, 15.0, 17.0, 24.0, 40.0, 63.0, 116.0, 214.0, 429.0, 1132.0, 5063.0, 90128.0, 4058382.0, 33605.0, 3415.0, 799.0, 336.0, 193.0, 114.0, 65.0, 45.0, 30.0, 10.0, 5.0, 8.0, 3.0, 2.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-156.25, -150.54296875, -144.8359375, -139.12890625, -133.421875, -127.71484375, -122.0078125, -116.30078125, -110.59375, -104.88671875, -99.1796875, -93.47265625, -87.765625, -82.05859375, -76.3515625, -70.64453125, -64.9375, -59.23046875, -53.5234375, -47.81640625, -42.109375, -36.40234375, -30.6953125, -24.98828125, -19.28125, -13.57421875, -7.8671875, -2.16015625, 3.546875, 9.25390625, 14.9609375, 20.66796875, 26.375, 32.08203125, 37.7890625, 43.49609375, 49.203125, 54.91015625, 60.6171875, 66.32421875, 72.03125, 77.73828125, 83.4453125, 89.15234375, 94.859375, 100.56640625, 106.2734375, 111.98046875, 117.6875, 123.39453125, 129.1015625, 134.80859375, 140.515625, 146.22265625, 151.9296875, 157.63671875, 163.34375, 169.05078125, 174.7578125, 180.46484375, 186.171875, 191.87890625, 197.5859375, 203.29296875, 209.0]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 31.0, 231.0, 589.0, 143.0, 15.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1170.8314208984375, -1150.0692138671875, -1129.3070068359375, -1108.5447998046875, -1087.78271484375, -1067.0205078125, -1046.25830078125, -1025.49609375, -1004.73388671875, -983.9716796875, -963.2095336914062, -942.4473266601562, -921.6851196289062, -900.9229125976562, -880.1607666015625, -859.3985595703125, -838.6363525390625, -817.8741455078125, -797.1119995117188, -776.3497924804688, -755.5875854492188, -734.8253784179688, -714.063232421875, -693.301025390625, -672.5388793945312, -651.7766723632812, -631.0145263671875, -610.2523193359375, -589.4901123046875, -568.7279052734375, -547.9657592773438, -527.2035522460938, -506.44134521484375, -485.6791687011719, -464.9169616699219, -444.15478515625, -423.392578125, -402.6304016113281, -381.86822509765625, -361.10601806640625, -340.34381103515625, -319.5816345214844, -298.8194274902344, -278.0572509765625, -257.2950439453125, -236.53286743164062, -215.7706756591797, -195.00848388671875, -174.2462921142578, -153.48410034179688, -132.72190856933594, -111.95972442626953, -91.1975326538086, -70.43534088134766, -49.67315673828125, -28.910964965820312, -8.148773193359375, 12.61341667175293, 33.375606536865234, 54.137794494628906, 74.89998626708984, 95.66217803955078, 116.42436218261719, 137.18655395507812, 157.94874572753906]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 5.0, 2.0, 5.0, 3.0, 5.0, 5.0, 0.0, 9.0, 7.0, 16.0, 11.0, 18.0, 20.0, 24.0, 20.0, 21.0, 27.0, 34.0, 39.0, 42.0, 32.0, 37.0, 53.0, 44.0, 54.0, 45.0, 34.0, 30.0, 37.0, 43.0, 31.0, 30.0, 33.0, 24.0, 18.0, 25.0, 18.0, 20.0, 12.0, 19.0, 13.0, 12.0, 10.0, 6.0, 4.0, 1.0, 4.0, 3.0, 5.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-105.19232177734375, -101.75593566894531, -98.3195571899414, -94.88317108154297, -91.44679260253906, -88.01040649414062, -84.57402038574219, -81.13763427734375, -77.70125579833984, -74.2648696899414, -70.8284912109375, -67.39210510253906, -63.95572280883789, -60.51934051513672, -57.08295440673828, -53.64657211303711, -50.21018981933594, -46.773807525634766, -43.337425231933594, -39.901039123535156, -36.464656829833984, -33.02827453613281, -29.591890335083008, -26.155506134033203, -22.71912384033203, -19.28274154663086, -15.846357345581055, -12.409974098205566, -8.973590850830078, -5.537208557128906, -2.1008243560791016, 1.3355598449707031, 4.771942138671875, 8.208325386047363, 11.644708633422852, 15.08109188079834, 18.517475128173828, 21.953857421875, 25.390241622924805, 28.82662582397461, 32.26300811767578, 35.69939041137695, 39.135772705078125, 42.57215881347656, 46.008541107177734, 49.444923400878906, 52.881309509277344, 56.317691802978516, 59.75407409667969, 63.19045639038086, 66.62683868408203, 70.06322479248047, 73.49960327148438, 76.93598937988281, 80.37237548828125, 83.80876159667969, 87.2451400756836, 90.68152618408203, 94.11790466308594, 97.55429077148438, 100.99067687988281, 104.42705535888672, 107.86344146728516, 111.29981994628906, 114.7362060546875]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 6.0, 11.0, 5.0, 10.0, 8.0, 9.0, 13.0, 18.0, 9.0, 24.0, 15.0, 17.0, 19.0, 21.0, 28.0, 33.0, 46.0, 45.0, 35.0, 45.0, 50.0, 40.0, 33.0, 47.0, 31.0, 41.0, 31.0, 27.0, 30.0, 33.0, 35.0, 25.0, 27.0, 21.0, 18.0, 14.0, 17.0, 8.0, 8.0, 13.0, 7.0, 8.0, 6.0, 3.0, 4.0, 2.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-23.3125, -22.607666015625, -21.90283203125, -21.197998046875, -20.4931640625, -19.788330078125, -19.08349609375, -18.378662109375, -17.673828125, -16.968994140625, -16.26416015625, -15.559326171875, -14.8544921875, -14.149658203125, -13.44482421875, -12.739990234375, -12.03515625, -11.330322265625, -10.62548828125, -9.920654296875, -9.2158203125, -8.510986328125, -7.80615234375, -7.101318359375, -6.396484375, -5.691650390625, -4.98681640625, -4.281982421875, -3.5771484375, -2.872314453125, -2.16748046875, -1.462646484375, -0.7578125, -0.052978515625, 0.65185546875, 1.356689453125, 2.0615234375, 2.766357421875, 3.47119140625, 4.176025390625, 4.880859375, 5.585693359375, 6.29052734375, 6.995361328125, 7.7001953125, 8.405029296875, 9.10986328125, 9.814697265625, 10.51953125, 11.224365234375, 11.92919921875, 12.634033203125, 13.3388671875, 14.043701171875, 14.74853515625, 15.453369140625, 16.158203125, 16.863037109375, 17.56787109375, 18.272705078125, 18.9775390625, 19.682373046875, 20.38720703125, 21.092041015625, 21.796875]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 11.0, 11.0, 17.0, 36.0, 46.0, 65.0, 108.0, 166.0, 211.0, 289.0, 483.0, 714.0, 1033.0, 1544.0, 2293.0, 3423.0, 5269.0, 7680.0, 11893.0, 18525.0, 28584.0, 46149.0, 76505.0, 129545.0, 207676.0, 197067.0, 118798.0, 70087.0, 42973.0, 27053.0, 17089.0, 11176.0, 7349.0, 4860.0, 3210.0, 2162.0, 1448.0, 1013.0, 610.0, 456.0, 320.0, 198.0, 128.0, 93.0, 65.0, 30.0, 26.0, 30.0, 13.0, 10.0, 2.0, 5.0, 4.0, 2.0, 2.0, 3.0], "bins": [-1.1328125, -1.0984039306640625, -1.063995361328125, -1.0295867919921875, -0.99517822265625, -0.9607696533203125, -0.926361083984375, -0.8919525146484375, -0.8575439453125, -0.8231353759765625, -0.788726806640625, -0.7543182373046875, -0.71990966796875, -0.6855010986328125, -0.651092529296875, -0.6166839599609375, -0.582275390625, -0.5478668212890625, -0.513458251953125, -0.4790496826171875, -0.44464111328125, -0.4102325439453125, -0.375823974609375, -0.3414154052734375, -0.3070068359375, -0.2725982666015625, -0.238189697265625, -0.2037811279296875, -0.16937255859375, -0.1349639892578125, -0.100555419921875, -0.0661468505859375, -0.03173828125, 0.0026702880859375, 0.037078857421875, 0.0714874267578125, 0.10589599609375, 0.1403045654296875, 0.174713134765625, 0.2091217041015625, 0.2435302734375, 0.2779388427734375, 0.312347412109375, 0.3467559814453125, 0.38116455078125, 0.4155731201171875, 0.449981689453125, 0.4843902587890625, 0.518798828125, 0.5532073974609375, 0.587615966796875, 0.6220245361328125, 0.65643310546875, 0.6908416748046875, 0.725250244140625, 0.7596588134765625, 0.7940673828125, 0.8284759521484375, 0.862884521484375, 0.8972930908203125, 0.93170166015625, 0.9661102294921875, 1.000518798828125, 1.0349273681640625, 1.0693359375]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 6.0, 9.0, 5.0, 9.0, 4.0, 8.0, 12.0, 10.0, 13.0, 15.0, 16.0, 15.0, 24.0, 23.0, 21.0, 32.0, 38.0, 38.0, 48.0, 33.0, 34.0, 39.0, 39.0, 1071.0, 32.0, 45.0, 48.0, 50.0, 28.0, 29.0, 29.0, 19.0, 25.0, 17.0, 26.0, 17.0, 17.0, 11.0, 8.0, 13.0, 13.0, 6.0, 9.0, 3.0, 5.0, 6.0, 2.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.4453125, -13.998046875, -13.55078125, -13.103515625, -12.65625, -12.208984375, -11.76171875, -11.314453125, -10.8671875, -10.419921875, -9.97265625, -9.525390625, -9.078125, -8.630859375, -8.18359375, -7.736328125, -7.2890625, -6.841796875, -6.39453125, -5.947265625, -5.5, -5.052734375, -4.60546875, -4.158203125, -3.7109375, -3.263671875, -2.81640625, -2.369140625, -1.921875, -1.474609375, -1.02734375, -0.580078125, -0.1328125, 0.314453125, 0.76171875, 1.208984375, 1.65625, 2.103515625, 2.55078125, 2.998046875, 3.4453125, 3.892578125, 4.33984375, 4.787109375, 5.234375, 5.681640625, 6.12890625, 6.576171875, 7.0234375, 7.470703125, 7.91796875, 8.365234375, 8.8125, 9.259765625, 9.70703125, 10.154296875, 10.6015625, 11.048828125, 11.49609375, 11.943359375, 12.390625, 12.837890625, 13.28515625, 13.732421875, 14.1796875]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 5.0, 3.0, 8.0, 8.0, 11.0, 32.0, 52.0, 60.0, 105.0, 135.0, 205.0, 287.0, 385.0, 549.0, 796.0, 1067.0, 1425.0, 1987.0, 2625.0, 3538.0, 4942.0, 6895.0, 9416.0, 13533.0, 19262.0, 28582.0, 43256.0, 67772.0, 108420.0, 165769.0, 1232967.0, 133878.0, 83466.0, 52885.0, 34360.0, 22976.0, 15645.0, 10919.0, 7823.0, 5733.0, 4194.0, 2963.0, 2265.0, 1606.0, 1241.0, 892.0, 658.0, 469.0, 331.0, 217.0, 181.0, 112.0, 79.0, 51.0, 38.0, 20.0, 21.0, 11.0, 5.0, 5.0, 2.0, 3.0, 2.0], "bins": [-0.81201171875, -0.7860031127929688, -0.7599945068359375, -0.7339859008789062, -0.707977294921875, -0.6819686889648438, -0.6559600830078125, -0.6299514770507812, -0.60394287109375, -0.5779342651367188, -0.5519256591796875, -0.5259170532226562, -0.499908447265625, -0.47389984130859375, -0.4478912353515625, -0.42188262939453125, -0.3958740234375, -0.36986541748046875, -0.3438568115234375, -0.31784820556640625, -0.291839599609375, -0.26583099365234375, -0.2398223876953125, -0.21381378173828125, -0.18780517578125, -0.16179656982421875, -0.1357879638671875, -0.10977935791015625, -0.083770751953125, -0.05776214599609375, -0.0317535400390625, -0.00574493408203125, 0.020263671875, 0.04627227783203125, 0.0722808837890625, 0.09828948974609375, 0.124298095703125, 0.15030670166015625, 0.1763153076171875, 0.20232391357421875, 0.22833251953125, 0.25434112548828125, 0.2803497314453125, 0.30635833740234375, 0.332366943359375, 0.35837554931640625, 0.3843841552734375, 0.41039276123046875, 0.4364013671875, 0.46240997314453125, 0.4884185791015625, 0.5144271850585938, 0.540435791015625, 0.5664443969726562, 0.5924530029296875, 0.6184616088867188, 0.64447021484375, 0.6704788208007812, 0.6964874267578125, 0.7224960327148438, 0.748504638671875, 0.7745132446289062, 0.8005218505859375, 0.8265304565429688, 0.8525390625]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 2.0, 4.0, 4.0, 12.0, 9.0, 10.0, 22.0, 19.0, 20.0, 33.0, 37.0, 48.0, 56.0, 59.0, 53.0, 52.0, 63.0, 64.0, 51.0, 50.0, 51.0, 46.0, 37.0, 29.0, 33.0, 22.0, 30.0, 15.0, 18.0, 12.0, 8.0, 11.0, 3.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.004974365234375, -0.004823505878448486, -0.004672646522521973, -0.004521787166595459, -0.004370927810668945, -0.004220068454742432, -0.004069209098815918, -0.003918349742889404, -0.0037674903869628906, -0.003616631031036377, -0.0034657716751098633, -0.0033149123191833496, -0.003164052963256836, -0.0030131936073303223, -0.0028623342514038086, -0.002711474895477295, -0.0025606155395507812, -0.0024097561836242676, -0.002258896827697754, -0.0021080374717712402, -0.0019571781158447266, -0.0018063187599182129, -0.0016554594039916992, -0.0015046000480651855, -0.0013537406921386719, -0.0012028813362121582, -0.0010520219802856445, -0.0009011626243591309, -0.0007503032684326172, -0.0005994439125061035, -0.00044858455657958984, -0.00029772520065307617, -0.0001468658447265625, 3.993511199951172e-06, 0.00015485286712646484, 0.0003057122230529785, 0.0004565715789794922, 0.0006074309349060059, 0.0007582902908325195, 0.0009091496467590332, 0.0010600090026855469, 0.0012108683586120605, 0.0013617277145385742, 0.0015125870704650879, 0.0016634464263916016, 0.0018143057823181152, 0.001965165138244629, 0.0021160244941711426, 0.0022668838500976562, 0.00241774320602417, 0.0025686025619506836, 0.0027194619178771973, 0.002870321273803711, 0.0030211806297302246, 0.0031720399856567383, 0.003322899341583252, 0.0034737586975097656, 0.0036246180534362793, 0.003775477409362793, 0.003926336765289307, 0.00407719612121582, 0.004228055477142334, 0.004378914833068848, 0.004529774188995361, 0.004680633544921875]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 1.0, 8.0, 8.0, 10.0, 8.0, 14.0, 25.0, 27.0, 34.0, 51.0, 57.0, 67.0, 90.0, 131.0, 227.0, 465.0, 2905.0, 938114.0, 104304.0, 1013.0, 322.0, 184.0, 123.0, 102.0, 78.0, 35.0, 28.0, 30.0, 28.0, 16.0, 13.0, 7.0, 7.0, 5.0, 3.0, 4.0, 3.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10040283203125, -0.09714317321777344, -0.09388351440429688, -0.09062385559082031, -0.08736419677734375, -0.08410453796386719, -0.08084487915039062, -0.07758522033691406, -0.0743255615234375, -0.07106590270996094, -0.06780624389648438, -0.06454658508300781, -0.06128692626953125, -0.05802726745605469, -0.054767608642578125, -0.05150794982910156, -0.048248291015625, -0.04498863220214844, -0.041728973388671875, -0.03846931457519531, -0.03520965576171875, -0.03194999694824219, -0.028690338134765625, -0.025430679321289062, -0.0221710205078125, -0.018911361694335938, -0.015651702880859375, -0.012392044067382812, -0.00913238525390625, -0.0058727264404296875, -0.002613067626953125, 0.0006465911865234375, 0.00390625, 0.0071659088134765625, 0.010425567626953125, 0.013685226440429688, 0.01694488525390625, 0.020204544067382812, 0.023464202880859375, 0.026723861694335938, 0.0299835205078125, 0.03324317932128906, 0.036502838134765625, 0.03976249694824219, 0.04302215576171875, 0.04628181457519531, 0.049541473388671875, 0.05280113220214844, 0.056060791015625, 0.05932044982910156, 0.06258010864257812, 0.06583976745605469, 0.06909942626953125, 0.07235908508300781, 0.07561874389648438, 0.07887840270996094, 0.0821380615234375, 0.08539772033691406, 0.08865737915039062, 0.09191703796386719, 0.09517669677734375, 0.09843635559082031, 0.10169601440429688, 0.10495567321777344, 0.10821533203125]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 177.0, 806.0, 29.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0139493802562356, -0.012712707743048668, -0.011476034298539162, -0.01023936178535223, -0.009002689272165298, -0.007766015827655792, -0.006529343314468861, -0.005292669869959354, -0.004055997356772423, -0.002819324377924204, -0.0015826516319066286, -0.00034597888588905334, 0.0008906940929591656, 0.0021273670718073845, 0.003364039584994316, 0.004600713029503822, 0.005837385542690754, 0.007074058521538973, 0.008310731500387192, 0.009547404013574123, 0.010784076526761055, 0.012020749971270561, 0.013257422484457493, 0.014494095928966999, 0.01573076844215393, 0.016967441886663437, 0.018204113468527794, 0.0194407869130373, 0.020677460357546806, 0.021914131939411163, 0.02315080538392067, 0.024387478828430176, 0.025624152272939682, 0.026860825717449188, 0.028097497299313545, 0.02933417074382305, 0.030570844188332558, 0.031807515770196915, 0.03304418921470642, 0.03428086265921593, 0.03551753610372543, 0.03675420954823494, 0.037990882992744446, 0.039227552711963654, 0.04046422615647316, 0.041700899600982666, 0.04293757304549217, 0.04417424649000168, 0.045410916209220886, 0.04664758965373039, 0.0478842630982399, 0.049120932817459106, 0.05035760626196861, 0.05159427970647812, 0.052830953150987625, 0.05406762659549713, 0.05530430004000664, 0.056540973484516144, 0.05777764692902565, 0.059014320373535156, 0.060250990092754364, 0.06148766353726387, 0.06272433698177338, 0.06396101415157318, 0.06519768387079239]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 6.0, 8.0, 9.0, 9.0, 9.0, 16.0, 17.0, 30.0, 29.0, 34.0, 37.0, 40.0, 41.0, 38.0, 53.0, 45.0, 44.0, 51.0, 56.0, 59.0, 55.0, 39.0, 42.0, 34.0, 32.0, 37.0, 23.0, 21.0, 10.0, 20.0, 11.0, 10.0, 12.0, 7.0, 5.0, 3.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0036129355430603027, -0.0035112472251057625, -0.0034095589071512222, -0.003307870589196682, -0.0032061822712421417, -0.0031044939532876015, -0.0030028056353330612, -0.002901117317378521, -0.0027994289994239807, -0.0026977406814694405, -0.0025960523635149, -0.00249436404556036, -0.0023926757276058197, -0.0022909874096512794, -0.002189299091696739, -0.002087610773742199, -0.0019859224557876587, -0.0018842341378331184, -0.0017825458198785782, -0.001680857501924038, -0.0015791691839694977, -0.0014774808660149574, -0.0013757925480604172, -0.001274104230105877, -0.0011724159121513367, -0.0010707275941967964, -0.0009690392762422562, -0.0008673509582877159, -0.0007656626403331757, -0.0006639743223786354, -0.0005622860044240952, -0.0004605976864695549, -0.00035890936851501465, -0.0002572210505604744, -0.00015553273260593414, -5.384441465139389e-05, 4.784390330314636e-05, 0.00014953222125768661, 0.00025122053921222687, 0.0003529088571667671, 0.0004545971751213074, 0.0005562854930758476, 0.0006579738110303879, 0.0007596621289849281, 0.0008613504469394684, 0.0009630387648940086, 0.0010647270828485489, 0.0011664154008030891, 0.0012681037187576294, 0.0013697920367121696, 0.00147148035466671, 0.0015731686726212502, 0.0016748569905757904, 0.0017765453085303307, 0.001878233626484871, 0.001979921944439411, 0.0020816102623939514, 0.0021832985803484917, 0.002284986898303032, 0.002386675216257572, 0.0024883635342121124, 0.0025900518521666527, 0.002691740170121193, 0.002793428488075733, 0.0028951168060302734]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 6.0, 11.0, 5.0, 10.0, 8.0, 9.0, 13.0, 18.0, 9.0, 24.0, 15.0, 17.0, 19.0, 21.0, 28.0, 33.0, 46.0, 45.0, 35.0, 45.0, 50.0, 40.0, 33.0, 47.0, 31.0, 41.0, 31.0, 27.0, 30.0, 33.0, 35.0, 25.0, 27.0, 21.0, 18.0, 14.0, 17.0, 8.0, 8.0, 13.0, 7.0, 8.0, 6.0, 3.0, 4.0, 2.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-23.3125, -22.607666015625, -21.90283203125, -21.197998046875, -20.4931640625, -19.788330078125, -19.08349609375, -18.378662109375, -17.673828125, -16.968994140625, -16.26416015625, -15.559326171875, -14.8544921875, -14.149658203125, -13.44482421875, -12.739990234375, -12.03515625, -11.330322265625, -10.62548828125, -9.920654296875, -9.2158203125, -8.510986328125, -7.80615234375, -7.101318359375, -6.396484375, -5.691650390625, -4.98681640625, -4.281982421875, -3.5771484375, -2.872314453125, -2.16748046875, -1.462646484375, -0.7578125, -0.052978515625, 0.65185546875, 1.356689453125, 2.0615234375, 2.766357421875, 3.47119140625, 4.176025390625, 4.880859375, 5.585693359375, 6.29052734375, 6.995361328125, 7.7001953125, 8.405029296875, 9.10986328125, 9.814697265625, 10.51953125, 11.224365234375, 11.92919921875, 12.634033203125, 13.3388671875, 14.043701171875, 14.74853515625, 15.453369140625, 16.158203125, 16.863037109375, 17.56787109375, 18.272705078125, 18.9775390625, 19.682373046875, 20.38720703125, 21.092041015625, 21.796875]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 6.0, 12.0, 6.0, 14.0, 8.0, 16.0, 19.0, 32.0, 30.0, 51.0, 51.0, 89.0, 148.0, 219.0, 327.0, 575.0, 954.0, 1692.0, 3396.0, 8121.0, 29487.0, 274898.0, 660760.0, 47407.0, 11071.0, 4142.0, 2105.0, 1098.0, 612.0, 374.0, 292.0, 148.0, 118.0, 63.0, 57.0, 31.0, 35.0, 17.0, 13.0, 17.0, 7.0, 10.0, 9.0, 5.0, 4.0, 2.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-46.3125, -44.9150390625, -43.517578125, -42.1201171875, -40.72265625, -39.3251953125, -37.927734375, -36.5302734375, -35.1328125, -33.7353515625, -32.337890625, -30.9404296875, -29.54296875, -28.1455078125, -26.748046875, -25.3505859375, -23.953125, -22.5556640625, -21.158203125, -19.7607421875, -18.36328125, -16.9658203125, -15.568359375, -14.1708984375, -12.7734375, -11.3759765625, -9.978515625, -8.5810546875, -7.18359375, -5.7861328125, -4.388671875, -2.9912109375, -1.59375, -0.1962890625, 1.201171875, 2.5986328125, 3.99609375, 5.3935546875, 6.791015625, 8.1884765625, 9.5859375, 10.9833984375, 12.380859375, 13.7783203125, 15.17578125, 16.5732421875, 17.970703125, 19.3681640625, 20.765625, 22.1630859375, 23.560546875, 24.9580078125, 26.35546875, 27.7529296875, 29.150390625, 30.5478515625, 31.9453125, 33.3427734375, 34.740234375, 36.1376953125, 37.53515625, 38.9326171875, 40.330078125, 41.7275390625, 43.125]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 1.0, 2.0, 5.0, 5.0, 4.0, 6.0, 6.0, 6.0, 14.0, 13.0, 15.0, 20.0, 13.0, 23.0, 29.0, 49.0, 37.0, 36.0, 40.0, 51.0, 62.0, 79.0, 188.0, 1693.0, 192.0, 76.0, 53.0, 34.0, 29.0, 34.0, 28.0, 34.0, 32.0, 27.0, 18.0, 14.0, 16.0, 10.0, 12.0, 15.0, 7.0, 3.0, 5.0, 6.0, 4.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-67.4375, -65.48291015625, -63.5283203125, -61.57373046875, -59.619140625, -57.66455078125, -55.7099609375, -53.75537109375, -51.80078125, -49.84619140625, -47.8916015625, -45.93701171875, -43.982421875, -42.02783203125, -40.0732421875, -38.11865234375, -36.1640625, -34.20947265625, -32.2548828125, -30.30029296875, -28.345703125, -26.39111328125, -24.4365234375, -22.48193359375, -20.52734375, -18.57275390625, -16.6181640625, -14.66357421875, -12.708984375, -10.75439453125, -8.7998046875, -6.84521484375, -4.890625, -2.93603515625, -0.9814453125, 0.97314453125, 2.927734375, 4.88232421875, 6.8369140625, 8.79150390625, 10.74609375, 12.70068359375, 14.6552734375, 16.60986328125, 18.564453125, 20.51904296875, 22.4736328125, 24.42822265625, 26.3828125, 28.33740234375, 30.2919921875, 32.24658203125, 34.201171875, 36.15576171875, 38.1103515625, 40.06494140625, 42.01953125, 43.97412109375, 45.9287109375, 47.88330078125, 49.837890625, 51.79248046875, 53.7470703125, 55.70166015625, 57.65625]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 6.0, 7.0, 5.0, 3.0, 12.0, 13.0, 13.0, 24.0, 21.0, 21.0, 32.0, 33.0, 56.0, 56.0, 60.0, 110.0, 164.0, 351.0, 1280.0, 13807.0, 3022527.0, 102120.0, 3541.0, 596.0, 238.0, 145.0, 100.0, 81.0, 52.0, 45.0, 33.0, 28.0, 30.0, 15.0, 14.0, 15.0, 8.0, 9.0, 5.0, 7.0, 7.0, 5.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-131.0, -126.595703125, -122.19140625, -117.787109375, -113.3828125, -108.978515625, -104.57421875, -100.169921875, -95.765625, -91.361328125, -86.95703125, -82.552734375, -78.1484375, -73.744140625, -69.33984375, -64.935546875, -60.53125, -56.126953125, -51.72265625, -47.318359375, -42.9140625, -38.509765625, -34.10546875, -29.701171875, -25.296875, -20.892578125, -16.48828125, -12.083984375, -7.6796875, -3.275390625, 1.12890625, 5.533203125, 9.9375, 14.341796875, 18.74609375, 23.150390625, 27.5546875, 31.958984375, 36.36328125, 40.767578125, 45.171875, 49.576171875, 53.98046875, 58.384765625, 62.7890625, 67.193359375, 71.59765625, 76.001953125, 80.40625, 84.810546875, 89.21484375, 93.619140625, 98.0234375, 102.427734375, 106.83203125, 111.236328125, 115.640625, 120.044921875, 124.44921875, 128.853515625, 133.2578125, 137.662109375, 142.06640625, 146.470703125, 150.875]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 123.0, 698.0, 176.0, 17.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-129.29273986816406, -118.11075592041016, -106.92877197265625, -95.74678039550781, -84.56480407714844, -73.3828125, -62.200828552246094, -51.01884460449219, -39.83686065673828, -28.654876708984375, -17.472890853881836, -6.290904998779297, 4.891078948974609, 16.073062896728516, 27.255050659179688, 38.437034606933594, 49.6190185546875, 60.801002502441406, 71.98298645019531, 83.16497802734375, 94.34695434570312, 105.52894592285156, 116.71092987060547, 127.89291381835938, 139.07489013671875, 150.2568817138672, 161.43885803222656, 172.620849609375, 183.80282592773438, 194.9848175048828, 206.16680908203125, 217.34878540039062, 228.53079223632812, 239.71278381347656, 250.89476013183594, 262.0767517089844, 273.25872802734375, 284.4407043457031, 295.6227111816406, 306.8046875, 317.9866638183594, 329.16864013671875, 340.35064697265625, 351.5326232910156, 362.714599609375, 373.8965759277344, 385.0785827636719, 396.26055908203125, 407.44256591796875, 418.6245422363281, 429.8065490722656, 440.988525390625, 452.1705017089844, 463.35247802734375, 474.53448486328125, 485.7164611816406, 496.8984375, 508.0804138183594, 519.2623901367188, 530.4443969726562, 541.6264038085938, 552.808349609375, 563.9903564453125, 575.17236328125, 586.3543090820312]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 7.0, 5.0, 7.0, 2.0, 2.0, 9.0, 4.0, 16.0, 14.0, 22.0, 11.0, 16.0, 10.0, 18.0, 20.0, 20.0, 25.0, 30.0, 32.0, 30.0, 34.0, 30.0, 37.0, 42.0, 37.0, 43.0, 39.0, 37.0, 37.0, 26.0, 31.0, 32.0, 51.0, 23.0, 23.0, 28.0, 22.0, 18.0, 19.0, 16.0, 16.0, 7.0, 7.0, 10.0, 7.0, 9.0, 4.0, 8.0, 3.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 4.0], "bins": [-142.92208862304688, -138.67311096191406, -134.42413330078125, -130.17515563964844, -125.9261703491211, -121.67719268798828, -117.42821502685547, -113.17923736572266, -108.93025207519531, -104.6812744140625, -100.43229675292969, -96.18331909179688, -91.93433380126953, -87.68535614013672, -83.4363784790039, -79.1874008178711, -74.93842315673828, -70.68944549560547, -66.44046783447266, -62.19148635864258, -57.9425048828125, -53.69352722167969, -49.444549560546875, -45.19557189941406, -40.946590423583984, -36.69761276245117, -32.448631286621094, -28.19965362548828, -23.950674057006836, -19.70169448852539, -15.452716827392578, -11.203737258911133, -6.9547576904296875, -2.7057785987854004, 1.5432004928588867, 5.792179107666016, 10.041158676147461, 14.290138244628906, 18.53911590576172, 22.788095474243164, 27.03707504272461, 31.286054611206055, 35.5350341796875, 39.78401184082031, 44.032989501953125, 48.2819709777832, 52.530948638916016, 56.779930114746094, 61.028907775878906, 65.27788543701172, 69.52686309814453, 73.77584838867188, 78.02482604980469, 82.2738037109375, 86.52278137207031, 90.77175903320312, 95.02073669433594, 99.26971435546875, 103.51869201660156, 107.76766967773438, 112.01665496826172, 116.26563262939453, 120.51461029052734, 124.76358795166016, 129.0125732421875]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 6.0, 6.0, 7.0, 5.0, 11.0, 7.0, 13.0, 13.0, 12.0, 13.0, 23.0, 19.0, 18.0, 16.0, 27.0, 29.0, 28.0, 30.0, 36.0, 43.0, 45.0, 58.0, 40.0, 39.0, 38.0, 40.0, 35.0, 22.0, 30.0, 28.0, 32.0, 33.0, 28.0, 24.0, 25.0, 19.0, 22.0, 13.0, 12.0, 5.0, 15.0, 7.0, 11.0, 8.0, 3.0, 3.0, 2.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-23.5625, -22.853759765625, -22.14501953125, -21.436279296875, -20.7275390625, -20.018798828125, -19.31005859375, -18.601318359375, -17.892578125, -17.183837890625, -16.47509765625, -15.766357421875, -15.0576171875, -14.348876953125, -13.64013671875, -12.931396484375, -12.22265625, -11.513916015625, -10.80517578125, -10.096435546875, -9.3876953125, -8.678955078125, -7.97021484375, -7.261474609375, -6.552734375, -5.843994140625, -5.13525390625, -4.426513671875, -3.7177734375, -3.009033203125, -2.30029296875, -1.591552734375, -0.8828125, -0.174072265625, 0.53466796875, 1.243408203125, 1.9521484375, 2.660888671875, 3.36962890625, 4.078369140625, 4.787109375, 5.495849609375, 6.20458984375, 6.913330078125, 7.6220703125, 8.330810546875, 9.03955078125, 9.748291015625, 10.45703125, 11.165771484375, 11.87451171875, 12.583251953125, 13.2919921875, 14.000732421875, 14.70947265625, 15.418212890625, 16.126953125, 16.835693359375, 17.54443359375, 18.253173828125, 18.9619140625, 19.670654296875, 20.37939453125, 21.088134765625, 21.796875]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 5.0, 14.0, 12.0, 13.0, 24.0, 11.0, 27.0, 28.0, 35.0, 51.0, 57.0, 78.0, 103.0, 150.0, 203.0, 309.0, 544.0, 904.0, 1802.0, 4432.0, 15817.0, 323350.0, 3450076.0, 369560.0, 17386.0, 4644.0, 1959.0, 946.0, 548.0, 319.0, 211.0, 170.0, 118.0, 86.0, 69.0, 41.0, 32.0, 30.0, 25.0, 17.0, 16.0, 12.0, 11.0, 15.0, 4.0, 6.0, 8.0, 0.0, 3.0, 2.0, 2.0, 2.0], "bins": [-71.9375, -69.853515625, -67.76953125, -65.685546875, -63.6015625, -61.517578125, -59.43359375, -57.349609375, -55.265625, -53.181640625, -51.09765625, -49.013671875, -46.9296875, -44.845703125, -42.76171875, -40.677734375, -38.59375, -36.509765625, -34.42578125, -32.341796875, -30.2578125, -28.173828125, -26.08984375, -24.005859375, -21.921875, -19.837890625, -17.75390625, -15.669921875, -13.5859375, -11.501953125, -9.41796875, -7.333984375, -5.25, -3.166015625, -1.08203125, 1.001953125, 3.0859375, 5.169921875, 7.25390625, 9.337890625, 11.421875, 13.505859375, 15.58984375, 17.673828125, 19.7578125, 21.841796875, 23.92578125, 26.009765625, 28.09375, 30.177734375, 32.26171875, 34.345703125, 36.4296875, 38.513671875, 40.59765625, 42.681640625, 44.765625, 46.849609375, 48.93359375, 51.017578125, 53.1015625, 55.185546875, 57.26953125, 59.353515625, 61.4375]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 6.0, 5.0, 11.0, 16.0, 13.0, 25.0, 50.0, 68.0, 92.0, 160.0, 251.0, 474.0, 754.0, 795.0, 568.0, 316.0, 169.0, 97.0, 64.0, 33.0, 28.0, 18.0, 18.0, 7.0, 7.0, 4.0, 5.0, 3.0, 6.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-45.78125, -44.439453125, -43.09765625, -41.755859375, -40.4140625, -39.072265625, -37.73046875, -36.388671875, -35.046875, -33.705078125, -32.36328125, -31.021484375, -29.6796875, -28.337890625, -26.99609375, -25.654296875, -24.3125, -22.970703125, -21.62890625, -20.287109375, -18.9453125, -17.603515625, -16.26171875, -14.919921875, -13.578125, -12.236328125, -10.89453125, -9.552734375, -8.2109375, -6.869140625, -5.52734375, -4.185546875, -2.84375, -1.501953125, -0.16015625, 1.181640625, 2.5234375, 3.865234375, 5.20703125, 6.548828125, 7.890625, 9.232421875, 10.57421875, 11.916015625, 13.2578125, 14.599609375, 15.94140625, 17.283203125, 18.625, 19.966796875, 21.30859375, 22.650390625, 23.9921875, 25.333984375, 26.67578125, 28.017578125, 29.359375, 30.701171875, 32.04296875, 33.384765625, 34.7265625, 36.068359375, 37.41015625, 38.751953125, 40.09375]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 4.0, 2.0, 4.0, 2.0, 6.0, 14.0, 20.0, 16.0, 26.0, 33.0, 56.0, 84.0, 125.0, 197.0, 331.0, 714.0, 1758.0, 5768.0, 30527.0, 1554792.0, 2553722.0, 36059.0, 6359.0, 1845.0, 791.0, 405.0, 220.0, 140.0, 77.0, 71.0, 31.0, 36.0, 15.0, 16.0, 13.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-99.5, -96.1875, -92.875, -89.5625, -86.25, -82.9375, -79.625, -76.3125, -73.0, -69.6875, -66.375, -63.0625, -59.75, -56.4375, -53.125, -49.8125, -46.5, -43.1875, -39.875, -36.5625, -33.25, -29.9375, -26.625, -23.3125, -20.0, -16.6875, -13.375, -10.0625, -6.75, -3.4375, -0.125, 3.1875, 6.5, 9.8125, 13.125, 16.4375, 19.75, 23.0625, 26.375, 29.6875, 33.0, 36.3125, 39.625, 42.9375, 46.25, 49.5625, 52.875, 56.1875, 59.5, 62.8125, 66.125, 69.4375, 72.75, 76.0625, 79.375, 82.6875, 86.0, 89.3125, 92.625, 95.9375, 99.25, 102.5625, 105.875, 109.1875, 112.5]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 5.0, 11.0, 34.0, 53.0, 87.0, 214.0, 259.0, 165.0, 97.0, 46.0, 25.0, 5.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-229.7823028564453, -223.08108520507812, -216.37986755371094, -209.67864990234375, -202.97743225097656, -196.27621459960938, -189.57498168945312, -182.87376403808594, -176.17254638671875, -169.47132873535156, -162.77011108398438, -156.0688934326172, -149.36767578125, -142.66644287109375, -135.96524047851562, -129.26400756835938, -122.56279754638672, -115.86157989501953, -109.16036224365234, -102.45913696289062, -95.75791931152344, -89.05670166015625, -82.35548400878906, -75.65426635742188, -68.95304870605469, -62.2518310546875, -55.55060958862305, -48.84939193725586, -42.148170471191406, -35.44695281982422, -28.74573516845703, -22.044513702392578, -15.343292236328125, -8.642072677612305, -1.9408540725708008, 4.760364532470703, 11.461584091186523, 18.162803649902344, 24.86402130126953, 31.565242767333984, 38.26646041870117, 44.96767807006836, 51.66889953613281, 58.3701171875, 65.07133483886719, 71.77255249023438, 78.47377014160156, 85.17499542236328, 91.87621307373047, 98.57743072509766, 105.27864837646484, 111.97987365722656, 118.68109130859375, 125.38230895996094, 132.08352661132812, 138.7847442626953, 145.4859619140625, 152.1871795654297, 158.88839721679688, 165.58961486816406, 172.29083251953125, 178.9920654296875, 185.69326782226562, 192.39450073242188, 199.09571838378906]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 5.0, 1.0, 4.0, 7.0, 4.0, 9.0, 5.0, 7.0, 8.0, 17.0, 10.0, 14.0, 23.0, 22.0, 18.0, 22.0, 34.0, 28.0, 35.0, 38.0, 33.0, 31.0, 40.0, 41.0, 49.0, 37.0, 35.0, 44.0, 54.0, 39.0, 34.0, 32.0, 32.0, 25.0, 30.0, 22.0, 18.0, 17.0, 16.0, 14.0, 10.0, 10.0, 5.0, 9.0, 7.0, 3.0, 6.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.41238403320312, -84.44105529785156, -81.46971893310547, -78.4983901977539, -75.52705383300781, -72.55572509765625, -69.58439636230469, -66.6130599975586, -63.64173126220703, -60.6703987121582, -57.699066162109375, -54.72773742675781, -51.756404876708984, -48.785072326660156, -45.81373977661133, -42.8424072265625, -39.87107467651367, -36.899742126464844, -33.928409576416016, -30.95707893371582, -27.985748291015625, -25.014415740966797, -22.04308319091797, -19.071752548217773, -16.100419998168945, -13.129088401794434, -10.157756805419922, -7.186424255371094, -4.215092658996582, -1.2437610626220703, 1.7275714874267578, 4.698902130126953, 7.670234680175781, 10.641566276550293, 13.612897872924805, 16.584230422973633, 19.555561065673828, 22.526893615722656, 25.498226165771484, 28.46955680847168, 31.440889358520508, 34.4122200012207, 37.38355255126953, 40.35488510131836, 43.32621765136719, 46.29754638671875, 49.268882751464844, 52.240211486816406, 55.211544036865234, 58.18287658691406, 61.15420913696289, 64.12554168701172, 67.09687042236328, 70.06820678710938, 73.03953552246094, 76.0108642578125, 78.9822006225586, 81.95352935791016, 84.92486572265625, 87.89619445800781, 90.8675308227539, 93.83885955810547, 96.81019592285156, 99.78152465820312, 102.75285339355469]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 7.0, 4.0, 4.0, 6.0, 10.0, 13.0, 8.0, 4.0, 14.0, 17.0, 14.0, 14.0, 28.0, 29.0, 22.0, 32.0, 25.0, 41.0, 33.0, 44.0, 53.0, 47.0, 52.0, 47.0, 32.0, 45.0, 42.0, 40.0, 41.0, 28.0, 29.0, 23.0, 20.0, 21.0, 18.0, 21.0, 14.0, 13.0, 14.0, 11.0, 9.0, 2.0, 5.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-26.40625, -25.624755859375, -24.84326171875, -24.061767578125, -23.2802734375, -22.498779296875, -21.71728515625, -20.935791015625, -20.154296875, -19.372802734375, -18.59130859375, -17.809814453125, -17.0283203125, -16.246826171875, -15.46533203125, -14.683837890625, -13.90234375, -13.120849609375, -12.33935546875, -11.557861328125, -10.7763671875, -9.994873046875, -9.21337890625, -8.431884765625, -7.650390625, -6.868896484375, -6.08740234375, -5.305908203125, -4.5244140625, -3.742919921875, -2.96142578125, -2.179931640625, -1.3984375, -0.616943359375, 0.16455078125, 0.946044921875, 1.7275390625, 2.509033203125, 3.29052734375, 4.072021484375, 4.853515625, 5.635009765625, 6.41650390625, 7.197998046875, 7.9794921875, 8.760986328125, 9.54248046875, 10.323974609375, 11.10546875, 11.886962890625, 12.66845703125, 13.449951171875, 14.2314453125, 15.012939453125, 15.79443359375, 16.575927734375, 17.357421875, 18.138916015625, 18.92041015625, 19.701904296875, 20.4833984375, 21.264892578125, 22.04638671875, 22.827880859375, 23.609375]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 2.0, 14.0, 16.0, 8.0, 20.0, 24.0, 48.0, 63.0, 79.0, 130.0, 196.0, 271.0, 373.0, 560.0, 869.0, 1244.0, 1898.0, 2803.0, 4457.0, 6804.0, 10575.0, 16710.0, 26885.0, 44932.0, 76935.0, 138036.0, 236145.0, 202655.0, 111899.0, 63115.0, 37284.0, 23032.0, 14124.0, 9105.0, 5965.0, 3788.0, 2441.0, 1667.0, 1072.0, 736.0, 458.0, 361.0, 227.0, 170.0, 120.0, 71.0, 52.0, 40.0, 27.0, 25.0, 6.0, 8.0, 2.0, 5.0, 3.0, 7.0, 1.0, 1.0], "bins": [-1.26171875, -1.2232818603515625, -1.184844970703125, -1.1464080810546875, -1.10797119140625, -1.0695343017578125, -1.031097412109375, -0.9926605224609375, -0.9542236328125, -0.9157867431640625, -0.877349853515625, -0.8389129638671875, -0.80047607421875, -0.7620391845703125, -0.723602294921875, -0.6851654052734375, -0.646728515625, -0.6082916259765625, -0.569854736328125, -0.5314178466796875, -0.49298095703125, -0.4545440673828125, -0.416107177734375, -0.3776702880859375, -0.3392333984375, -0.3007965087890625, -0.262359619140625, -0.2239227294921875, -0.18548583984375, -0.1470489501953125, -0.108612060546875, -0.0701751708984375, -0.03173828125, 0.0066986083984375, 0.045135498046875, 0.0835723876953125, 0.12200927734375, 0.1604461669921875, 0.198883056640625, 0.2373199462890625, 0.2757568359375, 0.3141937255859375, 0.352630615234375, 0.3910675048828125, 0.42950439453125, 0.4679412841796875, 0.506378173828125, 0.5448150634765625, 0.583251953125, 0.6216888427734375, 0.660125732421875, 0.6985626220703125, 0.73699951171875, 0.7754364013671875, 0.813873291015625, 0.8523101806640625, 0.8907470703125, 0.9291839599609375, 0.967620849609375, 1.0060577392578125, 1.04449462890625, 1.0829315185546875, 1.121368408203125, 1.1598052978515625, 1.1982421875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 7.0, 7.0, 4.0, 6.0, 7.0, 11.0, 6.0, 6.0, 15.0, 24.0, 20.0, 18.0, 36.0, 37.0, 36.0, 33.0, 49.0, 39.0, 41.0, 31.0, 49.0, 1069.0, 31.0, 47.0, 46.0, 36.0, 40.0, 40.0, 35.0, 32.0, 26.0, 24.0, 24.0, 23.0, 14.0, 12.0, 13.0, 10.0, 6.0, 6.0, 7.0, 4.0, 6.0, 3.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.78125, -15.24755859375, -14.7138671875, -14.18017578125, -13.646484375, -13.11279296875, -12.5791015625, -12.04541015625, -11.51171875, -10.97802734375, -10.4443359375, -9.91064453125, -9.376953125, -8.84326171875, -8.3095703125, -7.77587890625, -7.2421875, -6.70849609375, -6.1748046875, -5.64111328125, -5.107421875, -4.57373046875, -4.0400390625, -3.50634765625, -2.97265625, -2.43896484375, -1.9052734375, -1.37158203125, -0.837890625, -0.30419921875, 0.2294921875, 0.76318359375, 1.296875, 1.83056640625, 2.3642578125, 2.89794921875, 3.431640625, 3.96533203125, 4.4990234375, 5.03271484375, 5.56640625, 6.10009765625, 6.6337890625, 7.16748046875, 7.701171875, 8.23486328125, 8.7685546875, 9.30224609375, 9.8359375, 10.36962890625, 10.9033203125, 11.43701171875, 11.970703125, 12.50439453125, 13.0380859375, 13.57177734375, 14.10546875, 14.63916015625, 15.1728515625, 15.70654296875, 16.240234375, 16.77392578125, 17.3076171875, 17.84130859375, 18.375]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 7.0, 20.0, 14.0, 24.0, 49.0, 65.0, 72.0, 148.0, 225.0, 351.0, 464.0, 727.0, 1005.0, 1510.0, 2138.0, 3139.0, 4565.0, 6937.0, 10322.0, 15610.0, 24321.0, 38225.0, 61161.0, 100914.0, 170499.0, 1266645.0, 148471.0, 87944.0, 53659.0, 33552.0, 21504.0, 14097.0, 9351.0, 6187.0, 4102.0, 2868.0, 1990.0, 1358.0, 969.0, 664.0, 406.0, 291.0, 196.0, 132.0, 82.0, 58.0, 30.0, 22.0, 16.0, 14.0, 8.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0], "bins": [-1.03125, -0.9993896484375, -0.967529296875, -0.9356689453125, -0.90380859375, -0.8719482421875, -0.840087890625, -0.8082275390625, -0.7763671875, -0.7445068359375, -0.712646484375, -0.6807861328125, -0.64892578125, -0.6170654296875, -0.585205078125, -0.5533447265625, -0.521484375, -0.4896240234375, -0.457763671875, -0.4259033203125, -0.39404296875, -0.3621826171875, -0.330322265625, -0.2984619140625, -0.2666015625, -0.2347412109375, -0.202880859375, -0.1710205078125, -0.13916015625, -0.1072998046875, -0.075439453125, -0.0435791015625, -0.01171875, 0.0201416015625, 0.052001953125, 0.0838623046875, 0.11572265625, 0.1475830078125, 0.179443359375, 0.2113037109375, 0.2431640625, 0.2750244140625, 0.306884765625, 0.3387451171875, 0.37060546875, 0.4024658203125, 0.434326171875, 0.4661865234375, 0.498046875, 0.5299072265625, 0.561767578125, 0.5936279296875, 0.62548828125, 0.6573486328125, 0.689208984375, 0.7210693359375, 0.7529296875, 0.7847900390625, 0.816650390625, 0.8485107421875, 0.88037109375, 0.9122314453125, 0.944091796875, 0.9759521484375, 1.0078125]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 5.0, 3.0, 2.0, 0.0, 6.0, 5.0, 4.0, 4.0, 3.0, 9.0, 11.0, 13.0, 13.0, 17.0, 25.0, 29.0, 26.0, 32.0, 36.0, 48.0, 40.0, 42.0, 44.0, 49.0, 51.0, 69.0, 52.0, 48.0, 46.0, 41.0, 44.0, 34.0, 24.0, 30.0, 22.0, 9.0, 17.0, 9.0, 6.0, 2.0, 12.0, 4.0, 6.0, 2.0, 5.0, 1.0, 1.0, 4.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.004474639892578125, -0.004335999488830566, -0.004197359085083008, -0.004058718681335449, -0.003920078277587891, -0.003781437873840332, -0.0036427974700927734, -0.003504157066345215, -0.0033655166625976562, -0.0032268762588500977, -0.003088235855102539, -0.0029495954513549805, -0.002810955047607422, -0.0026723146438598633, -0.0025336742401123047, -0.002395033836364746, -0.0022563934326171875, -0.002117753028869629, -0.0019791126251220703, -0.0018404722213745117, -0.0017018318176269531, -0.0015631914138793945, -0.001424551010131836, -0.0012859106063842773, -0.0011472702026367188, -0.0010086297988891602, -0.0008699893951416016, -0.000731348991394043, -0.0005927085876464844, -0.0004540681838989258, -0.0003154277801513672, -0.0001767873764038086, -3.814697265625e-05, 0.0001004934310913086, 0.0002391338348388672, 0.0003777742385864258, 0.0005164146423339844, 0.000655055046081543, 0.0007936954498291016, 0.0009323358535766602, 0.0010709762573242188, 0.0012096166610717773, 0.001348257064819336, 0.0014868974685668945, 0.0016255378723144531, 0.0017641782760620117, 0.0019028186798095703, 0.002041459083557129, 0.0021800994873046875, 0.002318739891052246, 0.0024573802947998047, 0.0025960206985473633, 0.002734661102294922, 0.0028733015060424805, 0.003011941909790039, 0.0031505823135375977, 0.0032892227172851562, 0.003427863121032715, 0.0035665035247802734, 0.003705143928527832, 0.0038437843322753906, 0.003982424736022949, 0.004121065139770508, 0.004259705543518066, 0.004398345947265625]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 6.0, 4.0, 3.0, 1.0, 2.0, 2.0, 9.0, 9.0, 8.0, 6.0, 14.0, 14.0, 8.0, 19.0, 27.0, 21.0, 41.0, 41.0, 68.0, 94.0, 125.0, 165.0, 257.0, 524.0, 3718.0, 902116.0, 138796.0, 1296.0, 383.0, 201.0, 134.0, 97.0, 81.0, 67.0, 51.0, 29.0, 23.0, 26.0, 14.0, 14.0, 14.0, 6.0, 4.0, 5.0, 9.0, 7.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.093994140625, -0.09104061126708984, -0.08808708190917969, -0.08513355255126953, -0.08218002319335938, -0.07922649383544922, -0.07627296447753906, -0.0733194351196289, -0.07036590576171875, -0.0674123764038086, -0.06445884704589844, -0.06150531768798828, -0.058551788330078125, -0.05559825897216797, -0.05264472961425781, -0.049691200256347656, -0.0467376708984375, -0.043784141540527344, -0.04083061218261719, -0.03787708282470703, -0.034923553466796875, -0.03197002410888672, -0.029016494750976562, -0.026062965393066406, -0.02310943603515625, -0.020155906677246094, -0.017202377319335938, -0.014248847961425781, -0.011295318603515625, -0.008341789245605469, -0.0053882598876953125, -0.0024347305297851562, 0.000518798828125, 0.0034723281860351562, 0.0064258575439453125, 0.009379386901855469, 0.012332916259765625, 0.015286445617675781, 0.018239974975585938, 0.021193504333496094, 0.02414703369140625, 0.027100563049316406, 0.030054092407226562, 0.03300762176513672, 0.035961151123046875, 0.03891468048095703, 0.04186820983886719, 0.044821739196777344, 0.0477752685546875, 0.050728797912597656, 0.05368232727050781, 0.05663585662841797, 0.059589385986328125, 0.06254291534423828, 0.06549644470214844, 0.0684499740600586, 0.07140350341796875, 0.0743570327758789, 0.07731056213378906, 0.08026409149169922, 0.08321762084960938, 0.08617115020751953, 0.08912467956542969, 0.09207820892333984, 0.09503173828125]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 33.0, 751.0, 232.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0036853814963251352, -0.0026991544291377068, -0.001712927594780922, -0.0007267005275934935, 0.00025952630676329136, 0.0012457531411200762, 0.0022319804411381483, 0.003218207275494933, 0.004204434342682362, 0.005190661177039146, 0.006176888011395931, 0.007163115311414003, 0.008149342611432076, 0.009135568514466286, 0.010121796280145645, 0.01110802311450243, 0.012094249948859215, 0.013080476783216, 0.014066703617572784, 0.015052931383252144, 0.016039157286286354, 0.017025385051965714, 0.018011610954999924, 0.018997838720679283, 0.019984064623713493, 0.020970292389392853, 0.021956518292427063, 0.022942746058106422, 0.023928971961140633, 0.024915199726819992, 0.025901425629854202, 0.02688765339553356, 0.02787388116121292, 0.02886010892689228, 0.02984633482992649, 0.03083256259560585, 0.03181878849864006, 0.03280501440167427, 0.03379124402999878, 0.03477746993303299, 0.0357636958360672, 0.03674992173910141, 0.03773615136742592, 0.03872237727046013, 0.03970860317349434, 0.04069482907652855, 0.04168105870485306, 0.04266728460788727, 0.04365351051092148, 0.04463973641395569, 0.0456259660422802, 0.04661219194531441, 0.04759841784834862, 0.04858464375138283, 0.049570873379707336, 0.05055709928274155, 0.051543328911066055, 0.052529554814100266, 0.053515784442424774, 0.054502010345458984, 0.055488236248493195, 0.056474462151527405, 0.05746069177985191, 0.058446917682886124, 0.059433143585920334]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 6.0, 2.0, 6.0, 5.0, 6.0, 7.0, 12.0, 18.0, 7.0, 15.0, 19.0, 29.0, 28.0, 25.0, 39.0, 41.0, 45.0, 38.0, 41.0, 46.0, 52.0, 42.0, 45.0, 47.0, 41.0, 42.0, 43.0, 48.0, 36.0, 34.0, 22.0, 18.0, 12.0, 20.0, 20.0, 18.0, 7.0, 5.0, 8.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.0033148527145385742, -0.0032183146104216576, -0.003121776506304741, -0.0030252384021878242, -0.0029287002980709076, -0.002832162193953991, -0.0027356240898370743, -0.0026390859857201576, -0.002542547881603241, -0.0024460097774863243, -0.0023494716733694077, -0.002252933569252491, -0.0021563954651355743, -0.0020598573610186577, -0.001963319256901741, -0.0018667811527848244, -0.0017702430486679077, -0.001673704944550991, -0.0015771668404340744, -0.0014806287363171577, -0.001384090632200241, -0.0012875525280833244, -0.0011910144239664078, -0.0010944763198494911, -0.0009979382157325745, -0.0009014001116156578, -0.0008048620074987411, -0.0007083239033818245, -0.0006117857992649078, -0.0005152476951479912, -0.0004187095910310745, -0.00032217148691415787, -0.0002256333827972412, -0.00012909527868032455, -3.25571745634079e-05, 6.398092955350876e-05, 0.00016051903367042542, 0.00025705713778734207, 0.00035359524190425873, 0.0004501333460211754, 0.000546671450138092, 0.0006432095542550087, 0.0007397476583719254, 0.000836285762488842, 0.0009328238666057587, 0.0010293619707226753, 0.001125900074839592, 0.0012224381789565086, 0.0013189762830734253, 0.001415514387190342, 0.0015120524913072586, 0.0016085905954241753, 0.001705128699541092, 0.0018016668036580086, 0.0018982049077749252, 0.001994743011891842, 0.0020912811160087585, 0.002187819220125675, 0.002284357324242592, 0.0023808954283595085, 0.002477433532476425, 0.002573971636593342, 0.0026705097407102585, 0.002767047844827175, 0.002863585948944092]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 7.0, 4.0, 4.0, 6.0, 10.0, 13.0, 8.0, 4.0, 14.0, 17.0, 14.0, 14.0, 28.0, 29.0, 22.0, 32.0, 25.0, 41.0, 33.0, 44.0, 53.0, 47.0, 52.0, 47.0, 32.0, 45.0, 42.0, 40.0, 41.0, 28.0, 29.0, 23.0, 20.0, 21.0, 18.0, 21.0, 14.0, 13.0, 14.0, 11.0, 9.0, 2.0, 5.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-26.40625, -25.624755859375, -24.84326171875, -24.061767578125, -23.2802734375, -22.498779296875, -21.71728515625, -20.935791015625, -20.154296875, -19.372802734375, -18.59130859375, -17.809814453125, -17.0283203125, -16.246826171875, -15.46533203125, -14.683837890625, -13.90234375, -13.120849609375, -12.33935546875, -11.557861328125, -10.7763671875, -9.994873046875, -9.21337890625, -8.431884765625, -7.650390625, -6.868896484375, -6.08740234375, -5.305908203125, -4.5244140625, -3.742919921875, -2.96142578125, -2.179931640625, -1.3984375, -0.616943359375, 0.16455078125, 0.946044921875, 1.7275390625, 2.509033203125, 3.29052734375, 4.072021484375, 4.853515625, 5.635009765625, 6.41650390625, 7.197998046875, 7.9794921875, 8.760986328125, 9.54248046875, 10.323974609375, 11.10546875, 11.886962890625, 12.66845703125, 13.449951171875, 14.2314453125, 15.012939453125, 15.79443359375, 16.575927734375, 17.357421875, 18.138916015625, 18.92041015625, 19.701904296875, 20.4833984375, 21.264892578125, 22.04638671875, 22.827880859375, 23.609375]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 3.0, 4.0, 8.0, 9.0, 9.0, 16.0, 25.0, 25.0, 24.0, 28.0, 56.0, 63.0, 67.0, 99.0, 138.0, 183.0, 295.0, 374.0, 520.0, 889.0, 1581.0, 3785.0, 10974.0, 49929.0, 766488.0, 177895.0, 22641.0, 6385.0, 2490.0, 1207.0, 675.0, 443.0, 308.0, 228.0, 178.0, 119.0, 91.0, 70.0, 57.0, 42.0, 31.0, 30.0, 20.0, 17.0, 7.0, 14.0, 4.0, 5.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0], "bins": [-65.375, -63.43896484375, -61.5029296875, -59.56689453125, -57.630859375, -55.69482421875, -53.7587890625, -51.82275390625, -49.88671875, -47.95068359375, -46.0146484375, -44.07861328125, -42.142578125, -40.20654296875, -38.2705078125, -36.33447265625, -34.3984375, -32.46240234375, -30.5263671875, -28.59033203125, -26.654296875, -24.71826171875, -22.7822265625, -20.84619140625, -18.91015625, -16.97412109375, -15.0380859375, -13.10205078125, -11.166015625, -9.22998046875, -7.2939453125, -5.35791015625, -3.421875, -1.48583984375, 0.4501953125, 2.38623046875, 4.322265625, 6.25830078125, 8.1943359375, 10.13037109375, 12.06640625, 14.00244140625, 15.9384765625, 17.87451171875, 19.810546875, 21.74658203125, 23.6826171875, 25.61865234375, 27.5546875, 29.49072265625, 31.4267578125, 33.36279296875, 35.298828125, 37.23486328125, 39.1708984375, 41.10693359375, 43.04296875, 44.97900390625, 46.9150390625, 48.85107421875, 50.787109375, 52.72314453125, 54.6591796875, 56.59521484375, 58.53125]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 3.0, 6.0, 6.0, 4.0, 12.0, 6.0, 11.0, 10.0, 18.0, 16.0, 25.0, 18.0, 17.0, 28.0, 28.0, 29.0, 29.0, 45.0, 41.0, 47.0, 97.0, 142.0, 1524.0, 309.0, 114.0, 64.0, 39.0, 43.0, 36.0, 31.0, 38.0, 26.0, 21.0, 23.0, 19.0, 15.0, 18.0, 14.0, 11.0, 11.0, 10.0, 6.0, 6.0, 5.0, 6.0, 8.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-55.28125, -53.60009765625, -51.9189453125, -50.23779296875, -48.556640625, -46.87548828125, -45.1943359375, -43.51318359375, -41.83203125, -40.15087890625, -38.4697265625, -36.78857421875, -35.107421875, -33.42626953125, -31.7451171875, -30.06396484375, -28.3828125, -26.70166015625, -25.0205078125, -23.33935546875, -21.658203125, -19.97705078125, -18.2958984375, -16.61474609375, -14.93359375, -13.25244140625, -11.5712890625, -9.89013671875, -8.208984375, -6.52783203125, -4.8466796875, -3.16552734375, -1.484375, 0.19677734375, 1.8779296875, 3.55908203125, 5.240234375, 6.92138671875, 8.6025390625, 10.28369140625, 11.96484375, 13.64599609375, 15.3271484375, 17.00830078125, 18.689453125, 20.37060546875, 22.0517578125, 23.73291015625, 25.4140625, 27.09521484375, 28.7763671875, 30.45751953125, 32.138671875, 33.81982421875, 35.5009765625, 37.18212890625, 38.86328125, 40.54443359375, 42.2255859375, 43.90673828125, 45.587890625, 47.26904296875, 48.9501953125, 50.63134765625, 52.3125]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 7.0, 6.0, 7.0, 8.0, 3.0, 10.0, 13.0, 8.0, 17.0, 27.0, 16.0, 18.0, 28.0, 33.0, 31.0, 53.0, 60.0, 82.0, 93.0, 164.0, 391.0, 1195.0, 14427.0, 3024840.0, 100213.0, 2627.0, 505.0, 244.0, 142.0, 84.0, 64.0, 52.0, 38.0, 31.0, 26.0, 19.0, 18.0, 16.0, 23.0, 9.0, 8.0, 13.0, 9.0, 5.0, 6.0, 6.0, 3.0, 7.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0], "bins": [-138.5, -133.990234375, -129.48046875, -124.970703125, -120.4609375, -115.951171875, -111.44140625, -106.931640625, -102.421875, -97.912109375, -93.40234375, -88.892578125, -84.3828125, -79.873046875, -75.36328125, -70.853515625, -66.34375, -61.833984375, -57.32421875, -52.814453125, -48.3046875, -43.794921875, -39.28515625, -34.775390625, -30.265625, -25.755859375, -21.24609375, -16.736328125, -12.2265625, -7.716796875, -3.20703125, 1.302734375, 5.8125, 10.322265625, 14.83203125, 19.341796875, 23.8515625, 28.361328125, 32.87109375, 37.380859375, 41.890625, 46.400390625, 50.91015625, 55.419921875, 59.9296875, 64.439453125, 68.94921875, 73.458984375, 77.96875, 82.478515625, 86.98828125, 91.498046875, 96.0078125, 100.517578125, 105.02734375, 109.537109375, 114.046875, 118.556640625, 123.06640625, 127.576171875, 132.0859375, 136.595703125, 141.10546875, 145.615234375, 150.125]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 7.0, 14.0, 25.0, 29.0, 52.0, 61.0, 112.0, 129.0, 136.0, 133.0, 97.0, 82.0, 48.0, 34.0, 21.0, 7.0, 12.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-48.696502685546875, -46.86695861816406, -45.03741455078125, -43.20787048339844, -41.378326416015625, -39.54878234863281, -37.71923828125, -35.88969421386719, -34.060150146484375, -32.23060607910156, -30.40106201171875, -28.571517944335938, -26.741973876953125, -24.912429809570312, -23.0828857421875, -21.253341674804688, -19.423795700073242, -17.59425163269043, -15.764707565307617, -13.935163497924805, -12.105619430541992, -10.276074409484863, -8.44653034210205, -6.616986274719238, -4.787442207336426, -2.9578981399536133, -1.1283538341522217, 0.7011904716491699, 2.5307345390319824, 4.360279083251953, 6.189823150634766, 8.019367218017578, 9.84891128540039, 11.678455352783203, 13.507999420166016, 15.337543487548828, 17.16708755493164, 18.996631622314453, 20.826175689697266, 22.655719757080078, 24.48526382446289, 26.314807891845703, 28.144351959228516, 29.973896026611328, 31.80344009399414, 33.63298416137695, 35.462528228759766, 37.29207229614258, 39.121620178222656, 40.95116424560547, 42.78070831298828, 44.610252380371094, 46.439796447753906, 48.26934051513672, 50.09888458251953, 51.928428649902344, 53.757972717285156, 55.58751678466797, 57.41706085205078, 59.246604919433594, 61.076148986816406, 62.90569305419922, 64.73523712158203, 66.56478118896484, 68.39432525634766]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 7.0, 2.0, 7.0, 14.0, 8.0, 9.0, 9.0, 19.0, 20.0, 16.0, 26.0, 21.0, 22.0, 27.0, 29.0, 27.0, 57.0, 42.0, 22.0, 34.0, 46.0, 45.0, 37.0, 34.0, 35.0, 44.0, 41.0, 39.0, 26.0, 27.0, 21.0, 31.0, 24.0, 23.0, 14.0, 16.0, 14.0, 13.0, 8.0, 8.0, 10.0, 7.0, 6.0, 5.0, 2.0, 3.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-151.99923706054688, -147.45291137695312, -142.9065704345703, -138.3602294921875, -133.81390380859375, -129.267578125, -124.72123718261719, -120.1749038696289, -115.62857055664062, -111.08223724365234, -106.53590393066406, -101.98957061767578, -97.4432373046875, -92.89690399169922, -88.35057067871094, -83.80423736572266, -79.25790405273438, -74.7115707397461, -70.16523742675781, -65.61890411376953, -61.07257080078125, -56.52623748779297, -51.97990417480469, -47.433570861816406, -42.887237548828125, -38.340904235839844, -33.79457092285156, -29.24823760986328, -24.701904296875, -20.15557098388672, -15.609237670898438, -11.062904357910156, -6.5165863037109375, -1.9702529907226562, 2.576080322265625, 7.122413635253906, 11.668746948242188, 16.21508026123047, 20.76141357421875, 25.30774688720703, 29.854080200195312, 34.400413513183594, 38.946746826171875, 43.493080139160156, 48.03941345214844, 52.58574676513672, 57.132080078125, 61.67841339111328, 66.22474670410156, 70.77108001708984, 75.31741333007812, 79.8637466430664, 84.41007995605469, 88.95641326904297, 93.50274658203125, 98.04907989501953, 102.59541320800781, 107.1417465209961, 111.68807983398438, 116.23441314697266, 120.78074645996094, 125.32707977294922, 129.8734130859375, 134.41973876953125, 138.96607971191406]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 6.0, 4.0, 8.0, 7.0, 4.0, 15.0, 10.0, 15.0, 12.0, 16.0, 21.0, 22.0, 23.0, 29.0, 43.0, 35.0, 43.0, 38.0, 44.0, 42.0, 59.0, 47.0, 31.0, 56.0, 37.0, 40.0, 34.0, 34.0, 26.0, 38.0, 27.0, 18.0, 18.0, 18.0, 13.0, 19.0, 12.0, 3.0, 10.0, 11.0, 5.0, 2.0, 6.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-28.125, -27.3046875, -26.484375, -25.6640625, -24.84375, -24.0234375, -23.203125, -22.3828125, -21.5625, -20.7421875, -19.921875, -19.1015625, -18.28125, -17.4609375, -16.640625, -15.8203125, -15.0, -14.1796875, -13.359375, -12.5390625, -11.71875, -10.8984375, -10.078125, -9.2578125, -8.4375, -7.6171875, -6.796875, -5.9765625, -5.15625, -4.3359375, -3.515625, -2.6953125, -1.875, -1.0546875, -0.234375, 0.5859375, 1.40625, 2.2265625, 3.046875, 3.8671875, 4.6875, 5.5078125, 6.328125, 7.1484375, 7.96875, 8.7890625, 9.609375, 10.4296875, 11.25, 12.0703125, 12.890625, 13.7109375, 14.53125, 15.3515625, 16.171875, 16.9921875, 17.8125, 18.6328125, 19.453125, 20.2734375, 21.09375, 21.9140625, 22.734375, 23.5546875, 24.375]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 9.0, 4.0, 13.0, 10.0, 26.0, 21.0, 24.0, 52.0, 73.0, 106.0, 136.0, 225.0, 366.0, 614.0, 1061.0, 2114.0, 4809.0, 17277.0, 274006.0, 3303889.0, 551665.0, 25892.0, 6052.0, 2547.0, 1288.0, 720.0, 433.0, 274.0, 177.0, 122.0, 74.0, 62.0, 40.0, 29.0, 24.0, 14.0, 13.0, 8.0, 4.0, 6.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.1875, -64.21826171875, -62.2490234375, -60.27978515625, -58.310546875, -56.34130859375, -54.3720703125, -52.40283203125, -50.43359375, -48.46435546875, -46.4951171875, -44.52587890625, -42.556640625, -40.58740234375, -38.6181640625, -36.64892578125, -34.6796875, -32.71044921875, -30.7412109375, -28.77197265625, -26.802734375, -24.83349609375, -22.8642578125, -20.89501953125, -18.92578125, -16.95654296875, -14.9873046875, -13.01806640625, -11.048828125, -9.07958984375, -7.1103515625, -5.14111328125, -3.171875, -1.20263671875, 0.7666015625, 2.73583984375, 4.705078125, 6.67431640625, 8.6435546875, 10.61279296875, 12.58203125, 14.55126953125, 16.5205078125, 18.48974609375, 20.458984375, 22.42822265625, 24.3974609375, 26.36669921875, 28.3359375, 30.30517578125, 32.2744140625, 34.24365234375, 36.212890625, 38.18212890625, 40.1513671875, 42.12060546875, 44.08984375, 46.05908203125, 48.0283203125, 49.99755859375, 51.966796875, 53.93603515625, 55.9052734375, 57.87451171875, 59.84375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 8.0, 10.0, 24.0, 34.0, 49.0, 120.0, 392.0, 1322.0, 1356.0, 456.0, 165.0, 68.0, 32.0, 18.0, 9.0, 7.0, 1.0, 3.0, 4.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.125, -48.29296875, -45.4609375, -42.62890625, -39.796875, -36.96484375, -34.1328125, -31.30078125, -28.46875, -25.63671875, -22.8046875, -19.97265625, -17.140625, -14.30859375, -11.4765625, -8.64453125, -5.8125, -2.98046875, -0.1484375, 2.68359375, 5.515625, 8.34765625, 11.1796875, 14.01171875, 16.84375, 19.67578125, 22.5078125, 25.33984375, 28.171875, 31.00390625, 33.8359375, 36.66796875, 39.5, 42.33203125, 45.1640625, 47.99609375, 50.828125, 53.66015625, 56.4921875, 59.32421875, 62.15625, 64.98828125, 67.8203125, 70.65234375, 73.484375, 76.31640625, 79.1484375, 81.98046875, 84.8125, 87.64453125, 90.4765625, 93.30859375, 96.140625, 98.97265625, 101.8046875, 104.63671875, 107.46875, 110.30078125, 113.1328125, 115.96484375, 118.796875, 121.62890625, 124.4609375, 127.29296875, 130.125]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 9.0, 11.0, 16.0, 25.0, 31.0, 54.0, 86.0, 146.0, 394.0, 1368.0, 9486.0, 3415018.0, 758824.0, 7136.0, 998.0, 331.0, 137.0, 90.0, 61.0, 26.0, 21.0, 9.0, 7.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-315.25, -307.548828125, -299.84765625, -292.146484375, -284.4453125, -276.744140625, -269.04296875, -261.341796875, -253.640625, -245.939453125, -238.23828125, -230.537109375, -222.8359375, -215.134765625, -207.43359375, -199.732421875, -192.03125, -184.330078125, -176.62890625, -168.927734375, -161.2265625, -153.525390625, -145.82421875, -138.123046875, -130.421875, -122.720703125, -115.01953125, -107.318359375, -99.6171875, -91.916015625, -84.21484375, -76.513671875, -68.8125, -61.111328125, -53.41015625, -45.708984375, -38.0078125, -30.306640625, -22.60546875, -14.904296875, -7.203125, 0.498046875, 8.19921875, 15.900390625, 23.6015625, 31.302734375, 39.00390625, 46.705078125, 54.40625, 62.107421875, 69.80859375, 77.509765625, 85.2109375, 92.912109375, 100.61328125, 108.314453125, 116.015625, 123.716796875, 131.41796875, 139.119140625, 146.8203125, 154.521484375, 162.22265625, 169.923828125, 177.625]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 18.0, 48.0, 177.0, 446.0, 232.0, 61.0, 22.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-663.81103515625, -648.5704956054688, -633.3299560546875, -618.08935546875, -602.8488159179688, -587.6082763671875, -572.3677368164062, -557.127197265625, -541.8865966796875, -526.6460571289062, -511.4054870605469, -496.1649475097656, -480.92437744140625, -465.683837890625, -450.44329833984375, -435.2027587890625, -419.96221923828125, -404.7216796875, -389.4811096191406, -374.2405700683594, -359.0, -343.75946044921875, -328.5189208984375, -313.27838134765625, -298.0378112792969, -282.7972717285156, -267.55670166015625, -252.316162109375, -237.0756072998047, -221.83505249023438, -206.59451293945312, -191.3539581298828, -176.1134033203125, -160.8728485107422, -145.63229370117188, -130.39175415039062, -115.15119934082031, -99.91064453125, -84.67009735107422, -69.42955017089844, -54.188995361328125, -38.94844436645508, -23.70789337158203, -8.467342376708984, 6.7732086181640625, 22.013763427734375, 37.254310607910156, 52.49485778808594, 67.73541259765625, 82.97596740722656, 98.21651458740234, 113.45706176757812, 128.69761657714844, 143.93817138671875, 159.1787109375, 174.4192657470703, 189.65982055664062, 204.90037536621094, 220.14093017578125, 235.3814697265625, 250.6220245361328, 265.8625793457031, 281.1031188964844, 296.34368896484375, 311.584228515625]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 0.0, 5.0, 5.0, 2.0, 8.0, 6.0, 10.0, 14.0, 11.0, 13.0, 24.0, 22.0, 27.0, 23.0, 23.0, 41.0, 25.0, 39.0, 45.0, 44.0, 34.0, 33.0, 33.0, 31.0, 48.0, 45.0, 39.0, 36.0, 45.0, 37.0, 30.0, 32.0, 21.0, 20.0, 16.0, 21.0, 19.0, 13.0, 13.0, 8.0, 5.0, 8.0, 6.0, 8.0, 5.0, 3.0, 7.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-109.99964141845703, -106.5563735961914, -103.11309814453125, -99.66983032226562, -96.2265625, -92.78329467773438, -89.34002685546875, -85.8967514038086, -82.45348358154297, -79.01021575927734, -75.56694030761719, -72.12367248535156, -68.68040466308594, -65.23713684082031, -61.79386520385742, -58.35059356689453, -54.907325744628906, -51.46405792236328, -48.02078628540039, -44.5775146484375, -41.134246826171875, -37.69097900390625, -34.24770736694336, -30.8044376373291, -27.361167907714844, -23.917898178100586, -20.474628448486328, -17.03135871887207, -13.588088989257812, -10.144819259643555, -6.701549530029297, -3.258279800415039, 0.1849822998046875, 3.6282520294189453, 7.071521759033203, 10.514791488647461, 13.958061218261719, 17.401330947875977, 20.844600677490234, 24.287870407104492, 27.73114013671875, 31.174409866333008, 34.617679595947266, 38.060951232910156, 41.50421905517578, 44.947486877441406, 48.3907585144043, 51.83403015136719, 55.27729797363281, 58.72056579589844, 62.16383743286133, 65.60710906982422, 69.05037689208984, 72.49364471435547, 75.93692016601562, 79.38018798828125, 82.82345581054688, 86.2667236328125, 89.70999145507812, 93.15326690673828, 96.5965347290039, 100.03980255126953, 103.48307800292969, 106.92634582519531, 110.36961364746094]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 9.0, 7.0, 8.0, 3.0, 8.0, 8.0, 6.0, 14.0, 14.0, 19.0, 16.0, 30.0, 25.0, 38.0, 29.0, 29.0, 30.0, 33.0, 36.0, 38.0, 29.0, 50.0, 43.0, 46.0, 44.0, 45.0, 28.0, 29.0, 38.0, 27.0, 34.0, 29.0, 19.0, 21.0, 17.0, 10.0, 21.0, 14.0, 13.0, 12.0, 7.0, 4.0, 7.0, 9.0, 6.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0], "bins": [-26.296875, -25.53466796875, -24.7724609375, -24.01025390625, -23.248046875, -22.48583984375, -21.7236328125, -20.96142578125, -20.19921875, -19.43701171875, -18.6748046875, -17.91259765625, -17.150390625, -16.38818359375, -15.6259765625, -14.86376953125, -14.1015625, -13.33935546875, -12.5771484375, -11.81494140625, -11.052734375, -10.29052734375, -9.5283203125, -8.76611328125, -8.00390625, -7.24169921875, -6.4794921875, -5.71728515625, -4.955078125, -4.19287109375, -3.4306640625, -2.66845703125, -1.90625, -1.14404296875, -0.3818359375, 0.38037109375, 1.142578125, 1.90478515625, 2.6669921875, 3.42919921875, 4.19140625, 4.95361328125, 5.7158203125, 6.47802734375, 7.240234375, 8.00244140625, 8.7646484375, 9.52685546875, 10.2890625, 11.05126953125, 11.8134765625, 12.57568359375, 13.337890625, 14.10009765625, 14.8623046875, 15.62451171875, 16.38671875, 17.14892578125, 17.9111328125, 18.67333984375, 19.435546875, 20.19775390625, 20.9599609375, 21.72216796875, 22.484375]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 5.0, 5.0, 8.0, 8.0, 10.0, 8.0, 15.0, 32.0, 47.0, 64.0, 99.0, 155.0, 193.0, 287.0, 389.0, 524.0, 809.0, 1179.0, 1673.0, 2454.0, 3625.0, 5218.0, 7694.0, 11569.0, 17553.0, 26742.0, 41398.0, 66022.0, 107842.0, 175530.0, 206529.0, 137841.0, 83379.0, 51943.0, 32733.0, 21423.0, 13993.0, 9331.0, 6322.0, 4330.0, 2973.0, 1994.0, 1408.0, 1025.0, 685.0, 470.0, 298.0, 232.0, 170.0, 116.0, 63.0, 38.0, 42.0, 25.0, 15.0, 17.0, 8.0, 2.0, 4.0, 2.0, 3.0, 2.0, 1.0], "bins": [-1.0654296875, -1.0313262939453125, -0.997222900390625, -0.9631195068359375, -0.92901611328125, -0.8949127197265625, -0.860809326171875, -0.8267059326171875, -0.7926025390625, -0.7584991455078125, -0.724395751953125, -0.6902923583984375, -0.65618896484375, -0.6220855712890625, -0.587982177734375, -0.5538787841796875, -0.519775390625, -0.4856719970703125, -0.451568603515625, -0.4174652099609375, -0.38336181640625, -0.3492584228515625, -0.315155029296875, -0.2810516357421875, -0.2469482421875, -0.2128448486328125, -0.178741455078125, -0.1446380615234375, -0.11053466796875, -0.0764312744140625, -0.042327880859375, -0.0082244873046875, 0.02587890625, 0.0599822998046875, 0.094085693359375, 0.1281890869140625, 0.16229248046875, 0.1963958740234375, 0.230499267578125, 0.2646026611328125, 0.2987060546875, 0.3328094482421875, 0.366912841796875, 0.4010162353515625, 0.43511962890625, 0.4692230224609375, 0.503326416015625, 0.5374298095703125, 0.571533203125, 0.6056365966796875, 0.639739990234375, 0.6738433837890625, 0.70794677734375, 0.7420501708984375, 0.776153564453125, 0.8102569580078125, 0.8443603515625, 0.8784637451171875, 0.912567138671875, 0.9466705322265625, 0.98077392578125, 1.0148773193359375, 1.048980712890625, 1.0830841064453125, 1.1171875]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 7.0, 4.0, 5.0, 9.0, 17.0, 13.0, 13.0, 15.0, 21.0, 21.0, 24.0, 38.0, 23.0, 27.0, 35.0, 28.0, 28.0, 34.0, 47.0, 36.0, 35.0, 24.0, 1065.0, 33.0, 41.0, 37.0, 25.0, 33.0, 28.0, 36.0, 22.0, 24.0, 17.0, 25.0, 16.0, 21.0, 23.0, 9.0, 23.0, 14.0, 6.0, 7.0, 6.0, 5.0, 2.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.4296875, -13.96826171875, -13.5068359375, -13.04541015625, -12.583984375, -12.12255859375, -11.6611328125, -11.19970703125, -10.73828125, -10.27685546875, -9.8154296875, -9.35400390625, -8.892578125, -8.43115234375, -7.9697265625, -7.50830078125, -7.046875, -6.58544921875, -6.1240234375, -5.66259765625, -5.201171875, -4.73974609375, -4.2783203125, -3.81689453125, -3.35546875, -2.89404296875, -2.4326171875, -1.97119140625, -1.509765625, -1.04833984375, -0.5869140625, -0.12548828125, 0.3359375, 0.79736328125, 1.2587890625, 1.72021484375, 2.181640625, 2.64306640625, 3.1044921875, 3.56591796875, 4.02734375, 4.48876953125, 4.9501953125, 5.41162109375, 5.873046875, 6.33447265625, 6.7958984375, 7.25732421875, 7.71875, 8.18017578125, 8.6416015625, 9.10302734375, 9.564453125, 10.02587890625, 10.4873046875, 10.94873046875, 11.41015625, 11.87158203125, 12.3330078125, 12.79443359375, 13.255859375, 13.71728515625, 14.1787109375, 14.64013671875, 15.1015625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 3.0, 4.0, 11.0, 15.0, 17.0, 30.0, 52.0, 71.0, 107.0, 154.0, 222.0, 286.0, 481.0, 603.0, 1013.0, 1412.0, 1997.0, 2802.0, 4050.0, 5631.0, 8093.0, 11356.0, 16298.0, 23479.0, 34122.0, 50029.0, 76379.0, 119817.0, 1174816.0, 219788.0, 114296.0, 73265.0, 48264.0, 32747.0, 22638.0, 15485.0, 11089.0, 7803.0, 5449.0, 3949.0, 2775.0, 1974.0, 1305.0, 944.0, 597.0, 441.0, 286.0, 241.0, 173.0, 91.0, 61.0, 42.0, 30.0, 26.0, 16.0, 6.0, 8.0, 2.0, 4.0, 1.0], "bins": [-0.908203125, -0.8806381225585938, -0.8530731201171875, -0.8255081176757812, -0.797943115234375, -0.7703781127929688, -0.7428131103515625, -0.7152481079101562, -0.68768310546875, -0.6601181030273438, -0.6325531005859375, -0.6049880981445312, -0.577423095703125, -0.5498580932617188, -0.5222930908203125, -0.49472808837890625, -0.4671630859375, -0.43959808349609375, -0.4120330810546875, -0.38446807861328125, -0.356903076171875, -0.32933807373046875, -0.3017730712890625, -0.27420806884765625, -0.24664306640625, -0.21907806396484375, -0.1915130615234375, -0.16394805908203125, -0.136383056640625, -0.10881805419921875, -0.0812530517578125, -0.05368804931640625, -0.026123046875, 0.00144195556640625, 0.0290069580078125, 0.05657196044921875, 0.084136962890625, 0.11170196533203125, 0.1392669677734375, 0.16683197021484375, 0.19439697265625, 0.22196197509765625, 0.2495269775390625, 0.27709197998046875, 0.304656982421875, 0.33222198486328125, 0.3597869873046875, 0.38735198974609375, 0.4149169921875, 0.44248199462890625, 0.4700469970703125, 0.49761199951171875, 0.525177001953125, 0.5527420043945312, 0.5803070068359375, 0.6078720092773438, 0.63543701171875, 0.6630020141601562, 0.6905670166015625, 0.7181320190429688, 0.745697021484375, 0.7732620239257812, 0.8008270263671875, 0.8283920288085938, 0.85595703125]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 2.0, 6.0, 4.0, 10.0, 16.0, 11.0, 17.0, 21.0, 17.0, 39.0, 43.0, 42.0, 47.0, 50.0, 50.0, 54.0, 70.0, 77.0, 62.0, 63.0, 56.0, 43.0, 39.0, 39.0, 29.0, 30.0, 19.0, 11.0, 11.0, 6.0, 7.0, 7.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004863739013671875, -0.004697918891906738, -0.0045320987701416016, -0.004366278648376465, -0.004200458526611328, -0.004034638404846191, -0.0038688182830810547, -0.003702998161315918, -0.0035371780395507812, -0.0033713579177856445, -0.003205537796020508, -0.003039717674255371, -0.0028738975524902344, -0.0027080774307250977, -0.002542257308959961, -0.0023764371871948242, -0.0022106170654296875, -0.0020447969436645508, -0.001878976821899414, -0.0017131567001342773, -0.0015473365783691406, -0.001381516456604004, -0.0012156963348388672, -0.0010498762130737305, -0.0008840560913085938, -0.000718235969543457, -0.0005524158477783203, -0.0003865957260131836, -0.00022077560424804688, -5.4955482482910156e-05, 0.00011086463928222656, 0.0002766847610473633, 0.0004425048828125, 0.0006083250045776367, 0.0007741451263427734, 0.0009399652481079102, 0.0011057853698730469, 0.0012716054916381836, 0.0014374256134033203, 0.001603245735168457, 0.0017690658569335938, 0.0019348859786987305, 0.002100706100463867, 0.002266526222229004, 0.0024323463439941406, 0.0025981664657592773, 0.002763986587524414, 0.0029298067092895508, 0.0030956268310546875, 0.0032614469528198242, 0.003427267074584961, 0.0035930871963500977, 0.0037589073181152344, 0.003924727439880371, 0.004090547561645508, 0.0042563676834106445, 0.004422187805175781, 0.004588007926940918, 0.004753828048706055, 0.004919648170471191, 0.005085468292236328, 0.005251288414001465, 0.0054171085357666016, 0.005582928657531738, 0.005748748779296875]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 12.0, 11.0, 14.0, 16.0, 19.0, 25.0, 47.0, 58.0, 80.0, 96.0, 95.0, 155.0, 300.0, 551.0, 3460.0, 976814.0, 64918.0, 862.0, 326.0, 190.0, 127.0, 104.0, 69.0, 43.0, 41.0, 29.0, 28.0, 16.0, 16.0, 13.0, 7.0, 5.0, 9.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.11383056640625, -0.11064529418945312, -0.10746002197265625, -0.10427474975585938, -0.1010894775390625, -0.09790420532226562, -0.09471893310546875, -0.09153366088867188, -0.088348388671875, -0.08516311645507812, -0.08197784423828125, -0.07879257202148438, -0.0756072998046875, -0.07242202758789062, -0.06923675537109375, -0.06605148315429688, -0.0628662109375, -0.059680938720703125, -0.05649566650390625, -0.053310394287109375, -0.0501251220703125, -0.046939849853515625, -0.04375457763671875, -0.040569305419921875, -0.037384033203125, -0.034198760986328125, -0.03101348876953125, -0.027828216552734375, -0.0246429443359375, -0.021457672119140625, -0.01827239990234375, -0.015087127685546875, -0.01190185546875, -0.008716583251953125, -0.00553131103515625, -0.002346038818359375, 0.0008392333984375, 0.004024505615234375, 0.00720977783203125, 0.010395050048828125, 0.013580322265625, 0.016765594482421875, 0.01995086669921875, 0.023136138916015625, 0.0263214111328125, 0.029506683349609375, 0.03269195556640625, 0.035877227783203125, 0.0390625, 0.042247772216796875, 0.04543304443359375, 0.048618316650390625, 0.0518035888671875, 0.054988861083984375, 0.05817413330078125, 0.061359405517578125, 0.064544677734375, 0.06772994995117188, 0.07091522216796875, 0.07410049438476562, 0.0772857666015625, 0.08047103881835938, 0.08365631103515625, 0.08684158325195312, 0.09002685546875]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 344.0, 653.0, 13.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01742071658372879, -0.0162674468010664, -0.015114178881049156, -0.013960909098386765, -0.012807640247046947, -0.01165437139570713, -0.010501101613044739, -0.009347832761704922, -0.008194563910365105, -0.007041295059025288, -0.005888025742024183, -0.004734756425023079, -0.003581487573683262, -0.002428218722343445, -0.0012749494053423405, -0.00012168008834123611, 0.001031588762998581, 0.0021848578471690416, 0.0033381269313395023, 0.004491396248340607, 0.005644665099680424, 0.006797933951020241, 0.007951203733682632, 0.00910447258502245, 0.010257741436362267, 0.011411010287702084, 0.0125642791390419, 0.013717548921704292, 0.01487081777304411, 0.016024086624383926, 0.017177356407046318, 0.01833062618970871, 0.01948389783501625, 0.020637167617678642, 0.021790435537695885, 0.022943705320358276, 0.02409697324037552, 0.02525024302303791, 0.026403512805700302, 0.027556780725717545, 0.028710050508379936, 0.029863320291042328, 0.03101658821105957, 0.03216985613107681, 0.033323127776384354, 0.034476395696401596, 0.03562966361641884, 0.03678293526172638, 0.03793620318174362, 0.039089471101760864, 0.040242742747068405, 0.04139601066708565, 0.04254927858710289, 0.04370255023241043, 0.04485581815242767, 0.046009086072444916, 0.04716235399246216, 0.0483156219124794, 0.04946889355778694, 0.050622161477804184, 0.051775429397821426, 0.05292870104312897, 0.05408196896314621, 0.05523523688316345, 0.05638850852847099]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 5.0, 6.0, 7.0, 0.0, 8.0, 15.0, 11.0, 17.0, 15.0, 25.0, 13.0, 30.0, 26.0, 38.0, 47.0, 45.0, 40.0, 45.0, 53.0, 62.0, 47.0, 49.0, 50.0, 42.0, 44.0, 36.0, 36.0, 44.0, 34.0, 31.0, 17.0, 22.0, 16.0, 14.0, 3.0, 5.0, 4.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0034325718879699707, -0.0033309776335954666, -0.0032293833792209625, -0.0031277891248464584, -0.0030261948704719543, -0.0029246006160974503, -0.002823006361722946, -0.002721412107348442, -0.002619817852973938, -0.002518223598599434, -0.00241662934422493, -0.0023150350898504257, -0.0022134408354759216, -0.0021118465811014175, -0.0020102523267269135, -0.0019086580723524094, -0.0018070638179779053, -0.0017054695636034012, -0.001603875309228897, -0.001502281054854393, -0.001400686800479889, -0.0012990925461053848, -0.0011974982917308807, -0.0010959040373563766, -0.0009943097829818726, -0.0008927155286073685, -0.0007911212742328644, -0.0006895270198583603, -0.0005879327654838562, -0.0004863385111093521, -0.000384744256734848, -0.00028315000236034393, -0.00018155574798583984, -7.996149361133575e-05, 2.1632760763168335e-05, 0.00012322701513767242, 0.00022482126951217651, 0.0003264155238866806, 0.0004280097782611847, 0.0005296040326356888, 0.0006311982870101929, 0.000732792541384697, 0.000834386795759201, 0.0009359810501337051, 0.0010375753045082092, 0.0011391695588827133, 0.0012407638132572174, 0.0013423580676317215, 0.0014439523220062256, 0.0015455465763807297, 0.0016471408307552338, 0.0017487350851297379, 0.001850329339504242, 0.001951923593878746, 0.00205351784825325, 0.002155112102627754, 0.0022567063570022583, 0.0023583006113767624, 0.0024598948657512665, 0.0025614891201257706, 0.0026630833745002747, 0.0027646776288747787, 0.002866271883249283, 0.002967866137623787, 0.003069460391998291]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 9.0, 7.0, 8.0, 3.0, 8.0, 8.0, 6.0, 14.0, 14.0, 19.0, 16.0, 30.0, 25.0, 38.0, 29.0, 29.0, 30.0, 33.0, 36.0, 38.0, 29.0, 49.0, 44.0, 46.0, 44.0, 45.0, 28.0, 29.0, 37.0, 28.0, 34.0, 29.0, 19.0, 21.0, 17.0, 10.0, 21.0, 14.0, 13.0, 12.0, 7.0, 4.0, 7.0, 9.0, 6.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0], "bins": [-26.296875, -25.53466796875, -24.7724609375, -24.01025390625, -23.248046875, -22.48583984375, -21.7236328125, -20.96142578125, -20.19921875, -19.43701171875, -18.6748046875, -17.91259765625, -17.150390625, -16.38818359375, -15.6259765625, -14.86376953125, -14.1015625, -13.33935546875, -12.5771484375, -11.81494140625, -11.052734375, -10.29052734375, -9.5283203125, -8.76611328125, -8.00390625, -7.24169921875, -6.4794921875, -5.71728515625, -4.955078125, -4.19287109375, -3.4306640625, -2.66845703125, -1.90625, -1.14404296875, -0.3818359375, 0.38037109375, 1.142578125, 1.90478515625, 2.6669921875, 3.42919921875, 4.19140625, 4.95361328125, 5.7158203125, 6.47802734375, 7.240234375, 8.00244140625, 8.7646484375, 9.52685546875, 10.2890625, 11.05126953125, 11.8134765625, 12.57568359375, 13.337890625, 14.10009765625, 14.8623046875, 15.62451171875, 16.38671875, 17.14892578125, 17.9111328125, 18.67333984375, 19.435546875, 20.19775390625, 20.9599609375, 21.72216796875, 22.484375]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 7.0, 11.0, 10.0, 10.0, 14.0, 18.0, 15.0, 47.0, 48.0, 83.0, 110.0, 151.0, 202.0, 294.0, 441.0, 699.0, 1156.0, 1860.0, 3294.0, 5955.0, 11660.0, 25895.0, 66849.0, 224737.0, 478954.0, 139365.0, 46700.0, 19194.0, 9094.0, 4734.0, 2596.0, 1559.0, 914.0, 567.0, 398.0, 277.0, 182.0, 130.0, 89.0, 67.0, 47.0, 39.0, 20.0, 22.0, 16.0, 16.0, 6.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0], "bins": [-33.0625, -32.09912109375, -31.1357421875, -30.17236328125, -29.208984375, -28.24560546875, -27.2822265625, -26.31884765625, -25.35546875, -24.39208984375, -23.4287109375, -22.46533203125, -21.501953125, -20.53857421875, -19.5751953125, -18.61181640625, -17.6484375, -16.68505859375, -15.7216796875, -14.75830078125, -13.794921875, -12.83154296875, -11.8681640625, -10.90478515625, -9.94140625, -8.97802734375, -8.0146484375, -7.05126953125, -6.087890625, -5.12451171875, -4.1611328125, -3.19775390625, -2.234375, -1.27099609375, -0.3076171875, 0.65576171875, 1.619140625, 2.58251953125, 3.5458984375, 4.50927734375, 5.47265625, 6.43603515625, 7.3994140625, 8.36279296875, 9.326171875, 10.28955078125, 11.2529296875, 12.21630859375, 13.1796875, 14.14306640625, 15.1064453125, 16.06982421875, 17.033203125, 17.99658203125, 18.9599609375, 19.92333984375, 20.88671875, 21.85009765625, 22.8134765625, 23.77685546875, 24.740234375, 25.70361328125, 26.6669921875, 27.63037109375, 28.59375]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 3.0, 2.0, 8.0, 8.0, 8.0, 13.0, 19.0, 11.0, 11.0, 14.0, 17.0, 27.0, 35.0, 24.0, 31.0, 44.0, 45.0, 58.0, 72.0, 77.0, 159.0, 1531.0, 264.0, 111.0, 68.0, 65.0, 45.0, 40.0, 35.0, 28.0, 28.0, 25.0, 17.0, 17.0, 20.0, 17.0, 10.0, 13.0, 7.0, 5.0, 4.0, 8.0, 0.0, 4.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-60.0, -58.17041015625, -56.3408203125, -54.51123046875, -52.681640625, -50.85205078125, -49.0224609375, -47.19287109375, -45.36328125, -43.53369140625, -41.7041015625, -39.87451171875, -38.044921875, -36.21533203125, -34.3857421875, -32.55615234375, -30.7265625, -28.89697265625, -27.0673828125, -25.23779296875, -23.408203125, -21.57861328125, -19.7490234375, -17.91943359375, -16.08984375, -14.26025390625, -12.4306640625, -10.60107421875, -8.771484375, -6.94189453125, -5.1123046875, -3.28271484375, -1.453125, 0.37646484375, 2.2060546875, 4.03564453125, 5.865234375, 7.69482421875, 9.5244140625, 11.35400390625, 13.18359375, 15.01318359375, 16.8427734375, 18.67236328125, 20.501953125, 22.33154296875, 24.1611328125, 25.99072265625, 27.8203125, 29.64990234375, 31.4794921875, 33.30908203125, 35.138671875, 36.96826171875, 38.7978515625, 40.62744140625, 42.45703125, 44.28662109375, 46.1162109375, 47.94580078125, 49.775390625, 51.60498046875, 53.4345703125, 55.26416015625, 57.09375]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 6.0, 4.0, 4.0, 6.0, 10.0, 16.0, 17.0, 21.0, 20.0, 36.0, 50.0, 69.0, 92.0, 124.0, 160.0, 291.0, 521.0, 1986.0, 16347.0, 443448.0, 2631978.0, 44794.0, 3727.0, 788.0, 382.0, 228.0, 138.0, 99.0, 67.0, 65.0, 51.0, 41.0, 25.0, 10.0, 21.0, 19.0, 10.0, 12.0, 4.0, 5.0, 3.0, 2.0, 5.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-88.4375, -85.7724609375, -83.107421875, -80.4423828125, -77.77734375, -75.1123046875, -72.447265625, -69.7822265625, -67.1171875, -64.4521484375, -61.787109375, -59.1220703125, -56.45703125, -53.7919921875, -51.126953125, -48.4619140625, -45.796875, -43.1318359375, -40.466796875, -37.8017578125, -35.13671875, -32.4716796875, -29.806640625, -27.1416015625, -24.4765625, -21.8115234375, -19.146484375, -16.4814453125, -13.81640625, -11.1513671875, -8.486328125, -5.8212890625, -3.15625, -0.4912109375, 2.173828125, 4.8388671875, 7.50390625, 10.1689453125, 12.833984375, 15.4990234375, 18.1640625, 20.8291015625, 23.494140625, 26.1591796875, 28.82421875, 31.4892578125, 34.154296875, 36.8193359375, 39.484375, 42.1494140625, 44.814453125, 47.4794921875, 50.14453125, 52.8095703125, 55.474609375, 58.1396484375, 60.8046875, 63.4697265625, 66.134765625, 68.7998046875, 71.46484375, 74.1298828125, 76.794921875, 79.4599609375, 82.125]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 16.0, 76.0, 250.0, 371.0, 213.0, 64.0, 14.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-154.11949157714844, -147.5257110595703, -140.93194580078125, -134.33816528320312, -127.74440002441406, -121.15061950683594, -114.55684661865234, -107.96307373046875, -101.36930084228516, -94.77552795410156, -88.18175506591797, -81.58798217773438, -74.99420166015625, -68.40043640136719, -61.80665588378906, -55.21288299560547, -48.619110107421875, -42.02533721923828, -35.43156433105469, -28.837787628173828, -22.244014739990234, -15.65024185180664, -9.056465148925781, -2.4626922607421875, 4.131080627441406, 10.724854469299316, 17.318628311157227, 23.912403106689453, 30.506175994873047, 37.09994888305664, 43.6937255859375, 50.287498474121094, 56.881256103515625, 63.47502899169922, 70.06880187988281, 76.66258239746094, 83.25634765625, 89.85012817382812, 96.44390106201172, 103.03767395019531, 109.6314468383789, 116.2252197265625, 122.8189926147461, 129.4127655029297, 136.0065460205078, 142.60031127929688, 149.194091796875, 155.78787231445312, 162.3816375732422, 168.9754180908203, 175.56918334960938, 182.1629638671875, 188.75672912597656, 195.3505096435547, 201.94427490234375, 208.53805541992188, 215.1318359375, 221.72561645507812, 228.3193817138672, 234.9131622314453, 241.50692749023438, 248.1007080078125, 254.69448852539062, 261.28826904296875, 267.88201904296875]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 2.0, 5.0, 12.0, 5.0, 8.0, 9.0, 11.0, 18.0, 23.0, 28.0, 28.0, 31.0, 23.0, 39.0, 33.0, 33.0, 38.0, 43.0, 45.0, 50.0, 44.0, 50.0, 49.0, 35.0, 43.0, 41.0, 34.0, 27.0, 30.0, 28.0, 27.0, 20.0, 17.0, 16.0, 20.0, 8.0, 8.0, 7.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-125.93840026855469, -121.39701080322266, -116.85562133789062, -112.3142318725586, -107.77284240722656, -103.2314453125, -98.69005584716797, -94.14866638183594, -89.6072769165039, -85.06588745117188, -80.52449798583984, -75.98310852050781, -71.44171142578125, -66.90032958984375, -62.35893249511719, -57.817543029785156, -53.276153564453125, -48.734764099121094, -44.19337463378906, -39.651981353759766, -35.110591888427734, -30.569202423095703, -26.02781105041504, -21.486419677734375, -16.945030212402344, -12.403639793395996, -7.862249374389648, -3.320858955383301, 1.2205314636230469, 5.761920928955078, 10.303312301635742, 14.844703674316406, 19.3861083984375, 23.92749786376953, 28.468889236450195, 33.01028060913086, 37.55167007446289, 42.09305953979492, 46.63445281982422, 51.17584228515625, 55.71723175048828, 60.25862121582031, 64.80001068115234, 69.34140014648438, 73.88279724121094, 78.42417907714844, 82.965576171875, 87.50696563720703, 92.04835510253906, 96.5897445678711, 101.13113403320312, 105.67252349853516, 110.21391296386719, 114.75531005859375, 119.29669952392578, 123.83808898925781, 128.37948608398438, 132.92088317871094, 137.46226501464844, 142.003662109375, 146.5450439453125, 151.08644104003906, 155.62782287597656, 160.16921997070312, 164.71060180664062]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 1.0, 6.0, 2.0, 7.0, 10.0, 7.0, 6.0, 10.0, 10.0, 14.0, 18.0, 24.0, 24.0, 25.0, 36.0, 28.0, 30.0, 32.0, 31.0, 42.0, 41.0, 39.0, 42.0, 41.0, 45.0, 43.0, 43.0, 33.0, 36.0, 27.0, 30.0, 37.0, 31.0, 19.0, 10.0, 18.0, 25.0, 14.0, 17.0, 8.0, 10.0, 5.0, 8.0, 9.0, 5.0, 1.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-25.328125, -24.544677734375, -23.76123046875, -22.977783203125, -22.1943359375, -21.410888671875, -20.62744140625, -19.843994140625, -19.060546875, -18.277099609375, -17.49365234375, -16.710205078125, -15.9267578125, -15.143310546875, -14.35986328125, -13.576416015625, -12.79296875, -12.009521484375, -11.22607421875, -10.442626953125, -9.6591796875, -8.875732421875, -8.09228515625, -7.308837890625, -6.525390625, -5.741943359375, -4.95849609375, -4.175048828125, -3.3916015625, -2.608154296875, -1.82470703125, -1.041259765625, -0.2578125, 0.525634765625, 1.30908203125, 2.092529296875, 2.8759765625, 3.659423828125, 4.44287109375, 5.226318359375, 6.009765625, 6.793212890625, 7.57666015625, 8.360107421875, 9.1435546875, 9.927001953125, 10.71044921875, 11.493896484375, 12.27734375, 13.060791015625, 13.84423828125, 14.627685546875, 15.4111328125, 16.194580078125, 16.97802734375, 17.761474609375, 18.544921875, 19.328369140625, 20.11181640625, 20.895263671875, 21.6787109375, 22.462158203125, 23.24560546875, 24.029052734375, 24.8125]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 6.0, 11.0, 14.0, 13.0, 14.0, 23.0, 38.0, 63.0, 81.0, 102.0, 174.0, 219.0, 309.0, 458.0, 733.0, 1191.0, 2026.0, 3690.0, 8809.0, 40256.0, 330715.0, 2468060.0, 1172721.0, 133341.0, 18255.0, 5613.0, 2801.0, 1596.0, 956.0, 642.0, 389.0, 292.0, 197.0, 126.0, 94.0, 68.0, 65.0, 37.0, 29.0, 20.0, 12.0, 9.0, 6.0, 10.0, 6.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.21875, -40.890625, -39.5625, -38.234375, -36.90625, -35.578125, -34.25, -32.921875, -31.59375, -30.265625, -28.9375, -27.609375, -26.28125, -24.953125, -23.625, -22.296875, -20.96875, -19.640625, -18.3125, -16.984375, -15.65625, -14.328125, -13.0, -11.671875, -10.34375, -9.015625, -7.6875, -6.359375, -5.03125, -3.703125, -2.375, -1.046875, 0.28125, 1.609375, 2.9375, 4.265625, 5.59375, 6.921875, 8.25, 9.578125, 10.90625, 12.234375, 13.5625, 14.890625, 16.21875, 17.546875, 18.875, 20.203125, 21.53125, 22.859375, 24.1875, 25.515625, 26.84375, 28.171875, 29.5, 30.828125, 32.15625, 33.484375, 34.8125, 36.140625, 37.46875, 38.796875, 40.125, 41.453125, 42.78125]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 4.0, 7.0, 8.0, 3.0, 7.0, 18.0, 13.0, 15.0, 19.0, 37.0, 69.0, 92.0, 200.0, 364.0, 714.0, 996.0, 747.0, 337.0, 169.0, 109.0, 54.0, 22.0, 17.0, 14.0, 10.0, 11.0, 5.0, 4.0, 5.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.375, -37.943359375, -36.51171875, -35.080078125, -33.6484375, -32.216796875, -30.78515625, -29.353515625, -27.921875, -26.490234375, -25.05859375, -23.626953125, -22.1953125, -20.763671875, -19.33203125, -17.900390625, -16.46875, -15.037109375, -13.60546875, -12.173828125, -10.7421875, -9.310546875, -7.87890625, -6.447265625, -5.015625, -3.583984375, -2.15234375, -0.720703125, 0.7109375, 2.142578125, 3.57421875, 5.005859375, 6.4375, 7.869140625, 9.30078125, 10.732421875, 12.1640625, 13.595703125, 15.02734375, 16.458984375, 17.890625, 19.322265625, 20.75390625, 22.185546875, 23.6171875, 25.048828125, 26.48046875, 27.912109375, 29.34375, 30.775390625, 32.20703125, 33.638671875, 35.0703125, 36.501953125, 37.93359375, 39.365234375, 40.796875, 42.228515625, 43.66015625, 45.091796875, 46.5234375, 47.955078125, 49.38671875, 50.818359375, 52.25]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 5.0, 4.0, 8.0, 17.0, 16.0, 19.0, 35.0, 43.0, 68.0, 102.0, 155.0, 227.0, 358.0, 639.0, 1160.0, 2210.0, 4755.0, 11106.0, 33150.0, 217034.0, 3412037.0, 440618.0, 45552.0, 13648.0, 5544.0, 2612.0, 1291.0, 724.0, 395.0, 250.0, 167.0, 97.0, 66.0, 63.0, 29.0, 24.0, 18.0, 11.0, 7.0, 5.0, 5.0, 7.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-60.9375, -59.01025390625, -57.0830078125, -55.15576171875, -53.228515625, -51.30126953125, -49.3740234375, -47.44677734375, -45.51953125, -43.59228515625, -41.6650390625, -39.73779296875, -37.810546875, -35.88330078125, -33.9560546875, -32.02880859375, -30.1015625, -28.17431640625, -26.2470703125, -24.31982421875, -22.392578125, -20.46533203125, -18.5380859375, -16.61083984375, -14.68359375, -12.75634765625, -10.8291015625, -8.90185546875, -6.974609375, -5.04736328125, -3.1201171875, -1.19287109375, 0.734375, 2.66162109375, 4.5888671875, 6.51611328125, 8.443359375, 10.37060546875, 12.2978515625, 14.22509765625, 16.15234375, 18.07958984375, 20.0068359375, 21.93408203125, 23.861328125, 25.78857421875, 27.7158203125, 29.64306640625, 31.5703125, 33.49755859375, 35.4248046875, 37.35205078125, 39.279296875, 41.20654296875, 43.1337890625, 45.06103515625, 46.98828125, 48.91552734375, 50.8427734375, 52.77001953125, 54.697265625, 56.62451171875, 58.5517578125, 60.47900390625, 62.40625]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [2.0, 5.0, 9.0, 10.0, 40.0, 112.0, 246.0, 326.0, 159.0, 68.0, 23.0, 6.0, 5.0, 7.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.48783111572266, -62.63218688964844, -52.77653884887695, -42.92089080810547, -33.06524658203125, -23.20960235595703, -13.353954315185547, -3.4983062744140625, 6.357337951660156, 16.212984085083008, 26.06863021850586, 35.924278259277344, 45.77992248535156, 55.63556671142578, 65.4912109375, 75.34686279296875, 85.20250701904297, 95.05815124511719, 104.91380310058594, 114.76944732666016, 124.62509155273438, 134.48074340820312, 144.3363800048828, 154.19203186035156, 164.04766845703125, 173.9033203125, 183.7589569091797, 193.61460876464844, 203.47024536132812, 213.32589721679688, 223.18154907226562, 233.03720092773438, 242.892822265625, 252.74847412109375, 262.6041259765625, 272.4597473144531, 282.3153991699219, 292.1710510253906, 302.0267028808594, 311.8823547363281, 321.73797607421875, 331.5936279296875, 341.44927978515625, 351.3049011230469, 361.1605529785156, 371.0162048339844, 380.8718566894531, 390.7275085449219, 400.5831604003906, 410.4388122558594, 420.2944641113281, 430.15008544921875, 440.0057373046875, 449.86138916015625, 459.717041015625, 469.57269287109375, 479.4283447265625, 489.28399658203125, 499.1396484375, 508.9952697753906, 518.8509521484375, 528.70654296875, 538.5621948242188, 548.4178466796875, 558.2734985351562]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 5.0, 0.0, 2.0, 5.0, 3.0, 3.0, 6.0, 11.0, 7.0, 14.0, 13.0, 16.0, 17.0, 21.0, 29.0, 27.0, 29.0, 42.0, 37.0, 32.0, 41.0, 39.0, 68.0, 43.0, 46.0, 34.0, 37.0, 47.0, 38.0, 30.0, 32.0, 29.0, 27.0, 27.0, 33.0, 22.0, 26.0, 18.0, 15.0, 6.0, 12.0, 3.0, 6.0, 3.0, 4.0, 2.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-110.87333679199219, -107.46166229248047, -104.04999542236328, -100.63832092285156, -97.22664642333984, -93.81497192382812, -90.40330505371094, -86.99163055419922, -83.5799560546875, -80.16828155517578, -76.7566146850586, -73.34494018554688, -69.93326568603516, -66.52159118652344, -63.10992431640625, -59.69824981689453, -56.28657913208008, -52.874908447265625, -49.463233947753906, -46.05156326293945, -42.639888763427734, -39.22821807861328, -35.81654357910156, -32.40487289428711, -28.993200302124023, -25.581527709960938, -22.16985511779785, -18.758182525634766, -15.346510887145996, -11.934839248657227, -8.52316665649414, -5.111494064331055, -1.6998214721679688, 1.711850881576538, 5.123523235321045, 8.535195350646973, 11.946867942810059, 15.358539581298828, 18.770212173461914, 22.181884765625, 25.593557357788086, 29.005229949951172, 32.416900634765625, 35.828575134277344, 39.2402458190918, 42.65191650390625, 46.06359100341797, 49.47526550292969, 52.88693618774414, 56.298606872558594, 59.71028137207031, 63.121952056884766, 66.53362274169922, 69.94529724121094, 73.35697174072266, 76.76864624023438, 80.18031311035156, 83.59198760986328, 87.00365447998047, 90.41532897949219, 93.8270034790039, 97.23867797851562, 100.65034484863281, 104.06201934814453, 107.47369384765625]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 4.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 6.0, 10.0, 12.0, 8.0, 14.0, 18.0, 21.0, 17.0, 25.0, 28.0, 21.0, 31.0, 38.0, 35.0, 35.0, 35.0, 45.0, 29.0, 45.0, 46.0, 49.0, 38.0, 49.0, 38.0, 34.0, 36.0, 27.0, 21.0, 18.0, 22.0, 21.0, 20.0, 26.0, 12.0, 12.0, 13.0, 7.0, 7.0, 8.0, 5.0, 2.0, 3.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.765625, -22.97900390625, -22.1923828125, -21.40576171875, -20.619140625, -19.83251953125, -19.0458984375, -18.25927734375, -17.47265625, -16.68603515625, -15.8994140625, -15.11279296875, -14.326171875, -13.53955078125, -12.7529296875, -11.96630859375, -11.1796875, -10.39306640625, -9.6064453125, -8.81982421875, -8.033203125, -7.24658203125, -6.4599609375, -5.67333984375, -4.88671875, -4.10009765625, -3.3134765625, -2.52685546875, -1.740234375, -0.95361328125, -0.1669921875, 0.61962890625, 1.40625, 2.19287109375, 2.9794921875, 3.76611328125, 4.552734375, 5.33935546875, 6.1259765625, 6.91259765625, 7.69921875, 8.48583984375, 9.2724609375, 10.05908203125, 10.845703125, 11.63232421875, 12.4189453125, 13.20556640625, 13.9921875, 14.77880859375, 15.5654296875, 16.35205078125, 17.138671875, 17.92529296875, 18.7119140625, 19.49853515625, 20.28515625, 21.07177734375, 21.8583984375, 22.64501953125, 23.431640625, 24.21826171875, 25.0048828125, 25.79150390625, 26.578125]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 5.0, 4.0, 7.0, 8.0, 24.0, 30.0, 62.0, 66.0, 115.0, 173.0, 248.0, 333.0, 512.0, 783.0, 1174.0, 1783.0, 2701.0, 4285.0, 6383.0, 9662.0, 14868.0, 24270.0, 39123.0, 66084.0, 111906.0, 182399.0, 212053.0, 146562.0, 86279.0, 51380.0, 30918.0, 19105.0, 12272.0, 7793.0, 5143.0, 3451.0, 2193.0, 1440.0, 971.0, 635.0, 442.0, 303.0, 219.0, 131.0, 88.0, 63.0, 49.0, 30.0, 15.0, 6.0, 7.0, 8.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.115234375, -1.077117919921875, -1.03900146484375, -1.000885009765625, -0.9627685546875, -0.924652099609375, -0.88653564453125, -0.848419189453125, -0.810302734375, -0.772186279296875, -0.73406982421875, -0.695953369140625, -0.6578369140625, -0.619720458984375, -0.58160400390625, -0.543487548828125, -0.50537109375, -0.467254638671875, -0.42913818359375, -0.391021728515625, -0.3529052734375, -0.314788818359375, -0.27667236328125, -0.238555908203125, -0.200439453125, -0.162322998046875, -0.12420654296875, -0.086090087890625, -0.0479736328125, -0.009857177734375, 0.02825927734375, 0.066375732421875, 0.1044921875, 0.142608642578125, 0.18072509765625, 0.218841552734375, 0.2569580078125, 0.295074462890625, 0.33319091796875, 0.371307373046875, 0.409423828125, 0.447540283203125, 0.48565673828125, 0.523773193359375, 0.5618896484375, 0.600006103515625, 0.63812255859375, 0.676239013671875, 0.71435546875, 0.752471923828125, 0.79058837890625, 0.828704833984375, 0.8668212890625, 0.904937744140625, 0.94305419921875, 0.981170654296875, 1.019287109375, 1.057403564453125, 1.09552001953125, 1.133636474609375, 1.1717529296875, 1.209869384765625, 1.24798583984375, 1.286102294921875, 1.32421875]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 4.0, 5.0, 4.0, 20.0, 9.0, 16.0, 14.0, 19.0, 29.0, 21.0, 28.0, 28.0, 31.0, 41.0, 68.0, 41.0, 46.0, 47.0, 45.0, 1059.0, 45.0, 44.0, 35.0, 45.0, 29.0, 37.0, 36.0, 28.0, 30.0, 17.0, 21.0, 21.0, 16.0, 13.0, 6.0, 9.0, 2.0, 6.0, 8.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.6875, -18.1044921875, -17.521484375, -16.9384765625, -16.35546875, -15.7724609375, -15.189453125, -14.6064453125, -14.0234375, -13.4404296875, -12.857421875, -12.2744140625, -11.69140625, -11.1083984375, -10.525390625, -9.9423828125, -9.359375, -8.7763671875, -8.193359375, -7.6103515625, -7.02734375, -6.4443359375, -5.861328125, -5.2783203125, -4.6953125, -4.1123046875, -3.529296875, -2.9462890625, -2.36328125, -1.7802734375, -1.197265625, -0.6142578125, -0.03125, 0.5517578125, 1.134765625, 1.7177734375, 2.30078125, 2.8837890625, 3.466796875, 4.0498046875, 4.6328125, 5.2158203125, 5.798828125, 6.3818359375, 6.96484375, 7.5478515625, 8.130859375, 8.7138671875, 9.296875, 9.8798828125, 10.462890625, 11.0458984375, 11.62890625, 12.2119140625, 12.794921875, 13.3779296875, 13.9609375, 14.5439453125, 15.126953125, 15.7099609375, 16.29296875, 16.8759765625, 17.458984375, 18.0419921875, 18.625]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 0.0, 3.0, 5.0, 5.0, 22.0, 22.0, 25.0, 37.0, 49.0, 75.0, 106.0, 188.0, 254.0, 387.0, 594.0, 804.0, 1219.0, 1914.0, 2700.0, 4093.0, 6031.0, 8825.0, 13160.0, 19922.0, 30725.0, 49623.0, 81392.0, 134853.0, 1244948.0, 184683.0, 116521.0, 70193.0, 42887.0, 27120.0, 17818.0, 11620.0, 7883.0, 5301.0, 3608.0, 2413.0, 1689.0, 1130.0, 766.0, 505.0, 331.0, 208.0, 154.0, 109.0, 66.0, 38.0, 38.0, 34.0, 15.0, 11.0, 3.0, 4.0, 7.0, 4.0, 2.0, 1.0, 1.0], "bins": [-1.0546875, -1.021575927734375, -0.98846435546875, -0.955352783203125, -0.9222412109375, -0.889129638671875, -0.85601806640625, -0.822906494140625, -0.789794921875, -0.756683349609375, -0.72357177734375, -0.690460205078125, -0.6573486328125, -0.624237060546875, -0.59112548828125, -0.558013916015625, -0.52490234375, -0.491790771484375, -0.45867919921875, -0.425567626953125, -0.3924560546875, -0.359344482421875, -0.32623291015625, -0.293121337890625, -0.260009765625, -0.226898193359375, -0.19378662109375, -0.160675048828125, -0.1275634765625, -0.094451904296875, -0.06134033203125, -0.028228759765625, 0.0048828125, 0.037994384765625, 0.07110595703125, 0.104217529296875, 0.1373291015625, 0.170440673828125, 0.20355224609375, 0.236663818359375, 0.269775390625, 0.302886962890625, 0.33599853515625, 0.369110107421875, 0.4022216796875, 0.435333251953125, 0.46844482421875, 0.501556396484375, 0.53466796875, 0.567779541015625, 0.60089111328125, 0.634002685546875, 0.6671142578125, 0.700225830078125, 0.73333740234375, 0.766448974609375, 0.799560546875, 0.832672119140625, 0.86578369140625, 0.898895263671875, 0.9320068359375, 0.965118408203125, 0.99822998046875, 1.031341552734375, 1.064453125]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 1.0, 6.0, 2.0, 4.0, 7.0, 4.0, 9.0, 10.0, 11.0, 16.0, 22.0, 17.0, 30.0, 35.0, 31.0, 43.0, 58.0, 62.0, 57.0, 55.0, 73.0, 40.0, 65.0, 56.0, 55.0, 45.0, 36.0, 33.0, 17.0, 16.0, 24.0, 11.0, 14.0, 10.0, 8.0, 6.0, 3.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006656646728515625, -0.006450355052947998, -0.006244063377380371, -0.006037771701812744, -0.005831480026245117, -0.00562518835067749, -0.005418896675109863, -0.005212604999542236, -0.005006313323974609, -0.004800021648406982, -0.0045937299728393555, -0.0043874382972717285, -0.0041811466217041016, -0.003974854946136475, -0.0037685632705688477, -0.0035622715950012207, -0.0033559799194335938, -0.003149688243865967, -0.00294339656829834, -0.002737104892730713, -0.002530813217163086, -0.002324521541595459, -0.002118229866027832, -0.001911938190460205, -0.0017056465148925781, -0.0014993548393249512, -0.0012930631637573242, -0.0010867714881896973, -0.0008804798126220703, -0.0006741881370544434, -0.0004678964614868164, -0.00026160478591918945, -5.53131103515625e-05, 0.00015097856521606445, 0.0003572702407836914, 0.0005635619163513184, 0.0007698535919189453, 0.0009761452674865723, 0.0011824369430541992, 0.0013887286186218262, 0.0015950202941894531, 0.00180131196975708, 0.002007603645324707, 0.002213895320892334, 0.002420186996459961, 0.002626478672027588, 0.002832770347595215, 0.003039062023162842, 0.0032453536987304688, 0.0034516453742980957, 0.0036579370498657227, 0.0038642287254333496, 0.0040705204010009766, 0.0042768120765686035, 0.0044831037521362305, 0.004689395427703857, 0.004895687103271484, 0.005101978778839111, 0.005308270454406738, 0.005514562129974365, 0.005720853805541992, 0.005927145481109619, 0.006133437156677246, 0.006339728832244873, 0.0065460205078125]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 1.0, 4.0, 4.0, 6.0, 14.0, 8.0, 14.0, 23.0, 25.0, 31.0, 40.0, 54.0, 70.0, 86.0, 117.0, 233.0, 298.0, 639.0, 8086.0, 1012030.0, 24808.0, 848.0, 371.0, 189.0, 148.0, 94.0, 72.0, 52.0, 41.0, 35.0, 24.0, 20.0, 14.0, 16.0, 6.0, 11.0, 7.0, 4.0, 8.0, 3.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.1326904296875, -0.12862014770507812, -0.12454986572265625, -0.12047958374023438, -0.1164093017578125, -0.11233901977539062, -0.10826873779296875, -0.10419845581054688, -0.100128173828125, -0.09605789184570312, -0.09198760986328125, -0.08791732788085938, -0.0838470458984375, -0.07977676391601562, -0.07570648193359375, -0.07163619995117188, -0.06756591796875, -0.06349563598632812, -0.05942535400390625, -0.055355072021484375, -0.0512847900390625, -0.047214508056640625, -0.04314422607421875, -0.039073944091796875, -0.035003662109375, -0.030933380126953125, -0.02686309814453125, -0.022792816162109375, -0.0187225341796875, -0.014652252197265625, -0.01058197021484375, -0.006511688232421875, -0.00244140625, 0.001628875732421875, 0.00569915771484375, 0.009769439697265625, 0.0138397216796875, 0.017910003662109375, 0.02198028564453125, 0.026050567626953125, 0.030120849609375, 0.034191131591796875, 0.03826141357421875, 0.042331695556640625, 0.0464019775390625, 0.050472259521484375, 0.05454254150390625, 0.058612823486328125, 0.06268310546875, 0.06675338745117188, 0.07082366943359375, 0.07489395141601562, 0.0789642333984375, 0.08303451538085938, 0.08710479736328125, 0.09117507934570312, 0.095245361328125, 0.09931564331054688, 0.10338592529296875, 0.10745620727539062, 0.1115264892578125, 0.11559677124023438, 0.11966705322265625, 0.12373733520507812, 0.1278076171875]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [3.0, 37.0, 732.0, 230.0, 13.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0033708857372403145, -0.0021054628305137157, -0.000840039923787117, 0.00042538298293948174, 0.0016908058896660805, 0.002956228796392679, 0.004221651703119278, 0.005487074144184589, 0.006752497516572475, 0.008017919957637787, 0.009283343330025673, 0.010548766702413559, 0.01181418914347887, 0.013079611584544182, 0.014345034956932068, 0.01561045739799738, 0.01687588170170784, 0.018141305074095726, 0.019406728446483612, 0.02067214995622635, 0.021937573328614235, 0.02320299670100212, 0.024468418210744858, 0.025733841583132744, 0.02699926495552063, 0.028264688327908516, 0.029530111700296402, 0.03079553321003914, 0.032060958445072174, 0.03332637995481491, 0.03459180146455765, 0.035857222974300385, 0.03712264448404312, 0.03838806599378586, 0.03965349122881889, 0.04091891273856163, 0.042184337973594666, 0.0434497594833374, 0.04471518099308014, 0.045980602502822876, 0.04724602773785591, 0.04851144924759865, 0.04977687448263168, 0.05104229599237442, 0.05230771750211716, 0.05357314273715019, 0.05483856424689293, 0.056103989481925964, 0.0573694109916687, 0.05863483250141144, 0.05990025773644447, 0.06116567924618721, 0.062431104481220245, 0.06369652599096298, 0.06496194750070572, 0.06622736901044846, 0.06749279797077179, 0.06875821948051453, 0.07002364099025726, 0.0712890699505806, 0.07255449146032333, 0.07381991297006607, 0.07508533447980881, 0.07635075598955154, 0.07761617749929428]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 11.0, 8.0, 13.0, 14.0, 22.0, 25.0, 36.0, 34.0, 45.0, 50.0, 49.0, 45.0, 49.0, 51.0, 59.0, 60.0, 52.0, 45.0, 52.0, 43.0, 42.0, 31.0, 24.0, 29.0, 25.0, 18.0, 16.0, 15.0, 13.0, 11.0, 8.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005161285400390625, -0.005012081936001778, -0.00486287847161293, -0.004713675007224083, -0.004564471542835236, -0.004415268078446388, -0.004266064614057541, -0.0041168611496686935, -0.003967657685279846, -0.003818454220890999, -0.0036692507565021515, -0.003520047292113304, -0.003370843827724457, -0.0032216403633356094, -0.003072436898946762, -0.0029232334345579147, -0.0027740299701690674, -0.00262482650578022, -0.0024756230413913727, -0.0023264195770025253, -0.002177216112613678, -0.0020280126482248306, -0.0018788091838359833, -0.001729605719447136, -0.0015804022550582886, -0.0014311987906694412, -0.0012819953262805939, -0.0011327918618917465, -0.0009835883975028992, -0.0008343849331140518, -0.0006851814687252045, -0.0005359780043363571, -0.00038677453994750977, -0.00023757107555866241, -8.836761116981506e-05, 6.083585321903229e-05, 0.00021003931760787964, 0.000359242781996727, 0.0005084462463855743, 0.0006576497107744217, 0.000806853175163269, 0.0009560566395521164, 0.0011052601039409637, 0.001254463568329811, 0.0014036670327186584, 0.0015528704971075058, 0.0017020739614963531, 0.0018512774258852005, 0.002000480890274048, 0.002149684354662895, 0.0022988878190517426, 0.00244809128344059, 0.0025972947478294373, 0.0027464982122182846, 0.002895701676607132, 0.0030449051409959793, 0.0031941086053848267, 0.003343312069773674, 0.0034925155341625214, 0.0036417189985513687, 0.003790922462940216, 0.003940125927329063, 0.004089329391717911, 0.004238532856106758, 0.0043877363204956055]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 4.0, 0.0, 1.0, 1.0, 3.0, 6.0, 2.0, 6.0, 10.0, 12.0, 8.0, 14.0, 18.0, 21.0, 17.0, 25.0, 28.0, 21.0, 31.0, 38.0, 35.0, 35.0, 35.0, 45.0, 29.0, 45.0, 46.0, 49.0, 38.0, 49.0, 38.0, 34.0, 36.0, 27.0, 21.0, 18.0, 22.0, 21.0, 20.0, 27.0, 11.0, 12.0, 13.0, 7.0, 7.0, 8.0, 5.0, 2.0, 3.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.765625, -22.97900390625, -22.1923828125, -21.40576171875, -20.619140625, -19.83251953125, -19.0458984375, -18.25927734375, -17.47265625, -16.68603515625, -15.8994140625, -15.11279296875, -14.326171875, -13.53955078125, -12.7529296875, -11.96630859375, -11.1796875, -10.39306640625, -9.6064453125, -8.81982421875, -8.033203125, -7.24658203125, -6.4599609375, -5.67333984375, -4.88671875, -4.10009765625, -3.3134765625, -2.52685546875, -1.740234375, -0.95361328125, -0.1669921875, 0.61962890625, 1.40625, 2.19287109375, 2.9794921875, 3.76611328125, 4.552734375, 5.33935546875, 6.1259765625, 6.91259765625, 7.69921875, 8.48583984375, 9.2724609375, 10.05908203125, 10.845703125, 11.63232421875, 12.4189453125, 13.20556640625, 13.9921875, 14.77880859375, 15.5654296875, 16.35205078125, 17.138671875, 17.92529296875, 18.7119140625, 19.49853515625, 20.28515625, 21.07177734375, 21.8583984375, 22.64501953125, 23.431640625, 24.21826171875, 25.0048828125, 25.79150390625, 26.578125]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 7.0, 19.0, 18.0, 20.0, 38.0, 37.0, 48.0, 108.0, 146.0, 201.0, 324.0, 455.0, 711.0, 1243.0, 2158.0, 4244.0, 9515.0, 24158.0, 77463.0, 325647.0, 443171.0, 104764.0, 31123.0, 11462.0, 5074.0, 2575.0, 1411.0, 865.0, 519.0, 347.0, 211.0, 145.0, 96.0, 63.0, 41.0, 40.0, 27.0, 19.0, 11.0, 8.0, 6.0, 4.0, 2.0, 1.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-42.5625, -41.31494140625, -40.0673828125, -38.81982421875, -37.572265625, -36.32470703125, -35.0771484375, -33.82958984375, -32.58203125, -31.33447265625, -30.0869140625, -28.83935546875, -27.591796875, -26.34423828125, -25.0966796875, -23.84912109375, -22.6015625, -21.35400390625, -20.1064453125, -18.85888671875, -17.611328125, -16.36376953125, -15.1162109375, -13.86865234375, -12.62109375, -11.37353515625, -10.1259765625, -8.87841796875, -7.630859375, -6.38330078125, -5.1357421875, -3.88818359375, -2.640625, -1.39306640625, -0.1455078125, 1.10205078125, 2.349609375, 3.59716796875, 4.8447265625, 6.09228515625, 7.33984375, 8.58740234375, 9.8349609375, 11.08251953125, 12.330078125, 13.57763671875, 14.8251953125, 16.07275390625, 17.3203125, 18.56787109375, 19.8154296875, 21.06298828125, 22.310546875, 23.55810546875, 24.8056640625, 26.05322265625, 27.30078125, 28.54833984375, 29.7958984375, 31.04345703125, 32.291015625, 33.53857421875, 34.7861328125, 36.03369140625, 37.28125]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 7.0, 4.0, 9.0, 8.0, 12.0, 15.0, 14.0, 22.0, 34.0, 28.0, 68.0, 45.0, 48.0, 59.0, 78.0, 143.0, 269.0, 1467.0, 197.0, 115.0, 76.0, 38.0, 61.0, 38.0, 35.0, 36.0, 24.0, 19.0, 18.0, 16.0, 6.0, 10.0, 10.0, 4.0, 6.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-62.625, -60.560546875, -58.49609375, -56.431640625, -54.3671875, -52.302734375, -50.23828125, -48.173828125, -46.109375, -44.044921875, -41.98046875, -39.916015625, -37.8515625, -35.787109375, -33.72265625, -31.658203125, -29.59375, -27.529296875, -25.46484375, -23.400390625, -21.3359375, -19.271484375, -17.20703125, -15.142578125, -13.078125, -11.013671875, -8.94921875, -6.884765625, -4.8203125, -2.755859375, -0.69140625, 1.373046875, 3.4375, 5.501953125, 7.56640625, 9.630859375, 11.6953125, 13.759765625, 15.82421875, 17.888671875, 19.953125, 22.017578125, 24.08203125, 26.146484375, 28.2109375, 30.275390625, 32.33984375, 34.404296875, 36.46875, 38.533203125, 40.59765625, 42.662109375, 44.7265625, 46.791015625, 48.85546875, 50.919921875, 52.984375, 55.048828125, 57.11328125, 59.177734375, 61.2421875, 63.306640625, 65.37109375, 67.435546875, 69.5]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 7.0, 4.0, 3.0, 7.0, 10.0, 18.0, 23.0, 27.0, 29.0, 63.0, 99.0, 139.0, 261.0, 542.0, 2568.0, 195079.0, 2932869.0, 12103.0, 949.0, 361.0, 208.0, 104.0, 84.0, 41.0, 31.0, 29.0, 19.0, 10.0, 9.0, 5.0, 5.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-171.125, -165.974609375, -160.82421875, -155.673828125, -150.5234375, -145.373046875, -140.22265625, -135.072265625, -129.921875, -124.771484375, -119.62109375, -114.470703125, -109.3203125, -104.169921875, -99.01953125, -93.869140625, -88.71875, -83.568359375, -78.41796875, -73.267578125, -68.1171875, -62.966796875, -57.81640625, -52.666015625, -47.515625, -42.365234375, -37.21484375, -32.064453125, -26.9140625, -21.763671875, -16.61328125, -11.462890625, -6.3125, -1.162109375, 3.98828125, 9.138671875, 14.2890625, 19.439453125, 24.58984375, 29.740234375, 34.890625, 40.041015625, 45.19140625, 50.341796875, 55.4921875, 60.642578125, 65.79296875, 70.943359375, 76.09375, 81.244140625, 86.39453125, 91.544921875, 96.6953125, 101.845703125, 106.99609375, 112.146484375, 117.296875, 122.447265625, 127.59765625, 132.748046875, 137.8984375, 143.048828125, 148.19921875, 153.349609375, 158.5]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 21.0, 565.0, 419.0, 11.0, 3.0], "bins": [-1529.5020751953125, -1504.400390625, -1479.298828125, -1454.197265625, -1429.0955810546875, -1403.993896484375, -1378.892333984375, -1353.790771484375, -1328.6890869140625, -1303.58740234375, -1278.48583984375, -1253.38427734375, -1228.2825927734375, -1203.180908203125, -1178.079345703125, -1152.977783203125, -1127.8760986328125, -1102.7744140625, -1077.6728515625, -1052.5712890625, -1027.4696044921875, -1002.3679809570312, -977.266357421875, -952.1647338867188, -927.0631103515625, -901.9614868164062, -876.85986328125, -851.7582397460938, -826.6566162109375, -801.5549926757812, -776.453369140625, -751.3517456054688, -726.2500610351562, -701.1484375, -676.0468139648438, -650.9451904296875, -625.8435668945312, -600.741943359375, -575.6403198242188, -550.5386962890625, -525.4370727539062, -500.33544921875, -475.23382568359375, -450.1322021484375, -425.03057861328125, -399.928955078125, -374.82733154296875, -349.7257080078125, -324.62408447265625, -299.5224609375, -274.42083740234375, -249.3192138671875, -224.21759033203125, -199.115966796875, -174.01434326171875, -148.9127197265625, -123.81111145019531, -98.70948791503906, -73.60786437988281, -48.50624084472656, -23.404617309570312, 1.6970062255859375, 26.798629760742188, 51.90025329589844, 77.00187683105469]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 5.0, 4.0, 6.0, 5.0, 8.0, 8.0, 8.0, 11.0, 14.0, 23.0, 20.0, 23.0, 36.0, 39.0, 21.0, 34.0, 41.0, 34.0, 47.0, 44.0, 50.0, 58.0, 39.0, 39.0, 40.0, 33.0, 35.0, 42.0, 35.0, 32.0, 24.0, 16.0, 23.0, 22.0, 21.0, 24.0, 9.0, 14.0, 8.0, 6.0, 2.0, 2.0, 0.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-156.12045288085938, -151.65086364746094, -147.18125915527344, -142.711669921875, -138.24208068847656, -133.77249145507812, -129.30288696289062, -124.83329772949219, -120.36370086669922, -115.89410400390625, -111.42451477050781, -106.95491790771484, -102.48532104492188, -98.01573181152344, -93.54613494873047, -89.0765380859375, -84.60694885253906, -80.1373519897461, -75.66776275634766, -71.19816589355469, -66.72857666015625, -62.25897979736328, -57.78938293457031, -53.31978988647461, -48.850196838378906, -44.3806037902832, -39.9110107421875, -35.44141387939453, -30.971820831298828, -26.502227783203125, -22.03263282775879, -17.563037872314453, -13.09344482421875, -8.62385082244873, -4.154256820678711, 0.3153371810913086, 4.784931182861328, 9.254524230957031, 13.724119186401367, 18.193714141845703, 22.663307189941406, 27.13290023803711, 31.602495193481445, 36.07209014892578, 40.541683197021484, 45.01127624511719, 49.480873107910156, 53.95046615600586, 58.42005920410156, 62.889652252197266, 67.35924530029297, 71.82884216308594, 76.29843139648438, 80.76802825927734, 85.23762512207031, 89.70721435546875, 94.17681121826172, 98.64640808105469, 103.11599731445312, 107.5855941772461, 112.05519104003906, 116.5247802734375, 120.99437713623047, 125.46397399902344, 129.93356323242188]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 3.0, 4.0, 7.0, 12.0, 11.0, 12.0, 17.0, 21.0, 26.0, 21.0, 25.0, 30.0, 31.0, 46.0, 33.0, 36.0, 36.0, 43.0, 39.0, 39.0, 36.0, 52.0, 45.0, 51.0, 35.0, 28.0, 44.0, 26.0, 26.0, 26.0, 21.0, 16.0, 12.0, 12.0, 22.0, 14.0, 6.0, 9.0, 13.0, 0.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.734375, -25.895263671875, -25.05615234375, -24.217041015625, -23.3779296875, -22.538818359375, -21.69970703125, -20.860595703125, -20.021484375, -19.182373046875, -18.34326171875, -17.504150390625, -16.6650390625, -15.825927734375, -14.98681640625, -14.147705078125, -13.30859375, -12.469482421875, -11.63037109375, -10.791259765625, -9.9521484375, -9.113037109375, -8.27392578125, -7.434814453125, -6.595703125, -5.756591796875, -4.91748046875, -4.078369140625, -3.2392578125, -2.400146484375, -1.56103515625, -0.721923828125, 0.1171875, 0.956298828125, 1.79541015625, 2.634521484375, 3.4736328125, 4.312744140625, 5.15185546875, 5.990966796875, 6.830078125, 7.669189453125, 8.50830078125, 9.347412109375, 10.1865234375, 11.025634765625, 11.86474609375, 12.703857421875, 13.54296875, 14.382080078125, 15.22119140625, 16.060302734375, 16.8994140625, 17.738525390625, 18.57763671875, 19.416748046875, 20.255859375, 21.094970703125, 21.93408203125, 22.773193359375, 23.6123046875, 24.451416015625, 25.29052734375, 26.129638671875, 26.96875]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 7.0, 2.0, 1.0, 1.0, 4.0, 9.0, 14.0, 16.0, 20.0, 19.0, 18.0, 24.0, 35.0, 52.0, 65.0, 72.0, 111.0, 193.0, 246.0, 455.0, 1012.0, 3947.0, 212753.0, 3964342.0, 7711.0, 1568.0, 579.0, 274.0, 182.0, 149.0, 90.0, 71.0, 45.0, 44.0, 34.0, 27.0, 18.0, 11.0, 15.0, 18.0, 7.0, 7.0, 6.0, 8.0, 5.0, 2.0, 1.0, 1.0, 4.0, 3.0], "bins": [-341.0, -331.826171875, -322.65234375, -313.478515625, -304.3046875, -295.130859375, -285.95703125, -276.783203125, -267.609375, -258.435546875, -249.26171875, -240.087890625, -230.9140625, -221.740234375, -212.56640625, -203.392578125, -194.21875, -185.044921875, -175.87109375, -166.697265625, -157.5234375, -148.349609375, -139.17578125, -130.001953125, -120.828125, -111.654296875, -102.48046875, -93.306640625, -84.1328125, -74.958984375, -65.78515625, -56.611328125, -47.4375, -38.263671875, -29.08984375, -19.916015625, -10.7421875, -1.568359375, 7.60546875, 16.779296875, 25.953125, 35.126953125, 44.30078125, 53.474609375, 62.6484375, 71.822265625, 80.99609375, 90.169921875, 99.34375, 108.517578125, 117.69140625, 126.865234375, 136.0390625, 145.212890625, 154.38671875, 163.560546875, 172.734375, 181.908203125, 191.08203125, 200.255859375, 209.4296875, 218.603515625, 227.77734375, 236.951171875, 246.125]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 4.0, 6.0, 10.0, 9.0, 19.0, 15.0, 29.0, 43.0, 89.0, 166.0, 458.0, 947.0, 1216.0, 563.0, 228.0, 104.0, 70.0, 31.0, 14.0, 19.0, 11.0, 8.0, 6.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.625, -61.447265625, -59.26953125, -57.091796875, -54.9140625, -52.736328125, -50.55859375, -48.380859375, -46.203125, -44.025390625, -41.84765625, -39.669921875, -37.4921875, -35.314453125, -33.13671875, -30.958984375, -28.78125, -26.603515625, -24.42578125, -22.248046875, -20.0703125, -17.892578125, -15.71484375, -13.537109375, -11.359375, -9.181640625, -7.00390625, -4.826171875, -2.6484375, -0.470703125, 1.70703125, 3.884765625, 6.0625, 8.240234375, 10.41796875, 12.595703125, 14.7734375, 16.951171875, 19.12890625, 21.306640625, 23.484375, 25.662109375, 27.83984375, 30.017578125, 32.1953125, 34.373046875, 36.55078125, 38.728515625, 40.90625, 43.083984375, 45.26171875, 47.439453125, 49.6171875, 51.794921875, 53.97265625, 56.150390625, 58.328125, 60.505859375, 62.68359375, 64.861328125, 67.0390625, 69.216796875, 71.39453125, 73.572265625, 75.75]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 5.0, 5.0, 11.0, 15.0, 28.0, 33.0, 34.0, 76.0, 121.0, 269.0, 737.0, 2439.0, 18396.0, 3824163.0, 336921.0, 8531.0, 1530.0, 506.0, 208.0, 95.0, 57.0, 26.0, 25.0, 22.0, 10.0, 14.0, 4.0, 4.0, 1.0, 3.0, 2.0, 0.0, 2.0], "bins": [-314.75, -307.73046875, -300.7109375, -293.69140625, -286.671875, -279.65234375, -272.6328125, -265.61328125, -258.59375, -251.57421875, -244.5546875, -237.53515625, -230.515625, -223.49609375, -216.4765625, -209.45703125, -202.4375, -195.41796875, -188.3984375, -181.37890625, -174.359375, -167.33984375, -160.3203125, -153.30078125, -146.28125, -139.26171875, -132.2421875, -125.22265625, -118.203125, -111.18359375, -104.1640625, -97.14453125, -90.125, -83.10546875, -76.0859375, -69.06640625, -62.046875, -55.02734375, -48.0078125, -40.98828125, -33.96875, -26.94921875, -19.9296875, -12.91015625, -5.890625, 1.12890625, 8.1484375, 15.16796875, 22.1875, 29.20703125, 36.2265625, 43.24609375, 50.265625, 57.28515625, 64.3046875, 71.32421875, 78.34375, 85.36328125, 92.3828125, 99.40234375, 106.421875, 113.44140625, 120.4609375, 127.48046875, 134.5]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 9.0, 12.0, 38.0, 102.0, 346.0, 300.0, 132.0, 43.0, 19.0, 9.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-449.460205078125, -435.8744812011719, -422.2887268066406, -408.7030029296875, -395.11724853515625, -381.5315246582031, -367.94580078125, -354.36004638671875, -340.7743225097656, -327.1885986328125, -313.60284423828125, -300.0171203613281, -286.431396484375, -272.84564208984375, -259.2599182128906, -245.67417907714844, -232.08843994140625, -218.50270080566406, -204.91696166992188, -191.33123779296875, -177.74549865722656, -164.15975952148438, -150.57403564453125, -136.98829650878906, -123.40255737304688, -109.81681823730469, -96.23108673095703, -82.64535522460938, -69.05961608886719, -55.473876953125, -41.888145446777344, -28.302413940429688, -14.7166748046875, -1.1309394836425781, 12.454795837402344, 26.040531158447266, 39.62626647949219, 53.212005615234375, 66.79773712158203, 80.38346862792969, 93.96920776367188, 107.55494689941406, 121.14067840576172, 134.72640991210938, 148.31214904785156, 161.89788818359375, 175.48361206054688, 189.06935119628906, 202.65509033203125, 216.24082946777344, 229.82656860351562, 243.41229248046875, 256.998046875, 270.5837707519531, 284.16949462890625, 297.7552490234375, 311.3409729003906, 324.92669677734375, 338.512451171875, 352.0981750488281, 365.68389892578125, 379.2696533203125, 392.8553771972656, 406.44110107421875, 420.02685546875]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 8.0, 4.0, 5.0, 5.0, 11.0, 18.0, 15.0, 14.0, 22.0, 26.0, 25.0, 23.0, 25.0, 32.0, 33.0, 45.0, 48.0, 38.0, 40.0, 32.0, 43.0, 46.0, 43.0, 45.0, 44.0, 37.0, 33.0, 36.0, 32.0, 22.0, 28.0, 20.0, 21.0, 21.0, 17.0, 12.0, 7.0, 7.0, 7.0, 6.0, 7.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-125.51754760742188, -121.16007995605469, -116.80260467529297, -112.44512939453125, -108.08766174316406, -103.73019409179688, -99.37271881103516, -95.01524353027344, -90.65777587890625, -86.30030822753906, -81.94283294677734, -77.58535766601562, -73.22789001464844, -68.87042236328125, -64.51294708251953, -60.15547561645508, -55.798004150390625, -51.44053268432617, -47.08306121826172, -42.725589752197266, -38.36811828613281, -34.01064682006836, -29.653175354003906, -25.295703887939453, -20.938232421875, -16.580760955810547, -12.223289489746094, -7.865818023681641, -3.5083465576171875, 0.8491249084472656, 5.206596374511719, 9.564067840576172, 13.921524047851562, 18.278995513916016, 22.63646697998047, 26.993938446044922, 31.351409912109375, 35.70888137817383, 40.06635284423828, 44.423824310302734, 48.78129577636719, 53.13876724243164, 57.496238708496094, 61.85371017456055, 66.211181640625, 70.56864929199219, 74.9261245727539, 79.28359985351562, 83.64106750488281, 87.99853515625, 92.35601043701172, 96.71348571777344, 101.07095336914062, 105.42842102050781, 109.78589630126953, 114.14337158203125, 118.50083923339844, 122.85830688476562, 127.21578216552734, 131.57325744628906, 135.93072509765625, 140.28819274902344, 144.64566040039062, 149.00314331054688, 153.36061096191406]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 2.0, 5.0, 7.0, 15.0, 9.0, 5.0, 16.0, 10.0, 12.0, 20.0, 19.0, 22.0, 28.0, 27.0, 36.0, 32.0, 44.0, 27.0, 42.0, 38.0, 52.0, 33.0, 46.0, 56.0, 39.0, 46.0, 35.0, 40.0, 33.0, 26.0, 21.0, 23.0, 22.0, 27.0, 14.0, 16.0, 13.0, 2.0, 11.0, 4.0, 1.0, 9.0, 7.0, 5.0, 2.0, 1.0, 1.0, 3.0, 1.0, 4.0, 1.0], "bins": [-31.25, -30.3486328125, -29.447265625, -28.5458984375, -27.64453125, -26.7431640625, -25.841796875, -24.9404296875, -24.0390625, -23.1376953125, -22.236328125, -21.3349609375, -20.43359375, -19.5322265625, -18.630859375, -17.7294921875, -16.828125, -15.9267578125, -15.025390625, -14.1240234375, -13.22265625, -12.3212890625, -11.419921875, -10.5185546875, -9.6171875, -8.7158203125, -7.814453125, -6.9130859375, -6.01171875, -5.1103515625, -4.208984375, -3.3076171875, -2.40625, -1.5048828125, -0.603515625, 0.2978515625, 1.19921875, 2.1005859375, 3.001953125, 3.9033203125, 4.8046875, 5.7060546875, 6.607421875, 7.5087890625, 8.41015625, 9.3115234375, 10.212890625, 11.1142578125, 12.015625, 12.9169921875, 13.818359375, 14.7197265625, 15.62109375, 16.5224609375, 17.423828125, 18.3251953125, 19.2265625, 20.1279296875, 21.029296875, 21.9306640625, 22.83203125, 23.7333984375, 24.634765625, 25.5361328125, 26.4375]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 4.0, 3.0, 10.0, 14.0, 26.0, 38.0, 69.0, 98.0, 142.0, 201.0, 275.0, 513.0, 812.0, 1210.0, 1842.0, 2952.0, 4487.0, 6983.0, 11129.0, 17401.0, 28522.0, 46428.0, 78351.0, 134109.0, 212223.0, 198481.0, 120418.0, 70158.0, 41792.0, 25401.0, 16372.0, 10073.0, 6454.0, 4086.0, 2667.0, 1684.0, 1090.0, 731.0, 491.0, 323.0, 162.0, 108.0, 79.0, 43.0, 40.0, 27.0, 11.0, 11.0, 9.0, 7.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.314453125, -1.27191162109375, -1.2293701171875, -1.18682861328125, -1.144287109375, -1.10174560546875, -1.0592041015625, -1.01666259765625, -0.97412109375, -0.93157958984375, -0.8890380859375, -0.84649658203125, -0.803955078125, -0.76141357421875, -0.7188720703125, -0.67633056640625, -0.6337890625, -0.59124755859375, -0.5487060546875, -0.50616455078125, -0.463623046875, -0.42108154296875, -0.3785400390625, -0.33599853515625, -0.29345703125, -0.25091552734375, -0.2083740234375, -0.16583251953125, -0.123291015625, -0.08074951171875, -0.0382080078125, 0.00433349609375, 0.046875, 0.08941650390625, 0.1319580078125, 0.17449951171875, 0.217041015625, 0.25958251953125, 0.3021240234375, 0.34466552734375, 0.38720703125, 0.42974853515625, 0.4722900390625, 0.51483154296875, 0.557373046875, 0.59991455078125, 0.6424560546875, 0.68499755859375, 0.7275390625, 0.77008056640625, 0.8126220703125, 0.85516357421875, 0.897705078125, 0.94024658203125, 0.9827880859375, 1.02532958984375, 1.06787109375, 1.11041259765625, 1.1529541015625, 1.19549560546875, 1.238037109375, 1.28057861328125, 1.3231201171875, 1.36566162109375, 1.408203125]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 4.0, 4.0, 6.0, 10.0, 4.0, 9.0, 12.0, 14.0, 17.0, 19.0, 14.0, 18.0, 25.0, 30.0, 20.0, 23.0, 32.0, 36.0, 38.0, 38.0, 38.0, 35.0, 43.0, 1072.0, 41.0, 43.0, 29.0, 27.0, 46.0, 32.0, 28.0, 24.0, 30.0, 27.0, 19.0, 18.0, 16.0, 24.0, 11.0, 10.0, 6.0, 8.0, 5.0, 5.0, 9.0, 4.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-18.34375, -17.8087158203125, -17.273681640625, -16.7386474609375, -16.20361328125, -15.6685791015625, -15.133544921875, -14.5985107421875, -14.0634765625, -13.5284423828125, -12.993408203125, -12.4583740234375, -11.92333984375, -11.3883056640625, -10.853271484375, -10.3182373046875, -9.783203125, -9.2481689453125, -8.713134765625, -8.1781005859375, -7.64306640625, -7.1080322265625, -6.572998046875, -6.0379638671875, -5.5029296875, -4.9678955078125, -4.432861328125, -3.8978271484375, -3.36279296875, -2.8277587890625, -2.292724609375, -1.7576904296875, -1.22265625, -0.6876220703125, -0.152587890625, 0.3824462890625, 0.91748046875, 1.4525146484375, 1.987548828125, 2.5225830078125, 3.0576171875, 3.5926513671875, 4.127685546875, 4.6627197265625, 5.19775390625, 5.7327880859375, 6.267822265625, 6.8028564453125, 7.337890625, 7.8729248046875, 8.407958984375, 8.9429931640625, 9.47802734375, 10.0130615234375, 10.548095703125, 11.0831298828125, 11.6181640625, 12.1531982421875, 12.688232421875, 13.2232666015625, 13.75830078125, 14.2933349609375, 14.828369140625, 15.3634033203125, 15.8984375]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 7.0, 8.0, 11.0, 19.0, 25.0, 39.0, 66.0, 68.0, 117.0, 188.0, 253.0, 339.0, 577.0, 852.0, 1171.0, 1614.0, 2349.0, 3345.0, 4940.0, 6773.0, 9922.0, 14463.0, 21005.0, 32112.0, 49355.0, 77061.0, 125224.0, 1233334.0, 190142.0, 113644.0, 70928.0, 44977.0, 28991.0, 19656.0, 13267.0, 9193.0, 6381.0, 4451.0, 3127.0, 2156.0, 1579.0, 1048.0, 757.0, 508.0, 359.0, 230.0, 152.0, 138.0, 80.0, 57.0, 31.0, 20.0, 11.0, 8.0, 8.0, 2.0, 3.0, 3.0, 1.0, 2.0], "bins": [-1.0615234375, -1.0282440185546875, -0.994964599609375, -0.9616851806640625, -0.92840576171875, -0.8951263427734375, -0.861846923828125, -0.8285675048828125, -0.7952880859375, -0.7620086669921875, -0.728729248046875, -0.6954498291015625, -0.66217041015625, -0.6288909912109375, -0.595611572265625, -0.5623321533203125, -0.529052734375, -0.4957733154296875, -0.462493896484375, -0.4292144775390625, -0.39593505859375, -0.3626556396484375, -0.329376220703125, -0.2960968017578125, -0.2628173828125, -0.2295379638671875, -0.196258544921875, -0.1629791259765625, -0.12969970703125, -0.0964202880859375, -0.063140869140625, -0.0298614501953125, 0.00341796875, 0.0366973876953125, 0.069976806640625, 0.1032562255859375, 0.13653564453125, 0.1698150634765625, 0.203094482421875, 0.2363739013671875, 0.2696533203125, 0.3029327392578125, 0.336212158203125, 0.3694915771484375, 0.40277099609375, 0.4360504150390625, 0.469329833984375, 0.5026092529296875, 0.535888671875, 0.5691680908203125, 0.602447509765625, 0.6357269287109375, 0.66900634765625, 0.7022857666015625, 0.735565185546875, 0.7688446044921875, 0.8021240234375, 0.8354034423828125, 0.868682861328125, 0.9019622802734375, 0.93524169921875, 0.9685211181640625, 1.001800537109375, 1.0350799560546875, 1.068359375]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 4.0, 5.0, 6.0, 5.0, 2.0, 5.0, 12.0, 13.0, 13.0, 17.0, 31.0, 27.0, 27.0, 40.0, 52.0, 54.0, 46.0, 66.0, 64.0, 62.0, 54.0, 55.0, 64.0, 48.0, 39.0, 36.0, 31.0, 27.0, 19.0, 14.0, 7.0, 6.0, 14.0, 10.0, 4.0, 5.0, 7.0, 1.0, 6.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.007022857666015625, -0.006814539432525635, -0.0066062211990356445, -0.006397902965545654, -0.006189584732055664, -0.005981266498565674, -0.005772948265075684, -0.005564630031585693, -0.005356311798095703, -0.005147993564605713, -0.004939675331115723, -0.004731357097625732, -0.004523038864135742, -0.004314720630645752, -0.004106402397155762, -0.0038980841636657715, -0.0036897659301757812, -0.003481447696685791, -0.0032731294631958008, -0.0030648112297058105, -0.0028564929962158203, -0.00264817476272583, -0.00243985652923584, -0.0022315382957458496, -0.0020232200622558594, -0.0018149018287658691, -0.001606583595275879, -0.0013982653617858887, -0.0011899471282958984, -0.0009816288948059082, -0.000773310661315918, -0.0005649924278259277, -0.0003566741943359375, -0.00014835596084594727, 5.996227264404297e-05, 0.0002682805061340332, 0.00047659873962402344, 0.0006849169731140137, 0.0008932352066040039, 0.0011015534400939941, 0.0013098716735839844, 0.0015181899070739746, 0.0017265081405639648, 0.001934826374053955, 0.0021431446075439453, 0.0023514628410339355, 0.0025597810745239258, 0.002768099308013916, 0.0029764175415039062, 0.0031847357749938965, 0.0033930540084838867, 0.003601372241973877, 0.003809690475463867, 0.004018008708953857, 0.004226326942443848, 0.004434645175933838, 0.004642963409423828, 0.004851281642913818, 0.005059599876403809, 0.005267918109893799, 0.005476236343383789, 0.005684554576873779, 0.0058928728103637695, 0.00610119104385376, 0.00630950927734375]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 4.0, 4.0, 9.0, 12.0, 10.0, 15.0, 14.0, 19.0, 30.0, 29.0, 36.0, 55.0, 92.0, 123.0, 150.0, 274.0, 551.0, 1291.0, 129268.0, 912181.0, 2828.0, 632.0, 290.0, 170.0, 125.0, 91.0, 67.0, 39.0, 31.0, 23.0, 17.0, 11.0, 17.0, 10.0, 6.0, 8.0, 4.0, 5.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1236572265625, -0.11941719055175781, -0.11517715454101562, -0.11093711853027344, -0.10669708251953125, -0.10245704650878906, -0.09821701049804688, -0.09397697448730469, -0.0897369384765625, -0.08549690246582031, -0.08125686645507812, -0.07701683044433594, -0.07277679443359375, -0.06853675842285156, -0.06429672241210938, -0.06005668640136719, -0.055816650390625, -0.05157661437988281, -0.047336578369140625, -0.04309654235839844, -0.03885650634765625, -0.03461647033691406, -0.030376434326171875, -0.026136398315429688, -0.0218963623046875, -0.017656326293945312, -0.013416290283203125, -0.009176254272460938, -0.00493621826171875, -0.0006961822509765625, 0.003543853759765625, 0.0077838897705078125, 0.01202392578125, 0.016263961791992188, 0.020503997802734375, 0.024744033813476562, 0.02898406982421875, 0.03322410583496094, 0.037464141845703125, 0.04170417785644531, 0.0459442138671875, 0.05018424987792969, 0.054424285888671875, 0.05866432189941406, 0.06290435791015625, 0.06714439392089844, 0.07138442993164062, 0.07562446594238281, 0.079864501953125, 0.08410453796386719, 0.08834457397460938, 0.09258460998535156, 0.09682464599609375, 0.10106468200683594, 0.10530471801757812, 0.10954475402832031, 0.1137847900390625, 0.11802482604980469, 0.12226486206054688, 0.12650489807128906, 0.13074493408203125, 0.13498497009277344, 0.13922500610351562, 0.1434650421142578, 0.147705078125]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 32.0, 765.0, 209.0, 5.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00774567062035203, -0.0063897971995174885, -0.0050339242443442345, -0.003678050823509693, -0.002322177402675152, -0.0009663039818406105, 0.0003895689733326435, 0.0017454423941671848, 0.003101315815001726, 0.0044571892358362675, 0.0058130621910095215, 0.007168935611844063, 0.008524809032678604, 0.009880682453513145, 0.011236555874347687, 0.012592429295182228, 0.01394830271601677, 0.01530417613685131, 0.016660049557685852, 0.018015922978520393, 0.019371796399354935, 0.020727669820189476, 0.022083543241024017, 0.02343941479921341, 0.02479528822004795, 0.026151161640882492, 0.027507035061717033, 0.028862908482551575, 0.030218781903386116, 0.03157465532422066, 0.03293052688241005, 0.03428640216588974, 0.03564227744936943, 0.03699814900755882, 0.03835402429103851, 0.039709895849227905, 0.041065771132707596, 0.04242164269089699, 0.04377751797437668, 0.04513338953256607, 0.04648926481604576, 0.04784513637423515, 0.049201011657714844, 0.050556883215904236, 0.051912758499383926, 0.05326863005757332, 0.05462450534105301, 0.0559803768992424, 0.05733624845743179, 0.058692120015621185, 0.060047995299100876, 0.06140386685729027, 0.06275974214076996, 0.06411561369895935, 0.06547148525714874, 0.06682736426591873, 0.06818323582410812, 0.06953910738229752, 0.07089497894048691, 0.0722508579492569, 0.07360672950744629, 0.07496260106563568, 0.07631847262382507, 0.07767435163259506, 0.07903022319078445]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 5.0, 5.0, 10.0, 9.0, 10.0, 14.0, 15.0, 19.0, 19.0, 24.0, 24.0, 26.0, 30.0, 31.0, 43.0, 51.0, 44.0, 48.0, 39.0, 43.0, 44.0, 40.0, 43.0, 42.0, 32.0, 33.0, 27.0, 27.0, 45.0, 23.0, 28.0, 14.0, 12.0, 16.0, 11.0, 19.0, 9.0, 8.0, 2.0, 3.0, 7.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.004876494407653809, -0.0047376034781336784, -0.004598712548613548, -0.004459821619093418, -0.004320930689573288, -0.004182039760053158, -0.004043148830533028, -0.0039042579010128975, -0.0037653669714927673, -0.003626476041972637, -0.003487585112452507, -0.003348694182932377, -0.0032098032534122467, -0.0030709123238921165, -0.0029320213943719864, -0.0027931304648518562, -0.002654239535331726, -0.002515348605811596, -0.0023764576762914658, -0.0022375667467713356, -0.0020986758172512054, -0.0019597848877310753, -0.0018208939582109451, -0.001682003028690815, -0.0015431120991706848, -0.0014042211696505547, -0.0012653302401304245, -0.0011264393106102943, -0.0009875483810901642, -0.000848657451570034, -0.0007097665220499039, -0.0005708755925297737, -0.00043198466300964355, -0.0002930937334895134, -0.00015420280396938324, -1.5311874449253082e-05, 0.00012357905507087708, 0.00026246998459100723, 0.0004013609141111374, 0.0005402518436312675, 0.0006791427731513977, 0.0008180337026715279, 0.000956924632191658, 0.0010958155617117882, 0.0012347064912319183, 0.0013735974207520485, 0.0015124883502721786, 0.0016513792797923088, 0.001790270209312439, 0.0019291611388325691, 0.0020680520683526993, 0.0022069429978728294, 0.0023458339273929596, 0.0024847248569130898, 0.00262361578643322, 0.00276250671595335, 0.0029013976454734802, 0.0030402885749936104, 0.0031791795045137405, 0.0033180704340338707, 0.003456961363554001, 0.003595852293074131, 0.003734743222594261, 0.0038736341521143913, 0.0040125250816345215]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 2.0, 5.0, 7.0, 15.0, 9.0, 5.0, 16.0, 10.0, 12.0, 20.0, 19.0, 22.0, 28.0, 27.0, 36.0, 32.0, 44.0, 27.0, 42.0, 38.0, 52.0, 33.0, 46.0, 56.0, 39.0, 46.0, 35.0, 40.0, 33.0, 26.0, 21.0, 23.0, 22.0, 27.0, 14.0, 16.0, 13.0, 2.0, 11.0, 4.0, 1.0, 9.0, 7.0, 5.0, 2.0, 1.0, 1.0, 3.0, 1.0, 4.0, 1.0], "bins": [-31.25, -30.3486328125, -29.447265625, -28.5458984375, -27.64453125, -26.7431640625, -25.841796875, -24.9404296875, -24.0390625, -23.1376953125, -22.236328125, -21.3349609375, -20.43359375, -19.5322265625, -18.630859375, -17.7294921875, -16.828125, -15.9267578125, -15.025390625, -14.1240234375, -13.22265625, -12.3212890625, -11.419921875, -10.5185546875, -9.6171875, -8.7158203125, -7.814453125, -6.9130859375, -6.01171875, -5.1103515625, -4.208984375, -3.3076171875, -2.40625, -1.5048828125, -0.603515625, 0.2978515625, 1.19921875, 2.1005859375, 3.001953125, 3.9033203125, 4.8046875, 5.7060546875, 6.607421875, 7.5087890625, 8.41015625, 9.3115234375, 10.212890625, 11.1142578125, 12.015625, 12.9169921875, 13.818359375, 14.7197265625, 15.62109375, 16.5224609375, 17.423828125, 18.3251953125, 19.2265625, 20.1279296875, 21.029296875, 21.9306640625, 22.83203125, 23.7333984375, 24.634765625, 25.5361328125, 26.4375]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 2.0, 7.0, 13.0, 17.0, 21.0, 21.0, 31.0, 49.0, 70.0, 96.0, 110.0, 185.0, 227.0, 289.0, 410.0, 558.0, 798.0, 1207.0, 1964.0, 4516.0, 15048.0, 78815.0, 596899.0, 290521.0, 39248.0, 9049.0, 3232.0, 1570.0, 1001.0, 703.0, 496.0, 376.0, 285.0, 187.0, 164.0, 121.0, 59.0, 49.0, 33.0, 37.0, 22.0, 9.0, 9.0, 11.0, 6.0, 7.0, 3.0, 5.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-57.1875, -55.3896484375, -53.591796875, -51.7939453125, -49.99609375, -48.1982421875, -46.400390625, -44.6025390625, -42.8046875, -41.0068359375, -39.208984375, -37.4111328125, -35.61328125, -33.8154296875, -32.017578125, -30.2197265625, -28.421875, -26.6240234375, -24.826171875, -23.0283203125, -21.23046875, -19.4326171875, -17.634765625, -15.8369140625, -14.0390625, -12.2412109375, -10.443359375, -8.6455078125, -6.84765625, -5.0498046875, -3.251953125, -1.4541015625, 0.34375, 2.1416015625, 3.939453125, 5.7373046875, 7.53515625, 9.3330078125, 11.130859375, 12.9287109375, 14.7265625, 16.5244140625, 18.322265625, 20.1201171875, 21.91796875, 23.7158203125, 25.513671875, 27.3115234375, 29.109375, 30.9072265625, 32.705078125, 34.5029296875, 36.30078125, 38.0986328125, 39.896484375, 41.6943359375, 43.4921875, 45.2900390625, 47.087890625, 48.8857421875, 50.68359375, 52.4814453125, 54.279296875, 56.0771484375, 57.875]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 8.0, 8.0, 14.0, 17.0, 20.0, 27.0, 30.0, 29.0, 48.0, 41.0, 65.0, 69.0, 81.0, 134.0, 1473.0, 360.0, 134.0, 104.0, 62.0, 57.0, 55.0, 45.0, 31.0, 25.0, 20.0, 12.0, 17.0, 15.0, 12.0, 8.0, 4.0, 6.0, 1.0, 2.0, 2.0, 1.0, 6.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-72.6875, -70.33984375, -67.9921875, -65.64453125, -63.296875, -60.94921875, -58.6015625, -56.25390625, -53.90625, -51.55859375, -49.2109375, -46.86328125, -44.515625, -42.16796875, -39.8203125, -37.47265625, -35.125, -32.77734375, -30.4296875, -28.08203125, -25.734375, -23.38671875, -21.0390625, -18.69140625, -16.34375, -13.99609375, -11.6484375, -9.30078125, -6.953125, -4.60546875, -2.2578125, 0.08984375, 2.4375, 4.78515625, 7.1328125, 9.48046875, 11.828125, 14.17578125, 16.5234375, 18.87109375, 21.21875, 23.56640625, 25.9140625, 28.26171875, 30.609375, 32.95703125, 35.3046875, 37.65234375, 40.0, 42.34765625, 44.6953125, 47.04296875, 49.390625, 51.73828125, 54.0859375, 56.43359375, 58.78125, 61.12890625, 63.4765625, 65.82421875, 68.171875, 70.51953125, 72.8671875, 75.21484375, 77.5625]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 4.0, 7.0, 5.0, 9.0, 11.0, 12.0, 15.0, 16.0, 15.0, 18.0, 34.0, 32.0, 48.0, 76.0, 117.0, 175.0, 299.0, 593.0, 1520.0, 65022.0, 3073078.0, 2726.0, 793.0, 385.0, 238.0, 140.0, 71.0, 50.0, 36.0, 43.0, 29.0, 13.0, 11.0, 17.0, 11.0, 11.0, 9.0, 9.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-287.75, -279.3359375, -270.921875, -262.5078125, -254.09375, -245.6796875, -237.265625, -228.8515625, -220.4375, -212.0234375, -203.609375, -195.1953125, -186.78125, -178.3671875, -169.953125, -161.5390625, -153.125, -144.7109375, -136.296875, -127.8828125, -119.46875, -111.0546875, -102.640625, -94.2265625, -85.8125, -77.3984375, -68.984375, -60.5703125, -52.15625, -43.7421875, -35.328125, -26.9140625, -18.5, -10.0859375, -1.671875, 6.7421875, 15.15625, 23.5703125, 31.984375, 40.3984375, 48.8125, 57.2265625, 65.640625, 74.0546875, 82.46875, 90.8828125, 99.296875, 107.7109375, 116.125, 124.5390625, 132.953125, 141.3671875, 149.78125, 158.1953125, 166.609375, 175.0234375, 183.4375, 191.8515625, 200.265625, 208.6796875, 217.09375, 225.5078125, 233.921875, 242.3359375, 250.75]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 14.0, 63.0, 449.0, 424.0, 53.0, 13.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-856.8184814453125, -840.9448852539062, -825.0713500976562, -809.19775390625, -793.32421875, -777.4506225585938, -761.5770874023438, -745.7034912109375, -729.8299560546875, -713.9563598632812, -698.0828247070312, -682.209228515625, -666.335693359375, -650.4620971679688, -634.5885620117188, -618.7149658203125, -602.8414306640625, -586.9678344726562, -571.0942993164062, -555.220703125, -539.34716796875, -523.4735717773438, -507.60003662109375, -491.7264709472656, -475.8528747558594, -459.97930908203125, -444.1057434082031, -428.232177734375, -412.3586120605469, -396.48504638671875, -380.6114807128906, -364.7379150390625, -348.8643798828125, -332.9908142089844, -317.11724853515625, -301.2436828613281, -285.3701171875, -269.4965515136719, -253.62298583984375, -237.74942016601562, -221.87582397460938, -206.00225830078125, -190.12869262695312, -174.255126953125, -158.38156127929688, -142.50799560546875, -126.6344223022461, -110.76085662841797, -94.88729858398438, -79.01373291015625, -63.140167236328125, -47.266597747802734, -31.39303207397461, -15.519462585449219, 0.35410308837890625, 16.22766876220703, 32.101234436035156, 47.97480010986328, 63.848365783691406, 79.72193908691406, 95.59550476074219, 111.46907043457031, 127.34263610839844, 143.21620178222656, 159.0897674560547]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 3.0, 9.0, 7.0, 12.0, 4.0, 13.0, 12.0, 17.0, 30.0, 15.0, 18.0, 25.0, 18.0, 29.0, 29.0, 39.0, 45.0, 35.0, 41.0, 42.0, 50.0, 47.0, 41.0, 55.0, 54.0, 35.0, 41.0, 34.0, 40.0, 27.0, 28.0, 20.0, 18.0, 8.0, 12.0, 13.0, 9.0, 10.0, 7.0, 7.0, 4.0, 2.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-208.3531494140625, -202.52880859375, -196.7044677734375, -190.88014221191406, -185.05580139160156, -179.23146057128906, -173.40711975097656, -167.58279418945312, -161.75845336914062, -155.93411254882812, -150.10977172851562, -144.2854461669922, -138.4611053466797, -132.6367645263672, -126.81242370605469, -120.98809051513672, -115.16374969482422, -109.33940887451172, -103.51507568359375, -97.69073486328125, -91.86640167236328, -86.04206085205078, -80.21772766113281, -74.39338684082031, -68.56904602050781, -62.74470901489258, -56.920372009277344, -51.096031188964844, -45.271697998046875, -39.447357177734375, -33.62302017211914, -27.798683166503906, -21.974349975585938, -16.150012969970703, -10.325675010681152, -4.501337051391602, 1.3229999542236328, 7.147336959838867, 12.971675872802734, 18.79601287841797, 24.620349884033203, 30.444686889648438, 36.26902389526367, 42.093360900878906, 47.917701721191406, 53.742034912109375, 59.566375732421875, 65.39071655273438, 71.21504974365234, 77.03939056396484, 82.86372375488281, 88.68806457519531, 94.51239776611328, 100.33673858642578, 106.16107177734375, 111.98541259765625, 117.80975341796875, 123.63409423828125, 129.45843505859375, 135.2827606201172, 141.1071014404297, 146.9314422607422, 152.7557830810547, 158.58010864257812, 164.40444946289062]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 8.0, 10.0, 8.0, 9.0, 8.0, 10.0, 16.0, 14.0, 23.0, 22.0, 40.0, 31.0, 29.0, 35.0, 43.0, 44.0, 44.0, 45.0, 45.0, 61.0, 39.0, 54.0, 47.0, 27.0, 33.0, 37.0, 23.0, 29.0, 26.0, 34.0, 26.0, 16.0, 7.0, 7.0, 14.0, 10.0, 8.0, 6.0, 4.0, 3.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0], "bins": [-37.78125, -36.7666015625, -35.751953125, -34.7373046875, -33.72265625, -32.7080078125, -31.693359375, -30.6787109375, -29.6640625, -28.6494140625, -27.634765625, -26.6201171875, -25.60546875, -24.5908203125, -23.576171875, -22.5615234375, -21.546875, -20.5322265625, -19.517578125, -18.5029296875, -17.48828125, -16.4736328125, -15.458984375, -14.4443359375, -13.4296875, -12.4150390625, -11.400390625, -10.3857421875, -9.37109375, -8.3564453125, -7.341796875, -6.3271484375, -5.3125, -4.2978515625, -3.283203125, -2.2685546875, -1.25390625, -0.2392578125, 0.775390625, 1.7900390625, 2.8046875, 3.8193359375, 4.833984375, 5.8486328125, 6.86328125, 7.8779296875, 8.892578125, 9.9072265625, 10.921875, 11.9365234375, 12.951171875, 13.9658203125, 14.98046875, 15.9951171875, 17.009765625, 18.0244140625, 19.0390625, 20.0537109375, 21.068359375, 22.0830078125, 23.09765625, 24.1123046875, 25.126953125, 26.1416015625, 27.15625]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 8.0, 7.0, 7.0, 9.0, 8.0, 6.0, 13.0, 16.0, 14.0, 13.0, 21.0, 44.0, 48.0, 57.0, 92.0, 162.0, 279.0, 493.0, 829.0, 1651.0, 3781.0, 15815.0, 1571764.0, 2570504.0, 20434.0, 4201.0, 1797.0, 892.0, 506.0, 267.0, 177.0, 97.0, 64.0, 51.0, 27.0, 30.0, 21.0, 11.0, 17.0, 9.0, 17.0, 5.0, 8.0, 6.0, 6.0, 0.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-116.875, -112.708984375, -108.54296875, -104.376953125, -100.2109375, -96.044921875, -91.87890625, -87.712890625, -83.546875, -79.380859375, -75.21484375, -71.048828125, -66.8828125, -62.716796875, -58.55078125, -54.384765625, -50.21875, -46.052734375, -41.88671875, -37.720703125, -33.5546875, -29.388671875, -25.22265625, -21.056640625, -16.890625, -12.724609375, -8.55859375, -4.392578125, -0.2265625, 3.939453125, 8.10546875, 12.271484375, 16.4375, 20.603515625, 24.76953125, 28.935546875, 33.1015625, 37.267578125, 41.43359375, 45.599609375, 49.765625, 53.931640625, 58.09765625, 62.263671875, 66.4296875, 70.595703125, 74.76171875, 78.927734375, 83.09375, 87.259765625, 91.42578125, 95.591796875, 99.7578125, 103.923828125, 108.08984375, 112.255859375, 116.421875, 120.587890625, 124.75390625, 128.919921875, 133.0859375, 137.251953125, 141.41796875, 145.583984375, 149.75]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 3.0, 4.0, 9.0, 18.0, 22.0, 13.0, 29.0, 39.0, 72.0, 109.0, 197.0, 376.0, 620.0, 891.0, 634.0, 397.0, 217.0, 130.0, 91.0, 44.0, 41.0, 29.0, 26.0, 11.0, 8.0, 7.0, 7.0, 7.0, 3.0, 2.0, 4.0, 0.0, 4.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-63.96875, -62.064453125, -60.16015625, -58.255859375, -56.3515625, -54.447265625, -52.54296875, -50.638671875, -48.734375, -46.830078125, -44.92578125, -43.021484375, -41.1171875, -39.212890625, -37.30859375, -35.404296875, -33.5, -31.595703125, -29.69140625, -27.787109375, -25.8828125, -23.978515625, -22.07421875, -20.169921875, -18.265625, -16.361328125, -14.45703125, -12.552734375, -10.6484375, -8.744140625, -6.83984375, -4.935546875, -3.03125, -1.126953125, 0.77734375, 2.681640625, 4.5859375, 6.490234375, 8.39453125, 10.298828125, 12.203125, 14.107421875, 16.01171875, 17.916015625, 19.8203125, 21.724609375, 23.62890625, 25.533203125, 27.4375, 29.341796875, 31.24609375, 33.150390625, 35.0546875, 36.958984375, 38.86328125, 40.767578125, 42.671875, 44.576171875, 46.48046875, 48.384765625, 50.2890625, 52.193359375, 54.09765625, 56.001953125, 57.90625]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 0.0, 4.0, 1.0, 2.0, 2.0, 5.0, 6.0, 8.0, 6.0, 11.0, 17.0, 17.0, 25.0, 37.0, 80.0, 142.0, 222.0, 452.0, 966.0, 2099.0, 5005.0, 16531.0, 101886.0, 3599947.0, 420221.0, 32713.0, 8103.0, 3008.0, 1348.0, 683.0, 316.0, 154.0, 101.0, 59.0, 36.0, 15.0, 12.0, 12.0, 13.0, 1.0, 6.0, 5.0, 4.0, 2.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-102.75, -99.4052734375, -96.060546875, -92.7158203125, -89.37109375, -86.0263671875, -82.681640625, -79.3369140625, -75.9921875, -72.6474609375, -69.302734375, -65.9580078125, -62.61328125, -59.2685546875, -55.923828125, -52.5791015625, -49.234375, -45.8896484375, -42.544921875, -39.2001953125, -35.85546875, -32.5107421875, -29.166015625, -25.8212890625, -22.4765625, -19.1318359375, -15.787109375, -12.4423828125, -9.09765625, -5.7529296875, -2.408203125, 0.9365234375, 4.28125, 7.6259765625, 10.970703125, 14.3154296875, 17.66015625, 21.0048828125, 24.349609375, 27.6943359375, 31.0390625, 34.3837890625, 37.728515625, 41.0732421875, 44.41796875, 47.7626953125, 51.107421875, 54.4521484375, 57.796875, 61.1416015625, 64.486328125, 67.8310546875, 71.17578125, 74.5205078125, 77.865234375, 81.2099609375, 84.5546875, 87.8994140625, 91.244140625, 94.5888671875, 97.93359375, 101.2783203125, 104.623046875, 107.9677734375, 111.3125]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 47.0, 733.0, 223.0, 7.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1271.74951171875, -1222.289794921875, -1172.830078125, -1123.370361328125, -1073.91064453125, -1024.450927734375, -974.9911499023438, -925.5313720703125, -876.0716552734375, -826.6119384765625, -777.1522216796875, -727.6925048828125, -678.2327270507812, -628.7730102539062, -579.3132934570312, -529.853515625, -480.39385986328125, -430.93414306640625, -381.4743957519531, -332.0146789550781, -282.554931640625, -233.09521484375, -183.635498046875, -134.17575073242188, -84.71603393554688, -35.25630569458008, 14.203422546386719, 63.66314697265625, 113.12287902832031, 162.58261108398438, 212.04232788085938, 261.5020751953125, 310.9617919921875, 360.4215087890625, 409.8812561035156, 459.3409729003906, 508.80072021484375, 558.2604370117188, 607.7201538085938, 657.179931640625, 706.6396484375, 756.099365234375, 805.55908203125, 855.018798828125, 904.4785766601562, 953.9382934570312, 1003.3980102539062, 1052.8577880859375, 1102.3173828125, 1151.777099609375, 1201.23681640625, 1250.696533203125, 1300.15625, 1349.615966796875, 1399.07568359375, 1448.5355224609375, 1497.9952392578125, 1547.4549560546875, 1596.9146728515625, 1646.3743896484375, 1695.8341064453125, 1745.2939453125, 1794.753662109375, 1844.21337890625, 1893.673095703125]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 7.0, 7.0, 8.0, 4.0, 9.0, 6.0, 10.0, 24.0, 14.0, 9.0, 30.0, 14.0, 35.0, 26.0, 31.0, 25.0, 30.0, 33.0, 36.0, 29.0, 40.0, 50.0, 34.0, 31.0, 32.0, 45.0, 43.0, 43.0, 28.0, 38.0, 29.0, 21.0, 20.0, 25.0, 17.0, 18.0, 17.0, 16.0, 17.0, 11.0, 9.0, 7.0, 8.0, 10.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-154.60592651367188, -149.64340209960938, -144.68089294433594, -139.71836853027344, -134.75584411621094, -129.79331970214844, -124.830810546875, -119.8682861328125, -114.90576171875, -109.94324493408203, -104.98072052001953, -100.01820373535156, -95.05567932128906, -90.0931625366211, -85.13064575195312, -80.16812133789062, -75.20560455322266, -70.24308776855469, -65.28056335449219, -60.31804656982422, -55.35552215576172, -50.39300537109375, -45.430484771728516, -40.46796417236328, -35.50544357299805, -30.542922973632812, -25.580402374267578, -20.617883682250977, -15.655363082885742, -10.692842483520508, -5.730323791503906, -0.7678031921386719, 4.1947174072265625, 9.157238006591797, 14.119757652282715, 19.082277297973633, 24.044797897338867, 29.0073184967041, 33.9698371887207, 38.93235778808594, 43.89487838745117, 48.857398986816406, 53.81991958618164, 58.782440185546875, 63.744956970214844, 68.70748138427734, 73.66999816894531, 78.63252258300781, 83.59503936767578, 88.55755615234375, 93.52008056640625, 98.48259735107422, 103.44512176513672, 108.40763854980469, 113.37016296386719, 118.33267974853516, 123.29519653320312, 128.25772094726562, 133.22023010253906, 138.18275451660156, 143.14527893066406, 148.10780334472656, 153.0703125, 158.0328369140625, 162.995361328125]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 4.0, 5.0, 5.0, 12.0, 9.0, 11.0, 13.0, 18.0, 20.0, 19.0, 26.0, 24.0, 33.0, 23.0, 30.0, 39.0, 33.0, 48.0, 41.0, 49.0, 40.0, 44.0, 37.0, 41.0, 42.0, 50.0, 29.0, 25.0, 37.0, 29.0, 33.0, 24.0, 15.0, 17.0, 15.0, 11.0, 10.0, 10.0, 6.0, 2.0, 2.0, 8.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.65625, -24.794921875, -23.93359375, -23.072265625, -22.2109375, -21.349609375, -20.48828125, -19.626953125, -18.765625, -17.904296875, -17.04296875, -16.181640625, -15.3203125, -14.458984375, -13.59765625, -12.736328125, -11.875, -11.013671875, -10.15234375, -9.291015625, -8.4296875, -7.568359375, -6.70703125, -5.845703125, -4.984375, -4.123046875, -3.26171875, -2.400390625, -1.5390625, -0.677734375, 0.18359375, 1.044921875, 1.90625, 2.767578125, 3.62890625, 4.490234375, 5.3515625, 6.212890625, 7.07421875, 7.935546875, 8.796875, 9.658203125, 10.51953125, 11.380859375, 12.2421875, 13.103515625, 13.96484375, 14.826171875, 15.6875, 16.548828125, 17.41015625, 18.271484375, 19.1328125, 19.994140625, 20.85546875, 21.716796875, 22.578125, 23.439453125, 24.30078125, 25.162109375, 26.0234375, 26.884765625, 27.74609375, 28.607421875, 29.46875]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 4.0, 7.0, 9.0, 9.0, 13.0, 17.0, 22.0, 43.0, 45.0, 81.0, 101.0, 164.0, 196.0, 335.0, 459.0, 618.0, 896.0, 1315.0, 1869.0, 2655.0, 3983.0, 5968.0, 9263.0, 14581.0, 23389.0, 37562.0, 61402.0, 103722.0, 171016.0, 221214.0, 150704.0, 90606.0, 54100.0, 32879.0, 20685.0, 13229.0, 8529.0, 5458.0, 3673.0, 2402.0, 1601.0, 1098.0, 770.0, 508.0, 382.0, 275.0, 216.0, 150.0, 93.0, 71.0, 45.0, 46.0, 23.0, 18.0, 17.0, 12.0, 4.0, 3.0, 5.0, 4.0, 2.0, 5.0, 2.0], "bins": [-1.2021484375, -1.162567138671875, -1.12298583984375, -1.083404541015625, -1.0438232421875, -1.004241943359375, -0.96466064453125, -0.925079345703125, -0.885498046875, -0.845916748046875, -0.80633544921875, -0.766754150390625, -0.7271728515625, -0.687591552734375, -0.64801025390625, -0.608428955078125, -0.56884765625, -0.529266357421875, -0.48968505859375, -0.450103759765625, -0.4105224609375, -0.370941162109375, -0.33135986328125, -0.291778564453125, -0.252197265625, -0.212615966796875, -0.17303466796875, -0.133453369140625, -0.0938720703125, -0.054290771484375, -0.01470947265625, 0.024871826171875, 0.064453125, 0.104034423828125, 0.14361572265625, 0.183197021484375, 0.2227783203125, 0.262359619140625, 0.30194091796875, 0.341522216796875, 0.381103515625, 0.420684814453125, 0.46026611328125, 0.499847412109375, 0.5394287109375, 0.579010009765625, 0.61859130859375, 0.658172607421875, 0.69775390625, 0.737335205078125, 0.77691650390625, 0.816497802734375, 0.8560791015625, 0.895660400390625, 0.93524169921875, 0.974822998046875, 1.014404296875, 1.053985595703125, 1.09356689453125, 1.133148193359375, 1.1727294921875, 1.212310791015625, 1.25189208984375, 1.291473388671875, 1.3310546875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 1.0, 3.0, 6.0, 9.0, 5.0, 16.0, 15.0, 19.0, 19.0, 34.0, 18.0, 18.0, 35.0, 27.0, 35.0, 47.0, 44.0, 43.0, 48.0, 51.0, 1070.0, 49.0, 42.0, 37.0, 43.0, 38.0, 18.0, 35.0, 25.0, 19.0, 29.0, 21.0, 19.0, 23.0, 13.0, 15.0, 6.0, 8.0, 9.0, 7.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 3.0], "bins": [-21.234375, -20.6632080078125, -20.092041015625, -19.5208740234375, -18.94970703125, -18.3785400390625, -17.807373046875, -17.2362060546875, -16.6650390625, -16.0938720703125, -15.522705078125, -14.9515380859375, -14.38037109375, -13.8092041015625, -13.238037109375, -12.6668701171875, -12.095703125, -11.5245361328125, -10.953369140625, -10.3822021484375, -9.81103515625, -9.2398681640625, -8.668701171875, -8.0975341796875, -7.5263671875, -6.9552001953125, -6.384033203125, -5.8128662109375, -5.24169921875, -4.6705322265625, -4.099365234375, -3.5281982421875, -2.95703125, -2.3858642578125, -1.814697265625, -1.2435302734375, -0.67236328125, -0.1011962890625, 0.469970703125, 1.0411376953125, 1.6123046875, 2.1834716796875, 2.754638671875, 3.3258056640625, 3.89697265625, 4.4681396484375, 5.039306640625, 5.6104736328125, 6.181640625, 6.7528076171875, 7.323974609375, 7.8951416015625, 8.46630859375, 9.0374755859375, 9.608642578125, 10.1798095703125, 10.7509765625, 11.3221435546875, 11.893310546875, 12.4644775390625, 13.03564453125, 13.6068115234375, 14.177978515625, 14.7491455078125, 15.3203125]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 5.0, 6.0, 14.0, 14.0, 21.0, 35.0, 50.0, 81.0, 156.0, 215.0, 343.0, 481.0, 829.0, 1340.0, 1992.0, 3049.0, 4852.0, 7420.0, 11453.0, 17847.0, 28486.0, 47282.0, 82383.0, 146918.0, 1281365.0, 192071.0, 108891.0, 61149.0, 36168.0, 22373.0, 14119.0, 9188.0, 5691.0, 3954.0, 2486.0, 1573.0, 1011.0, 667.0, 418.0, 274.0, 173.0, 113.0, 70.0, 35.0, 24.0, 17.0, 18.0, 8.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.2080078125, -1.169952392578125, -1.13189697265625, -1.093841552734375, -1.0557861328125, -1.017730712890625, -0.97967529296875, -0.941619873046875, -0.903564453125, -0.865509033203125, -0.82745361328125, -0.789398193359375, -0.7513427734375, -0.713287353515625, -0.67523193359375, -0.637176513671875, -0.59912109375, -0.561065673828125, -0.52301025390625, -0.484954833984375, -0.4468994140625, -0.408843994140625, -0.37078857421875, -0.332733154296875, -0.294677734375, -0.256622314453125, -0.21856689453125, -0.180511474609375, -0.1424560546875, -0.104400634765625, -0.06634521484375, -0.028289794921875, 0.009765625, 0.047821044921875, 0.08587646484375, 0.123931884765625, 0.1619873046875, 0.200042724609375, 0.23809814453125, 0.276153564453125, 0.314208984375, 0.352264404296875, 0.39031982421875, 0.428375244140625, 0.4664306640625, 0.504486083984375, 0.54254150390625, 0.580596923828125, 0.61865234375, 0.656707763671875, 0.69476318359375, 0.732818603515625, 0.7708740234375, 0.808929443359375, 0.84698486328125, 0.885040283203125, 0.923095703125, 0.961151123046875, 0.99920654296875, 1.037261962890625, 1.0753173828125, 1.113372802734375, 1.15142822265625, 1.189483642578125, 1.2275390625]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 0.0, 5.0, 2.0, 3.0, 6.0, 5.0, 10.0, 9.0, 12.0, 23.0, 14.0, 27.0, 43.0, 61.0, 86.0, 100.0, 95.0, 102.0, 103.0, 83.0, 56.0, 44.0, 29.0, 21.0, 17.0, 8.0, 7.0, 7.0, 8.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0111236572265625, -0.01075279712677002, -0.010381937026977539, -0.010011076927185059, -0.009640216827392578, -0.009269356727600098, -0.008898496627807617, -0.008527636528015137, -0.008156776428222656, -0.007785916328430176, -0.007415056228637695, -0.007044196128845215, -0.006673336029052734, -0.006302475929260254, -0.0059316158294677734, -0.005560755729675293, -0.0051898956298828125, -0.004819035530090332, -0.0044481754302978516, -0.004077315330505371, -0.0037064552307128906, -0.00333559513092041, -0.0029647350311279297, -0.0025938749313354492, -0.0022230148315429688, -0.0018521547317504883, -0.0014812946319580078, -0.0011104345321655273, -0.0007395744323730469, -0.0003687143325805664, 2.1457672119140625e-06, 0.00037300586700439453, 0.000743865966796875, 0.0011147260665893555, 0.001485586166381836, 0.0018564462661743164, 0.002227306365966797, 0.0025981664657592773, 0.002969026565551758, 0.0033398866653442383, 0.0037107467651367188, 0.004081606864929199, 0.00445246696472168, 0.00482332706451416, 0.005194187164306641, 0.005565047264099121, 0.0059359073638916016, 0.006306767463684082, 0.0066776275634765625, 0.007048487663269043, 0.0074193477630615234, 0.007790207862854004, 0.008161067962646484, 0.008531928062438965, 0.008902788162231445, 0.009273648262023926, 0.009644508361816406, 0.010015368461608887, 0.010386228561401367, 0.010757088661193848, 0.011127948760986328, 0.011498808860778809, 0.011869668960571289, 0.01224052906036377, 0.01261138916015625]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 6.0, 8.0, 12.0, 10.0, 11.0, 11.0, 18.0, 31.0, 53.0, 59.0, 116.0, 175.0, 404.0, 1188.0, 914050.0, 130599.0, 917.0, 339.0, 191.0, 106.0, 59.0, 38.0, 39.0, 25.0, 20.0, 12.0, 10.0, 11.0, 4.0, 8.0, 4.0, 2.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25830078125, -0.2506828308105469, -0.24306488037109375, -0.23544692993164062, -0.2278289794921875, -0.22021102905273438, -0.21259307861328125, -0.20497512817382812, -0.197357177734375, -0.18973922729492188, -0.18212127685546875, -0.17450332641601562, -0.1668853759765625, -0.15926742553710938, -0.15164947509765625, -0.14403152465820312, -0.13641357421875, -0.12879562377929688, -0.12117767333984375, -0.11355972290039062, -0.1059417724609375, -0.09832382202148438, -0.09070587158203125, -0.08308792114257812, -0.075469970703125, -0.06785202026367188, -0.06023406982421875, -0.052616119384765625, -0.0449981689453125, -0.037380218505859375, -0.02976226806640625, -0.022144317626953125, -0.0145263671875, -0.006908416748046875, 0.00070953369140625, 0.008327484130859375, 0.0159454345703125, 0.023563385009765625, 0.03118133544921875, 0.038799285888671875, 0.046417236328125, 0.054035186767578125, 0.06165313720703125, 0.06927108764648438, 0.0768890380859375, 0.08450698852539062, 0.09212493896484375, 0.09974288940429688, 0.10736083984375, 0.11497879028320312, 0.12259674072265625, 0.13021469116210938, 0.1378326416015625, 0.14545059204101562, 0.15306854248046875, 0.16068649291992188, 0.168304443359375, 0.17592239379882812, 0.18354034423828125, 0.19115829467773438, 0.1987762451171875, 0.20639419555664062, 0.21401214599609375, 0.22163009643554688, 0.229248046875]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 43.0, 958.0, 12.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.010794905945658684, -0.007518281228840351, -0.004241656046360731, -0.0009650308638811111, 0.0023115938529372215, 0.005588218569755554, 0.008864844217896461, 0.01214146800339222, 0.015418093651533127, 0.018694719299674034, 0.021971343085169792, 0.0252479687333107, 0.028524592518806458, 0.031801216304302216, 0.03507784381508827, 0.03835446760058403, 0.04163109511137009, 0.044907718896865845, 0.0481843464076519, 0.05146097019314766, 0.05473759397864342, 0.058014221489429474, 0.06129084527492523, 0.06456746906042099, 0.06784409284591675, 0.0711207166314125, 0.07439734041690826, 0.07767397165298462, 0.08095059543848038, 0.08422721922397614, 0.0875038430094719, 0.09078046679496765, 0.09405709058046341, 0.09733371436595917, 0.10061033815145493, 0.10388696193695068, 0.10716359317302704, 0.1104402169585228, 0.11371684074401855, 0.11699346452951431, 0.12027008831501007, 0.12354671210050583, 0.1268233358860016, 0.13009996712207794, 0.1333765834569931, 0.13665321469306946, 0.13992983102798462, 0.14320646226406097, 0.14648309350013733, 0.14975972473621368, 0.15303634107112885, 0.1563129723072052, 0.15958958864212036, 0.16286621987819672, 0.16614285111427307, 0.16941946744918823, 0.1726960837841034, 0.17597271502017975, 0.1792493313550949, 0.18252596259117126, 0.18580257892608643, 0.18907921016216278, 0.19235584139823914, 0.1956324577331543, 0.19890908896923065]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 7.0, 9.0, 13.0, 12.0, 12.0, 29.0, 22.0, 45.0, 48.0, 60.0, 58.0, 72.0, 66.0, 75.0, 60.0, 64.0, 74.0, 54.0, 41.0, 38.0, 32.0, 29.0, 26.0, 26.0, 17.0, 7.0, 4.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.01441192626953125, -0.014080301858484745, -0.01374867744743824, -0.013417053036391735, -0.01308542862534523, -0.012753804214298725, -0.01242217980325222, -0.012090555392205715, -0.01175893098115921, -0.011427306570112705, -0.0110956821590662, -0.010764057748019695, -0.01043243333697319, -0.010100808925926685, -0.00976918451488018, -0.009437560103833675, -0.00910593569278717, -0.008774311281740665, -0.00844268687069416, -0.008111062459647655, -0.0077794380486011505, -0.0074478136375546455, -0.0071161892265081406, -0.006784564815461636, -0.006452940404415131, -0.006121315993368626, -0.005789691582322121, -0.005458067171275616, -0.005126442760229111, -0.004794818349182606, -0.004463193938136101, -0.004131569527089596, -0.003799945116043091, -0.003468320704996586, -0.003136696293950081, -0.002805071882903576, -0.002473447471857071, -0.002141823060810566, -0.001810198649764061, -0.001478574238717556, -0.001146949827671051, -0.000815325416624546, -0.0004837010055780411, -0.0001520765945315361, 0.00017954781651496887, 0.0005111722275614738, 0.0008427966386079788, 0.0011744210496544838, 0.0015060454607009888, 0.0018376698717474937, 0.0021692942827939987, 0.0025009186938405037, 0.0028325431048870087, 0.0031641675159335136, 0.0034957919269800186, 0.0038274163380265236, 0.0041590407490730286, 0.0044906651601195335, 0.0048222895711660385, 0.0051539139822125435, 0.0054855383932590485, 0.0058171628043055534, 0.006148787215352058, 0.006480411626398563, 0.006812036037445068]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 4.0, 5.0, 5.0, 12.0, 9.0, 11.0, 13.0, 18.0, 20.0, 19.0, 26.0, 24.0, 33.0, 23.0, 30.0, 39.0, 33.0, 48.0, 41.0, 49.0, 41.0, 43.0, 37.0, 41.0, 42.0, 50.0, 29.0, 25.0, 37.0, 29.0, 33.0, 24.0, 15.0, 17.0, 15.0, 11.0, 10.0, 10.0, 6.0, 2.0, 2.0, 8.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.65625, -24.794921875, -23.93359375, -23.072265625, -22.2109375, -21.349609375, -20.48828125, -19.626953125, -18.765625, -17.904296875, -17.04296875, -16.181640625, -15.3203125, -14.458984375, -13.59765625, -12.736328125, -11.875, -11.013671875, -10.15234375, -9.291015625, -8.4296875, -7.568359375, -6.70703125, -5.845703125, -4.984375, -4.123046875, -3.26171875, -2.400390625, -1.5390625, -0.677734375, 0.18359375, 1.044921875, 1.90625, 2.767578125, 3.62890625, 4.490234375, 5.3515625, 6.212890625, 7.07421875, 7.935546875, 8.796875, 9.658203125, 10.51953125, 11.380859375, 12.2421875, 13.103515625, 13.96484375, 14.826171875, 15.6875, 16.548828125, 17.41015625, 18.271484375, 19.1328125, 19.994140625, 20.85546875, 21.716796875, 22.578125, 23.439453125, 24.30078125, 25.162109375, 26.0234375, 26.884765625, 27.74609375, 28.607421875, 29.46875]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 4.0, 7.0, 7.0, 11.0, 17.0, 25.0, 26.0, 33.0, 46.0, 74.0, 101.0, 143.0, 191.0, 227.0, 360.0, 520.0, 714.0, 968.0, 1470.0, 2222.0, 3798.0, 9768.0, 50690.0, 716051.0, 224503.0, 21530.0, 6132.0, 2972.0, 1720.0, 1246.0, 823.0, 624.0, 399.0, 291.0, 219.0, 160.0, 133.0, 86.0, 59.0, 55.0, 32.0, 30.0, 21.0, 13.0, 10.0, 6.0, 6.0, 4.0, 2.0, 4.0, 3.0, 1.0, 2.0], "bins": [-81.375, -79.03515625, -76.6953125, -74.35546875, -72.015625, -69.67578125, -67.3359375, -64.99609375, -62.65625, -60.31640625, -57.9765625, -55.63671875, -53.296875, -50.95703125, -48.6171875, -46.27734375, -43.9375, -41.59765625, -39.2578125, -36.91796875, -34.578125, -32.23828125, -29.8984375, -27.55859375, -25.21875, -22.87890625, -20.5390625, -18.19921875, -15.859375, -13.51953125, -11.1796875, -8.83984375, -6.5, -4.16015625, -1.8203125, 0.51953125, 2.859375, 5.19921875, 7.5390625, 9.87890625, 12.21875, 14.55859375, 16.8984375, 19.23828125, 21.578125, 23.91796875, 26.2578125, 28.59765625, 30.9375, 33.27734375, 35.6171875, 37.95703125, 40.296875, 42.63671875, 44.9765625, 47.31640625, 49.65625, 51.99609375, 54.3359375, 56.67578125, 59.015625, 61.35546875, 63.6953125, 66.03515625, 68.375]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 4.0, 8.0, 11.0, 16.0, 14.0, 16.0, 23.0, 22.0, 22.0, 35.0, 40.0, 38.0, 47.0, 55.0, 74.0, 111.0, 368.0, 1545.0, 141.0, 80.0, 64.0, 54.0, 42.0, 32.0, 25.0, 22.0, 21.0, 14.0, 18.0, 8.0, 17.0, 11.0, 7.0, 9.0, 7.0, 4.0, 6.0, 7.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.0625, -49.1787109375, -47.294921875, -45.4111328125, -43.52734375, -41.6435546875, -39.759765625, -37.8759765625, -35.9921875, -34.1083984375, -32.224609375, -30.3408203125, -28.45703125, -26.5732421875, -24.689453125, -22.8056640625, -20.921875, -19.0380859375, -17.154296875, -15.2705078125, -13.38671875, -11.5029296875, -9.619140625, -7.7353515625, -5.8515625, -3.9677734375, -2.083984375, -0.2001953125, 1.68359375, 3.5673828125, 5.451171875, 7.3349609375, 9.21875, 11.1025390625, 12.986328125, 14.8701171875, 16.75390625, 18.6376953125, 20.521484375, 22.4052734375, 24.2890625, 26.1728515625, 28.056640625, 29.9404296875, 31.82421875, 33.7080078125, 35.591796875, 37.4755859375, 39.359375, 41.2431640625, 43.126953125, 45.0107421875, 46.89453125, 48.7783203125, 50.662109375, 52.5458984375, 54.4296875, 56.3134765625, 58.197265625, 60.0810546875, 61.96484375, 63.8486328125, 65.732421875, 67.6162109375, 69.5]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 6.0, 6.0, 9.0, 3.0, 11.0, 6.0, 12.0, 17.0, 14.0, 22.0, 38.0, 55.0, 95.0, 126.0, 190.0, 423.0, 1049.0, 5915.0, 3132303.0, 3591.0, 869.0, 374.0, 204.0, 115.0, 71.0, 38.0, 32.0, 29.0, 23.0, 21.0, 11.0, 13.0, 4.0, 2.0, 4.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-341.25, -332.80859375, -324.3671875, -315.92578125, -307.484375, -299.04296875, -290.6015625, -282.16015625, -273.71875, -265.27734375, -256.8359375, -248.39453125, -239.953125, -231.51171875, -223.0703125, -214.62890625, -206.1875, -197.74609375, -189.3046875, -180.86328125, -172.421875, -163.98046875, -155.5390625, -147.09765625, -138.65625, -130.21484375, -121.7734375, -113.33203125, -104.890625, -96.44921875, -88.0078125, -79.56640625, -71.125, -62.68359375, -54.2421875, -45.80078125, -37.359375, -28.91796875, -20.4765625, -12.03515625, -3.59375, 4.84765625, 13.2890625, 21.73046875, 30.171875, 38.61328125, 47.0546875, 55.49609375, 63.9375, 72.37890625, 80.8203125, 89.26171875, 97.703125, 106.14453125, 114.5859375, 123.02734375, 131.46875, 139.91015625, 148.3515625, 156.79296875, 165.234375, 173.67578125, 182.1171875, 190.55859375, 199.0]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 16.0, 135.0, 497.0, 296.0, 55.0, 12.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-255.23687744140625, -242.28587341308594, -229.33486938476562, -216.38388061523438, -203.43287658691406, -190.48187255859375, -177.5308837890625, -164.5798797607422, -151.62887573242188, -138.67787170410156, -125.72687530517578, -112.77587890625, -99.82487487792969, -86.87387084960938, -73.9228744506836, -60.97187805175781, -48.0208740234375, -35.06987380981445, -22.118873596191406, -9.16787338256836, 3.7831268310546875, 16.734130859375, 29.68512725830078, 42.63612365722656, 55.587127685546875, 68.53813171386719, 81.48912811279297, 94.44012451171875, 107.39112854003906, 120.34213256835938, 133.29312133789062, 146.24412536621094, 159.19512939453125, 172.14613342285156, 185.09713745117188, 198.04812622070312, 210.99913024902344, 223.95013427734375, 236.901123046875, 249.8521270751953, 262.8031311035156, 275.7541198730469, 288.70513916015625, 301.6561279296875, 314.60711669921875, 327.5581359863281, 340.5091247558594, 353.46014404296875, 366.4111328125, 379.36212158203125, 392.3131408691406, 405.2641296386719, 418.21514892578125, 431.1661376953125, 444.11712646484375, 457.068115234375, 470.0191345214844, 482.9701232910156, 495.921142578125, 508.87213134765625, 521.8231201171875, 534.774169921875, 547.7251586914062, 560.6761474609375, 573.6271362304688]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 1.0, 6.0, 4.0, 6.0, 5.0, 11.0, 6.0, 12.0, 11.0, 10.0, 17.0, 20.0, 20.0, 20.0, 21.0, 28.0, 36.0, 34.0, 37.0, 21.0, 39.0, 34.0, 31.0, 37.0, 28.0, 48.0, 38.0, 36.0, 36.0, 37.0, 43.0, 34.0, 28.0, 28.0, 32.0, 17.0, 9.0, 14.0, 17.0, 14.0, 13.0, 10.0, 10.0, 10.0, 8.0, 10.0, 3.0, 5.0, 3.0, 7.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-136.9477081298828, -132.6690216064453, -128.39035034179688, -124.11166381835938, -119.83297729492188, -115.55429077148438, -111.2756118774414, -106.99693298339844, -102.71824645996094, -98.43955993652344, -94.16088104248047, -89.8822021484375, -85.603515625, -81.3248291015625, -77.04615020751953, -72.76747131347656, -68.48878479003906, -64.21009826660156, -59.931419372558594, -55.65273666381836, -51.374053955078125, -47.09537124633789, -42.816688537597656, -38.53800582885742, -34.25932312011719, -29.980640411376953, -25.70195770263672, -21.423274993896484, -17.14459228515625, -12.865909576416016, -8.587226867675781, -4.308544158935547, -0.029876708984375, 4.248805999755859, 8.527488708496094, 12.806171417236328, 17.084854125976562, 21.363536834716797, 25.64221954345703, 29.920902252197266, 34.1995849609375, 38.478267669677734, 42.75695037841797, 47.0356330871582, 51.31431579589844, 55.59299850463867, 59.871681213378906, 64.15036010742188, 68.42904663085938, 72.70773315429688, 76.98641204833984, 81.26509094238281, 85.54377746582031, 89.82246398925781, 94.10114288330078, 98.37982177734375, 102.65850830078125, 106.93719482421875, 111.21587371826172, 115.49455261230469, 119.77323913574219, 124.05192565917969, 128.33059692382812, 132.60928344726562, 136.88796997070312]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 5.0, 4.0, 3.0, 4.0, 14.0, 10.0, 14.0, 15.0, 17.0, 25.0, 19.0, 14.0, 21.0, 31.0, 24.0, 41.0, 33.0, 50.0, 36.0, 53.0, 43.0, 44.0, 48.0, 30.0, 41.0, 40.0, 41.0, 46.0, 32.0, 30.0, 28.0, 22.0, 21.0, 17.0, 20.0, 11.0, 16.0, 8.0, 5.0, 6.0, 5.0, 4.0, 4.0, 5.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-25.125, -24.2158203125, -23.306640625, -22.3974609375, -21.48828125, -20.5791015625, -19.669921875, -18.7607421875, -17.8515625, -16.9423828125, -16.033203125, -15.1240234375, -14.21484375, -13.3056640625, -12.396484375, -11.4873046875, -10.578125, -9.6689453125, -8.759765625, -7.8505859375, -6.94140625, -6.0322265625, -5.123046875, -4.2138671875, -3.3046875, -2.3955078125, -1.486328125, -0.5771484375, 0.33203125, 1.2412109375, 2.150390625, 3.0595703125, 3.96875, 4.8779296875, 5.787109375, 6.6962890625, 7.60546875, 8.5146484375, 9.423828125, 10.3330078125, 11.2421875, 12.1513671875, 13.060546875, 13.9697265625, 14.87890625, 15.7880859375, 16.697265625, 17.6064453125, 18.515625, 19.4248046875, 20.333984375, 21.2431640625, 22.15234375, 23.0615234375, 23.970703125, 24.8798828125, 25.7890625, 26.6982421875, 27.607421875, 28.5166015625, 29.42578125, 30.3349609375, 31.244140625, 32.1533203125, 33.0625]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 4.0, 4.0, 10.0, 13.0, 7.0, 18.0, 13.0, 17.0, 35.0, 39.0, 35.0, 38.0, 40.0, 63.0, 69.0, 99.0, 127.0, 267.0, 437.0, 927.0, 2236.0, 5782.0, 22908.0, 259916.0, 3150781.0, 698091.0, 39263.0, 7654.0, 2717.0, 1126.0, 546.0, 301.0, 174.0, 115.0, 95.0, 64.0, 35.0, 47.0, 28.0, 32.0, 25.0, 21.0, 13.0, 9.0, 11.0, 8.0, 7.0, 4.0, 0.0, 2.0, 5.0, 1.0, 5.0, 2.0, 2.0, 1.0, 2.0], "bins": [-69.125, -66.94140625, -64.7578125, -62.57421875, -60.390625, -58.20703125, -56.0234375, -53.83984375, -51.65625, -49.47265625, -47.2890625, -45.10546875, -42.921875, -40.73828125, -38.5546875, -36.37109375, -34.1875, -32.00390625, -29.8203125, -27.63671875, -25.453125, -23.26953125, -21.0859375, -18.90234375, -16.71875, -14.53515625, -12.3515625, -10.16796875, -7.984375, -5.80078125, -3.6171875, -1.43359375, 0.75, 2.93359375, 5.1171875, 7.30078125, 9.484375, 11.66796875, 13.8515625, 16.03515625, 18.21875, 20.40234375, 22.5859375, 24.76953125, 26.953125, 29.13671875, 31.3203125, 33.50390625, 35.6875, 37.87109375, 40.0546875, 42.23828125, 44.421875, 46.60546875, 48.7890625, 50.97265625, 53.15625, 55.33984375, 57.5234375, 59.70703125, 61.890625, 64.07421875, 66.2578125, 68.44140625, 70.625]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 2.0, 14.0, 17.0, 21.0, 45.0, 52.0, 74.0, 122.0, 188.0, 328.0, 566.0, 877.0, 724.0, 391.0, 232.0, 158.0, 88.0, 66.0, 42.0, 15.0, 16.0, 9.0, 11.0, 4.0, 5.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.875, -66.947265625, -65.01953125, -63.091796875, -61.1640625, -59.236328125, -57.30859375, -55.380859375, -53.453125, -51.525390625, -49.59765625, -47.669921875, -45.7421875, -43.814453125, -41.88671875, -39.958984375, -38.03125, -36.103515625, -34.17578125, -32.248046875, -30.3203125, -28.392578125, -26.46484375, -24.537109375, -22.609375, -20.681640625, -18.75390625, -16.826171875, -14.8984375, -12.970703125, -11.04296875, -9.115234375, -7.1875, -5.259765625, -3.33203125, -1.404296875, 0.5234375, 2.451171875, 4.37890625, 6.306640625, 8.234375, 10.162109375, 12.08984375, 14.017578125, 15.9453125, 17.873046875, 19.80078125, 21.728515625, 23.65625, 25.583984375, 27.51171875, 29.439453125, 31.3671875, 33.294921875, 35.22265625, 37.150390625, 39.078125, 41.005859375, 42.93359375, 44.861328125, 46.7890625, 48.716796875, 50.64453125, 52.572265625, 54.5]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 8.0, 7.0, 15.0, 24.0, 18.0, 48.0, 98.0, 169.0, 335.0, 943.0, 3747.0, 29088.0, 3639892.0, 502791.0, 13521.0, 2249.0, 711.0, 271.0, 158.0, 69.0, 44.0, 34.0, 19.0, 4.0, 8.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-136.75, -132.16796875, -127.5859375, -123.00390625, -118.421875, -113.83984375, -109.2578125, -104.67578125, -100.09375, -95.51171875, -90.9296875, -86.34765625, -81.765625, -77.18359375, -72.6015625, -68.01953125, -63.4375, -58.85546875, -54.2734375, -49.69140625, -45.109375, -40.52734375, -35.9453125, -31.36328125, -26.78125, -22.19921875, -17.6171875, -13.03515625, -8.453125, -3.87109375, 0.7109375, 5.29296875, 9.875, 14.45703125, 19.0390625, 23.62109375, 28.203125, 32.78515625, 37.3671875, 41.94921875, 46.53125, 51.11328125, 55.6953125, 60.27734375, 64.859375, 69.44140625, 74.0234375, 78.60546875, 83.1875, 87.76953125, 92.3515625, 96.93359375, 101.515625, 106.09765625, 110.6796875, 115.26171875, 119.84375, 124.42578125, 129.0078125, 133.58984375, 138.171875, 142.75390625, 147.3359375, 151.91796875, 156.5]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 7.0, 26.0, 173.0, 696.0, 101.0, 13.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-271.91302490234375, -239.56765747070312, -207.2222900390625, -174.87693786621094, -142.5315704345703, -110.18620300292969, -77.84085083007812, -45.4954833984375, -13.150115966796875, 19.195247650146484, 51.540611267089844, 83.88597106933594, 116.23133850097656, 148.5767059326172, 180.92205810546875, 213.26742553710938, 245.61279296875, 277.9581604003906, 310.30352783203125, 342.64886474609375, 374.9942626953125, 407.339599609375, 439.6849670410156, 472.03033447265625, 504.3757019042969, 536.7210693359375, 569.06640625, 601.4118041992188, 633.7571411132812, 666.1025390625, 698.4478759765625, 730.793212890625, 763.1385498046875, 795.48388671875, 827.8292846679688, 860.1746215820312, 892.52001953125, 924.8653564453125, 957.210693359375, 989.5560913085938, 1021.9014892578125, 1054.246826171875, 1086.5921630859375, 1118.9376220703125, 1151.282958984375, 1183.6282958984375, 1215.9736328125, 1248.319091796875, 1280.664306640625, 1313.0096435546875, 1345.35498046875, 1377.700439453125, 1410.0457763671875, 1442.39111328125, 1474.7364501953125, 1507.081787109375, 1539.42724609375, 1571.7725830078125, 1604.117919921875, 1636.46337890625, 1668.8087158203125, 1701.154052734375, 1733.4993896484375, 1765.8447265625, 1798.190185546875]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 2.0, 7.0, 8.0, 5.0, 10.0, 15.0, 10.0, 12.0, 9.0, 17.0, 20.0, 26.0, 36.0, 29.0, 29.0, 35.0, 38.0, 40.0, 39.0, 38.0, 42.0, 42.0, 50.0, 28.0, 40.0, 36.0, 44.0, 37.0, 36.0, 22.0, 25.0, 24.0, 27.0, 24.0, 24.0, 13.0, 18.0, 12.0, 5.0, 6.0, 6.0, 5.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-160.9530029296875, -156.26988220214844, -151.58677673339844, -146.90365600585938, -142.22055053710938, -137.5374298095703, -132.8543243408203, -128.17120361328125, -123.48809051513672, -118.80497741699219, -114.12186431884766, -109.43875122070312, -104.75563049316406, -100.07252502441406, -95.389404296875, -90.70629119873047, -86.02317810058594, -81.3400650024414, -76.65695190429688, -71.97383880615234, -67.29072570800781, -62.607608795166016, -57.92449188232422, -53.24137878417969, -48.558265686035156, -43.875152587890625, -39.192039489746094, -34.5089225769043, -29.825809478759766, -25.142696380615234, -20.45958137512207, -15.776466369628906, -11.093368530273438, -6.41025447845459, -1.7271404266357422, 2.9559736251831055, 7.639087677001953, 12.322200775146484, 17.00531578063965, 21.688430786132812, 26.371543884277344, 31.054656982421875, 35.737770080566406, 40.4208869934082, 45.104000091552734, 49.787113189697266, 54.47023010253906, 59.153343200683594, 63.836456298828125, 68.51956939697266, 73.20268249511719, 77.88579559326172, 82.56890869140625, 87.25202941894531, 91.93514251708984, 96.61825561523438, 101.3013687133789, 105.98448181152344, 110.66759490966797, 115.3507080078125, 120.03382873535156, 124.71693420410156, 129.40005493164062, 134.08316040039062, 138.7662811279297]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 7.0, 14.0, 5.0, 10.0, 12.0, 14.0, 20.0, 21.0, 26.0, 24.0, 27.0, 26.0, 40.0, 33.0, 41.0, 42.0, 46.0, 38.0, 31.0, 49.0, 42.0, 52.0, 45.0, 39.0, 40.0, 38.0, 33.0, 31.0, 27.0, 23.0, 14.0, 22.0, 16.0, 10.0, 5.0, 13.0, 6.0, 9.0, 3.0, 3.0, 6.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.890625, -23.07861328125, -22.2666015625, -21.45458984375, -20.642578125, -19.83056640625, -19.0185546875, -18.20654296875, -17.39453125, -16.58251953125, -15.7705078125, -14.95849609375, -14.146484375, -13.33447265625, -12.5224609375, -11.71044921875, -10.8984375, -10.08642578125, -9.2744140625, -8.46240234375, -7.650390625, -6.83837890625, -6.0263671875, -5.21435546875, -4.40234375, -3.59033203125, -2.7783203125, -1.96630859375, -1.154296875, -0.34228515625, 0.4697265625, 1.28173828125, 2.09375, 2.90576171875, 3.7177734375, 4.52978515625, 5.341796875, 6.15380859375, 6.9658203125, 7.77783203125, 8.58984375, 9.40185546875, 10.2138671875, 11.02587890625, 11.837890625, 12.64990234375, 13.4619140625, 14.27392578125, 15.0859375, 15.89794921875, 16.7099609375, 17.52197265625, 18.333984375, 19.14599609375, 19.9580078125, 20.77001953125, 21.58203125, 22.39404296875, 23.2060546875, 24.01806640625, 24.830078125, 25.64208984375, 26.4541015625, 27.26611328125, 28.078125]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 7.0, 11.0, 5.0, 13.0, 22.0, 29.0, 41.0, 64.0, 63.0, 128.0, 208.0, 259.0, 424.0, 627.0, 809.0, 1393.0, 2103.0, 3187.0, 4923.0, 7621.0, 11903.0, 18868.0, 30126.0, 50344.0, 87735.0, 160336.0, 247026.0, 177929.0, 97002.0, 55335.0, 33062.0, 20215.0, 12896.0, 8143.0, 5321.0, 3565.0, 2318.0, 1559.0, 1002.0, 659.0, 444.0, 284.0, 185.0, 135.0, 73.0, 62.0, 34.0, 26.0, 15.0, 9.0, 6.0, 3.0, 7.0, 3.0, 0.0, 0.0, 2.0], "bins": [-1.259765625, -1.222259521484375, -1.18475341796875, -1.147247314453125, -1.1097412109375, -1.072235107421875, -1.03472900390625, -0.997222900390625, -0.959716796875, -0.922210693359375, -0.88470458984375, -0.847198486328125, -0.8096923828125, -0.772186279296875, -0.73468017578125, -0.697174072265625, -0.65966796875, -0.622161865234375, -0.58465576171875, -0.547149658203125, -0.5096435546875, -0.472137451171875, -0.43463134765625, -0.397125244140625, -0.359619140625, -0.322113037109375, -0.28460693359375, -0.247100830078125, -0.2095947265625, -0.172088623046875, -0.13458251953125, -0.097076416015625, -0.0595703125, -0.022064208984375, 0.01544189453125, 0.052947998046875, 0.0904541015625, 0.127960205078125, 0.16546630859375, 0.202972412109375, 0.240478515625, 0.277984619140625, 0.31549072265625, 0.352996826171875, 0.3905029296875, 0.428009033203125, 0.46551513671875, 0.503021240234375, 0.54052734375, 0.578033447265625, 0.61553955078125, 0.653045654296875, 0.6905517578125, 0.728057861328125, 0.76556396484375, 0.803070068359375, 0.840576171875, 0.878082275390625, 0.91558837890625, 0.953094482421875, 0.9906005859375, 1.028106689453125, 1.06561279296875, 1.103118896484375, 1.140625]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 7.0, 15.0, 14.0, 8.0, 16.0, 16.0, 19.0, 24.0, 20.0, 27.0, 32.0, 26.0, 34.0, 35.0, 27.0, 42.0, 35.0, 36.0, 47.0, 1061.0, 43.0, 33.0, 38.0, 28.0, 37.0, 30.0, 32.0, 20.0, 34.0, 31.0, 28.0, 16.0, 20.0, 14.0, 17.0, 12.0, 9.0, 12.0, 3.0, 8.0, 5.0, 4.0, 6.0, 3.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.734375, -13.26416015625, -12.7939453125, -12.32373046875, -11.853515625, -11.38330078125, -10.9130859375, -10.44287109375, -9.97265625, -9.50244140625, -9.0322265625, -8.56201171875, -8.091796875, -7.62158203125, -7.1513671875, -6.68115234375, -6.2109375, -5.74072265625, -5.2705078125, -4.80029296875, -4.330078125, -3.85986328125, -3.3896484375, -2.91943359375, -2.44921875, -1.97900390625, -1.5087890625, -1.03857421875, -0.568359375, -0.09814453125, 0.3720703125, 0.84228515625, 1.3125, 1.78271484375, 2.2529296875, 2.72314453125, 3.193359375, 3.66357421875, 4.1337890625, 4.60400390625, 5.07421875, 5.54443359375, 6.0146484375, 6.48486328125, 6.955078125, 7.42529296875, 7.8955078125, 8.36572265625, 8.8359375, 9.30615234375, 9.7763671875, 10.24658203125, 10.716796875, 11.18701171875, 11.6572265625, 12.12744140625, 12.59765625, 13.06787109375, 13.5380859375, 14.00830078125, 14.478515625, 14.94873046875, 15.4189453125, 15.88916015625, 16.359375]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 11.0, 13.0, 15.0, 27.0, 36.0, 58.0, 107.0, 151.0, 189.0, 238.0, 440.0, 604.0, 907.0, 1286.0, 1831.0, 2721.0, 3841.0, 5520.0, 7711.0, 11143.0, 16315.0, 24166.0, 35887.0, 55583.0, 87280.0, 143705.0, 1253959.0, 161161.0, 97957.0, 60653.0, 39631.0, 26305.0, 17600.0, 12198.0, 8513.0, 5906.0, 4125.0, 2920.0, 2012.0, 1444.0, 922.0, 607.0, 484.0, 340.0, 207.0, 135.0, 98.0, 69.0, 30.0, 30.0, 16.0, 11.0, 7.0, 5.0, 6.0, 2.0, 0.0, 1.0], "bins": [-0.93115234375, -0.9026031494140625, -0.874053955078125, -0.8455047607421875, -0.81695556640625, -0.7884063720703125, -0.759857177734375, -0.7313079833984375, -0.7027587890625, -0.6742095947265625, -0.645660400390625, -0.6171112060546875, -0.58856201171875, -0.5600128173828125, -0.531463623046875, -0.5029144287109375, -0.474365234375, -0.4458160400390625, -0.417266845703125, -0.3887176513671875, -0.36016845703125, -0.3316192626953125, -0.303070068359375, -0.2745208740234375, -0.2459716796875, -0.2174224853515625, -0.188873291015625, -0.1603240966796875, -0.13177490234375, -0.1032257080078125, -0.074676513671875, -0.0461273193359375, -0.017578125, 0.0109710693359375, 0.039520263671875, 0.0680694580078125, 0.09661865234375, 0.1251678466796875, 0.153717041015625, 0.1822662353515625, 0.2108154296875, 0.2393646240234375, 0.267913818359375, 0.2964630126953125, 0.32501220703125, 0.3535614013671875, 0.382110595703125, 0.4106597900390625, 0.439208984375, 0.4677581787109375, 0.496307373046875, 0.5248565673828125, 0.55340576171875, 0.5819549560546875, 0.610504150390625, 0.6390533447265625, 0.6676025390625, 0.6961517333984375, 0.724700927734375, 0.7532501220703125, 0.78179931640625, 0.8103485107421875, 0.838897705078125, 0.8674468994140625, 0.89599609375]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 11.0, 3.0, 9.0, 11.0, 14.0, 15.0, 11.0, 18.0, 25.0, 30.0, 33.0, 38.0, 39.0, 40.0, 69.0, 64.0, 69.0, 66.0, 67.0, 50.0, 51.0, 52.0, 36.0, 35.0, 35.0, 23.0, 20.0, 22.0, 14.0, 8.0, 11.0, 2.0, 4.0, 2.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.005615234375, -0.0054631829261779785, -0.005311131477355957, -0.0051590800285339355, -0.005007028579711914, -0.004854977130889893, -0.004702925682067871, -0.00455087423324585, -0.004398822784423828, -0.004246771335601807, -0.004094719886779785, -0.003942668437957764, -0.003790616989135742, -0.0036385655403137207, -0.0034865140914916992, -0.0033344626426696777, -0.0031824111938476562, -0.0030303597450256348, -0.0028783082962036133, -0.002726256847381592, -0.0025742053985595703, -0.002422153949737549, -0.0022701025009155273, -0.002118051052093506, -0.0019659996032714844, -0.0018139481544494629, -0.0016618967056274414, -0.00150984525680542, -0.0013577938079833984, -0.001205742359161377, -0.0010536909103393555, -0.000901639461517334, -0.0007495880126953125, -0.000597536563873291, -0.00044548511505126953, -0.00029343366622924805, -0.00014138221740722656, 1.0669231414794922e-05, 0.0001627206802368164, 0.0003147721290588379, 0.0004668235778808594, 0.0006188750267028809, 0.0007709264755249023, 0.0009229779243469238, 0.0010750293731689453, 0.0012270808219909668, 0.0013791322708129883, 0.0015311837196350098, 0.0016832351684570312, 0.0018352866172790527, 0.0019873380661010742, 0.0021393895149230957, 0.002291440963745117, 0.0024434924125671387, 0.00259554386138916, 0.0027475953102111816, 0.002899646759033203, 0.0030516982078552246, 0.003203749656677246, 0.0033558011054992676, 0.003507852554321289, 0.0036599040031433105, 0.003811955451965332, 0.0039640069007873535, 0.004116058349609375]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 5.0, 1.0, 1.0, 5.0, 3.0, 4.0, 6.0, 10.0, 12.0, 14.0, 13.0, 28.0, 31.0, 45.0, 64.0, 63.0, 98.0, 119.0, 188.0, 247.0, 491.0, 1248.0, 78809.0, 961902.0, 3344.0, 700.0, 323.0, 207.0, 146.0, 91.0, 86.0, 50.0, 49.0, 33.0, 32.0, 21.0, 21.0, 18.0, 10.0, 9.0, 5.0, 5.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07342529296875, -0.07062530517578125, -0.0678253173828125, -0.06502532958984375, -0.062225341796875, -0.05942535400390625, -0.0566253662109375, -0.05382537841796875, -0.051025390625, -0.04822540283203125, -0.0454254150390625, -0.04262542724609375, -0.039825439453125, -0.03702545166015625, -0.0342254638671875, -0.03142547607421875, -0.02862548828125, -0.02582550048828125, -0.0230255126953125, -0.02022552490234375, -0.017425537109375, -0.01462554931640625, -0.0118255615234375, -0.00902557373046875, -0.0062255859375, -0.00342559814453125, -0.0006256103515625, 0.00217437744140625, 0.004974365234375, 0.00777435302734375, 0.0105743408203125, 0.01337432861328125, 0.01617431640625, 0.01897430419921875, 0.0217742919921875, 0.02457427978515625, 0.027374267578125, 0.03017425537109375, 0.0329742431640625, 0.03577423095703125, 0.03857421875, 0.04137420654296875, 0.0441741943359375, 0.04697418212890625, 0.049774169921875, 0.05257415771484375, 0.0553741455078125, 0.05817413330078125, 0.06097412109375, 0.06377410888671875, 0.0665740966796875, 0.06937408447265625, 0.072174072265625, 0.07497406005859375, 0.0777740478515625, 0.08057403564453125, 0.0833740234375, 0.08617401123046875, 0.0889739990234375, 0.09177398681640625, 0.094573974609375, 0.09737396240234375, 0.1001739501953125, 0.10297393798828125, 0.10577392578125]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 18.0, 90.0, 461.0, 360.0, 66.0, 13.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.007264423184096813, -0.0068797217682003975, -0.006495020352303982, -0.006110318936407566, -0.00572561752051115, -0.005340916104614735, -0.004956214688718319, -0.004571513272821903, -0.0041868118569254875, -0.003802110441029072, -0.003417409025132656, -0.0030327076092362404, -0.0026480061933398247, -0.002263304777443409, -0.0018786033615469933, -0.0014939019456505775, -0.0011092005297541618, -0.0007244991138577461, -0.0003397976979613304, 4.49037179350853e-05, 0.000429605133831501, 0.0008143065497279167, 0.0011990079656243324, 0.0015837093815207481, 0.001968410797417164, 0.0023531122133135796, 0.0027378136292099953, 0.003122515045106411, 0.0035072164610028267, 0.0038919178768992424, 0.004276619292795658, 0.004661320708692074, 0.005046021193265915, 0.005430722609162331, 0.005815424025058746, 0.006200125440955162, 0.006584826856851578, 0.0069695282727479935, 0.007354229688644409, 0.007738931104540825, 0.00812363252043724, 0.008508333936333656, 0.008893035352230072, 0.009277736768126488, 0.009662438184022903, 0.01004713959991932, 0.010431841015815735, 0.01081654243171215, 0.011201243847608566, 0.011585945263504982, 0.011970646679401398, 0.012355348095297813, 0.012740049511194229, 0.013124750927090645, 0.01350945234298706, 0.013894153758883476, 0.014278855174779892, 0.014663556590676308, 0.015048258006572723, 0.015432959422469139, 0.015817660838365555, 0.01620236225426197, 0.016587063670158386, 0.016971765086054802, 0.017356466501951218]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 11.0, 5.0, 3.0, 10.0, 13.0, 13.0, 15.0, 13.0, 20.0, 16.0, 14.0, 22.0, 24.0, 35.0, 34.0, 44.0, 37.0, 35.0, 27.0, 36.0, 32.0, 29.0, 39.0, 35.0, 34.0, 41.0, 39.0, 32.0, 32.0, 32.0, 36.0, 26.0, 29.0, 23.0, 13.0, 21.0, 12.0, 14.0, 14.0, 8.0, 7.0, 1.0, 5.0, 7.0, 6.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.002219557762145996, -0.002150637097656727, -0.0020817164331674576, -0.0020127957686781883, -0.001943875104188919, -0.0018749544396996498, -0.0018060337752103806, -0.0017371131107211113, -0.001668192446231842, -0.0015992717817425728, -0.0015303511172533035, -0.0014614304527640343, -0.001392509788274765, -0.0013235891237854958, -0.0012546684592962265, -0.0011857477948069572, -0.001116827130317688, -0.0010479064658284187, -0.0009789858013391495, -0.0009100651368498802, -0.000841144472360611, -0.0007722238078713417, -0.0007033031433820724, -0.0006343824788928032, -0.0005654618144035339, -0.0004965411499142647, -0.0004276204854249954, -0.00035869982093572617, -0.0002897791564464569, -0.00022085849195718765, -0.0001519378274679184, -8.301716297864914e-05, -1.4096498489379883e-05, 5.4824165999889374e-05, 0.00012374483048915863, 0.0001926654949784279, 0.00026158615946769714, 0.0003305068239569664, 0.00039942748844623566, 0.0004683481529355049, 0.0005372688174247742, 0.0006061894819140434, 0.0006751101464033127, 0.0007440308108925819, 0.0008129514753818512, 0.0008818721398711205, 0.0009507928043603897, 0.001019713468849659, 0.0010886341333389282, 0.0011575547978281975, 0.0012264754623174667, 0.001295396126806736, 0.0013643167912960052, 0.0014332374557852745, 0.0015021581202745438, 0.001571078784763813, 0.0016399994492530823, 0.0017089201137423515, 0.0017778407782316208, 0.00184676144272089, 0.0019156821072101593, 0.0019846027716994286, 0.002053523436188698, 0.002122444100677967, 0.0021913647651672363]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 7.0, 14.0, 5.0, 10.0, 12.0, 14.0, 20.0, 21.0, 26.0, 24.0, 27.0, 26.0, 40.0, 32.0, 42.0, 42.0, 46.0, 38.0, 31.0, 49.0, 42.0, 52.0, 45.0, 39.0, 40.0, 38.0, 33.0, 31.0, 27.0, 22.0, 15.0, 22.0, 16.0, 10.0, 5.0, 13.0, 6.0, 9.0, 3.0, 3.0, 6.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.890625, -23.07861328125, -22.2666015625, -21.45458984375, -20.642578125, -19.83056640625, -19.0185546875, -18.20654296875, -17.39453125, -16.58251953125, -15.7705078125, -14.95849609375, -14.146484375, -13.33447265625, -12.5224609375, -11.71044921875, -10.8984375, -10.08642578125, -9.2744140625, -8.46240234375, -7.650390625, -6.83837890625, -6.0263671875, -5.21435546875, -4.40234375, -3.59033203125, -2.7783203125, -1.96630859375, -1.154296875, -0.34228515625, 0.4697265625, 1.28173828125, 2.09375, 2.90576171875, 3.7177734375, 4.52978515625, 5.341796875, 6.15380859375, 6.9658203125, 7.77783203125, 8.58984375, 9.40185546875, 10.2138671875, 11.02587890625, 11.837890625, 12.64990234375, 13.4619140625, 14.27392578125, 15.0859375, 15.89794921875, 16.7099609375, 17.52197265625, 18.333984375, 19.14599609375, 19.9580078125, 20.77001953125, 21.58203125, 22.39404296875, 23.2060546875, 24.01806640625, 24.830078125, 25.64208984375, 26.4541015625, 27.26611328125, 28.078125]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 5.0, 5.0, 0.0, 3.0, 6.0, 8.0, 9.0, 16.0, 38.0, 44.0, 55.0, 75.0, 74.0, 118.0, 145.0, 189.0, 272.0, 384.0, 578.0, 928.0, 1457.0, 2521.0, 5073.0, 11188.0, 30406.0, 117177.0, 600904.0, 202329.0, 44917.0, 15188.0, 6359.0, 3079.0, 1641.0, 1138.0, 640.0, 426.0, 331.0, 234.0, 137.0, 120.0, 82.0, 55.0, 55.0, 34.0, 33.0, 21.0, 13.0, 20.0, 11.0, 7.0, 9.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-33.65625, -32.48193359375, -31.3076171875, -30.13330078125, -28.958984375, -27.78466796875, -26.6103515625, -25.43603515625, -24.26171875, -23.08740234375, -21.9130859375, -20.73876953125, -19.564453125, -18.39013671875, -17.2158203125, -16.04150390625, -14.8671875, -13.69287109375, -12.5185546875, -11.34423828125, -10.169921875, -8.99560546875, -7.8212890625, -6.64697265625, -5.47265625, -4.29833984375, -3.1240234375, -1.94970703125, -0.775390625, 0.39892578125, 1.5732421875, 2.74755859375, 3.921875, 5.09619140625, 6.2705078125, 7.44482421875, 8.619140625, 9.79345703125, 10.9677734375, 12.14208984375, 13.31640625, 14.49072265625, 15.6650390625, 16.83935546875, 18.013671875, 19.18798828125, 20.3623046875, 21.53662109375, 22.7109375, 23.88525390625, 25.0595703125, 26.23388671875, 27.408203125, 28.58251953125, 29.7568359375, 30.93115234375, 32.10546875, 33.27978515625, 34.4541015625, 35.62841796875, 36.802734375, 37.97705078125, 39.1513671875, 40.32568359375, 41.5]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 6.0, 2.0, 2.0, 6.0, 7.0, 3.0, 15.0, 23.0, 24.0, 21.0, 29.0, 49.0, 42.0, 65.0, 68.0, 107.0, 342.0, 1650.0, 170.0, 87.0, 67.0, 48.0, 58.0, 39.0, 28.0, 20.0, 22.0, 12.0, 15.0, 6.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.25, -60.1181640625, -57.986328125, -55.8544921875, -53.72265625, -51.5908203125, -49.458984375, -47.3271484375, -45.1953125, -43.0634765625, -40.931640625, -38.7998046875, -36.66796875, -34.5361328125, -32.404296875, -30.2724609375, -28.140625, -26.0087890625, -23.876953125, -21.7451171875, -19.61328125, -17.4814453125, -15.349609375, -13.2177734375, -11.0859375, -8.9541015625, -6.822265625, -4.6904296875, -2.55859375, -0.4267578125, 1.705078125, 3.8369140625, 5.96875, 8.1005859375, 10.232421875, 12.3642578125, 14.49609375, 16.6279296875, 18.759765625, 20.8916015625, 23.0234375, 25.1552734375, 27.287109375, 29.4189453125, 31.55078125, 33.6826171875, 35.814453125, 37.9462890625, 40.078125, 42.2099609375, 44.341796875, 46.4736328125, 48.60546875, 50.7373046875, 52.869140625, 55.0009765625, 57.1328125, 59.2646484375, 61.396484375, 63.5283203125, 65.66015625, 67.7919921875, 69.923828125, 72.0556640625, 74.1875]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 3.0, 5.0, 10.0, 18.0, 24.0, 18.0, 48.0, 63.0, 69.0, 138.0, 276.0, 537.0, 1592.0, 347846.0, 2791889.0, 1841.0, 585.0, 295.0, 133.0, 120.0, 74.0, 42.0, 26.0, 16.0, 15.0, 9.0, 3.0, 2.0, 7.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-179.875, -174.59375, -169.3125, -164.03125, -158.75, -153.46875, -148.1875, -142.90625, -137.625, -132.34375, -127.0625, -121.78125, -116.5, -111.21875, -105.9375, -100.65625, -95.375, -90.09375, -84.8125, -79.53125, -74.25, -68.96875, -63.6875, -58.40625, -53.125, -47.84375, -42.5625, -37.28125, -32.0, -26.71875, -21.4375, -16.15625, -10.875, -5.59375, -0.3125, 4.96875, 10.25, 15.53125, 20.8125, 26.09375, 31.375, 36.65625, 41.9375, 47.21875, 52.5, 57.78125, 63.0625, 68.34375, 73.625, 78.90625, 84.1875, 89.46875, 94.75, 100.03125, 105.3125, 110.59375, 115.875, 121.15625, 126.4375, 131.71875, 137.0, 142.28125, 147.5625, 152.84375, 158.125]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 28.0, 588.0, 376.0, 22.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-584.1806030273438, -566.9111938476562, -549.6417846679688, -532.3723754882812, -515.1029663085938, -497.83355712890625, -480.56414794921875, -463.29473876953125, -446.02532958984375, -428.75592041015625, -411.48651123046875, -394.21710205078125, -376.94769287109375, -359.67828369140625, -342.40887451171875, -325.13946533203125, -307.87005615234375, -290.60064697265625, -273.33123779296875, -256.06182861328125, -238.79241943359375, -221.52301025390625, -204.25360107421875, -186.98419189453125, -169.71478271484375, -152.44537353515625, -135.17596435546875, -117.90655517578125, -100.63714599609375, -83.36773681640625, -66.09832763671875, -48.82891845703125, -31.5595703125, -14.2901611328125, 2.979248046875, 20.2486572265625, 37.51806640625, 54.7874755859375, 72.056884765625, 89.3262939453125, 106.595703125, 123.8651123046875, 141.134521484375, 158.4039306640625, 175.67333984375, 192.9427490234375, 210.212158203125, 227.4815673828125, 244.7509765625, 262.0203857421875, 279.289794921875, 296.5592041015625, 313.82861328125, 331.0980224609375, 348.367431640625, 365.6368408203125, 382.90625, 400.1756591796875, 417.445068359375, 434.7144775390625, 451.98388671875, 469.2532958984375, 486.522705078125, 503.7921142578125, 521.0615234375]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 6.0, 11.0, 2.0, 10.0, 11.0, 10.0, 21.0, 17.0, 22.0, 28.0, 22.0, 22.0, 30.0, 39.0, 40.0, 47.0, 33.0, 29.0, 42.0, 44.0, 39.0, 37.0, 37.0, 42.0, 44.0, 39.0, 35.0, 33.0, 26.0, 32.0, 35.0, 20.0, 18.0, 14.0, 15.0, 10.0, 9.0, 9.0, 5.0, 2.0, 3.0, 3.0, 5.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-101.70568084716797, -97.85025024414062, -93.99481964111328, -90.13938903808594, -86.28396606445312, -82.42853546142578, -78.57310485839844, -74.7176742553711, -70.86224365234375, -67.0068130493164, -63.15138626098633, -59.295955657958984, -55.440528869628906, -51.58509826660156, -47.72966766357422, -43.874237060546875, -40.01881408691406, -36.16338348388672, -32.30795669555664, -28.452526092529297, -24.597097396850586, -20.741668701171875, -16.88623809814453, -13.03080940246582, -9.17538070678711, -5.31995153427124, -1.464522361755371, 2.3909072875976562, 6.246335983276367, 10.101764678955078, 13.957195281982422, 17.812623977661133, 21.668060302734375, 25.523488998413086, 29.378917694091797, 33.23434829711914, 37.08977508544922, 40.94520568847656, 44.800636291503906, 48.65606689453125, 52.51149368286133, 56.36692428588867, 60.22235107421875, 64.0777816772461, 67.93321228027344, 71.78863525390625, 75.64407348632812, 79.49949645996094, 83.35492706298828, 87.21035766601562, 91.06578826904297, 94.92121887207031, 98.77664184570312, 102.63207244873047, 106.48750305175781, 110.34293365478516, 114.1983642578125, 118.05379486083984, 121.90922546386719, 125.7646484375, 129.62008666992188, 133.4755096435547, 137.3309326171875, 141.18637084960938, 145.0417938232422]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 2.0, 10.0, 13.0, 10.0, 12.0, 16.0, 17.0, 18.0, 23.0, 30.0, 33.0, 27.0, 33.0, 42.0, 37.0, 44.0, 50.0, 39.0, 39.0, 52.0, 42.0, 36.0, 47.0, 30.0, 33.0, 34.0, 33.0, 25.0, 31.0, 25.0, 20.0, 21.0, 14.0, 11.0, 10.0, 12.0, 9.0, 7.0, 5.0, 7.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.21875, -23.29736328125, -22.3759765625, -21.45458984375, -20.533203125, -19.61181640625, -18.6904296875, -17.76904296875, -16.84765625, -15.92626953125, -15.0048828125, -14.08349609375, -13.162109375, -12.24072265625, -11.3193359375, -10.39794921875, -9.4765625, -8.55517578125, -7.6337890625, -6.71240234375, -5.791015625, -4.86962890625, -3.9482421875, -3.02685546875, -2.10546875, -1.18408203125, -0.2626953125, 0.65869140625, 1.580078125, 2.50146484375, 3.4228515625, 4.34423828125, 5.265625, 6.18701171875, 7.1083984375, 8.02978515625, 8.951171875, 9.87255859375, 10.7939453125, 11.71533203125, 12.63671875, 13.55810546875, 14.4794921875, 15.40087890625, 16.322265625, 17.24365234375, 18.1650390625, 19.08642578125, 20.0078125, 20.92919921875, 21.8505859375, 22.77197265625, 23.693359375, 24.61474609375, 25.5361328125, 26.45751953125, 27.37890625, 28.30029296875, 29.2216796875, 30.14306640625, 31.064453125, 31.98583984375, 32.9072265625, 33.82861328125, 34.75]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 6.0, 8.0, 18.0, 13.0, 28.0, 41.0, 46.0, 66.0, 70.0, 114.0, 186.0, 230.0, 339.0, 489.0, 844.0, 1659.0, 3795.0, 10754.0, 44465.0, 2248876.0, 1828552.0, 36894.0, 9357.0, 3480.0, 1494.0, 804.0, 479.0, 308.0, 225.0, 155.0, 131.0, 100.0, 74.0, 45.0, 39.0, 21.0, 25.0, 21.0, 10.0, 5.0, 8.0, 2.0, 1.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-116.25, -111.7734375, -107.296875, -102.8203125, -98.34375, -93.8671875, -89.390625, -84.9140625, -80.4375, -75.9609375, -71.484375, -67.0078125, -62.53125, -58.0546875, -53.578125, -49.1015625, -44.625, -40.1484375, -35.671875, -31.1953125, -26.71875, -22.2421875, -17.765625, -13.2890625, -8.8125, -4.3359375, 0.140625, 4.6171875, 9.09375, 13.5703125, 18.046875, 22.5234375, 27.0, 31.4765625, 35.953125, 40.4296875, 44.90625, 49.3828125, 53.859375, 58.3359375, 62.8125, 67.2890625, 71.765625, 76.2421875, 80.71875, 85.1953125, 89.671875, 94.1484375, 98.625, 103.1015625, 107.578125, 112.0546875, 116.53125, 121.0078125, 125.484375, 129.9609375, 134.4375, 138.9140625, 143.390625, 147.8671875, 152.34375, 156.8203125, 161.296875, 165.7734375, 170.25]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 5.0, 2.0, 6.0, 4.0, 10.0, 14.0, 25.0, 38.0, 37.0, 66.0, 93.0, 197.0, 433.0, 1140.0, 1130.0, 411.0, 162.0, 111.0, 50.0, 48.0, 33.0, 15.0, 15.0, 14.0, 7.0, 3.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.9375, -78.3759765625, -74.814453125, -71.2529296875, -67.69140625, -64.1298828125, -60.568359375, -57.0068359375, -53.4453125, -49.8837890625, -46.322265625, -42.7607421875, -39.19921875, -35.6376953125, -32.076171875, -28.5146484375, -24.953125, -21.3916015625, -17.830078125, -14.2685546875, -10.70703125, -7.1455078125, -3.583984375, -0.0224609375, 3.5390625, 7.1005859375, 10.662109375, 14.2236328125, 17.78515625, 21.3466796875, 24.908203125, 28.4697265625, 32.03125, 35.5927734375, 39.154296875, 42.7158203125, 46.27734375, 49.8388671875, 53.400390625, 56.9619140625, 60.5234375, 64.0849609375, 67.646484375, 71.2080078125, 74.76953125, 78.3310546875, 81.892578125, 85.4541015625, 89.015625, 92.5771484375, 96.138671875, 99.7001953125, 103.26171875, 106.8232421875, 110.384765625, 113.9462890625, 117.5078125, 121.0693359375, 124.630859375, 128.1923828125, 131.75390625, 135.3154296875, 138.876953125, 142.4384765625, 146.0]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 0.0, 4.0, 2.0, 8.0, 7.0, 10.0, 20.0, 23.0, 53.0, 77.0, 126.0, 203.0, 274.0, 504.0, 957.0, 1741.0, 3306.0, 6786.0, 15507.0, 39942.0, 152622.0, 2858484.0, 963615.0, 96854.0, 29620.0, 11914.0, 5493.0, 2761.0, 1437.0, 749.0, 418.0, 285.0, 180.0, 108.0, 55.0, 36.0, 36.0, 24.0, 8.0, 11.0, 8.0, 8.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-74.6875, -72.3427734375, -69.998046875, -67.6533203125, -65.30859375, -62.9638671875, -60.619140625, -58.2744140625, -55.9296875, -53.5849609375, -51.240234375, -48.8955078125, -46.55078125, -44.2060546875, -41.861328125, -39.5166015625, -37.171875, -34.8271484375, -32.482421875, -30.1376953125, -27.79296875, -25.4482421875, -23.103515625, -20.7587890625, -18.4140625, -16.0693359375, -13.724609375, -11.3798828125, -9.03515625, -6.6904296875, -4.345703125, -2.0009765625, 0.34375, 2.6884765625, 5.033203125, 7.3779296875, 9.72265625, 12.0673828125, 14.412109375, 16.7568359375, 19.1015625, 21.4462890625, 23.791015625, 26.1357421875, 28.48046875, 30.8251953125, 33.169921875, 35.5146484375, 37.859375, 40.2041015625, 42.548828125, 44.8935546875, 47.23828125, 49.5830078125, 51.927734375, 54.2724609375, 56.6171875, 58.9619140625, 61.306640625, 63.6513671875, 65.99609375, 68.3408203125, 70.685546875, 73.0302734375, 75.375]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 8.0, 3.0, 4.0, 9.0, 7.0, 13.0, 18.0, 16.0, 37.0, 29.0, 42.0, 65.0, 105.0, 144.0, 131.0, 96.0, 68.0, 59.0, 34.0, 23.0, 20.0, 22.0, 8.0, 11.0, 14.0, 7.0, 4.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-446.7537841796875, -432.40869140625, -418.0636291503906, -403.7185363769531, -389.37347412109375, -375.02838134765625, -360.68328857421875, -346.3382263183594, -331.9931335449219, -317.6480407714844, -303.302978515625, -288.9578857421875, -274.6128234863281, -260.2677307128906, -245.9226531982422, -231.57757568359375, -217.2324981689453, -202.88742065429688, -188.54234313964844, -174.197265625, -159.8521728515625, -145.50709533691406, -131.16201782226562, -116.81693267822266, -102.47185516357422, -88.12677764892578, -73.78169250488281, -59.436614990234375, -45.09153366088867, -30.74645233154297, -16.40137481689453, -2.0562896728515625, 12.288787841796875, 26.633869171142578, 40.97895050048828, 55.32402801513672, 69.66911315917969, 84.01419067382812, 98.35926818847656, 112.70435333251953, 127.04943084716797, 141.39451599121094, 155.73959350585938, 170.0846710205078, 184.42974853515625, 198.77484130859375, 213.11990356445312, 227.46499633789062, 241.81007385253906, 256.1551513671875, 270.500244140625, 284.8453063964844, 299.1903991699219, 313.53546142578125, 327.88055419921875, 342.22564697265625, 356.5707092285156, 370.9158020019531, 385.2608642578125, 399.60595703125, 413.9510192871094, 428.2961120605469, 442.64117431640625, 456.98626708984375, 471.33135986328125]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 4.0, 5.0, 8.0, 11.0, 12.0, 14.0, 16.0, 16.0, 13.0, 26.0, 26.0, 20.0, 25.0, 32.0, 38.0, 35.0, 48.0, 38.0, 53.0, 37.0, 38.0, 34.0, 39.0, 44.0, 32.0, 52.0, 26.0, 30.0, 31.0, 44.0, 28.0, 17.0, 18.0, 11.0, 13.0, 18.0, 11.0, 6.0, 4.0, 7.0, 5.0, 5.0, 4.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-283.0593566894531, -274.0446472167969, -265.02996826171875, -256.0152587890625, -247.00057983398438, -237.98587036132812, -228.97117614746094, -219.95648193359375, -210.94178771972656, -201.92709350585938, -192.9123992919922, -183.897705078125, -174.88299560546875, -165.86831665039062, -156.85360717773438, -147.8389129638672, -138.82421875, -129.8095245361328, -120.79483032226562, -111.7801284790039, -102.76543426513672, -93.75074005126953, -84.73603820800781, -75.72134399414062, -66.70664978027344, -57.69195556640625, -48.6772575378418, -39.662559509277344, -30.647865295410156, -21.63317108154297, -12.618473052978516, -3.6037750244140625, 5.41094970703125, 14.42564582824707, 23.44034194946289, 32.455039978027344, 41.46973419189453, 50.48442840576172, 59.49912643432617, 68.51382446289062, 77.52851867675781, 86.543212890625, 95.55790710449219, 104.5726089477539, 113.5873031616211, 122.60199737548828, 131.61669921875, 140.6313934326172, 149.64608764648438, 158.66078186035156, 167.67547607421875, 176.69017028808594, 185.70486450195312, 194.71957397460938, 203.73426818847656, 212.74896240234375, 221.76365661621094, 230.77835083007812, 239.7930450439453, 248.8077392578125, 257.82244873046875, 266.8371276855469, 275.8518371582031, 284.86651611328125, 293.8812255859375]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 4.0, 1.0, 5.0, 6.0, 10.0, 15.0, 6.0, 17.0, 19.0, 16.0, 14.0, 26.0, 22.0, 28.0, 21.0, 40.0, 37.0, 47.0, 48.0, 41.0, 49.0, 45.0, 45.0, 40.0, 39.0, 38.0, 44.0, 38.0, 30.0, 28.0, 43.0, 30.0, 20.0, 14.0, 10.0, 13.0, 14.0, 9.0, 6.0, 7.0, 7.0, 2.0, 4.0, 4.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-520.5, -504.046875, -487.59375, -471.140625, -454.6875, -438.234375, -421.78125, -405.328125, -388.875, -372.421875, -355.96875, -339.515625, -323.0625, -306.609375, -290.15625, -273.703125, -257.25, -240.796875, -224.34375, -207.890625, -191.4375, -174.984375, -158.53125, -142.078125, -125.625, -109.171875, -92.71875, -76.265625, -59.8125, -43.359375, -26.90625, -10.453125, 6.0, 22.453125, 38.90625, 55.359375, 71.8125, 88.265625, 104.71875, 121.171875, 137.625, 154.078125, 170.53125, 186.984375, 203.4375, 219.890625, 236.34375, 252.796875, 269.25, 285.703125, 302.15625, 318.609375, 335.0625, 351.515625, 367.96875, 384.421875, 400.875, 417.328125, 433.78125, 450.234375, 466.6875, 483.140625, 499.59375, 516.046875, 532.5]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 6.0, 1.0, 10.0, 13.0, 22.0, 32.0, 36.0, 48.0, 75.0, 113.0, 151.0, 217.0, 268.0, 449.0, 567.0, 857.0, 1153.0, 1691.0, 2406.0, 3543.0, 5058.0, 7446.0, 10813.0, 16692.0, 25385.0, 41282.0, 69844.0, 127106.0, 240968.0, 212120.0, 110619.0, 62207.0, 36922.0, 23075.0, 15331.0, 9992.0, 6746.0, 4593.0, 3139.0, 2275.0, 1584.0, 1046.0, 803.0, 527.0, 416.0, 270.0, 183.0, 142.0, 95.0, 74.0, 46.0, 32.0, 18.0, 25.0, 12.0, 6.0, 4.0, 6.0, 2.0, 4.0, 3.0], "bins": [-27.0, -26.1533203125, -25.306640625, -24.4599609375, -23.61328125, -22.7666015625, -21.919921875, -21.0732421875, -20.2265625, -19.3798828125, -18.533203125, -17.6865234375, -16.83984375, -15.9931640625, -15.146484375, -14.2998046875, -13.453125, -12.6064453125, -11.759765625, -10.9130859375, -10.06640625, -9.2197265625, -8.373046875, -7.5263671875, -6.6796875, -5.8330078125, -4.986328125, -4.1396484375, -3.29296875, -2.4462890625, -1.599609375, -0.7529296875, 0.09375, 0.9404296875, 1.787109375, 2.6337890625, 3.48046875, 4.3271484375, 5.173828125, 6.0205078125, 6.8671875, 7.7138671875, 8.560546875, 9.4072265625, 10.25390625, 11.1005859375, 11.947265625, 12.7939453125, 13.640625, 14.4873046875, 15.333984375, 16.1806640625, 17.02734375, 17.8740234375, 18.720703125, 19.5673828125, 20.4140625, 21.2607421875, 22.107421875, 22.9541015625, 23.80078125, 24.6474609375, 25.494140625, 26.3408203125, 27.1875]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 2.0, 8.0, 2.0, 6.0, 7.0, 8.0, 10.0, 8.0, 13.0, 20.0, 21.0, 23.0, 22.0, 28.0, 26.0, 38.0, 44.0, 30.0, 22.0, 32.0, 43.0, 41.0, 1067.0, 42.0, 51.0, 41.0, 47.0, 36.0, 35.0, 31.0, 34.0, 26.0, 24.0, 25.0, 25.0, 14.0, 16.0, 12.0, 12.0, 4.0, 7.0, 3.0, 4.0, 5.0, 4.0, 1.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-336.5, -326.26171875, -316.0234375, -305.78515625, -295.546875, -285.30859375, -275.0703125, -264.83203125, -254.59375, -244.35546875, -234.1171875, -223.87890625, -213.640625, -203.40234375, -193.1640625, -182.92578125, -172.6875, -162.44921875, -152.2109375, -141.97265625, -131.734375, -121.49609375, -111.2578125, -101.01953125, -90.78125, -80.54296875, -70.3046875, -60.06640625, -49.828125, -39.58984375, -29.3515625, -19.11328125, -8.875, 1.36328125, 11.6015625, 21.83984375, 32.078125, 42.31640625, 52.5546875, 62.79296875, 73.03125, 83.26953125, 93.5078125, 103.74609375, 113.984375, 124.22265625, 134.4609375, 144.69921875, 154.9375, 165.17578125, 175.4140625, 185.65234375, 195.890625, 206.12890625, 216.3671875, 226.60546875, 236.84375, 247.08203125, 257.3203125, 267.55859375, 277.796875, 288.03515625, 298.2734375, 308.51171875, 318.75]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 5.0, 5.0, 13.0, 11.0, 22.0, 25.0, 46.0, 74.0, 105.0, 144.0, 208.0, 249.0, 412.0, 548.0, 752.0, 998.0, 1440.0, 1952.0, 2781.0, 3933.0, 5519.0, 8107.0, 11892.0, 17288.0, 25933.0, 39841.0, 63058.0, 107289.0, 208280.0, 1261416.0, 125841.0, 72031.0, 44866.0, 29353.0, 19358.0, 13124.0, 8949.0, 6242.0, 4291.0, 3075.0, 2127.0, 1570.0, 1141.0, 768.0, 567.0, 440.0, 330.0, 229.0, 164.0, 117.0, 62.0, 58.0, 38.0, 24.0, 13.0, 9.0, 7.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-19.109375, -18.49560546875, -17.8818359375, -17.26806640625, -16.654296875, -16.04052734375, -15.4267578125, -14.81298828125, -14.19921875, -13.58544921875, -12.9716796875, -12.35791015625, -11.744140625, -11.13037109375, -10.5166015625, -9.90283203125, -9.2890625, -8.67529296875, -8.0615234375, -7.44775390625, -6.833984375, -6.22021484375, -5.6064453125, -4.99267578125, -4.37890625, -3.76513671875, -3.1513671875, -2.53759765625, -1.923828125, -1.31005859375, -0.6962890625, -0.08251953125, 0.53125, 1.14501953125, 1.7587890625, 2.37255859375, 2.986328125, 3.60009765625, 4.2138671875, 4.82763671875, 5.44140625, 6.05517578125, 6.6689453125, 7.28271484375, 7.896484375, 8.51025390625, 9.1240234375, 9.73779296875, 10.3515625, 10.96533203125, 11.5791015625, 12.19287109375, 12.806640625, 13.42041015625, 14.0341796875, 14.64794921875, 15.26171875, 15.87548828125, 16.4892578125, 17.10302734375, 17.716796875, 18.33056640625, 18.9443359375, 19.55810546875, 20.171875]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 6.0, 7.0, 8.0, 15.0, 17.0, 21.0, 35.0, 43.0, 45.0, 58.0, 39.0, 58.0, 64.0, 51.0, 73.0, 64.0, 67.0, 52.0, 54.0, 31.0, 41.0, 27.0, 30.0, 21.0, 16.0, 5.0, 13.0, 7.0, 7.0, 5.0, 5.0, 2.0, 1.0, 5.0, 0.0, 2.0, 3.0, 6.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10699462890625, -0.10355663299560547, -0.10011863708496094, -0.0966806411743164, -0.09324264526367188, -0.08980464935302734, -0.08636665344238281, -0.08292865753173828, -0.07949066162109375, -0.07605266571044922, -0.07261466979980469, -0.06917667388916016, -0.06573867797851562, -0.062300682067871094, -0.05886268615722656, -0.05542469024658203, -0.0519866943359375, -0.04854869842529297, -0.04511070251464844, -0.041672706604003906, -0.038234710693359375, -0.034796714782714844, -0.03135871887207031, -0.02792072296142578, -0.02448272705078125, -0.02104473114013672, -0.017606735229492188, -0.014168739318847656, -0.010730743408203125, -0.007292747497558594, -0.0038547515869140625, -0.00041675567626953125, 0.003021240234375, 0.006459236145019531, 0.009897232055664062, 0.013335227966308594, 0.016773223876953125, 0.020211219787597656, 0.023649215698242188, 0.02708721160888672, 0.03052520751953125, 0.03396320343017578, 0.03740119934082031, 0.040839195251464844, 0.044277191162109375, 0.047715187072753906, 0.05115318298339844, 0.05459117889404297, 0.0580291748046875, 0.06146717071533203, 0.06490516662597656, 0.0683431625366211, 0.07178115844726562, 0.07521915435791016, 0.07865715026855469, 0.08209514617919922, 0.08553314208984375, 0.08897113800048828, 0.09240913391113281, 0.09584712982177734, 0.09928512573242188, 0.1027231216430664, 0.10616111755371094, 0.10959911346435547, 0.113037109375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 7.0, 3.0, 8.0, 12.0, 11.0, 18.0, 19.0, 14.0, 28.0, 42.0, 66.0, 76.0, 96.0, 193.0, 365.0, 517.0, 1018.0, 1964.0, 4338.0, 10777.0, 34959.0, 139004.0, 476753.0, 280154.0, 66545.0, 18646.0, 6760.0, 2888.0, 1401.0, 747.0, 412.0, 242.0, 143.0, 87.0, 63.0, 50.0, 37.0, 24.0, 14.0, 12.0, 9.0, 11.0, 4.0, 4.0, 3.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.61376953125, -0.5950241088867188, -0.5762786865234375, -0.5575332641601562, -0.538787841796875, -0.5200424194335938, -0.5012969970703125, -0.48255157470703125, -0.46380615234375, -0.44506072998046875, -0.4263153076171875, -0.40756988525390625, -0.388824462890625, -0.37007904052734375, -0.3513336181640625, -0.33258819580078125, -0.3138427734375, -0.29509735107421875, -0.2763519287109375, -0.25760650634765625, -0.238861083984375, -0.22011566162109375, -0.2013702392578125, -0.18262481689453125, -0.16387939453125, -0.14513397216796875, -0.1263885498046875, -0.10764312744140625, -0.088897705078125, -0.07015228271484375, -0.0514068603515625, -0.03266143798828125, -0.013916015625, 0.00482940673828125, 0.0235748291015625, 0.04232025146484375, 0.061065673828125, 0.07981109619140625, 0.0985565185546875, 0.11730194091796875, 0.13604736328125, 0.15479278564453125, 0.1735382080078125, 0.19228363037109375, 0.211029052734375, 0.22977447509765625, 0.2485198974609375, 0.26726531982421875, 0.2860107421875, 0.30475616455078125, 0.3235015869140625, 0.34224700927734375, 0.360992431640625, 0.37973785400390625, 0.3984832763671875, 0.41722869873046875, 0.43597412109375, 0.45471954345703125, 0.4734649658203125, 0.49221038818359375, 0.510955810546875, 0.5297012329101562, 0.5484466552734375, 0.5671920776367188, 0.5859375]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 6.0, 22.0, 24.0, 44.0, 86.0, 108.0, 133.0, 146.0, 103.0, 90.0, 69.0, 41.0, 32.0, 29.0, 15.0, 18.0, 8.0, 8.0, 5.0, 7.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.07617875933647156, -0.07196757197380066, -0.06775639206171036, -0.06354521214962006, -0.05933402478694916, -0.05512284114956856, -0.05091165751218796, -0.04670047387480736, -0.04248929023742676, -0.03827810660004616, -0.03406692296266556, -0.029855739325284958, -0.025644555687904358, -0.021433372050523758, -0.017222188413143158, -0.013011004775762558, -0.008799821138381958, -0.004588637501001358, -0.00037745386362075806, 0.003833729773759842, 0.008044913411140442, 0.012256097048521042, 0.016467280685901642, 0.020678464323282242, 0.024889647960662842, 0.029100831598043442, 0.03331201523542404, 0.03752319887280464, 0.04173438251018524, 0.04594556614756584, 0.05015674978494644, 0.05436793342232704, 0.05857910215854645, 0.06279028952121735, 0.06700146943330765, 0.07121264934539795, 0.07542383670806885, 0.07963502407073975, 0.08384620398283005, 0.08805738389492035, 0.09226857125759125, 0.09647975862026215, 0.10069093853235245, 0.10490211844444275, 0.10911330580711365, 0.11332449316978455, 0.11753567308187485, 0.12174685299396515, 0.12595804035663605, 0.13016922771930695, 0.13438040018081665, 0.13859158754348755, 0.14280277490615845, 0.14701396226882935, 0.15122514963150024, 0.15543632209300995, 0.15964750945568085, 0.16385869681835175, 0.16806986927986145, 0.17228105664253235, 0.17649224400520325, 0.18070343136787415, 0.18491461873054504, 0.18912579119205475, 0.19333697855472565]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 4.0, 8.0, 3.0, 3.0, 9.0, 6.0, 10.0, 12.0, 16.0, 18.0, 20.0, 18.0, 16.0, 23.0, 35.0, 31.0, 43.0, 29.0, 27.0, 27.0, 35.0, 39.0, 47.0, 37.0, 39.0, 38.0, 36.0, 37.0, 32.0, 45.0, 35.0, 29.0, 34.0, 22.0, 21.0, 24.0, 20.0, 10.0, 8.0, 14.0, 8.0, 7.0, 10.0, 4.0, 4.0, 9.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.06549620628356934, -0.06358537077903748, -0.06167452782392502, -0.05976369231939316, -0.057852853089571, -0.05594201385974884, -0.05403117835521698, -0.05212033912539482, -0.05020949989557266, -0.048298660665750504, -0.046387821435928345, -0.044476985931396484, -0.042566146701574326, -0.04065530747175217, -0.038744471967220306, -0.03683363273739815, -0.03492279350757599, -0.03301195427775383, -0.03110111691057682, -0.02919027954339981, -0.027279440313577652, -0.025368601083755493, -0.023457763716578484, -0.021546926349401474, -0.019636087119579315, -0.017725247889757156, -0.015814410522580147, -0.013903572224080563, -0.011992733925580978, -0.010081895627081394, -0.00817105732858181, -0.006260219030082226, -0.004349380731582642, -0.0024385424330830574, -0.0005277041345834732, 0.001383134163916111, 0.003293972462415695, 0.005204810760915279, 0.007115649059414864, 0.009026487357914448, 0.010937325656414032, 0.012848163954913616, 0.0147590022534132, 0.01666983962059021, 0.01858067885041237, 0.020491518080234528, 0.022402355447411537, 0.024313192814588547, 0.026224032044410706, 0.028134871274232864, 0.030045708641409874, 0.031956546008586884, 0.03386738523840904, 0.0357782244682312, 0.03768905997276306, 0.03959989920258522, 0.04151073843240738, 0.04342157766222954, 0.0453324168920517, 0.04724325239658356, 0.049154091626405716, 0.051064930856227875, 0.052975766360759735, 0.054886605590581894, 0.05679744482040405]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 4.0, 1.0, 5.0, 6.0, 10.0, 15.0, 6.0, 17.0, 19.0, 15.0, 15.0, 26.0, 22.0, 28.0, 21.0, 40.0, 37.0, 47.0, 49.0, 40.0, 49.0, 45.0, 46.0, 39.0, 38.0, 38.0, 45.0, 37.0, 31.0, 28.0, 43.0, 29.0, 20.0, 15.0, 10.0, 13.0, 14.0, 9.0, 6.0, 7.0, 7.0, 2.0, 4.0, 4.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-520.5, -504.046875, -487.59375, -471.140625, -454.6875, -438.234375, -421.78125, -405.328125, -388.875, -372.421875, -355.96875, -339.515625, -323.0625, -306.609375, -290.15625, -273.703125, -257.25, -240.796875, -224.34375, -207.890625, -191.4375, -174.984375, -158.53125, -142.078125, -125.625, -109.171875, -92.71875, -76.265625, -59.8125, -43.359375, -26.90625, -10.453125, 6.0, 22.453125, 38.90625, 55.359375, 71.8125, 88.265625, 104.71875, 121.171875, 137.625, 154.078125, 170.53125, 186.984375, 203.4375, 219.890625, 236.34375, 252.796875, 269.25, 285.703125, 302.15625, 318.609375, 335.0625, 351.515625, 367.96875, 384.421875, 400.875, 417.328125, 433.78125, 450.234375, 466.6875, 483.140625, 499.59375, 516.046875, 532.5]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 5.0, 1.0, 5.0, 6.0, 9.0, 5.0, 14.0, 13.0, 24.0, 37.0, 36.0, 53.0, 70.0, 94.0, 143.0, 185.0, 260.0, 380.0, 596.0, 935.0, 1687.0, 3370.0, 8601.0, 26749.0, 115967.0, 640848.0, 189496.0, 38107.0, 11266.0, 4316.0, 2036.0, 1125.0, 652.0, 417.0, 306.0, 209.0, 148.0, 98.0, 70.0, 57.0, 45.0, 38.0, 21.0, 12.0, 20.0, 7.0, 6.0, 7.0, 5.0, 5.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-97.0, -93.93359375, -90.8671875, -87.80078125, -84.734375, -81.66796875, -78.6015625, -75.53515625, -72.46875, -69.40234375, -66.3359375, -63.26953125, -60.203125, -57.13671875, -54.0703125, -51.00390625, -47.9375, -44.87109375, -41.8046875, -38.73828125, -35.671875, -32.60546875, -29.5390625, -26.47265625, -23.40625, -20.33984375, -17.2734375, -14.20703125, -11.140625, -8.07421875, -5.0078125, -1.94140625, 1.125, 4.19140625, 7.2578125, 10.32421875, 13.390625, 16.45703125, 19.5234375, 22.58984375, 25.65625, 28.72265625, 31.7890625, 34.85546875, 37.921875, 40.98828125, 44.0546875, 47.12109375, 50.1875, 53.25390625, 56.3203125, 59.38671875, 62.453125, 65.51953125, 68.5859375, 71.65234375, 74.71875, 77.78515625, 80.8515625, 83.91796875, 86.984375, 90.05078125, 93.1171875, 96.18359375, 99.25]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 6.0, 10.0, 7.0, 9.0, 11.0, 15.0, 26.0, 31.0, 23.0, 25.0, 27.0, 38.0, 47.0, 48.0, 47.0, 47.0, 2018.0, 137.0, 34.0, 38.0, 57.0, 49.0, 45.0, 47.0, 43.0, 29.0, 24.0, 32.0, 12.0, 21.0, 12.0, 7.0, 4.0, 4.0, 5.0, 4.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-626.5, -604.0234375, -581.546875, -559.0703125, -536.59375, -514.1171875, -491.640625, -469.1640625, -446.6875, -424.2109375, -401.734375, -379.2578125, -356.78125, -334.3046875, -311.828125, -289.3515625, -266.875, -244.3984375, -221.921875, -199.4453125, -176.96875, -154.4921875, -132.015625, -109.5390625, -87.0625, -64.5859375, -42.109375, -19.6328125, 2.84375, 25.3203125, 47.796875, 70.2734375, 92.75, 115.2265625, 137.703125, 160.1796875, 182.65625, 205.1328125, 227.609375, 250.0859375, 272.5625, 295.0390625, 317.515625, 339.9921875, 362.46875, 384.9453125, 407.421875, 429.8984375, 452.375, 474.8515625, 497.328125, 519.8046875, 542.28125, 564.7578125, 587.234375, 609.7109375, 632.1875, 654.6640625, 677.140625, 699.6171875, 722.09375, 744.5703125, 767.046875, 789.5234375, 812.0]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 0.0, 1.0, 4.0, 3.0, 5.0, 5.0, 12.0, 8.0, 12.0, 16.0, 23.0, 33.0, 50.0, 55.0, 84.0, 103.0, 170.0, 231.0, 329.0, 502.0, 886.0, 1677.0, 4315.0, 17994.0, 139190.0, 2841737.0, 114873.0, 15427.0, 4029.0, 1590.0, 838.0, 465.0, 319.0, 198.0, 162.0, 103.0, 74.0, 53.0, 42.0, 32.0, 18.0, 14.0, 7.0, 6.0, 4.0, 4.0, 2.0, 4.0, 2.0, 4.0, 1.0, 2.0], "bins": [-142.25, -138.4521484375, -134.654296875, -130.8564453125, -127.05859375, -123.2607421875, -119.462890625, -115.6650390625, -111.8671875, -108.0693359375, -104.271484375, -100.4736328125, -96.67578125, -92.8779296875, -89.080078125, -85.2822265625, -81.484375, -77.6865234375, -73.888671875, -70.0908203125, -66.29296875, -62.4951171875, -58.697265625, -54.8994140625, -51.1015625, -47.3037109375, -43.505859375, -39.7080078125, -35.91015625, -32.1123046875, -28.314453125, -24.5166015625, -20.71875, -16.9208984375, -13.123046875, -9.3251953125, -5.52734375, -1.7294921875, 2.068359375, 5.8662109375, 9.6640625, 13.4619140625, 17.259765625, 21.0576171875, 24.85546875, 28.6533203125, 32.451171875, 36.2490234375, 40.046875, 43.8447265625, 47.642578125, 51.4404296875, 55.23828125, 59.0361328125, 62.833984375, 66.6318359375, 70.4296875, 74.2275390625, 78.025390625, 81.8232421875, 85.62109375, 89.4189453125, 93.216796875, 97.0146484375, 100.8125]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 8.0, 4.0, 6.0, 14.0, 33.0, 94.0, 280.0, 334.0, 151.0, 45.0, 17.0, 6.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3685.001220703125, -3614.29296875, -3543.5849609375, -3472.876708984375, -3402.16845703125, -3331.460205078125, -3260.752197265625, -3190.0439453125, -3119.335693359375, -3048.62744140625, -2977.91943359375, -2907.211181640625, -2836.5029296875, -2765.794677734375, -2695.086669921875, -2624.37841796875, -2553.67041015625, -2482.962158203125, -2412.254150390625, -2341.5458984375, -2270.837646484375, -2200.12939453125, -2129.42138671875, -2058.713134765625, -1988.0048828125, -1917.2967529296875, -1846.5885009765625, -1775.88037109375, -1705.172119140625, -1634.4639892578125, -1563.755859375, -1493.047607421875, -1422.3394775390625, -1351.63134765625, -1280.923095703125, -1210.2149658203125, -1139.5067138671875, -1068.798583984375, -998.0903930664062, -927.3822021484375, -856.6740112304688, -785.9658203125, -715.2576293945312, -644.5494384765625, -573.84130859375, -503.1330871582031, -432.4249267578125, -361.71673583984375, -291.008544921875, -220.30035400390625, -149.59217834472656, -78.88400268554688, -8.175811767578125, 62.532379150390625, 133.24053955078125, 203.94873046875, 274.65692138671875, 345.3651123046875, 416.07330322265625, 486.7814636230469, 557.4896240234375, 628.1978759765625, 698.906005859375, 769.6141967773438, 840.3223876953125]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 4.0, 3.0, 3.0, 6.0, 6.0, 8.0, 6.0, 11.0, 9.0, 26.0, 19.0, 34.0, 25.0, 36.0, 46.0, 45.0, 38.0, 39.0, 43.0, 44.0, 39.0, 40.0, 48.0, 48.0, 41.0, 43.0, 40.0, 43.0, 29.0, 30.0, 20.0, 19.0, 16.0, 17.0, 13.0, 12.0, 13.0, 7.0, 5.0, 4.0, 11.0, 8.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-780.2860107421875, -751.8855590820312, -723.485107421875, -695.0846557617188, -666.6842041015625, -638.2838134765625, -609.8833618164062, -581.48291015625, -553.0824584960938, -524.6820068359375, -496.28155517578125, -467.8811340332031, -439.4806823730469, -411.0802307128906, -382.6798095703125, -354.27935791015625, -325.87890625, -297.47845458984375, -269.0780029296875, -240.67758178710938, -212.27713012695312, -183.87667846679688, -155.4762420654297, -127.0758056640625, -98.67535400390625, -70.27490997314453, -41.87446594238281, -13.474021911621094, 14.926422119140625, 43.326873779296875, 71.72731018066406, 100.12774658203125, 128.5281982421875, 156.92864990234375, 185.32908630371094, 213.72952270507812, 242.12997436523438, 270.5304260253906, 298.93084716796875, 327.331298828125, 355.73175048828125, 384.1322021484375, 412.53265380859375, 440.9330749511719, 469.3335266113281, 497.7339782714844, 526.1343994140625, 554.5348510742188, 582.935302734375, 611.3357543945312, 639.7362060546875, 668.1366577148438, 696.537109375, 724.9375, 753.3379516601562, 781.7384033203125, 810.1388549804688, 838.539306640625, 866.9397583007812, 895.3402099609375, 923.7406005859375, 952.14111328125, 980.54150390625, 1008.9419555664062, 1037.3424072265625]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 0.0, 3.0, 0.0, 6.0, 4.0, 4.0, 7.0, 9.0, 5.0, 20.0, 13.0, 15.0, 21.0, 24.0, 20.0, 22.0, 34.0, 35.0, 52.0, 89.0, 168.0, 294.0, 553.0, 1162.0, 1041946.0, 1808.0, 988.0, 485.0, 251.0, 150.0, 80.0, 49.0, 38.0, 39.0, 24.0, 22.0, 22.0, 18.0, 13.0, 14.0, 10.0, 8.0, 5.0, 8.0, 3.0, 4.0, 4.0, 4.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-451.31146240234375, -437.1623840332031, -423.0133361816406, -408.8642578125, -394.7151794433594, -380.56610107421875, -366.41705322265625, -352.2679748535156, -338.118896484375, -323.9698181152344, -309.8207702636719, -295.67169189453125, -281.5226135253906, -267.37353515625, -253.2244873046875, -239.07540893554688, -224.92636108398438, -210.7772979736328, -196.6282196044922, -182.47915649414062, -168.330078125, -154.18101501464844, -140.03195190429688, -125.88288116455078, -111.73381042480469, -97.5847396850586, -83.4356689453125, -69.28660583496094, -55.137535095214844, -40.98846435546875, -26.839401245117188, -12.690330505371094, 1.458740234375, 15.607809066772461, 29.756877899169922, 43.90594482421875, 58.055015563964844, 72.20408630371094, 86.3531494140625, 100.5022201538086, 114.65129089355469, 128.80035400390625, 142.94943237304688, 157.09849548339844, 171.24755859375, 185.39663696289062, 199.5457000732422, 213.69476318359375, 227.84384155273438, 241.99290466308594, 256.1419677734375, 270.2910461425781, 284.44012451171875, 298.58917236328125, 312.7382507324219, 326.8873291015625, 341.036376953125, 355.1854553222656, 369.3345031738281, 383.48358154296875, 397.6326599121094, 411.78173828125, 425.9307861328125, 440.0798645019531, 454.22894287109375]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 3.0, 7.0, 11.0, 16.0, 23.0, 24.0, 61.0, 182.0, 1149.0, 51460976.0, 477.0, 113.0, 44.0, 15.0, 10.0, 11.0, 4.0, 1.0, 2.0, 2.0, 0.0, 5.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3681.113525390625, -3559.976318359375, -3438.83935546875, -3317.7021484375, -3196.56494140625, -3075.427734375, -2954.29052734375, -2833.153564453125, -2712.016357421875, -2590.879150390625, -2469.7421875, -2348.60498046875, -2227.4677734375, -2106.33056640625, -1985.1934814453125, -1864.056396484375, -1742.919189453125, -1621.781982421875, -1500.6448974609375, -1379.5078125, -1258.37060546875, -1137.2333984375, -1016.0963134765625, -894.9591674804688, -773.822021484375, -652.6848754882812, -531.5477294921875, -410.41058349609375, -289.2734375, -168.13629150390625, -46.9991455078125, 74.13800048828125, 195.275390625, 316.41253662109375, 437.5496826171875, 558.6868286132812, 679.823974609375, 800.9611206054688, 922.0982666015625, 1043.2353515625, 1164.37255859375, 1285.509765625, 1406.6468505859375, 1527.783935546875, 1648.921142578125, 1770.058349609375, 1891.1954345703125, 2012.33251953125, 2133.4697265625, 2254.60693359375, 2375.744140625, 2496.881103515625, 2618.018310546875, 2739.155517578125, 2860.29248046875, 2981.4296875, 3102.56689453125, 3223.7041015625, 3344.84130859375, 3465.978271484375, 3587.115478515625, 3708.252685546875, 3829.3896484375, 3950.52685546875, 4071.6640625]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 7.0, 11.0, 17.0, 17.0, 21.0, 46.0, 79.0, 103.0, 165.0, 204.0, 324.0, 502.0, 767.0, 1043.0, 1531.0, 2345.0, 3402.0, 5015.0, 7283.0, 10586.0, 15626.0, 23421.0, 34335.0, 52150.0, 79041.0, 125825.0, 213365.0, 393452.0, 3722641.0, 779755.0, 322017.0, 180537.0, 109051.0, 68945.0, 45186.0, 29803.0, 19891.0, 13851.0, 9064.0, 6287.0, 4326.0, 2982.0, 2059.0, 1407.0, 961.0, 640.0, 452.0, 318.0, 199.0, 127.0, 86.0, 55.0, 47.0, 27.0, 18.0, 12.0, 7.0, 4.0, 4.0, 5.0], "bins": [-8.6796875, -8.4154052734375, -8.151123046875, -7.8868408203125, -7.62255859375, -7.3582763671875, -7.093994140625, -6.8297119140625, -6.5654296875, -6.3011474609375, -6.036865234375, -5.7725830078125, -5.50830078125, -5.2440185546875, -4.979736328125, -4.7154541015625, -4.451171875, -4.1868896484375, -3.922607421875, -3.6583251953125, -3.39404296875, -3.1297607421875, -2.865478515625, -2.6011962890625, -2.3369140625, -2.0726318359375, -1.808349609375, -1.5440673828125, -1.27978515625, -1.0155029296875, -0.751220703125, -0.4869384765625, -0.22265625, 0.0416259765625, 0.305908203125, 0.5701904296875, 0.83447265625, 1.0987548828125, 1.363037109375, 1.6273193359375, 1.8916015625, 2.1558837890625, 2.420166015625, 2.6844482421875, 2.94873046875, 3.2130126953125, 3.477294921875, 3.7415771484375, 4.005859375, 4.2701416015625, 4.534423828125, 4.7987060546875, 5.06298828125, 5.3272705078125, 5.591552734375, 5.8558349609375, 6.1201171875, 6.3843994140625, 6.648681640625, 6.9129638671875, 7.17724609375, 7.4415283203125, 7.705810546875, 7.9700927734375, 8.234375]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 4.0, 7.0, 14.0, 6.0, 10.0, 10.0, 12.0, 17.0, 23.0, 19.0, 19.0, 17.0, 26.0, 28.0, 25.0, 30.0, 24.0, 31.0, 36.0, 34.0, 40.0, 34.0, 749.0, 362.0, 47.0, 40.0, 33.0, 42.0, 30.0, 31.0, 26.0, 30.0, 23.0, 16.0, 26.0, 21.0, 14.0, 13.0, 15.0, 8.0, 10.0, 5.0, 9.0, 2.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-113.125, -109.689453125, -106.25390625, -102.818359375, -99.3828125, -95.947265625, -92.51171875, -89.076171875, -85.640625, -82.205078125, -78.76953125, -75.333984375, -71.8984375, -68.462890625, -65.02734375, -61.591796875, -58.15625, -54.720703125, -51.28515625, -47.849609375, -44.4140625, -40.978515625, -37.54296875, -34.107421875, -30.671875, -27.236328125, -23.80078125, -20.365234375, -16.9296875, -13.494140625, -10.05859375, -6.623046875, -3.1875, 0.248046875, 3.68359375, 7.119140625, 10.5546875, 13.990234375, 17.42578125, 20.861328125, 24.296875, 27.732421875, 31.16796875, 34.603515625, 38.0390625, 41.474609375, 44.91015625, 48.345703125, 51.78125, 55.216796875, 58.65234375, 62.087890625, 65.5234375, 68.958984375, 72.39453125, 75.830078125, 79.265625, 82.701171875, 86.13671875, 89.572265625, 93.0078125, 96.443359375, 99.87890625, 103.314453125, 106.75]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 8.0, 5.0, 14.0, 19.0, 20.0, 36.0, 51.0, 100.0, 150.0, 222.0, 384.0, 548.0, 793.0, 1179.0, 1847.0, 2678.0, 4094.0, 6282.0, 9472.0, 14530.0, 22500.0, 35155.0, 56193.0, 91646.0, 152174.0, 263524.0, 454771.0, 3695626.0, 643998.0, 334211.0, 192408.0, 114311.0, 69575.0, 43432.0, 27706.0, 17784.0, 11565.0, 7807.0, 4946.0, 3250.0, 2146.0, 1421.0, 928.0, 652.0, 446.0, 298.0, 188.0, 121.0, 85.0, 58.0, 30.0, 24.0, 15.0, 8.0, 4.0, 8.0, 1.0, 1.0, 0.0, 2.0], "bins": [-7.9140625, -7.66455078125, -7.4150390625, -7.16552734375, -6.916015625, -6.66650390625, -6.4169921875, -6.16748046875, -5.91796875, -5.66845703125, -5.4189453125, -5.16943359375, -4.919921875, -4.67041015625, -4.4208984375, -4.17138671875, -3.921875, -3.67236328125, -3.4228515625, -3.17333984375, -2.923828125, -2.67431640625, -2.4248046875, -2.17529296875, -1.92578125, -1.67626953125, -1.4267578125, -1.17724609375, -0.927734375, -0.67822265625, -0.4287109375, -0.17919921875, 0.0703125, 0.31982421875, 0.5693359375, 0.81884765625, 1.068359375, 1.31787109375, 1.5673828125, 1.81689453125, 2.06640625, 2.31591796875, 2.5654296875, 2.81494140625, 3.064453125, 3.31396484375, 3.5634765625, 3.81298828125, 4.0625, 4.31201171875, 4.5615234375, 4.81103515625, 5.060546875, 5.31005859375, 5.5595703125, 5.80908203125, 6.05859375, 6.30810546875, 6.5576171875, 6.80712890625, 7.056640625, 7.30615234375, 7.5556640625, 7.80517578125, 8.0546875]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 3.0, 2.0, 5.0, 5.0, 7.0, 11.0, 10.0, 9.0, 17.0, 15.0, 18.0, 22.0, 27.0, 24.0, 26.0, 34.0, 30.0, 45.0, 34.0, 43.0, 43.0, 129.0, 974.0, 46.0, 46.0, 51.0, 32.0, 31.0, 43.0, 29.0, 28.0, 32.0, 30.0, 19.0, 22.0, 14.0, 16.0, 13.0, 8.0, 12.0, 9.0, 4.0, 1.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.375, -81.4912109375, -78.607421875, -75.7236328125, -72.83984375, -69.9560546875, -67.072265625, -64.1884765625, -61.3046875, -58.4208984375, -55.537109375, -52.6533203125, -49.76953125, -46.8857421875, -44.001953125, -41.1181640625, -38.234375, -35.3505859375, -32.466796875, -29.5830078125, -26.69921875, -23.8154296875, -20.931640625, -18.0478515625, -15.1640625, -12.2802734375, -9.396484375, -6.5126953125, -3.62890625, -0.7451171875, 2.138671875, 5.0224609375, 7.90625, 10.7900390625, 13.673828125, 16.5576171875, 19.44140625, 22.3251953125, 25.208984375, 28.0927734375, 30.9765625, 33.8603515625, 36.744140625, 39.6279296875, 42.51171875, 45.3955078125, 48.279296875, 51.1630859375, 54.046875, 56.9306640625, 59.814453125, 62.6982421875, 65.58203125, 68.4658203125, 71.349609375, 74.2333984375, 77.1171875, 80.0009765625, 82.884765625, 85.7685546875, 88.65234375, 91.5361328125, 94.419921875, 97.3037109375, 100.1875]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 3.0, 4.0, 3.0, 0.0, 0.0, 8.0, 11.0, 7.0, 15.0, 26.0, 25.0, 35.0, 53.0, 62.0, 97.0, 106.0, 133.0, 185.0, 309.0, 407.0, 560.0, 870.0, 1255.0, 2018.0, 3478.0, 5630.0, 9888.0, 17078.0, 31388.0, 59766.0, 130299.0, 5716849.0, 160701.0, 67949.0, 35339.0, 19260.0, 10944.0, 6215.0, 3718.0, 2228.0, 1493.0, 876.0, 609.0, 385.0, 321.0, 212.0, 146.0, 137.0, 99.0, 73.0, 43.0, 34.0, 32.0, 16.0, 15.0, 11.0, 7.0, 5.0, 4.0, 7.0, 1.0, 3.0, 2.0], "bins": [-21.015625, -20.370849609375, -19.72607421875, -19.081298828125, -18.4365234375, -17.791748046875, -17.14697265625, -16.502197265625, -15.857421875, -15.212646484375, -14.56787109375, -13.923095703125, -13.2783203125, -12.633544921875, -11.98876953125, -11.343994140625, -10.69921875, -10.054443359375, -9.40966796875, -8.764892578125, -8.1201171875, -7.475341796875, -6.83056640625, -6.185791015625, -5.541015625, -4.896240234375, -4.25146484375, -3.606689453125, -2.9619140625, -2.317138671875, -1.67236328125, -1.027587890625, -0.3828125, 0.261962890625, 0.90673828125, 1.551513671875, 2.1962890625, 2.841064453125, 3.48583984375, 4.130615234375, 4.775390625, 5.420166015625, 6.06494140625, 6.709716796875, 7.3544921875, 7.999267578125, 8.64404296875, 9.288818359375, 9.93359375, 10.578369140625, 11.22314453125, 11.867919921875, 12.5126953125, 13.157470703125, 13.80224609375, 14.447021484375, 15.091796875, 15.736572265625, 16.38134765625, 17.026123046875, 17.6708984375, 18.315673828125, 18.96044921875, 19.605224609375, 20.25]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 7.0, 8.0, 3.0, 18.0, 8.0, 9.0, 13.0, 9.0, 18.0, 21.0, 28.0, 33.0, 31.0, 31.0, 34.0, 37.0, 35.0, 30.0, 38.0, 66.0, 1013.0, 80.0, 39.0, 37.0, 44.0, 32.0, 37.0, 40.0, 38.0, 31.0, 20.0, 23.0, 22.0, 19.0, 11.0, 12.0, 3.0, 10.0, 13.0, 5.0, 7.0, 2.0, 5.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.875, -64.6064453125, -62.337890625, -60.0693359375, -57.80078125, -55.5322265625, -53.263671875, -50.9951171875, -48.7265625, -46.4580078125, -44.189453125, -41.9208984375, -39.65234375, -37.3837890625, -35.115234375, -32.8466796875, -30.578125, -28.3095703125, -26.041015625, -23.7724609375, -21.50390625, -19.2353515625, -16.966796875, -14.6982421875, -12.4296875, -10.1611328125, -7.892578125, -5.6240234375, -3.35546875, -1.0869140625, 1.181640625, 3.4501953125, 5.71875, 7.9873046875, 10.255859375, 12.5244140625, 14.79296875, 17.0615234375, 19.330078125, 21.5986328125, 23.8671875, 26.1357421875, 28.404296875, 30.6728515625, 32.94140625, 35.2099609375, 37.478515625, 39.7470703125, 42.015625, 44.2841796875, 46.552734375, 48.8212890625, 51.08984375, 53.3583984375, 55.626953125, 57.8955078125, 60.1640625, 62.4326171875, 64.701171875, 66.9697265625, 69.23828125, 71.5068359375, 73.775390625, 76.0439453125, 78.3125]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 15.0, 32.0, 76.0, 260.0, 423.0, 116.0, 47.0, 25.0, 6.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-498.89581298828125, -487.05743408203125, -475.2190856933594, -463.3807067871094, -451.5423583984375, -439.7039794921875, -427.8656311035156, -416.0272521972656, -404.18890380859375, -392.35052490234375, -380.5121765136719, -368.6737976074219, -356.83544921875, -344.9970703125, -333.1587219238281, -321.3203430175781, -309.48199462890625, -297.64361572265625, -285.8052673339844, -273.9668884277344, -262.1285400390625, -250.29017639160156, -238.45181274414062, -226.61343383789062, -214.77505493164062, -202.9366912841797, -191.09832763671875, -179.2599639892578, -167.42160034179688, -155.58323669433594, -143.744873046875, -131.906494140625, -120.06814575195312, -108.22978210449219, -96.39141845703125, -84.55305480957031, -72.71469116210938, -60.87632369995117, -49.03795623779297, -37.19959259033203, -25.361228942871094, -13.52286434173584, -1.684499740600586, 10.153865814208984, 21.992229461669922, 33.83059310913086, 45.66896057128906, 57.50732421875, 69.34568786621094, 81.18405151367188, 93.02241516113281, 104.86077880859375, 116.69914245605469, 128.53750610351562, 140.37588500976562, 152.2142333984375, 164.0526123046875, 175.89097595214844, 187.72933959960938, 199.5677032470703, 211.40606689453125, 223.2444305419922, 235.08279418945312, 246.92117309570312, 258.759521484375]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 4.0, 6.0, 10.0, 8.0, 10.0, 12.0, 8.0, 10.0, 19.0, 23.0, 13.0, 27.0, 26.0, 25.0, 32.0, 29.0, 39.0, 41.0, 35.0, 44.0, 44.0, 38.0, 46.0, 58.0, 43.0, 35.0, 38.0, 37.0, 23.0, 21.0, 27.0, 27.0, 19.0, 25.0, 17.0, 16.0, 17.0, 13.0, 10.0, 10.0, 10.0, 5.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-171.00814819335938, -166.32424926757812, -161.64035034179688, -156.95645141601562, -152.27255249023438, -147.5886688232422, -142.90476989746094, -138.2208709716797, -133.53697204589844, -128.8530731201172, -124.16917419433594, -119.48528289794922, -114.80138397216797, -110.11748504638672, -105.43359375, -100.74969482421875, -96.0657958984375, -91.38189697265625, -86.697998046875, -82.01410675048828, -77.33020782470703, -72.64630889892578, -67.96241760253906, -63.27851867675781, -58.59461975097656, -53.91072082519531, -49.22682571411133, -44.542930603027344, -39.859031677246094, -35.175132751464844, -30.49123764038086, -25.807342529296875, -21.123458862304688, -16.43956184387207, -11.755664825439453, -7.071767807006836, -2.3878707885742188, 2.2960262298583984, 6.979923248291016, 11.663818359375, 16.34771728515625, 21.031614303588867, 25.715511322021484, 30.3994083404541, 35.08330535888672, 39.76720428466797, 44.45109939575195, 49.13499450683594, 53.81889343261719, 58.50279235839844, 63.18668746948242, 67.8705825805664, 72.55448150634766, 77.2383804321289, 81.92227172851562, 86.60617065429688, 91.29006958007812, 95.97396850585938, 100.65786743164062, 105.34175872802734, 110.0256576538086, 114.70955657958984, 119.39344787597656, 124.07734680175781, 128.76124572753906]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 3.0, 6.0, 4.0, 1.0, 2.0, 9.0, 5.0, 9.0, 7.0, 18.0, 14.0, 15.0, 33.0, 34.0, 35.0, 47.0, 64.0, 75.0, 110.0, 156.0, 189.0, 288.0, 430.0, 618.0, 964.0, 1570.0, 3066.0, 7250.0, 30568.0, 4088915.0, 44389.0, 7998.0, 2957.0, 1581.0, 944.0, 581.0, 414.0, 241.0, 197.0, 127.0, 97.0, 75.0, 52.0, 29.0, 31.0, 16.0, 17.0, 12.0, 8.0, 6.0, 4.0, 2.0, 5.0, 2.0, 3.0], "bins": [-3.162109375, -3.08013916015625, -2.9981689453125, -2.91619873046875, -2.834228515625, -2.75225830078125, -2.6702880859375, -2.58831787109375, -2.50634765625, -2.42437744140625, -2.3424072265625, -2.26043701171875, -2.178466796875, -2.09649658203125, -2.0145263671875, -1.93255615234375, -1.8505859375, -1.76861572265625, -1.6866455078125, -1.60467529296875, -1.522705078125, -1.44073486328125, -1.3587646484375, -1.27679443359375, -1.19482421875, -1.11285400390625, -1.0308837890625, -0.94891357421875, -0.866943359375, -0.78497314453125, -0.7030029296875, -0.62103271484375, -0.5390625, -0.45709228515625, -0.3751220703125, -0.29315185546875, -0.211181640625, -0.12921142578125, -0.0472412109375, 0.03472900390625, 0.11669921875, 0.19866943359375, 0.2806396484375, 0.36260986328125, 0.444580078125, 0.52655029296875, 0.6085205078125, 0.69049072265625, 0.7724609375, 0.85443115234375, 0.9364013671875, 1.01837158203125, 1.100341796875, 1.18231201171875, 1.2642822265625, 1.34625244140625, 1.42822265625, 1.51019287109375, 1.5921630859375, 1.67413330078125, 1.756103515625, 1.83807373046875, 1.9200439453125, 2.00201416015625, 2.083984375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 8.0, 6.0, 4.0, 4.0, 2.0, 8.0, 5.0, 14.0, 12.0, 9.0, 26.0, 727.0, 77.0, 20.0, 23.0, 6.0, 6.0, 6.0, 8.0, 7.0, 3.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.99609375, -0.9704437255859375, -0.944793701171875, -0.9191436767578125, -0.89349365234375, -0.8678436279296875, -0.842193603515625, -0.8165435791015625, -0.7908935546875, -0.7652435302734375, -0.739593505859375, -0.7139434814453125, -0.68829345703125, -0.6626434326171875, -0.636993408203125, -0.6113433837890625, -0.585693359375, -0.5600433349609375, -0.534393310546875, -0.5087432861328125, -0.48309326171875, -0.4574432373046875, -0.431793212890625, -0.4061431884765625, -0.3804931640625, -0.3548431396484375, -0.329193115234375, -0.3035430908203125, -0.27789306640625, -0.2522430419921875, -0.226593017578125, -0.2009429931640625, -0.17529296875, -0.1496429443359375, -0.123992919921875, -0.0983428955078125, -0.07269287109375, -0.0470428466796875, -0.021392822265625, 0.0042572021484375, 0.0299072265625, 0.0555572509765625, 0.081207275390625, 0.1068572998046875, 0.13250732421875, 0.1581573486328125, 0.183807373046875, 0.2094573974609375, 0.235107421875, 0.2607574462890625, 0.286407470703125, 0.3120574951171875, 0.33770751953125, 0.3633575439453125, 0.389007568359375, 0.4146575927734375, 0.4403076171875, 0.4659576416015625, 0.491607666015625, 0.5172576904296875, 0.54290771484375, 0.5685577392578125, 0.594207763671875, 0.6198577880859375, 0.6455078125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 9.0, 4.0, 6.0, 14.0, 9.0, 19.0, 34.0, 41.0, 44.0, 79.0, 145.0, 182.0, 362.0, 502.0, 879.0, 1356.0, 2487.0, 4572.0, 9979.0, 26473.0, 160955.0, 3793198.0, 147147.0, 26041.0, 9552.0, 4540.0, 2358.0, 1311.0, 796.0, 432.0, 290.0, 167.0, 117.0, 68.0, 43.0, 27.0, 18.0, 16.0, 6.0, 5.0, 4.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.212890625, -2.1522369384765625, -2.091583251953125, -2.0309295654296875, -1.97027587890625, -1.9096221923828125, -1.848968505859375, -1.7883148193359375, -1.7276611328125, -1.6670074462890625, -1.606353759765625, -1.5457000732421875, -1.48504638671875, -1.4243927001953125, -1.363739013671875, -1.3030853271484375, -1.242431640625, -1.1817779541015625, -1.121124267578125, -1.0604705810546875, -0.99981689453125, -0.9391632080078125, -0.878509521484375, -0.8178558349609375, -0.7572021484375, -0.6965484619140625, -0.635894775390625, -0.5752410888671875, -0.51458740234375, -0.4539337158203125, -0.393280029296875, -0.3326263427734375, -0.27197265625, -0.2113189697265625, -0.150665283203125, -0.0900115966796875, -0.02935791015625, 0.0312957763671875, 0.091949462890625, 0.1526031494140625, 0.2132568359375, 0.2739105224609375, 0.334564208984375, 0.3952178955078125, 0.45587158203125, 0.5165252685546875, 0.577178955078125, 0.6378326416015625, 0.698486328125, 0.7591400146484375, 0.819793701171875, 0.8804473876953125, 0.94110107421875, 1.0017547607421875, 1.062408447265625, 1.1230621337890625, 1.1837158203125, 1.2443695068359375, 1.305023193359375, 1.3656768798828125, 1.42633056640625, 1.4869842529296875, 1.547637939453125, 1.6082916259765625, 1.6689453125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 10.0, 6.0, 9.0, 13.0, 12.0, 14.0, 12.0, 33.0, 51.0, 134.0, 323.0, 2206.0, 818.0, 157.0, 75.0, 62.0, 33.0, 15.0, 20.0, 6.0, 8.0, 6.0, 5.0, 4.0, 6.0, 5.0, 3.0, 1.0, 0.0, 2.0, 3.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.150390625, -1.1173095703125, -1.084228515625, -1.0511474609375, -1.01806640625, -0.9849853515625, -0.951904296875, -0.9188232421875, -0.8857421875, -0.8526611328125, -0.819580078125, -0.7864990234375, -0.75341796875, -0.7203369140625, -0.687255859375, -0.6541748046875, -0.62109375, -0.5880126953125, -0.554931640625, -0.5218505859375, -0.48876953125, -0.4556884765625, -0.422607421875, -0.3895263671875, -0.3564453125, -0.3233642578125, -0.290283203125, -0.2572021484375, -0.22412109375, -0.1910400390625, -0.157958984375, -0.1248779296875, -0.091796875, -0.0587158203125, -0.025634765625, 0.0074462890625, 0.04052734375, 0.0736083984375, 0.106689453125, 0.1397705078125, 0.1728515625, 0.2059326171875, 0.239013671875, 0.2720947265625, 0.30517578125, 0.3382568359375, 0.371337890625, 0.4044189453125, 0.4375, 0.4705810546875, 0.503662109375, 0.5367431640625, 0.56982421875, 0.6029052734375, 0.635986328125, 0.6690673828125, 0.7021484375, 0.7352294921875, 0.768310546875, 0.8013916015625, 0.83447265625, 0.8675537109375, 0.900634765625, 0.9337158203125, 0.966796875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 8.0, 6.0, 16.0, 62.0, 312.0, 430.0, 121.0, 37.0, 9.0, 6.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.919100284576416, -6.682254791259766, -6.445409774780273, -6.208564758300781, -5.971719264984131, -5.7348737716674805, -5.498028755187988, -5.261183738708496, -5.024338245391846, -4.787492752075195, -4.550647735595703, -4.313802719116211, -4.0769572257995605, -3.8401119709014893, -3.603266716003418, -3.3664214611053467, -3.1295762062072754, -2.892730951309204, -2.655885696411133, -2.4190404415130615, -2.1821951866149902, -1.945349931716919, -1.7085046768188477, -1.4716594219207764, -1.234814167022705, -0.9979689121246338, -0.7611236572265625, -0.5242784023284912, -0.2874331474304199, -0.05058789253234863, 0.18625736236572266, 0.42310261726379395, 0.6599483489990234, 0.8967936038970947, 1.133638858795166, 1.3704841136932373, 1.6073293685913086, 1.8441746234893799, 2.081019878387451, 2.3178651332855225, 2.5547103881835938, 2.791555643081665, 3.0284008979797363, 3.2652461528778076, 3.502091407775879, 3.73893666267395, 3.9757819175720215, 4.212627410888672, 4.449472427368164, 4.686317443847656, 4.923162937164307, 5.160008430480957, 5.396853446960449, 5.633698463439941, 5.870543956756592, 6.107389450073242, 6.344234466552734, 6.581079483032227, 6.817924976348877, 7.054770469665527, 7.2916154861450195, 7.528460502624512, 7.765305995941162, 8.002151489257812, 8.238996505737305]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 3.0, 5.0, 7.0, 2.0, 2.0, 5.0, 10.0, 9.0, 18.0, 20.0, 21.0, 38.0, 50.0, 54.0, 65.0, 86.0, 94.0, 98.0, 67.0, 79.0, 65.0, 42.0, 45.0, 21.0, 20.0, 10.0, 12.0, 11.0, 7.0, 7.0, 3.0, 7.0, 6.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9708611965179443, -2.8577542304992676, -2.744647264480591, -2.631540298461914, -2.518433094024658, -2.4053263664245605, -2.2922191619873047, -2.179112195968628, -2.066005229949951, -1.9528982639312744, -1.8397912979125977, -1.7266842126846313, -1.6135772466659546, -1.5004702806472778, -1.3873631954193115, -1.2742562294006348, -1.161149263381958, -1.0480422973632812, -0.9349352717399597, -0.8218282461166382, -0.7087212800979614, -0.5956143140792847, -0.48250728845596313, -0.3694002628326416, -0.25629329681396484, -0.1431863009929657, -0.030079305171966553, 0.08302769064903259, 0.19613468647003174, 0.3092416524887085, 0.42234867811203003, 0.5354557037353516, 0.6485629081726074, 0.7616698741912842, 0.8747768998146057, 0.9878839254379272, 1.100990891456604, 1.2140978574752808, 1.327204942703247, 1.4403119087219238, 1.5534188747406006, 1.6665258407592773, 1.779632806777954, 1.8927398920059204, 2.0058469772338867, 2.1189537048339844, 2.2320609092712402, 2.345167875289917, 2.4582748413085938, 2.5713818073272705, 2.6844887733459473, 2.797595739364624, 2.910702705383301, 3.0238099098205566, 3.1369168758392334, 3.25002384185791, 3.363130807876587, 3.4762377738952637, 3.5893447399139404, 3.702451705932617, 3.815558910369873, 3.9286656379699707, 4.041772842407227, 4.154879570007324, 4.26798677444458]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 6.0, 6.0, 11.0, 13.0, 22.0, 29.0, 31.0, 51.0, 67.0, 98.0, 139.0, 212.0, 301.0, 456.0, 711.0, 1016.0, 1703.0, 2877.0, 5166.0, 10216.0, 26254.0, 902338.0, 63504.0, 16011.0, 7302.0, 3756.0, 2246.0, 1410.0, 872.0, 561.0, 363.0, 239.0, 153.0, 137.0, 79.0, 58.0, 36.0, 28.0, 29.0, 10.0, 12.0, 14.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 3.0], "bins": [-5.296875, -5.152801513671875, -5.00872802734375, -4.864654541015625, -4.7205810546875, -4.576507568359375, -4.43243408203125, -4.288360595703125, -4.144287109375, -4.000213623046875, -3.85614013671875, -3.712066650390625, -3.5679931640625, -3.423919677734375, -3.27984619140625, -3.135772705078125, -2.99169921875, -2.847625732421875, -2.70355224609375, -2.559478759765625, -2.4154052734375, -2.271331787109375, -2.12725830078125, -1.983184814453125, -1.839111328125, -1.695037841796875, -1.55096435546875, -1.406890869140625, -1.2628173828125, -1.118743896484375, -0.97467041015625, -0.830596923828125, -0.6865234375, -0.542449951171875, -0.39837646484375, -0.254302978515625, -0.1102294921875, 0.033843994140625, 0.17791748046875, 0.321990966796875, 0.466064453125, 0.610137939453125, 0.75421142578125, 0.898284912109375, 1.0423583984375, 1.186431884765625, 1.33050537109375, 1.474578857421875, 1.61865234375, 1.762725830078125, 1.90679931640625, 2.050872802734375, 2.1949462890625, 2.339019775390625, 2.48309326171875, 2.627166748046875, 2.771240234375, 2.915313720703125, 3.05938720703125, 3.203460693359375, 3.3475341796875, 3.491607666015625, 3.63568115234375, 3.779754638671875, 3.923828125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 4.0, 2.0, 5.0, 3.0, 5.0, 7.0, 4.0, 11.0, 15.0, 12.0, 15.0, 44.0, 709.0, 70.0, 21.0, 18.0, 6.0, 7.0, 10.0, 5.0, 3.0, 4.0, 3.0, 1.0, 4.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.92724609375, -0.9031448364257812, -0.8790435791015625, -0.8549423217773438, -0.830841064453125, -0.8067398071289062, -0.7826385498046875, -0.7585372924804688, -0.73443603515625, -0.7103347778320312, -0.6862335205078125, -0.6621322631835938, -0.638031005859375, -0.6139297485351562, -0.5898284912109375, -0.5657272338867188, -0.5416259765625, -0.5175247192382812, -0.4934234619140625, -0.46932220458984375, -0.445220947265625, -0.42111968994140625, -0.3970184326171875, -0.37291717529296875, -0.34881591796875, -0.32471466064453125, -0.3006134033203125, -0.27651214599609375, -0.252410888671875, -0.22830963134765625, -0.2042083740234375, -0.18010711669921875, -0.156005859375, -0.13190460205078125, -0.1078033447265625, -0.08370208740234375, -0.059600830078125, -0.03549957275390625, -0.0113983154296875, 0.01270294189453125, 0.03680419921875, 0.06090545654296875, 0.0850067138671875, 0.10910797119140625, 0.133209228515625, 0.15731048583984375, 0.1814117431640625, 0.20551300048828125, 0.2296142578125, 0.25371551513671875, 0.2778167724609375, 0.30191802978515625, 0.326019287109375, 0.35012054443359375, 0.3742218017578125, 0.39832305908203125, 0.42242431640625, 0.44652557373046875, 0.4706268310546875, 0.49472808837890625, 0.518829345703125, 0.5429306030273438, 0.5670318603515625, 0.5911331176757812, 0.615234375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 6.0, 6.0, 8.0, 12.0, 6.0, 14.0, 23.0, 20.0, 32.0, 45.0, 74.0, 99.0, 160.0, 291.0, 460.0, 985.0, 1948.0, 4354.0, 11497.0, 36098.0, 149976.0, 613271.0, 168122.0, 39586.0, 12367.0, 4702.0, 2053.0, 1028.0, 514.0, 255.0, 180.0, 114.0, 73.0, 50.0, 29.0, 31.0, 17.0, 18.0, 14.0, 8.0, 5.0, 6.0, 4.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.375, -2.294586181640625, -2.21417236328125, -2.133758544921875, -2.0533447265625, -1.972930908203125, -1.89251708984375, -1.812103271484375, -1.731689453125, -1.651275634765625, -1.57086181640625, -1.490447998046875, -1.4100341796875, -1.329620361328125, -1.24920654296875, -1.168792724609375, -1.08837890625, -1.007965087890625, -0.92755126953125, -0.847137451171875, -0.7667236328125, -0.686309814453125, -0.60589599609375, -0.525482177734375, -0.445068359375, -0.364654541015625, -0.28424072265625, -0.203826904296875, -0.1234130859375, -0.042999267578125, 0.03741455078125, 0.117828369140625, 0.1982421875, 0.278656005859375, 0.35906982421875, 0.439483642578125, 0.5198974609375, 0.600311279296875, 0.68072509765625, 0.761138916015625, 0.841552734375, 0.921966552734375, 1.00238037109375, 1.082794189453125, 1.1632080078125, 1.243621826171875, 1.32403564453125, 1.404449462890625, 1.48486328125, 1.565277099609375, 1.64569091796875, 1.726104736328125, 1.8065185546875, 1.886932373046875, 1.96734619140625, 2.047760009765625, 2.128173828125, 2.208587646484375, 2.28900146484375, 2.369415283203125, 2.4498291015625, 2.530242919921875, 2.61065673828125, 2.691070556640625, 2.771484375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 2.0, 1.0, 4.0, 7.0, 2.0, 3.0, 7.0, 4.0, 5.0, 12.0, 11.0, 14.0, 16.0, 16.0, 14.0, 14.0, 22.0, 25.0, 33.0, 31.0, 38.0, 32.0, 31.0, 33.0, 42.0, 33.0, 37.0, 33.0, 32.0, 41.0, 33.0, 30.0, 30.0, 35.0, 33.0, 34.0, 27.0, 26.0, 29.0, 20.0, 23.0, 14.0, 20.0, 8.0, 6.0, 8.0, 8.0, 9.0, 2.0, 3.0, 6.0, 3.0, 3.0, 2.0, 4.0, 0.0, 0.0, 4.0, 1.0, 0.0, 2.0], "bins": [-2.287109375, -2.21209716796875, -2.1370849609375, -2.06207275390625, -1.987060546875, -1.91204833984375, -1.8370361328125, -1.76202392578125, -1.68701171875, -1.61199951171875, -1.5369873046875, -1.46197509765625, -1.386962890625, -1.31195068359375, -1.2369384765625, -1.16192626953125, -1.0869140625, -1.01190185546875, -0.9368896484375, -0.86187744140625, -0.786865234375, -0.71185302734375, -0.6368408203125, -0.56182861328125, -0.48681640625, -0.41180419921875, -0.3367919921875, -0.26177978515625, -0.186767578125, -0.11175537109375, -0.0367431640625, 0.03826904296875, 0.11328125, 0.18829345703125, 0.2633056640625, 0.33831787109375, 0.413330078125, 0.48834228515625, 0.5633544921875, 0.63836669921875, 0.71337890625, 0.78839111328125, 0.8634033203125, 0.93841552734375, 1.013427734375, 1.08843994140625, 1.1634521484375, 1.23846435546875, 1.3134765625, 1.38848876953125, 1.4635009765625, 1.53851318359375, 1.613525390625, 1.68853759765625, 1.7635498046875, 1.83856201171875, 1.91357421875, 1.98858642578125, 2.0635986328125, 2.13861083984375, 2.213623046875, 2.28863525390625, 2.3636474609375, 2.43865966796875, 2.513671875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 8.0, 14.0, 12.0, 14.0, 30.0, 32.0, 51.0, 80.0, 137.0, 252.0, 459.0, 986.0, 2850.0, 10837.0, 137551.0, 856846.0, 30058.0, 5233.0, 1634.0, 672.0, 321.0, 170.0, 102.0, 69.0, 33.0, 26.0, 21.0, 11.0, 13.0, 2.0, 3.0, 8.0, 3.0, 6.0, 1.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2578125, -3.1654052734375, -3.072998046875, -2.9805908203125, -2.88818359375, -2.7957763671875, -2.703369140625, -2.6109619140625, -2.5185546875, -2.4261474609375, -2.333740234375, -2.2413330078125, -2.14892578125, -2.0565185546875, -1.964111328125, -1.8717041015625, -1.779296875, -1.6868896484375, -1.594482421875, -1.5020751953125, -1.40966796875, -1.3172607421875, -1.224853515625, -1.1324462890625, -1.0400390625, -0.9476318359375, -0.855224609375, -0.7628173828125, -0.67041015625, -0.5780029296875, -0.485595703125, -0.3931884765625, -0.30078125, -0.2083740234375, -0.115966796875, -0.0235595703125, 0.06884765625, 0.1612548828125, 0.253662109375, 0.3460693359375, 0.4384765625, 0.5308837890625, 0.623291015625, 0.7156982421875, 0.80810546875, 0.9005126953125, 0.992919921875, 1.0853271484375, 1.177734375, 1.2701416015625, 1.362548828125, 1.4549560546875, 1.54736328125, 1.6397705078125, 1.732177734375, 1.8245849609375, 1.9169921875, 2.0093994140625, 2.101806640625, 2.1942138671875, 2.28662109375, 2.3790283203125, 2.471435546875, 2.5638427734375, 2.65625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 5.0, 9.0, 8.0, 8.0, 3.0, 8.0, 8.0, 16.0, 23.0, 30.0, 31.0, 40.0, 41.0, 51.0, 56.0, 80.0, 83.0, 81.0, 84.0, 63.0, 50.0, 39.0, 32.0, 39.0, 23.0, 21.0, 18.0, 12.0, 12.0, 6.0, 6.0, 5.0, 4.0, 6.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.52346420288086e-05, -8.207559585571289e-05, -7.891654968261719e-05, -7.575750350952148e-05, -7.259845733642578e-05, -6.943941116333008e-05, -6.628036499023438e-05, -6.312131881713867e-05, -5.996227264404297e-05, -5.6803226470947266e-05, -5.364418029785156e-05, -5.048513412475586e-05, -4.7326087951660156e-05, -4.416704177856445e-05, -4.100799560546875e-05, -3.784894943237305e-05, -3.4689903259277344e-05, -3.153085708618164e-05, -2.8371810913085938e-05, -2.5212764739990234e-05, -2.205371856689453e-05, -1.8894672393798828e-05, -1.5735626220703125e-05, -1.2576580047607422e-05, -9.417533874511719e-06, -6.258487701416016e-06, -3.0994415283203125e-06, 5.960464477539063e-08, 3.2186508178710938e-06, 6.377696990966797e-06, 9.5367431640625e-06, 1.2695789337158203e-05, 1.5854835510253906e-05, 1.901388168334961e-05, 2.2172927856445312e-05, 2.5331974029541016e-05, 2.849102020263672e-05, 3.165006637573242e-05, 3.4809112548828125e-05, 3.796815872192383e-05, 4.112720489501953e-05, 4.4286251068115234e-05, 4.744529724121094e-05, 5.060434341430664e-05, 5.3763389587402344e-05, 5.692243576049805e-05, 6.008148193359375e-05, 6.324052810668945e-05, 6.639957427978516e-05, 6.955862045288086e-05, 7.271766662597656e-05, 7.587671279907227e-05, 7.903575897216797e-05, 8.219480514526367e-05, 8.535385131835938e-05, 8.851289749145508e-05, 9.167194366455078e-05, 9.483098983764648e-05, 9.799003601074219e-05, 0.00010114908218383789, 0.0001043081283569336, 0.0001074671745300293, 0.000110626220703125, 0.0001137852668762207, 0.0001169443130493164]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 5.0, 7.0, 8.0, 16.0, 22.0, 34.0, 47.0, 83.0, 115.0, 219.0, 333.0, 651.0, 1537.0, 4024.0, 13972.0, 79150.0, 719401.0, 193273.0, 25095.0, 6339.0, 2169.0, 926.0, 473.0, 226.0, 159.0, 95.0, 59.0, 34.0, 19.0, 17.0, 13.0, 3.0, 6.0, 7.0, 6.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.40625, -2.3424072265625, -2.278564453125, -2.2147216796875, -2.15087890625, -2.0870361328125, -2.023193359375, -1.9593505859375, -1.8955078125, -1.8316650390625, -1.767822265625, -1.7039794921875, -1.64013671875, -1.5762939453125, -1.512451171875, -1.4486083984375, -1.384765625, -1.3209228515625, -1.257080078125, -1.1932373046875, -1.12939453125, -1.0655517578125, -1.001708984375, -0.9378662109375, -0.8740234375, -0.8101806640625, -0.746337890625, -0.6824951171875, -0.61865234375, -0.5548095703125, -0.490966796875, -0.4271240234375, -0.36328125, -0.2994384765625, -0.235595703125, -0.1717529296875, -0.10791015625, -0.0440673828125, 0.019775390625, 0.0836181640625, 0.1474609375, 0.2113037109375, 0.275146484375, 0.3389892578125, 0.40283203125, 0.4666748046875, 0.530517578125, 0.5943603515625, 0.658203125, 0.7220458984375, 0.785888671875, 0.8497314453125, 0.91357421875, 0.9774169921875, 1.041259765625, 1.1051025390625, 1.1689453125, 1.2327880859375, 1.296630859375, 1.3604736328125, 1.42431640625, 1.4881591796875, 1.552001953125, 1.6158447265625, 1.6796875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 7.0, 12.0, 15.0, 23.0, 31.0, 42.0, 59.0, 67.0, 79.0, 88.0, 110.0, 101.0, 89.0, 72.0, 51.0, 40.0, 26.0, 24.0, 23.0, 15.0, 9.0, 4.0, 5.0, 5.0, 4.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9443359375, -1.8684844970703125, -1.792633056640625, -1.7167816162109375, -1.64093017578125, -1.5650787353515625, -1.489227294921875, -1.4133758544921875, -1.3375244140625, -1.2616729736328125, -1.185821533203125, -1.1099700927734375, -1.03411865234375, -0.9582672119140625, -0.882415771484375, -0.8065643310546875, -0.730712890625, -0.6548614501953125, -0.579010009765625, -0.5031585693359375, -0.42730712890625, -0.3514556884765625, -0.275604248046875, -0.1997528076171875, -0.1239013671875, -0.0480499267578125, 0.027801513671875, 0.1036529541015625, 0.17950439453125, 0.2553558349609375, 0.331207275390625, 0.4070587158203125, 0.48291015625, 0.5587615966796875, 0.634613037109375, 0.7104644775390625, 0.78631591796875, 0.8621673583984375, 0.938018798828125, 1.0138702392578125, 1.0897216796875, 1.1655731201171875, 1.241424560546875, 1.3172760009765625, 1.39312744140625, 1.4689788818359375, 1.544830322265625, 1.6206817626953125, 1.696533203125, 1.7723846435546875, 1.848236083984375, 1.9240875244140625, 1.99993896484375, 2.0757904052734375, 2.151641845703125, 2.2274932861328125, 2.3033447265625, 2.3791961669921875, 2.455047607421875, 2.5308990478515625, 2.60675048828125, 2.6826019287109375, 2.758453369140625, 2.8343048095703125, 2.91015625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 5.0, 7.0, 17.0, 38.0, 117.0, 443.0, 247.0, 74.0, 25.0, 10.0, 9.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-33.22264099121094, -31.816661834716797, -30.410682678222656, -29.004703521728516, -27.598724365234375, -26.192745208740234, -24.78676414489746, -23.38078498840332, -21.97480583190918, -20.56882667541504, -19.1628475189209, -17.756866455078125, -16.350887298583984, -14.94490909576416, -13.538928985595703, -12.132949829101562, -10.726970672607422, -9.320991516113281, -7.915011882781982, -6.509032249450684, -5.103053092956543, -3.6970739364624023, -2.2910938262939453, -0.8851146697998047, 0.5208644866943359, 1.9268438816070557, 3.3328232765197754, 4.738802909851074, 6.144782066345215, 7.5507612228393555, 8.956741333007812, 10.362720489501953, 11.768699645996094, 13.174678802490234, 14.580657958984375, 15.986638069152832, 17.392616271972656, 18.798595428466797, 20.20457649230957, 21.61055564880371, 23.01653480529785, 24.422513961791992, 25.828493118286133, 27.234474182128906, 28.640453338623047, 30.046432495117188, 31.452411651611328, 32.85839080810547, 34.26436996459961, 35.67034912109375, 37.07632827758789, 38.48230743408203, 39.88828659057617, 41.29426574707031, 42.70024871826172, 44.106224060058594, 45.51220703125, 46.91818618774414, 48.32416534423828, 49.73014450073242, 51.13612365722656, 52.5421028137207, 53.948081970214844, 55.35406494140625, 56.760040283203125]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 4.0, 2.0, 3.0, 3.0, 6.0, 6.0, 4.0, 11.0, 7.0, 12.0, 14.0, 23.0, 48.0, 65.0, 96.0, 122.0, 120.0, 105.0, 97.0, 84.0, 43.0, 32.0, 25.0, 19.0, 9.0, 11.0, 10.0, 2.0, 2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-43.21520233154297, -41.7050895690918, -40.194976806640625, -38.68486404418945, -37.17475128173828, -35.664634704589844, -34.15452575683594, -32.6444091796875, -31.134296417236328, -29.624183654785156, -28.114070892333984, -26.603958129882812, -25.093843460083008, -23.583730697631836, -22.073617935180664, -20.56350326538086, -19.05339241027832, -17.54327964782715, -16.033166885375977, -14.523053169250488, -13.012939453125, -11.502826690673828, -9.992713928222656, -8.482600212097168, -6.972487449645996, -5.462374210357666, -3.952261209487915, -2.442148208618164, -0.932034969329834, 0.5780782699584961, 2.088191032409668, 3.5983047485351562, 5.108417510986328, 6.618530750274658, 8.128643989562988, 9.63875675201416, 11.148870468139648, 12.65898323059082, 14.169095993041992, 15.67920970916748, 17.18932342529297, 18.69943618774414, 20.209548950195312, 21.719661712646484, 23.22977638244629, 24.73988914489746, 26.250001907348633, 27.760116577148438, 29.270227432250977, 30.78034019470215, 32.29045486450195, 33.800567626953125, 35.3106803894043, 36.82079315185547, 38.33090591430664, 39.84101867675781, 41.351131439208984, 42.861244201660156, 44.37135696411133, 45.8814697265625, 47.39158248901367, 48.901695251464844, 50.41181182861328, 51.92192459106445, 53.432037353515625]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 4.0, 2.0, 5.0, 14.0, 13.0, 23.0, 32.0, 51.0, 74.0, 116.0, 149.0, 227.0, 414.0, 640.0, 969.0, 1656.0, 3096.0, 6093.0, 13926.0, 44575.0, 3462082.0, 605907.0, 33714.0, 10166.0, 4638.0, 2353.0, 1254.0, 755.0, 506.0, 274.0, 186.0, 116.0, 82.0, 53.0, 35.0, 35.0, 14.0, 10.0, 8.0, 5.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.8359375, -5.647216796875, -5.45849609375, -5.269775390625, -5.0810546875, -4.892333984375, -4.70361328125, -4.514892578125, -4.326171875, -4.137451171875, -3.94873046875, -3.760009765625, -3.5712890625, -3.382568359375, -3.19384765625, -3.005126953125, -2.81640625, -2.627685546875, -2.43896484375, -2.250244140625, -2.0615234375, -1.872802734375, -1.68408203125, -1.495361328125, -1.306640625, -1.117919921875, -0.92919921875, -0.740478515625, -0.5517578125, -0.363037109375, -0.17431640625, 0.014404296875, 0.203125, 0.391845703125, 0.58056640625, 0.769287109375, 0.9580078125, 1.146728515625, 1.33544921875, 1.524169921875, 1.712890625, 1.901611328125, 2.09033203125, 2.279052734375, 2.4677734375, 2.656494140625, 2.84521484375, 3.033935546875, 3.22265625, 3.411376953125, 3.60009765625, 3.788818359375, 3.9775390625, 4.166259765625, 4.35498046875, 4.543701171875, 4.732421875, 4.921142578125, 5.10986328125, 5.298583984375, 5.4873046875, 5.676025390625, 5.86474609375, 6.053466796875, 6.2421875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 4.0, 0.0, 5.0, 4.0, 8.0, 2.0, 6.0, 9.0, 8.0, 8.0, 11.0, 13.0, 13.0, 38.0, 110.0, 239.0, 268.0, 113.0, 38.0, 30.0, 11.0, 14.0, 8.0, 6.0, 4.0, 6.0, 1.0, 6.0, 2.0, 3.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50244140625, -0.4861907958984375, -0.469940185546875, -0.4536895751953125, -0.43743896484375, -0.4211883544921875, -0.404937744140625, -0.3886871337890625, -0.3724365234375, -0.3561859130859375, -0.339935302734375, -0.3236846923828125, -0.30743408203125, -0.2911834716796875, -0.274932861328125, -0.2586822509765625, -0.242431640625, -0.2261810302734375, -0.209930419921875, -0.1936798095703125, -0.17742919921875, -0.1611785888671875, -0.144927978515625, -0.1286773681640625, -0.1124267578125, -0.0961761474609375, -0.079925537109375, -0.0636749267578125, -0.04742431640625, -0.0311737060546875, -0.014923095703125, 0.0013275146484375, 0.017578125, 0.0338287353515625, 0.050079345703125, 0.0663299560546875, 0.08258056640625, 0.0988311767578125, 0.115081787109375, 0.1313323974609375, 0.1475830078125, 0.1638336181640625, 0.180084228515625, 0.1963348388671875, 0.21258544921875, 0.2288360595703125, 0.245086669921875, 0.2613372802734375, 0.277587890625, 0.2938385009765625, 0.310089111328125, 0.3263397216796875, 0.34259033203125, 0.3588409423828125, 0.375091552734375, 0.3913421630859375, 0.4075927734375, 0.4238433837890625, 0.440093994140625, 0.4563446044921875, 0.47259521484375, 0.4888458251953125, 0.505096435546875, 0.5213470458984375, 0.53759765625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 6.0, 7.0, 12.0, 11.0, 10.0, 29.0, 39.0, 67.0, 88.0, 121.0, 223.0, 359.0, 622.0, 1057.0, 2243.0, 5402.0, 15357.0, 65279.0, 2052538.0, 1960792.0, 63996.0, 15338.0, 5397.0, 2349.0, 1186.0, 630.0, 384.0, 215.0, 172.0, 106.0, 88.0, 41.0, 23.0, 25.0, 12.0, 10.0, 11.0, 8.0, 6.0, 7.0, 3.0, 3.0, 4.0, 2.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.513671875, -3.39654541015625, -3.2794189453125, -3.16229248046875, -3.045166015625, -2.92803955078125, -2.8109130859375, -2.69378662109375, -2.57666015625, -2.45953369140625, -2.3424072265625, -2.22528076171875, -2.108154296875, -1.99102783203125, -1.8739013671875, -1.75677490234375, -1.6396484375, -1.52252197265625, -1.4053955078125, -1.28826904296875, -1.171142578125, -1.05401611328125, -0.9368896484375, -0.81976318359375, -0.70263671875, -0.58551025390625, -0.4683837890625, -0.35125732421875, -0.234130859375, -0.11700439453125, 0.0001220703125, 0.11724853515625, 0.234375, 0.35150146484375, 0.4686279296875, 0.58575439453125, 0.702880859375, 0.82000732421875, 0.9371337890625, 1.05426025390625, 1.17138671875, 1.28851318359375, 1.4056396484375, 1.52276611328125, 1.639892578125, 1.75701904296875, 1.8741455078125, 1.99127197265625, 2.1083984375, 2.22552490234375, 2.3426513671875, 2.45977783203125, 2.576904296875, 2.69403076171875, 2.8111572265625, 2.92828369140625, 3.04541015625, 3.16253662109375, 3.2796630859375, 3.39678955078125, 3.513916015625, 3.63104248046875, 3.7481689453125, 3.86529541015625, 3.982421875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 6.0, 3.0, 3.0, 6.0, 8.0, 17.0, 15.0, 24.0, 25.0, 38.0, 59.0, 125.0, 224.0, 953.0, 1890.0, 324.0, 126.0, 81.0, 45.0, 19.0, 20.0, 17.0, 14.0, 7.0, 5.0, 8.0, 4.0, 4.0, 3.0, 6.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.74365234375, -0.7152328491210938, -0.6868133544921875, -0.6583938598632812, -0.629974365234375, -0.6015548706054688, -0.5731353759765625, -0.5447158813476562, -0.51629638671875, -0.48787689208984375, -0.4594573974609375, -0.43103790283203125, -0.402618408203125, -0.37419891357421875, -0.3457794189453125, -0.31735992431640625, -0.2889404296875, -0.26052093505859375, -0.2321014404296875, -0.20368194580078125, -0.175262451171875, -0.14684295654296875, -0.1184234619140625, -0.09000396728515625, -0.06158447265625, -0.03316497802734375, -0.0047454833984375, 0.02367401123046875, 0.052093505859375, 0.08051300048828125, 0.1089324951171875, 0.13735198974609375, 0.165771484375, 0.19419097900390625, 0.2226104736328125, 0.25102996826171875, 0.279449462890625, 0.30786895751953125, 0.3362884521484375, 0.36470794677734375, 0.39312744140625, 0.42154693603515625, 0.4499664306640625, 0.47838592529296875, 0.506805419921875, 0.5352249145507812, 0.5636444091796875, 0.5920639038085938, 0.6204833984375, 0.6489028930664062, 0.6773223876953125, 0.7057418823242188, 0.734161376953125, 0.7625808715820312, 0.7910003662109375, 0.8194198608398438, 0.84783935546875, 0.8762588500976562, 0.9046783447265625, 0.9330978393554688, 0.961517333984375, 0.9899368286132812, 1.0183563232421875, 1.0467758178710938, 1.0751953125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 21.0, 192.0, 677.0, 83.0, 18.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.153841972351074, -6.766066551208496, -6.37829065322876, -5.990515232086182, -5.602739334106445, -5.214963912963867, -4.827188491821289, -4.439413070678711, -4.051637172698975, -3.6638615131378174, -3.27608585357666, -2.888310432434082, -2.500534772872925, -2.1127591133117676, -1.7249836921691895, -1.3372080326080322, -0.949432373046875, -0.5616567730903625, -0.1738811731338501, 0.21389436721801758, 0.6016700267791748, 0.989445686340332, 1.3772211074829102, 1.7649967670440674, 2.1527724266052246, 2.540548086166382, 2.928323745727539, 3.316099166870117, 3.7038748264312744, 4.091650485992432, 4.47942590713501, 4.867201805114746, 5.254976272583008, 5.642751693725586, 6.030527591705322, 6.4183030128479, 6.806078910827637, 7.193854331970215, 7.581629753112793, 7.969405174255371, 8.357181549072266, 8.744956970214844, 9.132732391357422, 9.5205078125, 9.908284187316895, 10.296059608459473, 10.68383502960205, 11.071610450744629, 11.459385871887207, 11.847161293029785, 12.234936714172363, 12.622713088989258, 13.010488510131836, 13.398263931274414, 13.786039352416992, 14.17381477355957, 14.561590194702148, 14.949365615844727, 15.337141036987305, 15.724916458129883, 16.11269187927246, 16.500469207763672, 16.88824462890625, 17.276020050048828, 17.663795471191406]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 5.0, 6.0, 5.0, 13.0, 8.0, 16.0, 24.0, 29.0, 47.0, 57.0, 75.0, 106.0, 94.0, 98.0, 104.0, 67.0, 62.0, 41.0, 41.0, 27.0, 11.0, 11.0, 5.0, 8.0, 10.0, 2.0, 5.0, 3.0, 4.0, 1.0, 5.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.241288185119629, -4.114683151245117, -3.9880785942077637, -3.861473798751831, -3.7348690032958984, -3.6082639694213867, -3.481659173965454, -3.3550543785095215, -3.228449583053589, -3.1018447875976562, -2.9752399921417236, -2.848635196685791, -2.7220301628112793, -2.595425605773926, -2.468820571899414, -2.3422157764434814, -2.215610980987549, -2.089006185531616, -1.9624013900756836, -1.8357964754104614, -1.7091916799545288, -1.5825868844985962, -1.455981969833374, -1.3293771743774414, -1.2027723789215088, -1.0761675834655762, -0.9495627284049988, -0.8229578733444214, -0.6963530778884888, -0.5697482824325562, -0.44314342737197876, -0.31653857231140137, -0.18993377685546875, -0.06332895159721375, 0.06327587366104126, 0.18988069891929626, 0.31648552417755127, 0.4430903196334839, 0.5696951746940613, 0.6963000297546387, 0.8229048252105713, 0.9495096206665039, 1.0761144161224365, 1.2027193307876587, 1.3293241262435913, 1.455928921699524, 1.582533836364746, 1.7091386318206787, 1.8357434272766113, 1.962348222732544, 2.0889530181884766, 2.215557813644409, 2.342162609100342, 2.4687676429748535, 2.595372438430786, 2.7219772338867188, 2.8485820293426514, 2.975186824798584, 3.1017916202545166, 3.228396415710449, 3.355001449584961, 3.4816060066223145, 3.608211040496826, 3.734815835952759, 3.8614206314086914]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 10.0, 6.0, 19.0, 29.0, 33.0, 70.0, 87.0, 101.0, 185.0, 252.0, 354.0, 546.0, 948.0, 1546.0, 2656.0, 4506.0, 8996.0, 19621.0, 69580.0, 752967.0, 134894.0, 26592.0, 11111.0, 5476.0, 3088.0, 1823.0, 1120.0, 614.0, 426.0, 280.0, 189.0, 129.0, 95.0, 59.0, 50.0, 31.0, 18.0, 15.0, 11.0, 8.0, 3.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0], "bins": [-3.26171875, -3.17022705078125, -3.0787353515625, -2.98724365234375, -2.895751953125, -2.80426025390625, -2.7127685546875, -2.62127685546875, -2.52978515625, -2.43829345703125, -2.3468017578125, -2.25531005859375, -2.163818359375, -2.07232666015625, -1.9808349609375, -1.88934326171875, -1.7978515625, -1.70635986328125, -1.6148681640625, -1.52337646484375, -1.431884765625, -1.34039306640625, -1.2489013671875, -1.15740966796875, -1.06591796875, -0.97442626953125, -0.8829345703125, -0.79144287109375, -0.699951171875, -0.60845947265625, -0.5169677734375, -0.42547607421875, -0.333984375, -0.24249267578125, -0.1510009765625, -0.05950927734375, 0.031982421875, 0.12347412109375, 0.2149658203125, 0.30645751953125, 0.39794921875, 0.48944091796875, 0.5809326171875, 0.67242431640625, 0.763916015625, 0.85540771484375, 0.9468994140625, 1.03839111328125, 1.1298828125, 1.22137451171875, 1.3128662109375, 1.40435791015625, 1.495849609375, 1.58734130859375, 1.6788330078125, 1.77032470703125, 1.86181640625, 1.95330810546875, 2.0447998046875, 2.13629150390625, 2.227783203125, 2.31927490234375, 2.4107666015625, 2.50225830078125, 2.59375]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 10.0, 4.0, 2.0, 3.0, 3.0, 8.0, 8.0, 8.0, 10.0, 15.0, 15.0, 24.0, 39.0, 109.0, 161.0, 233.0, 144.0, 73.0, 37.0, 24.0, 18.0, 12.0, 5.0, 10.0, 6.0, 7.0, 3.0, 3.0, 1.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.5205078125, -0.5061302185058594, -0.49175262451171875, -0.4773750305175781, -0.4629974365234375, -0.4486198425292969, -0.43424224853515625, -0.4198646545410156, -0.405487060546875, -0.3911094665527344, -0.37673187255859375, -0.3623542785644531, -0.3479766845703125, -0.3335990905761719, -0.31922149658203125, -0.3048439025878906, -0.29046630859375, -0.2760887145996094, -0.26171112060546875, -0.24733352661132812, -0.2329559326171875, -0.21857833862304688, -0.20420074462890625, -0.18982315063476562, -0.175445556640625, -0.16106796264648438, -0.14669036865234375, -0.13231277465820312, -0.1179351806640625, -0.10355758666992188, -0.08917999267578125, -0.07480239868164062, -0.0604248046875, -0.046047210693359375, -0.03166961669921875, -0.017292022705078125, -0.0029144287109375, 0.011463165283203125, 0.02584075927734375, 0.040218353271484375, 0.054595947265625, 0.06897354125976562, 0.08335113525390625, 0.09772872924804688, 0.1121063232421875, 0.12648391723632812, 0.14086151123046875, 0.15523910522460938, 0.16961669921875, 0.18399429321289062, 0.19837188720703125, 0.21274948120117188, 0.2271270751953125, 0.24150466918945312, 0.25588226318359375, 0.2702598571777344, 0.284637451171875, 0.2990150451660156, 0.31339263916015625, 0.3277702331542969, 0.3421478271484375, 0.3565254211425781, 0.37090301513671875, 0.3852806091308594, 0.399658203125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 3.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 18.0, 65.0, 304.0, 2074.0, 33456.0, 897863.0, 109327.0, 4705.0, 528.0, 124.0, 35.0, 12.0, 11.0, 3.0, 1.0, 2.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.11328125, -4.9140625, -4.71484375, -4.515625, -4.31640625, -4.1171875, -3.91796875, -3.71875, -3.51953125, -3.3203125, -3.12109375, -2.921875, -2.72265625, -2.5234375, -2.32421875, -2.125, -1.92578125, -1.7265625, -1.52734375, -1.328125, -1.12890625, -0.9296875, -0.73046875, -0.53125, -0.33203125, -0.1328125, 0.06640625, 0.265625, 0.46484375, 0.6640625, 0.86328125, 1.0625, 1.26171875, 1.4609375, 1.66015625, 1.859375, 2.05859375, 2.2578125, 2.45703125, 2.65625, 2.85546875, 3.0546875, 3.25390625, 3.453125, 3.65234375, 3.8515625, 4.05078125, 4.25, 4.44921875, 4.6484375, 4.84765625, 5.046875, 5.24609375, 5.4453125, 5.64453125, 5.84375, 6.04296875, 6.2421875, 6.44140625, 6.640625, 6.83984375, 7.0390625, 7.23828125, 7.4375, 7.63671875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 7.0, 2.0, 3.0, 3.0, 2.0, 5.0, 7.0, 9.0, 10.0, 11.0, 10.0, 19.0, 20.0, 23.0, 20.0, 28.0, 25.0, 27.0, 35.0, 29.0, 36.0, 41.0, 40.0, 27.0, 37.0, 42.0, 40.0, 45.0, 40.0, 37.0, 37.0, 26.0, 39.0, 26.0, 34.0, 19.0, 22.0, 14.0, 17.0, 18.0, 15.0, 18.0, 10.0, 7.0, 5.0, 5.0, 6.0, 3.0, 6.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.32421875, -1.2821807861328125, -1.240142822265625, -1.1981048583984375, -1.15606689453125, -1.1140289306640625, -1.071990966796875, -1.0299530029296875, -0.9879150390625, -0.9458770751953125, -0.903839111328125, -0.8618011474609375, -0.81976318359375, -0.7777252197265625, -0.735687255859375, -0.6936492919921875, -0.651611328125, -0.6095733642578125, -0.567535400390625, -0.5254974365234375, -0.48345947265625, -0.4414215087890625, -0.399383544921875, -0.3573455810546875, -0.3153076171875, -0.2732696533203125, -0.231231689453125, -0.1891937255859375, -0.14715576171875, -0.1051177978515625, -0.063079833984375, -0.0210418701171875, 0.02099609375, 0.0630340576171875, 0.105072021484375, 0.1471099853515625, 0.18914794921875, 0.2311859130859375, 0.273223876953125, 0.3152618408203125, 0.3572998046875, 0.3993377685546875, 0.441375732421875, 0.4834136962890625, 0.52545166015625, 0.5674896240234375, 0.609527587890625, 0.6515655517578125, 0.693603515625, 0.7356414794921875, 0.777679443359375, 0.8197174072265625, 0.86175537109375, 0.9037933349609375, 0.945831298828125, 0.9878692626953125, 1.0299072265625, 1.0719451904296875, 1.113983154296875, 1.1560211181640625, 1.19805908203125, 1.2400970458984375, 1.282135009765625, 1.3241729736328125, 1.3662109375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 3.0, 1.0, 2.0, 5.0, 0.0, 2.0, 7.0, 4.0, 13.0, 16.0, 21.0, 34.0, 48.0, 93.0, 162.0, 389.0, 951.0, 3354.0, 21749.0, 815893.0, 193488.0, 9091.0, 1993.0, 663.0, 262.0, 122.0, 68.0, 36.0, 25.0, 11.0, 7.0, 10.0, 6.0, 5.0, 7.0, 7.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.21484375, -5.083831787109375, -4.95281982421875, -4.821807861328125, -4.6907958984375, -4.559783935546875, -4.42877197265625, -4.297760009765625, -4.166748046875, -4.035736083984375, -3.90472412109375, -3.773712158203125, -3.6427001953125, -3.511688232421875, -3.38067626953125, -3.249664306640625, -3.11865234375, -2.987640380859375, -2.85662841796875, -2.725616455078125, -2.5946044921875, -2.463592529296875, -2.33258056640625, -2.201568603515625, -2.070556640625, -1.939544677734375, -1.80853271484375, -1.677520751953125, -1.5465087890625, -1.415496826171875, -1.28448486328125, -1.153472900390625, -1.0224609375, -0.891448974609375, -0.76043701171875, -0.629425048828125, -0.4984130859375, -0.367401123046875, -0.23638916015625, -0.105377197265625, 0.025634765625, 0.156646728515625, 0.28765869140625, 0.418670654296875, 0.5496826171875, 0.680694580078125, 0.81170654296875, 0.942718505859375, 1.07373046875, 1.204742431640625, 1.33575439453125, 1.466766357421875, 1.5977783203125, 1.728790283203125, 1.85980224609375, 1.990814208984375, 2.121826171875, 2.252838134765625, 2.38385009765625, 2.514862060546875, 2.6458740234375, 2.776885986328125, 2.90789794921875, 3.038909912109375, 3.169921875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 0.0, 4.0, 8.0, 8.0, 14.0, 16.0, 24.0, 45.0, 52.0, 87.0, 110.0, 160.0, 117.0, 92.0, 78.0, 63.0, 49.0, 25.0, 20.0, 12.0, 5.0, 3.0, 5.0, 1.0, 7.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020968914031982422, -0.00020331144332885742, -0.00019693374633789062, -0.00019055604934692383, -0.00018417835235595703, -0.00017780065536499023, -0.00017142295837402344, -0.00016504526138305664, -0.00015866756439208984, -0.00015228986740112305, -0.00014591217041015625, -0.00013953447341918945, -0.00013315677642822266, -0.00012677907943725586, -0.00012040138244628906, -0.00011402368545532227, -0.00010764598846435547, -0.00010126829147338867, -9.489059448242188e-05, -8.851289749145508e-05, -8.213520050048828e-05, -7.575750350952148e-05, -6.937980651855469e-05, -6.300210952758789e-05, -5.6624412536621094e-05, -5.02467155456543e-05, -4.38690185546875e-05, -3.74913215637207e-05, -3.1113624572753906e-05, -2.473592758178711e-05, -1.8358230590820312e-05, -1.1980533599853516e-05, -5.602836608886719e-06, 7.748603820800781e-07, 7.152557373046875e-06, 1.3530254364013672e-05, 1.990795135498047e-05, 2.6285648345947266e-05, 3.266334533691406e-05, 3.904104232788086e-05, 4.5418739318847656e-05, 5.179643630981445e-05, 5.817413330078125e-05, 6.455183029174805e-05, 7.092952728271484e-05, 7.730722427368164e-05, 8.368492126464844e-05, 9.006261825561523e-05, 9.644031524658203e-05, 0.00010281801223754883, 0.00010919570922851562, 0.00011557340621948242, 0.00012195110321044922, 0.00012832880020141602, 0.0001347064971923828, 0.0001410841941833496, 0.0001474618911743164, 0.0001538395881652832, 0.00016021728515625, 0.0001665949821472168, 0.0001729726791381836, 0.0001793503761291504, 0.0001857280731201172, 0.00019210577011108398, 0.00019848346710205078]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 7.0, 12.0, 12.0, 16.0, 24.0, 39.0, 75.0, 125.0, 226.0, 460.0, 1045.0, 2910.0, 11668.0, 98934.0, 787308.0, 127976.0, 12785.0, 2934.0, 1097.0, 431.0, 216.0, 125.0, 54.0, 24.0, 21.0, 11.0, 12.0, 4.0, 2.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.53515625, -2.457275390625, -2.37939453125, -2.301513671875, -2.2236328125, -2.145751953125, -2.06787109375, -1.989990234375, -1.912109375, -1.834228515625, -1.75634765625, -1.678466796875, -1.6005859375, -1.522705078125, -1.44482421875, -1.366943359375, -1.2890625, -1.211181640625, -1.13330078125, -1.055419921875, -0.9775390625, -0.899658203125, -0.82177734375, -0.743896484375, -0.666015625, -0.588134765625, -0.51025390625, -0.432373046875, -0.3544921875, -0.276611328125, -0.19873046875, -0.120849609375, -0.04296875, 0.034912109375, 0.11279296875, 0.190673828125, 0.2685546875, 0.346435546875, 0.42431640625, 0.502197265625, 0.580078125, 0.657958984375, 0.73583984375, 0.813720703125, 0.8916015625, 0.969482421875, 1.04736328125, 1.125244140625, 1.203125, 1.281005859375, 1.35888671875, 1.436767578125, 1.5146484375, 1.592529296875, 1.67041015625, 1.748291015625, 1.826171875, 1.904052734375, 1.98193359375, 2.059814453125, 2.1376953125, 2.215576171875, 2.29345703125, 2.371337890625, 2.44921875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 5.0, 10.0, 6.0, 10.0, 14.0, 19.0, 34.0, 61.0, 90.0, 113.0, 137.0, 117.0, 123.0, 78.0, 78.0, 42.0, 27.0, 16.0, 10.0, 6.0, 4.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.380859375, -2.3187713623046875, -2.256683349609375, -2.1945953369140625, -2.13250732421875, -2.0704193115234375, -2.008331298828125, -1.9462432861328125, -1.8841552734375, -1.8220672607421875, -1.759979248046875, -1.6978912353515625, -1.63580322265625, -1.5737152099609375, -1.511627197265625, -1.4495391845703125, -1.387451171875, -1.3253631591796875, -1.263275146484375, -1.2011871337890625, -1.13909912109375, -1.0770111083984375, -1.014923095703125, -0.9528350830078125, -0.8907470703125, -0.8286590576171875, -0.766571044921875, -0.7044830322265625, -0.64239501953125, -0.5803070068359375, -0.518218994140625, -0.4561309814453125, -0.39404296875, -0.3319549560546875, -0.269866943359375, -0.2077789306640625, -0.14569091796875, -0.0836029052734375, -0.021514892578125, 0.0405731201171875, 0.1026611328125, 0.1647491455078125, 0.226837158203125, 0.2889251708984375, 0.35101318359375, 0.4131011962890625, 0.475189208984375, 0.5372772216796875, 0.599365234375, 0.6614532470703125, 0.723541259765625, 0.7856292724609375, 0.84771728515625, 0.9098052978515625, 0.971893310546875, 1.0339813232421875, 1.0960693359375, 1.1581573486328125, 1.220245361328125, 1.2823333740234375, 1.34442138671875, 1.4065093994140625, 1.468597412109375, 1.5306854248046875, 1.5927734375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 8.0, 12.0, 19.0, 46.0, 161.0, 394.0, 223.0, 82.0, 36.0, 14.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-29.46117401123047, -28.699419021606445, -27.93766212463379, -27.175907135009766, -26.414152145385742, -25.65239715576172, -24.890640258789062, -24.12888526916504, -23.367130279541016, -22.605375289916992, -21.843618392944336, -21.081863403320312, -20.32010841369629, -19.558353424072266, -18.79659652709961, -18.034841537475586, -17.27308464050293, -16.511329650878906, -15.749573707580566, -14.987817764282227, -14.226062774658203, -13.464306831359863, -12.702550888061523, -11.9407958984375, -11.17903995513916, -10.41728401184082, -9.655529022216797, -8.893773078918457, -8.132017135620117, -7.370262145996094, -6.608506202697754, -5.846750736236572, -5.084995269775391, -4.323239803314209, -3.5614840984344482, -2.7997283935546875, -2.037972927093506, -1.2762174606323242, -0.5144615173339844, 0.24729394912719727, 1.009049415588379, 1.77080500125885, 2.5325605869293213, 3.294316291809082, 4.056071758270264, 4.817827224731445, 5.579583168029785, 6.341338634490967, 7.103094100952148, 7.86484956741333, 8.626605033874512, 9.388360977172852, 10.150115966796875, 10.911871910095215, 11.673627853393555, 12.435382843017578, 13.197138786315918, 13.958894729614258, 14.720649719238281, 15.482405662536621, 16.24416160583496, 17.005916595458984, 17.76767349243164, 18.529428482055664, 19.291183471679688]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 5.0, 3.0, 4.0, 5.0, 4.0, 7.0, 5.0, 15.0, 18.0, 18.0, 33.0, 47.0, 51.0, 76.0, 97.0, 105.0, 105.0, 86.0, 86.0, 76.0, 45.0, 32.0, 17.0, 17.0, 14.0, 9.0, 6.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.15813446044922, -19.52935791015625, -18.900583267211914, -18.271808624267578, -17.64303207397461, -17.01425552368164, -16.385480880737305, -15.756705284118652, -15.1279296875, -14.499154090881348, -13.870378494262695, -13.241602897644043, -12.61282730102539, -11.984051704406738, -11.355276107788086, -10.726500511169434, -10.097724914550781, -9.468949317932129, -8.840173721313477, -8.211398124694824, -7.582622528076172, -6.9538469314575195, -6.325071334838867, -5.696295738220215, -5.0675201416015625, -4.43874454498291, -3.809968948364258, -3.1811933517456055, -2.552417755126953, -1.9236421585083008, -1.2948665618896484, -0.6660909652709961, -0.03731727600097656, 0.5914583206176758, 1.2202339172363281, 1.8490095138549805, 2.477785110473633, 3.106560707092285, 3.7353363037109375, 4.36411190032959, 4.992887496948242, 5.6216630935668945, 6.250438690185547, 6.879214286804199, 7.507989883422852, 8.136765480041504, 8.765541076660156, 9.394316673278809, 10.023092269897461, 10.651867866516113, 11.280643463134766, 11.909419059753418, 12.53819465637207, 13.166970252990723, 13.795745849609375, 14.424521446228027, 15.05329704284668, 15.682072639465332, 16.310848236083984, 16.939624786376953, 17.56839942932129, 18.197174072265625, 18.825950622558594, 19.454727172851562, 20.0835018157959]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 2.0, 5.0, 6.0, 5.0, 7.0, 16.0, 13.0, 13.0, 26.0, 26.0, 28.0, 52.0, 49.0, 74.0, 112.0, 144.0, 198.0, 334.0, 563.0, 952.0, 1866.0, 3933.0, 11357.0, 77121.0, 4014981.0, 64959.0, 10363.0, 3380.0, 1503.0, 811.0, 482.0, 283.0, 201.0, 132.0, 90.0, 62.0, 51.0, 32.0, 14.0, 11.0, 10.0, 4.0, 7.0, 2.0, 2.0, 2.0], "bins": [-11.7578125, -11.48095703125, -11.2041015625, -10.92724609375, -10.650390625, -10.37353515625, -10.0966796875, -9.81982421875, -9.54296875, -9.26611328125, -8.9892578125, -8.71240234375, -8.435546875, -8.15869140625, -7.8818359375, -7.60498046875, -7.328125, -7.05126953125, -6.7744140625, -6.49755859375, -6.220703125, -5.94384765625, -5.6669921875, -5.39013671875, -5.11328125, -4.83642578125, -4.5595703125, -4.28271484375, -4.005859375, -3.72900390625, -3.4521484375, -3.17529296875, -2.8984375, -2.62158203125, -2.3447265625, -2.06787109375, -1.791015625, -1.51416015625, -1.2373046875, -0.96044921875, -0.68359375, -0.40673828125, -0.1298828125, 0.14697265625, 0.423828125, 0.70068359375, 0.9775390625, 1.25439453125, 1.53125, 1.80810546875, 2.0849609375, 2.36181640625, 2.638671875, 2.91552734375, 3.1923828125, 3.46923828125, 3.74609375, 4.02294921875, 4.2998046875, 4.57666015625, 4.853515625, 5.13037109375, 5.4072265625, 5.68408203125, 5.9609375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 7.0, 9.0, 11.0, 19.0, 13.0, 28.0, 30.0, 58.0, 120.0, 158.0, 171.0, 138.0, 80.0, 54.0, 31.0, 10.0, 17.0, 7.0, 7.0, 5.0, 4.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0], "bins": [-0.58837890625, -0.5743942260742188, -0.5604095458984375, -0.5464248657226562, -0.532440185546875, -0.5184555053710938, -0.5044708251953125, -0.49048614501953125, -0.47650146484375, -0.46251678466796875, -0.4485321044921875, -0.43454742431640625, -0.420562744140625, -0.40657806396484375, -0.3925933837890625, -0.37860870361328125, -0.3646240234375, -0.35063934326171875, -0.3366546630859375, -0.32266998291015625, -0.308685302734375, -0.29470062255859375, -0.2807159423828125, -0.26673126220703125, -0.25274658203125, -0.23876190185546875, -0.2247772216796875, -0.21079254150390625, -0.196807861328125, -0.18282318115234375, -0.1688385009765625, -0.15485382080078125, -0.140869140625, -0.12688446044921875, -0.1128997802734375, -0.09891510009765625, -0.084930419921875, -0.07094573974609375, -0.0569610595703125, -0.04297637939453125, -0.02899169921875, -0.01500701904296875, -0.0010223388671875, 0.01296234130859375, 0.026947021484375, 0.04093170166015625, 0.0549163818359375, 0.06890106201171875, 0.0828857421875, 0.09687042236328125, 0.1108551025390625, 0.12483978271484375, 0.138824462890625, 0.15280914306640625, 0.1667938232421875, 0.18077850341796875, 0.19476318359375, 0.20874786376953125, 0.2227325439453125, 0.23671722412109375, 0.250701904296875, 0.26468658447265625, 0.2786712646484375, 0.29265594482421875, 0.306640625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 0.0, 8.0, 7.0, 8.0, 12.0, 12.0, 19.0, 23.0, 49.0, 88.0, 270.0, 1897.0, 289073.0, 3899070.0, 3198.0, 326.0, 79.0, 43.0, 22.0, 20.0, 10.0, 19.0, 6.0, 10.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3984375, -11.8372802734375, -11.276123046875, -10.7149658203125, -10.15380859375, -9.5926513671875, -9.031494140625, -8.4703369140625, -7.9091796875, -7.3480224609375, -6.786865234375, -6.2257080078125, -5.66455078125, -5.1033935546875, -4.542236328125, -3.9810791015625, -3.419921875, -2.8587646484375, -2.297607421875, -1.7364501953125, -1.17529296875, -0.6141357421875, -0.052978515625, 0.5081787109375, 1.0693359375, 1.6304931640625, 2.191650390625, 2.7528076171875, 3.31396484375, 3.8751220703125, 4.436279296875, 4.9974365234375, 5.55859375, 6.1197509765625, 6.680908203125, 7.2420654296875, 7.80322265625, 8.3643798828125, 8.925537109375, 9.4866943359375, 10.0478515625, 10.6090087890625, 11.170166015625, 11.7313232421875, 12.29248046875, 12.8536376953125, 13.414794921875, 13.9759521484375, 14.537109375, 15.0982666015625, 15.659423828125, 16.2205810546875, 16.78173828125, 17.3428955078125, 17.904052734375, 18.4652099609375, 19.0263671875, 19.5875244140625, 20.148681640625, 20.7098388671875, 21.27099609375, 21.8321533203125, 22.393310546875, 22.9544677734375, 23.515625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 6.0, 2.0, 6.0, 6.0, 9.0, 12.0, 12.0, 21.0, 21.0, 37.0, 39.0, 83.0, 159.0, 404.0, 1728.0, 842.0, 311.0, 144.0, 67.0, 48.0, 23.0, 27.0, 17.0, 11.0, 16.0, 4.0, 8.0, 2.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 4.0], "bins": [-0.95703125, -0.9341201782226562, -0.9112091064453125, -0.8882980346679688, -0.865386962890625, -0.8424758911132812, -0.8195648193359375, -0.7966537475585938, -0.77374267578125, -0.7508316040039062, -0.7279205322265625, -0.7050094604492188, -0.682098388671875, -0.6591873168945312, -0.6362762451171875, -0.6133651733398438, -0.5904541015625, -0.5675430297851562, -0.5446319580078125, -0.5217208862304688, -0.498809814453125, -0.47589874267578125, -0.4529876708984375, -0.43007659912109375, -0.40716552734375, -0.38425445556640625, -0.3613433837890625, -0.33843231201171875, -0.315521240234375, -0.29261016845703125, -0.2696990966796875, -0.24678802490234375, -0.223876953125, -0.20096588134765625, -0.1780548095703125, -0.15514373779296875, -0.132232666015625, -0.10932159423828125, -0.0864105224609375, -0.06349945068359375, -0.04058837890625, -0.01767730712890625, 0.0052337646484375, 0.02814483642578125, 0.051055908203125, 0.07396697998046875, 0.0968780517578125, 0.11978912353515625, 0.1427001953125, 0.16561126708984375, 0.1885223388671875, 0.21143341064453125, 0.234344482421875, 0.25725555419921875, 0.2801666259765625, 0.30307769775390625, 0.32598876953125, 0.34889984130859375, 0.3718109130859375, 0.39472198486328125, 0.417633056640625, 0.44054412841796875, 0.4634552001953125, 0.48636627197265625, 0.50927734375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 5.0, 8.0, 19.0, 43.0, 104.0, 239.0, 294.0, 172.0, 62.0, 28.0, 12.0, 7.0, 5.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.606807231903076, -5.447340488433838, -5.287873268127441, -5.128406524658203, -4.968939781188965, -4.809473037719727, -4.65000581741333, -4.490539073944092, -4.331071853637695, -4.171605110168457, -4.0121378898620605, -3.8526711463928223, -3.693204402923584, -3.5337374210357666, -3.374270439147949, -3.214803695678711, -3.0553369522094727, -2.8958699703216553, -2.736403226852417, -2.5769362449645996, -2.4174695014953613, -2.258002519607544, -2.0985355377197266, -1.9390686750411987, -1.779601812362671, -1.620134949684143, -1.4606680870056152, -1.3012011051177979, -1.14173424243927, -0.9822673797607422, -0.8228004574775696, -0.663333535194397, -0.5038671493530273, -0.3444002568721771, -0.1849333643913269, -0.025466471910476685, 0.13400042057037354, 0.29346728324890137, 0.452934205532074, 0.6124011278152466, 0.7718679904937744, 0.9313348531723022, 1.09080171585083, 1.2502686977386475, 1.4097355604171753, 1.5692024230957031, 1.7286694049835205, 1.8881362676620483, 2.047603130340576, 2.2070701122283936, 2.366536855697632, 2.526003837585449, 2.6854705810546875, 2.844937562942505, 3.0044045448303223, 3.1638712882995605, 3.323338270187378, 3.4828052520751953, 3.6422719955444336, 3.801738977432251, 3.9612059593200684, 4.120672702789307, 4.280139446258545, 4.439606666564941, 4.59907341003418]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 4.0, 1.0, 7.0, 3.0, 3.0, 9.0, 6.0, 7.0, 19.0, 40.0, 60.0, 59.0, 88.0, 99.0, 130.0, 129.0, 83.0, 80.0, 52.0, 43.0, 27.0, 19.0, 13.0, 9.0, 7.0, 5.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4642257690429688, -2.3253109455108643, -2.1863961219787598, -2.0474812984466553, -1.9085664749145508, -1.7696516513824463, -1.6307368278503418, -1.4918220043182373, -1.3529071807861328, -1.2139923572540283, -1.0750775337219238, -0.9361627101898193, -0.7972478866577148, -0.6583330631256104, -0.5194182395935059, -0.38050341606140137, -0.24158859252929688, -0.10267376899719238, 0.03624105453491211, 0.1751558780670166, 0.3140707015991211, 0.4529855251312256, 0.5919003486633301, 0.7308151721954346, 0.8697299957275391, 1.0086448192596436, 1.147559642791748, 1.2864744663238525, 1.425389289855957, 1.5643041133880615, 1.703218936920166, 1.8421337604522705, 1.9810481071472168, 2.1199629306793213, 2.258877754211426, 2.3977925777435303, 2.5367074012756348, 2.6756222248077393, 2.8145370483398438, 2.9534518718719482, 3.0923666954040527, 3.2312815189361572, 3.3701963424682617, 3.509111166000366, 3.6480259895324707, 3.786940813064575, 3.9258556365966797, 4.064770698547363, 4.203685283660889, 4.342599868774414, 4.481514930725098, 4.620429992675781, 4.759344577789307, 4.898259162902832, 5.037174224853516, 5.176089286804199, 5.315003871917725, 5.45391845703125, 5.592833518981934, 5.731748580932617, 5.870663166046143, 6.009577751159668, 6.148492813110352, 6.287407875061035, 6.4263224601745605]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 6.0, 4.0, 1.0, 5.0, 9.0, 5.0, 17.0, 22.0, 26.0, 51.0, 93.0, 132.0, 227.0, 454.0, 814.0, 1745.0, 4550.0, 18620.0, 232932.0, 734437.0, 41866.0, 7556.0, 2612.0, 1093.0, 520.0, 312.0, 148.0, 107.0, 77.0, 32.0, 30.0, 21.0, 10.0, 14.0, 4.0, 2.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3515625, -3.23272705078125, -3.1138916015625, -2.99505615234375, -2.876220703125, -2.75738525390625, -2.6385498046875, -2.51971435546875, -2.40087890625, -2.28204345703125, -2.1632080078125, -2.04437255859375, -1.925537109375, -1.80670166015625, -1.6878662109375, -1.56903076171875, -1.4501953125, -1.33135986328125, -1.2125244140625, -1.09368896484375, -0.974853515625, -0.85601806640625, -0.7371826171875, -0.61834716796875, -0.49951171875, -0.38067626953125, -0.2618408203125, -0.14300537109375, -0.024169921875, 0.09466552734375, 0.2135009765625, 0.33233642578125, 0.451171875, 0.57000732421875, 0.6888427734375, 0.80767822265625, 0.926513671875, 1.04534912109375, 1.1641845703125, 1.28302001953125, 1.40185546875, 1.52069091796875, 1.6395263671875, 1.75836181640625, 1.877197265625, 1.99603271484375, 2.1148681640625, 2.23370361328125, 2.3525390625, 2.47137451171875, 2.5902099609375, 2.70904541015625, 2.827880859375, 2.94671630859375, 3.0655517578125, 3.18438720703125, 3.30322265625, 3.42205810546875, 3.5408935546875, 3.65972900390625, 3.778564453125, 3.89739990234375, 4.0162353515625, 4.13507080078125, 4.25390625]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 3.0, 7.0, 8.0, 9.0, 16.0, 21.0, 43.0, 77.0, 124.0, 167.0, 177.0, 134.0, 81.0, 45.0, 39.0, 19.0, 9.0, 4.0, 5.0, 3.0, 3.0, 2.0, 3.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.493408203125, -0.4811134338378906, -0.46881866455078125, -0.4565238952636719, -0.4442291259765625, -0.4319343566894531, -0.41963958740234375, -0.4073448181152344, -0.395050048828125, -0.3827552795410156, -0.37046051025390625, -0.3581657409667969, -0.3458709716796875, -0.3335762023925781, -0.32128143310546875, -0.3089866638183594, -0.29669189453125, -0.2843971252441406, -0.27210235595703125, -0.2598075866699219, -0.2475128173828125, -0.23521804809570312, -0.22292327880859375, -0.21062850952148438, -0.198333740234375, -0.18603897094726562, -0.17374420166015625, -0.16144943237304688, -0.1491546630859375, -0.13685989379882812, -0.12456512451171875, -0.11227035522460938, -0.0999755859375, -0.08768081665039062, -0.07538604736328125, -0.06309127807617188, -0.0507965087890625, -0.038501739501953125, -0.02620697021484375, -0.013912200927734375, -0.001617431640625, 0.010677337646484375, 0.02297210693359375, 0.035266876220703125, 0.0475616455078125, 0.059856414794921875, 0.07215118408203125, 0.08444595336914062, 0.09674072265625, 0.10903549194335938, 0.12133026123046875, 0.13362503051757812, 0.1459197998046875, 0.15821456909179688, 0.17050933837890625, 0.18280410766601562, 0.195098876953125, 0.20739364624023438, 0.21968841552734375, 0.23198318481445312, 0.2442779541015625, 0.2565727233886719, 0.26886749267578125, 0.2811622619628906, 0.29345703125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 0.0, 8.0, 6.0, 8.0, 16.0, 13.0, 11.0, 25.0, 28.0, 39.0, 48.0, 67.0, 89.0, 145.0, 174.0, 291.0, 408.0, 603.0, 1049.0, 1817.0, 3080.0, 5678.0, 10867.0, 22659.0, 50517.0, 125428.0, 309762.0, 299386.0, 121223.0, 48788.0, 22175.0, 10604.0, 5738.0, 3053.0, 1726.0, 1043.0, 628.0, 388.0, 258.0, 205.0, 124.0, 80.0, 84.0, 67.0, 45.0, 29.0, 17.0, 22.0, 10.0, 5.0, 8.0, 6.0, 7.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0], "bins": [-1.015625, -0.9828338623046875, -0.950042724609375, -0.9172515869140625, -0.88446044921875, -0.8516693115234375, -0.818878173828125, -0.7860870361328125, -0.7532958984375, -0.7205047607421875, -0.687713623046875, -0.6549224853515625, -0.62213134765625, -0.5893402099609375, -0.556549072265625, -0.5237579345703125, -0.490966796875, -0.4581756591796875, -0.425384521484375, -0.3925933837890625, -0.35980224609375, -0.3270111083984375, -0.294219970703125, -0.2614288330078125, -0.2286376953125, -0.1958465576171875, -0.163055419921875, -0.1302642822265625, -0.09747314453125, -0.0646820068359375, -0.031890869140625, 0.0009002685546875, 0.03369140625, 0.0664825439453125, 0.099273681640625, 0.1320648193359375, 0.16485595703125, 0.1976470947265625, 0.230438232421875, 0.2632293701171875, 0.2960205078125, 0.3288116455078125, 0.361602783203125, 0.3943939208984375, 0.42718505859375, 0.4599761962890625, 0.492767333984375, 0.5255584716796875, 0.558349609375, 0.5911407470703125, 0.623931884765625, 0.6567230224609375, 0.68951416015625, 0.7223052978515625, 0.755096435546875, 0.7878875732421875, 0.8206787109375, 0.8534698486328125, 0.886260986328125, 0.9190521240234375, 0.95184326171875, 0.9846343994140625, 1.017425537109375, 1.0502166748046875, 1.0830078125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 3.0, 5.0, 9.0, 5.0, 6.0, 11.0, 8.0, 13.0, 11.0, 9.0, 18.0, 22.0, 23.0, 26.0, 30.0, 24.0, 29.0, 28.0, 34.0, 47.0, 40.0, 50.0, 46.0, 46.0, 35.0, 46.0, 36.0, 39.0, 41.0, 31.0, 35.0, 23.0, 20.0, 30.0, 25.0, 16.0, 9.0, 11.0, 18.0, 7.0, 7.0, 6.0, 6.0, 11.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.947265625, -0.9164886474609375, -0.885711669921875, -0.8549346923828125, -0.82415771484375, -0.7933807373046875, -0.762603759765625, -0.7318267822265625, -0.7010498046875, -0.6702728271484375, -0.639495849609375, -0.6087188720703125, -0.57794189453125, -0.5471649169921875, -0.516387939453125, -0.4856109619140625, -0.454833984375, -0.4240570068359375, -0.393280029296875, -0.3625030517578125, -0.33172607421875, -0.3009490966796875, -0.270172119140625, -0.2393951416015625, -0.2086181640625, -0.1778411865234375, -0.147064208984375, -0.1162872314453125, -0.08551025390625, -0.0547332763671875, -0.023956298828125, 0.0068206787109375, 0.03759765625, 0.0683746337890625, 0.099151611328125, 0.1299285888671875, 0.16070556640625, 0.1914825439453125, 0.222259521484375, 0.2530364990234375, 0.2838134765625, 0.3145904541015625, 0.345367431640625, 0.3761444091796875, 0.40692138671875, 0.4376983642578125, 0.468475341796875, 0.4992523193359375, 0.530029296875, 0.5608062744140625, 0.591583251953125, 0.6223602294921875, 0.65313720703125, 0.6839141845703125, 0.714691162109375, 0.7454681396484375, 0.7762451171875, 0.8070220947265625, 0.837799072265625, 0.8685760498046875, 0.89935302734375, 0.9301300048828125, 0.960906982421875, 0.9916839599609375, 1.0224609375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 2.0, 6.0, 4.0, 9.0, 10.0, 23.0, 21.0, 25.0, 62.0, 138.0, 231.0, 562.0, 1595.0, 6556.0, 65489.0, 691168.0, 261055.0, 17164.0, 2826.0, 844.0, 368.0, 160.0, 103.0, 42.0, 33.0, 27.0, 10.0, 10.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4814453125, -1.4260406494140625, -1.370635986328125, -1.3152313232421875, -1.25982666015625, -1.2044219970703125, -1.149017333984375, -1.0936126708984375, -1.0382080078125, -0.9828033447265625, -0.927398681640625, -0.8719940185546875, -0.81658935546875, -0.7611846923828125, -0.705780029296875, -0.6503753662109375, -0.594970703125, -0.5395660400390625, -0.484161376953125, -0.4287567138671875, -0.37335205078125, -0.3179473876953125, -0.262542724609375, -0.2071380615234375, -0.1517333984375, -0.0963287353515625, -0.040924072265625, 0.0144805908203125, 0.06988525390625, 0.1252899169921875, 0.180694580078125, 0.2360992431640625, 0.29150390625, 0.3469085693359375, 0.402313232421875, 0.4577178955078125, 0.51312255859375, 0.5685272216796875, 0.623931884765625, 0.6793365478515625, 0.7347412109375, 0.7901458740234375, 0.845550537109375, 0.9009552001953125, 0.95635986328125, 1.0117645263671875, 1.067169189453125, 1.1225738525390625, 1.177978515625, 1.2333831787109375, 1.288787841796875, 1.3441925048828125, 1.39959716796875, 1.4550018310546875, 1.510406494140625, 1.5658111572265625, 1.6212158203125, 1.6766204833984375, 1.732025146484375, 1.7874298095703125, 1.84283447265625, 1.8982391357421875, 1.953643798828125, 2.0090484619140625, 2.064453125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 6.0, 4.0, 7.0, 6.0, 18.0, 17.0, 27.0, 22.0, 31.0, 42.0, 52.0, 70.0, 68.0, 66.0, 84.0, 74.0, 86.0, 61.0, 65.0, 47.0, 32.0, 25.0, 28.0, 12.0, 7.0, 10.0, 11.0, 8.0, 3.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012993812561035156, -0.00012583285570144653, -0.0001217275857925415, -0.00011762231588363647, -0.00011351704597473145, -0.00010941177606582642, -0.00010530650615692139, -0.00010120123624801636, -9.709596633911133e-05, -9.29906964302063e-05, -8.888542652130127e-05, -8.478015661239624e-05, -8.067488670349121e-05, -7.656961679458618e-05, -7.246434688568115e-05, -6.835907697677612e-05, -6.42538070678711e-05, -6.0148537158966064e-05, -5.6043267250061035e-05, -5.1937997341156006e-05, -4.7832727432250977e-05, -4.372745752334595e-05, -3.962218761444092e-05, -3.551691770553589e-05, -3.141164779663086e-05, -2.730637788772583e-05, -2.32011079788208e-05, -1.909583806991577e-05, -1.4990568161010742e-05, -1.0885298252105713e-05, -6.780028343200684e-06, -2.6747584342956543e-06, 1.430511474609375e-06, 5.535781383514404e-06, 9.641051292419434e-06, 1.3746321201324463e-05, 1.7851591110229492e-05, 2.195686101913452e-05, 2.606213092803955e-05, 3.016740083694458e-05, 3.427267074584961e-05, 3.837794065475464e-05, 4.248321056365967e-05, 4.65884804725647e-05, 5.0693750381469727e-05, 5.4799020290374756e-05, 5.8904290199279785e-05, 6.300956010818481e-05, 6.711483001708984e-05, 7.122009992599487e-05, 7.53253698348999e-05, 7.943063974380493e-05, 8.353590965270996e-05, 8.764117956161499e-05, 9.174644947052002e-05, 9.585171937942505e-05, 9.995698928833008e-05, 0.00010406225919723511, 0.00010816752910614014, 0.00011227279901504517, 0.0001163780689239502, 0.00012048333883285522, 0.00012458860874176025, 0.00012869387865066528, 0.0001327991485595703]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 6.0, 3.0, 4.0, 4.0, 8.0, 13.0, 12.0, 19.0, 23.0, 36.0, 55.0, 86.0, 125.0, 220.0, 366.0, 707.0, 1742.0, 4896.0, 19900.0, 118131.0, 543254.0, 298186.0, 45907.0, 9506.0, 2870.0, 1136.0, 495.0, 312.0, 159.0, 116.0, 65.0, 38.0, 39.0, 41.0, 14.0, 14.0, 23.0, 8.0, 5.0, 4.0, 6.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.3095703125, -1.2729339599609375, -1.236297607421875, -1.1996612548828125, -1.16302490234375, -1.1263885498046875, -1.089752197265625, -1.0531158447265625, -1.0164794921875, -0.9798431396484375, -0.943206787109375, -0.9065704345703125, -0.86993408203125, -0.8332977294921875, -0.796661376953125, -0.7600250244140625, -0.723388671875, -0.6867523193359375, -0.650115966796875, -0.6134796142578125, -0.57684326171875, -0.5402069091796875, -0.503570556640625, -0.4669342041015625, -0.4302978515625, -0.3936614990234375, -0.357025146484375, -0.3203887939453125, -0.28375244140625, -0.2471160888671875, -0.210479736328125, -0.1738433837890625, -0.13720703125, -0.1005706787109375, -0.063934326171875, -0.0272979736328125, 0.00933837890625, 0.0459747314453125, 0.082611083984375, 0.1192474365234375, 0.1558837890625, 0.1925201416015625, 0.229156494140625, 0.2657928466796875, 0.30242919921875, 0.3390655517578125, 0.375701904296875, 0.4123382568359375, 0.448974609375, 0.4856109619140625, 0.522247314453125, 0.5588836669921875, 0.59552001953125, 0.6321563720703125, 0.668792724609375, 0.7054290771484375, 0.7420654296875, 0.7787017822265625, 0.815338134765625, 0.8519744873046875, 0.88861083984375, 0.9252471923828125, 0.961883544921875, 0.9985198974609375, 1.03515625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 5.0, 10.0, 6.0, 15.0, 22.0, 31.0, 41.0, 61.0, 86.0, 100.0, 117.0, 134.0, 96.0, 88.0, 70.0, 35.0, 32.0, 17.0, 14.0, 9.0, 7.0, 3.0, 4.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5458984375, -0.519683837890625, -0.49346923828125, -0.467254638671875, -0.4410400390625, -0.414825439453125, -0.38861083984375, -0.362396240234375, -0.336181640625, -0.309967041015625, -0.28375244140625, -0.257537841796875, -0.2313232421875, -0.205108642578125, -0.17889404296875, -0.152679443359375, -0.12646484375, -0.100250244140625, -0.07403564453125, -0.047821044921875, -0.0216064453125, 0.004608154296875, 0.03082275390625, 0.057037353515625, 0.083251953125, 0.109466552734375, 0.13568115234375, 0.161895751953125, 0.1881103515625, 0.214324951171875, 0.24053955078125, 0.266754150390625, 0.29296875, 0.319183349609375, 0.34539794921875, 0.371612548828125, 0.3978271484375, 0.424041748046875, 0.45025634765625, 0.476470947265625, 0.502685546875, 0.528900146484375, 0.55511474609375, 0.581329345703125, 0.6075439453125, 0.633758544921875, 0.65997314453125, 0.686187744140625, 0.71240234375, 0.738616943359375, 0.76483154296875, 0.791046142578125, 0.8172607421875, 0.843475341796875, 0.86968994140625, 0.895904541015625, 0.922119140625, 0.948333740234375, 0.97454833984375, 1.000762939453125, 1.0269775390625, 1.053192138671875, 1.07940673828125, 1.105621337890625, 1.1318359375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 8.0, 13.0, 27.0, 75.0, 190.0, 323.0, 233.0, 86.0, 28.0, 12.0, 9.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.391127586364746, -13.728572845458984, -13.066018104553223, -12.403463363647461, -11.7409086227417, -11.078353881835938, -10.415800094604492, -9.753244400024414, -9.090690612792969, -8.428135871887207, -7.765581130981445, -7.103026390075684, -6.440471649169922, -5.77791690826416, -5.115362644195557, -4.452807903289795, -3.790252685546875, -3.1276979446411133, -2.4651432037353516, -1.802588701248169, -1.1400339603424072, -0.4774792194366455, 0.1850752830505371, 0.8476300239562988, 1.5101847648620605, 2.1727395057678223, 2.835294246673584, 3.4978487491607666, 4.160403251647949, 4.822957992553711, 5.485512733459473, 6.148067474365234, 6.81062126159668, 7.473176002502441, 8.135730743408203, 8.798285484313965, 9.460840225219727, 10.123394966125488, 10.78594970703125, 11.448503494262695, 12.111059188842773, 12.773613929748535, 13.436168670654297, 14.098723411560059, 14.76127815246582, 15.423832893371582, 16.086387634277344, 16.74894142150879, 17.411495208740234, 18.07404899597168, 18.736604690551758, 19.399158477783203, 20.06171417236328, 20.724267959594727, 21.386823654174805, 22.04937744140625, 22.711933135986328, 23.374486923217773, 24.03704261779785, 24.699596405029297, 25.362152099609375, 26.02470588684082, 26.6872615814209, 27.349815368652344, 28.012371063232422]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 6.0, 3.0, 7.0, 9.0, 6.0, 15.0, 14.0, 23.0, 25.0, 27.0, 41.0, 50.0, 49.0, 53.0, 69.0, 62.0, 69.0, 63.0, 53.0, 52.0, 59.0, 40.0, 41.0, 40.0, 24.0, 32.0, 23.0, 15.0, 10.0, 10.0, 9.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.59659194946289, -10.22994613647461, -9.863299369812012, -9.496652603149414, -9.130006790161133, -8.763360977172852, -8.396714210510254, -8.030067443847656, -7.663421630859375, -7.2967753410339355, -6.930129051208496, -6.563482761383057, -6.196836471557617, -5.830190181732178, -5.463543891906738, -5.096897602081299, -4.730251312255859, -4.36360502243042, -3.9969587326049805, -3.630312442779541, -3.2636661529541016, -2.897019863128662, -2.5303735733032227, -2.163727283477783, -1.7970809936523438, -1.4304347038269043, -1.0637884140014648, -0.6971421241760254, -0.33049583435058594, 0.036150455474853516, 0.40279674530029297, 0.7694430351257324, 1.1360893249511719, 1.5027356147766113, 1.8693819046020508, 2.2360281944274902, 2.6026744842529297, 2.969320774078369, 3.3359670639038086, 3.702613353729248, 4.0692596435546875, 4.435905933380127, 4.802552223205566, 5.169198513031006, 5.535844802856445, 5.902491092681885, 6.269137382507324, 6.635783672332764, 7.002429962158203, 7.369076251983643, 7.735722541809082, 8.10236930847168, 8.469015121459961, 8.835660934448242, 9.20230770111084, 9.568954467773438, 9.935600280761719, 10.30224609375, 10.668892860412598, 11.035539627075195, 11.402185440063477, 11.768831253051758, 12.135478019714355, 12.502124786376953, 12.868770599365234]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 4.0, 6.0, 9.0, 19.0, 33.0, 75.0, 181.0, 506.0, 3009.0, 3817357.0, 370493.0, 1997.0, 352.0, 117.0, 70.0, 25.0, 11.0, 6.0, 5.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.3125, -25.600341796875, -24.88818359375, -24.176025390625, -23.4638671875, -22.751708984375, -22.03955078125, -21.327392578125, -20.615234375, -19.903076171875, -19.19091796875, -18.478759765625, -17.7666015625, -17.054443359375, -16.34228515625, -15.630126953125, -14.91796875, -14.205810546875, -13.49365234375, -12.781494140625, -12.0693359375, -11.357177734375, -10.64501953125, -9.932861328125, -9.220703125, -8.508544921875, -7.79638671875, -7.084228515625, -6.3720703125, -5.659912109375, -4.94775390625, -4.235595703125, -3.5234375, -2.811279296875, -2.09912109375, -1.386962890625, -0.6748046875, 0.037353515625, 0.74951171875, 1.461669921875, 2.173828125, 2.885986328125, 3.59814453125, 4.310302734375, 5.0224609375, 5.734619140625, 6.44677734375, 7.158935546875, 7.87109375, 8.583251953125, 9.29541015625, 10.007568359375, 10.7197265625, 11.431884765625, 12.14404296875, 12.856201171875, 13.568359375, 14.280517578125, 14.99267578125, 15.704833984375, 16.4169921875, 17.129150390625, 17.84130859375, 18.553466796875, 19.265625]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 16.0, 16.0, 44.0, 63.0, 96.0, 147.0, 141.0, 141.0, 114.0, 82.0, 47.0, 40.0, 16.0, 9.0, 2.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6357421875, -0.6184234619140625, -0.601104736328125, -0.5837860107421875, -0.56646728515625, -0.5491485595703125, -0.531829833984375, -0.5145111083984375, -0.4971923828125, -0.4798736572265625, -0.462554931640625, -0.4452362060546875, -0.42791748046875, -0.4105987548828125, -0.393280029296875, -0.3759613037109375, -0.358642578125, -0.3413238525390625, -0.324005126953125, -0.3066864013671875, -0.28936767578125, -0.2720489501953125, -0.254730224609375, -0.2374114990234375, -0.2200927734375, -0.2027740478515625, -0.185455322265625, -0.1681365966796875, -0.15081787109375, -0.1334991455078125, -0.116180419921875, -0.0988616943359375, -0.08154296875, -0.0642242431640625, -0.046905517578125, -0.0295867919921875, -0.01226806640625, 0.0050506591796875, 0.022369384765625, 0.0396881103515625, 0.0570068359375, 0.0743255615234375, 0.091644287109375, 0.1089630126953125, 0.12628173828125, 0.1436004638671875, 0.160919189453125, 0.1782379150390625, 0.195556640625, 0.2128753662109375, 0.230194091796875, 0.2475128173828125, 0.26483154296875, 0.2821502685546875, 0.299468994140625, 0.3167877197265625, 0.3341064453125, 0.3514251708984375, 0.368743896484375, 0.3860626220703125, 0.40338134765625, 0.4207000732421875, 0.438018798828125, 0.4553375244140625, 0.47265625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 9.0, 5.0, 4.0, 15.0, 14.0, 25.0, 29.0, 55.0, 117.0, 192.0, 368.0, 805.0, 2056.0, 7070.0, 49591.0, 3427200.0, 674325.0, 25126.0, 4557.0, 1446.0, 607.0, 268.0, 169.0, 86.0, 58.0, 28.0, 26.0, 16.0, 8.0, 5.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.765625, -4.62890625, -4.4921875, -4.35546875, -4.21875, -4.08203125, -3.9453125, -3.80859375, -3.671875, -3.53515625, -3.3984375, -3.26171875, -3.125, -2.98828125, -2.8515625, -2.71484375, -2.578125, -2.44140625, -2.3046875, -2.16796875, -2.03125, -1.89453125, -1.7578125, -1.62109375, -1.484375, -1.34765625, -1.2109375, -1.07421875, -0.9375, -0.80078125, -0.6640625, -0.52734375, -0.390625, -0.25390625, -0.1171875, 0.01953125, 0.15625, 0.29296875, 0.4296875, 0.56640625, 0.703125, 0.83984375, 0.9765625, 1.11328125, 1.25, 1.38671875, 1.5234375, 1.66015625, 1.796875, 1.93359375, 2.0703125, 2.20703125, 2.34375, 2.48046875, 2.6171875, 2.75390625, 2.890625, 3.02734375, 3.1640625, 3.30078125, 3.4375, 3.57421875, 3.7109375, 3.84765625, 3.984375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 5.0, 6.0, 4.0, 6.0, 4.0, 5.0, 15.0, 18.0, 29.0, 42.0, 68.0, 76.0, 149.0, 301.0, 816.0, 1530.0, 442.0, 196.0, 113.0, 72.0, 50.0, 33.0, 22.0, 13.0, 17.0, 13.0, 4.0, 6.0, 3.0, 3.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.497802734375, -0.4801521301269531, -0.46250152587890625, -0.4448509216308594, -0.4272003173828125, -0.4095497131347656, -0.39189910888671875, -0.3742485046386719, -0.356597900390625, -0.3389472961425781, -0.32129669189453125, -0.3036460876464844, -0.2859954833984375, -0.2683448791503906, -0.25069427490234375, -0.23304367065429688, -0.21539306640625, -0.19774246215820312, -0.18009185791015625, -0.16244125366210938, -0.1447906494140625, -0.12714004516601562, -0.10948944091796875, -0.09183883666992188, -0.074188232421875, -0.056537628173828125, -0.03888702392578125, -0.021236419677734375, -0.0035858154296875, 0.014064788818359375, 0.03171539306640625, 0.049365997314453125, 0.0670166015625, 0.08466720581054688, 0.10231781005859375, 0.11996841430664062, 0.1376190185546875, 0.15526962280273438, 0.17292022705078125, 0.19057083129882812, 0.208221435546875, 0.22587203979492188, 0.24352264404296875, 0.2611732482910156, 0.2788238525390625, 0.2964744567871094, 0.31412506103515625, 0.3317756652832031, 0.34942626953125, 0.3670768737792969, 0.38472747802734375, 0.4023780822753906, 0.4200286865234375, 0.4376792907714844, 0.45532989501953125, 0.4729804992675781, 0.490631103515625, 0.5082817077636719, 0.5259323120117188, 0.5435829162597656, 0.5612335205078125, 0.5788841247558594, 0.5965347290039062, 0.6141853332519531, 0.6318359375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 9.0, 6.0, 21.0, 39.0, 101.0, 136.0, 181.0, 175.0, 141.0, 88.0, 49.0, 25.0, 14.0, 5.0, 3.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.852826118469238, -4.728435516357422, -4.6040449142456055, -4.479654312133789, -4.355263710021973, -4.2308735847473145, -4.106482982635498, -3.9820923805236816, -3.8577017784118652, -3.733311176300049, -3.6089205741882324, -3.484530210494995, -3.3601396083831787, -3.2357490062713623, -3.111358642578125, -2.9869680404663086, -2.862577438354492, -2.738186836242676, -2.6137962341308594, -2.489405870437622, -2.3650152683258057, -2.2406246662139893, -2.116234302520752, -1.9918437004089355, -1.8674530982971191, -1.7430624961853027, -1.6186720132827759, -1.494281530380249, -1.3698909282684326, -1.2455003261566162, -1.1211098432540894, -0.9967193007469177, -0.8723289966583252, -0.7479384541511536, -0.6235479116439819, -0.4991573691368103, -0.37476682662963867, -0.25037628412246704, -0.1259857416152954, -0.0015951991081237793, 0.12279534339904785, 0.24718588590621948, 0.3715764284133911, 0.49596697092056274, 0.6203575134277344, 0.744748055934906, 0.8691385984420776, 0.9935291409492493, 1.117919683456421, 1.2423102855682373, 1.3667007684707642, 1.491091251373291, 1.6154818534851074, 1.7398724555969238, 1.8642629384994507, 1.9886534214019775, 2.113044023513794, 2.2374346256256104, 2.3618249893188477, 2.486215591430664, 2.6106061935424805, 2.734996795654297, 2.8593873977661133, 2.9837777614593506, 3.108168363571167]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 6.0, 11.0, 11.0, 27.0, 19.0, 42.0, 48.0, 53.0, 57.0, 72.0, 71.0, 74.0, 92.0, 68.0, 64.0, 76.0, 63.0, 38.0, 32.0, 23.0, 12.0, 13.0, 14.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.997781276702881, -2.899254322052002, -2.800727367401123, -2.702200412750244, -2.603673219680786, -2.5051462650299072, -2.4066193103790283, -2.3080923557281494, -2.2095651626586914, -2.1110382080078125, -2.0125112533569336, -1.9139841794967651, -1.8154571056365967, -1.7169301509857178, -1.6184031963348389, -1.51987624168396, -1.421349287033081, -1.3228223323822021, -1.2242952585220337, -1.1257683038711548, -1.0272412300109863, -0.9287142753601074, -0.8301873207092285, -0.7316603064537048, -0.6331332921981812, -0.5346062779426575, -0.4360792934894562, -0.3375523090362549, -0.2390252947807312, -0.14049828052520752, -0.04197132587432861, 0.05655568838119507, 0.15508294105529785, 0.25360995531082153, 0.3521369397640228, 0.4506639242172241, 0.5491909384727478, 0.6477179527282715, 0.7462449073791504, 0.8447719216346741, 0.9432989358901978, 1.0418258905410767, 1.1403529644012451, 1.238879919052124, 1.337406873703003, 1.4359339475631714, 1.5344609022140503, 1.6329879760742188, 1.7315149307250977, 1.8300418853759766, 1.928568959236145, 2.0270957946777344, 2.1256229877471924, 2.2241499423980713, 2.32267689704895, 2.421203851699829, 2.519731044769287, 2.618257999420166, 2.716784954071045, 2.815311908721924, 2.913839101791382, 3.0123660564422607, 3.1108930110931396, 3.2094199657440186, 3.3079469203948975]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 4.0, 7.0, 14.0, 10.0, 21.0, 30.0, 36.0, 45.0, 60.0, 124.0, 206.0, 311.0, 537.0, 1024.0, 1908.0, 4868.0, 19311.0, 199123.0, 710148.0, 91483.0, 12036.0, 3611.0, 1577.0, 826.0, 478.0, 266.0, 162.0, 109.0, 57.0, 58.0, 29.0, 17.0, 16.0, 12.0, 8.0, 7.0, 6.0, 1.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.791015625, -2.699066162109375, -2.60711669921875, -2.515167236328125, -2.4232177734375, -2.331268310546875, -2.23931884765625, -2.147369384765625, -2.055419921875, -1.963470458984375, -1.87152099609375, -1.779571533203125, -1.6876220703125, -1.595672607421875, -1.50372314453125, -1.411773681640625, -1.31982421875, -1.227874755859375, -1.13592529296875, -1.043975830078125, -0.9520263671875, -0.860076904296875, -0.76812744140625, -0.676177978515625, -0.584228515625, -0.492279052734375, -0.40032958984375, -0.308380126953125, -0.2164306640625, -0.124481201171875, -0.03253173828125, 0.059417724609375, 0.1513671875, 0.243316650390625, 0.33526611328125, 0.427215576171875, 0.5191650390625, 0.611114501953125, 0.70306396484375, 0.795013427734375, 0.886962890625, 0.978912353515625, 1.07086181640625, 1.162811279296875, 1.2547607421875, 1.346710205078125, 1.43865966796875, 1.530609130859375, 1.62255859375, 1.714508056640625, 1.80645751953125, 1.898406982421875, 1.9903564453125, 2.082305908203125, 2.17425537109375, 2.266204833984375, 2.358154296875, 2.450103759765625, 2.54205322265625, 2.634002685546875, 2.7259521484375, 2.817901611328125, 2.90985107421875, 3.001800537109375, 3.09375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 5.0, 14.0, 24.0, 57.0, 91.0, 123.0, 166.0, 168.0, 134.0, 99.0, 50.0, 23.0, 20.0, 8.0, 5.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51220703125, -0.49456787109375, -0.4769287109375, -0.45928955078125, -0.441650390625, -0.42401123046875, -0.4063720703125, -0.38873291015625, -0.37109375, -0.35345458984375, -0.3358154296875, -0.31817626953125, -0.300537109375, -0.28289794921875, -0.2652587890625, -0.24761962890625, -0.22998046875, -0.21234130859375, -0.1947021484375, -0.17706298828125, -0.159423828125, -0.14178466796875, -0.1241455078125, -0.10650634765625, -0.0888671875, -0.07122802734375, -0.0535888671875, -0.03594970703125, -0.018310546875, -0.00067138671875, 0.0169677734375, 0.03460693359375, 0.05224609375, 0.06988525390625, 0.0875244140625, 0.10516357421875, 0.122802734375, 0.14044189453125, 0.1580810546875, 0.17572021484375, 0.193359375, 0.21099853515625, 0.2286376953125, 0.24627685546875, 0.263916015625, 0.28155517578125, 0.2991943359375, 0.31683349609375, 0.33447265625, 0.35211181640625, 0.3697509765625, 0.38739013671875, 0.405029296875, 0.42266845703125, 0.4403076171875, 0.45794677734375, 0.4755859375, 0.49322509765625, 0.5108642578125, 0.52850341796875, 0.546142578125, 0.56378173828125, 0.5814208984375, 0.59906005859375, 0.61669921875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 3.0, 12.0, 16.0, 16.0, 26.0, 26.0, 64.0, 102.0, 149.0, 209.0, 370.0, 587.0, 1231.0, 2554.0, 6381.0, 21002.0, 103018.0, 556303.0, 290447.0, 46836.0, 11453.0, 3994.0, 1704.0, 841.0, 487.0, 277.0, 149.0, 98.0, 56.0, 40.0, 27.0, 26.0, 12.0, 11.0, 6.0, 3.0, 6.0, 4.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.10546875, -2.043121337890625, -1.98077392578125, -1.918426513671875, -1.8560791015625, -1.793731689453125, -1.73138427734375, -1.669036865234375, -1.606689453125, -1.544342041015625, -1.48199462890625, -1.419647216796875, -1.3572998046875, -1.294952392578125, -1.23260498046875, -1.170257568359375, -1.10791015625, -1.045562744140625, -0.98321533203125, -0.920867919921875, -0.8585205078125, -0.796173095703125, -0.73382568359375, -0.671478271484375, -0.609130859375, -0.546783447265625, -0.48443603515625, -0.422088623046875, -0.3597412109375, -0.297393798828125, -0.23504638671875, -0.172698974609375, -0.1103515625, -0.048004150390625, 0.01434326171875, 0.076690673828125, 0.1390380859375, 0.201385498046875, 0.26373291015625, 0.326080322265625, 0.388427734375, 0.450775146484375, 0.51312255859375, 0.575469970703125, 0.6378173828125, 0.700164794921875, 0.76251220703125, 0.824859619140625, 0.88720703125, 0.949554443359375, 1.01190185546875, 1.074249267578125, 1.1365966796875, 1.198944091796875, 1.26129150390625, 1.323638916015625, 1.385986328125, 1.448333740234375, 1.51068115234375, 1.573028564453125, 1.6353759765625, 1.697723388671875, 1.76007080078125, 1.822418212890625, 1.884765625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 7.0, 4.0, 10.0, 12.0, 15.0, 30.0, 38.0, 35.0, 61.0, 70.0, 97.0, 100.0, 89.0, 109.0, 81.0, 53.0, 62.0, 35.0, 34.0, 28.0, 16.0, 6.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6875, -2.61358642578125, -2.5396728515625, -2.46575927734375, -2.391845703125, -2.31793212890625, -2.2440185546875, -2.17010498046875, -2.09619140625, -2.02227783203125, -1.9483642578125, -1.87445068359375, -1.800537109375, -1.72662353515625, -1.6527099609375, -1.57879638671875, -1.5048828125, -1.43096923828125, -1.3570556640625, -1.28314208984375, -1.209228515625, -1.13531494140625, -1.0614013671875, -0.98748779296875, -0.91357421875, -0.83966064453125, -0.7657470703125, -0.69183349609375, -0.617919921875, -0.54400634765625, -0.4700927734375, -0.39617919921875, -0.322265625, -0.24835205078125, -0.1744384765625, -0.10052490234375, -0.026611328125, 0.04730224609375, 0.1212158203125, 0.19512939453125, 0.26904296875, 0.34295654296875, 0.4168701171875, 0.49078369140625, 0.564697265625, 0.63861083984375, 0.7125244140625, 0.78643798828125, 0.8603515625, 0.93426513671875, 1.0081787109375, 1.08209228515625, 1.156005859375, 1.22991943359375, 1.3038330078125, 1.37774658203125, 1.45166015625, 1.52557373046875, 1.5994873046875, 1.67340087890625, 1.747314453125, 1.82122802734375, 1.8951416015625, 1.96905517578125, 2.04296875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 8.0, 23.0, 42.0, 89.0, 218.0, 746.0, 19820.0, 1021442.0, 5434.0, 444.0, 138.0, 72.0, 31.0, 17.0, 11.0, 11.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.28125, -4.080810546875, -3.88037109375, -3.679931640625, -3.4794921875, -3.279052734375, -3.07861328125, -2.878173828125, -2.677734375, -2.477294921875, -2.27685546875, -2.076416015625, -1.8759765625, -1.675537109375, -1.47509765625, -1.274658203125, -1.07421875, -0.873779296875, -0.67333984375, -0.472900390625, -0.2724609375, -0.072021484375, 0.12841796875, 0.328857421875, 0.529296875, 0.729736328125, 0.93017578125, 1.130615234375, 1.3310546875, 1.531494140625, 1.73193359375, 1.932373046875, 2.1328125, 2.333251953125, 2.53369140625, 2.734130859375, 2.9345703125, 3.135009765625, 3.33544921875, 3.535888671875, 3.736328125, 3.936767578125, 4.13720703125, 4.337646484375, 4.5380859375, 4.738525390625, 4.93896484375, 5.139404296875, 5.33984375, 5.540283203125, 5.74072265625, 5.941162109375, 6.1416015625, 6.342041015625, 6.54248046875, 6.742919921875, 6.943359375, 7.143798828125, 7.34423828125, 7.544677734375, 7.7451171875, 7.945556640625, 8.14599609375, 8.346435546875, 8.546875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 3.0, 6.0, 4.0, 6.0, 10.0, 13.0, 14.0, 36.0, 52.0, 80.0, 100.0, 133.0, 135.0, 137.0, 86.0, 70.0, 42.0, 23.0, 15.0, 10.0, 7.0, 2.0, 4.0, 3.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0], "bins": [-0.00028777122497558594, -0.0002812780439853668, -0.0002747848629951477, -0.0002682916820049286, -0.00026179850101470947, -0.00025530532002449036, -0.00024881213903427124, -0.00024231895804405212, -0.000235825777053833, -0.0002293325960636139, -0.00022283941507339478, -0.00021634623408317566, -0.00020985305309295654, -0.00020335987210273743, -0.0001968666911125183, -0.0001903735101222992, -0.00018388032913208008, -0.00017738714814186096, -0.00017089396715164185, -0.00016440078616142273, -0.0001579076051712036, -0.0001514144241809845, -0.00014492124319076538, -0.00013842806220054626, -0.00013193488121032715, -0.00012544170022010803, -0.00011894851922988892, -0.0001124553382396698, -0.00010596215724945068, -9.946897625923157e-05, -9.297579526901245e-05, -8.648261427879333e-05, -7.998943328857422e-05, -7.34962522983551e-05, -6.700307130813599e-05, -6.050989031791687e-05, -5.4016709327697754e-05, -4.752352833747864e-05, -4.103034734725952e-05, -3.4537166357040405e-05, -2.804398536682129e-05, -2.1550804376602173e-05, -1.5057623386383057e-05, -8.56444239616394e-06, -2.0712614059448242e-06, 4.421919584274292e-06, 1.0915100574493408e-05, 1.7408281564712524e-05, 2.390146255493164e-05, 3.0394643545150757e-05, 3.688782453536987e-05, 4.338100552558899e-05, 4.9874186515808105e-05, 5.636736750602722e-05, 6.286054849624634e-05, 6.935372948646545e-05, 7.584691047668457e-05, 8.234009146690369e-05, 8.88332724571228e-05, 9.532645344734192e-05, 0.00010181963443756104, 0.00010831281542778015, 0.00011480599641799927, 0.00012129917740821838, 0.0001277923583984375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 3.0, 3.0, 4.0, 10.0, 7.0, 10.0, 20.0, 24.0, 34.0, 54.0, 110.0, 196.0, 448.0, 1142.0, 3401.0, 15122.0, 228185.0, 747568.0, 42781.0, 6463.0, 1752.0, 626.0, 253.0, 121.0, 76.0, 52.0, 27.0, 13.0, 14.0, 7.0, 6.0, 13.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9541015625, -1.89703369140625, -1.8399658203125, -1.78289794921875, -1.725830078125, -1.66876220703125, -1.6116943359375, -1.55462646484375, -1.49755859375, -1.44049072265625, -1.3834228515625, -1.32635498046875, -1.269287109375, -1.21221923828125, -1.1551513671875, -1.09808349609375, -1.041015625, -0.98394775390625, -0.9268798828125, -0.86981201171875, -0.812744140625, -0.75567626953125, -0.6986083984375, -0.64154052734375, -0.58447265625, -0.52740478515625, -0.4703369140625, -0.41326904296875, -0.356201171875, -0.29913330078125, -0.2420654296875, -0.18499755859375, -0.1279296875, -0.07086181640625, -0.0137939453125, 0.04327392578125, 0.100341796875, 0.15740966796875, 0.2144775390625, 0.27154541015625, 0.32861328125, 0.38568115234375, 0.4427490234375, 0.49981689453125, 0.556884765625, 0.61395263671875, 0.6710205078125, 0.72808837890625, 0.78515625, 0.84222412109375, 0.8992919921875, 0.95635986328125, 1.013427734375, 1.07049560546875, 1.1275634765625, 1.18463134765625, 1.24169921875, 1.29876708984375, 1.3558349609375, 1.41290283203125, 1.469970703125, 1.52703857421875, 1.5841064453125, 1.64117431640625, 1.6982421875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 10.0, 2.0, 6.0, 9.0, 10.0, 8.0, 18.0, 37.0, 52.0, 49.0, 87.0, 115.0, 123.0, 121.0, 90.0, 91.0, 56.0, 32.0, 23.0, 10.0, 12.0, 11.0, 6.0, 5.0, 3.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75048828125, -0.7267532348632812, -0.7030181884765625, -0.6792831420898438, -0.655548095703125, -0.6318130493164062, -0.6080780029296875, -0.5843429565429688, -0.56060791015625, -0.5368728637695312, -0.5131378173828125, -0.48940277099609375, -0.465667724609375, -0.44193267822265625, -0.4181976318359375, -0.39446258544921875, -0.3707275390625, -0.34699249267578125, -0.3232574462890625, -0.29952239990234375, -0.275787353515625, -0.25205230712890625, -0.2283172607421875, -0.20458221435546875, -0.18084716796875, -0.15711212158203125, -0.1333770751953125, -0.10964202880859375, -0.085906982421875, -0.06217193603515625, -0.0384368896484375, -0.01470184326171875, 0.009033203125, 0.03276824951171875, 0.0565032958984375, 0.08023834228515625, 0.103973388671875, 0.12770843505859375, 0.1514434814453125, 0.17517852783203125, 0.19891357421875, 0.22264862060546875, 0.2463836669921875, 0.27011871337890625, 0.293853759765625, 0.31758880615234375, 0.3413238525390625, 0.36505889892578125, 0.3887939453125, 0.41252899169921875, 0.4362640380859375, 0.45999908447265625, 0.483734130859375, 0.5074691772460938, 0.5312042236328125, 0.5549392700195312, 0.57867431640625, 0.6024093627929688, 0.6261444091796875, 0.6498794555664062, 0.673614501953125, 0.6973495483398438, 0.7210845947265625, 0.7448196411132812, 0.7685546875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 7.0, 21.0, 37.0, 117.0, 283.0, 314.0, 144.0, 43.0, 29.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.469057083129883, -17.835643768310547, -17.20223045349121, -16.568817138671875, -15.935403823852539, -15.301990509033203, -14.668578147888184, -14.035164833068848, -13.401751518249512, -12.768338203430176, -12.13492488861084, -11.501511573791504, -10.868099212646484, -10.234685897827148, -9.601272583007812, -8.967859268188477, -8.33444595336914, -7.701032638549805, -7.067619323730469, -6.434206485748291, -5.800793170928955, -5.167379856109619, -4.533967018127441, -3.9005537033081055, -3.2671403884887695, -2.6337270736694336, -2.0003139972686768, -1.3669008016586304, -0.733487606048584, -0.10007429122924805, 0.5333387851715088, 1.1667518615722656, 1.8001632690429688, 2.4335765838623047, 3.0669896602630615, 3.7004027366638184, 4.333816051483154, 4.96722936630249, 5.600642204284668, 6.234055519104004, 6.86746883392334, 7.500882148742676, 8.134295463562012, 8.767708778381348, 9.401121139526367, 10.034534454345703, 10.667947769165039, 11.301361083984375, 11.934774398803711, 12.568187713623047, 13.201601028442383, 13.835014343261719, 14.468427658081055, 15.10184097290039, 15.73525333404541, 16.368667602539062, 17.002079010009766, 17.6354923248291, 18.268905639648438, 18.902318954467773, 19.53573226928711, 20.169145584106445, 20.80255889892578, 21.435970306396484, 22.069385528564453]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 4.0, 4.0, 6.0, 8.0, 4.0, 8.0, 12.0, 11.0, 12.0, 25.0, 27.0, 40.0, 29.0, 34.0, 41.0, 51.0, 53.0, 43.0, 57.0, 56.0, 54.0, 58.0, 42.0, 45.0, 49.0, 44.0, 33.0, 20.0, 27.0, 19.0, 16.0, 16.0, 14.0, 13.0, 12.0, 4.0, 4.0, 5.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.135211944580078, -9.859474182128906, -9.583736419677734, -9.307998657226562, -9.03226089477539, -8.756524085998535, -8.480786323547363, -8.205048561096191, -7.9293107986450195, -7.653573036193848, -7.377835273742676, -7.102097988128662, -6.82636022567749, -6.550622463226318, -6.274885177612305, -5.999147415161133, -5.723409652709961, -5.447671890258789, -5.171934127807617, -4.8961968421936035, -4.620459079742432, -4.34472131729126, -4.068984031677246, -3.793246269226074, -3.5175085067749023, -3.2417707443237305, -2.9660332202911377, -2.690295696258545, -2.414557933807373, -2.138820171356201, -1.8630826473236084, -1.587345004081726, -1.3116064071655273, -1.035868763923645, -0.7601311206817627, -0.48439347743988037, -0.20865583419799805, 0.06708180904388428, 0.3428194522857666, 0.6185570955276489, 0.8942947387695312, 1.1700323820114136, 1.445770025253296, 1.7215076684951782, 1.9972453117370605, 2.2729830741882324, 2.548720598220825, 2.824458122253418, 3.10019588470459, 3.3759336471557617, 3.6516711711883545, 3.9274086952209473, 4.203146457672119, 4.478884220123291, 4.754621505737305, 5.030359268188477, 5.306097030639648, 5.58183479309082, 5.857572555541992, 6.133309841156006, 6.409047603607178, 6.68478536605835, 6.960522651672363, 7.236260414123535, 7.511998176574707]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 4.0, 7.0, 9.0, 10.0, 16.0, 14.0, 27.0, 34.0, 50.0, 68.0, 132.0, 166.0, 310.0, 487.0, 967.0, 1965.0, 5055.0, 18695.0, 137610.0, 3833458.0, 166658.0, 20104.0, 4997.0, 1729.0, 773.0, 413.0, 222.0, 124.0, 57.0, 36.0, 26.0, 16.0, 14.0, 6.0, 6.0, 7.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.962890625, -3.854400634765625, -3.74591064453125, -3.637420654296875, -3.5289306640625, -3.420440673828125, -3.31195068359375, -3.203460693359375, -3.094970703125, -2.986480712890625, -2.87799072265625, -2.769500732421875, -2.6610107421875, -2.552520751953125, -2.44403076171875, -2.335540771484375, -2.22705078125, -2.118560791015625, -2.01007080078125, -1.901580810546875, -1.7930908203125, -1.684600830078125, -1.57611083984375, -1.467620849609375, -1.359130859375, -1.250640869140625, -1.14215087890625, -1.033660888671875, -0.9251708984375, -0.816680908203125, -0.70819091796875, -0.599700927734375, -0.4912109375, -0.382720947265625, -0.27423095703125, -0.165740966796875, -0.0572509765625, 0.051239013671875, 0.15972900390625, 0.268218994140625, 0.376708984375, 0.485198974609375, 0.59368896484375, 0.702178955078125, 0.8106689453125, 0.919158935546875, 1.02764892578125, 1.136138916015625, 1.24462890625, 1.353118896484375, 1.46160888671875, 1.570098876953125, 1.6785888671875, 1.787078857421875, 1.89556884765625, 2.004058837890625, 2.112548828125, 2.221038818359375, 2.32952880859375, 2.438018798828125, 2.5465087890625, 2.654998779296875, 2.76348876953125, 2.871978759765625, 2.98046875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 6.0, 6.0, 15.0, 17.0, 28.0, 32.0, 55.0, 72.0, 85.0, 88.0, 89.0, 108.0, 97.0, 89.0, 66.0, 44.0, 28.0, 30.0, 14.0, 15.0, 7.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.484130859375, -0.4709587097167969, -0.45778656005859375, -0.4446144104003906, -0.4314422607421875, -0.4182701110839844, -0.40509796142578125, -0.3919258117675781, -0.378753662109375, -0.3655815124511719, -0.35240936279296875, -0.3392372131347656, -0.3260650634765625, -0.3128929138183594, -0.29972076416015625, -0.2865486145019531, -0.27337646484375, -0.2602043151855469, -0.24703216552734375, -0.23386001586914062, -0.2206878662109375, -0.20751571655273438, -0.19434356689453125, -0.18117141723632812, -0.167999267578125, -0.15482711791992188, -0.14165496826171875, -0.12848281860351562, -0.1153106689453125, -0.10213851928710938, -0.08896636962890625, -0.07579421997070312, -0.0626220703125, -0.049449920654296875, -0.03627777099609375, -0.023105621337890625, -0.0099334716796875, 0.003238677978515625, 0.01641082763671875, 0.029582977294921875, 0.042755126953125, 0.055927276611328125, 0.06909942626953125, 0.08227157592773438, 0.0954437255859375, 0.10861587524414062, 0.12178802490234375, 0.13496017456054688, 0.14813232421875, 0.16130447387695312, 0.17447662353515625, 0.18764877319335938, 0.2008209228515625, 0.21399307250976562, 0.22716522216796875, 0.24033737182617188, 0.253509521484375, 0.2666816711425781, 0.27985382080078125, 0.2930259704589844, 0.3061981201171875, 0.3193702697753906, 0.33254241943359375, 0.3457145690917969, 0.35888671875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 7.0, 6.0, 13.0, 13.0, 18.0, 35.0, 50.0, 110.0, 162.0, 327.0, 605.0, 1446.0, 4736.0, 24648.0, 496852.0, 3589149.0, 63357.0, 8666.0, 2281.0, 860.0, 373.0, 226.0, 127.0, 84.0, 42.0, 34.0, 15.0, 12.0, 6.0, 8.0, 6.0, 3.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.064453125, -2.96624755859375, -2.8680419921875, -2.76983642578125, -2.671630859375, -2.57342529296875, -2.4752197265625, -2.37701416015625, -2.27880859375, -2.18060302734375, -2.0823974609375, -1.98419189453125, -1.885986328125, -1.78778076171875, -1.6895751953125, -1.59136962890625, -1.4931640625, -1.39495849609375, -1.2967529296875, -1.19854736328125, -1.100341796875, -1.00213623046875, -0.9039306640625, -0.80572509765625, -0.70751953125, -0.60931396484375, -0.5111083984375, -0.41290283203125, -0.314697265625, -0.21649169921875, -0.1182861328125, -0.02008056640625, 0.078125, 0.17633056640625, 0.2745361328125, 0.37274169921875, 0.470947265625, 0.56915283203125, 0.6673583984375, 0.76556396484375, 0.86376953125, 0.96197509765625, 1.0601806640625, 1.15838623046875, 1.256591796875, 1.35479736328125, 1.4530029296875, 1.55120849609375, 1.6494140625, 1.74761962890625, 1.8458251953125, 1.94403076171875, 2.042236328125, 2.14044189453125, 2.2386474609375, 2.33685302734375, 2.43505859375, 2.53326416015625, 2.6314697265625, 2.72967529296875, 2.827880859375, 2.92608642578125, 3.0242919921875, 3.12249755859375, 3.220703125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 2.0, 3.0, 8.0, 12.0, 5.0, 12.0, 24.0, 31.0, 38.0, 69.0, 139.0, 276.0, 732.0, 1803.0, 450.0, 206.0, 95.0, 52.0, 34.0, 22.0, 20.0, 9.0, 4.0, 9.0, 8.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64892578125, -0.6299819946289062, -0.6110382080078125, -0.5920944213867188, -0.573150634765625, -0.5542068481445312, -0.5352630615234375, -0.5163192749023438, -0.49737548828125, -0.47843170166015625, -0.4594879150390625, -0.44054412841796875, -0.421600341796875, -0.40265655517578125, -0.3837127685546875, -0.36476898193359375, -0.3458251953125, -0.32688140869140625, -0.3079376220703125, -0.28899383544921875, -0.270050048828125, -0.25110626220703125, -0.2321624755859375, -0.21321868896484375, -0.19427490234375, -0.17533111572265625, -0.1563873291015625, -0.13744354248046875, -0.118499755859375, -0.09955596923828125, -0.0806121826171875, -0.06166839599609375, -0.042724609375, -0.02378082275390625, -0.0048370361328125, 0.01410675048828125, 0.033050537109375, 0.05199432373046875, 0.0709381103515625, 0.08988189697265625, 0.10882568359375, 0.12776947021484375, 0.1467132568359375, 0.16565704345703125, 0.184600830078125, 0.20354461669921875, 0.2224884033203125, 0.24143218994140625, 0.2603759765625, 0.27931976318359375, 0.2982635498046875, 0.31720733642578125, 0.336151123046875, 0.35509490966796875, 0.3740386962890625, 0.39298248291015625, 0.41192626953125, 0.43087005615234375, 0.4498138427734375, 0.46875762939453125, 0.487701416015625, 0.5066452026367188, 0.5255889892578125, 0.5445327758789062, 0.5634765625]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 13.0, 47.0, 134.0, 257.0, 260.0, 178.0, 57.0, 31.0, 8.0, 6.0, 5.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5511512756347656, -2.382310628890991, -2.213470220565796, -2.0446295738220215, -1.8757890462875366, -1.7069485187530518, -1.5381078720092773, -1.3692673444747925, -1.2004268169403076, -1.0315862894058228, -0.8627457022666931, -0.6939051151275635, -0.5250645875930786, -0.35622406005859375, -0.18738341331481934, -0.018542885780334473, 0.1502976417541504, 0.31913819909095764, 0.4879787564277649, 0.6568193435668945, 0.8256598711013794, 0.9945003986358643, 1.1633410453796387, 1.3321815729141235, 1.5010221004486084, 1.6698626279830933, 1.8387031555175781, 2.0075438022613525, 2.176384449005127, 2.3452248573303223, 2.5140655040740967, 2.682906150817871, 2.8517465591430664, 3.020587205886841, 3.189427614212036, 3.3582682609558105, 3.527108669281006, 3.6959493160247803, 3.8647899627685547, 4.03363037109375, 4.202470779418945, 4.371311187744141, 4.540152072906494, 4.7089924812316895, 4.877832889556885, 5.046673774719238, 5.215514183044434, 5.384354591369629, 5.553195476531982, 5.722035884857178, 5.890876770019531, 6.059717178344727, 6.228557586669922, 6.397397994995117, 6.566238880157471, 6.735079288482666, 6.9039201736450195, 7.072760581970215, 7.241601467132568, 7.410441875457764, 7.579282283782959, 7.7481231689453125, 7.916963577270508, 8.085803985595703, 8.254644393920898]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 5.0, 9.0, 5.0, 10.0, 9.0, 17.0, 16.0, 25.0, 18.0, 26.0, 47.0, 47.0, 52.0, 43.0, 57.0, 53.0, 65.0, 64.0, 67.0, 46.0, 55.0, 41.0, 37.0, 28.0, 43.0, 24.0, 25.0, 17.0, 19.0, 8.0, 7.0, 9.0, 4.0, 2.0, 5.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.040316343307495, -1.9751049280166626, -1.9098936319351196, -1.844682216644287, -1.7794709205627441, -1.7142595052719116, -1.649048089981079, -1.5838367938995361, -1.5186253786087036, -1.453413963317871, -1.3882026672363281, -1.3229912519454956, -1.257779836654663, -1.1925685405731201, -1.1273571252822876, -1.062145709991455, -0.9969344139099121, -0.9317230582237244, -0.8665117025375366, -0.8013002872467041, -0.7360889315605164, -0.6708775758743286, -0.6056661605834961, -0.5404548048973083, -0.4752434492111206, -0.41003209352493286, -0.34482070803642273, -0.2796093225479126, -0.21439796686172485, -0.1491866111755371, -0.08397522568702698, -0.018763840198516846, 0.04644775390625, 0.11165912449359894, 0.17687049508094788, 0.24208186566829681, 0.30729323625564575, 0.3725045919418335, 0.43771597743034363, 0.5029273629188538, 0.5681387186050415, 0.6333500742912292, 0.698561429977417, 0.7637728452682495, 0.8289842009544373, 0.894195556640625, 0.9594069719314575, 1.02461838722229, 1.089829683303833, 1.1550410985946655, 1.2202523946762085, 1.285463809967041, 1.350675106048584, 1.4158865213394165, 1.481097936630249, 1.546309232711792, 1.6115206480026245, 1.676732063293457, 1.741943359375, 1.8071547746658325, 1.872366189956665, 1.937577486038208, 2.002788782119751, 2.068000316619873, 2.133211612701416]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 9.0, 5.0, 10.0, 11.0, 21.0, 41.0, 47.0, 61.0, 102.0, 138.0, 198.0, 299.0, 448.0, 685.0, 1143.0, 2098.0, 4350.0, 11168.0, 35411.0, 128959.0, 396040.0, 327161.0, 95874.0, 27140.0, 8865.0, 3680.0, 1752.0, 998.0, 617.0, 396.0, 248.0, 187.0, 124.0, 86.0, 65.0, 35.0, 31.0, 24.0, 14.0, 10.0, 4.0, 1.0, 4.0, 3.0, 3.0, 0.0, 1.0], "bins": [-1.4990234375, -1.4594573974609375, -1.419891357421875, -1.3803253173828125, -1.34075927734375, -1.3011932373046875, -1.261627197265625, -1.2220611572265625, -1.1824951171875, -1.1429290771484375, -1.103363037109375, -1.0637969970703125, -1.02423095703125, -0.9846649169921875, -0.945098876953125, -0.9055328369140625, -0.865966796875, -0.8264007568359375, -0.786834716796875, -0.7472686767578125, -0.70770263671875, -0.6681365966796875, -0.628570556640625, -0.5890045166015625, -0.5494384765625, -0.5098724365234375, -0.470306396484375, -0.4307403564453125, -0.39117431640625, -0.3516082763671875, -0.312042236328125, -0.2724761962890625, -0.23291015625, -0.1933441162109375, -0.153778076171875, -0.1142120361328125, -0.07464599609375, -0.0350799560546875, 0.004486083984375, 0.0440521240234375, 0.0836181640625, 0.1231842041015625, 0.162750244140625, 0.2023162841796875, 0.24188232421875, 0.2814483642578125, 0.321014404296875, 0.3605804443359375, 0.400146484375, 0.4397125244140625, 0.479278564453125, 0.5188446044921875, 0.55841064453125, 0.5979766845703125, 0.637542724609375, 0.6771087646484375, 0.7166748046875, 0.7562408447265625, 0.795806884765625, 0.8353729248046875, 0.87493896484375, 0.9145050048828125, 0.954071044921875, 0.9936370849609375, 1.033203125]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 7.0, 7.0, 12.0, 8.0, 28.0, 45.0, 62.0, 62.0, 79.0, 88.0, 99.0, 123.0, 96.0, 97.0, 58.0, 46.0, 33.0, 14.0, 12.0, 12.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39697265625, -0.3840370178222656, -0.37110137939453125, -0.3581657409667969, -0.3452301025390625, -0.3322944641113281, -0.31935882568359375, -0.3064231872558594, -0.293487548828125, -0.2805519104003906, -0.26761627197265625, -0.2546806335449219, -0.2417449951171875, -0.22880935668945312, -0.21587371826171875, -0.20293807983398438, -0.19000244140625, -0.17706680297851562, -0.16413116455078125, -0.15119552612304688, -0.1382598876953125, -0.12532424926757812, -0.11238861083984375, -0.09945297241210938, -0.086517333984375, -0.07358169555664062, -0.06064605712890625, -0.047710418701171875, -0.0347747802734375, -0.021839141845703125, -0.00890350341796875, 0.004032135009765625, 0.0169677734375, 0.029903411865234375, 0.04283905029296875, 0.055774688720703125, 0.0687103271484375, 0.08164596557617188, 0.09458160400390625, 0.10751724243164062, 0.120452880859375, 0.13338851928710938, 0.14632415771484375, 0.15925979614257812, 0.1721954345703125, 0.18513107299804688, 0.19806671142578125, 0.21100234985351562, 0.22393798828125, 0.23687362670898438, 0.24980926513671875, 0.2627449035644531, 0.2756805419921875, 0.2886161804199219, 0.30155181884765625, 0.3144874572753906, 0.327423095703125, 0.3403587341308594, 0.35329437255859375, 0.3662300109863281, 0.3791656494140625, 0.3921012878417969, 0.40503692626953125, 0.4179725646972656, 0.430908203125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 7.0, 4.0, 7.0, 12.0, 20.0, 34.0, 33.0, 56.0, 54.0, 84.0, 148.0, 198.0, 349.0, 563.0, 1027.0, 1766.0, 3527.0, 7324.0, 16835.0, 45535.0, 142009.0, 372215.0, 298608.0, 99821.0, 33161.0, 12944.0, 5875.0, 2753.0, 1481.0, 817.0, 490.0, 286.0, 163.0, 111.0, 76.0, 52.0, 37.0, 21.0, 21.0, 13.0, 3.0, 9.0, 4.0, 5.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.041015625, -1.0093231201171875, -0.977630615234375, -0.9459381103515625, -0.91424560546875, -0.8825531005859375, -0.850860595703125, -0.8191680908203125, -0.7874755859375, -0.7557830810546875, -0.724090576171875, -0.6923980712890625, -0.66070556640625, -0.6290130615234375, -0.597320556640625, -0.5656280517578125, -0.533935546875, -0.5022430419921875, -0.470550537109375, -0.4388580322265625, -0.40716552734375, -0.3754730224609375, -0.343780517578125, -0.3120880126953125, -0.2803955078125, -0.2487030029296875, -0.217010498046875, -0.1853179931640625, -0.15362548828125, -0.1219329833984375, -0.090240478515625, -0.0585479736328125, -0.02685546875, 0.0048370361328125, 0.036529541015625, 0.0682220458984375, 0.09991455078125, 0.1316070556640625, 0.163299560546875, 0.1949920654296875, 0.2266845703125, 0.2583770751953125, 0.290069580078125, 0.3217620849609375, 0.35345458984375, 0.3851470947265625, 0.416839599609375, 0.4485321044921875, 0.480224609375, 0.5119171142578125, 0.543609619140625, 0.5753021240234375, 0.60699462890625, 0.6386871337890625, 0.670379638671875, 0.7020721435546875, 0.7337646484375, 0.7654571533203125, 0.797149658203125, 0.8288421630859375, 0.86053466796875, 0.8922271728515625, 0.923919677734375, 0.9556121826171875, 0.9873046875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 2.0, 12.0, 6.0, 3.0, 13.0, 14.0, 17.0, 14.0, 26.0, 18.0, 32.0, 18.0, 35.0, 27.0, 43.0, 49.0, 42.0, 45.0, 43.0, 44.0, 50.0, 51.0, 35.0, 55.0, 30.0, 36.0, 25.0, 33.0, 25.0, 22.0, 26.0, 19.0, 12.0, 8.0, 8.0, 10.0, 5.0, 10.0, 3.0, 8.0, 4.0, 1.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.0859375, -1.0537033081054688, -1.0214691162109375, -0.9892349243164062, -0.957000732421875, -0.9247665405273438, -0.8925323486328125, -0.8602981567382812, -0.82806396484375, -0.7958297729492188, -0.7635955810546875, -0.7313613891601562, -0.699127197265625, -0.6668930053710938, -0.6346588134765625, -0.6024246215820312, -0.5701904296875, -0.5379562377929688, -0.5057220458984375, -0.47348785400390625, -0.441253662109375, -0.40901947021484375, -0.3767852783203125, -0.34455108642578125, -0.31231689453125, -0.28008270263671875, -0.2478485107421875, -0.21561431884765625, -0.183380126953125, -0.15114593505859375, -0.1189117431640625, -0.08667755126953125, -0.054443359375, -0.02220916748046875, 0.0100250244140625, 0.04225921630859375, 0.074493408203125, 0.10672760009765625, 0.1389617919921875, 0.17119598388671875, 0.20343017578125, 0.23566436767578125, 0.2678985595703125, 0.30013275146484375, 0.332366943359375, 0.36460113525390625, 0.3968353271484375, 0.42906951904296875, 0.4613037109375, 0.49353790283203125, 0.5257720947265625, 0.5580062866210938, 0.590240478515625, 0.6224746704101562, 0.6547088623046875, 0.6869430541992188, 0.71917724609375, 0.7514114379882812, 0.7836456298828125, 0.8158798217773438, 0.848114013671875, 0.8803482055664062, 0.9125823974609375, 0.9448165893554688, 0.97705078125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 6.0, 6.0, 2.0, 7.0, 6.0, 16.0, 21.0, 25.0, 31.0, 64.0, 129.0, 212.0, 502.0, 1349.0, 4279.0, 19453.0, 191497.0, 713626.0, 99174.0, 12973.0, 3254.0, 1058.0, 394.0, 204.0, 90.0, 60.0, 41.0, 22.0, 18.0, 6.0, 15.0, 3.0, 2.0, 8.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.9384765625, -0.9119491577148438, -0.8854217529296875, -0.8588943481445312, -0.832366943359375, -0.8058395385742188, -0.7793121337890625, -0.7527847290039062, -0.72625732421875, -0.6997299194335938, -0.6732025146484375, -0.6466751098632812, -0.620147705078125, -0.5936203002929688, -0.5670928955078125, -0.5405654907226562, -0.5140380859375, -0.48751068115234375, -0.4609832763671875, -0.43445587158203125, -0.407928466796875, -0.38140106201171875, -0.3548736572265625, -0.32834625244140625, -0.30181884765625, -0.27529144287109375, -0.2487640380859375, -0.22223663330078125, -0.195709228515625, -0.16918182373046875, -0.1426544189453125, -0.11612701416015625, -0.089599609375, -0.06307220458984375, -0.0365447998046875, -0.01001739501953125, 0.016510009765625, 0.04303741455078125, 0.0695648193359375, 0.09609222412109375, 0.12261962890625, 0.14914703369140625, 0.1756744384765625, 0.20220184326171875, 0.228729248046875, 0.25525665283203125, 0.2817840576171875, 0.30831146240234375, 0.3348388671875, 0.36136627197265625, 0.3878936767578125, 0.41442108154296875, 0.440948486328125, 0.46747589111328125, 0.4940032958984375, 0.5205307006835938, 0.54705810546875, 0.5735855102539062, 0.6001129150390625, 0.6266403198242188, 0.653167724609375, 0.6796951293945312, 0.7062225341796875, 0.7327499389648438, 0.75927734375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 7.0, 7.0, 9.0, 14.0, 9.0, 21.0, 19.0, 26.0, 32.0, 49.0, 67.0, 63.0, 72.0, 91.0, 63.0, 81.0, 70.0, 59.0, 44.0, 52.0, 30.0, 25.0, 23.0, 13.0, 13.0, 12.0, 6.0, 7.0, 1.0, 3.0, 3.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.28640365600586e-05, -9.023398160934448e-05, -8.760392665863037e-05, -8.497387170791626e-05, -8.234381675720215e-05, -7.971376180648804e-05, -7.708370685577393e-05, -7.445365190505981e-05, -7.18235969543457e-05, -6.919354200363159e-05, -6.656348705291748e-05, -6.393343210220337e-05, -6.130337715148926e-05, -5.8673322200775146e-05, -5.6043267250061035e-05, -5.3413212299346924e-05, -5.078315734863281e-05, -4.81531023979187e-05, -4.552304744720459e-05, -4.289299249649048e-05, -4.026293754577637e-05, -3.7632882595062256e-05, -3.5002827644348145e-05, -3.237277269363403e-05, -2.9742717742919922e-05, -2.711266279220581e-05, -2.44826078414917e-05, -2.1852552890777588e-05, -1.9222497940063477e-05, -1.6592442989349365e-05, -1.3962388038635254e-05, -1.1332333087921143e-05, -8.702278137207031e-06, -6.07222318649292e-06, -3.4421682357788086e-06, -8.121132850646973e-07, 1.817941665649414e-06, 4.447996616363525e-06, 7.078051567077637e-06, 9.708106517791748e-06, 1.233816146850586e-05, 1.496821641921997e-05, 1.7598271369934082e-05, 2.0228326320648193e-05, 2.2858381271362305e-05, 2.5488436222076416e-05, 2.8118491172790527e-05, 3.074854612350464e-05, 3.337860107421875e-05, 3.600865602493286e-05, 3.863871097564697e-05, 4.1268765926361084e-05, 4.3898820877075195e-05, 4.652887582778931e-05, 4.915893077850342e-05, 5.178898572921753e-05, 5.441904067993164e-05, 5.704909563064575e-05, 5.967915058135986e-05, 6.230920553207397e-05, 6.493926048278809e-05, 6.75693154335022e-05, 7.019937038421631e-05, 7.282942533493042e-05, 7.545948028564453e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 8.0, 9.0, 9.0, 11.0, 34.0, 27.0, 62.0, 92.0, 172.0, 276.0, 575.0, 1433.0, 4419.0, 16536.0, 122334.0, 725472.0, 150519.0, 18755.0, 4823.0, 1606.0, 657.0, 278.0, 154.0, 94.0, 65.0, 42.0, 32.0, 20.0, 14.0, 7.0, 8.0, 2.0, 6.0, 3.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.72998046875, -0.7052688598632812, -0.6805572509765625, -0.6558456420898438, -0.631134033203125, -0.6064224243164062, -0.5817108154296875, -0.5569992065429688, -0.53228759765625, -0.5075759887695312, -0.4828643798828125, -0.45815277099609375, -0.433441162109375, -0.40872955322265625, -0.3840179443359375, -0.35930633544921875, -0.3345947265625, -0.30988311767578125, -0.2851715087890625, -0.26045989990234375, -0.235748291015625, -0.21103668212890625, -0.1863250732421875, -0.16161346435546875, -0.13690185546875, -0.11219024658203125, -0.0874786376953125, -0.06276702880859375, -0.038055419921875, -0.01334381103515625, 0.0113677978515625, 0.03607940673828125, 0.060791015625, 0.08550262451171875, 0.1102142333984375, 0.13492584228515625, 0.159637451171875, 0.18434906005859375, 0.2090606689453125, 0.23377227783203125, 0.25848388671875, 0.28319549560546875, 0.3079071044921875, 0.33261871337890625, 0.357330322265625, 0.38204193115234375, 0.4067535400390625, 0.43146514892578125, 0.4561767578125, 0.48088836669921875, 0.5055999755859375, 0.5303115844726562, 0.555023193359375, 0.5797348022460938, 0.6044464111328125, 0.6291580200195312, 0.65386962890625, 0.6785812377929688, 0.7032928466796875, 0.7280044555664062, 0.752716064453125, 0.7774276733398438, 0.8021392822265625, 0.8268508911132812, 0.8515625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 6.0, 0.0, 2.0, 9.0, 5.0, 7.0, 7.0, 15.0, 16.0, 32.0, 47.0, 51.0, 80.0, 104.0, 108.0, 110.0, 109.0, 73.0, 62.0, 44.0, 21.0, 20.0, 16.0, 13.0, 6.0, 10.0, 5.0, 4.0, 6.0, 1.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.48779296875, -0.4734382629394531, -0.45908355712890625, -0.4447288513183594, -0.4303741455078125, -0.4160194396972656, -0.40166473388671875, -0.3873100280761719, -0.372955322265625, -0.3586006164550781, -0.34424591064453125, -0.3298912048339844, -0.3155364990234375, -0.3011817932128906, -0.28682708740234375, -0.2724723815917969, -0.25811767578125, -0.24376296997070312, -0.22940826416015625, -0.21505355834960938, -0.2006988525390625, -0.18634414672851562, -0.17198944091796875, -0.15763473510742188, -0.143280029296875, -0.12892532348632812, -0.11457061767578125, -0.10021591186523438, -0.0858612060546875, -0.07150650024414062, -0.05715179443359375, -0.042797088623046875, -0.0284423828125, -0.014087677001953125, 0.00026702880859375, 0.014621734619140625, 0.0289764404296875, 0.043331146240234375, 0.05768585205078125, 0.07204055786132812, 0.086395263671875, 0.10074996948242188, 0.11510467529296875, 0.12945938110351562, 0.1438140869140625, 0.15816879272460938, 0.17252349853515625, 0.18687820434570312, 0.20123291015625, 0.21558761596679688, 0.22994232177734375, 0.24429702758789062, 0.2586517333984375, 0.2730064392089844, 0.28736114501953125, 0.3017158508300781, 0.316070556640625, 0.3304252624511719, 0.34477996826171875, 0.3591346740722656, 0.3734893798828125, 0.3878440856933594, 0.40219879150390625, 0.4165534973144531, 0.430908203125]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 8.0, 6.0, 14.0, 42.0, 96.0, 177.0, 249.0, 205.0, 121.0, 43.0, 16.0, 12.0, 3.0, 5.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.439359664916992, -10.046066284179688, -9.652771949768066, -9.259478569030762, -8.86618423461914, -8.472890853881836, -8.079597473144531, -7.68630313873291, -7.293009281158447, -6.899715423583984, -6.5064215660095215, -6.113127708435059, -5.719834327697754, -5.326539993286133, -4.933246612548828, -4.539952754974365, -4.146658897399902, -3.7533650398254395, -3.3600711822509766, -2.9667775630950928, -2.57348370552063, -2.180189847946167, -1.7868962287902832, -1.3936023712158203, -1.0003085136413574, -0.6070147156715393, -0.2137209177017212, 0.17957282066345215, 0.572866678237915, 0.9661605358123779, 1.3594541549682617, 1.7527480125427246, 2.146042823791504, 2.539336681365967, 2.9326305389404297, 3.3259241580963135, 3.7192180156707764, 4.11251163482666, 4.505805492401123, 4.899099349975586, 5.292393207550049, 5.685687065124512, 6.078980922698975, 6.4722747802734375, 6.865568161010742, 7.258862495422363, 7.652155876159668, 8.045450210571289, 8.438743591308594, 8.832036972045898, 9.22533130645752, 9.618624687194824, 10.011919021606445, 10.40521240234375, 10.798505783081055, 11.191800117492676, 11.585094451904297, 11.978387832641602, 12.371682167053223, 12.764975547790527, 13.158269882202148, 13.551563262939453, 13.944856643676758, 14.338150978088379, 14.731444358825684]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 1.0, 3.0, 2.0, 4.0, 5.0, 7.0, 9.0, 8.0, 17.0, 11.0, 16.0, 19.0, 20.0, 17.0, 30.0, 37.0, 34.0, 37.0, 45.0, 42.0, 39.0, 36.0, 47.0, 34.0, 42.0, 28.0, 46.0, 47.0, 35.0, 36.0, 35.0, 22.0, 24.0, 29.0, 19.0, 18.0, 19.0, 13.0, 16.0, 10.0, 8.0, 11.0, 3.0, 7.0, 3.0, 4.0, 1.0, 3.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.281522750854492, -5.109341144561768, -4.937159538269043, -4.76497745513916, -4.5927958488464355, -4.420614242553711, -4.248432636260986, -4.076251029968262, -3.904069423675537, -3.7318878173828125, -3.559705972671509, -3.387524366378784, -3.2153427600860596, -3.043160915374756, -2.8709793090820312, -2.6987977027893066, -2.526615858078003, -2.3544342517852783, -2.1822524070739746, -2.01007080078125, -1.8378891944885254, -1.6657074689865112, -1.493525743484497, -1.3213441371917725, -1.1491624116897583, -0.9769807457923889, -0.8047990798950195, -0.6326173543930054, -0.460435688495636, -0.2882540225982666, -0.11607229709625244, 0.05610930919647217, 0.22829103469848633, 0.4004727005958557, 0.5726543664932251, 0.7448360919952393, 0.9170177578926086, 1.089199423789978, 1.2613811492919922, 1.4335627555847168, 1.605744481086731, 1.7779262065887451, 1.9501078128814697, 2.1222896575927734, 2.294471263885498, 2.4666528701782227, 2.6388344764709473, 2.811016082763672, 2.9831979274749756, 3.1553795337677, 3.327561378479004, 3.4997429847717285, 3.671924591064453, 3.8441061973571777, 4.016287803649902, 4.188469886779785, 4.36065149307251, 4.532833099365234, 4.705014705657959, 4.877196311950684, 5.049378395080566, 5.221560001373291, 5.393741607666016, 5.56592321395874, 5.738104820251465]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 6.0, 8.0, 6.0, 10.0, 15.0, 13.0, 33.0, 29.0, 45.0, 62.0, 105.0, 85.0, 152.0, 282.0, 451.0, 697.0, 1359.0, 2619.0, 6422.0, 18194.0, 78815.0, 1057207.0, 2894476.0, 98457.0, 20806.0, 7187.0, 3093.0, 1451.0, 823.0, 443.0, 277.0, 191.0, 128.0, 94.0, 63.0, 50.0, 33.0, 24.0, 17.0, 17.0, 10.0, 9.0, 5.0, 6.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.328125, -1.2824249267578125, -1.236724853515625, -1.1910247802734375, -1.14532470703125, -1.0996246337890625, -1.053924560546875, -1.0082244873046875, -0.9625244140625, -0.9168243408203125, -0.871124267578125, -0.8254241943359375, -0.77972412109375, -0.7340240478515625, -0.688323974609375, -0.6426239013671875, -0.596923828125, -0.5512237548828125, -0.505523681640625, -0.4598236083984375, -0.41412353515625, -0.3684234619140625, -0.322723388671875, -0.2770233154296875, -0.2313232421875, -0.1856231689453125, -0.139923095703125, -0.0942230224609375, -0.04852294921875, -0.0028228759765625, 0.042877197265625, 0.0885772705078125, 0.13427734375, 0.1799774169921875, 0.225677490234375, 0.2713775634765625, 0.31707763671875, 0.3627777099609375, 0.408477783203125, 0.4541778564453125, 0.4998779296875, 0.5455780029296875, 0.591278076171875, 0.6369781494140625, 0.68267822265625, 0.7283782958984375, 0.774078369140625, 0.8197784423828125, 0.865478515625, 0.9111785888671875, 0.956878662109375, 1.0025787353515625, 1.04827880859375, 1.0939788818359375, 1.139678955078125, 1.1853790283203125, 1.2310791015625, 1.2767791748046875, 1.322479248046875, 1.3681793212890625, 1.41387939453125, 1.4595794677734375, 1.505279541015625, 1.5509796142578125, 1.5966796875]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 6.0, 6.0, 3.0, 5.0, 22.0, 26.0, 28.0, 40.0, 57.0, 61.0, 72.0, 66.0, 96.0, 83.0, 74.0, 76.0, 71.0, 53.0, 39.0, 32.0, 26.0, 17.0, 11.0, 5.0, 9.0, 6.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.337158203125, -0.3263435363769531, -0.31552886962890625, -0.3047142028808594, -0.2938995361328125, -0.2830848693847656, -0.27227020263671875, -0.2614555358886719, -0.250640869140625, -0.23982620239257812, -0.22901153564453125, -0.21819686889648438, -0.2073822021484375, -0.19656753540039062, -0.18575286865234375, -0.17493820190429688, -0.16412353515625, -0.15330886840820312, -0.14249420166015625, -0.13167953491210938, -0.1208648681640625, -0.11005020141601562, -0.09923553466796875, -0.08842086791992188, -0.077606201171875, -0.06679153442382812, -0.05597686767578125, -0.045162200927734375, -0.0343475341796875, -0.023532867431640625, -0.01271820068359375, -0.001903533935546875, 0.0089111328125, 0.019725799560546875, 0.03054046630859375, 0.041355133056640625, 0.0521697998046875, 0.06298446655273438, 0.07379913330078125, 0.08461380004882812, 0.095428466796875, 0.10624313354492188, 0.11705780029296875, 0.12787246704101562, 0.1386871337890625, 0.14950180053710938, 0.16031646728515625, 0.17113113403320312, 0.18194580078125, 0.19276046752929688, 0.20357513427734375, 0.21438980102539062, 0.2252044677734375, 0.23601913452148438, 0.24683380126953125, 0.2576484680175781, 0.268463134765625, 0.2792778015136719, 0.29009246826171875, 0.3009071350097656, 0.3117218017578125, 0.3225364685058594, 0.33335113525390625, 0.3441658020019531, 0.35498046875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 3.0, 4.0, 10.0, 18.0, 22.0, 32.0, 52.0, 97.0, 139.0, 229.0, 458.0, 1166.0, 3680.0, 16582.0, 172258.0, 3748826.0, 226760.0, 18433.0, 3475.0, 1108.0, 436.0, 199.0, 105.0, 78.0, 27.0, 28.0, 20.0, 15.0, 8.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.09765625, -2.03692626953125, -1.9761962890625, -1.91546630859375, -1.854736328125, -1.79400634765625, -1.7332763671875, -1.67254638671875, -1.61181640625, -1.55108642578125, -1.4903564453125, -1.42962646484375, -1.368896484375, -1.30816650390625, -1.2474365234375, -1.18670654296875, -1.1259765625, -1.06524658203125, -1.0045166015625, -0.94378662109375, -0.883056640625, -0.82232666015625, -0.7615966796875, -0.70086669921875, -0.64013671875, -0.57940673828125, -0.5186767578125, -0.45794677734375, -0.397216796875, -0.33648681640625, -0.2757568359375, -0.21502685546875, -0.154296875, -0.09356689453125, -0.0328369140625, 0.02789306640625, 0.088623046875, 0.14935302734375, 0.2100830078125, 0.27081298828125, 0.33154296875, 0.39227294921875, 0.4530029296875, 0.51373291015625, 0.574462890625, 0.63519287109375, 0.6959228515625, 0.75665283203125, 0.8173828125, 0.87811279296875, 0.9388427734375, 0.99957275390625, 1.060302734375, 1.12103271484375, 1.1817626953125, 1.24249267578125, 1.30322265625, 1.36395263671875, 1.4246826171875, 1.48541259765625, 1.546142578125, 1.60687255859375, 1.6676025390625, 1.72833251953125, 1.7890625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 4.0, 4.0, 6.0, 9.0, 11.0, 24.0, 21.0, 30.0, 77.0, 98.0, 171.0, 437.0, 1496.0, 887.0, 365.0, 184.0, 93.0, 63.0, 33.0, 20.0, 17.0, 7.0, 6.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.50634765625, -0.4936408996582031, -0.48093414306640625, -0.4682273864746094, -0.4555206298828125, -0.4428138732910156, -0.43010711669921875, -0.4174003601074219, -0.404693603515625, -0.3919868469238281, -0.37928009033203125, -0.3665733337402344, -0.3538665771484375, -0.3411598205566406, -0.32845306396484375, -0.3157463073730469, -0.30303955078125, -0.2903327941894531, -0.27762603759765625, -0.2649192810058594, -0.2522125244140625, -0.23950576782226562, -0.22679901123046875, -0.21409225463867188, -0.201385498046875, -0.18867874145507812, -0.17597198486328125, -0.16326522827148438, -0.1505584716796875, -0.13785171508789062, -0.12514495849609375, -0.11243820190429688, -0.0997314453125, -0.08702468872070312, -0.07431793212890625, -0.061611175537109375, -0.0489044189453125, -0.036197662353515625, -0.02349090576171875, -0.010784149169921875, 0.001922607421875, 0.014629364013671875, 0.02733612060546875, 0.040042877197265625, 0.0527496337890625, 0.06545639038085938, 0.07816314697265625, 0.09086990356445312, 0.10357666015625, 0.11628341674804688, 0.12899017333984375, 0.14169692993164062, 0.1544036865234375, 0.16711044311523438, 0.17981719970703125, 0.19252395629882812, 0.205230712890625, 0.21793746948242188, 0.23064422607421875, 0.24335098266601562, 0.2560577392578125, 0.2687644958496094, 0.28147125244140625, 0.2941780090332031, 0.306884765625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 7.0, 6.0, 26.0, 72.0, 156.0, 182.0, 193.0, 177.0, 105.0, 44.0, 23.0, 6.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.639739990234375, -4.539134502410889, -4.438528537750244, -4.337923049926758, -4.237317085266113, -4.136711597442627, -4.036106109619141, -3.935500144958496, -3.8348946571350098, -3.7342889308929443, -3.633683204650879, -3.5330777168273926, -3.432471990585327, -3.3318662643432617, -3.2312605381011963, -3.130654811859131, -3.0300493240356445, -2.929443597793579, -2.8288378715515137, -2.7282323837280273, -2.627626657485962, -2.5270209312438965, -2.426415205001831, -2.3258094787597656, -2.2252037525177, -2.1245980262756348, -2.0239923000335693, -1.9233866930007935, -1.8227810859680176, -1.7221753597259521, -1.6215696334838867, -1.5209640264511108, -1.420358419418335, -1.3197526931762695, -1.2191470861434937, -1.1185413599014282, -1.0179357528686523, -0.9173300266265869, -0.8167243599891663, -0.7161186933517456, -0.615513026714325, -0.5149073600769043, -0.41430169343948364, -0.3136959969997406, -0.21309033036231995, -0.1124846339225769, -0.01187896728515625, 0.0887266993522644, 0.18933236598968506, 0.2899380326271057, 0.39054369926452637, 0.4911493957042694, 0.5917550325393677, 0.6923607587814331, 0.7929664254188538, 0.8935720920562744, 0.9941777586936951, 1.0947834253311157, 1.1953891515731812, 1.295994758605957, 1.3966004848480225, 1.497206211090088, 1.5978118181228638, 1.6984174251556396, 1.799023151397705]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 4.0, 6.0, 7.0, 4.0, 8.0, 10.0, 9.0, 10.0, 13.0, 25.0, 16.0, 24.0, 16.0, 31.0, 35.0, 41.0, 39.0, 34.0, 34.0, 41.0, 46.0, 56.0, 35.0, 43.0, 38.0, 46.0, 37.0, 36.0, 35.0, 37.0, 33.0, 29.0, 10.0, 21.0, 17.0, 22.0, 15.0, 10.0, 6.0, 7.0, 6.0, 7.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.938157320022583, -0.9063146114349365, -0.87447190284729, -0.8426291942596436, -0.8107865452766418, -0.7789438366889954, -0.7471011281013489, -0.7152584195137024, -0.6834157705307007, -0.6515730619430542, -0.6197303533554077, -0.5878876447677612, -0.5560449957847595, -0.524202287197113, -0.49235957860946655, -0.46051687002182007, -0.4286741614341736, -0.3968314528465271, -0.364988774061203, -0.3331460654735565, -0.3013033866882324, -0.26946067810058594, -0.23761796951293945, -0.20577527582645416, -0.17393258213996887, -0.14208988845348358, -0.1102471873164177, -0.0784044861793518, -0.046561792492866516, -0.014719098806381226, 0.01712360978126526, 0.04896630346775055, 0.08080899715423584, 0.11265169084072113, 0.14449438452720642, 0.1763370931148529, 0.2081797868013382, 0.2400224804878235, 0.27186518907546997, 0.30370789766311646, 0.33555057644844055, 0.36739328503608704, 0.39923596382141113, 0.4310786724090576, 0.4629213809967041, 0.4947640597820282, 0.5266067981719971, 0.5584494471549988, 0.5902921557426453, 0.6221348643302917, 0.6539775729179382, 0.6858202219009399, 0.7176629304885864, 0.7495056390762329, 0.7813483476638794, 0.8131910562515259, 0.8450337648391724, 0.8768764734268188, 0.9087191820144653, 0.9405618906021118, 0.9724045395851135, 1.0042471885681152, 1.0360898971557617, 1.0679326057434082, 1.0997753143310547]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 5.0, 2.0, 7.0, 6.0, 7.0, 15.0, 14.0, 20.0, 34.0, 43.0, 72.0, 95.0, 134.0, 198.0, 301.0, 462.0, 713.0, 1170.0, 2001.0, 3642.0, 8026.0, 21909.0, 71728.0, 238188.0, 411015.0, 197377.0, 58344.0, 17936.0, 6900.0, 3349.0, 1814.0, 1028.0, 688.0, 399.0, 296.0, 184.0, 136.0, 101.0, 61.0, 35.0, 27.0, 13.0, 19.0, 14.0, 7.0, 6.0, 1.0, 2.0, 2.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.099609375, -1.064605712890625, -1.02960205078125, -0.994598388671875, -0.9595947265625, -0.924591064453125, -0.88958740234375, -0.854583740234375, -0.819580078125, -0.784576416015625, -0.74957275390625, -0.714569091796875, -0.6795654296875, -0.644561767578125, -0.60955810546875, -0.574554443359375, -0.53955078125, -0.504547119140625, -0.46954345703125, -0.434539794921875, -0.3995361328125, -0.364532470703125, -0.32952880859375, -0.294525146484375, -0.259521484375, -0.224517822265625, -0.18951416015625, -0.154510498046875, -0.1195068359375, -0.084503173828125, -0.04949951171875, -0.014495849609375, 0.0205078125, 0.055511474609375, 0.09051513671875, 0.125518798828125, 0.1605224609375, 0.195526123046875, 0.23052978515625, 0.265533447265625, 0.300537109375, 0.335540771484375, 0.37054443359375, 0.405548095703125, 0.4405517578125, 0.475555419921875, 0.51055908203125, 0.545562744140625, 0.58056640625, 0.615570068359375, 0.65057373046875, 0.685577392578125, 0.7205810546875, 0.755584716796875, 0.79058837890625, 0.825592041015625, 0.860595703125, 0.895599365234375, 0.93060302734375, 0.965606689453125, 1.0006103515625, 1.035614013671875, 1.07061767578125, 1.105621337890625, 1.140625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 5.0, 4.0, 3.0, 14.0, 20.0, 24.0, 36.0, 40.0, 47.0, 71.0, 69.0, 74.0, 91.0, 96.0, 81.0, 74.0, 67.0, 57.0, 31.0, 31.0, 19.0, 17.0, 8.0, 3.0, 6.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.333740234375, -0.3229331970214844, -0.31212615966796875, -0.3013191223144531, -0.2905120849609375, -0.2797050476074219, -0.26889801025390625, -0.2580909729003906, -0.247283935546875, -0.23647689819335938, -0.22566986083984375, -0.21486282348632812, -0.2040557861328125, -0.19324874877929688, -0.18244171142578125, -0.17163467407226562, -0.16082763671875, -0.15002059936523438, -0.13921356201171875, -0.12840652465820312, -0.1175994873046875, -0.10679244995117188, -0.09598541259765625, -0.08517837524414062, -0.074371337890625, -0.06356430053710938, -0.05275726318359375, -0.041950225830078125, -0.0311431884765625, -0.020336151123046875, -0.00952911376953125, 0.001277923583984375, 0.0120849609375, 0.022891998291015625, 0.03369903564453125, 0.044506072998046875, 0.0553131103515625, 0.06612014770507812, 0.07692718505859375, 0.08773422241210938, 0.098541259765625, 0.10934829711914062, 0.12015533447265625, 0.13096237182617188, 0.1417694091796875, 0.15257644653320312, 0.16338348388671875, 0.17419052124023438, 0.18499755859375, 0.19580459594726562, 0.20661163330078125, 0.21741867065429688, 0.2282257080078125, 0.23903274536132812, 0.24983978271484375, 0.2606468200683594, 0.271453857421875, 0.2822608947753906, 0.29306793212890625, 0.3038749694824219, 0.3146820068359375, 0.3254890441894531, 0.33629608154296875, 0.3471031188964844, 0.35791015625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 10.0, 5.0, 12.0, 9.0, 27.0, 29.0, 55.0, 74.0, 157.0, 232.0, 402.0, 836.0, 1929.0, 5086.0, 16341.0, 67130.0, 303163.0, 470838.0, 137765.0, 30562.0, 8469.0, 2942.0, 1206.0, 584.0, 301.0, 156.0, 86.0, 52.0, 42.0, 16.0, 20.0, 15.0, 5.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-1.6181640625, -1.57794189453125, -1.5377197265625, -1.49749755859375, -1.457275390625, -1.41705322265625, -1.3768310546875, -1.33660888671875, -1.29638671875, -1.25616455078125, -1.2159423828125, -1.17572021484375, -1.135498046875, -1.09527587890625, -1.0550537109375, -1.01483154296875, -0.974609375, -0.93438720703125, -0.8941650390625, -0.85394287109375, -0.813720703125, -0.77349853515625, -0.7332763671875, -0.69305419921875, -0.65283203125, -0.61260986328125, -0.5723876953125, -0.53216552734375, -0.491943359375, -0.45172119140625, -0.4114990234375, -0.37127685546875, -0.3310546875, -0.29083251953125, -0.2506103515625, -0.21038818359375, -0.170166015625, -0.12994384765625, -0.0897216796875, -0.04949951171875, -0.00927734375, 0.03094482421875, 0.0711669921875, 0.11138916015625, 0.151611328125, 0.19183349609375, 0.2320556640625, 0.27227783203125, 0.3125, 0.35272216796875, 0.3929443359375, 0.43316650390625, 0.473388671875, 0.51361083984375, 0.5538330078125, 0.59405517578125, 0.63427734375, 0.67449951171875, 0.7147216796875, 0.75494384765625, 0.795166015625, 0.83538818359375, 0.8756103515625, 0.91583251953125, 0.9560546875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 7.0, 5.0, 5.0, 3.0, 5.0, 11.0, 6.0, 15.0, 9.0, 11.0, 24.0, 21.0, 24.0, 18.0, 27.0, 30.0, 28.0, 36.0, 57.0, 42.0, 37.0, 32.0, 46.0, 34.0, 47.0, 32.0, 41.0, 45.0, 32.0, 36.0, 34.0, 29.0, 19.0, 28.0, 27.0, 19.0, 12.0, 16.0, 12.0, 9.0, 7.0, 10.0, 4.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.90087890625, -0.8718948364257812, -0.8429107666015625, -0.8139266967773438, -0.784942626953125, -0.7559585571289062, -0.7269744873046875, -0.6979904174804688, -0.66900634765625, -0.6400222778320312, -0.6110382080078125, -0.5820541381835938, -0.553070068359375, -0.5240859985351562, -0.4951019287109375, -0.46611785888671875, -0.4371337890625, -0.40814971923828125, -0.3791656494140625, -0.35018157958984375, -0.321197509765625, -0.29221343994140625, -0.2632293701171875, -0.23424530029296875, -0.20526123046875, -0.17627716064453125, -0.1472930908203125, -0.11830902099609375, -0.089324951171875, -0.06034088134765625, -0.0313568115234375, -0.00237274169921875, 0.026611328125, 0.05559539794921875, 0.0845794677734375, 0.11356353759765625, 0.142547607421875, 0.17153167724609375, 0.2005157470703125, 0.22949981689453125, 0.25848388671875, 0.28746795654296875, 0.3164520263671875, 0.34543609619140625, 0.374420166015625, 0.40340423583984375, 0.4323883056640625, 0.46137237548828125, 0.4903564453125, 0.5193405151367188, 0.5483245849609375, 0.5773086547851562, 0.606292724609375, 0.6352767944335938, 0.6642608642578125, 0.6932449340820312, 0.72222900390625, 0.7512130737304688, 0.7801971435546875, 0.8091812133789062, 0.838165283203125, 0.8671493530273438, 0.8961334228515625, 0.9251174926757812, 0.9541015625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 3.0, 4.0, 7.0, 11.0, 22.0, 18.0, 41.0, 49.0, 104.0, 154.0, 323.0, 671.0, 1641.0, 5235.0, 23802.0, 202467.0, 664756.0, 125802.0, 16670.0, 4124.0, 1463.0, 573.0, 300.0, 125.0, 65.0, 45.0, 22.0, 14.0, 12.0, 9.0, 7.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.74755859375, -0.7264404296875, -0.705322265625, -0.6842041015625, -0.6630859375, -0.6419677734375, -0.620849609375, -0.5997314453125, -0.57861328125, -0.5574951171875, -0.536376953125, -0.5152587890625, -0.494140625, -0.4730224609375, -0.451904296875, -0.4307861328125, -0.40966796875, -0.3885498046875, -0.367431640625, -0.3463134765625, -0.3251953125, -0.3040771484375, -0.282958984375, -0.2618408203125, -0.24072265625, -0.2196044921875, -0.198486328125, -0.1773681640625, -0.15625, -0.1351318359375, -0.114013671875, -0.0928955078125, -0.07177734375, -0.0506591796875, -0.029541015625, -0.0084228515625, 0.0126953125, 0.0338134765625, 0.054931640625, 0.0760498046875, 0.09716796875, 0.1182861328125, 0.139404296875, 0.1605224609375, 0.181640625, 0.2027587890625, 0.223876953125, 0.2449951171875, 0.26611328125, 0.2872314453125, 0.308349609375, 0.3294677734375, 0.3505859375, 0.3717041015625, 0.392822265625, 0.4139404296875, 0.43505859375, 0.4561767578125, 0.477294921875, 0.4984130859375, 0.51953125, 0.5406494140625, 0.561767578125, 0.5828857421875, 0.60400390625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 6.0, 6.0, 9.0, 13.0, 21.0, 30.0, 44.0, 58.0, 76.0, 112.0, 121.0, 89.0, 126.0, 77.0, 50.0, 47.0, 32.0, 21.0, 13.0, 11.0, 16.0, 5.0, 8.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0001442432403564453, -0.00014064554125070572, -0.00013704784214496613, -0.00013345014303922653, -0.00012985244393348694, -0.00012625474482774734, -0.00012265704572200775, -0.00011905934661626816, -0.00011546164751052856, -0.00011186394840478897, -0.00010826624929904938, -0.00010466855019330978, -0.00010107085108757019, -9.74731519818306e-05, -9.3875452876091e-05, -9.027775377035141e-05, -8.668005466461182e-05, -8.308235555887222e-05, -7.948465645313263e-05, -7.588695734739304e-05, -7.228925824165344e-05, -6.869155913591385e-05, -6.509386003017426e-05, -6.149616092443466e-05, -5.789846181869507e-05, -5.4300762712955475e-05, -5.070306360721588e-05, -4.710536450147629e-05, -4.3507665395736694e-05, -3.99099662899971e-05, -3.631226718425751e-05, -3.2714568078517914e-05, -2.911686897277832e-05, -2.5519169867038727e-05, -2.1921470761299133e-05, -1.832377165555954e-05, -1.4726072549819946e-05, -1.1128373444080353e-05, -7.530674338340759e-06, -3.932975232601166e-06, -3.3527612686157227e-07, 3.2624229788780212e-06, 6.860122084617615e-06, 1.0457821190357208e-05, 1.4055520296096802e-05, 1.7653219401836395e-05, 2.125091850757599e-05, 2.4848617613315582e-05, 2.8446316719055176e-05, 3.204401582479477e-05, 3.564171493053436e-05, 3.9239414036273956e-05, 4.283711314201355e-05, 4.643481224775314e-05, 5.003251135349274e-05, 5.363021045923233e-05, 5.7227909564971924e-05, 6.082560867071152e-05, 6.442330777645111e-05, 6.80210068821907e-05, 7.16187059879303e-05, 7.521640509366989e-05, 7.881410419940948e-05, 8.241180330514908e-05, 8.600950241088867e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 4.0, 5.0, 7.0, 12.0, 18.0, 28.0, 28.0, 55.0, 76.0, 131.0, 266.0, 468.0, 911.0, 2225.0, 6488.0, 26760.0, 179855.0, 612595.0, 181145.0, 26556.0, 6489.0, 2298.0, 1017.0, 473.0, 234.0, 143.0, 93.0, 51.0, 44.0, 20.0, 19.0, 11.0, 9.0, 8.0, 1.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.609375, -0.5917129516601562, -0.5740509033203125, -0.5563888549804688, -0.538726806640625, -0.5210647583007812, -0.5034027099609375, -0.48574066162109375, -0.46807861328125, -0.45041656494140625, -0.4327545166015625, -0.41509246826171875, -0.397430419921875, -0.37976837158203125, -0.3621063232421875, -0.34444427490234375, -0.3267822265625, -0.30912017822265625, -0.2914581298828125, -0.27379608154296875, -0.256134033203125, -0.23847198486328125, -0.2208099365234375, -0.20314788818359375, -0.18548583984375, -0.16782379150390625, -0.1501617431640625, -0.13249969482421875, -0.114837646484375, -0.09717559814453125, -0.0795135498046875, -0.06185150146484375, -0.044189453125, -0.02652740478515625, -0.0088653564453125, 0.00879669189453125, 0.026458740234375, 0.04412078857421875, 0.0617828369140625, 0.07944488525390625, 0.09710693359375, 0.11476898193359375, 0.1324310302734375, 0.15009307861328125, 0.167755126953125, 0.18541717529296875, 0.2030792236328125, 0.22074127197265625, 0.2384033203125, 0.25606536865234375, 0.2737274169921875, 0.29138946533203125, 0.309051513671875, 0.32671356201171875, 0.3443756103515625, 0.36203765869140625, 0.37969970703125, 0.39736175537109375, 0.4150238037109375, 0.43268585205078125, 0.450347900390625, 0.46800994873046875, 0.4856719970703125, 0.5033340454101562, 0.52099609375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 7.0, 7.0, 6.0, 12.0, 12.0, 19.0, 22.0, 34.0, 30.0, 47.0, 77.0, 73.0, 80.0, 114.0, 94.0, 89.0, 73.0, 56.0, 48.0, 33.0, 20.0, 14.0, 9.0, 7.0, 7.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.384521484375, -0.3719673156738281, -0.35941314697265625, -0.3468589782714844, -0.3343048095703125, -0.3217506408691406, -0.30919647216796875, -0.2966423034667969, -0.284088134765625, -0.2715339660644531, -0.25897979736328125, -0.24642562866210938, -0.2338714599609375, -0.22131729125976562, -0.20876312255859375, -0.19620895385742188, -0.18365478515625, -0.17110061645507812, -0.15854644775390625, -0.14599227905273438, -0.1334381103515625, -0.12088394165039062, -0.10832977294921875, -0.09577560424804688, -0.083221435546875, -0.07066726684570312, -0.05811309814453125, -0.045558929443359375, -0.0330047607421875, -0.020450592041015625, -0.00789642333984375, 0.004657745361328125, 0.0172119140625, 0.029766082763671875, 0.04232025146484375, 0.054874420166015625, 0.0674285888671875, 0.07998275756835938, 0.09253692626953125, 0.10509109497070312, 0.117645263671875, 0.13019943237304688, 0.14275360107421875, 0.15530776977539062, 0.1678619384765625, 0.18041610717773438, 0.19297027587890625, 0.20552444458007812, 0.21807861328125, 0.23063278198242188, 0.24318695068359375, 0.2557411193847656, 0.2682952880859375, 0.2808494567871094, 0.29340362548828125, 0.3059577941894531, 0.318511962890625, 0.3310661315917969, 0.34362030029296875, 0.3561744689941406, 0.3687286376953125, 0.3812828063964844, 0.39383697509765625, 0.4063911437988281, 0.4189453125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 5.0, 10.0, 10.0, 17.0, 37.0, 85.0, 132.0, 158.0, 183.0, 167.0, 77.0, 56.0, 30.0, 17.0, 11.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.751825332641602, -15.44526195526123, -15.13869857788086, -14.832135200500488, -14.525571823120117, -14.21900749206543, -13.912444114685059, -13.605880737304688, -13.299317359924316, -12.992753982543945, -12.686190605163574, -12.379627227783203, -12.073062896728516, -11.766499519348145, -11.459936141967773, -11.153372764587402, -10.846809387207031, -10.54024600982666, -10.233682632446289, -9.927119255065918, -9.620555877685547, -9.31399154663086, -9.007428169250488, -8.700864791870117, -8.394301414489746, -8.087738037109375, -7.781174659729004, -7.474610805511475, -7.1680474281311035, -6.861484050750732, -6.554920196533203, -6.248356819152832, -5.941794395446777, -5.635231018066406, -5.328667640686035, -5.022103786468506, -4.715540409088135, -4.408977031707764, -4.102413177490234, -3.7958498001098633, -3.489286422729492, -3.182723045349121, -2.876159429550171, -2.5695958137512207, -2.2630324363708496, -1.956468939781189, -1.6499054431915283, -1.3433418273925781, -1.036778450012207, -0.7302149534225464, -0.42365145683288574, -0.1170879602432251, 0.18947553634643555, 0.4960390329360962, 0.8026025295257568, 1.109166145324707, 1.4157295227050781, 1.7222930192947388, 2.0288565158843994, 2.3354201316833496, 2.6419835090637207, 2.948546886444092, 3.255110502243042, 3.561674118041992, 3.8682374954223633]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 8.0, 6.0, 10.0, 9.0, 18.0, 22.0, 14.0, 24.0, 43.0, 35.0, 50.0, 49.0, 61.0, 70.0, 61.0, 68.0, 64.0, 56.0, 62.0, 48.0, 42.0, 47.0, 33.0, 23.0, 19.0, 15.0, 13.0, 15.0, 4.0, 7.0, 2.0, 5.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.669235229492188, -8.42377758026123, -8.17832088470459, -7.932863235473633, -7.687406063079834, -7.441948890686035, -7.196491241455078, -6.951034069061279, -6.7055768966674805, -6.460119724273682, -6.214662075042725, -5.969204902648926, -5.723747730255127, -5.478290557861328, -5.232832908630371, -4.987375736236572, -4.741918563842773, -4.496461391448975, -4.251003742218018, -4.005546569824219, -3.76008939743042, -3.514631986618042, -3.269174575805664, -3.0237174034118652, -2.778259754180908, -2.5328023433685303, -2.2873451709747314, -2.0418877601623535, -1.7964305877685547, -1.5509731769561768, -1.3055158853530884, -1.06005859375, -0.8146014213562012, -0.5691441297531128, -0.323686808347702, -0.07822948694229126, 0.16722780466079712, 0.4126851558685303, 0.6581424474716187, 0.903599739074707, 1.1490570306777954, 1.3945143222808838, 1.6399716138839722, 1.8854289054870605, 2.1308863162994385, 2.3763437271118164, 2.6218008995056152, 2.867258071899414, 3.112715482711792, 3.35817289352417, 3.6036300659179688, 3.8490874767303467, 4.094544887542725, 4.340002059936523, 4.585459232330322, 4.830916404724121, 5.076374053955078, 5.321831226348877, 5.567288875579834, 5.812746047973633, 6.058203220367432, 6.3036603927612305, 6.5491180419921875, 6.794575214385986, 7.040032386779785]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 5.0, 1.0, 2.0, 2.0, 6.0, 4.0, 2.0, 6.0, 5.0, 8.0, 12.0, 18.0, 23.0, 30.0, 56.0, 73.0, 119.0, 190.0, 347.0, 659.0, 1304.0, 2822.0, 8086.0, 36410.0, 439722.0, 3555571.0, 121322.0, 17875.0, 5197.0, 2104.0, 981.0, 489.0, 284.0, 199.0, 109.0, 72.0, 44.0, 33.0, 27.0, 15.0, 18.0, 7.0, 4.0, 3.0, 11.0, 3.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8994140625, -1.8345489501953125, -1.769683837890625, -1.7048187255859375, -1.63995361328125, -1.5750885009765625, -1.510223388671875, -1.4453582763671875, -1.3804931640625, -1.3156280517578125, -1.250762939453125, -1.1858978271484375, -1.12103271484375, -1.0561676025390625, -0.991302490234375, -0.9264373779296875, -0.861572265625, -0.7967071533203125, -0.731842041015625, -0.6669769287109375, -0.60211181640625, -0.5372467041015625, -0.472381591796875, -0.4075164794921875, -0.3426513671875, -0.2777862548828125, -0.212921142578125, -0.1480560302734375, -0.08319091796875, -0.0183258056640625, 0.046539306640625, 0.1114044189453125, 0.17626953125, 0.2411346435546875, 0.305999755859375, 0.3708648681640625, 0.43572998046875, 0.5005950927734375, 0.565460205078125, 0.6303253173828125, 0.6951904296875, 0.7600555419921875, 0.824920654296875, 0.8897857666015625, 0.95465087890625, 1.0195159912109375, 1.084381103515625, 1.1492462158203125, 1.214111328125, 1.2789764404296875, 1.343841552734375, 1.4087066650390625, 1.47357177734375, 1.5384368896484375, 1.603302001953125, 1.6681671142578125, 1.7330322265625, 1.7978973388671875, 1.862762451171875, 1.9276275634765625, 1.99249267578125, 2.0573577880859375, 2.122222900390625, 2.1870880126953125, 2.251953125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 3.0, 10.0, 8.0, 13.0, 32.0, 36.0, 51.0, 64.0, 75.0, 90.0, 82.0, 100.0, 105.0, 81.0, 65.0, 60.0, 41.0, 21.0, 13.0, 12.0, 15.0, 4.0, 2.0, 8.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.387939453125, -0.3755149841308594, -0.36309051513671875, -0.3506660461425781, -0.3382415771484375, -0.3258171081542969, -0.31339263916015625, -0.3009681701660156, -0.288543701171875, -0.2761192321777344, -0.26369476318359375, -0.2512702941894531, -0.2388458251953125, -0.22642135620117188, -0.21399688720703125, -0.20157241821289062, -0.18914794921875, -0.17672348022460938, -0.16429901123046875, -0.15187454223632812, -0.1394500732421875, -0.12702560424804688, -0.11460113525390625, -0.10217666625976562, -0.089752197265625, -0.07732772827148438, -0.06490325927734375, -0.052478790283203125, -0.0400543212890625, -0.027629852294921875, -0.01520538330078125, -0.002780914306640625, 0.0096435546875, 0.022068023681640625, 0.03449249267578125, 0.046916961669921875, 0.0593414306640625, 0.07176589965820312, 0.08419036865234375, 0.09661483764648438, 0.109039306640625, 0.12146377563476562, 0.13388824462890625, 0.14631271362304688, 0.1587371826171875, 0.17116165161132812, 0.18358612060546875, 0.19601058959960938, 0.20843505859375, 0.22085952758789062, 0.23328399658203125, 0.24570846557617188, 0.2581329345703125, 0.2705574035644531, 0.28298187255859375, 0.2954063415527344, 0.307830810546875, 0.3202552795410156, 0.33267974853515625, 0.3451042175292969, 0.3575286865234375, 0.3699531555175781, 0.38237762451171875, 0.3948020935058594, 0.4072265625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 3.0, 4.0, 3.0, 6.0, 11.0, 22.0, 24.0, 46.0, 60.0, 158.0, 326.0, 764.0, 2221.0, 8743.0, 82119.0, 3901128.0, 182185.0, 12193.0, 2783.0, 854.0, 320.0, 138.0, 75.0, 25.0, 24.0, 17.0, 12.0, 6.0, 7.0, 2.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.19140625, -2.09857177734375, -2.0057373046875, -1.91290283203125, -1.820068359375, -1.72723388671875, -1.6343994140625, -1.54156494140625, -1.44873046875, -1.35589599609375, -1.2630615234375, -1.17022705078125, -1.077392578125, -0.98455810546875, -0.8917236328125, -0.79888916015625, -0.7060546875, -0.61322021484375, -0.5203857421875, -0.42755126953125, -0.334716796875, -0.24188232421875, -0.1490478515625, -0.05621337890625, 0.03662109375, 0.12945556640625, 0.2222900390625, 0.31512451171875, 0.407958984375, 0.50079345703125, 0.5936279296875, 0.68646240234375, 0.779296875, 0.87213134765625, 0.9649658203125, 1.05780029296875, 1.150634765625, 1.24346923828125, 1.3363037109375, 1.42913818359375, 1.52197265625, 1.61480712890625, 1.7076416015625, 1.80047607421875, 1.893310546875, 1.98614501953125, 2.0789794921875, 2.17181396484375, 2.2646484375, 2.35748291015625, 2.4503173828125, 2.54315185546875, 2.635986328125, 2.72882080078125, 2.8216552734375, 2.91448974609375, 3.00732421875, 3.10015869140625, 3.1929931640625, 3.28582763671875, 3.378662109375, 3.47149658203125, 3.5643310546875, 3.65716552734375, 3.75]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 8.0, 11.0, 15.0, 23.0, 32.0, 42.0, 102.0, 191.0, 444.0, 1305.0, 1074.0, 403.0, 167.0, 92.0, 57.0, 34.0, 20.0, 8.0, 7.0, 12.0, 4.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.8203125, -0.7974929809570312, -0.7746734619140625, -0.7518539428710938, -0.729034423828125, -0.7062149047851562, -0.6833953857421875, -0.6605758666992188, -0.63775634765625, -0.6149368286132812, -0.5921173095703125, -0.5692977905273438, -0.546478271484375, -0.5236587524414062, -0.5008392333984375, -0.47801971435546875, -0.4552001953125, -0.43238067626953125, -0.4095611572265625, -0.38674163818359375, -0.363922119140625, -0.34110260009765625, -0.3182830810546875, -0.29546356201171875, -0.27264404296875, -0.24982452392578125, -0.2270050048828125, -0.20418548583984375, -0.181365966796875, -0.15854644775390625, -0.1357269287109375, -0.11290740966796875, -0.090087890625, -0.06726837158203125, -0.0444488525390625, -0.02162933349609375, 0.001190185546875, 0.02400970458984375, 0.0468292236328125, 0.06964874267578125, 0.09246826171875, 0.11528778076171875, 0.1381072998046875, 0.16092681884765625, 0.183746337890625, 0.20656585693359375, 0.2293853759765625, 0.25220489501953125, 0.2750244140625, 0.29784393310546875, 0.3206634521484375, 0.34348297119140625, 0.366302490234375, 0.38912200927734375, 0.4119415283203125, 0.43476104736328125, 0.45758056640625, 0.48040008544921875, 0.5032196044921875, 0.5260391235351562, 0.548858642578125, 0.5716781616210938, 0.5944976806640625, 0.6173171997070312, 0.64013671875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 2.0, 4.0, 8.0, 16.0, 49.0, 115.0, 225.0, 266.0, 184.0, 79.0, 33.0, 13.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.487597465515137, -8.282448768615723, -8.077301025390625, -7.872152328491211, -7.667003631591797, -7.461855411529541, -7.256707191467285, -7.051558494567871, -6.846410274505615, -6.641262054443359, -6.436113357543945, -6.2309651374816895, -6.025816917419434, -5.8206682205200195, -5.615520000457764, -5.410371780395508, -5.205223083496094, -5.000074863433838, -4.794926166534424, -4.589777946472168, -4.384629249572754, -4.179481029510498, -3.974332809448242, -3.7691843509674072, -3.5640358924865723, -3.3588874340057373, -3.1537389755249023, -2.9485907554626465, -2.7434422969818115, -2.5382938385009766, -2.3331456184387207, -2.1279971599578857, -1.922849178314209, -1.717700719833374, -1.5125523805618286, -1.3074040412902832, -1.1022555828094482, -0.8971071243286133, -0.6919587850570679, -0.48681044578552246, -0.2816619873046875, -0.07651358842849731, 0.12863481044769287, 0.33378320932388306, 0.5389316082000732, 0.7440800666809082, 0.9492284059524536, 1.154376745223999, 1.359525203704834, 1.564673662185669, 1.7698220014572144, 1.9749703407287598, 2.1801187992095947, 2.3852672576904297, 2.5904154777526855, 2.7955639362335205, 3.0007123947143555, 3.2058608531951904, 3.4110093116760254, 3.6161575317382812, 3.821305990219116, 4.026454448699951, 4.231602668762207, 4.436751365661621, 4.641899585723877]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 7.0, 3.0, 3.0, 8.0, 5.0, 10.0, 19.0, 29.0, 34.0, 40.0, 48.0, 63.0, 56.0, 82.0, 59.0, 61.0, 57.0, 59.0, 60.0, 59.0, 49.0, 48.0, 33.0, 32.0, 17.0, 23.0, 11.0, 15.0, 6.0, 2.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0690722465515137, -1.9785453081130981, -1.888018250465393, -1.7974913120269775, -1.706964373588562, -1.6164374351501465, -1.5259103775024414, -1.4353834390640259, -1.3448565006256104, -1.2543295621871948, -1.1638025045394897, -1.0732755661010742, -0.9827486276626587, -0.8922216296195984, -0.8016946315765381, -0.7111676931381226, -0.6206406354904175, -0.5301136374473572, -0.43958669900894165, -0.34905970096588135, -0.25853273272514343, -0.16800576448440552, -0.07747876644134521, 0.013048171997070312, 0.10357517004013062, 0.19410213828086853, 0.28462910652160645, 0.37515610456466675, 0.46568307280540466, 0.5562100410461426, 0.6467370390892029, 0.7372639775276184, 0.8277909755706787, 0.918317973613739, 1.0088449716567993, 1.0993719100952148, 1.1898988485336304, 1.280425786972046, 1.370952844619751, 1.4614797830581665, 1.552006721496582, 1.6425336599349976, 1.7330607175827026, 1.8235876560211182, 1.9141145944595337, 2.004641532897949, 2.0951685905456543, 2.1856956481933594, 2.2762227058410645, 2.3667497634887695, 2.4572765827178955, 2.5478036403656006, 2.6383306980133057, 2.7288575172424316, 2.8193845748901367, 2.909911632537842, 3.0004384517669678, 3.090965509414673, 3.181492328643799, 3.272019386291504, 3.362546443939209, 3.453073263168335, 3.54360032081604, 3.634127140045166, 3.724654197692871]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 8.0, 7.0, 12.0, 15.0, 14.0, 18.0, 31.0, 46.0, 70.0, 60.0, 129.0, 159.0, 199.0, 290.0, 438.0, 621.0, 1060.0, 1828.0, 3520.0, 8827.0, 31936.0, 156665.0, 516001.0, 253181.0, 50638.0, 12659.0, 4437.0, 2109.0, 1184.0, 767.0, 477.0, 337.0, 228.0, 152.0, 121.0, 105.0, 59.0, 40.0, 32.0, 19.0, 18.0, 10.0, 9.0, 7.0, 8.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.349609375, -1.3040924072265625, -1.258575439453125, -1.2130584716796875, -1.16754150390625, -1.1220245361328125, -1.076507568359375, -1.0309906005859375, -0.9854736328125, -0.9399566650390625, -0.894439697265625, -0.8489227294921875, -0.80340576171875, -0.7578887939453125, -0.712371826171875, -0.6668548583984375, -0.621337890625, -0.5758209228515625, -0.530303955078125, -0.4847869873046875, -0.43927001953125, -0.3937530517578125, -0.348236083984375, -0.3027191162109375, -0.2572021484375, -0.2116851806640625, -0.166168212890625, -0.1206512451171875, -0.07513427734375, -0.0296173095703125, 0.015899658203125, 0.0614166259765625, 0.10693359375, 0.1524505615234375, 0.197967529296875, 0.2434844970703125, 0.28900146484375, 0.3345184326171875, 0.380035400390625, 0.4255523681640625, 0.4710693359375, 0.5165863037109375, 0.562103271484375, 0.6076202392578125, 0.65313720703125, 0.6986541748046875, 0.744171142578125, 0.7896881103515625, 0.835205078125, 0.8807220458984375, 0.926239013671875, 0.9717559814453125, 1.01727294921875, 1.0627899169921875, 1.108306884765625, 1.1538238525390625, 1.1993408203125, 1.2448577880859375, 1.290374755859375, 1.3358917236328125, 1.38140869140625, 1.4269256591796875, 1.472442626953125, 1.5179595947265625, 1.5634765625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 5.0, 3.0, 21.0, 23.0, 46.0, 77.0, 80.0, 123.0, 121.0, 135.0, 114.0, 85.0, 61.0, 44.0, 24.0, 13.0, 9.0, 6.0, 4.0, 4.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.46435546875, -0.44835662841796875, -0.4323577880859375, -0.41635894775390625, -0.400360107421875, -0.38436126708984375, -0.3683624267578125, -0.35236358642578125, -0.33636474609375, -0.32036590576171875, -0.3043670654296875, -0.28836822509765625, -0.272369384765625, -0.25637054443359375, -0.2403717041015625, -0.22437286376953125, -0.2083740234375, -0.19237518310546875, -0.1763763427734375, -0.16037750244140625, -0.144378662109375, -0.12837982177734375, -0.1123809814453125, -0.09638214111328125, -0.08038330078125, -0.06438446044921875, -0.0483856201171875, -0.03238677978515625, -0.016387939453125, -0.00038909912109375, 0.0156097412109375, 0.03160858154296875, 0.047607421875, 0.06360626220703125, 0.0796051025390625, 0.09560394287109375, 0.111602783203125, 0.12760162353515625, 0.1436004638671875, 0.15959930419921875, 0.17559814453125, 0.19159698486328125, 0.2075958251953125, 0.22359466552734375, 0.239593505859375, 0.25559234619140625, 0.2715911865234375, 0.28759002685546875, 0.3035888671875, 0.31958770751953125, 0.3355865478515625, 0.35158538818359375, 0.367584228515625, 0.38358306884765625, 0.3995819091796875, 0.41558074951171875, 0.43157958984375, 0.44757843017578125, 0.4635772705078125, 0.47957611083984375, 0.495574951171875, 0.5115737915039062, 0.5275726318359375, 0.5435714721679688, 0.5595703125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 7.0, 10.0, 5.0, 13.0, 15.0, 22.0, 42.0, 45.0, 62.0, 100.0, 142.0, 241.0, 386.0, 628.0, 1182.0, 2246.0, 4624.0, 11057.0, 29884.0, 86979.0, 246435.0, 371403.0, 189262.0, 64689.0, 22433.0, 8564.0, 3864.0, 1787.0, 953.0, 560.0, 328.0, 198.0, 104.0, 87.0, 52.0, 51.0, 20.0, 14.0, 14.0, 19.0, 5.0, 9.0, 3.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.81982421875, -0.7952499389648438, -0.7706756591796875, -0.7461013793945312, -0.721527099609375, -0.6969528198242188, -0.6723785400390625, -0.6478042602539062, -0.62322998046875, -0.5986557006835938, -0.5740814208984375, -0.5495071411132812, -0.524932861328125, -0.5003585815429688, -0.4757843017578125, -0.45121002197265625, -0.4266357421875, -0.40206146240234375, -0.3774871826171875, -0.35291290283203125, -0.328338623046875, -0.30376434326171875, -0.2791900634765625, -0.25461578369140625, -0.23004150390625, -0.20546722412109375, -0.1808929443359375, -0.15631866455078125, -0.131744384765625, -0.10717010498046875, -0.0825958251953125, -0.05802154541015625, -0.033447265625, -0.00887298583984375, 0.0157012939453125, 0.04027557373046875, 0.064849853515625, 0.08942413330078125, 0.1139984130859375, 0.13857269287109375, 0.16314697265625, 0.18772125244140625, 0.2122955322265625, 0.23686981201171875, 0.261444091796875, 0.28601837158203125, 0.3105926513671875, 0.33516693115234375, 0.3597412109375, 0.38431549072265625, 0.4088897705078125, 0.43346405029296875, 0.458038330078125, 0.48261260986328125, 0.5071868896484375, 0.5317611694335938, 0.55633544921875, 0.5809097290039062, 0.6054840087890625, 0.6300582885742188, 0.654632568359375, 0.6792068481445312, 0.7037811279296875, 0.7283554077148438, 0.7529296875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 7.0, 5.0, 4.0, 5.0, 14.0, 12.0, 18.0, 24.0, 21.0, 21.0, 36.0, 26.0, 37.0, 42.0, 41.0, 30.0, 52.0, 60.0, 36.0, 45.0, 61.0, 36.0, 56.0, 38.0, 27.0, 37.0, 23.0, 26.0, 26.0, 26.0, 28.0, 13.0, 14.0, 15.0, 8.0, 6.0, 6.0, 4.0, 1.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.90185546875, -0.8738174438476562, -0.8457794189453125, -0.8177413940429688, -0.789703369140625, -0.7616653442382812, -0.7336273193359375, -0.7055892944335938, -0.67755126953125, -0.6495132446289062, -0.6214752197265625, -0.5934371948242188, -0.565399169921875, -0.5373611450195312, -0.5093231201171875, -0.48128509521484375, -0.4532470703125, -0.42520904541015625, -0.3971710205078125, -0.36913299560546875, -0.341094970703125, -0.31305694580078125, -0.2850189208984375, -0.25698089599609375, -0.22894287109375, -0.20090484619140625, -0.1728668212890625, -0.14482879638671875, -0.116790771484375, -0.08875274658203125, -0.0607147216796875, -0.03267669677734375, -0.004638671875, 0.02339935302734375, 0.0514373779296875, 0.07947540283203125, 0.107513427734375, 0.13555145263671875, 0.1635894775390625, 0.19162750244140625, 0.21966552734375, 0.24770355224609375, 0.2757415771484375, 0.30377960205078125, 0.331817626953125, 0.35985565185546875, 0.3878936767578125, 0.41593170166015625, 0.4439697265625, 0.47200775146484375, 0.5000457763671875, 0.5280838012695312, 0.556121826171875, 0.5841598510742188, 0.6121978759765625, 0.6402359008789062, 0.66827392578125, 0.6963119506835938, 0.7243499755859375, 0.7523880004882812, 0.780426025390625, 0.8084640502929688, 0.8365020751953125, 0.8645401000976562, 0.892578125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 6.0, 11.0, 16.0, 33.0, 37.0, 57.0, 83.0, 147.0, 218.0, 347.0, 795.0, 1837.0, 4748.0, 17159.0, 83231.0, 419187.0, 413852.0, 81780.0, 16837.0, 4727.0, 1665.0, 737.0, 398.0, 250.0, 136.0, 84.0, 52.0, 37.0, 24.0, 18.0, 11.0, 11.0, 9.0, 3.0, 2.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.50634765625, -0.48888397216796875, -0.4714202880859375, -0.45395660400390625, -0.436492919921875, -0.41902923583984375, -0.4015655517578125, -0.38410186767578125, -0.36663818359375, -0.34917449951171875, -0.3317108154296875, -0.31424713134765625, -0.296783447265625, -0.27931976318359375, -0.2618560791015625, -0.24439239501953125, -0.2269287109375, -0.20946502685546875, -0.1920013427734375, -0.17453765869140625, -0.157073974609375, -0.13961029052734375, -0.1221466064453125, -0.10468292236328125, -0.08721923828125, -0.06975555419921875, -0.0522918701171875, -0.03482818603515625, -0.017364501953125, 9.918212890625e-05, 0.0175628662109375, 0.03502655029296875, 0.052490234375, 0.06995391845703125, 0.0874176025390625, 0.10488128662109375, 0.122344970703125, 0.13980865478515625, 0.1572723388671875, 0.17473602294921875, 0.19219970703125, 0.20966339111328125, 0.2271270751953125, 0.24459075927734375, 0.262054443359375, 0.27951812744140625, 0.2969818115234375, 0.31444549560546875, 0.3319091796875, 0.34937286376953125, 0.3668365478515625, 0.38430023193359375, 0.401763916015625, 0.41922760009765625, 0.4366912841796875, 0.45415496826171875, 0.47161865234375, 0.48908233642578125, 0.5065460205078125, 0.5240097045898438, 0.541473388671875, 0.5589370727539062, 0.5764007568359375, 0.5938644409179688, 0.611328125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 2.0, 7.0, 6.0, 2.0, 2.0, 15.0, 17.0, 26.0, 20.0, 32.0, 27.0, 44.0, 41.0, 55.0, 71.0, 80.0, 76.0, 68.0, 76.0, 83.0, 57.0, 47.0, 34.0, 27.0, 20.0, 18.0, 11.0, 12.0, 9.0, 5.0, 7.0, 3.0, 3.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-9.530782699584961e-05, -9.285192936658859e-05, -9.039603173732758e-05, -8.794013410806656e-05, -8.548423647880554e-05, -8.302833884954453e-05, -8.057244122028351e-05, -7.811654359102249e-05, -7.566064596176147e-05, -7.320474833250046e-05, -7.074885070323944e-05, -6.829295307397842e-05, -6.583705544471741e-05, -6.338115781545639e-05, -6.0925260186195374e-05, -5.846936255693436e-05, -5.601346492767334e-05, -5.355756729841232e-05, -5.1101669669151306e-05, -4.864577203989029e-05, -4.618987441062927e-05, -4.3733976781368256e-05, -4.127807915210724e-05, -3.882218152284622e-05, -3.6366283893585205e-05, -3.391038626432419e-05, -3.145448863506317e-05, -2.8998591005802155e-05, -2.6542693376541138e-05, -2.408679574728012e-05, -2.1630898118019104e-05, -1.9175000488758087e-05, -1.671910285949707e-05, -1.4263205230236053e-05, -1.1807307600975037e-05, -9.35140997171402e-06, -6.895512342453003e-06, -4.439614713191986e-06, -1.9837170839309692e-06, 4.721805453300476e-07, 2.9280781745910645e-06, 5.383975803852081e-06, 7.839873433113098e-06, 1.0295771062374115e-05, 1.2751668691635132e-05, 1.5207566320896149e-05, 1.7663463950157166e-05, 2.0119361579418182e-05, 2.25752592086792e-05, 2.5031156837940216e-05, 2.7487054467201233e-05, 2.994295209646225e-05, 3.2398849725723267e-05, 3.4854747354984283e-05, 3.73106449842453e-05, 3.976654261350632e-05, 4.2222440242767334e-05, 4.467833787202835e-05, 4.713423550128937e-05, 4.9590133130550385e-05, 5.20460307598114e-05, 5.450192838907242e-05, 5.6957826018333435e-05, 5.941372364759445e-05, 6.186962127685547e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 7.0, 13.0, 10.0, 19.0, 27.0, 39.0, 70.0, 88.0, 153.0, 247.0, 601.0, 1370.0, 3886.0, 14157.0, 82080.0, 482245.0, 388911.0, 57976.0, 10925.0, 3269.0, 1206.0, 546.0, 266.0, 149.0, 107.0, 50.0, 55.0, 26.0, 21.0, 19.0, 5.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 4.0], "bins": [-0.76123046875, -0.7430686950683594, -0.7249069213867188, -0.7067451477050781, -0.6885833740234375, -0.6704216003417969, -0.6522598266601562, -0.6340980529785156, -0.615936279296875, -0.5977745056152344, -0.5796127319335938, -0.5614509582519531, -0.5432891845703125, -0.5251274108886719, -0.5069656372070312, -0.4888038635253906, -0.47064208984375, -0.4524803161621094, -0.43431854248046875, -0.4161567687988281, -0.3979949951171875, -0.3798332214355469, -0.36167144775390625, -0.3435096740722656, -0.325347900390625, -0.3071861267089844, -0.28902435302734375, -0.2708625793457031, -0.2527008056640625, -0.23453903198242188, -0.21637725830078125, -0.19821548461914062, -0.1800537109375, -0.16189193725585938, -0.14373016357421875, -0.12556838989257812, -0.1074066162109375, -0.08924484252929688, -0.07108306884765625, -0.052921295166015625, -0.034759521484375, -0.016597747802734375, 0.00156402587890625, 0.019725799560546875, 0.0378875732421875, 0.056049346923828125, 0.07421112060546875, 0.09237289428710938, 0.11053466796875, 0.12869644165039062, 0.14685821533203125, 0.16501998901367188, 0.1831817626953125, 0.20134353637695312, 0.21950531005859375, 0.23766708374023438, 0.255828857421875, 0.2739906311035156, 0.29215240478515625, 0.3103141784667969, 0.3284759521484375, 0.3466377258300781, 0.36479949951171875, 0.3829612731933594, 0.401123046875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 10.0, 14.0, 12.0, 21.0, 32.0, 48.0, 64.0, 99.0, 102.0, 120.0, 137.0, 85.0, 68.0, 53.0, 48.0, 31.0, 26.0, 13.0, 6.0, 4.0, 5.0, 4.0, 6.0], "bins": [-0.7978515625, -0.7821407318115234, -0.7664299011230469, -0.7507190704345703, -0.7350082397460938, -0.7192974090576172, -0.7035865783691406, -0.6878757476806641, -0.6721649169921875, -0.6564540863037109, -0.6407432556152344, -0.6250324249267578, -0.6093215942382812, -0.5936107635498047, -0.5778999328613281, -0.5621891021728516, -0.546478271484375, -0.5307674407958984, -0.5150566101074219, -0.4993457794189453, -0.48363494873046875, -0.4679241180419922, -0.4522132873535156, -0.43650245666503906, -0.4207916259765625, -0.40508079528808594, -0.3893699645996094, -0.3736591339111328, -0.35794830322265625, -0.3422374725341797, -0.3265266418457031, -0.31081581115722656, -0.29510498046875, -0.27939414978027344, -0.2636833190917969, -0.2479724884033203, -0.23226165771484375, -0.2165508270263672, -0.20083999633789062, -0.18512916564941406, -0.1694183349609375, -0.15370750427246094, -0.13799667358398438, -0.12228584289550781, -0.10657501220703125, -0.09086418151855469, -0.07515335083007812, -0.05944252014160156, -0.043731689453125, -0.028020858764648438, -0.012310028076171875, 0.0034008026123046875, 0.01911163330078125, 0.03482246398925781, 0.050533294677734375, 0.06624412536621094, 0.0819549560546875, 0.09766578674316406, 0.11337661743164062, 0.1290874481201172, 0.14479827880859375, 0.1605091094970703, 0.17621994018554688, 0.19193077087402344, 0.2076416015625]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 7.0, 11.0, 34.0, 40.0, 46.0, 80.0, 126.0, 126.0, 146.0, 118.0, 92.0, 67.0, 31.0, 27.0, 18.0, 13.0, 2.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-7.7641825675964355, -7.555502414703369, -7.346822261810303, -7.138142108917236, -6.92946195602417, -6.7207818031311035, -6.512101173400879, -6.3034210205078125, -6.094740867614746, -5.88606071472168, -5.677380561828613, -5.468700408935547, -5.2600202560424805, -5.051340103149414, -4.842659950256348, -4.633979797363281, -4.425299644470215, -4.216619491577148, -4.007939338684082, -3.7992591857910156, -3.590579032897949, -3.381898880004883, -3.1732184886932373, -2.964538335800171, -2.7558581829071045, -2.547178030014038, -2.3384978771209717, -2.129817485809326, -1.9211374521255493, -1.712457299232483, -1.503777027130127, -1.2950968742370605, -1.0864171981811523, -0.8777370452880859, -0.6690568327903748, -0.4603766202926636, -0.25169646739959717, -0.04301631450653076, 0.1656639575958252, 0.3743441104888916, 0.583024263381958, 0.7917044162750244, 1.0003845691680908, 1.2090648412704468, 1.4177449941635132, 1.6264251470565796, 1.8351054191589355, 2.043785572052002, 2.2524657249450684, 2.4611458778381348, 2.669826030731201, 2.8785061836242676, 3.087186336517334, 3.2958664894104004, 3.504546880722046, 3.7132270336151123, 3.9219071865081787, 4.130587577819824, 4.339267730712891, 4.547947883605957, 4.756628036499023, 4.96530818939209, 5.173988342285156, 5.382668495178223, 5.591348648071289]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 2.0, 0.0, 3.0, 8.0, 10.0, 12.0, 7.0, 9.0, 13.0, 19.0, 23.0, 24.0, 29.0, 27.0, 31.0, 35.0, 25.0, 47.0, 51.0, 49.0, 40.0, 48.0, 42.0, 46.0, 32.0, 59.0, 42.0, 45.0, 21.0, 32.0, 31.0, 19.0, 23.0, 23.0, 11.0, 13.0, 10.0, 9.0, 9.0, 11.0, 7.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.498128414154053, -4.342016696929932, -4.185905456542969, -4.029793739318848, -3.8736822605133057, -3.7175707817077637, -3.5614593029022217, -3.4053478240966797, -3.2492361068725586, -3.0931246280670166, -2.9370131492614746, -2.7809014320373535, -2.6247899532318115, -2.4686784744262695, -2.3125669956207275, -2.1564555168151855, -2.0003440380096436, -1.8442325592041016, -1.68812096118927, -1.532009482383728, -1.3758978843688965, -1.2197864055633545, -1.0636749267578125, -0.907563328742981, -0.751451849937439, -0.5953403115272522, -0.4392288029193878, -0.28311729431152344, -0.12700575590133667, 0.029105782508850098, 0.1852172613143921, 0.34132885932922363, 0.4974403381347656, 0.6535518765449524, 0.8096634149551392, 0.9657748937606812, 1.1218864917755127, 1.2779979705810547, 1.4341094493865967, 1.5902210474014282, 1.7463325262069702, 1.9024440050125122, 2.0585556030273438, 2.2146670818328857, 2.3707785606384277, 2.526890277862549, 2.6830015182495117, 2.839113235473633, 2.995224714279175, 3.151336193084717, 3.307447671890259, 3.463559150695801, 3.619670867919922, 3.775782346725464, 3.931893825531006, 4.088005542755127, 4.24411678314209, 4.400228500366211, 4.556339740753174, 4.712451457977295, 4.868562698364258, 5.024674415588379, 5.1807861328125, 5.336897373199463, 5.493009090423584]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 5.0, 4.0, 3.0, 8.0, 6.0, 18.0, 20.0, 41.0, 58.0, 95.0, 140.0, 250.0, 429.0, 894.0, 2024.0, 6688.0, 33658.0, 474468.0, 3577227.0, 79649.0, 12038.0, 3502.0, 1345.0, 680.0, 381.0, 207.0, 142.0, 98.0, 73.0, 47.0, 30.0, 15.0, 15.0, 8.0, 8.0, 4.0, 3.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.490234375, -1.435455322265625, -1.38067626953125, -1.325897216796875, -1.2711181640625, -1.216339111328125, -1.16156005859375, -1.106781005859375, -1.052001953125, -0.997222900390625, -0.94244384765625, -0.887664794921875, -0.8328857421875, -0.778106689453125, -0.72332763671875, -0.668548583984375, -0.61376953125, -0.558990478515625, -0.50421142578125, -0.449432373046875, -0.3946533203125, -0.339874267578125, -0.28509521484375, -0.230316162109375, -0.175537109375, -0.120758056640625, -0.06597900390625, -0.011199951171875, 0.0435791015625, 0.098358154296875, 0.15313720703125, 0.207916259765625, 0.2626953125, 0.317474365234375, 0.37225341796875, 0.427032470703125, 0.4818115234375, 0.536590576171875, 0.59136962890625, 0.646148681640625, 0.700927734375, 0.755706787109375, 0.81048583984375, 0.865264892578125, 0.9200439453125, 0.974822998046875, 1.02960205078125, 1.084381103515625, 1.13916015625, 1.193939208984375, 1.24871826171875, 1.303497314453125, 1.3582763671875, 1.413055419921875, 1.46783447265625, 1.522613525390625, 1.577392578125, 1.632171630859375, 1.68695068359375, 1.741729736328125, 1.7965087890625, 1.851287841796875, 1.90606689453125, 1.960845947265625, 2.015625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 4.0, 6.0, 15.0, 22.0, 45.0, 50.0, 79.0, 100.0, 93.0, 115.0, 126.0, 93.0, 74.0, 77.0, 38.0, 31.0, 15.0, 10.0, 5.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.46337890625, -0.44725799560546875, -0.4311370849609375, -0.41501617431640625, -0.398895263671875, -0.38277435302734375, -0.3666534423828125, -0.35053253173828125, -0.33441162109375, -0.31829071044921875, -0.3021697998046875, -0.28604888916015625, -0.269927978515625, -0.25380706787109375, -0.2376861572265625, -0.22156524658203125, -0.2054443359375, -0.18932342529296875, -0.1732025146484375, -0.15708160400390625, -0.140960693359375, -0.12483978271484375, -0.1087188720703125, -0.09259796142578125, -0.07647705078125, -0.06035614013671875, -0.0442352294921875, -0.02811431884765625, -0.011993408203125, 0.00412750244140625, 0.0202484130859375, 0.03636932373046875, 0.052490234375, 0.06861114501953125, 0.0847320556640625, 0.10085296630859375, 0.116973876953125, 0.13309478759765625, 0.1492156982421875, 0.16533660888671875, 0.18145751953125, 0.19757843017578125, 0.2136993408203125, 0.22982025146484375, 0.245941162109375, 0.26206207275390625, 0.2781829833984375, 0.29430389404296875, 0.3104248046875, 0.32654571533203125, 0.3426666259765625, 0.35878753662109375, 0.374908447265625, 0.39102935791015625, 0.4071502685546875, 0.42327117919921875, 0.43939208984375, 0.45551300048828125, 0.4716339111328125, 0.48775482177734375, 0.503875732421875, 0.5199966430664062, 0.5361175537109375, 0.5522384643554688, 0.568359375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 3.0, 5.0, 4.0, 6.0, 16.0, 21.0, 48.0, 115.0, 295.0, 800.0, 2695.0, 14193.0, 161982.0, 3784692.0, 208571.0, 16433.0, 3033.0, 819.0, 297.0, 137.0, 62.0, 18.0, 13.0, 11.0, 3.0, 3.0, 4.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.435546875, -1.37933349609375, -1.3231201171875, -1.26690673828125, -1.210693359375, -1.15447998046875, -1.0982666015625, -1.04205322265625, -0.98583984375, -0.92962646484375, -0.8734130859375, -0.81719970703125, -0.760986328125, -0.70477294921875, -0.6485595703125, -0.59234619140625, -0.5361328125, -0.47991943359375, -0.4237060546875, -0.36749267578125, -0.311279296875, -0.25506591796875, -0.1988525390625, -0.14263916015625, -0.08642578125, -0.03021240234375, 0.0260009765625, 0.08221435546875, 0.138427734375, 0.19464111328125, 0.2508544921875, 0.30706787109375, 0.36328125, 0.41949462890625, 0.4757080078125, 0.53192138671875, 0.588134765625, 0.64434814453125, 0.7005615234375, 0.75677490234375, 0.81298828125, 0.86920166015625, 0.9254150390625, 0.98162841796875, 1.037841796875, 1.09405517578125, 1.1502685546875, 1.20648193359375, 1.2626953125, 1.31890869140625, 1.3751220703125, 1.43133544921875, 1.487548828125, 1.54376220703125, 1.5999755859375, 1.65618896484375, 1.71240234375, 1.76861572265625, 1.8248291015625, 1.88104248046875, 1.937255859375, 1.99346923828125, 2.0496826171875, 2.10589599609375, 2.162109375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 1.0, 4.0, 7.0, 12.0, 11.0, 10.0, 19.0, 29.0, 45.0, 96.0, 128.0, 248.0, 551.0, 1640.0, 604.0, 260.0, 142.0, 97.0, 52.0, 39.0, 22.0, 19.0, 15.0, 7.0, 9.0, 1.0, 5.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.409423828125, -0.3960151672363281, -0.38260650634765625, -0.3691978454589844, -0.3557891845703125, -0.3423805236816406, -0.32897186279296875, -0.3155632019042969, -0.302154541015625, -0.2887458801269531, -0.27533721923828125, -0.2619285583496094, -0.2485198974609375, -0.23511123657226562, -0.22170257568359375, -0.20829391479492188, -0.19488525390625, -0.18147659301757812, -0.16806793212890625, -0.15465927124023438, -0.1412506103515625, -0.12784194946289062, -0.11443328857421875, -0.10102462768554688, -0.087615966796875, -0.07420730590820312, -0.06079864501953125, -0.047389984130859375, -0.0339813232421875, -0.020572662353515625, -0.00716400146484375, 0.006244659423828125, 0.0196533203125, 0.033061981201171875, 0.04647064208984375, 0.059879302978515625, 0.0732879638671875, 0.08669662475585938, 0.10010528564453125, 0.11351394653320312, 0.126922607421875, 0.14033126831054688, 0.15373992919921875, 0.16714859008789062, 0.1805572509765625, 0.19396591186523438, 0.20737457275390625, 0.22078323364257812, 0.23419189453125, 0.24760055541992188, 0.26100921630859375, 0.2744178771972656, 0.2878265380859375, 0.3012351989746094, 0.31464385986328125, 0.3280525207519531, 0.341461181640625, 0.3548698425292969, 0.36827850341796875, 0.3816871643066406, 0.3950958251953125, 0.4085044860839844, 0.42191314697265625, 0.4353218078613281, 0.44873046875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 3.0, 11.0, 24.0, 97.0, 167.0, 257.0, 230.0, 121.0, 60.0, 25.0, 3.0, 4.0, 0.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.573794364929199, -6.42956018447876, -6.2853264808654785, -6.141092300415039, -5.9968581199646, -5.85262393951416, -5.708390235900879, -5.5641560554504395, -5.419921875, -5.2756876945495605, -5.131453990936279, -4.98721981048584, -4.8429856300354, -4.698751449584961, -4.55451774597168, -4.41028356552124, -4.266049385070801, -4.121815204620361, -3.977581262588501, -3.8333473205566406, -3.689113140106201, -3.544879198074341, -3.4006452560424805, -3.256411075592041, -3.1121773719787598, -2.9679434299468994, -2.82370924949646, -2.6794753074645996, -2.53524112701416, -2.3910071849823, -2.2467732429504395, -2.1025390625, -1.9583046436309814, -1.8140705823898315, -1.6698365211486816, -1.5256025791168213, -1.3813683986663818, -1.2371344566345215, -1.0929003953933716, -0.9486663341522217, -0.8044322729110718, -0.6601982116699219, -0.515964150428772, -0.37173014879226685, -0.22749608755111694, -0.08326202630996704, 0.060971975326538086, 0.205206036567688, 0.3494400978088379, 0.4936741590499878, 0.6379082202911377, 0.7821422219276428, 0.9263762831687927, 1.0706102848052979, 1.2148443460464478, 1.3590784072875977, 1.5033124685287476, 1.6475465297698975, 1.7917805910110474, 1.9360146522521973, 2.0802485942840576, 2.224482774734497, 2.3687167167663574, 2.512950897216797, 2.6571848392486572]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 6.0, 7.0, 18.0, 16.0, 22.0, 24.0, 41.0, 35.0, 47.0, 47.0, 68.0, 59.0, 81.0, 56.0, 73.0, 68.0, 64.0, 63.0, 51.0, 44.0, 35.0, 21.0, 20.0, 18.0, 8.0, 1.0, 6.0, 0.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6214098930358887, -1.563547134399414, -1.505684494972229, -1.447821855545044, -1.3899590969085693, -1.3320963382720947, -1.2742336988449097, -1.2163710594177246, -1.15850830078125, -1.1006455421447754, -1.0427829027175903, -0.9849202036857605, -0.9270575046539307, -0.8691948056221008, -0.811332106590271, -0.7534694075584412, -0.6956067085266113, -0.6377440094947815, -0.5798813104629517, -0.5220186114311218, -0.464155912399292, -0.40629321336746216, -0.3484305143356323, -0.2905678153038025, -0.23270511627197266, -0.17484241724014282, -0.11697971820831299, -0.059117019176483154, -0.0012543201446533203, 0.056608378887176514, 0.11447107791900635, 0.17233377695083618, 0.23019647598266602, 0.28805917501449585, 0.3459218740463257, 0.4037845730781555, 0.46164727210998535, 0.5195099711418152, 0.577372670173645, 0.6352353692054749, 0.6930980682373047, 0.7509607672691345, 0.8088234663009644, 0.8666861653327942, 0.924548864364624, 0.9824115633964539, 1.0402742624282837, 1.0981369018554688, 1.1559996604919434, 1.213862419128418, 1.271725058555603, 1.329587697982788, 1.3874504566192627, 1.4453132152557373, 1.5031758546829224, 1.5610384941101074, 1.618901252746582, 1.6767640113830566, 1.7346266508102417, 1.7924892902374268, 1.8503520488739014, 1.908214807510376, 1.966077446937561, 2.023940086364746, 2.0818028450012207]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 2.0, 9.0, 12.0, 11.0, 24.0, 19.0, 33.0, 14.0, 48.0, 41.0, 74.0, 129.0, 146.0, 165.0, 256.0, 353.0, 485.0, 738.0, 1142.0, 2071.0, 4202.0, 10851.0, 35233.0, 135600.0, 417104.0, 313490.0, 86785.0, 23613.0, 7687.0, 3304.0, 1622.0, 1009.0, 634.0, 434.0, 369.0, 215.0, 152.0, 125.0, 97.0, 59.0, 48.0, 43.0, 32.0, 21.0, 12.0, 14.0, 7.0, 5.0, 11.0, 3.0, 3.0, 2.0, 2.0, 0.0, 3.0], "bins": [-1.2958984375, -1.257598876953125, -1.21929931640625, -1.180999755859375, -1.1427001953125, -1.104400634765625, -1.06610107421875, -1.027801513671875, -0.989501953125, -0.951202392578125, -0.91290283203125, -0.874603271484375, -0.8363037109375, -0.798004150390625, -0.75970458984375, -0.721405029296875, -0.68310546875, -0.644805908203125, -0.60650634765625, -0.568206787109375, -0.5299072265625, -0.491607666015625, -0.45330810546875, -0.415008544921875, -0.376708984375, -0.338409423828125, -0.30010986328125, -0.261810302734375, -0.2235107421875, -0.185211181640625, -0.14691162109375, -0.108612060546875, -0.0703125, -0.032012939453125, 0.00628662109375, 0.044586181640625, 0.0828857421875, 0.121185302734375, 0.15948486328125, 0.197784423828125, 0.236083984375, 0.274383544921875, 0.31268310546875, 0.350982666015625, 0.3892822265625, 0.427581787109375, 0.46588134765625, 0.504180908203125, 0.54248046875, 0.580780029296875, 0.61907958984375, 0.657379150390625, 0.6956787109375, 0.733978271484375, 0.77227783203125, 0.810577392578125, 0.848876953125, 0.887176513671875, 0.92547607421875, 0.963775634765625, 1.0020751953125, 1.040374755859375, 1.07867431640625, 1.116973876953125, 1.1552734375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 13.0, 14.0, 31.0, 37.0, 59.0, 86.0, 109.0, 106.0, 133.0, 110.0, 82.0, 83.0, 59.0, 26.0, 19.0, 12.0, 9.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47998046875, -0.4636077880859375, -0.447235107421875, -0.4308624267578125, -0.41448974609375, -0.3981170654296875, -0.381744384765625, -0.3653717041015625, -0.3489990234375, -0.3326263427734375, -0.316253662109375, -0.2998809814453125, -0.28350830078125, -0.2671356201171875, -0.250762939453125, -0.2343902587890625, -0.218017578125, -0.2016448974609375, -0.185272216796875, -0.1688995361328125, -0.15252685546875, -0.1361541748046875, -0.119781494140625, -0.1034088134765625, -0.0870361328125, -0.0706634521484375, -0.054290771484375, -0.0379180908203125, -0.02154541015625, -0.0051727294921875, 0.011199951171875, 0.0275726318359375, 0.0439453125, 0.0603179931640625, 0.076690673828125, 0.0930633544921875, 0.10943603515625, 0.1258087158203125, 0.142181396484375, 0.1585540771484375, 0.1749267578125, 0.1912994384765625, 0.207672119140625, 0.2240447998046875, 0.24041748046875, 0.2567901611328125, 0.273162841796875, 0.2895355224609375, 0.305908203125, 0.3222808837890625, 0.338653564453125, 0.3550262451171875, 0.37139892578125, 0.3877716064453125, 0.404144287109375, 0.4205169677734375, 0.4368896484375, 0.4532623291015625, 0.469635009765625, 0.4860076904296875, 0.50238037109375, 0.5187530517578125, 0.535125732421875, 0.5514984130859375, 0.56787109375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 7.0, 2.0, 5.0, 10.0, 9.0, 22.0, 27.0, 24.0, 58.0, 82.0, 123.0, 188.0, 288.0, 547.0, 1153.0, 2392.0, 6404.0, 18212.0, 56155.0, 178567.0, 398459.0, 258548.0, 85150.0, 26675.0, 8896.0, 3422.0, 1475.0, 691.0, 371.0, 228.0, 110.0, 83.0, 51.0, 37.0, 30.0, 17.0, 6.0, 9.0, 4.0, 7.0, 4.0, 1.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75732421875, -0.7318038940429688, -0.7062835693359375, -0.6807632446289062, -0.655242919921875, -0.6297225952148438, -0.6042022705078125, -0.5786819458007812, -0.55316162109375, -0.5276412963867188, -0.5021209716796875, -0.47660064697265625, -0.451080322265625, -0.42555999755859375, -0.4000396728515625, -0.37451934814453125, -0.3489990234375, -0.32347869873046875, -0.2979583740234375, -0.27243804931640625, -0.246917724609375, -0.22139739990234375, -0.1958770751953125, -0.17035675048828125, -0.14483642578125, -0.11931610107421875, -0.0937957763671875, -0.06827545166015625, -0.042755126953125, -0.01723480224609375, 0.0082855224609375, 0.03380584716796875, 0.059326171875, 0.08484649658203125, 0.1103668212890625, 0.13588714599609375, 0.161407470703125, 0.18692779541015625, 0.2124481201171875, 0.23796844482421875, 0.26348876953125, 0.28900909423828125, 0.3145294189453125, 0.34004974365234375, 0.365570068359375, 0.39109039306640625, 0.4166107177734375, 0.44213104248046875, 0.4676513671875, 0.49317169189453125, 0.5186920166015625, 0.5442123413085938, 0.569732666015625, 0.5952529907226562, 0.6207733154296875, 0.6462936401367188, 0.67181396484375, 0.6973342895507812, 0.7228546142578125, 0.7483749389648438, 0.773895263671875, 0.7994155883789062, 0.8249359130859375, 0.8504562377929688, 0.8759765625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 6.0, 11.0, 4.0, 4.0, 9.0, 13.0, 12.0, 12.0, 20.0, 22.0, 18.0, 26.0, 30.0, 31.0, 35.0, 37.0, 40.0, 34.0, 42.0, 42.0, 48.0, 47.0, 50.0, 43.0, 36.0, 38.0, 27.0, 30.0, 34.0, 37.0, 26.0, 22.0, 21.0, 16.0, 16.0, 12.0, 11.0, 7.0, 9.0, 9.0, 5.0, 3.0, 5.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.88525390625, -0.8585433959960938, -0.8318328857421875, -0.8051223754882812, -0.778411865234375, -0.7517013549804688, -0.7249908447265625, -0.6982803344726562, -0.67156982421875, -0.6448593139648438, -0.6181488037109375, -0.5914382934570312, -0.564727783203125, -0.5380172729492188, -0.5113067626953125, -0.48459625244140625, -0.4578857421875, -0.43117523193359375, -0.4044647216796875, -0.37775421142578125, -0.351043701171875, -0.32433319091796875, -0.2976226806640625, -0.27091217041015625, -0.24420166015625, -0.21749114990234375, -0.1907806396484375, -0.16407012939453125, -0.137359619140625, -0.11064910888671875, -0.0839385986328125, -0.05722808837890625, -0.030517578125, -0.00380706787109375, 0.0229034423828125, 0.04961395263671875, 0.076324462890625, 0.10303497314453125, 0.1297454833984375, 0.15645599365234375, 0.18316650390625, 0.20987701416015625, 0.2365875244140625, 0.26329803466796875, 0.290008544921875, 0.31671905517578125, 0.3434295654296875, 0.37014007568359375, 0.3968505859375, 0.42356109619140625, 0.4502716064453125, 0.47698211669921875, 0.503692626953125, 0.5304031372070312, 0.5571136474609375, 0.5838241577148438, 0.61053466796875, 0.6372451782226562, 0.6639556884765625, 0.6906661987304688, 0.717376708984375, 0.7440872192382812, 0.7707977294921875, 0.7975082397460938, 0.82421875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 2.0, 2.0, 5.0, 7.0, 9.0, 12.0, 15.0, 21.0, 26.0, 33.0, 55.0, 94.0, 172.0, 288.0, 654.0, 1362.0, 3616.0, 15237.0, 218425.0, 741377.0, 55455.0, 7340.0, 2376.0, 925.0, 426.0, 230.0, 112.0, 79.0, 46.0, 31.0, 31.0, 26.0, 19.0, 10.0, 4.0, 14.0, 2.0, 2.0, 2.0, 4.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0615234375, -1.0305557250976562, -0.9995880126953125, -0.9686203002929688, -0.937652587890625, -0.9066848754882812, -0.8757171630859375, -0.8447494506835938, -0.81378173828125, -0.7828140258789062, -0.7518463134765625, -0.7208786010742188, -0.689910888671875, -0.6589431762695312, -0.6279754638671875, -0.5970077514648438, -0.5660400390625, -0.5350723266601562, -0.5041046142578125, -0.47313690185546875, -0.442169189453125, -0.41120147705078125, -0.3802337646484375, -0.34926605224609375, -0.31829833984375, -0.28733062744140625, -0.2563629150390625, -0.22539520263671875, -0.194427490234375, -0.16345977783203125, -0.1324920654296875, -0.10152435302734375, -0.070556640625, -0.03958892822265625, -0.0086212158203125, 0.02234649658203125, 0.053314208984375, 0.08428192138671875, 0.1152496337890625, 0.14621734619140625, 0.17718505859375, 0.20815277099609375, 0.2391204833984375, 0.27008819580078125, 0.301055908203125, 0.33202362060546875, 0.3629913330078125, 0.39395904541015625, 0.4249267578125, 0.45589447021484375, 0.4868621826171875, 0.5178298950195312, 0.548797607421875, 0.5797653198242188, 0.6107330322265625, 0.6417007446289062, 0.67266845703125, 0.7036361694335938, 0.7346038818359375, 0.7655715942382812, 0.796539306640625, 0.8275070190429688, 0.8584747314453125, 0.8894424438476562, 0.92041015625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 10.0, 6.0, 10.0, 14.0, 25.0, 50.0, 68.0, 117.0, 191.0, 189.0, 142.0, 63.0, 51.0, 31.0, 14.0, 7.0, 4.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014710426330566406, -0.0001412220299243927, -0.00013533979654312134, -0.00012945756316184998, -0.0001235753297805786, -0.00011769309639930725, -0.00011181086301803589, -0.00010592862963676453, -0.00010004639625549316, -9.41641628742218e-05, -8.828192949295044e-05, -8.239969611167908e-05, -7.651746273040771e-05, -7.063522934913635e-05, -6.475299596786499e-05, -5.887076258659363e-05, -5.2988529205322266e-05, -4.71062958240509e-05, -4.122406244277954e-05, -3.534182906150818e-05, -2.9459595680236816e-05, -2.3577362298965454e-05, -1.7695128917694092e-05, -1.181289553642273e-05, -5.930662155151367e-06, -4.842877388000488e-08, 5.833804607391357e-06, 1.171603798866272e-05, 1.7598271369934082e-05, 2.3480504751205444e-05, 2.9362738132476807e-05, 3.524497151374817e-05, 4.112720489501953e-05, 4.7009438276290894e-05, 5.2891671657562256e-05, 5.877390503883362e-05, 6.465613842010498e-05, 7.053837180137634e-05, 7.64206051826477e-05, 8.230283856391907e-05, 8.818507194519043e-05, 9.406730532646179e-05, 9.994953870773315e-05, 0.00010583177208900452, 0.00011171400547027588, 0.00011759623885154724, 0.0001234784722328186, 0.00012936070561408997, 0.00013524293899536133, 0.0001411251723766327, 0.00014700740575790405, 0.00015288963913917542, 0.00015877187252044678, 0.00016465410590171814, 0.0001705363392829895, 0.00017641857266426086, 0.00018230080604553223, 0.0001881830394268036, 0.00019406527280807495, 0.0001999475061893463, 0.00020582973957061768, 0.00021171197295188904, 0.0002175942063331604, 0.00022347643971443176, 0.00022935867309570312]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 5.0, 6.0, 5.0, 13.0, 18.0, 16.0, 40.0, 38.0, 60.0, 102.0, 170.0, 307.0, 592.0, 1095.0, 2387.0, 5987.0, 18732.0, 82982.0, 378388.0, 423920.0, 99839.0, 21992.0, 6652.0, 2584.0, 1170.0, 614.0, 311.0, 205.0, 108.0, 59.0, 47.0, 32.0, 30.0, 13.0, 13.0, 10.0, 5.0, 4.0, 1.0, 0.0, 4.0, 2.0, 0.0, 3.0, 2.0], "bins": [-0.57373046875, -0.55865478515625, -0.5435791015625, -0.52850341796875, -0.513427734375, -0.49835205078125, -0.4832763671875, -0.46820068359375, -0.453125, -0.43804931640625, -0.4229736328125, -0.40789794921875, -0.392822265625, -0.37774658203125, -0.3626708984375, -0.34759521484375, -0.33251953125, -0.31744384765625, -0.3023681640625, -0.28729248046875, -0.272216796875, -0.25714111328125, -0.2420654296875, -0.22698974609375, -0.2119140625, -0.19683837890625, -0.1817626953125, -0.16668701171875, -0.151611328125, -0.13653564453125, -0.1214599609375, -0.10638427734375, -0.09130859375, -0.07623291015625, -0.0611572265625, -0.04608154296875, -0.031005859375, -0.01593017578125, -0.0008544921875, 0.01422119140625, 0.029296875, 0.04437255859375, 0.0594482421875, 0.07452392578125, 0.089599609375, 0.10467529296875, 0.1197509765625, 0.13482666015625, 0.14990234375, 0.16497802734375, 0.1800537109375, 0.19512939453125, 0.210205078125, 0.22528076171875, 0.2403564453125, 0.25543212890625, 0.2705078125, 0.28558349609375, 0.3006591796875, 0.31573486328125, 0.330810546875, 0.34588623046875, 0.3609619140625, 0.37603759765625, 0.39111328125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 4.0, 4.0, 10.0, 5.0, 4.0, 12.0, 14.0, 16.0, 23.0, 19.0, 38.0, 46.0, 58.0, 71.0, 84.0, 93.0, 80.0, 76.0, 74.0, 61.0, 39.0, 50.0, 38.0, 27.0, 14.0, 11.0, 11.0, 9.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.431396484375, -0.41977691650390625, -0.4081573486328125, -0.39653778076171875, -0.384918212890625, -0.37329864501953125, -0.3616790771484375, -0.35005950927734375, -0.33843994140625, -0.32682037353515625, -0.3152008056640625, -0.30358123779296875, -0.291961669921875, -0.28034210205078125, -0.2687225341796875, -0.25710296630859375, -0.2454833984375, -0.23386383056640625, -0.2222442626953125, -0.21062469482421875, -0.199005126953125, -0.18738555908203125, -0.1757659912109375, -0.16414642333984375, -0.15252685546875, -0.14090728759765625, -0.1292877197265625, -0.11766815185546875, -0.106048583984375, -0.09442901611328125, -0.0828094482421875, -0.07118988037109375, -0.0595703125, -0.04795074462890625, -0.0363311767578125, -0.02471160888671875, -0.013092041015625, -0.00147247314453125, 0.0101470947265625, 0.02176666259765625, 0.03338623046875, 0.04500579833984375, 0.0566253662109375, 0.06824493408203125, 0.079864501953125, 0.09148406982421875, 0.1031036376953125, 0.11472320556640625, 0.1263427734375, 0.13796234130859375, 0.1495819091796875, 0.16120147705078125, 0.172821044921875, 0.18444061279296875, 0.1960601806640625, 0.20767974853515625, 0.21929931640625, 0.23091888427734375, 0.2425384521484375, 0.25415802001953125, 0.265777587890625, 0.27739715576171875, 0.2890167236328125, 0.30063629150390625, 0.312255859375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 0.0, 7.0, 5.0, 17.0, 26.0, 57.0, 83.0, 141.0, 180.0, 180.0, 142.0, 91.0, 38.0, 18.0, 11.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.774497032165527, -9.476940155029297, -9.179384231567383, -8.881827354431152, -8.584270477294922, -8.286714553833008, -7.989157676696777, -7.691601276397705, -7.394044876098633, -7.0964884757995605, -6.79893159866333, -6.501375198364258, -6.2038187980651855, -5.906262397766113, -5.608705520629883, -5.3111491203308105, -5.01359224319458, -4.716035842895508, -4.418478965759277, -4.120922565460205, -3.823366165161133, -3.5258095264434814, -3.22825288772583, -2.930696487426758, -2.6331398487091064, -2.335583209991455, -2.038026809692383, -1.7404701709747314, -1.4429136514663696, -1.1453571319580078, -0.8478004932403564, -0.5502440929412842, -0.2526874542236328, 0.04486909508705139, 0.3424256443977356, 0.6399822235107422, 0.937538743019104, 1.2350952625274658, 1.5326519012451172, 1.8302083015441895, 2.127764940261841, 2.425321578979492, 2.7228779792785645, 3.020434617996216, 3.317991256713867, 3.6155476570129395, 3.913104295730591, 4.210660934448242, 4.5082173347473145, 4.805773735046387, 5.103330612182617, 5.4008870124816895, 5.698443412780762, 5.996000289916992, 6.2935566902160645, 6.591113090515137, 6.888669967651367, 7.1862263679504395, 7.48378324508667, 7.781339645385742, 8.078896522521973, 8.376452445983887, 8.674009323120117, 8.971565246582031, 9.269122123718262]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 2.0, 5.0, 9.0, 8.0, 7.0, 6.0, 16.0, 10.0, 23.0, 15.0, 25.0, 27.0, 27.0, 36.0, 36.0, 48.0, 38.0, 38.0, 46.0, 35.0, 44.0, 42.0, 40.0, 44.0, 48.0, 41.0, 31.0, 36.0, 34.0, 34.0, 19.0, 20.0, 18.0, 11.0, 17.0, 16.0, 13.0, 9.0, 6.0, 5.0, 5.0, 5.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.13310432434082, -4.980539321899414, -4.827974796295166, -4.67540979385376, -4.522845268249512, -4.3702802658081055, -4.217715263366699, -4.065150260925293, -3.912585735321045, -3.7600209712982178, -3.6074562072753906, -3.4548912048339844, -3.3023264408111572, -3.14976167678833, -2.997196674346924, -2.8446319103240967, -2.6920671463012695, -2.5395023822784424, -2.3869376182556152, -2.234372615814209, -2.081807851791382, -1.9292430877685547, -1.776678204536438, -1.6241133213043213, -1.4715485572814941, -1.318983793258667, -1.1664189100265503, -1.0138540267944336, -0.8612892627716064, -0.7087244391441345, -0.5561596155166626, -0.4035947322845459, -0.25102996826171875, -0.09846514463424683, 0.0540996789932251, 0.20666450262069702, 0.35922932624816895, 0.5117941498756409, 0.6643589735031128, 0.8169238567352295, 0.9694886207580566, 1.1220533847808838, 1.2746182680130005, 1.4271831512451172, 1.5797479152679443, 1.7323126792907715, 1.8848775625228882, 2.037442445755005, 2.190007209777832, 2.342571973800659, 2.4951367378234863, 2.6477017402648926, 2.8002665042877197, 2.952831268310547, 3.105396270751953, 3.2579610347747803, 3.4105257987976074, 3.5630905628204346, 3.7156553268432617, 3.868220329284668, 4.020785331726074, 4.173349857330322, 4.3259148597717285, 4.478479385375977, 4.631044387817383]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 5.0, 7.0, 13.0, 10.0, 25.0, 33.0, 57.0, 111.0, 195.0, 402.0, 788.0, 2269.0, 9100.0, 92455.0, 3893900.0, 176099.0, 13359.0, 3133.0, 1116.0, 554.0, 264.0, 145.0, 86.0, 49.0, 44.0, 18.0, 12.0, 5.0, 4.0, 3.0, 3.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.33984375, -2.26806640625, -2.1962890625, -2.12451171875, -2.052734375, -1.98095703125, -1.9091796875, -1.83740234375, -1.765625, -1.69384765625, -1.6220703125, -1.55029296875, -1.478515625, -1.40673828125, -1.3349609375, -1.26318359375, -1.19140625, -1.11962890625, -1.0478515625, -0.97607421875, -0.904296875, -0.83251953125, -0.7607421875, -0.68896484375, -0.6171875, -0.54541015625, -0.4736328125, -0.40185546875, -0.330078125, -0.25830078125, -0.1865234375, -0.11474609375, -0.04296875, 0.02880859375, 0.1005859375, 0.17236328125, 0.244140625, 0.31591796875, 0.3876953125, 0.45947265625, 0.53125, 0.60302734375, 0.6748046875, 0.74658203125, 0.818359375, 0.89013671875, 0.9619140625, 1.03369140625, 1.10546875, 1.17724609375, 1.2490234375, 1.32080078125, 1.392578125, 1.46435546875, 1.5361328125, 1.60791015625, 1.6796875, 1.75146484375, 1.8232421875, 1.89501953125, 1.966796875, 2.03857421875, 2.1103515625, 2.18212890625, 2.25390625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 1.0, 13.0, 32.0, 35.0, 51.0, 62.0, 96.0, 116.0, 108.0, 122.0, 95.0, 91.0, 75.0, 39.0, 20.0, 12.0, 10.0, 8.0, 6.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51220703125, -0.49501800537109375, -0.4778289794921875, -0.46063995361328125, -0.443450927734375, -0.42626190185546875, -0.4090728759765625, -0.39188385009765625, -0.37469482421875, -0.35750579833984375, -0.3403167724609375, -0.32312774658203125, -0.305938720703125, -0.28874969482421875, -0.2715606689453125, -0.25437164306640625, -0.2371826171875, -0.21999359130859375, -0.2028045654296875, -0.18561553955078125, -0.168426513671875, -0.15123748779296875, -0.1340484619140625, -0.11685943603515625, -0.09967041015625, -0.08248138427734375, -0.0652923583984375, -0.04810333251953125, -0.030914306640625, -0.01372528076171875, 0.0034637451171875, 0.02065277099609375, 0.037841796875, 0.05503082275390625, 0.0722198486328125, 0.08940887451171875, 0.106597900390625, 0.12378692626953125, 0.1409759521484375, 0.15816497802734375, 0.17535400390625, 0.19254302978515625, 0.2097320556640625, 0.22692108154296875, 0.244110107421875, 0.26129913330078125, 0.2784881591796875, 0.29567718505859375, 0.3128662109375, 0.33005523681640625, 0.3472442626953125, 0.36443328857421875, 0.381622314453125, 0.39881134033203125, 0.4160003662109375, 0.43318939208984375, 0.45037841796875, 0.46756744384765625, 0.4847564697265625, 0.5019454956054688, 0.519134521484375, 0.5363235473632812, 0.5535125732421875, 0.5707015991210938, 0.587890625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 4.0, 16.0, 24.0, 35.0, 61.0, 198.0, 520.0, 1731.0, 7214.0, 47547.0, 1197863.0, 2861966.0, 65215.0, 8830.0, 2010.0, 623.0, 228.0, 98.0, 45.0, 16.0, 14.0, 9.0, 5.0, 1.0, 7.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8251953125, -1.7731475830078125, -1.721099853515625, -1.6690521240234375, -1.61700439453125, -1.5649566650390625, -1.512908935546875, -1.4608612060546875, -1.4088134765625, -1.3567657470703125, -1.304718017578125, -1.2526702880859375, -1.20062255859375, -1.1485748291015625, -1.096527099609375, -1.0444793701171875, -0.992431640625, -0.9403839111328125, -0.888336181640625, -0.8362884521484375, -0.78424072265625, -0.7321929931640625, -0.680145263671875, -0.6280975341796875, -0.5760498046875, -0.5240020751953125, -0.471954345703125, -0.4199066162109375, -0.36785888671875, -0.3158111572265625, -0.263763427734375, -0.2117156982421875, -0.15966796875, -0.1076202392578125, -0.055572509765625, -0.0035247802734375, 0.04852294921875, 0.1005706787109375, 0.152618408203125, 0.2046661376953125, 0.2567138671875, 0.3087615966796875, 0.360809326171875, 0.4128570556640625, 0.46490478515625, 0.5169525146484375, 0.569000244140625, 0.6210479736328125, 0.673095703125, 0.7251434326171875, 0.777191162109375, 0.8292388916015625, 0.88128662109375, 0.9333343505859375, 0.985382080078125, 1.0374298095703125, 1.0894775390625, 1.1415252685546875, 1.193572998046875, 1.2456207275390625, 1.29766845703125, 1.3497161865234375, 1.401763916015625, 1.4538116455078125, 1.505859375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 4.0, 5.0, 7.0, 5.0, 8.0, 13.0, 14.0, 28.0, 43.0, 52.0, 81.0, 119.0, 203.0, 358.0, 902.0, 1124.0, 443.0, 237.0, 135.0, 85.0, 51.0, 39.0, 24.0, 25.0, 18.0, 10.0, 9.0, 6.0, 7.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.437744140625, -0.4240989685058594, -0.41045379638671875, -0.3968086242675781, -0.3831634521484375, -0.3695182800292969, -0.35587310791015625, -0.3422279357910156, -0.328582763671875, -0.3149375915527344, -0.30129241943359375, -0.2876472473144531, -0.2740020751953125, -0.2603569030761719, -0.24671173095703125, -0.23306655883789062, -0.21942138671875, -0.20577621459960938, -0.19213104248046875, -0.17848587036132812, -0.1648406982421875, -0.15119552612304688, -0.13755035400390625, -0.12390518188476562, -0.110260009765625, -0.09661483764648438, -0.08296966552734375, -0.06932449340820312, -0.0556793212890625, -0.042034149169921875, -0.02838897705078125, -0.014743804931640625, -0.0010986328125, 0.012546539306640625, 0.02619171142578125, 0.039836883544921875, 0.0534820556640625, 0.06712722778320312, 0.08077239990234375, 0.09441757202148438, 0.108062744140625, 0.12170791625976562, 0.13535308837890625, 0.14899826049804688, 0.1626434326171875, 0.17628860473632812, 0.18993377685546875, 0.20357894897460938, 0.21722412109375, 0.23086929321289062, 0.24451446533203125, 0.2581596374511719, 0.2718048095703125, 0.2854499816894531, 0.29909515380859375, 0.3127403259277344, 0.326385498046875, 0.3400306701660156, 0.35367584228515625, 0.3673210144042969, 0.3809661865234375, 0.3946113586425781, 0.40825653076171875, 0.4219017028808594, 0.435546875]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 4.0, 4.0, 8.0, 22.0, 61.0, 115.0, 197.0, 265.0, 169.0, 91.0, 32.0, 25.0, 10.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.444695949554443, -6.2917890548706055, -6.138882160186768, -5.9859747886657715, -5.833067893981934, -5.680160999298096, -5.527254104614258, -5.37434720993042, -5.221440315246582, -5.068533420562744, -4.915626525878906, -4.76271915435791, -4.609812259674072, -4.456905364990234, -4.3039984703063965, -4.151091575622559, -3.9981842041015625, -3.8452773094177246, -3.6923701763153076, -3.5394632816314697, -3.3865561485290527, -3.233649253845215, -3.080742359161377, -2.927835464477539, -2.774928331375122, -2.622021436691284, -2.469114303588867, -2.3162074089050293, -2.1633005142211914, -2.0103933811187744, -1.8574864864349365, -1.704579472541809, -1.5516724586486816, -1.3987654447555542, -1.2458584308624268, -1.0929515361785889, -0.9400445222854614, -0.787137508392334, -0.6342305541038513, -0.48132359981536865, -0.3284165859222412, -0.17550960183143616, -0.022602617740631104, 0.13030436635017395, 0.283211350440979, 0.43611836433410645, 0.5890253186225891, 0.7419322729110718, 0.8948392868041992, 1.0477463006973267, 1.200653314590454, 1.353560209274292, 1.5064672231674194, 1.6593742370605469, 1.8122811317443848, 1.9651881456375122, 2.1180951595306396, 2.2710020542144775, 2.4239091873168945, 2.5768160820007324, 2.7297229766845703, 2.8826301097869873, 3.035537004470825, 3.188444137573242, 3.34135103225708]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 6.0, 7.0, 14.0, 11.0, 18.0, 11.0, 25.0, 29.0, 40.0, 40.0, 44.0, 53.0, 50.0, 62.0, 53.0, 41.0, 62.0, 60.0, 55.0, 46.0, 46.0, 38.0, 33.0, 25.0, 34.0, 21.0, 20.0, 14.0, 11.0, 6.0, 12.0, 4.0, 7.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.924283504486084, -1.8664038181304932, -1.8085241317749023, -1.7506444454193115, -1.6927646398544312, -1.6348849534988403, -1.5770052671432495, -1.5191255807876587, -1.4612458944320679, -1.403366208076477, -1.3454865217208862, -1.2876067161560059, -1.229727029800415, -1.1718473434448242, -1.1139676570892334, -1.0560879707336426, -0.998208224773407, -0.9403285384178162, -0.8824487924575806, -0.8245691061019897, -0.7666894197463989, -0.7088097333908081, -0.6509299874305725, -0.5930503010749817, -0.5351705551147461, -0.4772908389568329, -0.41941115260124207, -0.36153143644332886, -0.30365175008773804, -0.24577203392982483, -0.18789231777191162, -0.1300126314163208, -0.07213294506072998, -0.014253240078687668, 0.043626464903354645, 0.10150617361068726, 0.15938587486743927, 0.21726557612419128, 0.2751452922821045, 0.3330249786376953, 0.3909046947956085, 0.44878441095352173, 0.5066640973091125, 0.5645438432693481, 0.622423529624939, 0.6803032159805298, 0.7381829023361206, 0.7960625886917114, 0.853942334651947, 0.9118220210075378, 0.9697017669677734, 1.0275814533233643, 1.085461139678955, 1.143340826034546, 1.2012205123901367, 1.2591001987457275, 1.316980004310608, 1.3748596906661987, 1.4327393770217896, 1.49061918258667, 1.5484988689422607, 1.6063785552978516, 1.6642582416534424, 1.7221379280090332, 1.780017614364624]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 6.0, 4.0, 5.0, 7.0, 5.0, 12.0, 16.0, 24.0, 44.0, 44.0, 66.0, 105.0, 194.0, 335.0, 528.0, 1010.0, 2176.0, 5646.0, 25224.0, 213144.0, 683062.0, 95718.0, 13800.0, 3848.0, 1573.0, 798.0, 427.0, 277.0, 155.0, 97.0, 74.0, 45.0, 24.0, 15.0, 12.0, 11.0, 5.0, 2.0, 8.0, 5.0, 3.0, 3.0, 2.0, 6.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8564453125, -1.7909088134765625, -1.725372314453125, -1.6598358154296875, -1.59429931640625, -1.5287628173828125, -1.463226318359375, -1.3976898193359375, -1.3321533203125, -1.2666168212890625, -1.201080322265625, -1.1355438232421875, -1.07000732421875, -1.0044708251953125, -0.938934326171875, -0.8733978271484375, -0.807861328125, -0.7423248291015625, -0.676788330078125, -0.6112518310546875, -0.54571533203125, -0.4801788330078125, -0.414642333984375, -0.3491058349609375, -0.2835693359375, -0.2180328369140625, -0.152496337890625, -0.0869598388671875, -0.02142333984375, 0.0441131591796875, 0.109649658203125, 0.1751861572265625, 0.24072265625, 0.3062591552734375, 0.371795654296875, 0.4373321533203125, 0.50286865234375, 0.5684051513671875, 0.633941650390625, 0.6994781494140625, 0.7650146484375, 0.8305511474609375, 0.896087646484375, 0.9616241455078125, 1.02716064453125, 1.0926971435546875, 1.158233642578125, 1.2237701416015625, 1.289306640625, 1.3548431396484375, 1.420379638671875, 1.4859161376953125, 1.55145263671875, 1.6169891357421875, 1.682525634765625, 1.7480621337890625, 1.8135986328125, 1.8791351318359375, 1.944671630859375, 2.0102081298828125, 2.07574462890625, 2.1412811279296875, 2.206817626953125, 2.2723541259765625, 2.337890625]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 5.0, 6.0, 6.0, 16.0, 32.0, 44.0, 53.0, 71.0, 121.0, 98.0, 118.0, 119.0, 100.0, 84.0, 50.0, 31.0, 22.0, 12.0, 5.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51318359375, -0.4957275390625, -0.478271484375, -0.4608154296875, -0.443359375, -0.4259033203125, -0.408447265625, -0.3909912109375, -0.37353515625, -0.3560791015625, -0.338623046875, -0.3211669921875, -0.3037109375, -0.2862548828125, -0.268798828125, -0.2513427734375, -0.23388671875, -0.2164306640625, -0.198974609375, -0.1815185546875, -0.1640625, -0.1466064453125, -0.129150390625, -0.1116943359375, -0.09423828125, -0.0767822265625, -0.059326171875, -0.0418701171875, -0.0244140625, -0.0069580078125, 0.010498046875, 0.0279541015625, 0.04541015625, 0.0628662109375, 0.080322265625, 0.0977783203125, 0.115234375, 0.1326904296875, 0.150146484375, 0.1676025390625, 0.18505859375, 0.2025146484375, 0.219970703125, 0.2374267578125, 0.2548828125, 0.2723388671875, 0.289794921875, 0.3072509765625, 0.32470703125, 0.3421630859375, 0.359619140625, 0.3770751953125, 0.39453125, 0.4119873046875, 0.429443359375, 0.4468994140625, 0.46435546875, 0.4818115234375, 0.499267578125, 0.5167236328125, 0.5341796875, 0.5516357421875, 0.569091796875, 0.5865478515625, 0.60400390625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 4.0, 9.0, 7.0, 8.0, 16.0, 18.0, 18.0, 21.0, 30.0, 52.0, 59.0, 80.0, 142.0, 243.0, 457.0, 916.0, 2545.0, 7918.0, 31010.0, 151015.0, 528928.0, 254657.0, 51626.0, 12271.0, 3580.0, 1362.0, 610.0, 324.0, 205.0, 110.0, 81.0, 60.0, 41.0, 32.0, 20.0, 21.0, 9.0, 12.0, 9.0, 9.0, 3.0, 2.0, 6.0, 2.0, 3.0, 5.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.083984375, -1.0507965087890625, -1.017608642578125, -0.9844207763671875, -0.95123291015625, -0.9180450439453125, -0.884857177734375, -0.8516693115234375, -0.8184814453125, -0.7852935791015625, -0.752105712890625, -0.7189178466796875, -0.68572998046875, -0.6525421142578125, -0.619354248046875, -0.5861663818359375, -0.552978515625, -0.5197906494140625, -0.486602783203125, -0.4534149169921875, -0.42022705078125, -0.3870391845703125, -0.353851318359375, -0.3206634521484375, -0.2874755859375, -0.2542877197265625, -0.221099853515625, -0.1879119873046875, -0.15472412109375, -0.1215362548828125, -0.088348388671875, -0.0551605224609375, -0.02197265625, 0.0112152099609375, 0.044403076171875, 0.0775909423828125, 0.11077880859375, 0.1439666748046875, 0.177154541015625, 0.2103424072265625, 0.2435302734375, 0.2767181396484375, 0.309906005859375, 0.3430938720703125, 0.37628173828125, 0.4094696044921875, 0.442657470703125, 0.4758453369140625, 0.509033203125, 0.5422210693359375, 0.575408935546875, 0.6085968017578125, 0.64178466796875, 0.6749725341796875, 0.708160400390625, 0.7413482666015625, 0.7745361328125, 0.8077239990234375, 0.840911865234375, 0.8740997314453125, 0.90728759765625, 0.9404754638671875, 0.973663330078125, 1.0068511962890625, 1.0400390625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 5.0, 3.0, 2.0, 4.0, 11.0, 11.0, 12.0, 11.0, 17.0, 25.0, 43.0, 30.0, 46.0, 68.0, 50.0, 46.0, 59.0, 52.0, 51.0, 44.0, 47.0, 47.0, 39.0, 44.0, 38.0, 32.0, 29.0, 31.0, 19.0, 12.0, 19.0, 16.0, 12.0, 8.0, 10.0, 4.0, 6.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.970703125, -0.9362030029296875, -0.901702880859375, -0.8672027587890625, -0.83270263671875, -0.7982025146484375, -0.763702392578125, -0.7292022705078125, -0.6947021484375, -0.6602020263671875, -0.625701904296875, -0.5912017822265625, -0.55670166015625, -0.5222015380859375, -0.487701416015625, -0.4532012939453125, -0.418701171875, -0.3842010498046875, -0.349700927734375, -0.3152008056640625, -0.28070068359375, -0.2462005615234375, -0.211700439453125, -0.1772003173828125, -0.1427001953125, -0.1082000732421875, -0.073699951171875, -0.0391998291015625, -0.00469970703125, 0.0298004150390625, 0.064300537109375, 0.0988006591796875, 0.13330078125, 0.1678009033203125, 0.202301025390625, 0.2368011474609375, 0.27130126953125, 0.3058013916015625, 0.340301513671875, 0.3748016357421875, 0.4093017578125, 0.4438018798828125, 0.478302001953125, 0.5128021240234375, 0.54730224609375, 0.5818023681640625, 0.616302490234375, 0.6508026123046875, 0.685302734375, 0.7198028564453125, 0.754302978515625, 0.7888031005859375, 0.82330322265625, 0.8578033447265625, 0.892303466796875, 0.9268035888671875, 0.9613037109375, 0.9958038330078125, 1.030303955078125, 1.0648040771484375, 1.09930419921875, 1.1338043212890625, 1.168304443359375, 1.2028045654296875, 1.2373046875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 3.0, 4.0, 8.0, 8.0, 7.0, 12.0, 22.0, 29.0, 52.0, 66.0, 100.0, 157.0, 276.0, 551.0, 1279.0, 3766.0, 17632.0, 164650.0, 709518.0, 129907.0, 14820.0, 3286.0, 1131.0, 541.0, 290.0, 151.0, 84.0, 58.0, 47.0, 34.0, 22.0, 14.0, 12.0, 6.0, 12.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6376953125, -0.6160430908203125, -0.594390869140625, -0.5727386474609375, -0.55108642578125, -0.5294342041015625, -0.507781982421875, -0.4861297607421875, -0.4644775390625, -0.4428253173828125, -0.421173095703125, -0.3995208740234375, -0.37786865234375, -0.3562164306640625, -0.334564208984375, -0.3129119873046875, -0.291259765625, -0.2696075439453125, -0.247955322265625, -0.2263031005859375, -0.20465087890625, -0.1829986572265625, -0.161346435546875, -0.1396942138671875, -0.1180419921875, -0.0963897705078125, -0.074737548828125, -0.0530853271484375, -0.03143310546875, -0.0097808837890625, 0.011871337890625, 0.0335235595703125, 0.05517578125, 0.0768280029296875, 0.098480224609375, 0.1201324462890625, 0.14178466796875, 0.1634368896484375, 0.185089111328125, 0.2067413330078125, 0.2283935546875, 0.2500457763671875, 0.271697998046875, 0.2933502197265625, 0.31500244140625, 0.3366546630859375, 0.358306884765625, 0.3799591064453125, 0.401611328125, 0.4232635498046875, 0.444915771484375, 0.4665679931640625, 0.48822021484375, 0.5098724365234375, 0.531524658203125, 0.5531768798828125, 0.5748291015625, 0.5964813232421875, 0.618133544921875, 0.6397857666015625, 0.66143798828125, 0.6830902099609375, 0.704742431640625, 0.7263946533203125, 0.748046875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 4.0, 8.0, 4.0, 3.0, 15.0, 16.0, 40.0, 54.0, 81.0, 138.0, 174.0, 147.0, 126.0, 85.0, 40.0, 31.0, 17.0, 8.0, 7.0, 6.0, 0.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010389089584350586, -9.838584810495377e-05, -9.288080036640167e-05, -8.737575262784958e-05, -8.187070488929749e-05, -7.636565715074539e-05, -7.08606094121933e-05, -6.53555616736412e-05, -5.985051393508911e-05, -5.434546619653702e-05, -4.8840418457984924e-05, -4.333537071943283e-05, -3.783032298088074e-05, -3.2325275242328644e-05, -2.682022750377655e-05, -2.1315179765224457e-05, -1.5810132026672363e-05, -1.030508428812027e-05, -4.800036549568176e-06, 7.050111889839172e-07, 6.210058927536011e-06, 1.1715106666088104e-05, 1.7220154404640198e-05, 2.272520214319229e-05, 2.8230249881744385e-05, 3.373529762029648e-05, 3.924034535884857e-05, 4.4745393097400665e-05, 5.025044083595276e-05, 5.575548857450485e-05, 6.126053631305695e-05, 6.676558405160904e-05, 7.227063179016113e-05, 7.777567952871323e-05, 8.328072726726532e-05, 8.878577500581741e-05, 9.429082274436951e-05, 9.97958704829216e-05, 0.0001053009182214737, 0.00011080596596002579, 0.00011631101369857788, 0.00012181606143712997, 0.00012732110917568207, 0.00013282615691423416, 0.00013833120465278625, 0.00014383625239133835, 0.00014934130012989044, 0.00015484634786844254, 0.00016035139560699463, 0.00016585644334554672, 0.00017136149108409882, 0.0001768665388226509, 0.000182371586561203, 0.0001878766342997551, 0.0001933816820383072, 0.00019888672977685928, 0.00020439177751541138, 0.00020989682525396347, 0.00021540187299251556, 0.00022090692073106766, 0.00022641196846961975, 0.00023191701620817184, 0.00023742206394672394, 0.00024292711168527603, 0.0002484321594238281]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 7.0, 11.0, 15.0, 32.0, 45.0, 71.0, 117.0, 219.0, 517.0, 1403.0, 5707.0, 61908.0, 799258.0, 165502.0, 10438.0, 1974.0, 670.0, 279.0, 147.0, 87.0, 49.0, 21.0, 24.0, 14.0, 10.0, 8.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.89599609375, -0.8676910400390625, -0.839385986328125, -0.8110809326171875, -0.78277587890625, -0.7544708251953125, -0.726165771484375, -0.6978607177734375, -0.6695556640625, -0.6412506103515625, -0.612945556640625, -0.5846405029296875, -0.55633544921875, -0.5280303955078125, -0.499725341796875, -0.4714202880859375, -0.443115234375, -0.4148101806640625, -0.386505126953125, -0.3582000732421875, -0.32989501953125, -0.3015899658203125, -0.273284912109375, -0.2449798583984375, -0.2166748046875, -0.1883697509765625, -0.160064697265625, -0.1317596435546875, -0.10345458984375, -0.0751495361328125, -0.046844482421875, -0.0185394287109375, 0.009765625, 0.0380706787109375, 0.066375732421875, 0.0946807861328125, 0.12298583984375, 0.1512908935546875, 0.179595947265625, 0.2079010009765625, 0.2362060546875, 0.2645111083984375, 0.292816162109375, 0.3211212158203125, 0.34942626953125, 0.3777313232421875, 0.406036376953125, 0.4343414306640625, 0.462646484375, 0.4909515380859375, 0.519256591796875, 0.5475616455078125, 0.57586669921875, 0.6041717529296875, 0.632476806640625, 0.6607818603515625, 0.6890869140625, 0.7173919677734375, 0.745697021484375, 0.7740020751953125, 0.80230712890625, 0.8306121826171875, 0.858917236328125, 0.8872222900390625, 0.91552734375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 0.0, 5.0, 3.0, 6.0, 5.0, 9.0, 14.0, 37.0, 41.0, 62.0, 92.0, 99.0, 116.0, 120.0, 117.0, 81.0, 60.0, 50.0, 28.0, 20.0, 11.0, 5.0, 8.0, 7.0, 2.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.46337890625, -0.4463653564453125, -0.429351806640625, -0.4123382568359375, -0.39532470703125, -0.3783111572265625, -0.361297607421875, -0.3442840576171875, -0.3272705078125, -0.3102569580078125, -0.293243408203125, -0.2762298583984375, -0.25921630859375, -0.2422027587890625, -0.225189208984375, -0.2081756591796875, -0.191162109375, -0.1741485595703125, -0.157135009765625, -0.1401214599609375, -0.12310791015625, -0.1060943603515625, -0.089080810546875, -0.0720672607421875, -0.0550537109375, -0.0380401611328125, -0.021026611328125, -0.0040130615234375, 0.01300048828125, 0.0300140380859375, 0.047027587890625, 0.0640411376953125, 0.0810546875, 0.0980682373046875, 0.115081787109375, 0.1320953369140625, 0.14910888671875, 0.1661224365234375, 0.183135986328125, 0.2001495361328125, 0.2171630859375, 0.2341766357421875, 0.251190185546875, 0.2682037353515625, 0.28521728515625, 0.3022308349609375, 0.319244384765625, 0.3362579345703125, 0.353271484375, 0.3702850341796875, 0.387298583984375, 0.4043121337890625, 0.42132568359375, 0.4383392333984375, 0.455352783203125, 0.4723663330078125, 0.4893798828125, 0.5063934326171875, 0.523406982421875, 0.5404205322265625, 0.55743408203125, 0.5744476318359375, 0.591461181640625, 0.6084747314453125, 0.62548828125]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 12.0, 17.0, 24.0, 75.0, 121.0, 173.0, 205.0, 189.0, 86.0, 52.0, 24.0, 15.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.511625289916992, -12.199226379394531, -11.886826515197754, -11.574427604675293, -11.262028694152832, -10.949628829956055, -10.637229919433594, -10.324831008911133, -10.012432098388672, -9.700033187866211, -9.387633323669434, -9.075234413146973, -8.762835502624512, -8.450435638427734, -8.138036727905273, -7.8256378173828125, -7.513237953186035, -7.200838565826416, -6.888439655303955, -6.576040267944336, -6.263641357421875, -5.951241970062256, -5.638842582702637, -5.326443672180176, -5.014044284820557, -4.7016448974609375, -4.389245986938477, -4.076846599578857, -3.7644474506378174, -3.4520483016967773, -3.139648914337158, -2.827249765396118, -2.5148496627807617, -2.2024505138397217, -1.890051245689392, -1.5776519775390625, -1.2652528285980225, -0.9528536796569824, -0.6404544115066528, -0.32805514335632324, -0.015655994415283203, 0.2967432141304016, 0.6091424226760864, 0.9215416312217712, 1.233940839767456, 1.546339988708496, 1.8587392568588257, 2.1711385250091553, 2.4835376739501953, 2.7959368228912354, 3.1083359718322754, 3.4207353591918945, 3.7331345081329346, 4.045533657073975, 4.357933044433594, 4.670331954956055, 4.982731342315674, 5.295130729675293, 5.607529640197754, 5.919929027557373, 6.232328414916992, 6.544727325439453, 6.857126712799072, 7.169526100158691, 7.481925010681152]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 6.0, 2.0, 4.0, 9.0, 6.0, 14.0, 16.0, 18.0, 25.0, 23.0, 27.0, 45.0, 29.0, 55.0, 47.0, 47.0, 60.0, 59.0, 60.0, 53.0, 48.0, 45.0, 41.0, 45.0, 26.0, 28.0, 31.0, 31.0, 28.0, 19.0, 26.0, 12.0, 4.0, 4.0, 6.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.699517726898193, -6.519691467285156, -6.339865207672119, -6.160038948059082, -5.980213165283203, -5.800386905670166, -5.620560646057129, -5.440734386444092, -5.260908126831055, -5.081081867218018, -4.9012556076049805, -4.721429347991943, -4.541603088378906, -4.361777305603027, -4.18195104598999, -4.002124786376953, -3.822298526763916, -3.642472267150879, -3.462646007537842, -3.282819986343384, -3.1029937267303467, -2.9231674671173096, -2.7433414459228516, -2.5635151863098145, -2.3836889266967773, -2.2038626670837402, -2.024036407470703, -1.8442103862762451, -1.664384126663208, -1.484557867050171, -1.3047317266464233, -1.1249055862426758, -0.9450788497924805, -0.7652526497840881, -0.5854264497756958, -0.40560024976730347, -0.22577404975891113, -0.0459478497505188, 0.13387835025787354, 0.3137044906616211, 0.4935307502746582, 0.6733569502830505, 0.8531831502914429, 1.0330092906951904, 1.2128355503082275, 1.3926618099212646, 1.5724879503250122, 1.7523140907287598, 1.9321403503417969, 2.111966609954834, 2.291792869567871, 2.471618890762329, 2.651445150375366, 2.8312714099884033, 3.0110974311828613, 3.1909236907958984, 3.3707499504089355, 3.5505762100219727, 3.7304024696350098, 3.9102284908294678, 4.090054512023926, 4.269880771636963, 4.44970703125, 4.629533290863037, 4.809359550476074]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 7.0, 11.0, 11.0, 17.0, 15.0, 32.0, 50.0, 49.0, 84.0, 120.0, 196.0, 374.0, 762.0, 1740.0, 5156.0, 20360.0, 157991.0, 3823744.0, 154804.0, 19600.0, 5194.0, 1857.0, 841.0, 428.0, 291.0, 171.0, 108.0, 88.0, 56.0, 42.0, 24.0, 16.0, 6.0, 8.0, 6.0, 8.0, 7.0, 1.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.69140625, -1.6409149169921875, -1.590423583984375, -1.5399322509765625, -1.48944091796875, -1.4389495849609375, -1.388458251953125, -1.3379669189453125, -1.2874755859375, -1.2369842529296875, -1.186492919921875, -1.1360015869140625, -1.08551025390625, -1.0350189208984375, -0.984527587890625, -0.9340362548828125, -0.883544921875, -0.8330535888671875, -0.782562255859375, -0.7320709228515625, -0.68157958984375, -0.6310882568359375, -0.580596923828125, -0.5301055908203125, -0.4796142578125, -0.4291229248046875, -0.378631591796875, -0.3281402587890625, -0.27764892578125, -0.2271575927734375, -0.176666259765625, -0.1261749267578125, -0.07568359375, -0.0251922607421875, 0.025299072265625, 0.0757904052734375, 0.12628173828125, 0.1767730712890625, 0.227264404296875, 0.2777557373046875, 0.3282470703125, 0.3787384033203125, 0.429229736328125, 0.4797210693359375, 0.53021240234375, 0.5807037353515625, 0.631195068359375, 0.6816864013671875, 0.732177734375, 0.7826690673828125, 0.833160400390625, 0.8836517333984375, 0.93414306640625, 0.9846343994140625, 1.035125732421875, 1.0856170654296875, 1.1361083984375, 1.1865997314453125, 1.237091064453125, 1.2875823974609375, 1.33807373046875, 1.3885650634765625, 1.439056396484375, 1.4895477294921875, 1.5400390625]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 6.0, 4.0, 9.0, 13.0, 18.0, 36.0, 62.0, 104.0, 104.0, 114.0, 126.0, 132.0, 93.0, 65.0, 55.0, 21.0, 16.0, 15.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58740234375, -0.5686264038085938, -0.5498504638671875, -0.5310745239257812, -0.512298583984375, -0.49352264404296875, -0.4747467041015625, -0.45597076416015625, -0.43719482421875, -0.41841888427734375, -0.3996429443359375, -0.38086700439453125, -0.362091064453125, -0.34331512451171875, -0.3245391845703125, -0.30576324462890625, -0.2869873046875, -0.26821136474609375, -0.2494354248046875, -0.23065948486328125, -0.211883544921875, -0.19310760498046875, -0.1743316650390625, -0.15555572509765625, -0.13677978515625, -0.11800384521484375, -0.0992279052734375, -0.08045196533203125, -0.061676025390625, -0.04290008544921875, -0.0241241455078125, -0.00534820556640625, 0.013427734375, 0.03220367431640625, 0.0509796142578125, 0.06975555419921875, 0.088531494140625, 0.10730743408203125, 0.1260833740234375, 0.14485931396484375, 0.16363525390625, 0.18241119384765625, 0.2011871337890625, 0.21996307373046875, 0.238739013671875, 0.25751495361328125, 0.2762908935546875, 0.29506683349609375, 0.3138427734375, 0.33261871337890625, 0.3513946533203125, 0.37017059326171875, 0.388946533203125, 0.40772247314453125, 0.4264984130859375, 0.44527435302734375, 0.46405029296875, 0.48282623291015625, 0.5016021728515625, 0.5203781127929688, 0.539154052734375, 0.5579299926757812, 0.5767059326171875, 0.5954818725585938, 0.6142578125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 4.0, 3.0, 7.0, 11.0, 17.0, 26.0, 50.0, 126.0, 203.0, 353.0, 779.0, 1751.0, 4516.0, 15077.0, 73758.0, 2116064.0, 1887014.0, 72136.0, 14806.0, 4473.0, 1616.0, 764.0, 341.0, 173.0, 97.0, 53.0, 27.0, 21.0, 8.0, 2.0, 1.0, 6.0, 2.0, 1.0, 1.0], "bins": [-1.791015625, -1.7512130737304688, -1.7114105224609375, -1.6716079711914062, -1.631805419921875, -1.5920028686523438, -1.5522003173828125, -1.5123977661132812, -1.47259521484375, -1.4327926635742188, -1.3929901123046875, -1.3531875610351562, -1.313385009765625, -1.2735824584960938, -1.2337799072265625, -1.1939773559570312, -1.1541748046875, -1.1143722534179688, -1.0745697021484375, -1.0347671508789062, -0.994964599609375, -0.9551620483398438, -0.9153594970703125, -0.8755569458007812, -0.83575439453125, -0.7959518432617188, -0.7561492919921875, -0.7163467407226562, -0.676544189453125, -0.6367416381835938, -0.5969390869140625, -0.5571365356445312, -0.517333984375, -0.47753143310546875, -0.4377288818359375, -0.39792633056640625, -0.358123779296875, -0.31832122802734375, -0.2785186767578125, -0.23871612548828125, -0.19891357421875, -0.15911102294921875, -0.1193084716796875, -0.07950592041015625, -0.039703369140625, 9.918212890625e-05, 0.0399017333984375, 0.07970428466796875, 0.1195068359375, 0.15930938720703125, 0.1991119384765625, 0.23891448974609375, 0.278717041015625, 0.31851959228515625, 0.3583221435546875, 0.39812469482421875, 0.43792724609375, 0.47772979736328125, 0.5175323486328125, 0.5573348999023438, 0.597137451171875, 0.6369400024414062, 0.6767425537109375, 0.7165451049804688, 0.75634765625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 2.0, 4.0, 6.0, 2.0, 8.0, 15.0, 15.0, 13.0, 39.0, 47.0, 65.0, 82.0, 175.0, 308.0, 1280.0, 1256.0, 337.0, 173.0, 91.0, 47.0, 35.0, 19.0, 17.0, 6.0, 9.0, 7.0, 4.0, 2.0, 4.0, 2.0, 2.0, 0.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.53369140625, -0.5200042724609375, -0.506317138671875, -0.4926300048828125, -0.47894287109375, -0.4652557373046875, -0.451568603515625, -0.4378814697265625, -0.4241943359375, -0.4105072021484375, -0.396820068359375, -0.3831329345703125, -0.36944580078125, -0.3557586669921875, -0.342071533203125, -0.3283843994140625, -0.314697265625, -0.3010101318359375, -0.287322998046875, -0.2736358642578125, -0.25994873046875, -0.2462615966796875, -0.232574462890625, -0.2188873291015625, -0.2052001953125, -0.1915130615234375, -0.177825927734375, -0.1641387939453125, -0.15045166015625, -0.1367645263671875, -0.123077392578125, -0.1093902587890625, -0.095703125, -0.0820159912109375, -0.068328857421875, -0.0546417236328125, -0.04095458984375, -0.0272674560546875, -0.013580322265625, 0.0001068115234375, 0.0137939453125, 0.0274810791015625, 0.041168212890625, 0.0548553466796875, 0.06854248046875, 0.0822296142578125, 0.095916748046875, 0.1096038818359375, 0.123291015625, 0.1369781494140625, 0.150665283203125, 0.1643524169921875, 0.17803955078125, 0.1917266845703125, 0.205413818359375, 0.2191009521484375, 0.2327880859375, 0.2464752197265625, 0.260162353515625, 0.2738494873046875, 0.28753662109375, 0.3012237548828125, 0.314910888671875, 0.3285980224609375, 0.34228515625]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 0.0, 3.0, 3.0, 16.0, 65.0, 164.0, 297.0, 283.0, 116.0, 38.0, 12.0, 6.0, 6.0], "bins": [-10.268869400024414, -10.091272354125977, -9.913675308227539, -9.736079216003418, -9.55848217010498, -9.380885124206543, -9.203288078308105, -9.025691986083984, -8.848094940185547, -8.67049789428711, -8.492900848388672, -8.31530475616455, -8.137707710266113, -7.960110664367676, -7.7825140953063965, -7.604917049407959, -7.42732048034668, -7.249723434448242, -7.072126865386963, -6.894529819488525, -6.716933250427246, -6.539336204528809, -6.361739635467529, -6.184142589569092, -6.006545543670654, -5.828948497772217, -5.6513519287109375, -5.4737548828125, -5.296158313751221, -5.118561267852783, -4.940964698791504, -4.763367652893066, -4.585771560668945, -4.408174514770508, -4.2305779457092285, -4.052980899810791, -3.8753843307495117, -3.6977875232696533, -3.520190715789795, -3.3425936698913574, -3.16499662399292, -2.9873998165130615, -2.809803009033203, -2.6322062015533447, -2.4546093940734863, -2.277012586593628, -2.0994157791137695, -1.9218188524246216, -1.7442221641540527, -1.5666253566741943, -1.389028549194336, -1.2114317417144775, -1.0338349342346191, -0.856238067150116, -0.6786412000656128, -0.5010443925857544, -0.323447585105896, -0.1458507627248764, 0.03174605965614319, 0.20934289693832397, 0.3869397044181824, 0.5645365118980408, 0.742133378982544, 0.9197301864624023, 1.0973269939422607]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 8.0, 11.0, 17.0, 21.0, 20.0, 37.0, 39.0, 48.0, 56.0, 65.0, 69.0, 79.0, 77.0, 81.0, 66.0, 50.0, 49.0, 54.0, 45.0, 32.0, 27.0, 16.0, 11.0, 8.0, 5.0, 7.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.4956579208374023, -2.4305272102355957, -2.36539626121521, -2.3002655506134033, -2.2351346015930176, -2.170003890991211, -2.1048731803894043, -2.0397422313690186, -1.974611520767212, -1.9094806909561157, -1.8443498611450195, -1.779219150543213, -1.7140883207321167, -1.6489574909210205, -1.5838267803192139, -1.5186959505081177, -1.4535651206970215, -1.3884342908859253, -1.323303461074829, -1.2581727504730225, -1.1930419206619263, -1.12791109085083, -1.0627803802490234, -0.9976495504379272, -0.932518720626831, -0.8673878908157349, -0.8022571206092834, -0.737126350402832, -0.6719955205917358, -0.6068646907806396, -0.5417339205741882, -0.47660312056541443, -0.4114725589752197, -0.3463417589664459, -0.2812109589576721, -0.21608015894889832, -0.1509493589401245, -0.08581855893135071, -0.020687758922576904, 0.0444430410861969, 0.1095738410949707, 0.1747046411037445, 0.2398354411125183, 0.3049662411212921, 0.3700970411300659, 0.4352278411388397, 0.5003586411476135, 0.5654894113540649, 0.6306202411651611, 0.6957510709762573, 0.7608818411827087, 0.8260126113891602, 0.8911434412002563, 0.9562742710113525, 1.0214049816131592, 1.0865358114242554, 1.1516666412353516, 1.2167974710464478, 1.281928300857544, 1.3470590114593506, 1.4121898412704468, 1.477320671081543, 1.5424513816833496, 1.6075822114944458, 1.672713041305542]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 3.0, 11.0, 19.0, 28.0, 39.0, 68.0, 138.0, 257.0, 486.0, 915.0, 2183.0, 8406.0, 82226.0, 767870.0, 166882.0, 13792.0, 2909.0, 1144.0, 525.0, 276.0, 146.0, 91.0, 41.0, 34.0, 19.0, 14.0, 8.0, 5.0, 4.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.341796875, -2.27215576171875, -2.2025146484375, -2.13287353515625, -2.063232421875, -1.99359130859375, -1.9239501953125, -1.85430908203125, -1.78466796875, -1.71502685546875, -1.6453857421875, -1.57574462890625, -1.506103515625, -1.43646240234375, -1.3668212890625, -1.29718017578125, -1.2275390625, -1.15789794921875, -1.0882568359375, -1.01861572265625, -0.948974609375, -0.87933349609375, -0.8096923828125, -0.74005126953125, -0.67041015625, -0.60076904296875, -0.5311279296875, -0.46148681640625, -0.391845703125, -0.32220458984375, -0.2525634765625, -0.18292236328125, -0.11328125, -0.04364013671875, 0.0260009765625, 0.09564208984375, 0.165283203125, 0.23492431640625, 0.3045654296875, 0.37420654296875, 0.44384765625, 0.51348876953125, 0.5831298828125, 0.65277099609375, 0.722412109375, 0.79205322265625, 0.8616943359375, 0.93133544921875, 1.0009765625, 1.07061767578125, 1.1402587890625, 1.20989990234375, 1.279541015625, 1.34918212890625, 1.4188232421875, 1.48846435546875, 1.55810546875, 1.62774658203125, 1.6973876953125, 1.76702880859375, 1.836669921875, 1.90631103515625, 1.9759521484375, 2.04559326171875, 2.115234375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 4.0, 14.0, 20.0, 36.0, 53.0, 98.0, 117.0, 113.0, 142.0, 128.0, 94.0, 75.0, 41.0, 33.0, 19.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69921875, -0.6788406372070312, -0.6584625244140625, -0.6380844116210938, -0.617706298828125, -0.5973281860351562, -0.5769500732421875, -0.5565719604492188, -0.53619384765625, -0.5158157348632812, -0.4954376220703125, -0.47505950927734375, -0.454681396484375, -0.43430328369140625, -0.4139251708984375, -0.39354705810546875, -0.3731689453125, -0.35279083251953125, -0.3324127197265625, -0.31203460693359375, -0.291656494140625, -0.27127838134765625, -0.2509002685546875, -0.23052215576171875, -0.21014404296875, -0.18976593017578125, -0.1693878173828125, -0.14900970458984375, -0.128631591796875, -0.10825347900390625, -0.0878753662109375, -0.06749725341796875, -0.047119140625, -0.02674102783203125, -0.0063629150390625, 0.01401519775390625, 0.034393310546875, 0.05477142333984375, 0.0751495361328125, 0.09552764892578125, 0.11590576171875, 0.13628387451171875, 0.1566619873046875, 0.17704010009765625, 0.197418212890625, 0.21779632568359375, 0.2381744384765625, 0.25855255126953125, 0.2789306640625, 0.29930877685546875, 0.3196868896484375, 0.34006500244140625, 0.360443115234375, 0.38082122802734375, 0.4011993408203125, 0.42157745361328125, 0.44195556640625, 0.46233367919921875, 0.4827117919921875, 0.5030899047851562, 0.523468017578125, 0.5438461303710938, 0.5642242431640625, 0.5846023559570312, 0.60498046875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 11.0, 10.0, 11.0, 18.0, 18.0, 22.0, 28.0, 54.0, 64.0, 73.0, 110.0, 156.0, 255.0, 437.0, 1102.0, 3322.0, 11312.0, 41561.0, 164282.0, 483023.0, 253700.0, 64072.0, 16876.0, 4873.0, 1612.0, 609.0, 307.0, 175.0, 115.0, 78.0, 64.0, 43.0, 38.0, 32.0, 24.0, 8.0, 13.0, 14.0, 5.0, 8.0, 1.0, 6.0, 2.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.87158203125, -0.8448944091796875, -0.818206787109375, -0.7915191650390625, -0.76483154296875, -0.7381439208984375, -0.711456298828125, -0.6847686767578125, -0.6580810546875, -0.6313934326171875, -0.604705810546875, -0.5780181884765625, -0.55133056640625, -0.5246429443359375, -0.497955322265625, -0.4712677001953125, -0.444580078125, -0.4178924560546875, -0.391204833984375, -0.3645172119140625, -0.33782958984375, -0.3111419677734375, -0.284454345703125, -0.2577667236328125, -0.2310791015625, -0.2043914794921875, -0.177703857421875, -0.1510162353515625, -0.12432861328125, -0.0976409912109375, -0.070953369140625, -0.0442657470703125, -0.017578125, 0.0091094970703125, 0.035797119140625, 0.0624847412109375, 0.08917236328125, 0.1158599853515625, 0.142547607421875, 0.1692352294921875, 0.1959228515625, 0.2226104736328125, 0.249298095703125, 0.2759857177734375, 0.30267333984375, 0.3293609619140625, 0.356048583984375, 0.3827362060546875, 0.409423828125, 0.4361114501953125, 0.462799072265625, 0.4894866943359375, 0.51617431640625, 0.5428619384765625, 0.569549560546875, 0.5962371826171875, 0.6229248046875, 0.6496124267578125, 0.676300048828125, 0.7029876708984375, 0.72967529296875, 0.7563629150390625, 0.783050537109375, 0.8097381591796875, 0.83642578125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 7.0, 4.0, 6.0, 2.0, 7.0, 10.0, 11.0, 5.0, 12.0, 12.0, 13.0, 17.0, 21.0, 16.0, 22.0, 35.0, 31.0, 32.0, 43.0, 41.0, 28.0, 50.0, 49.0, 38.0, 45.0, 38.0, 32.0, 35.0, 32.0, 34.0, 32.0, 41.0, 29.0, 20.0, 22.0, 20.0, 21.0, 14.0, 12.0, 10.0, 14.0, 9.0, 3.0, 5.0, 9.0, 4.0, 2.0, 7.0, 6.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7744140625, -0.7495346069335938, -0.7246551513671875, -0.6997756958007812, -0.674896240234375, -0.6500167846679688, -0.6251373291015625, -0.6002578735351562, -0.57537841796875, -0.5504989624023438, -0.5256195068359375, -0.5007400512695312, -0.475860595703125, -0.45098114013671875, -0.4261016845703125, -0.40122222900390625, -0.3763427734375, -0.35146331787109375, -0.3265838623046875, -0.30170440673828125, -0.276824951171875, -0.25194549560546875, -0.2270660400390625, -0.20218658447265625, -0.17730712890625, -0.15242767333984375, -0.1275482177734375, -0.10266876220703125, -0.077789306640625, -0.05290985107421875, -0.0280303955078125, -0.00315093994140625, 0.021728515625, 0.04660797119140625, 0.0714874267578125, 0.09636688232421875, 0.121246337890625, 0.14612579345703125, 0.1710052490234375, 0.19588470458984375, 0.22076416015625, 0.24564361572265625, 0.2705230712890625, 0.29540252685546875, 0.320281982421875, 0.34516143798828125, 0.3700408935546875, 0.39492034912109375, 0.4197998046875, 0.44467926025390625, 0.4695587158203125, 0.49443817138671875, 0.519317626953125, 0.5441970825195312, 0.5690765380859375, 0.5939559936523438, 0.61883544921875, 0.6437149047851562, 0.6685943603515625, 0.6934738159179688, 0.718353271484375, 0.7432327270507812, 0.7681121826171875, 0.7929916381835938, 0.81787109375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 4.0, 4.0, 8.0, 14.0, 17.0, 35.0, 59.0, 83.0, 111.0, 156.0, 219.0, 380.0, 778.0, 1714.0, 5006.0, 20803.0, 133972.0, 607704.0, 232121.0, 33818.0, 7106.0, 2268.0, 933.0, 496.0, 265.0, 176.0, 109.0, 60.0, 45.0, 30.0, 26.0, 9.0, 13.0, 8.0, 1.0, 2.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.310791015625, -0.2964286804199219, -0.28206634521484375, -0.2677040100097656, -0.2533416748046875, -0.23897933959960938, -0.22461700439453125, -0.21025466918945312, -0.195892333984375, -0.18152999877929688, -0.16716766357421875, -0.15280532836914062, -0.1384429931640625, -0.12408065795898438, -0.10971832275390625, -0.09535598754882812, -0.08099365234375, -0.06663131713867188, -0.05226898193359375, -0.037906646728515625, -0.0235443115234375, -0.009181976318359375, 0.00518035888671875, 0.019542694091796875, 0.033905029296875, 0.048267364501953125, 0.06262969970703125, 0.07699203491210938, 0.0913543701171875, 0.10571670532226562, 0.12007904052734375, 0.13444137573242188, 0.1488037109375, 0.16316604614257812, 0.17752838134765625, 0.19189071655273438, 0.2062530517578125, 0.22061538696289062, 0.23497772216796875, 0.24934005737304688, 0.263702392578125, 0.2780647277832031, 0.29242706298828125, 0.3067893981933594, 0.3211517333984375, 0.3355140686035156, 0.34987640380859375, 0.3642387390136719, 0.37860107421875, 0.3929634094238281, 0.40732574462890625, 0.4216880798339844, 0.4360504150390625, 0.4504127502441406, 0.46477508544921875, 0.4791374206542969, 0.493499755859375, 0.5078620910644531, 0.5222244262695312, 0.5365867614746094, 0.5509490966796875, 0.5653114318847656, 0.5796737670898438, 0.5940361022949219, 0.6083984375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 2.0, 6.0, 5.0, 9.0, 27.0, 31.0, 41.0, 65.0, 90.0, 81.0, 118.0, 115.0, 102.0, 81.0, 72.0, 47.0, 35.0, 20.0, 21.0, 6.0, 9.0, 10.0, 4.0, 2.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.232759475708008e-05, -8.917786180973053e-05, -8.602812886238098e-05, -8.287839591503143e-05, -7.972866296768188e-05, -7.657893002033234e-05, -7.342919707298279e-05, -7.027946412563324e-05, -6.712973117828369e-05, -6.397999823093414e-05, -6.0830265283584595e-05, -5.7680532336235046e-05, -5.45307993888855e-05, -5.138106644153595e-05, -4.82313334941864e-05, -4.508160054683685e-05, -4.1931867599487305e-05, -3.8782134652137756e-05, -3.563240170478821e-05, -3.248266875743866e-05, -2.933293581008911e-05, -2.6183202862739563e-05, -2.3033469915390015e-05, -1.9883736968040466e-05, -1.6734004020690918e-05, -1.358427107334137e-05, -1.0434538125991821e-05, -7.284805178642273e-06, -4.135072231292725e-06, -9.853392839431763e-07, 2.164393663406372e-06, 5.31412661075592e-06, 8.463859558105469e-06, 1.1613592505455017e-05, 1.4763325452804565e-05, 1.7913058400154114e-05, 2.1062791347503662e-05, 2.421252429485321e-05, 2.736225724220276e-05, 3.0511990189552307e-05, 3.3661723136901855e-05, 3.6811456084251404e-05, 3.996118903160095e-05, 4.31109219789505e-05, 4.626065492630005e-05, 4.94103878736496e-05, 5.2560120820999146e-05, 5.5709853768348694e-05, 5.885958671569824e-05, 6.200931966304779e-05, 6.515905261039734e-05, 6.830878555774689e-05, 7.145851850509644e-05, 7.460825145244598e-05, 7.775798439979553e-05, 8.090771734714508e-05, 8.405745029449463e-05, 8.720718324184418e-05, 9.035691618919373e-05, 9.350664913654327e-05, 9.665638208389282e-05, 9.980611503124237e-05, 0.00010295584797859192, 0.00010610558092594147, 0.00010925531387329102]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 5.0, 6.0, 15.0, 34.0, 45.0, 100.0, 228.0, 536.0, 1579.0, 5784.0, 45591.0, 659843.0, 309537.0, 19887.0, 3485.0, 1150.0, 389.0, 179.0, 70.0, 44.0, 19.0, 10.0, 6.0, 5.0, 5.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.79052734375, -0.7696304321289062, -0.7487335205078125, -0.7278366088867188, -0.706939697265625, -0.6860427856445312, -0.6651458740234375, -0.6442489624023438, -0.62335205078125, -0.6024551391601562, -0.5815582275390625, -0.5606613159179688, -0.539764404296875, -0.5188674926757812, -0.4979705810546875, -0.47707366943359375, -0.4561767578125, -0.43527984619140625, -0.4143829345703125, -0.39348602294921875, -0.372589111328125, -0.35169219970703125, -0.3307952880859375, -0.30989837646484375, -0.28900146484375, -0.26810455322265625, -0.2472076416015625, -0.22631072998046875, -0.205413818359375, -0.18451690673828125, -0.1636199951171875, -0.14272308349609375, -0.121826171875, -0.10092926025390625, -0.0800323486328125, -0.05913543701171875, -0.038238525390625, -0.01734161376953125, 0.0035552978515625, 0.02445220947265625, 0.04534912109375, 0.06624603271484375, 0.0871429443359375, 0.10803985595703125, 0.128936767578125, 0.14983367919921875, 0.1707305908203125, 0.19162750244140625, 0.2125244140625, 0.23342132568359375, 0.2543182373046875, 0.27521514892578125, 0.296112060546875, 0.31700897216796875, 0.3379058837890625, 0.35880279541015625, 0.37969970703125, 0.40059661865234375, 0.4214935302734375, 0.44239044189453125, 0.463287353515625, 0.48418426513671875, 0.5050811767578125, 0.5259780883789062, 0.546875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 5.0, 6.0, 5.0, 19.0, 11.0, 25.0, 26.0, 41.0, 49.0, 52.0, 69.0, 98.0, 70.0, 81.0, 85.0, 69.0, 76.0, 57.0, 38.0, 29.0, 26.0, 18.0, 12.0, 8.0, 7.0, 4.0, 6.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.40625, -0.39566802978515625, -0.3850860595703125, -0.37450408935546875, -0.363922119140625, -0.35334014892578125, -0.3427581787109375, -0.33217620849609375, -0.32159423828125, -0.31101226806640625, -0.3004302978515625, -0.28984832763671875, -0.279266357421875, -0.26868438720703125, -0.2581024169921875, -0.24752044677734375, -0.2369384765625, -0.22635650634765625, -0.2157745361328125, -0.20519256591796875, -0.194610595703125, -0.18402862548828125, -0.1734466552734375, -0.16286468505859375, -0.15228271484375, -0.14170074462890625, -0.1311187744140625, -0.12053680419921875, -0.109954833984375, -0.09937286376953125, -0.0887908935546875, -0.07820892333984375, -0.067626953125, -0.05704498291015625, -0.0464630126953125, -0.03588104248046875, -0.025299072265625, -0.01471710205078125, -0.0041351318359375, 0.00644683837890625, 0.01702880859375, 0.02761077880859375, 0.0381927490234375, 0.04877471923828125, 0.059356689453125, 0.06993865966796875, 0.0805206298828125, 0.09110260009765625, 0.1016845703125, 0.11226654052734375, 0.1228485107421875, 0.13343048095703125, 0.144012451171875, 0.15459442138671875, 0.1651763916015625, 0.17575836181640625, 0.18634033203125, 0.19692230224609375, 0.2075042724609375, 0.21808624267578125, 0.228668212890625, 0.23925018310546875, 0.2498321533203125, 0.26041412353515625, 0.27099609375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 39.0, 79.0, 156.0, 264.0, 224.0, 133.0, 66.0, 25.0, 11.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.559551239013672, -12.207952499389648, -11.856354713439941, -11.504755973815918, -11.153157234191895, -10.801559448242188, -10.449960708618164, -10.09836196899414, -9.746763229370117, -9.395164489746094, -9.043566703796387, -8.691967964172363, -8.34036922454834, -7.988770961761475, -7.637172698974609, -7.285573959350586, -6.933976173400879, -6.582377910614014, -6.23077917098999, -5.879180908203125, -5.527582168579102, -5.175983905792236, -4.824385643005371, -4.472786903381348, -4.121188640594482, -3.769590139389038, -3.4179916381835938, -3.0663933753967285, -2.714794874191284, -2.36319637298584, -2.0115981101989746, -1.6599996089935303, -1.3084001541137695, -0.95680171251297, -0.6052032709121704, -0.2536048889160156, 0.09799361228942871, 0.44959211349487305, 0.8011903762817383, 1.1527888774871826, 1.504387378692627, 1.8559858798980713, 2.2075843811035156, 2.559182643890381, 2.910781145095825, 3.2623796463012695, 3.6139779090881348, 3.965576410293579, 4.317174911499023, 4.668773174285889, 5.020371913909912, 5.371970176696777, 5.723568916320801, 6.075167179107666, 6.426765441894531, 6.778364181518555, 7.12996244430542, 7.481560707092285, 7.833159446716309, 8.184757232666016, 8.536355972290039, 8.887954711914062, 9.239553451538086, 9.591151237487793, 9.942749977111816]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 5.0, 7.0, 17.0, 11.0, 16.0, 16.0, 13.0, 25.0, 27.0, 30.0, 41.0, 41.0, 30.0, 45.0, 44.0, 35.0, 43.0, 57.0, 44.0, 41.0, 50.0, 36.0, 44.0, 36.0, 32.0, 35.0, 33.0, 33.0, 19.0, 24.0, 12.0, 11.0, 14.0, 15.0, 10.0, 7.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.811568737030029, -4.672929286956787, -4.534289836883545, -4.395650386810303, -4.257011413574219, -4.118371963500977, -3.9797325134277344, -3.841093063354492, -3.70245361328125, -3.563814163208008, -3.4251747131347656, -3.2865355014801025, -3.1478960514068604, -3.009256601333618, -2.870617389678955, -2.731977939605713, -2.5933384895324707, -2.4546990394592285, -2.3160595893859863, -2.1774203777313232, -2.038780927658081, -1.9001414775848389, -1.7615021467208862, -1.6228628158569336, -1.4842233657836914, -1.3455839157104492, -1.2069445848464966, -1.068305253982544, -0.9296658039093018, -0.7910264134407043, -0.6523870229721069, -0.5137476325035095, -0.3751077651977539, -0.2364683747291565, -0.09782898426055908, 0.04081040620803833, 0.17944979667663574, 0.31808918714523315, 0.45672857761383057, 0.595367968082428, 0.7340073585510254, 0.8726467490196228, 1.0112861394882202, 1.1499254703521729, 1.288564920425415, 1.4272043704986572, 1.5658437013626099, 1.7044830322265625, 1.8431224822998047, 1.9817619323730469, 2.120401382446289, 2.259040594100952, 2.3976800441741943, 2.5363194942474365, 2.6749587059020996, 2.813598155975342, 2.952237606048584, 3.090877056121826, 3.2295165061950684, 3.3681557178497314, 3.5067951679229736, 3.645434617996216, 3.784073829650879, 3.922713279724121, 4.061352729797363]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 6.0, 12.0, 20.0, 27.0, 36.0, 64.0, 133.0, 216.0, 374.0, 864.0, 2516.0, 11537.0, 180052.0, 3950300.0, 39404.0, 5496.0, 1659.0, 704.0, 335.0, 192.0, 136.0, 66.0, 45.0, 34.0, 10.0, 8.0, 3.0, 5.0, 4.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.146484375, -3.05975341796875, -2.9730224609375, -2.88629150390625, -2.799560546875, -2.71282958984375, -2.6260986328125, -2.53936767578125, -2.45263671875, -2.36590576171875, -2.2791748046875, -2.19244384765625, -2.105712890625, -2.01898193359375, -1.9322509765625, -1.84552001953125, -1.7587890625, -1.67205810546875, -1.5853271484375, -1.49859619140625, -1.411865234375, -1.32513427734375, -1.2384033203125, -1.15167236328125, -1.06494140625, -0.97821044921875, -0.8914794921875, -0.80474853515625, -0.718017578125, -0.63128662109375, -0.5445556640625, -0.45782470703125, -0.37109375, -0.28436279296875, -0.1976318359375, -0.11090087890625, -0.024169921875, 0.06256103515625, 0.1492919921875, 0.23602294921875, 0.32275390625, 0.40948486328125, 0.4962158203125, 0.58294677734375, 0.669677734375, 0.75640869140625, 0.8431396484375, 0.92987060546875, 1.0166015625, 1.10333251953125, 1.1900634765625, 1.27679443359375, 1.363525390625, 1.45025634765625, 1.5369873046875, 1.62371826171875, 1.71044921875, 1.79718017578125, 1.8839111328125, 1.97064208984375, 2.057373046875, 2.14410400390625, 2.2308349609375, 2.31756591796875, 2.404296875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 6.0, 5.0, 20.0, 27.0, 45.0, 77.0, 107.0, 112.0, 130.0, 112.0, 112.0, 97.0, 64.0, 44.0, 24.0, 6.0, 9.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6796875, -0.6596145629882812, -0.6395416259765625, -0.6194686889648438, -0.599395751953125, -0.5793228149414062, -0.5592498779296875, -0.5391769409179688, -0.51910400390625, -0.49903106689453125, -0.4789581298828125, -0.45888519287109375, -0.438812255859375, -0.41873931884765625, -0.3986663818359375, -0.37859344482421875, -0.3585205078125, -0.33844757080078125, -0.3183746337890625, -0.29830169677734375, -0.278228759765625, -0.25815582275390625, -0.2380828857421875, -0.21800994873046875, -0.19793701171875, -0.17786407470703125, -0.1577911376953125, -0.13771820068359375, -0.117645263671875, -0.09757232666015625, -0.0774993896484375, -0.05742645263671875, -0.037353515625, -0.01728057861328125, 0.0027923583984375, 0.02286529541015625, 0.042938232421875, 0.06301116943359375, 0.0830841064453125, 0.10315704345703125, 0.12322998046875, 0.14330291748046875, 0.1633758544921875, 0.18344879150390625, 0.203521728515625, 0.22359466552734375, 0.2436676025390625, 0.26374053955078125, 0.2838134765625, 0.30388641357421875, 0.3239593505859375, 0.34403228759765625, 0.364105224609375, 0.38417816162109375, 0.4042510986328125, 0.42432403564453125, 0.44439697265625, 0.46446990966796875, 0.4845428466796875, 0.5046157836914062, 0.524688720703125, 0.5447616577148438, 0.5648345947265625, 0.5849075317382812, 0.60498046875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 9.0, 14.0, 23.0, 38.0, 73.0, 102.0, 170.0, 288.0, 527.0, 996.0, 1968.0, 4502.0, 12091.0, 46979.0, 412169.0, 3553822.0, 123132.0, 23651.0, 7478.0, 3019.0, 1456.0, 742.0, 439.0, 215.0, 173.0, 72.0, 50.0, 34.0, 17.0, 8.0, 10.0, 7.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0966796875, -1.0592041015625, -1.021728515625, -0.9842529296875, -0.94677734375, -0.9093017578125, -0.871826171875, -0.8343505859375, -0.796875, -0.7593994140625, -0.721923828125, -0.6844482421875, -0.64697265625, -0.6094970703125, -0.572021484375, -0.5345458984375, -0.4970703125, -0.4595947265625, -0.422119140625, -0.3846435546875, -0.34716796875, -0.3096923828125, -0.272216796875, -0.2347412109375, -0.197265625, -0.1597900390625, -0.122314453125, -0.0848388671875, -0.04736328125, -0.0098876953125, 0.027587890625, 0.0650634765625, 0.1025390625, 0.1400146484375, 0.177490234375, 0.2149658203125, 0.25244140625, 0.2899169921875, 0.327392578125, 0.3648681640625, 0.40234375, 0.4398193359375, 0.477294921875, 0.5147705078125, 0.55224609375, 0.5897216796875, 0.627197265625, 0.6646728515625, 0.7021484375, 0.7396240234375, 0.777099609375, 0.8145751953125, 0.85205078125, 0.8895263671875, 0.927001953125, 0.9644775390625, 1.001953125, 1.0394287109375, 1.076904296875, 1.1143798828125, 1.15185546875, 1.1893310546875, 1.226806640625, 1.2642822265625, 1.3017578125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 5.0, 4.0, 1.0, 11.0, 25.0, 25.0, 46.0, 79.0, 170.0, 484.0, 2445.0, 399.0, 150.0, 90.0, 44.0, 22.0, 25.0, 15.0, 9.0, 7.0, 6.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.5205078125, -0.5022048950195312, -0.4839019775390625, -0.46559906005859375, -0.447296142578125, -0.42899322509765625, -0.4106903076171875, -0.39238739013671875, -0.37408447265625, -0.35578155517578125, -0.3374786376953125, -0.31917572021484375, -0.300872802734375, -0.28256988525390625, -0.2642669677734375, -0.24596405029296875, -0.2276611328125, -0.20935821533203125, -0.1910552978515625, -0.17275238037109375, -0.154449462890625, -0.13614654541015625, -0.1178436279296875, -0.09954071044921875, -0.08123779296875, -0.06293487548828125, -0.0446319580078125, -0.02632904052734375, -0.008026123046875, 0.01027679443359375, 0.0285797119140625, 0.04688262939453125, 0.065185546875, 0.08348846435546875, 0.1017913818359375, 0.12009429931640625, 0.138397216796875, 0.15670013427734375, 0.1750030517578125, 0.19330596923828125, 0.21160888671875, 0.22991180419921875, 0.2482147216796875, 0.26651763916015625, 0.284820556640625, 0.30312347412109375, 0.3214263916015625, 0.33972930908203125, 0.3580322265625, 0.37633514404296875, 0.3946380615234375, 0.41294097900390625, 0.431243896484375, 0.44954681396484375, 0.4678497314453125, 0.48615264892578125, 0.50445556640625, 0.5227584838867188, 0.5410614013671875, 0.5593643188476562, 0.577667236328125, 0.5959701538085938, 0.6142730712890625, 0.6325759887695312, 0.65087890625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 12.0, 46.0, 510.0, 388.0, 36.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.754898548126221, -4.38496732711792, -4.015035629272461, -3.64510440826416, -3.2751729488372803, -2.9052414894104004, -2.5353102684020996, -2.1653788089752197, -1.7954473495483398, -1.42551589012146, -1.0555845499038696, -0.6856532096862793, -0.3157217502593994, 0.05420970916748047, 0.42414093017578125, 0.7940723896026611, 1.164003849029541, 1.533935308456421, 1.9038666486740112, 2.2737979888916016, 2.6437294483184814, 3.0136609077453613, 3.383592128753662, 3.753523588180542, 4.123455047607422, 4.493386268615723, 4.863317966461182, 5.233249187469482, 5.603180885314941, 5.973112106323242, 6.343043327331543, 6.712974548339844, 7.082906723022461, 7.452837944030762, 7.822769641876221, 8.19270133972168, 8.56263256072998, 8.932563781738281, 9.302495002746582, 9.672426223754883, 10.0423583984375, 10.4122896194458, 10.782220840454102, 11.152153015136719, 11.52208423614502, 11.89201545715332, 12.261946678161621, 12.631877899169922, 13.001809120178223, 13.371740341186523, 13.741671562194824, 14.111602783203125, 14.481534957885742, 14.851466178894043, 15.221397399902344, 15.591328620910645, 15.961259841918945, 16.331192016601562, 16.701122283935547, 17.071054458618164, 17.44098472595215, 17.810916900634766, 18.18084716796875, 18.550779342651367, 18.920711517333984]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 8.0, 6.0, 8.0, 9.0, 12.0, 14.0, 14.0, 27.0, 28.0, 27.0, 32.0, 48.0, 48.0, 54.0, 48.0, 69.0, 37.0, 62.0, 65.0, 49.0, 41.0, 46.0, 48.0, 46.0, 35.0, 21.0, 20.0, 14.0, 18.0, 9.0, 11.0, 6.0, 6.0, 3.0, 5.0, 2.0, 1.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3293942213058472, -1.2811225652694702, -1.2328509092330933, -1.1845792531967163, -1.1363075971603394, -1.0880359411239624, -1.039764165878296, -0.9914925694465637, -0.9432209134101868, -0.8949492573738098, -0.8466776013374329, -0.7984058856964111, -0.7501342296600342, -0.7018625736236572, -0.6535909175872803, -0.6053192615509033, -0.5570476055145264, -0.5087759494781494, -0.46050429344177246, -0.4122326076030731, -0.36396095156669617, -0.3156892955303192, -0.2674176096916199, -0.21914595365524292, -0.17087429761886597, -0.12260263413190842, -0.07433097064495087, -0.02605929970741272, 0.022212356328964233, 0.07048401236534119, 0.11875569820404053, 0.16702735424041748, 0.21529912948608398, 0.26357078552246094, 0.3118424415588379, 0.36011412739753723, 0.4083857834339142, 0.45665743947029114, 0.5049291253089905, 0.5532007813453674, 0.6014724373817444, 0.6497440934181213, 0.6980157494544983, 0.74628746509552, 0.794559121131897, 0.8428307771682739, 0.8911024332046509, 0.9393740892410278, 0.9876457452774048, 1.0359174013137817, 1.0841890573501587, 1.1324607133865356, 1.1807323694229126, 1.2290040254592896, 1.277275800704956, 1.325547456741333, 1.37381911277771, 1.422090768814087, 1.4703624248504639, 1.5186340808868408, 1.5669057369232178, 1.6151773929595947, 1.6634490489959717, 1.7117207050323486, 1.7599923610687256]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 4.0, 3.0, 14.0, 18.0, 21.0, 23.0, 30.0, 57.0, 54.0, 98.0, 123.0, 194.0, 278.0, 395.0, 561.0, 914.0, 1525.0, 3153.0, 9156.0, 38188.0, 187048.0, 529433.0, 215330.0, 43817.0, 10264.0, 3465.0, 1573.0, 928.0, 595.0, 400.0, 259.0, 189.0, 137.0, 100.0, 53.0, 36.0, 32.0, 25.0, 18.0, 16.0, 11.0, 8.0, 5.0, 7.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.37890625, -1.3389892578125, -1.299072265625, -1.2591552734375, -1.21923828125, -1.1793212890625, -1.139404296875, -1.0994873046875, -1.0595703125, -1.0196533203125, -0.979736328125, -0.9398193359375, -0.89990234375, -0.8599853515625, -0.820068359375, -0.7801513671875, -0.740234375, -0.7003173828125, -0.660400390625, -0.6204833984375, -0.58056640625, -0.5406494140625, -0.500732421875, -0.4608154296875, -0.4208984375, -0.3809814453125, -0.341064453125, -0.3011474609375, -0.26123046875, -0.2213134765625, -0.181396484375, -0.1414794921875, -0.1015625, -0.0616455078125, -0.021728515625, 0.0181884765625, 0.05810546875, 0.0980224609375, 0.137939453125, 0.1778564453125, 0.2177734375, 0.2576904296875, 0.297607421875, 0.3375244140625, 0.37744140625, 0.4173583984375, 0.457275390625, 0.4971923828125, 0.537109375, 0.5770263671875, 0.616943359375, 0.6568603515625, 0.69677734375, 0.7366943359375, 0.776611328125, 0.8165283203125, 0.8564453125, 0.8963623046875, 0.936279296875, 0.9761962890625, 1.01611328125, 1.0560302734375, 1.095947265625, 1.1358642578125, 1.17578125]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 6.0, 13.0, 30.0, 42.0, 66.0, 91.0, 109.0, 149.0, 130.0, 104.0, 103.0, 63.0, 36.0, 27.0, 11.0, 12.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.72216796875, -0.7009735107421875, -0.679779052734375, -0.6585845947265625, -0.63739013671875, -0.6161956787109375, -0.595001220703125, -0.5738067626953125, -0.5526123046875, -0.5314178466796875, -0.510223388671875, -0.4890289306640625, -0.46783447265625, -0.4466400146484375, -0.425445556640625, -0.4042510986328125, -0.383056640625, -0.3618621826171875, -0.340667724609375, -0.3194732666015625, -0.29827880859375, -0.2770843505859375, -0.255889892578125, -0.2346954345703125, -0.2135009765625, -0.1923065185546875, -0.171112060546875, -0.1499176025390625, -0.12872314453125, -0.1075286865234375, -0.086334228515625, -0.0651397705078125, -0.0439453125, -0.0227508544921875, -0.001556396484375, 0.0196380615234375, 0.04083251953125, 0.0620269775390625, 0.083221435546875, 0.1044158935546875, 0.1256103515625, 0.1468048095703125, 0.167999267578125, 0.1891937255859375, 0.21038818359375, 0.2315826416015625, 0.252777099609375, 0.2739715576171875, 0.295166015625, 0.3163604736328125, 0.337554931640625, 0.3587493896484375, 0.37994384765625, 0.4011383056640625, 0.422332763671875, 0.4435272216796875, 0.4647216796875, 0.4859161376953125, 0.507110595703125, 0.5283050537109375, 0.54949951171875, 0.5706939697265625, 0.591888427734375, 0.6130828857421875, 0.63427734375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 2.0, 5.0, 1.0, 7.0, 6.0, 10.0, 18.0, 21.0, 23.0, 28.0, 40.0, 66.0, 88.0, 134.0, 195.0, 323.0, 558.0, 1174.0, 2693.0, 7412.0, 22412.0, 69799.0, 206345.0, 390587.0, 228052.0, 78706.0, 25362.0, 8489.0, 3119.0, 1233.0, 595.0, 337.0, 207.0, 126.0, 102.0, 79.0, 47.0, 36.0, 33.0, 22.0, 18.0, 14.0, 9.0, 7.0, 3.0, 5.0, 5.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.642578125, -0.6215438842773438, -0.6005096435546875, -0.5794754028320312, -0.558441162109375, -0.5374069213867188, -0.5163726806640625, -0.49533843994140625, -0.47430419921875, -0.45326995849609375, -0.4322357177734375, -0.41120147705078125, -0.390167236328125, -0.36913299560546875, -0.3480987548828125, -0.32706451416015625, -0.3060302734375, -0.28499603271484375, -0.2639617919921875, -0.24292755126953125, -0.221893310546875, -0.20085906982421875, -0.1798248291015625, -0.15879058837890625, -0.13775634765625, -0.11672210693359375, -0.0956878662109375, -0.07465362548828125, -0.053619384765625, -0.03258514404296875, -0.0115509033203125, 0.00948333740234375, 0.030517578125, 0.05155181884765625, 0.0725860595703125, 0.09362030029296875, 0.114654541015625, 0.13568878173828125, 0.1567230224609375, 0.17775726318359375, 0.19879150390625, 0.21982574462890625, 0.2408599853515625, 0.26189422607421875, 0.282928466796875, 0.30396270751953125, 0.3249969482421875, 0.34603118896484375, 0.3670654296875, 0.38809967041015625, 0.4091339111328125, 0.43016815185546875, 0.451202392578125, 0.47223663330078125, 0.4932708740234375, 0.5143051147460938, 0.53533935546875, 0.5563735961914062, 0.5774078369140625, 0.5984420776367188, 0.619476318359375, 0.6405105590820312, 0.6615447998046875, 0.6825790405273438, 0.70361328125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 4.0, 7.0, 4.0, 8.0, 14.0, 12.0, 11.0, 20.0, 19.0, 23.0, 20.0, 26.0, 34.0, 39.0, 37.0, 32.0, 36.0, 39.0, 51.0, 52.0, 49.0, 52.0, 35.0, 38.0, 35.0, 32.0, 42.0, 36.0, 22.0, 24.0, 23.0, 23.0, 20.0, 20.0, 15.0, 11.0, 4.0, 8.0, 6.0, 6.0, 1.0, 3.0, 1.0, 4.0, 2.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.0107421875, -0.9805374145507812, -0.9503326416015625, -0.9201278686523438, -0.889923095703125, -0.8597183227539062, -0.8295135498046875, -0.7993087768554688, -0.76910400390625, -0.7388992309570312, -0.7086944580078125, -0.6784896850585938, -0.648284912109375, -0.6180801391601562, -0.5878753662109375, -0.5576705932617188, -0.5274658203125, -0.49726104736328125, -0.4670562744140625, -0.43685150146484375, -0.406646728515625, -0.37644195556640625, -0.3462371826171875, -0.31603240966796875, -0.28582763671875, -0.25562286376953125, -0.2254180908203125, -0.19521331787109375, -0.165008544921875, -0.13480377197265625, -0.1045989990234375, -0.07439422607421875, -0.044189453125, -0.01398468017578125, 0.0162200927734375, 0.04642486572265625, 0.076629638671875, 0.10683441162109375, 0.1370391845703125, 0.16724395751953125, 0.19744873046875, 0.22765350341796875, 0.2578582763671875, 0.28806304931640625, 0.318267822265625, 0.34847259521484375, 0.3786773681640625, 0.40888214111328125, 0.4390869140625, 0.46929168701171875, 0.4994964599609375, 0.5297012329101562, 0.559906005859375, 0.5901107788085938, 0.6203155517578125, 0.6505203247070312, 0.68072509765625, 0.7109298706054688, 0.7411346435546875, 0.7713394165039062, 0.801544189453125, 0.8317489624023438, 0.8619537353515625, 0.8921585083007812, 0.92236328125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 3.0, 5.0, 7.0, 9.0, 10.0, 18.0, 36.0, 44.0, 93.0, 168.0, 348.0, 777.0, 2087.0, 7075.0, 43723.0, 424502.0, 502879.0, 54650.0, 8181.0, 2222.0, 877.0, 395.0, 200.0, 87.0, 62.0, 40.0, 26.0, 14.0, 8.0, 1.0, 3.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5029296875, -0.48673248291015625, -0.4705352783203125, -0.45433807373046875, -0.438140869140625, -0.42194366455078125, -0.4057464599609375, -0.38954925537109375, -0.37335205078125, -0.35715484619140625, -0.3409576416015625, -0.32476043701171875, -0.308563232421875, -0.29236602783203125, -0.2761688232421875, -0.25997161865234375, -0.2437744140625, -0.22757720947265625, -0.2113800048828125, -0.19518280029296875, -0.178985595703125, -0.16278839111328125, -0.1465911865234375, -0.13039398193359375, -0.11419677734375, -0.09799957275390625, -0.0818023681640625, -0.06560516357421875, -0.049407958984375, -0.03321075439453125, -0.0170135498046875, -0.00081634521484375, 0.015380859375, 0.03157806396484375, 0.0477752685546875, 0.06397247314453125, 0.080169677734375, 0.09636688232421875, 0.1125640869140625, 0.12876129150390625, 0.14495849609375, 0.16115570068359375, 0.1773529052734375, 0.19355010986328125, 0.209747314453125, 0.22594451904296875, 0.2421417236328125, 0.25833892822265625, 0.2745361328125, 0.29073333740234375, 0.3069305419921875, 0.32312774658203125, 0.339324951171875, 0.35552215576171875, 0.3717193603515625, 0.38791656494140625, 0.40411376953125, 0.42031097412109375, 0.4365081787109375, 0.45270538330078125, 0.468902587890625, 0.48509979248046875, 0.5012969970703125, 0.5174942016601562, 0.53369140625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 6.0, 10.0, 6.0, 12.0, 13.0, 22.0, 21.0, 22.0, 32.0, 41.0, 55.0, 60.0, 55.0, 71.0, 62.0, 79.0, 81.0, 57.0, 62.0, 50.0, 35.0, 27.0, 23.0, 23.0, 16.0, 19.0, 9.0, 9.0, 6.0, 5.0, 4.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4405460357666016e-05, -4.2557716369628906e-05, -4.07099723815918e-05, -3.886222839355469e-05, -3.701448440551758e-05, -3.516674041748047e-05, -3.331899642944336e-05, -3.147125244140625e-05, -2.962350845336914e-05, -2.777576446533203e-05, -2.5928020477294922e-05, -2.4080276489257812e-05, -2.2232532501220703e-05, -2.0384788513183594e-05, -1.8537044525146484e-05, -1.6689300537109375e-05, -1.4841556549072266e-05, -1.2993812561035156e-05, -1.1146068572998047e-05, -9.298324584960938e-06, -7.450580596923828e-06, -5.602836608886719e-06, -3.7550926208496094e-06, -1.9073486328125e-06, -5.960464477539063e-08, 1.7881393432617188e-06, 3.635883331298828e-06, 5.4836273193359375e-06, 7.331371307373047e-06, 9.179115295410156e-06, 1.1026859283447266e-05, 1.2874603271484375e-05, 1.4722347259521484e-05, 1.6570091247558594e-05, 1.8417835235595703e-05, 2.0265579223632812e-05, 2.2113323211669922e-05, 2.396106719970703e-05, 2.580881118774414e-05, 2.765655517578125e-05, 2.950429916381836e-05, 3.135204315185547e-05, 3.319978713989258e-05, 3.504753112792969e-05, 3.68952751159668e-05, 3.8743019104003906e-05, 4.0590763092041016e-05, 4.2438507080078125e-05, 4.4286251068115234e-05, 4.6133995056152344e-05, 4.798173904418945e-05, 4.982948303222656e-05, 5.167722702026367e-05, 5.352497100830078e-05, 5.537271499633789e-05, 5.7220458984375e-05, 5.906820297241211e-05, 6.091594696044922e-05, 6.276369094848633e-05, 6.461143493652344e-05, 6.645917892456055e-05, 6.830692291259766e-05, 7.015466690063477e-05, 7.200241088867188e-05, 7.385015487670898e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 4.0, 16.0, 20.0, 38.0, 49.0, 108.0, 164.0, 419.0, 1386.0, 6663.0, 52815.0, 536656.0, 406214.0, 37009.0, 5054.0, 1188.0, 371.0, 154.0, 93.0, 47.0, 31.0, 32.0, 18.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.76904296875, -0.7476348876953125, -0.726226806640625, -0.7048187255859375, -0.68341064453125, -0.6620025634765625, -0.640594482421875, -0.6191864013671875, -0.5977783203125, -0.5763702392578125, -0.554962158203125, -0.5335540771484375, -0.51214599609375, -0.4907379150390625, -0.469329833984375, -0.4479217529296875, -0.426513671875, -0.4051055908203125, -0.383697509765625, -0.3622894287109375, -0.34088134765625, -0.3194732666015625, -0.298065185546875, -0.2766571044921875, -0.2552490234375, -0.2338409423828125, -0.212432861328125, -0.1910247802734375, -0.16961669921875, -0.1482086181640625, -0.126800537109375, -0.1053924560546875, -0.083984375, -0.0625762939453125, -0.041168212890625, -0.0197601318359375, 0.00164794921875, 0.0230560302734375, 0.044464111328125, 0.0658721923828125, 0.0872802734375, 0.1086883544921875, 0.130096435546875, 0.1515045166015625, 0.17291259765625, 0.1943206787109375, 0.215728759765625, 0.2371368408203125, 0.258544921875, 0.2799530029296875, 0.301361083984375, 0.3227691650390625, 0.34417724609375, 0.3655853271484375, 0.386993408203125, 0.4084014892578125, 0.4298095703125, 0.4512176513671875, 0.472625732421875, 0.4940338134765625, 0.51544189453125, 0.5368499755859375, 0.558258056640625, 0.5796661376953125, 0.60107421875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 9.0, 5.0, 16.0, 14.0, 11.0, 20.0, 13.0, 24.0, 23.0, 43.0, 34.0, 43.0, 55.0, 70.0, 81.0, 70.0, 69.0, 75.0, 55.0, 50.0, 39.0, 25.0, 35.0, 23.0, 20.0, 11.0, 19.0, 9.0, 7.0, 8.0, 3.0, 3.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.341552734375, -0.330291748046875, -0.31903076171875, -0.307769775390625, -0.2965087890625, -0.285247802734375, -0.27398681640625, -0.262725830078125, -0.25146484375, -0.240203857421875, -0.22894287109375, -0.217681884765625, -0.2064208984375, -0.195159912109375, -0.18389892578125, -0.172637939453125, -0.161376953125, -0.150115966796875, -0.13885498046875, -0.127593994140625, -0.1163330078125, -0.105072021484375, -0.09381103515625, -0.082550048828125, -0.0712890625, -0.060028076171875, -0.04876708984375, -0.037506103515625, -0.0262451171875, -0.014984130859375, -0.00372314453125, 0.007537841796875, 0.018798828125, 0.030059814453125, 0.04132080078125, 0.052581787109375, 0.0638427734375, 0.075103759765625, 0.08636474609375, 0.097625732421875, 0.10888671875, 0.120147705078125, 0.13140869140625, 0.142669677734375, 0.1539306640625, 0.165191650390625, 0.17645263671875, 0.187713623046875, 0.198974609375, 0.210235595703125, 0.22149658203125, 0.232757568359375, 0.2440185546875, 0.255279541015625, 0.26654052734375, 0.277801513671875, 0.2890625, 0.300323486328125, 0.31158447265625, 0.322845458984375, 0.3341064453125, 0.345367431640625, 0.35662841796875, 0.367889404296875, 0.379150390625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 9.0, 26.0, 79.0, 209.0, 276.0, 213.0, 124.0, 40.0, 19.0, 7.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.354331970214844, -11.903773307800293, -11.453214645385742, -11.002655982971191, -10.55209732055664, -10.10153865814209, -9.650979995727539, -9.200422286987305, -8.749862670898438, -8.299304008483887, -7.848745346069336, -7.398186683654785, -6.947628021240234, -6.497069358825684, -6.046511173248291, -5.59595251083374, -5.145394325256348, -4.694835662841797, -4.244277000427246, -3.7937185764312744, -3.3431599140167236, -2.892601251602173, -2.442042827606201, -1.9914841651916504, -1.5409255027770996, -1.0903668403625488, -0.6398082971572876, -0.18924975395202637, 0.2613089084625244, 0.7118675708770752, 1.1624259948730469, 1.6129846572875977, 2.0635433197021484, 2.514101982116699, 2.96466064453125, 3.4152190685272217, 3.8657777309417725, 4.316336631774902, 4.766894817352295, 5.217453479766846, 5.6680121421813965, 6.118570804595947, 6.569129467010498, 7.019687652587891, 7.470246315002441, 7.920804977416992, 8.371363639831543, 8.821922302246094, 9.272480964660645, 9.723039627075195, 10.173598289489746, 10.624156951904297, 11.074715614318848, 11.525274276733398, 11.975831985473633, 12.4263916015625, 12.876949310302734, 13.327507972717285, 13.778066635131836, 14.228625297546387, 14.679183959960938, 15.129742622375488, 15.580301284790039, 16.030858993530273, 16.48141860961914]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 2.0, 0.0, 6.0, 5.0, 9.0, 7.0, 9.0, 14.0, 11.0, 11.0, 14.0, 19.0, 16.0, 26.0, 20.0, 20.0, 34.0, 28.0, 42.0, 38.0, 41.0, 35.0, 40.0, 37.0, 46.0, 37.0, 36.0, 38.0, 31.0, 36.0, 35.0, 27.0, 29.0, 28.0, 22.0, 24.0, 21.0, 21.0, 13.0, 5.0, 21.0, 9.0, 10.0, 11.0, 4.0, 6.0, 3.0, 2.0, 0.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.773796081542969, -4.630876541137695, -4.487957000732422, -4.345037460327148, -4.202117919921875, -4.059198379516602, -3.9162790775299072, -3.773359537124634, -3.6304399967193604, -3.487520456314087, -3.3446009159088135, -3.20168137550354, -3.0587620735168457, -2.9158425331115723, -2.772922992706299, -2.6300034523010254, -2.487083911895752, -2.3441643714904785, -2.201244831085205, -2.0583252906799316, -1.9154058694839478, -1.7724863290786743, -1.6295669078826904, -1.486647367477417, -1.3437278270721436, -1.2008082866668701, -1.0578887462615967, -0.9149693250656128, -0.7720497846603394, -0.6291302442550659, -0.48621076345443726, -0.3432912826538086, -0.20037174224853516, -0.057452231645584106, 0.08546727895736694, 0.228386789560318, 0.37130630016326904, 0.5142258405685425, 0.6571453213691711, 0.8000648021697998, 0.9429843425750732, 1.0859038829803467, 1.2288234233856201, 1.371742844581604, 1.5146623849868774, 1.6575819253921509, 1.8005013465881348, 1.9434208869934082, 2.0863404273986816, 2.229259967803955, 2.3721795082092285, 2.515099048614502, 2.6580185890197754, 2.800938129425049, 2.943857431411743, 3.0867769718170166, 3.22969651222229, 3.3726160526275635, 3.515535593032837, 3.6584551334381104, 3.8013744354248047, 3.944293975830078, 4.087213516235352, 4.230133056640625, 4.373052597045898]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 3.0, 11.0, 11.0, 11.0, 12.0, 11.0, 21.0, 31.0, 50.0, 67.0, 81.0, 123.0, 207.0, 356.0, 639.0, 1535.0, 3959.0, 14122.0, 82710.0, 3882832.0, 176342.0, 20955.0, 5584.0, 2077.0, 972.0, 521.0, 349.0, 224.0, 147.0, 99.0, 64.0, 50.0, 21.0, 27.0, 13.0, 13.0, 7.0, 6.0, 4.0, 7.0, 8.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9013671875, -1.8431243896484375, -1.784881591796875, -1.7266387939453125, -1.66839599609375, -1.6101531982421875, -1.551910400390625, -1.4936676025390625, -1.4354248046875, -1.3771820068359375, -1.318939208984375, -1.2606964111328125, -1.20245361328125, -1.1442108154296875, -1.085968017578125, -1.0277252197265625, -0.969482421875, -0.9112396240234375, -0.852996826171875, -0.7947540283203125, -0.73651123046875, -0.6782684326171875, -0.620025634765625, -0.5617828369140625, -0.5035400390625, -0.4452972412109375, -0.387054443359375, -0.3288116455078125, -0.27056884765625, -0.2123260498046875, -0.154083251953125, -0.0958404541015625, -0.03759765625, 0.0206451416015625, 0.078887939453125, 0.1371307373046875, 0.19537353515625, 0.2536163330078125, 0.311859130859375, 0.3701019287109375, 0.4283447265625, 0.4865875244140625, 0.544830322265625, 0.6030731201171875, 0.66131591796875, 0.7195587158203125, 0.777801513671875, 0.8360443115234375, 0.894287109375, 0.9525299072265625, 1.010772705078125, 1.0690155029296875, 1.12725830078125, 1.1855010986328125, 1.243743896484375, 1.3019866943359375, 1.3602294921875, 1.4184722900390625, 1.476715087890625, 1.5349578857421875, 1.59320068359375, 1.6514434814453125, 1.709686279296875, 1.7679290771484375, 1.826171875]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 1.0, 6.0, 16.0, 30.0, 53.0, 69.0, 106.0, 129.0, 119.0, 139.0, 115.0, 75.0, 66.0, 32.0, 19.0, 9.0, 8.0, 3.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.767578125, -0.7455215454101562, -0.7234649658203125, -0.7014083862304688, -0.679351806640625, -0.6572952270507812, -0.6352386474609375, -0.6131820678710938, -0.59112548828125, -0.5690689086914062, -0.5470123291015625, -0.5249557495117188, -0.502899169921875, -0.48084259033203125, -0.4587860107421875, -0.43672943115234375, -0.4146728515625, -0.39261627197265625, -0.3705596923828125, -0.34850311279296875, -0.326446533203125, -0.30438995361328125, -0.2823333740234375, -0.26027679443359375, -0.23822021484375, -0.21616363525390625, -0.1941070556640625, -0.17205047607421875, -0.149993896484375, -0.12793731689453125, -0.1058807373046875, -0.08382415771484375, -0.061767578125, -0.03971099853515625, -0.0176544189453125, 0.00440216064453125, 0.026458740234375, 0.04851531982421875, 0.0705718994140625, 0.09262847900390625, 0.11468505859375, 0.13674163818359375, 0.1587982177734375, 0.18085479736328125, 0.202911376953125, 0.22496795654296875, 0.2470245361328125, 0.26908111572265625, 0.2911376953125, 0.31319427490234375, 0.3352508544921875, 0.35730743408203125, 0.379364013671875, 0.40142059326171875, 0.4234771728515625, 0.44553375244140625, 0.46759033203125, 0.48964691162109375, 0.5117034912109375, 0.5337600708007812, 0.555816650390625, 0.5778732299804688, 0.5999298095703125, 0.6219863891601562, 0.64404296875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 10.0, 9.0, 15.0, 30.0, 38.0, 57.0, 81.0, 173.0, 285.0, 414.0, 730.0, 1342.0, 2481.0, 5198.0, 13637.0, 46751.0, 301498.0, 3601738.0, 167222.0, 32786.0, 10347.0, 4413.0, 2194.0, 1148.0, 715.0, 379.0, 254.0, 116.0, 90.0, 50.0, 30.0, 19.0, 12.0, 9.0, 5.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1875, -1.1539306640625, -1.120361328125, -1.0867919921875, -1.05322265625, -1.0196533203125, -0.986083984375, -0.9525146484375, -0.9189453125, -0.8853759765625, -0.851806640625, -0.8182373046875, -0.78466796875, -0.7510986328125, -0.717529296875, -0.6839599609375, -0.650390625, -0.6168212890625, -0.583251953125, -0.5496826171875, -0.51611328125, -0.4825439453125, -0.448974609375, -0.4154052734375, -0.3818359375, -0.3482666015625, -0.314697265625, -0.2811279296875, -0.24755859375, -0.2139892578125, -0.180419921875, -0.1468505859375, -0.11328125, -0.0797119140625, -0.046142578125, -0.0125732421875, 0.02099609375, 0.0545654296875, 0.088134765625, 0.1217041015625, 0.1552734375, 0.1888427734375, 0.222412109375, 0.2559814453125, 0.28955078125, 0.3231201171875, 0.356689453125, 0.3902587890625, 0.423828125, 0.4573974609375, 0.490966796875, 0.5245361328125, 0.55810546875, 0.5916748046875, 0.625244140625, 0.6588134765625, 0.6923828125, 0.7259521484375, 0.759521484375, 0.7930908203125, 0.82666015625, 0.8602294921875, 0.893798828125, 0.9273681640625, 0.9609375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 5.0, 14.0, 12.0, 11.0, 18.0, 34.0, 32.0, 93.0, 207.0, 993.0, 2079.0, 286.0, 117.0, 64.0, 34.0, 18.0, 17.0, 17.0, 5.0, 7.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6611328125, -0.6384048461914062, -0.6156768798828125, -0.5929489135742188, -0.570220947265625, -0.5474929809570312, -0.5247650146484375, -0.5020370483398438, -0.47930908203125, -0.45658111572265625, -0.4338531494140625, -0.41112518310546875, -0.388397216796875, -0.36566925048828125, -0.3429412841796875, -0.32021331787109375, -0.2974853515625, -0.27475738525390625, -0.2520294189453125, -0.22930145263671875, -0.206573486328125, -0.18384552001953125, -0.1611175537109375, -0.13838958740234375, -0.11566162109375, -0.09293365478515625, -0.0702056884765625, -0.04747772216796875, -0.024749755859375, -0.00202178955078125, 0.0207061767578125, 0.04343414306640625, 0.066162109375, 0.08889007568359375, 0.1116180419921875, 0.13434600830078125, 0.157073974609375, 0.17980194091796875, 0.2025299072265625, 0.22525787353515625, 0.24798583984375, 0.27071380615234375, 0.2934417724609375, 0.31616973876953125, 0.338897705078125, 0.36162567138671875, 0.3843536376953125, 0.40708160400390625, 0.4298095703125, 0.45253753662109375, 0.4752655029296875, 0.49799346923828125, 0.520721435546875, 0.5434494018554688, 0.5661773681640625, 0.5889053344726562, 0.61163330078125, 0.6343612670898438, 0.6570892333984375, 0.6798171997070312, 0.702545166015625, 0.7252731323242188, 0.7480010986328125, 0.7707290649414062, 0.79345703125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 4.0, 8.0, 12.0, 38.0, 133.0, 281.0, 274.0, 155.0, 60.0, 22.0, 8.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.252060890197754, -3.0498206615448, -2.8475801944732666, -2.6453399658203125, -2.4430997371673584, -2.2408595085144043, -2.038619041442871, -1.836378812789917, -1.6341384649276733, -1.4318981170654297, -1.2296578884124756, -1.027417540550232, -0.8251772522926331, -0.6229369640350342, -0.4206966161727905, -0.21845638751983643, -0.016216039657592773, 0.1860242635011673, 0.38826456665992737, 0.5905048847198486, 0.7927451729774475, 0.9949854612350464, 1.19722580909729, 1.3994660377502441, 1.6017063856124878, 1.8039467334747314, 2.0061869621276855, 2.2084274291992188, 2.410667657852173, 2.612907886505127, 2.81514835357666, 3.017388343811035, 3.2196288108825684, 3.4218690395355225, 3.6241095066070557, 3.8263497352600098, 4.028590202331543, 4.230830192565918, 4.433070659637451, 4.635311126708984, 4.837551116943359, 5.039791584014893, 5.242031574249268, 5.444272041320801, 5.646512508392334, 5.848752498626709, 6.050992965698242, 6.253232955932617, 6.455473899841309, 6.657714366912842, 6.859954357147217, 7.06219482421875, 7.264435291290283, 7.466675281524658, 7.668915748596191, 7.871155738830566, 8.073395729064941, 8.275635719299316, 8.477876663208008, 8.680116653442383, 8.882356643676758, 9.08459758758545, 9.286837577819824, 9.4890775680542, 9.69131851196289]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 8.0, 11.0, 6.0, 23.0, 17.0, 28.0, 27.0, 33.0, 32.0, 38.0, 37.0, 50.0, 57.0, 60.0, 57.0, 53.0, 58.0, 53.0, 43.0, 55.0, 45.0, 38.0, 29.0, 30.0, 21.0, 28.0, 18.0, 14.0, 9.0, 5.0, 3.0, 1.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-2.105159282684326, -2.0450165271759033, -1.984873652458191, -1.924730896949768, -1.8645880222320557, -1.8044452667236328, -1.74430251121521, -1.6841596364974976, -1.6240167617797852, -1.5638740062713623, -1.50373113155365, -1.443588376045227, -1.3834455013275146, -1.3233027458190918, -1.263159990310669, -1.2030171155929565, -1.1428743600845337, -1.0827316045761108, -1.0225887298583984, -0.9624459743499756, -0.9023030996322632, -0.8421603441238403, -0.7820175290107727, -0.7218747138977051, -0.6617318987846375, -0.6015890836715698, -0.5414462685585022, -0.48130348324775696, -0.42116066813468933, -0.3610178530216217, -0.30087506771087646, -0.24073225259780884, -0.1805894374847412, -0.12044662982225418, -0.06030382215976715, -0.00016102194786071777, 0.05998179316520691, 0.12012460827827454, 0.18026739358901978, 0.2404102087020874, 0.30055302381515503, 0.36069583892822266, 0.4208386540412903, 0.4809814393520355, 0.5411242246627808, 0.6012670993804932, 0.661409854888916, 0.7215526700019836, 0.7816954851150513, 0.8418383002281189, 0.9019811153411865, 0.9621238708496094, 1.0222667455673218, 1.0824095010757446, 1.142552375793457, 1.2026951313018799, 1.2628378868103027, 1.3229806423187256, 1.383123517036438, 1.4432662725448608, 1.5034091472625732, 1.563551902770996, 1.623694658279419, 1.6838375329971313, 1.7439804077148438]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 2.0, 7.0, 7.0, 20.0, 13.0, 33.0, 44.0, 63.0, 85.0, 159.0, 239.0, 395.0, 678.0, 1276.0, 2534.0, 7341.0, 37224.0, 297865.0, 579933.0, 97891.0, 14745.0, 4039.0, 1775.0, 880.0, 459.0, 297.0, 188.0, 113.0, 74.0, 58.0, 36.0, 27.0, 12.0, 9.0, 8.0, 7.0, 6.0, 4.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0], "bins": [-2.013671875, -1.9595947265625, -1.905517578125, -1.8514404296875, -1.79736328125, -1.7432861328125, -1.689208984375, -1.6351318359375, -1.5810546875, -1.5269775390625, -1.472900390625, -1.4188232421875, -1.36474609375, -1.3106689453125, -1.256591796875, -1.2025146484375, -1.1484375, -1.0943603515625, -1.040283203125, -0.9862060546875, -0.93212890625, -0.8780517578125, -0.823974609375, -0.7698974609375, -0.7158203125, -0.6617431640625, -0.607666015625, -0.5535888671875, -0.49951171875, -0.4454345703125, -0.391357421875, -0.3372802734375, -0.283203125, -0.2291259765625, -0.175048828125, -0.1209716796875, -0.06689453125, -0.0128173828125, 0.041259765625, 0.0953369140625, 0.1494140625, 0.2034912109375, 0.257568359375, 0.3116455078125, 0.36572265625, 0.4197998046875, 0.473876953125, 0.5279541015625, 0.58203125, 0.6361083984375, 0.690185546875, 0.7442626953125, 0.79833984375, 0.8524169921875, 0.906494140625, 0.9605712890625, 1.0146484375, 1.0687255859375, 1.122802734375, 1.1768798828125, 1.23095703125, 1.2850341796875, 1.339111328125, 1.3931884765625, 1.447265625]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 8.0, 4.0, 6.0, 21.0, 32.0, 56.0, 75.0, 112.0, 142.0, 102.0, 127.0, 104.0, 88.0, 46.0, 41.0, 19.0, 8.0, 7.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7783203125, -0.7558517456054688, -0.7333831787109375, -0.7109146118164062, -0.688446044921875, -0.6659774780273438, -0.6435089111328125, -0.6210403442382812, -0.59857177734375, -0.5761032104492188, -0.5536346435546875, -0.5311660766601562, -0.508697509765625, -0.48622894287109375, -0.4637603759765625, -0.44129180908203125, -0.4188232421875, -0.39635467529296875, -0.3738861083984375, -0.35141754150390625, -0.328948974609375, -0.30648040771484375, -0.2840118408203125, -0.26154327392578125, -0.23907470703125, -0.21660614013671875, -0.1941375732421875, -0.17166900634765625, -0.149200439453125, -0.12673187255859375, -0.1042633056640625, -0.08179473876953125, -0.059326171875, -0.03685760498046875, -0.0143890380859375, 0.00807952880859375, 0.030548095703125, 0.05301666259765625, 0.0754852294921875, 0.09795379638671875, 0.12042236328125, 0.14289093017578125, 0.1653594970703125, 0.18782806396484375, 0.210296630859375, 0.23276519775390625, 0.2552337646484375, 0.27770233154296875, 0.3001708984375, 0.32263946533203125, 0.3451080322265625, 0.36757659912109375, 0.390045166015625, 0.41251373291015625, 0.4349822998046875, 0.45745086669921875, 0.47991943359375, 0.5023880004882812, 0.5248565673828125, 0.5473251342773438, 0.569793701171875, 0.5922622680664062, 0.6147308349609375, 0.6371994018554688, 0.65966796875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 3.0, 8.0, 6.0, 6.0, 14.0, 27.0, 41.0, 65.0, 92.0, 128.0, 188.0, 429.0, 824.0, 1967.0, 5845.0, 21703.0, 115195.0, 540182.0, 295588.0, 49181.0, 10955.0, 3424.0, 1254.0, 595.0, 307.0, 175.0, 115.0, 83.0, 50.0, 41.0, 20.0, 13.0, 12.0, 5.0, 4.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.181640625, -1.14556884765625, -1.1094970703125, -1.07342529296875, -1.037353515625, -1.00128173828125, -0.9652099609375, -0.92913818359375, -0.89306640625, -0.85699462890625, -0.8209228515625, -0.78485107421875, -0.748779296875, -0.71270751953125, -0.6766357421875, -0.64056396484375, -0.6044921875, -0.56842041015625, -0.5323486328125, -0.49627685546875, -0.460205078125, -0.42413330078125, -0.3880615234375, -0.35198974609375, -0.31591796875, -0.27984619140625, -0.2437744140625, -0.20770263671875, -0.171630859375, -0.13555908203125, -0.0994873046875, -0.06341552734375, -0.02734375, 0.00872802734375, 0.0447998046875, 0.08087158203125, 0.116943359375, 0.15301513671875, 0.1890869140625, 0.22515869140625, 0.26123046875, 0.29730224609375, 0.3333740234375, 0.36944580078125, 0.405517578125, 0.44158935546875, 0.4776611328125, 0.51373291015625, 0.5498046875, 0.58587646484375, 0.6219482421875, 0.65802001953125, 0.694091796875, 0.73016357421875, 0.7662353515625, 0.80230712890625, 0.83837890625, 0.87445068359375, 0.9105224609375, 0.94659423828125, 0.982666015625, 1.01873779296875, 1.0548095703125, 1.09088134765625, 1.126953125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 2.0, 9.0, 5.0, 7.0, 18.0, 14.0, 24.0, 27.0, 38.0, 42.0, 44.0, 53.0, 61.0, 62.0, 69.0, 63.0, 67.0, 67.0, 53.0, 56.0, 49.0, 38.0, 26.0, 22.0, 21.0, 15.0, 14.0, 7.0, 10.0, 7.0, 6.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9267578125, -1.8786163330078125, -1.830474853515625, -1.7823333740234375, -1.73419189453125, -1.6860504150390625, -1.637908935546875, -1.5897674560546875, -1.5416259765625, -1.4934844970703125, -1.445343017578125, -1.3972015380859375, -1.34906005859375, -1.3009185791015625, -1.252777099609375, -1.2046356201171875, -1.156494140625, -1.1083526611328125, -1.060211181640625, -1.0120697021484375, -0.96392822265625, -0.9157867431640625, -0.867645263671875, -0.8195037841796875, -0.7713623046875, -0.7232208251953125, -0.675079345703125, -0.6269378662109375, -0.57879638671875, -0.5306549072265625, -0.482513427734375, -0.4343719482421875, -0.38623046875, -0.3380889892578125, -0.289947509765625, -0.2418060302734375, -0.19366455078125, -0.1455230712890625, -0.097381591796875, -0.0492401123046875, -0.0010986328125, 0.0470428466796875, 0.095184326171875, 0.1433258056640625, 0.19146728515625, 0.2396087646484375, 0.287750244140625, 0.3358917236328125, 0.384033203125, 0.4321746826171875, 0.480316162109375, 0.5284576416015625, 0.57659912109375, 0.6247406005859375, 0.672882080078125, 0.7210235595703125, 0.7691650390625, 0.8173065185546875, 0.865447998046875, 0.9135894775390625, 0.96173095703125, 1.0098724365234375, 1.058013916015625, 1.1061553955078125, 1.154296875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 4.0, 4.0, 3.0, 8.0, 5.0, 12.0, 18.0, 21.0, 17.0, 35.0, 59.0, 76.0, 127.0, 216.0, 371.0, 706.0, 1461.0, 3618.0, 10475.0, 39126.0, 179177.0, 494593.0, 243182.0, 53388.0, 13597.0, 4560.0, 1755.0, 823.0, 415.0, 256.0, 143.0, 108.0, 49.0, 42.0, 33.0, 12.0, 13.0, 14.0, 11.0, 6.0, 6.0, 2.0, 4.0, 1.0, 0.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.384765625, -0.37131500244140625, -0.3578643798828125, -0.34441375732421875, -0.330963134765625, -0.31751251220703125, -0.3040618896484375, -0.29061126708984375, -0.27716064453125, -0.26371002197265625, -0.2502593994140625, -0.23680877685546875, -0.223358154296875, -0.20990753173828125, -0.1964569091796875, -0.18300628662109375, -0.1695556640625, -0.15610504150390625, -0.1426544189453125, -0.12920379638671875, -0.115753173828125, -0.10230255126953125, -0.0888519287109375, -0.07540130615234375, -0.06195068359375, -0.04850006103515625, -0.0350494384765625, -0.02159881591796875, -0.008148193359375, 0.00530242919921875, 0.0187530517578125, 0.03220367431640625, 0.045654296875, 0.05910491943359375, 0.0725555419921875, 0.08600616455078125, 0.099456787109375, 0.11290740966796875, 0.1263580322265625, 0.13980865478515625, 0.15325927734375, 0.16670989990234375, 0.1801605224609375, 0.19361114501953125, 0.207061767578125, 0.22051239013671875, 0.2339630126953125, 0.24741363525390625, 0.2608642578125, 0.27431488037109375, 0.2877655029296875, 0.30121612548828125, 0.314666748046875, 0.32811737060546875, 0.3415679931640625, 0.35501861572265625, 0.36846923828125, 0.38191986083984375, 0.3953704833984375, 0.40882110595703125, 0.422271728515625, 0.43572235107421875, 0.4491729736328125, 0.46262359619140625, 0.47607421875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 3.0, 9.0, 2.0, 9.0, 11.0, 14.0, 29.0, 39.0, 57.0, 57.0, 95.0, 91.0, 111.0, 112.0, 95.0, 73.0, 57.0, 28.0, 33.0, 26.0, 12.0, 13.0, 9.0, 5.0, 5.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011366605758666992, -0.00011045299470424652, -0.00010723993182182312, -0.00010402686893939972, -0.00010081380605697632, -9.760074317455292e-05, -9.438768029212952e-05, -9.117461740970612e-05, -8.796155452728271e-05, -8.474849164485931e-05, -8.153542876243591e-05, -7.832236588001251e-05, -7.510930299758911e-05, -7.189624011516571e-05, -6.868317723274231e-05, -6.547011435031891e-05, -6.225705146789551e-05, -5.904398858547211e-05, -5.5830925703048706e-05, -5.2617862820625305e-05, -4.9404799938201904e-05, -4.6191737055778503e-05, -4.29786741733551e-05, -3.97656112909317e-05, -3.65525484085083e-05, -3.33394855260849e-05, -3.01264226436615e-05, -2.6913359761238098e-05, -2.3700296878814697e-05, -2.0487233996391296e-05, -1.7274171113967896e-05, -1.4061108231544495e-05, -1.0848045349121094e-05, -7.634982466697693e-06, -4.421919584274292e-06, -1.2088567018508911e-06, 2.0042061805725098e-06, 5.217269062995911e-06, 8.430331945419312e-06, 1.1643394827842712e-05, 1.4856457710266113e-05, 1.8069520592689514e-05, 2.1282583475112915e-05, 2.4495646357536316e-05, 2.7708709239959717e-05, 3.092177212238312e-05, 3.413483500480652e-05, 3.734789788722992e-05, 4.056096076965332e-05, 4.377402365207672e-05, 4.698708653450012e-05, 5.020014941692352e-05, 5.3413212299346924e-05, 5.6626275181770325e-05, 5.9839338064193726e-05, 6.305240094661713e-05, 6.626546382904053e-05, 6.947852671146393e-05, 7.269158959388733e-05, 7.590465247631073e-05, 7.911771535873413e-05, 8.233077824115753e-05, 8.554384112358093e-05, 8.875690400600433e-05, 9.196996688842773e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 5.0, 5.0, 10.0, 9.0, 24.0, 42.0, 55.0, 114.0, 209.0, 421.0, 1042.0, 2821.0, 10953.0, 73902.0, 514715.0, 385156.0, 47384.0, 7821.0, 2234.0, 825.0, 373.0, 170.0, 121.0, 52.0, 37.0, 23.0, 8.0, 9.0, 6.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.541015625, -0.5216217041015625, -0.502227783203125, -0.4828338623046875, -0.46343994140625, -0.4440460205078125, -0.424652099609375, -0.4052581787109375, -0.3858642578125, -0.3664703369140625, -0.347076416015625, -0.3276824951171875, -0.30828857421875, -0.2888946533203125, -0.269500732421875, -0.2501068115234375, -0.230712890625, -0.2113189697265625, -0.191925048828125, -0.1725311279296875, -0.15313720703125, -0.1337432861328125, -0.114349365234375, -0.0949554443359375, -0.0755615234375, -0.0561676025390625, -0.036773681640625, -0.0173797607421875, 0.00201416015625, 0.0214080810546875, 0.040802001953125, 0.0601959228515625, 0.07958984375, 0.0989837646484375, 0.118377685546875, 0.1377716064453125, 0.15716552734375, 0.1765594482421875, 0.195953369140625, 0.2153472900390625, 0.2347412109375, 0.2541351318359375, 0.273529052734375, 0.2929229736328125, 0.31231689453125, 0.3317108154296875, 0.351104736328125, 0.3704986572265625, 0.389892578125, 0.4092864990234375, 0.428680419921875, 0.4480743408203125, 0.46746826171875, 0.4868621826171875, 0.506256103515625, 0.5256500244140625, 0.5450439453125, 0.5644378662109375, 0.583831787109375, 0.6032257080078125, 0.62261962890625, 0.6420135498046875, 0.661407470703125, 0.6808013916015625, 0.7001953125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 6.0, 7.0, 9.0, 10.0, 20.0, 26.0, 42.0, 54.0, 86.0, 108.0, 122.0, 134.0, 100.0, 73.0, 59.0, 45.0, 30.0, 19.0, 22.0, 13.0, 3.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.748046875, -0.7260818481445312, -0.7041168212890625, -0.6821517944335938, -0.660186767578125, -0.6382217407226562, -0.6162567138671875, -0.5942916870117188, -0.57232666015625, -0.5503616333007812, -0.5283966064453125, -0.5064315795898438, -0.484466552734375, -0.46250152587890625, -0.4405364990234375, -0.41857147216796875, -0.3966064453125, -0.37464141845703125, -0.3526763916015625, -0.33071136474609375, -0.308746337890625, -0.28678131103515625, -0.2648162841796875, -0.24285125732421875, -0.22088623046875, -0.19892120361328125, -0.1769561767578125, -0.15499114990234375, -0.133026123046875, -0.11106109619140625, -0.0890960693359375, -0.06713104248046875, -0.045166015625, -0.02320098876953125, -0.0012359619140625, 0.02072906494140625, 0.042694091796875, 0.06465911865234375, 0.0866241455078125, 0.10858917236328125, 0.13055419921875, 0.15251922607421875, 0.1744842529296875, 0.19644927978515625, 0.218414306640625, 0.24037933349609375, 0.2623443603515625, 0.28430938720703125, 0.3062744140625, 0.32823944091796875, 0.3502044677734375, 0.37216949462890625, 0.394134521484375, 0.41609954833984375, 0.4380645751953125, 0.46002960205078125, 0.48199462890625, 0.5039596557617188, 0.5259246826171875, 0.5478897094726562, 0.569854736328125, 0.5918197631835938, 0.6137847900390625, 0.6357498168945312, 0.65771484375]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 6.0, 11.0, 16.0, 32.0, 53.0, 97.0, 137.0, 150.0, 149.0, 129.0, 80.0, 62.0, 36.0, 19.0, 14.0, 8.0, 2.0, 7.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.51634407043457, -13.23917007446289, -12.961997032165527, -12.684823036193848, -12.407649040222168, -12.130475997924805, -11.853302001953125, -11.576128005981445, -11.298954963684082, -11.021780967712402, -10.744607925415039, -10.46743392944336, -10.19025993347168, -9.913086891174316, -9.635912895202637, -9.358738899230957, -9.081565856933594, -8.804391860961914, -8.52721881866455, -8.250044822692871, -7.97287130355835, -7.695697784423828, -7.418523788452148, -7.141350269317627, -6.864175796508789, -6.587002277374268, -6.309828281402588, -6.032654762268066, -5.755481243133545, -5.478307723999023, -5.201133728027344, -4.923960208892822, -4.646786689758301, -4.369613170623779, -4.0924391746521, -3.815265655517578, -3.5380921363830566, -3.260918378829956, -2.9837446212768555, -2.706571102142334, -2.4293973445892334, -2.152223587036133, -1.8750500679016113, -1.5978763103485107, -1.3207026720046997, -1.0435290336608887, -0.7663552761077881, -0.48918163776397705, -0.21200799942016602, 0.06516566872596741, 0.34233933687210083, 0.6195130348205566, 0.8966866731643677, 1.1738603115081787, 1.4510340690612793, 1.7282077074050903, 2.0053813457489014, 2.282555103302002, 2.5597286224365234, 2.836902379989624, 3.1140761375427246, 3.391249656677246, 3.6684234142303467, 3.9455971717834473, 4.222770690917969]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 6.0, 5.0, 10.0, 9.0, 20.0, 14.0, 11.0, 22.0, 27.0, 14.0, 21.0, 29.0, 26.0, 35.0, 34.0, 41.0, 47.0, 41.0, 51.0, 42.0, 49.0, 58.0, 52.0, 34.0, 26.0, 31.0, 34.0, 25.0, 27.0, 21.0, 16.0, 17.0, 14.0, 9.0, 17.0, 14.0, 15.0, 8.0, 5.0, 8.0, 5.0, 3.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-6.450253486633301, -6.266421794891357, -6.082590103149414, -5.898758888244629, -5.7149271965026855, -5.531095504760742, -5.347263813018799, -5.1634321212768555, -4.97960090637207, -4.795769214630127, -4.611937522888184, -4.428106307983398, -4.244274616241455, -4.060442924499512, -3.8766112327575684, -3.692779541015625, -3.5089478492736816, -3.3251161575317383, -3.141284704208374, -2.9574530124664307, -2.7736215591430664, -2.589789867401123, -2.4059581756591797, -2.2221264839172363, -2.038295030593872, -1.8544634580612183, -1.6706318855285645, -1.486800193786621, -1.3029686212539673, -1.1191370487213135, -0.9353053569793701, -0.7514737844467163, -0.5676422119140625, -0.3838106095790863, -0.1999790072441101, -0.016147375106811523, 0.16768419742584229, 0.3515157699584961, 0.5353474617004395, 0.7191790342330933, 0.9030106067657471, 1.0868421792984009, 1.2706737518310547, 1.454505443572998, 1.6383370161056519, 1.8221685886383057, 2.006000280380249, 2.1898317337036133, 2.3736634254455566, 2.5574951171875, 2.7413265705108643, 2.9251582622528076, 3.108989715576172, 3.2928214073181152, 3.4766530990600586, 3.660484790802002, 3.844316244125366, 4.0281476974487305, 4.211979389190674, 4.395811080932617, 4.5796427726745605, 4.763474464416504, 4.947305679321289, 5.131137371063232, 5.314969062805176]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 7.0, 3.0, 7.0, 13.0, 18.0, 29.0, 38.0, 58.0, 117.0, 169.0, 351.0, 825.0, 3324.0, 32504.0, 4142067.0, 11544.0, 1880.0, 604.0, 289.0, 182.0, 83.0, 62.0, 38.0, 22.0, 14.0, 17.0, 7.0, 6.0, 8.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.44921875, -5.323455810546875, -5.19769287109375, -5.071929931640625, -4.9461669921875, -4.820404052734375, -4.69464111328125, -4.568878173828125, -4.443115234375, -4.317352294921875, -4.19158935546875, -4.065826416015625, -3.9400634765625, -3.814300537109375, -3.68853759765625, -3.562774658203125, -3.43701171875, -3.311248779296875, -3.18548583984375, -3.059722900390625, -2.9339599609375, -2.808197021484375, -2.68243408203125, -2.556671142578125, -2.430908203125, -2.305145263671875, -2.17938232421875, -2.053619384765625, -1.9278564453125, -1.802093505859375, -1.67633056640625, -1.550567626953125, -1.4248046875, -1.299041748046875, -1.17327880859375, -1.047515869140625, -0.9217529296875, -0.795989990234375, -0.67022705078125, -0.544464111328125, -0.418701171875, -0.292938232421875, -0.16717529296875, -0.041412353515625, 0.0843505859375, 0.210113525390625, 0.33587646484375, 0.461639404296875, 0.58740234375, 0.713165283203125, 0.83892822265625, 0.964691162109375, 1.0904541015625, 1.216217041015625, 1.34197998046875, 1.467742919921875, 1.593505859375, 1.719268798828125, 1.84503173828125, 1.970794677734375, 2.0965576171875, 2.222320556640625, 2.34808349609375, 2.473846435546875, 2.599609375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 11.0, 8.0, 22.0, 36.0, 55.0, 67.0, 102.0, 106.0, 107.0, 113.0, 104.0, 94.0, 67.0, 42.0, 22.0, 15.0, 13.0, 11.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8203125, -0.7968292236328125, -0.773345947265625, -0.7498626708984375, -0.72637939453125, -0.7028961181640625, -0.679412841796875, -0.6559295654296875, -0.6324462890625, -0.6089630126953125, -0.585479736328125, -0.5619964599609375, -0.53851318359375, -0.5150299072265625, -0.491546630859375, -0.4680633544921875, -0.444580078125, -0.4210968017578125, -0.397613525390625, -0.3741302490234375, -0.35064697265625, -0.3271636962890625, -0.303680419921875, -0.2801971435546875, -0.2567138671875, -0.2332305908203125, -0.209747314453125, -0.1862640380859375, -0.16278076171875, -0.1392974853515625, -0.115814208984375, -0.0923309326171875, -0.06884765625, -0.0453643798828125, -0.021881103515625, 0.0016021728515625, 0.02508544921875, 0.0485687255859375, 0.072052001953125, 0.0955352783203125, 0.1190185546875, 0.1425018310546875, 0.165985107421875, 0.1894683837890625, 0.21295166015625, 0.2364349365234375, 0.259918212890625, 0.2834014892578125, 0.306884765625, 0.3303680419921875, 0.353851318359375, 0.3773345947265625, 0.40081787109375, 0.4243011474609375, 0.447784423828125, 0.4712677001953125, 0.4947509765625, 0.5182342529296875, 0.541717529296875, 0.5652008056640625, 0.58868408203125, 0.6121673583984375, 0.635650634765625, 0.6591339111328125, 0.6826171875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 8.0, 5.0, 6.0, 9.0, 11.0, 16.0, 23.0, 37.0, 46.0, 61.0, 74.0, 74.0, 101.0, 172.0, 246.0, 457.0, 1010.0, 3111.0, 14192.0, 3940284.0, 218498.0, 10944.0, 2557.0, 970.0, 436.0, 252.0, 171.0, 94.0, 83.0, 92.0, 54.0, 40.0, 37.0, 31.0, 20.0, 14.0, 9.0, 6.0, 10.0, 8.0, 4.0, 3.0, 2.0, 3.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0, -1.92572021484375, -1.8514404296875, -1.77716064453125, -1.702880859375, -1.62860107421875, -1.5543212890625, -1.48004150390625, -1.40576171875, -1.33148193359375, -1.2572021484375, -1.18292236328125, -1.108642578125, -1.03436279296875, -0.9600830078125, -0.88580322265625, -0.8115234375, -0.73724365234375, -0.6629638671875, -0.58868408203125, -0.514404296875, -0.44012451171875, -0.3658447265625, -0.29156494140625, -0.21728515625, -0.14300537109375, -0.0687255859375, 0.00555419921875, 0.079833984375, 0.15411376953125, 0.2283935546875, 0.30267333984375, 0.376953125, 0.45123291015625, 0.5255126953125, 0.59979248046875, 0.674072265625, 0.74835205078125, 0.8226318359375, 0.89691162109375, 0.97119140625, 1.04547119140625, 1.1197509765625, 1.19403076171875, 1.268310546875, 1.34259033203125, 1.4168701171875, 1.49114990234375, 1.5654296875, 1.63970947265625, 1.7139892578125, 1.78826904296875, 1.862548828125, 1.93682861328125, 2.0111083984375, 2.08538818359375, 2.15966796875, 2.23394775390625, 2.3082275390625, 2.38250732421875, 2.456787109375, 2.53106689453125, 2.6053466796875, 2.67962646484375, 2.75390625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 9.0, 32.0, 65.0, 3523.0, 353.0, 55.0, 18.0, 8.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1925048828125, -0.1731243133544922, -0.15374374389648438, -0.13436317443847656, -0.11498260498046875, -0.09560203552246094, -0.07622146606445312, -0.05684089660644531, -0.0374603271484375, -0.018079757690429688, 0.001300811767578125, 0.020681381225585938, 0.04006195068359375, 0.05944252014160156, 0.07882308959960938, 0.09820365905761719, 0.117584228515625, 0.1369647979736328, 0.15634536743164062, 0.17572593688964844, 0.19510650634765625, 0.21448707580566406, 0.23386764526367188, 0.2532482147216797, 0.2726287841796875, 0.2920093536376953, 0.3113899230957031, 0.33077049255371094, 0.35015106201171875, 0.36953163146972656, 0.3889122009277344, 0.4082927703857422, 0.42767333984375, 0.4470539093017578, 0.4664344787597656, 0.48581504821777344, 0.5051956176757812, 0.5245761871337891, 0.5439567565917969, 0.5633373260498047, 0.5827178955078125, 0.6020984649658203, 0.6214790344238281, 0.6408596038818359, 0.6602401733398438, 0.6796207427978516, 0.6990013122558594, 0.7183818817138672, 0.737762451171875, 0.7571430206298828, 0.7765235900878906, 0.7959041595458984, 0.8152847290039062, 0.8346652984619141, 0.8540458679199219, 0.8734264373779297, 0.8928070068359375, 0.9121875762939453, 0.9315681457519531, 0.9509487152099609, 0.9703292846679688, 0.9897098541259766, 1.0090904235839844, 1.0284709930419922, 1.0478515625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 4.0, 7.0, 28.0, 38.0, 94.0, 142.0, 173.0, 193.0, 127.0, 87.0, 48.0, 27.0, 15.0, 6.0, 12.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6181740760803223, -1.5613782405853271, -1.5045825242996216, -1.4477866888046265, -1.390990972518921, -1.3341951370239258, -1.2773993015289307, -1.2206034660339355, -1.16380774974823, -1.1070119142532349, -1.0502161979675293, -0.9934203624725342, -0.9366245865821838, -0.8798288106918335, -0.8230329751968384, -0.766237199306488, -0.7094414234161377, -0.6526456475257874, -0.595849871635437, -0.5390540361404419, -0.48225826025009155, -0.4254624843597412, -0.3686666786670685, -0.31187087297439575, -0.2550750970840454, -0.19827930629253387, -0.14148351550102234, -0.0846877247095108, -0.027891933917999268, 0.028903841972351074, 0.0856996476650238, 0.14249545335769653, 0.19929122924804688, 0.2560870051383972, 0.31288281083106995, 0.3696786165237427, 0.426474392414093, 0.48327016830444336, 0.5400660037994385, 0.5968617796897888, 0.6536575555801392, 0.7104533314704895, 0.7672491073608398, 0.824044942855835, 0.8808407187461853, 0.9376364946365356, 0.9944323301315308, 1.0512280464172363, 1.1080238819122314, 1.1648197174072266, 1.2216154336929321, 1.2784112691879272, 1.3352069854736328, 1.392002820968628, 1.448798656463623, 1.5055944919586182, 1.5623902082443237, 1.6191860437393188, 1.6759817600250244, 1.7327775955200195, 1.7895734310150146, 1.8463691473007202, 1.9031649827957153, 1.959960699081421, 2.016756534576416]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 9.0, 9.0, 9.0, 15.0, 16.0, 14.0, 25.0, 30.0, 28.0, 42.0, 27.0, 36.0, 37.0, 35.0, 39.0, 41.0, 51.0, 45.0, 51.0, 51.0, 37.0, 45.0, 40.0, 39.0, 35.0, 29.0, 26.0, 18.0, 26.0, 20.0, 17.0, 15.0, 12.0, 7.0, 6.0, 6.0, 2.0, 3.0, 5.0, 1.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.782922625541687, -0.7577028870582581, -0.7324832081794739, -0.7072634696960449, -0.682043731212616, -0.656823992729187, -0.6316043138504028, -0.6063845753669739, -0.5811648368835449, -0.555945098400116, -0.5307254195213318, -0.5055056810379028, -0.4802859425544739, -0.4550662338733673, -0.42984652519226074, -0.4046267867088318, -0.3794070780277252, -0.35418736934661865, -0.3289676308631897, -0.30374792218208313, -0.2785281836986542, -0.2533084750175476, -0.22808875143527985, -0.20286902785301208, -0.17764930427074432, -0.15242958068847656, -0.1272098571062088, -0.10199014097452164, -0.07677041739225388, -0.05155070126056671, -0.02633097767829895, -0.001111254096031189, 0.024108469486236572, 0.049328193068504333, 0.0745479166507721, 0.09976763278245926, 0.12498735636472702, 0.15020707249641418, 0.17542679607868195, 0.2006465196609497, 0.22586624324321747, 0.25108596682548523, 0.2763056755065918, 0.30152541399002075, 0.3267451226711273, 0.3519648313522339, 0.37718456983566284, 0.4024043083190918, 0.42762401700019836, 0.45284372568130493, 0.4780634641647339, 0.5032832026481628, 0.528502881526947, 0.553722620010376, 0.5789423584938049, 0.6041620969772339, 0.6293817758560181, 0.654601514339447, 0.6798211932182312, 0.7050409317016602, 0.7302606701850891, 0.7554804086685181, 0.7807000875473022, 0.8059198260307312, 0.8311395645141602]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 8.0, 10.0, 12.0, 25.0, 48.0, 81.0, 128.0, 223.0, 456.0, 881.0, 2001.0, 6031.0, 32415.0, 244881.0, 587826.0, 146298.0, 19596.0, 4355.0, 1599.0, 754.0, 412.0, 207.0, 122.0, 83.0, 41.0, 23.0, 12.0, 12.0, 6.0, 4.0, 1.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.08984375, -2.0290374755859375, -1.968231201171875, -1.9074249267578125, -1.84661865234375, -1.7858123779296875, -1.725006103515625, -1.6641998291015625, -1.6033935546875, -1.5425872802734375, -1.481781005859375, -1.4209747314453125, -1.36016845703125, -1.2993621826171875, -1.238555908203125, -1.1777496337890625, -1.116943359375, -1.0561370849609375, -0.995330810546875, -0.9345245361328125, -0.87371826171875, -0.8129119873046875, -0.752105712890625, -0.6912994384765625, -0.6304931640625, -0.5696868896484375, -0.508880615234375, -0.4480743408203125, -0.38726806640625, -0.3264617919921875, -0.265655517578125, -0.2048492431640625, -0.14404296875, -0.0832366943359375, -0.022430419921875, 0.0383758544921875, 0.09918212890625, 0.1599884033203125, 0.220794677734375, 0.2816009521484375, 0.3424072265625, 0.4032135009765625, 0.464019775390625, 0.5248260498046875, 0.58563232421875, 0.6464385986328125, 0.707244873046875, 0.7680511474609375, 0.828857421875, 0.8896636962890625, 0.950469970703125, 1.0112762451171875, 1.07208251953125, 1.1328887939453125, 1.193695068359375, 1.2545013427734375, 1.3153076171875, 1.3761138916015625, 1.436920166015625, 1.4977264404296875, 1.55853271484375, 1.6193389892578125, 1.680145263671875, 1.7409515380859375, 1.8017578125]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 16.0, 18.0, 24.0, 35.0, 56.0, 72.0, 86.0, 99.0, 110.0, 86.0, 91.0, 79.0, 67.0, 52.0, 39.0, 28.0, 13.0, 15.0, 2.0, 5.0, 6.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.822265625, -0.7988052368164062, -0.7753448486328125, -0.7518844604492188, -0.728424072265625, -0.7049636840820312, -0.6815032958984375, -0.6580429077148438, -0.63458251953125, -0.6111221313476562, -0.5876617431640625, -0.5642013549804688, -0.540740966796875, -0.5172805786132812, -0.4938201904296875, -0.47035980224609375, -0.4468994140625, -0.42343902587890625, -0.3999786376953125, -0.37651824951171875, -0.353057861328125, -0.32959747314453125, -0.3061370849609375, -0.28267669677734375, -0.25921630859375, -0.23575592041015625, -0.2122955322265625, -0.18883514404296875, -0.165374755859375, -0.14191436767578125, -0.1184539794921875, -0.09499359130859375, -0.071533203125, -0.04807281494140625, -0.0246124267578125, -0.00115203857421875, 0.022308349609375, 0.04576873779296875, 0.0692291259765625, 0.09268951416015625, 0.11614990234375, 0.13961029052734375, 0.1630706787109375, 0.18653106689453125, 0.209991455078125, 0.23345184326171875, 0.2569122314453125, 0.28037261962890625, 0.3038330078125, 0.32729339599609375, 0.3507537841796875, 0.37421417236328125, 0.397674560546875, 0.42113494873046875, 0.4445953369140625, 0.46805572509765625, 0.49151611328125, 0.5149765014648438, 0.5384368896484375, 0.5618972778320312, 0.585357666015625, 0.6088180541992188, 0.6322784423828125, 0.6557388305664062, 0.67919921875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 7.0, 4.0, 10.0, 15.0, 15.0, 21.0, 21.0, 29.0, 39.0, 43.0, 83.0, 91.0, 130.0, 212.0, 305.0, 492.0, 983.0, 1893.0, 4123.0, 10051.0, 26722.0, 76251.0, 218860.0, 392576.0, 202971.0, 70345.0, 24795.0, 9361.0, 3849.0, 1796.0, 977.0, 543.0, 307.0, 184.0, 127.0, 77.0, 52.0, 51.0, 44.0, 34.0, 19.0, 12.0, 10.0, 11.0, 6.0, 6.0, 3.0, 1.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.76416015625, -0.73907470703125, -0.7139892578125, -0.68890380859375, -0.663818359375, -0.63873291015625, -0.6136474609375, -0.58856201171875, -0.5634765625, -0.53839111328125, -0.5133056640625, -0.48822021484375, -0.463134765625, -0.43804931640625, -0.4129638671875, -0.38787841796875, -0.36279296875, -0.33770751953125, -0.3126220703125, -0.28753662109375, -0.262451171875, -0.23736572265625, -0.2122802734375, -0.18719482421875, -0.162109375, -0.13702392578125, -0.1119384765625, -0.08685302734375, -0.061767578125, -0.03668212890625, -0.0115966796875, 0.01348876953125, 0.03857421875, 0.06365966796875, 0.0887451171875, 0.11383056640625, 0.138916015625, 0.16400146484375, 0.1890869140625, 0.21417236328125, 0.2392578125, 0.26434326171875, 0.2894287109375, 0.31451416015625, 0.339599609375, 0.36468505859375, 0.3897705078125, 0.41485595703125, 0.43994140625, 0.46502685546875, 0.4901123046875, 0.51519775390625, 0.540283203125, 0.56536865234375, 0.5904541015625, 0.61553955078125, 0.640625, 0.66571044921875, 0.6907958984375, 0.71588134765625, 0.740966796875, 0.76605224609375, 0.7911376953125, 0.81622314453125, 0.84130859375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 5.0, 1.0, 5.0, 2.0, 3.0, 7.0, 9.0, 10.0, 11.0, 14.0, 24.0, 19.0, 26.0, 28.0, 38.0, 34.0, 44.0, 34.0, 53.0, 39.0, 59.0, 41.0, 39.0, 57.0, 51.0, 51.0, 43.0, 38.0, 35.0, 25.0, 26.0, 23.0, 14.0, 23.0, 17.0, 13.0, 12.0, 6.0, 7.0, 6.0, 6.0, 5.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.505859375, -1.453125, -1.400390625, -1.34765625, -1.294921875, -1.2421875, -1.189453125, -1.13671875, -1.083984375, -1.03125, -0.978515625, -0.92578125, -0.873046875, -0.8203125, -0.767578125, -0.71484375, -0.662109375, -0.609375, -0.556640625, -0.50390625, -0.451171875, -0.3984375, -0.345703125, -0.29296875, -0.240234375, -0.1875, -0.134765625, -0.08203125, -0.029296875, 0.0234375, 0.076171875, 0.12890625, 0.181640625, 0.234375, 0.287109375, 0.33984375, 0.392578125, 0.4453125, 0.498046875, 0.55078125, 0.603515625, 0.65625, 0.708984375, 0.76171875, 0.814453125, 0.8671875, 0.919921875, 0.97265625, 1.025390625, 1.078125, 1.130859375, 1.18359375, 1.236328125, 1.2890625, 1.341796875, 1.39453125, 1.447265625, 1.5, 1.552734375, 1.60546875, 1.658203125, 1.7109375, 1.763671875, 1.81640625, 1.869140625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 7.0, 16.0, 30.0, 50.0, 77.0, 192.0, 545.0, 3599.0, 164118.0, 868558.0, 9865.0, 965.0, 284.0, 120.0, 53.0, 36.0, 12.0, 9.0, 6.0, 8.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.59375, -1.52191162109375, -1.4500732421875, -1.37823486328125, -1.306396484375, -1.23455810546875, -1.1627197265625, -1.09088134765625, -1.01904296875, -0.94720458984375, -0.8753662109375, -0.80352783203125, -0.731689453125, -0.65985107421875, -0.5880126953125, -0.51617431640625, -0.4443359375, -0.37249755859375, -0.3006591796875, -0.22882080078125, -0.156982421875, -0.08514404296875, -0.0133056640625, 0.05853271484375, 0.13037109375, 0.20220947265625, 0.2740478515625, 0.34588623046875, 0.417724609375, 0.48956298828125, 0.5614013671875, 0.63323974609375, 0.705078125, 0.77691650390625, 0.8487548828125, 0.92059326171875, 0.992431640625, 1.06427001953125, 1.1361083984375, 1.20794677734375, 1.27978515625, 1.35162353515625, 1.4234619140625, 1.49530029296875, 1.567138671875, 1.63897705078125, 1.7108154296875, 1.78265380859375, 1.8544921875, 1.92633056640625, 1.9981689453125, 2.07000732421875, 2.141845703125, 2.21368408203125, 2.2855224609375, 2.35736083984375, 2.42919921875, 2.50103759765625, 2.5728759765625, 2.64471435546875, 2.716552734375, 2.78839111328125, 2.8602294921875, 2.93206787109375, 3.00390625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 6.0, 2.0, 4.0, 2.0, 2.0, 7.0, 9.0, 7.0, 16.0, 11.0, 19.0, 19.0, 29.0, 35.0, 50.0, 61.0, 53.0, 66.0, 89.0, 78.0, 78.0, 69.0, 48.0, 63.0, 43.0, 26.0, 25.0, 21.0, 14.0, 11.0, 13.0, 3.0, 5.0, 2.0, 8.0, 5.0, 2.0, 2.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.666515350341797e-05, -8.389260619878769e-05, -8.112005889415741e-05, -7.834751158952713e-05, -7.557496428489685e-05, -7.280241698026657e-05, -7.002986967563629e-05, -6.725732237100601e-05, -6.448477506637573e-05, -6.171222776174545e-05, -5.893968045711517e-05, -5.6167133152484894e-05, -5.3394585847854614e-05, -5.0622038543224335e-05, -4.7849491238594055e-05, -4.5076943933963776e-05, -4.2304396629333496e-05, -3.9531849324703217e-05, -3.675930202007294e-05, -3.398675471544266e-05, -3.121420741081238e-05, -2.84416601061821e-05, -2.566911280155182e-05, -2.289656549692154e-05, -2.012401819229126e-05, -1.735147088766098e-05, -1.45789235830307e-05, -1.1806376278400421e-05, -9.033828973770142e-06, -6.261281669139862e-06, -3.4887343645095825e-06, -7.16187059879303e-07, 2.0563602447509766e-06, 4.828907549381256e-06, 7.601454854011536e-06, 1.0374002158641815e-05, 1.3146549463272095e-05, 1.5919096767902374e-05, 1.8691644072532654e-05, 2.1464191377162933e-05, 2.4236738681793213e-05, 2.7009285986423492e-05, 2.9781833291053772e-05, 3.255438059568405e-05, 3.532692790031433e-05, 3.809947520494461e-05, 4.087202250957489e-05, 4.364456981420517e-05, 4.641711711883545e-05, 4.918966442346573e-05, 5.196221172809601e-05, 5.473475903272629e-05, 5.750730633735657e-05, 6.027985364198685e-05, 6.305240094661713e-05, 6.58249482512474e-05, 6.859749555587769e-05, 7.137004286050797e-05, 7.414259016513824e-05, 7.691513746976852e-05, 7.96876847743988e-05, 8.246023207902908e-05, 8.523277938365936e-05, 8.800532668828964e-05, 9.077787399291992e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 6.0, 3.0, 16.0, 14.0, 28.0, 38.0, 84.0, 173.0, 348.0, 800.0, 2114.0, 7382.0, 37640.0, 349258.0, 570353.0, 64709.0, 10756.0, 2882.0, 1039.0, 420.0, 218.0, 116.0, 60.0, 26.0, 20.0, 14.0, 8.0, 12.0, 4.0, 2.0, 3.0, 3.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.947265625, -0.9203033447265625, -0.893341064453125, -0.8663787841796875, -0.83941650390625, -0.8124542236328125, -0.785491943359375, -0.7585296630859375, -0.7315673828125, -0.7046051025390625, -0.677642822265625, -0.6506805419921875, -0.62371826171875, -0.5967559814453125, -0.569793701171875, -0.5428314208984375, -0.515869140625, -0.4889068603515625, -0.461944580078125, -0.4349822998046875, -0.40802001953125, -0.3810577392578125, -0.354095458984375, -0.3271331787109375, -0.3001708984375, -0.2732086181640625, -0.246246337890625, -0.2192840576171875, -0.19232177734375, -0.1653594970703125, -0.138397216796875, -0.1114349365234375, -0.08447265625, -0.0575103759765625, -0.030548095703125, -0.0035858154296875, 0.02337646484375, 0.0503387451171875, 0.077301025390625, 0.1042633056640625, 0.1312255859375, 0.1581878662109375, 0.185150146484375, 0.2121124267578125, 0.23907470703125, 0.2660369873046875, 0.292999267578125, 0.3199615478515625, 0.346923828125, 0.3738861083984375, 0.400848388671875, 0.4278106689453125, 0.45477294921875, 0.4817352294921875, 0.508697509765625, 0.5356597900390625, 0.5626220703125, 0.5895843505859375, 0.616546630859375, 0.6435089111328125, 0.67047119140625, 0.6974334716796875, 0.724395751953125, 0.7513580322265625, 0.7783203125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 3.0, 3.0, 0.0, 2.0, 4.0, 8.0, 7.0, 20.0, 17.0, 25.0, 43.0, 74.0, 114.0, 125.0, 144.0, 116.0, 103.0, 72.0, 42.0, 32.0, 21.0, 10.0, 4.0, 2.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2060546875, -1.166412353515625, -1.12677001953125, -1.087127685546875, -1.0474853515625, -1.007843017578125, -0.96820068359375, -0.928558349609375, -0.888916015625, -0.849273681640625, -0.80963134765625, -0.769989013671875, -0.7303466796875, -0.690704345703125, -0.65106201171875, -0.611419677734375, -0.57177734375, -0.532135009765625, -0.49249267578125, -0.452850341796875, -0.4132080078125, -0.373565673828125, -0.33392333984375, -0.294281005859375, -0.254638671875, -0.214996337890625, -0.17535400390625, -0.135711669921875, -0.0960693359375, -0.056427001953125, -0.01678466796875, 0.022857666015625, 0.0625, 0.102142333984375, 0.14178466796875, 0.181427001953125, 0.2210693359375, 0.260711669921875, 0.30035400390625, 0.339996337890625, 0.379638671875, 0.419281005859375, 0.45892333984375, 0.498565673828125, 0.5382080078125, 0.577850341796875, 0.61749267578125, 0.657135009765625, 0.69677734375, 0.736419677734375, 0.77606201171875, 0.815704345703125, 0.8553466796875, 0.894989013671875, 0.93463134765625, 0.974273681640625, 1.013916015625, 1.053558349609375, 1.09320068359375, 1.132843017578125, 1.1724853515625, 1.212127685546875, 1.25177001953125, 1.291412353515625, 1.3310546875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 6.0, 9.0, 8.0, 27.0, 36.0, 63.0, 112.0, 140.0, 155.0, 146.0, 110.0, 78.0, 47.0, 33.0, 24.0, 11.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.92661190032959, -4.4984130859375, -4.07021427154541, -3.6420156955718994, -3.2138168811798096, -2.7856180667877197, -2.357419490814209, -1.9292206764221191, -1.5010218620300293, -1.0728230476379395, -0.6446243524551392, -0.21642565727233887, 0.21177315711975098, 0.6399719715118408, 1.0681705474853516, 1.4963693618774414, 1.9245681762695312, 2.352766990661621, 2.780965805053711, 3.2091643810272217, 3.6373631954193115, 4.0655622482299805, 4.493760585784912, 4.921959400177002, 5.350158214569092, 5.778357028961182, 6.2065558433532715, 6.634754180908203, 7.062952995300293, 7.491151809692383, 7.919350624084473, 8.347549438476562, 8.775747299194336, 9.203946113586426, 9.632144927978516, 10.060343742370605, 10.488542556762695, 10.916741371154785, 11.344940185546875, 11.773138046264648, 12.201337814331055, 12.629536628723145, 13.057735443115234, 13.485934257507324, 13.914133071899414, 14.342331886291504, 14.770530700683594, 15.198728561401367, 15.626927375793457, 16.055126190185547, 16.48332405090332, 16.911523818969727, 17.3397216796875, 17.767921447753906, 18.19611930847168, 18.624319076538086, 19.05251693725586, 19.480714797973633, 19.90891456604004, 20.337112426757812, 20.76531219482422, 21.193510055541992, 21.6217098236084, 22.049907684326172, 22.478107452392578]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 6.0, 5.0, 5.0, 7.0, 4.0, 4.0, 4.0, 13.0, 18.0, 16.0, 17.0, 22.0, 28.0, 28.0, 28.0, 26.0, 42.0, 39.0, 39.0, 41.0, 40.0, 48.0, 56.0, 41.0, 51.0, 39.0, 40.0, 51.0, 36.0, 32.0, 27.0, 25.0, 26.0, 19.0, 19.0, 9.0, 6.0, 10.0, 9.0, 6.0, 4.0, 5.0, 9.0, 6.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.880712509155273, -8.599197387695312, -8.317683219909668, -8.036168098449707, -7.754653453826904, -7.473138809204102, -7.191623687744141, -6.910109043121338, -6.628594398498535, -6.347079753875732, -6.06556510925293, -5.784049987792969, -5.502535343170166, -5.221020698547363, -4.939505577087402, -4.6579909324646, -4.376476287841797, -4.094961643218994, -3.8134467601776123, -3.5319318771362305, -3.2504172325134277, -2.968902587890625, -2.687387704849243, -2.4058728218078613, -2.1243581771850586, -1.8428434133529663, -1.561328649520874, -1.2798138856887817, -0.9982991218566895, -0.7167843580245972, -0.4352695941925049, -0.1537548303604126, 0.1277608871459961, 0.4092756509780884, 0.6907904148101807, 0.972305178642273, 1.2538199424743652, 1.5353347063064575, 1.8168494701385498, 2.0983643531799316, 2.3798789978027344, 2.661393642425537, 2.942908525466919, 3.224423408508301, 3.5059380531311035, 3.7874526977539062, 4.068967819213867, 4.35048246383667, 4.631997108459473, 4.913511753082275, 5.195026397705078, 5.476541519165039, 5.758056163787842, 6.0395708084106445, 6.3210859298706055, 6.602600574493408, 6.884115219116211, 7.165629863739014, 7.447144508361816, 7.728659629821777, 8.010173797607422, 8.291688919067383, 8.573204040527344, 8.854718208312988, 9.13623332977295]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 8.0, 9.0, 9.0, 20.0, 38.0, 59.0, 90.0, 172.0, 309.0, 572.0, 1179.0, 3188.0, 10581.0, 58461.0, 4036051.0, 66516.0, 11208.0, 3254.0, 1253.0, 566.0, 295.0, 182.0, 81.0, 70.0, 34.0, 29.0, 16.0, 8.0, 8.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.515625, -2.4519805908203125, -2.388336181640625, -2.3246917724609375, -2.26104736328125, -2.1974029541015625, -2.133758544921875, -2.0701141357421875, -2.0064697265625, -1.9428253173828125, -1.879180908203125, -1.8155364990234375, -1.75189208984375, -1.6882476806640625, -1.624603271484375, -1.5609588623046875, -1.497314453125, -1.4336700439453125, -1.370025634765625, -1.3063812255859375, -1.24273681640625, -1.1790924072265625, -1.115447998046875, -1.0518035888671875, -0.9881591796875, -0.9245147705078125, -0.860870361328125, -0.7972259521484375, -0.73358154296875, -0.6699371337890625, -0.606292724609375, -0.5426483154296875, -0.47900390625, -0.4153594970703125, -0.351715087890625, -0.2880706787109375, -0.22442626953125, -0.1607818603515625, -0.097137451171875, -0.0334930419921875, 0.0301513671875, 0.0937957763671875, 0.157440185546875, 0.2210845947265625, 0.28472900390625, 0.3483734130859375, 0.412017822265625, 0.4756622314453125, 0.539306640625, 0.6029510498046875, 0.666595458984375, 0.7302398681640625, 0.79388427734375, 0.8575286865234375, 0.921173095703125, 0.9848175048828125, 1.0484619140625, 1.1121063232421875, 1.175750732421875, 1.2393951416015625, 1.30303955078125, 1.3666839599609375, 1.430328369140625, 1.4939727783203125, 1.5576171875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 6.0, 5.0, 13.0, 16.0, 24.0, 33.0, 41.0, 47.0, 56.0, 93.0, 75.0, 93.0, 96.0, 66.0, 85.0, 74.0, 54.0, 39.0, 27.0, 15.0, 16.0, 14.0, 6.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.82177734375, -0.7982406616210938, -0.7747039794921875, -0.7511672973632812, -0.727630615234375, -0.7040939331054688, -0.6805572509765625, -0.6570205688476562, -0.63348388671875, -0.6099472045898438, -0.5864105224609375, -0.5628738403320312, -0.539337158203125, -0.5158004760742188, -0.4922637939453125, -0.46872711181640625, -0.4451904296875, -0.42165374755859375, -0.3981170654296875, -0.37458038330078125, -0.351043701171875, -0.32750701904296875, -0.3039703369140625, -0.28043365478515625, -0.25689697265625, -0.23336029052734375, -0.2098236083984375, -0.18628692626953125, -0.162750244140625, -0.13921356201171875, -0.1156768798828125, -0.09214019775390625, -0.068603515625, -0.04506683349609375, -0.0215301513671875, 0.00200653076171875, 0.025543212890625, 0.04907989501953125, 0.0726165771484375, 0.09615325927734375, 0.11968994140625, 0.14322662353515625, 0.1667633056640625, 0.19029998779296875, 0.213836669921875, 0.23737335205078125, 0.2609100341796875, 0.28444671630859375, 0.3079833984375, 0.33152008056640625, 0.3550567626953125, 0.37859344482421875, 0.402130126953125, 0.42566680908203125, 0.4492034912109375, 0.47274017333984375, 0.49627685546875, 0.5198135375976562, 0.5433502197265625, 0.5668869018554688, 0.590423583984375, 0.6139602661132812, 0.6374969482421875, 0.6610336303710938, 0.6845703125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 0.0, 1.0, 3.0, 7.0, 7.0, 7.0, 14.0, 21.0, 12.0, 27.0, 25.0, 32.0, 47.0, 68.0, 78.0, 134.0, 165.0, 196.0, 289.0, 407.0, 560.0, 922.0, 1607.0, 2966.0, 5980.0, 14054.0, 45808.0, 389918.0, 3640810.0, 58188.0, 16915.0, 6775.0, 3324.0, 1687.0, 1042.0, 608.0, 435.0, 284.0, 192.0, 164.0, 123.0, 68.0, 71.0, 56.0, 48.0, 36.0, 37.0, 14.0, 18.0, 8.0, 11.0, 9.0, 0.0, 2.0, 6.0, 0.0, 4.0, 4.0, 0.0, 0.0, 3.0], "bins": [-1.306640625, -1.2646026611328125, -1.222564697265625, -1.1805267333984375, -1.13848876953125, -1.0964508056640625, -1.054412841796875, -1.0123748779296875, -0.9703369140625, -0.9282989501953125, -0.886260986328125, -0.8442230224609375, -0.80218505859375, -0.7601470947265625, -0.718109130859375, -0.6760711669921875, -0.634033203125, -0.5919952392578125, -0.549957275390625, -0.5079193115234375, -0.46588134765625, -0.4238433837890625, -0.381805419921875, -0.3397674560546875, -0.2977294921875, -0.2556915283203125, -0.213653564453125, -0.1716156005859375, -0.12957763671875, -0.0875396728515625, -0.045501708984375, -0.0034637451171875, 0.03857421875, 0.0806121826171875, 0.122650146484375, 0.1646881103515625, 0.20672607421875, 0.2487640380859375, 0.290802001953125, 0.3328399658203125, 0.3748779296875, 0.4169158935546875, 0.458953857421875, 0.5009918212890625, 0.54302978515625, 0.5850677490234375, 0.627105712890625, 0.6691436767578125, 0.711181640625, 0.7532196044921875, 0.795257568359375, 0.8372955322265625, 0.87933349609375, 0.9213714599609375, 0.963409423828125, 1.0054473876953125, 1.0474853515625, 1.0895233154296875, 1.131561279296875, 1.1735992431640625, 1.21563720703125, 1.2576751708984375, 1.299713134765625, 1.3417510986328125, 1.3837890625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 5.0, 1.0, 2.0, 3.0, 1.0, 4.0, 12.0, 12.0, 21.0, 24.0, 83.0, 134.0, 2886.0, 647.0, 113.0, 49.0, 25.0, 17.0, 8.0, 9.0, 8.0, 2.0, 7.0, 3.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.262939453125, -0.24744796752929688, -0.23195648193359375, -0.21646499633789062, -0.2009735107421875, -0.18548202514648438, -0.16999053955078125, -0.15449905395507812, -0.139007568359375, -0.12351608276367188, -0.10802459716796875, -0.09253311157226562, -0.0770416259765625, -0.061550140380859375, -0.04605865478515625, -0.030567169189453125, -0.01507568359375, 0.000415802001953125, 0.01590728759765625, 0.031398773193359375, 0.0468902587890625, 0.062381744384765625, 0.07787322998046875, 0.09336471557617188, 0.108856201171875, 0.12434768676757812, 0.13983917236328125, 0.15533065795898438, 0.1708221435546875, 0.18631362915039062, 0.20180511474609375, 0.21729660034179688, 0.2327880859375, 0.24827957153320312, 0.26377105712890625, 0.2792625427246094, 0.2947540283203125, 0.3102455139160156, 0.32573699951171875, 0.3412284851074219, 0.356719970703125, 0.3722114562988281, 0.38770294189453125, 0.4031944274902344, 0.4186859130859375, 0.4341773986816406, 0.44966888427734375, 0.4651603698730469, 0.48065185546875, 0.4961433410644531, 0.5116348266601562, 0.5271263122558594, 0.5426177978515625, 0.5581092834472656, 0.5736007690429688, 0.5890922546386719, 0.604583740234375, 0.6200752258300781, 0.6355667114257812, 0.6510581970214844, 0.6665496826171875, 0.6820411682128906, 0.6975326538085938, 0.7130241394042969, 0.728515625]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 1.0, 6.0, 10.0, 9.0, 5.0, 20.0, 49.0, 67.0, 112.0, 129.0, 139.0, 113.0, 111.0, 60.0, 63.0, 38.0, 31.0, 15.0, 12.0, 4.0, 2.0, 2.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.53227961063385, -1.471066951751709, -1.4098541736602783, -1.3486413955688477, -1.2874287366867065, -1.2262160778045654, -1.1650032997131348, -1.103790521621704, -1.042577862739563, -0.9813651442527771, -0.9201524257659912, -0.8589397072792053, -0.7977269887924194, -0.7365142703056335, -0.6753015518188477, -0.6140888333320618, -0.5528761148452759, -0.49166339635849, -0.4304506778717041, -0.3692379593849182, -0.3080252408981323, -0.24681252241134644, -0.18559980392456055, -0.12438708543777466, -0.06317436695098877, -0.001961648464202881, 0.05925107002258301, 0.1204637885093689, 0.18167650699615479, 0.24288922548294067, 0.30410194396972656, 0.36531466245651245, 0.4265275001525879, 0.4877402186393738, 0.5489529371261597, 0.6101656556129456, 0.6713783740997314, 0.7325910925865173, 0.7938038110733032, 0.8550165295600891, 0.916229248046875, 0.9774419665336609, 1.0386546850204468, 1.099867343902588, 1.1610801219940186, 1.2222929000854492, 1.2835055589675903, 1.3447182178497314, 1.405930995941162, 1.4671437740325928, 1.5283564329147339, 1.589569091796875, 1.6507818698883057, 1.7119946479797363, 1.7732073068618774, 1.8344199657440186, 1.8956327438354492, 1.9568455219268799, 2.0180583000183105, 2.079270839691162, 2.1404836177825928, 2.2016963958740234, 2.262908935546875, 2.3241217136383057, 2.3853344917297363]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 5.0, 14.0, 7.0, 13.0, 13.0, 20.0, 25.0, 32.0, 45.0, 44.0, 45.0, 48.0, 46.0, 82.0, 65.0, 57.0, 57.0, 57.0, 57.0, 52.0, 42.0, 35.0, 40.0, 25.0, 27.0, 11.0, 10.0, 10.0, 10.0, 2.0, 2.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3468122482299805, -1.3013062477111816, -1.2558001279830933, -1.2102941274642944, -1.164788007736206, -1.1192820072174072, -1.0737760066986084, -1.0282700061798096, -0.9827638864517212, -0.9372578263282776, -0.891751766204834, -0.8462457656860352, -0.8007397055625916, -0.755233645439148, -0.7097276449203491, -0.6642215847969055, -0.6187155246734619, -0.5732094645500183, -0.5277034044265747, -0.4821974039077759, -0.4366913437843323, -0.39118528366088867, -0.34567925333976746, -0.30017322301864624, -0.25466716289520264, -0.20916111767292023, -0.16365507245063782, -0.11814902722835541, -0.072642982006073, -0.02713693678379059, 0.01836910843849182, 0.06387513875961304, 0.10938107967376709, 0.1548871248960495, 0.2003931701183319, 0.24589921534061432, 0.29140526056289673, 0.33691132068634033, 0.38241735100746155, 0.42792338132858276, 0.47342944145202637, 0.51893550157547, 0.5644415616989136, 0.6099475622177124, 0.655453622341156, 0.7009596824645996, 0.7464656829833984, 0.791971743106842, 0.8374778032302856, 0.8829838633537292, 0.9284899234771729, 0.9739959239959717, 1.0195019245147705, 1.0650080442428589, 1.1105140447616577, 1.156020164489746, 1.201526165008545, 1.2470321655273438, 1.2925382852554321, 1.338044285774231, 1.3835504055023193, 1.4290564060211182, 1.474562406539917, 1.5200684070587158, 1.5655745267868042]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 0.0, 1.0, 4.0, 7.0, 10.0, 18.0, 25.0, 44.0, 76.0, 122.0, 211.0, 344.0, 714.0, 1508.0, 3962.0, 12528.0, 47480.0, 196917.0, 452984.0, 246570.0, 61254.0, 15358.0, 4726.0, 1833.0, 850.0, 469.0, 227.0, 119.0, 73.0, 48.0, 29.0, 19.0, 11.0, 7.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.3115234375, -1.2724761962890625, -1.233428955078125, -1.1943817138671875, -1.15533447265625, -1.1162872314453125, -1.077239990234375, -1.0381927490234375, -0.9991455078125, -0.9600982666015625, -0.921051025390625, -0.8820037841796875, -0.84295654296875, -0.8039093017578125, -0.764862060546875, -0.7258148193359375, -0.686767578125, -0.6477203369140625, -0.608673095703125, -0.5696258544921875, -0.53057861328125, -0.4915313720703125, -0.452484130859375, -0.4134368896484375, -0.3743896484375, -0.3353424072265625, -0.296295166015625, -0.2572479248046875, -0.21820068359375, -0.1791534423828125, -0.140106201171875, -0.1010589599609375, -0.06201171875, -0.0229644775390625, 0.016082763671875, 0.0551300048828125, 0.09417724609375, 0.1332244873046875, 0.172271728515625, 0.2113189697265625, 0.2503662109375, 0.2894134521484375, 0.328460693359375, 0.3675079345703125, 0.40655517578125, 0.4456024169921875, 0.484649658203125, 0.5236968994140625, 0.562744140625, 0.6017913818359375, 0.640838623046875, 0.6798858642578125, 0.71893310546875, 0.7579803466796875, 0.797027587890625, 0.8360748291015625, 0.8751220703125, 0.9141693115234375, 0.953216552734375, 0.9922637939453125, 1.03131103515625, 1.0703582763671875, 1.109405517578125, 1.1484527587890625, 1.1875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 10.0, 16.0, 17.0, 23.0, 34.0, 27.0, 42.0, 60.0, 84.0, 68.0, 76.0, 81.0, 88.0, 87.0, 66.0, 60.0, 50.0, 32.0, 24.0, 20.0, 15.0, 7.0, 9.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.828125, -0.804046630859375, -0.77996826171875, -0.755889892578125, -0.7318115234375, -0.707733154296875, -0.68365478515625, -0.659576416015625, -0.635498046875, -0.611419677734375, -0.58734130859375, -0.563262939453125, -0.5391845703125, -0.515106201171875, -0.49102783203125, -0.466949462890625, -0.44287109375, -0.418792724609375, -0.39471435546875, -0.370635986328125, -0.3465576171875, -0.322479248046875, -0.29840087890625, -0.274322509765625, -0.250244140625, -0.226165771484375, -0.20208740234375, -0.178009033203125, -0.1539306640625, -0.129852294921875, -0.10577392578125, -0.081695556640625, -0.0576171875, -0.033538818359375, -0.00946044921875, 0.014617919921875, 0.0386962890625, 0.062774658203125, 0.08685302734375, 0.110931396484375, 0.135009765625, 0.159088134765625, 0.18316650390625, 0.207244873046875, 0.2313232421875, 0.255401611328125, 0.27947998046875, 0.303558349609375, 0.32763671875, 0.351715087890625, 0.37579345703125, 0.399871826171875, 0.4239501953125, 0.448028564453125, 0.47210693359375, 0.496185302734375, 0.520263671875, 0.544342041015625, 0.56842041015625, 0.592498779296875, 0.6165771484375, 0.640655517578125, 0.66473388671875, 0.688812255859375, 0.712890625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 4.0, 10.0, 15.0, 16.0, 16.0, 50.0, 87.0, 153.0, 266.0, 596.0, 1569.0, 6290.0, 49622.0, 628318.0, 331380.0, 24078.0, 3932.0, 1180.0, 474.0, 210.0, 122.0, 57.0, 37.0, 18.0, 17.0, 11.0, 7.0, 6.0, 5.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.091796875, -2.02398681640625, -1.9561767578125, -1.88836669921875, -1.820556640625, -1.75274658203125, -1.6849365234375, -1.61712646484375, -1.54931640625, -1.48150634765625, -1.4136962890625, -1.34588623046875, -1.278076171875, -1.21026611328125, -1.1424560546875, -1.07464599609375, -1.0068359375, -0.93902587890625, -0.8712158203125, -0.80340576171875, -0.735595703125, -0.66778564453125, -0.5999755859375, -0.53216552734375, -0.46435546875, -0.39654541015625, -0.3287353515625, -0.26092529296875, -0.193115234375, -0.12530517578125, -0.0574951171875, 0.01031494140625, 0.078125, 0.14593505859375, 0.2137451171875, 0.28155517578125, 0.349365234375, 0.41717529296875, 0.4849853515625, 0.55279541015625, 0.62060546875, 0.68841552734375, 0.7562255859375, 0.82403564453125, 0.891845703125, 0.95965576171875, 1.0274658203125, 1.09527587890625, 1.1630859375, 1.23089599609375, 1.2987060546875, 1.36651611328125, 1.434326171875, 1.50213623046875, 1.5699462890625, 1.63775634765625, 1.70556640625, 1.77337646484375, 1.8411865234375, 1.90899658203125, 1.976806640625, 2.04461669921875, 2.1124267578125, 2.18023681640625, 2.248046875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 8.0, 16.0, 15.0, 19.0, 34.0, 38.0, 47.0, 68.0, 75.0, 82.0, 99.0, 90.0, 98.0, 69.0, 70.0, 59.0, 49.0, 20.0, 15.0, 15.0, 4.0, 2.0, 6.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-5.16015625, -5.039031982421875, -4.91790771484375, -4.796783447265625, -4.6756591796875, -4.554534912109375, -4.43341064453125, -4.312286376953125, -4.191162109375, -4.070037841796875, -3.94891357421875, -3.827789306640625, -3.7066650390625, -3.585540771484375, -3.46441650390625, -3.343292236328125, -3.22216796875, -3.101043701171875, -2.97991943359375, -2.858795166015625, -2.7376708984375, -2.616546630859375, -2.49542236328125, -2.374298095703125, -2.253173828125, -2.132049560546875, -2.01092529296875, -1.889801025390625, -1.7686767578125, -1.647552490234375, -1.52642822265625, -1.405303955078125, -1.2841796875, -1.163055419921875, -1.04193115234375, -0.920806884765625, -0.7996826171875, -0.678558349609375, -0.55743408203125, -0.436309814453125, -0.315185546875, -0.194061279296875, -0.07293701171875, 0.048187255859375, 0.1693115234375, 0.290435791015625, 0.41156005859375, 0.532684326171875, 0.65380859375, 0.774932861328125, 0.89605712890625, 1.017181396484375, 1.1383056640625, 1.259429931640625, 1.38055419921875, 1.501678466796875, 1.622802734375, 1.743927001953125, 1.86505126953125, 1.986175537109375, 2.1072998046875, 2.228424072265625, 2.34954833984375, 2.470672607421875, 2.591796875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 5.0, 8.0, 21.0, 25.0, 57.0, 99.0, 248.0, 920.0, 5133.0, 97288.0, 911362.0, 29801.0, 2690.0, 521.0, 195.0, 85.0, 40.0, 20.0, 18.0, 14.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6640625, -2.5996246337890625, -2.535186767578125, -2.4707489013671875, -2.40631103515625, -2.3418731689453125, -2.277435302734375, -2.2129974365234375, -2.1485595703125, -2.0841217041015625, -2.019683837890625, -1.9552459716796875, -1.89080810546875, -1.8263702392578125, -1.761932373046875, -1.6974945068359375, -1.633056640625, -1.5686187744140625, -1.504180908203125, -1.4397430419921875, -1.37530517578125, -1.3108673095703125, -1.246429443359375, -1.1819915771484375, -1.1175537109375, -1.0531158447265625, -0.988677978515625, -0.9242401123046875, -0.85980224609375, -0.7953643798828125, -0.730926513671875, -0.6664886474609375, -0.60205078125, -0.5376129150390625, -0.473175048828125, -0.4087371826171875, -0.34429931640625, -0.2798614501953125, -0.215423583984375, -0.1509857177734375, -0.0865478515625, -0.0221099853515625, 0.042327880859375, 0.1067657470703125, 0.17120361328125, 0.2356414794921875, 0.300079345703125, 0.3645172119140625, 0.428955078125, 0.4933929443359375, 0.557830810546875, 0.6222686767578125, 0.68670654296875, 0.7511444091796875, 0.815582275390625, 0.8800201416015625, 0.9444580078125, 1.0088958740234375, 1.073333740234375, 1.1377716064453125, 1.20220947265625, 1.2666473388671875, 1.331085205078125, 1.3955230712890625, 1.4599609375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 7.0, 3.0, 6.0, 10.0, 16.0, 22.0, 36.0, 70.0, 90.0, 130.0, 146.0, 136.0, 115.0, 68.0, 48.0, 33.0, 20.0, 12.0, 13.0, 7.0, 6.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019121170043945312, -0.00018480047583580017, -0.00017838925123214722, -0.00017197802662849426, -0.0001655668020248413, -0.00015915557742118835, -0.0001527443528175354, -0.00014633312821388245, -0.0001399219036102295, -0.00013351067900657654, -0.00012709945440292358, -0.00012068822979927063, -0.00011427700519561768, -0.00010786578059196472, -0.00010145455598831177, -9.504333138465881e-05, -8.863210678100586e-05, -8.22208821773529e-05, -7.580965757369995e-05, -6.9398432970047e-05, -6.298720836639404e-05, -5.657598376274109e-05, -5.0164759159088135e-05, -4.375353455543518e-05, -3.7342309951782227e-05, -3.093108534812927e-05, -2.451986074447632e-05, -1.8108636140823364e-05, -1.169741153717041e-05, -5.286186933517456e-06, 1.125037670135498e-06, 7.536262273788452e-06, 1.3947486877441406e-05, 2.035871148109436e-05, 2.6769936084747314e-05, 3.318116068840027e-05, 3.959238529205322e-05, 4.600360989570618e-05, 5.241483449935913e-05, 5.8826059103012085e-05, 6.523728370666504e-05, 7.164850831031799e-05, 7.805973291397095e-05, 8.44709575176239e-05, 9.088218212127686e-05, 9.729340672492981e-05, 0.00010370463132858276, 0.00011011585593223572, 0.00011652708053588867, 0.00012293830513954163, 0.00012934952974319458, 0.00013576075434684753, 0.0001421719789505005, 0.00014858320355415344, 0.0001549944281578064, 0.00016140565276145935, 0.0001678168773651123, 0.00017422810196876526, 0.0001806393265724182, 0.00018705055117607117, 0.00019346177577972412, 0.00019987300038337708, 0.00020628422498703003, 0.00021269544959068298, 0.00021910667419433594]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 8.0, 13.0, 13.0, 39.0, 74.0, 139.0, 464.0, 2387.0, 31336.0, 932239.0, 77196.0, 3605.0, 659.0, 205.0, 79.0, 47.0, 22.0, 19.0, 5.0, 2.0, 5.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1328125, -2.067413330078125, -2.00201416015625, -1.936614990234375, -1.8712158203125, -1.805816650390625, -1.74041748046875, -1.675018310546875, -1.609619140625, -1.544219970703125, -1.47882080078125, -1.413421630859375, -1.3480224609375, -1.282623291015625, -1.21722412109375, -1.151824951171875, -1.08642578125, -1.021026611328125, -0.95562744140625, -0.890228271484375, -0.8248291015625, -0.759429931640625, -0.69403076171875, -0.628631591796875, -0.563232421875, -0.497833251953125, -0.43243408203125, -0.367034912109375, -0.3016357421875, -0.236236572265625, -0.17083740234375, -0.105438232421875, -0.0400390625, 0.025360107421875, 0.09075927734375, 0.156158447265625, 0.2215576171875, 0.286956787109375, 0.35235595703125, 0.417755126953125, 0.483154296875, 0.548553466796875, 0.61395263671875, 0.679351806640625, 0.7447509765625, 0.810150146484375, 0.87554931640625, 0.940948486328125, 1.00634765625, 1.071746826171875, 1.13714599609375, 1.202545166015625, 1.2679443359375, 1.333343505859375, 1.39874267578125, 1.464141845703125, 1.529541015625, 1.594940185546875, 1.66033935546875, 1.725738525390625, 1.7911376953125, 1.856536865234375, 1.92193603515625, 1.987335205078125, 2.052734375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 12.0, 6.0, 12.0, 23.0, 46.0, 72.0, 111.0, 139.0, 172.0, 134.0, 96.0, 71.0, 49.0, 25.0, 13.0, 9.0, 7.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.87353515625, -0.8232650756835938, -0.7729949951171875, -0.7227249145507812, -0.672454833984375, -0.6221847534179688, -0.5719146728515625, -0.5216445922851562, -0.47137451171875, -0.42110443115234375, -0.3708343505859375, -0.32056427001953125, -0.270294189453125, -0.22002410888671875, -0.1697540283203125, -0.11948394775390625, -0.0692138671875, -0.01894378662109375, 0.0313262939453125, 0.08159637451171875, 0.131866455078125, 0.18213653564453125, 0.2324066162109375, 0.28267669677734375, 0.33294677734375, 0.38321685791015625, 0.4334869384765625, 0.48375701904296875, 0.534027099609375, 0.5842971801757812, 0.6345672607421875, 0.6848373413085938, 0.735107421875, 0.7853775024414062, 0.8356475830078125, 0.8859176635742188, 0.936187744140625, 0.9864578247070312, 1.0367279052734375, 1.0869979858398438, 1.13726806640625, 1.1875381469726562, 1.2378082275390625, 1.2880783081054688, 1.338348388671875, 1.3886184692382812, 1.4388885498046875, 1.4891586303710938, 1.5394287109375, 1.5896987915039062, 1.6399688720703125, 1.6902389526367188, 1.740509033203125, 1.7907791137695312, 1.8410491943359375, 1.8913192749023438, 1.94158935546875, 1.9918594360351562, 2.0421295166015625, 2.0923995971679688, 2.142669677734375, 2.1929397583007812, 2.2432098388671875, 2.2934799194335938, 2.34375]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 10.0, 21.0, 40.0, 97.0, 131.0, 173.0, 200.0, 154.0, 92.0, 41.0, 17.0, 13.0, 8.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.484781265258789, -10.873579025268555, -10.26237678527832, -9.651174545288086, -9.039972305297852, -8.428770065307617, -7.817568778991699, -7.206366539001465, -6.5951642990112305, -5.983962059020996, -5.372759819030762, -4.7615580558776855, -4.150355815887451, -3.539153575897217, -2.9279515743255615, -2.3167495727539062, -1.7055473327636719, -1.094345211982727, -0.4831430912017822, 0.1280590295791626, 0.7392611503601074, 1.3504633903503418, 1.961665391921997, 2.5728673934936523, 3.1840696334838867, 3.795271873474121, 4.4064741134643555, 5.017675876617432, 5.628878116607666, 6.2400803565979, 6.851282119750977, 7.462484359741211, 8.073688507080078, 8.684890747070312, 9.296092987060547, 9.907295227050781, 10.518497467041016, 11.12969970703125, 11.740900993347168, 12.352103233337402, 12.963305473327637, 13.574507713317871, 14.185709953308105, 14.79691219329834, 15.408113479614258, 16.019315719604492, 16.630517959594727, 17.24172019958496, 17.852922439575195, 18.46412467956543, 19.075326919555664, 19.6865291595459, 20.297731399536133, 20.908933639526367, 21.5201358795166, 22.131336212158203, 22.742538452148438, 23.353740692138672, 23.964942932128906, 24.57614517211914, 25.187347412109375, 25.79854965209961, 26.409751892089844, 27.020954132080078, 27.632156372070312]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 3.0, 11.0, 9.0, 9.0, 20.0, 24.0, 25.0, 31.0, 38.0, 31.0, 37.0, 36.0, 50.0, 56.0, 44.0, 64.0, 58.0, 54.0, 61.0, 45.0, 43.0, 37.0, 41.0, 34.0, 29.0, 28.0, 15.0, 20.0, 12.0, 7.0, 9.0, 5.0, 3.0, 2.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.89755916595459, -10.513012886047363, -10.128466606140137, -9.74392032623291, -9.359374046325684, -8.974827766418457, -8.590280532836914, -8.205734252929688, -7.821188449859619, -7.436642169952393, -7.052095890045166, -6.667549133300781, -6.283002853393555, -5.898456573486328, -5.513910293579102, -5.129364013671875, -4.744817733764648, -4.360271453857422, -3.9757251739501953, -3.5911786556243896, -3.206632375717163, -2.8220860958099365, -2.437539577484131, -2.0529932975769043, -1.6684470176696777, -1.2839007377624512, -0.8993543386459351, -0.514807939529419, -0.13026165962219238, 0.2542846202850342, 0.6388311386108398, 1.0233774185180664, 1.4079227447509766, 1.7924690246582031, 2.1770153045654297, 2.5615618228912354, 2.946108102798462, 3.3306543827056885, 3.715200901031494, 4.099747180938721, 4.484293460845947, 4.868839740753174, 5.2533860206604, 5.637932777404785, 6.022479057312012, 6.407025337219238, 6.791571617126465, 7.176117897033691, 7.560664176940918, 7.9452104568481445, 8.329756736755371, 8.714303016662598, 9.098849296569824, 9.48339557647705, 9.867942810058594, 10.25248908996582, 10.637035369873047, 11.021581649780273, 11.4061279296875, 11.790674209594727, 12.175220489501953, 12.55976676940918, 12.944313049316406, 13.328859329223633, 13.71340560913086]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 7.0, 13.0, 9.0, 23.0, 22.0, 29.0, 47.0, 91.0, 130.0, 195.0, 344.0, 587.0, 1190.0, 2730.0, 7827.0, 39597.0, 4091889.0, 36892.0, 7507.0, 2668.0, 1122.0, 557.0, 282.0, 173.0, 129.0, 71.0, 43.0, 33.0, 28.0, 13.0, 12.0, 6.0, 5.0, 2.0, 2.0, 0.0, 3.0, 4.0], "bins": [-3.244140625, -3.1677703857421875, -3.091400146484375, -3.0150299072265625, -2.93865966796875, -2.8622894287109375, -2.785919189453125, -2.7095489501953125, -2.6331787109375, -2.5568084716796875, -2.480438232421875, -2.4040679931640625, -2.32769775390625, -2.2513275146484375, -2.174957275390625, -2.0985870361328125, -2.022216796875, -1.9458465576171875, -1.869476318359375, -1.7931060791015625, -1.71673583984375, -1.6403656005859375, -1.563995361328125, -1.4876251220703125, -1.4112548828125, -1.3348846435546875, -1.258514404296875, -1.1821441650390625, -1.10577392578125, -1.0294036865234375, -0.953033447265625, -0.8766632080078125, -0.80029296875, -0.7239227294921875, -0.647552490234375, -0.5711822509765625, -0.49481201171875, -0.4184417724609375, -0.342071533203125, -0.2657012939453125, -0.1893310546875, -0.1129608154296875, -0.036590576171875, 0.0397796630859375, 0.11614990234375, 0.1925201416015625, 0.268890380859375, 0.3452606201171875, 0.421630859375, 0.4980010986328125, 0.574371337890625, 0.6507415771484375, 0.72711181640625, 0.8034820556640625, 0.879852294921875, 0.9562225341796875, 1.0325927734375, 1.1089630126953125, 1.185333251953125, 1.2617034912109375, 1.33807373046875, 1.4144439697265625, 1.490814208984375, 1.5671844482421875, 1.6435546875]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 5.0, 6.0, 7.0, 10.0, 20.0, 27.0, 29.0, 36.0, 36.0, 44.0, 60.0, 62.0, 69.0, 76.0, 87.0, 70.0, 66.0, 50.0, 55.0, 49.0, 31.0, 27.0, 20.0, 17.0, 14.0, 3.0, 2.0, 4.0, 4.0, 3.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.80224609375, -0.7787017822265625, -0.755157470703125, -0.7316131591796875, -0.70806884765625, -0.6845245361328125, -0.660980224609375, -0.6374359130859375, -0.6138916015625, -0.5903472900390625, -0.566802978515625, -0.5432586669921875, -0.51971435546875, -0.4961700439453125, -0.472625732421875, -0.4490814208984375, -0.425537109375, -0.4019927978515625, -0.378448486328125, -0.3549041748046875, -0.33135986328125, -0.3078155517578125, -0.284271240234375, -0.2607269287109375, -0.2371826171875, -0.2136383056640625, -0.190093994140625, -0.1665496826171875, -0.14300537109375, -0.1194610595703125, -0.095916748046875, -0.0723724365234375, -0.048828125, -0.0252838134765625, -0.001739501953125, 0.0218048095703125, 0.04534912109375, 0.0688934326171875, 0.092437744140625, 0.1159820556640625, 0.1395263671875, 0.1630706787109375, 0.186614990234375, 0.2101593017578125, 0.23370361328125, 0.2572479248046875, 0.280792236328125, 0.3043365478515625, 0.327880859375, 0.3514251708984375, 0.374969482421875, 0.3985137939453125, 0.42205810546875, 0.4456024169921875, 0.469146728515625, 0.4926910400390625, 0.5162353515625, 0.5397796630859375, 0.563323974609375, 0.5868682861328125, 0.61041259765625, 0.6339569091796875, 0.657501220703125, 0.6810455322265625, 0.70458984375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 7.0, 3.0, 2.0, 2.0, 5.0, 11.0, 9.0, 12.0, 15.0, 9.0, 28.0, 34.0, 25.0, 50.0, 73.0, 111.0, 209.0, 433.0, 1083.0, 3757.0, 25840.0, 4121180.0, 34556.0, 4451.0, 1229.0, 463.0, 244.0, 128.0, 67.0, 63.0, 38.0, 24.0, 22.0, 26.0, 17.0, 6.0, 4.0, 6.0, 6.0, 12.0, 7.0, 4.0, 10.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.982421875, -3.852081298828125, -3.72174072265625, -3.591400146484375, -3.4610595703125, -3.330718994140625, -3.20037841796875, -3.070037841796875, -2.939697265625, -2.809356689453125, -2.67901611328125, -2.548675537109375, -2.4183349609375, -2.287994384765625, -2.15765380859375, -2.027313232421875, -1.89697265625, -1.766632080078125, -1.63629150390625, -1.505950927734375, -1.3756103515625, -1.245269775390625, -1.11492919921875, -0.984588623046875, -0.854248046875, -0.723907470703125, -0.59356689453125, -0.463226318359375, -0.3328857421875, -0.202545166015625, -0.07220458984375, 0.058135986328125, 0.1884765625, 0.318817138671875, 0.44915771484375, 0.579498291015625, 0.7098388671875, 0.840179443359375, 0.97052001953125, 1.100860595703125, 1.231201171875, 1.361541748046875, 1.49188232421875, 1.622222900390625, 1.7525634765625, 1.882904052734375, 2.01324462890625, 2.143585205078125, 2.27392578125, 2.404266357421875, 2.53460693359375, 2.664947509765625, 2.7952880859375, 2.925628662109375, 3.05596923828125, 3.186309814453125, 3.316650390625, 3.446990966796875, 3.57733154296875, 3.707672119140625, 3.8380126953125, 3.968353271484375, 4.09869384765625, 4.229034423828125, 4.359375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 7.0, 7.0, 11.0, 26.0, 50.0, 183.0, 3670.0, 71.0, 29.0, 10.0, 8.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.66845703125, -0.6408157348632812, -0.6131744384765625, -0.5855331420898438, -0.557891845703125, -0.5302505493164062, -0.5026092529296875, -0.47496795654296875, -0.44732666015625, -0.41968536376953125, -0.3920440673828125, -0.36440277099609375, -0.336761474609375, -0.30912017822265625, -0.2814788818359375, -0.25383758544921875, -0.2261962890625, -0.19855499267578125, -0.1709136962890625, -0.14327239990234375, -0.115631103515625, -0.08798980712890625, -0.0603485107421875, -0.03270721435546875, -0.00506591796875, 0.02257537841796875, 0.0502166748046875, 0.07785797119140625, 0.105499267578125, 0.13314056396484375, 0.1607818603515625, 0.18842315673828125, 0.216064453125, 0.24370574951171875, 0.2713470458984375, 0.29898834228515625, 0.326629638671875, 0.35427093505859375, 0.3819122314453125, 0.40955352783203125, 0.43719482421875, 0.46483612060546875, 0.4924774169921875, 0.5201187133789062, 0.547760009765625, 0.5754013061523438, 0.6030426025390625, 0.6306838989257812, 0.6583251953125, 0.6859664916992188, 0.7136077880859375, 0.7412490844726562, 0.768890380859375, 0.7965316772460938, 0.8241729736328125, 0.8518142700195312, 0.87945556640625, 0.9070968627929688, 0.9347381591796875, 0.9623794555664062, 0.990020751953125, 1.0176620483398438, 1.0453033447265625, 1.0729446411132812, 1.1005859375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 2.0, 5.0, 7.0, 14.0, 13.0, 11.0, 19.0, 35.0, 37.0, 60.0, 72.0, 92.0, 98.0, 126.0, 86.0, 64.0, 68.0, 54.0, 34.0, 33.0, 24.0, 8.0, 9.0, 6.0, 5.0, 5.0, 4.0, 6.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.9305427074432373, -1.881780982017517, -1.8330192565917969, -1.784257411956787, -1.735495686531067, -1.6867339611053467, -1.637972116470337, -1.5892103910446167, -1.5404486656188965, -1.4916869401931763, -1.442925214767456, -1.3941633701324463, -1.345401644706726, -1.2966399192810059, -1.247878074645996, -1.1991163492202759, -1.1503546237945557, -1.1015928983688354, -1.0528311729431152, -1.0040693283081055, -0.9553076028823853, -0.906545877456665, -0.8577840924263, -0.8090223073959351, -0.7602605819702148, -0.7114988565444946, -0.6627370715141296, -0.6139752864837646, -0.5652135610580444, -0.5164518356323242, -0.46769005060195923, -0.4189282953739166, -0.370166540145874, -0.3214047849178314, -0.2726430296897888, -0.22388127446174622, -0.1751195192337036, -0.126357764005661, -0.07759600877761841, -0.028834253549575806, 0.019927501678466797, 0.0686892569065094, 0.117451012134552, 0.1662127673625946, 0.2149745225906372, 0.2637362778186798, 0.3124980330467224, 0.361259788274765, 0.4100215435028076, 0.4587832987308502, 0.5075450539588928, 0.5563068389892578, 0.605068564414978, 0.6538302898406982, 0.7025920748710632, 0.7513538599014282, 0.8001155853271484, 0.8488773107528687, 0.8976390957832336, 0.9464008808135986, 0.9951626062393188, 1.043924331665039, 1.0926861763000488, 1.141447901725769, 1.1902096271514893]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 4.0, 4.0, 3.0, 3.0, 6.0, 12.0, 8.0, 15.0, 16.0, 16.0, 22.0, 16.0, 30.0, 26.0, 38.0, 32.0, 36.0, 43.0, 41.0, 48.0, 53.0, 40.0, 41.0, 47.0, 43.0, 52.0, 42.0, 42.0, 32.0, 36.0, 22.0, 18.0, 24.0, 18.0, 14.0, 19.0, 6.0, 14.0, 2.0, 7.0, 4.0, 7.0, 5.0, 2.0, 4.0, 1.0], "bins": [-1.3384265899658203, -1.3046557903289795, -1.2708848714828491, -1.2371140718460083, -1.2033432722091675, -1.169572353363037, -1.1358015537261963, -1.1020307540893555, -1.0682599544525146, -1.0344891548156738, -1.0007182359695435, -0.9669474363327026, -0.9331766366958618, -0.8994057774543762, -0.8656349182128906, -0.8318641185760498, -0.7980931997299194, -0.7643223404884338, -0.730551540851593, -0.6967806816101074, -0.6630098819732666, -0.629239022731781, -0.5954681634902954, -0.5616973638534546, -0.527926504611969, -0.4941556751728058, -0.4603848457336426, -0.426613986492157, -0.3928431570529938, -0.35907232761383057, -0.32530146837234497, -0.29153063893318176, -0.2577599287033081, -0.2239890992641449, -0.1902182549238205, -0.1564474105834961, -0.12267658114433289, -0.08890575170516968, -0.055134907364845276, -0.021364063024520874, 0.012406766414642334, 0.04617760330438614, 0.07994844019412994, 0.11371927708387375, 0.14749011397361755, 0.18126094341278076, 0.21503178775310516, 0.24880263209342957, 0.2825734615325928, 0.316344290971756, 0.3501151204109192, 0.3838859796524048, 0.417656809091568, 0.4514276385307312, 0.4851984977722168, 0.5189692974090576, 0.5527401566505432, 0.5865110158920288, 0.6202818155288696, 0.6540526747703552, 0.6878235340118408, 0.7215943336486816, 0.7553651928901672, 0.7891360521316528, 0.8229068517684937]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 2.0, 5.0, 12.0, 11.0, 22.0, 25.0, 35.0, 62.0, 114.0, 173.0, 316.0, 489.0, 911.0, 1793.0, 3588.0, 7619.0, 17206.0, 41243.0, 105611.0, 243422.0, 319040.0, 181151.0, 73260.0, 28970.0, 12272.0, 5474.0, 2619.0, 1318.0, 729.0, 420.0, 244.0, 162.0, 81.0, 48.0, 48.0, 23.0, 15.0, 13.0, 4.0, 6.0, 3.0, 1.0, 2.0, 0.0, 3.0, 3.0], "bins": [-1.0341796875, -1.0071792602539062, -0.9801788330078125, -0.9531784057617188, -0.926177978515625, -0.8991775512695312, -0.8721771240234375, -0.8451766967773438, -0.81817626953125, -0.7911758422851562, -0.7641754150390625, -0.7371749877929688, -0.710174560546875, -0.6831741333007812, -0.6561737060546875, -0.6291732788085938, -0.6021728515625, -0.5751724243164062, -0.5481719970703125, -0.5211715698242188, -0.494171142578125, -0.46717071533203125, -0.4401702880859375, -0.41316986083984375, -0.38616943359375, -0.35916900634765625, -0.3321685791015625, -0.30516815185546875, -0.278167724609375, -0.25116729736328125, -0.2241668701171875, -0.19716644287109375, -0.170166015625, -0.14316558837890625, -0.1161651611328125, -0.08916473388671875, -0.062164306640625, -0.03516387939453125, -0.0081634521484375, 0.01883697509765625, 0.04583740234375, 0.07283782958984375, 0.0998382568359375, 0.12683868408203125, 0.153839111328125, 0.18083953857421875, 0.2078399658203125, 0.23484039306640625, 0.2618408203125, 0.28884124755859375, 0.3158416748046875, 0.34284210205078125, 0.369842529296875, 0.39684295654296875, 0.4238433837890625, 0.45084381103515625, 0.47784423828125, 0.5048446655273438, 0.5318450927734375, 0.5588455200195312, 0.585845947265625, 0.6128463745117188, 0.6398468017578125, 0.6668472290039062, 0.69384765625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 5.0, 11.0, 5.0, 15.0, 18.0, 28.0, 20.0, 25.0, 30.0, 44.0, 45.0, 59.0, 59.0, 61.0, 85.0, 63.0, 47.0, 54.0, 52.0, 53.0, 37.0, 33.0, 25.0, 34.0, 18.0, 20.0, 9.0, 13.0, 5.0, 4.0, 5.0, 3.0, 7.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.78857421875, -0.7654647827148438, -0.7423553466796875, -0.7192459106445312, -0.696136474609375, -0.6730270385742188, -0.6499176025390625, -0.6268081665039062, -0.60369873046875, -0.5805892944335938, -0.5574798583984375, -0.5343704223632812, -0.511260986328125, -0.48815155029296875, -0.4650421142578125, -0.44193267822265625, -0.4188232421875, -0.39571380615234375, -0.3726043701171875, -0.34949493408203125, -0.326385498046875, -0.30327606201171875, -0.2801666259765625, -0.25705718994140625, -0.23394775390625, -0.21083831787109375, -0.1877288818359375, -0.16461944580078125, -0.141510009765625, -0.11840057373046875, -0.0952911376953125, -0.07218170166015625, -0.049072265625, -0.02596282958984375, -0.0028533935546875, 0.02025604248046875, 0.043365478515625, 0.06647491455078125, 0.0895843505859375, 0.11269378662109375, 0.13580322265625, 0.15891265869140625, 0.1820220947265625, 0.20513153076171875, 0.228240966796875, 0.25135040283203125, 0.2744598388671875, 0.29756927490234375, 0.3206787109375, 0.34378814697265625, 0.3668975830078125, 0.39000701904296875, 0.413116455078125, 0.43622589111328125, 0.4593353271484375, 0.48244476318359375, 0.50555419921875, 0.5286636352539062, 0.5517730712890625, 0.5748825073242188, 0.597991943359375, 0.6211013793945312, 0.6442108154296875, 0.6673202514648438, 0.6904296875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 7.0, 7.0, 4.0, 12.0, 18.0, 22.0, 26.0, 47.0, 55.0, 75.0, 114.0, 187.0, 318.0, 614.0, 1460.0, 4375.0, 18701.0, 114995.0, 609957.0, 249982.0, 36141.0, 7358.0, 2127.0, 828.0, 413.0, 204.0, 154.0, 85.0, 71.0, 41.0, 29.0, 31.0, 25.0, 18.0, 8.0, 11.0, 11.0, 7.0, 4.0, 4.0, 2.0, 4.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.66796875, -1.6153411865234375, -1.562713623046875, -1.5100860595703125, -1.45745849609375, -1.4048309326171875, -1.352203369140625, -1.2995758056640625, -1.2469482421875, -1.1943206787109375, -1.141693115234375, -1.0890655517578125, -1.03643798828125, -0.9838104248046875, -0.931182861328125, -0.8785552978515625, -0.825927734375, -0.7733001708984375, -0.720672607421875, -0.6680450439453125, -0.61541748046875, -0.5627899169921875, -0.510162353515625, -0.4575347900390625, -0.4049072265625, -0.3522796630859375, -0.299652099609375, -0.2470245361328125, -0.19439697265625, -0.1417694091796875, -0.089141845703125, -0.0365142822265625, 0.01611328125, 0.0687408447265625, 0.121368408203125, 0.1739959716796875, 0.22662353515625, 0.2792510986328125, 0.331878662109375, 0.3845062255859375, 0.4371337890625, 0.4897613525390625, 0.542388916015625, 0.5950164794921875, 0.64764404296875, 0.7002716064453125, 0.752899169921875, 0.8055267333984375, 0.858154296875, 0.9107818603515625, 0.963409423828125, 1.0160369873046875, 1.06866455078125, 1.1212921142578125, 1.173919677734375, 1.2265472412109375, 1.2791748046875, 1.3318023681640625, 1.384429931640625, 1.4370574951171875, 1.48968505859375, 1.5423126220703125, 1.594940185546875, 1.6475677490234375, 1.7001953125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 0.0, 5.0, 7.0, 5.0, 4.0, 10.0, 19.0, 26.0, 22.0, 24.0, 34.0, 33.0, 41.0, 45.0, 49.0, 56.0, 44.0, 60.0, 61.0, 57.0, 60.0, 38.0, 42.0, 45.0, 40.0, 30.0, 29.0, 28.0, 24.0, 15.0, 13.0, 12.0, 5.0, 6.0, 2.0, 5.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.30078125, -3.197723388671875, -3.09466552734375, -2.991607666015625, -2.8885498046875, -2.785491943359375, -2.68243408203125, -2.579376220703125, -2.476318359375, -2.373260498046875, -2.27020263671875, -2.167144775390625, -2.0640869140625, -1.961029052734375, -1.85797119140625, -1.754913330078125, -1.65185546875, -1.548797607421875, -1.44573974609375, -1.342681884765625, -1.2396240234375, -1.136566162109375, -1.03350830078125, -0.930450439453125, -0.827392578125, -0.724334716796875, -0.62127685546875, -0.518218994140625, -0.4151611328125, -0.312103271484375, -0.20904541015625, -0.105987548828125, -0.0029296875, 0.100128173828125, 0.20318603515625, 0.306243896484375, 0.4093017578125, 0.512359619140625, 0.61541748046875, 0.718475341796875, 0.821533203125, 0.924591064453125, 1.02764892578125, 1.130706787109375, 1.2337646484375, 1.336822509765625, 1.43988037109375, 1.542938232421875, 1.64599609375, 1.749053955078125, 1.85211181640625, 1.955169677734375, 2.0582275390625, 2.161285400390625, 2.26434326171875, 2.367401123046875, 2.470458984375, 2.573516845703125, 2.67657470703125, 2.779632568359375, 2.8826904296875, 2.985748291015625, 3.08880615234375, 3.191864013671875, 3.294921875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 6.0, 1.0, 4.0, 2.0, 4.0, 14.0, 17.0, 18.0, 50.0, 102.0, 283.0, 1054.0, 7289.0, 764220.0, 269615.0, 4620.0, 838.0, 239.0, 70.0, 49.0, 21.0, 18.0, 9.0, 11.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8125, -2.73193359375, -2.6513671875, -2.57080078125, -2.490234375, -2.40966796875, -2.3291015625, -2.24853515625, -2.16796875, -2.08740234375, -2.0068359375, -1.92626953125, -1.845703125, -1.76513671875, -1.6845703125, -1.60400390625, -1.5234375, -1.44287109375, -1.3623046875, -1.28173828125, -1.201171875, -1.12060546875, -1.0400390625, -0.95947265625, -0.87890625, -0.79833984375, -0.7177734375, -0.63720703125, -0.556640625, -0.47607421875, -0.3955078125, -0.31494140625, -0.234375, -0.15380859375, -0.0732421875, 0.00732421875, 0.087890625, 0.16845703125, 0.2490234375, 0.32958984375, 0.41015625, 0.49072265625, 0.5712890625, 0.65185546875, 0.732421875, 0.81298828125, 0.8935546875, 0.97412109375, 1.0546875, 1.13525390625, 1.2158203125, 1.29638671875, 1.376953125, 1.45751953125, 1.5380859375, 1.61865234375, 1.69921875, 1.77978515625, 1.8603515625, 1.94091796875, 2.021484375, 2.10205078125, 2.1826171875, 2.26318359375, 2.34375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 6.0, 6.0, 14.0, 11.0, 28.0, 31.0, 57.0, 65.0, 92.0, 110.0, 110.0, 115.0, 101.0, 88.0, 60.0, 36.0, 17.0, 21.0, 9.0, 4.0, 6.0, 3.0, 5.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0001811981201171875, -0.00017610937356948853, -0.00017102062702178955, -0.00016593188047409058, -0.0001608431339263916, -0.00015575438737869263, -0.00015066564083099365, -0.00014557689428329468, -0.0001404881477355957, -0.00013539940118789673, -0.00013031065464019775, -0.00012522190809249878, -0.0001201331615447998, -0.00011504441499710083, -0.00010995566844940186, -0.00010486692190170288, -9.97781753540039e-05, -9.468942880630493e-05, -8.960068225860596e-05, -8.451193571090698e-05, -7.942318916320801e-05, -7.433444261550903e-05, -6.924569606781006e-05, -6.415694952011108e-05, -5.906820297241211e-05, -5.3979456424713135e-05, -4.889070987701416e-05, -4.3801963329315186e-05, -3.871321678161621e-05, -3.3624470233917236e-05, -2.8535723686218262e-05, -2.3446977138519287e-05, -1.8358230590820312e-05, -1.3269484043121338e-05, -8.180737495422363e-06, -3.0919909477233887e-06, 1.996755599975586e-06, 7.0855021476745605e-06, 1.2174248695373535e-05, 1.726299524307251e-05, 2.2351741790771484e-05, 2.744048833847046e-05, 3.2529234886169434e-05, 3.761798143386841e-05, 4.270672798156738e-05, 4.779547452926636e-05, 5.288422107696533e-05, 5.797296762466431e-05, 6.306171417236328e-05, 6.815046072006226e-05, 7.323920726776123e-05, 7.83279538154602e-05, 8.341670036315918e-05, 8.850544691085815e-05, 9.359419345855713e-05, 9.86829400062561e-05, 0.00010377168655395508, 0.00010886043310165405, 0.00011394917964935303, 0.000119037926197052, 0.00012412667274475098, 0.00012921541929244995, 0.00013430416584014893, 0.0001393929123878479, 0.00014448165893554688]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 8.0, 9.0, 22.0, 20.0, 52.0, 116.0, 190.0, 497.0, 1536.0, 6567.0, 66924.0, 887791.0, 75285.0, 6947.0, 1647.0, 494.0, 215.0, 102.0, 59.0, 28.0, 14.0, 13.0, 3.0, 8.0, 4.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.951171875, -1.90301513671875, -1.8548583984375, -1.80670166015625, -1.758544921875, -1.71038818359375, -1.6622314453125, -1.61407470703125, -1.56591796875, -1.51776123046875, -1.4696044921875, -1.42144775390625, -1.373291015625, -1.32513427734375, -1.2769775390625, -1.22882080078125, -1.1806640625, -1.13250732421875, -1.0843505859375, -1.03619384765625, -0.988037109375, -0.93988037109375, -0.8917236328125, -0.84356689453125, -0.79541015625, -0.74725341796875, -0.6990966796875, -0.65093994140625, -0.602783203125, -0.55462646484375, -0.5064697265625, -0.45831298828125, -0.41015625, -0.36199951171875, -0.3138427734375, -0.26568603515625, -0.217529296875, -0.16937255859375, -0.1212158203125, -0.07305908203125, -0.02490234375, 0.02325439453125, 0.0714111328125, 0.11956787109375, 0.167724609375, 0.21588134765625, 0.2640380859375, 0.31219482421875, 0.3603515625, 0.40850830078125, 0.4566650390625, 0.50482177734375, 0.552978515625, 0.60113525390625, 0.6492919921875, 0.69744873046875, 0.74560546875, 0.79376220703125, 0.8419189453125, 0.89007568359375, 0.938232421875, 0.98638916015625, 1.0345458984375, 1.08270263671875, 1.130859375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 2.0, 1.0, 5.0, 7.0, 3.0, 5.0, 5.0, 8.0, 23.0, 29.0, 58.0, 97.0, 180.0, 197.0, 139.0, 103.0, 52.0, 28.0, 10.0, 12.0, 7.0, 3.0, 3.0, 4.0, 5.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.5322265625, -1.4740447998046875, -1.415863037109375, -1.3576812744140625, -1.29949951171875, -1.2413177490234375, -1.183135986328125, -1.1249542236328125, -1.0667724609375, -1.0085906982421875, -0.950408935546875, -0.8922271728515625, -0.83404541015625, -0.7758636474609375, -0.717681884765625, -0.6595001220703125, -0.601318359375, -0.5431365966796875, -0.484954833984375, -0.4267730712890625, -0.36859130859375, -0.3104095458984375, -0.252227783203125, -0.1940460205078125, -0.1358642578125, -0.0776824951171875, -0.019500732421875, 0.0386810302734375, 0.09686279296875, 0.1550445556640625, 0.213226318359375, 0.2714080810546875, 0.32958984375, 0.3877716064453125, 0.445953369140625, 0.5041351318359375, 0.56231689453125, 0.6204986572265625, 0.678680419921875, 0.7368621826171875, 0.7950439453125, 0.8532257080078125, 0.911407470703125, 0.9695892333984375, 1.02777099609375, 1.0859527587890625, 1.144134521484375, 1.2023162841796875, 1.260498046875, 1.3186798095703125, 1.376861572265625, 1.4350433349609375, 1.49322509765625, 1.5514068603515625, 1.609588623046875, 1.6677703857421875, 1.7259521484375, 1.7841339111328125, 1.842315673828125, 1.9004974365234375, 1.95867919921875, 2.0168609619140625, 2.075042724609375, 2.1332244873046875, 2.19140625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 0.0, 10.0, 26.0, 58.0, 142.0, 236.0, 247.0, 170.0, 70.0, 30.0, 10.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.619155883789062, -25.79039192199707, -24.96162986755371, -24.13286590576172, -23.304101943969727, -22.475339889526367, -21.646575927734375, -20.817813873291016, -19.989049911499023, -19.16028594970703, -18.331523895263672, -17.50275993347168, -16.673995971679688, -15.845233917236328, -15.016469955444336, -14.18770694732666, -13.358942985534668, -12.530179977416992, -11.701416015625, -10.872653007507324, -10.043889999389648, -9.215126037597656, -8.38636302947998, -7.557600021362305, -6.728836536407471, -5.900073051452637, -5.071310043334961, -4.242546558380127, -3.413783311843872, -2.585020065307617, -1.7562565803527832, -0.9274935722351074, -0.09873008728027344, 0.7300332188606262, 1.5587965250015259, 2.3875598907470703, 3.216323137283325, 4.04508638381958, 4.873849868774414, 5.70261287689209, 6.531376361846924, 7.360139846801758, 8.188902854919434, 9.01766586303711, 9.846429824829102, 10.675192832946777, 11.503955841064453, 12.332719802856445, 13.161482810974121, 13.990245819091797, 14.819009780883789, 15.647772789001465, 16.47653579711914, 17.305299758911133, 18.134063720703125, 18.962825775146484, 19.791589736938477, 20.62035369873047, 21.449115753173828, 22.27787971496582, 23.106643676757812, 23.935405731201172, 24.764169692993164, 25.592933654785156, 26.421695709228516]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 5.0, 5.0, 4.0, 10.0, 13.0, 7.0, 21.0, 20.0, 31.0, 30.0, 48.0, 56.0, 62.0, 72.0, 72.0, 77.0, 75.0, 70.0, 57.0, 49.0, 36.0, 43.0, 27.0, 26.0, 17.0, 31.0, 20.0, 10.0, 3.0, 10.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.770374298095703, -21.159971237182617, -20.54956817626953, -19.939165115356445, -19.32876205444336, -18.718360900878906, -18.10795783996582, -17.497554779052734, -16.88715171813965, -16.276748657226562, -15.666345596313477, -15.055943489074707, -14.445540428161621, -13.835137367248535, -13.224735260009766, -12.61433219909668, -12.003929138183594, -11.393526077270508, -10.783123016357422, -10.172720909118652, -9.562317848205566, -8.95191478729248, -8.341512680053711, -7.731109619140625, -7.120706558227539, -6.510303497314453, -5.899900913238525, -5.289498329162598, -4.679095268249512, -4.068692207336426, -3.458289623260498, -2.8478870391845703, -2.2374820709228516, -1.6270792484283447, -1.016676425933838, -0.40627360343933105, 0.20412921905517578, 0.8145320415496826, 1.4249348640441895, 2.035337448120117, 2.645740509033203, 3.25614333152771, 3.866546154022217, 4.4769487380981445, 5.0873517990112305, 5.697754859924316, 6.308157444000244, 6.918560028076172, 7.528963088989258, 8.139366149902344, 8.74976921081543, 9.3601713180542, 9.970574378967285, 10.580977439880371, 11.19137954711914, 11.801782608032227, 12.412185668945312, 13.022588729858398, 13.632991790771484, 14.243393898010254, 14.85379695892334, 15.464200019836426, 16.074602127075195, 16.68500518798828, 17.295408248901367]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 3.0, 10.0, 7.0, 6.0, 17.0, 22.0, 18.0, 40.0, 56.0, 41.0, 87.0, 118.0, 156.0, 262.0, 400.0, 712.0, 1286.0, 2720.0, 6732.0, 21509.0, 151597.0, 3936943.0, 51127.0, 11907.0, 4265.0, 1871.0, 953.0, 521.0, 302.0, 177.0, 108.0, 81.0, 58.0, 46.0, 27.0, 22.0, 12.0, 17.0, 15.0, 8.0, 6.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-1.9599609375, -1.9073638916015625, -1.854766845703125, -1.8021697998046875, -1.74957275390625, -1.6969757080078125, -1.644378662109375, -1.5917816162109375, -1.5391845703125, -1.4865875244140625, -1.433990478515625, -1.3813934326171875, -1.32879638671875, -1.2761993408203125, -1.223602294921875, -1.1710052490234375, -1.118408203125, -1.0658111572265625, -1.013214111328125, -0.9606170654296875, -0.90802001953125, -0.8554229736328125, -0.802825927734375, -0.7502288818359375, -0.6976318359375, -0.6450347900390625, -0.592437744140625, -0.5398406982421875, -0.48724365234375, -0.4346466064453125, -0.382049560546875, -0.3294525146484375, -0.27685546875, -0.2242584228515625, -0.171661376953125, -0.1190643310546875, -0.06646728515625, -0.0138702392578125, 0.038726806640625, 0.0913238525390625, 0.1439208984375, 0.1965179443359375, 0.249114990234375, 0.3017120361328125, 0.35430908203125, 0.4069061279296875, 0.459503173828125, 0.5121002197265625, 0.564697265625, 0.6172943115234375, 0.669891357421875, 0.7224884033203125, 0.77508544921875, 0.8276824951171875, 0.880279541015625, 0.9328765869140625, 0.9854736328125, 1.0380706787109375, 1.090667724609375, 1.1432647705078125, 1.19586181640625, 1.2484588623046875, 1.301055908203125, 1.3536529541015625, 1.40625]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 4.0, 11.0, 7.0, 7.0, 10.0, 14.0, 41.0, 50.0, 65.0, 78.0, 128.0, 127.0, 108.0, 104.0, 78.0, 59.0, 32.0, 26.0, 17.0, 15.0, 7.0, 7.0, 4.0, 4.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0], "bins": [-1.9111328125, -1.8692169189453125, -1.827301025390625, -1.7853851318359375, -1.74346923828125, -1.7015533447265625, -1.659637451171875, -1.6177215576171875, -1.5758056640625, -1.5338897705078125, -1.491973876953125, -1.4500579833984375, -1.40814208984375, -1.3662261962890625, -1.324310302734375, -1.2823944091796875, -1.240478515625, -1.1985626220703125, -1.156646728515625, -1.1147308349609375, -1.07281494140625, -1.0308990478515625, -0.988983154296875, -0.9470672607421875, -0.9051513671875, -0.8632354736328125, -0.821319580078125, -0.7794036865234375, -0.73748779296875, -0.6955718994140625, -0.653656005859375, -0.6117401123046875, -0.56982421875, -0.5279083251953125, -0.485992431640625, -0.4440765380859375, -0.40216064453125, -0.3602447509765625, -0.318328857421875, -0.2764129638671875, -0.2344970703125, -0.1925811767578125, -0.150665283203125, -0.1087493896484375, -0.06683349609375, -0.0249176025390625, 0.016998291015625, 0.0589141845703125, 0.100830078125, 0.1427459716796875, 0.184661865234375, 0.2265777587890625, 0.26849365234375, 0.3104095458984375, 0.352325439453125, 0.3942413330078125, 0.4361572265625, 0.4780731201171875, 0.519989013671875, 0.5619049072265625, 0.60382080078125, 0.6457366943359375, 0.687652587890625, 0.7295684814453125, 0.771484375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 7.0, 5.0, 7.0, 7.0, 10.0, 16.0, 18.0, 24.0, 44.0, 45.0, 69.0, 81.0, 121.0, 148.0, 227.0, 291.0, 426.0, 642.0, 1266.0, 3460.0, 14911.0, 199065.0, 3928654.0, 34572.0, 5752.0, 1816.0, 809.0, 445.0, 346.0, 252.0, 176.0, 131.0, 104.0, 85.0, 60.0, 49.0, 38.0, 25.0, 18.0, 15.0, 9.0, 11.0, 9.0, 3.0, 2.0, 6.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.5078125, -2.42193603515625, -2.3360595703125, -2.25018310546875, -2.164306640625, -2.07843017578125, -1.9925537109375, -1.90667724609375, -1.82080078125, -1.73492431640625, -1.6490478515625, -1.56317138671875, -1.477294921875, -1.39141845703125, -1.3055419921875, -1.21966552734375, -1.1337890625, -1.04791259765625, -0.9620361328125, -0.87615966796875, -0.790283203125, -0.70440673828125, -0.6185302734375, -0.53265380859375, -0.44677734375, -0.36090087890625, -0.2750244140625, -0.18914794921875, -0.103271484375, -0.01739501953125, 0.0684814453125, 0.15435791015625, 0.240234375, 0.32611083984375, 0.4119873046875, 0.49786376953125, 0.583740234375, 0.66961669921875, 0.7554931640625, 0.84136962890625, 0.92724609375, 1.01312255859375, 1.0989990234375, 1.18487548828125, 1.270751953125, 1.35662841796875, 1.4425048828125, 1.52838134765625, 1.6142578125, 1.70013427734375, 1.7860107421875, 1.87188720703125, 1.957763671875, 2.04364013671875, 2.1295166015625, 2.21539306640625, 2.30126953125, 2.38714599609375, 2.4730224609375, 2.55889892578125, 2.644775390625, 2.73065185546875, 2.8165283203125, 2.90240478515625, 2.98828125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 11.0, 23.0, 39.0, 94.0, 355.0, 3312.0, 152.0, 51.0, 18.0, 8.0, 6.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.30859375, -1.2567138671875, -1.204833984375, -1.1529541015625, -1.10107421875, -1.0491943359375, -0.997314453125, -0.9454345703125, -0.8935546875, -0.8416748046875, -0.789794921875, -0.7379150390625, -0.68603515625, -0.6341552734375, -0.582275390625, -0.5303955078125, -0.478515625, -0.4266357421875, -0.374755859375, -0.3228759765625, -0.27099609375, -0.2191162109375, -0.167236328125, -0.1153564453125, -0.0634765625, -0.0115966796875, 0.040283203125, 0.0921630859375, 0.14404296875, 0.1959228515625, 0.247802734375, 0.2996826171875, 0.3515625, 0.4034423828125, 0.455322265625, 0.5072021484375, 0.55908203125, 0.6109619140625, 0.662841796875, 0.7147216796875, 0.7666015625, 0.8184814453125, 0.870361328125, 0.9222412109375, 0.97412109375, 1.0260009765625, 1.077880859375, 1.1297607421875, 1.181640625, 1.2335205078125, 1.285400390625, 1.3372802734375, 1.38916015625, 1.4410400390625, 1.492919921875, 1.5447998046875, 1.5966796875, 1.6485595703125, 1.700439453125, 1.7523193359375, 1.80419921875, 1.8560791015625, 1.907958984375, 1.9598388671875, 2.01171875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 6.0, 6.0, 19.0, 28.0, 56.0, 77.0, 120.0, 165.0, 184.0, 161.0, 77.0, 51.0, 24.0, 15.0, 9.0, 4.0, 6.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.152436256408691, -3.9816713333129883, -3.810906171798706, -3.640141248703003, -3.4693763256073, -3.2986111640930176, -3.1278462409973145, -2.9570813179016113, -2.786316394805908, -2.615551471710205, -2.444786310195923, -2.2740213871002197, -2.1032564640045166, -1.932491421699524, -1.7617263793945312, -1.5909614562988281, -1.420196294784546, -1.2494312524795532, -1.07866632938385, -0.9079012870788574, -0.7371363043785095, -0.5663713216781616, -0.39560627937316895, -0.22484135627746582, -0.054076313972473145, 0.11668868362903595, 0.28745368123054504, 0.45821869373321533, 0.6289836764335632, 0.7997486591339111, 0.9705137014389038, 1.141278624534607, 1.3120436668395996, 1.4828087091445923, 1.6535736322402954, 1.824338674545288, 1.9951035976409912, 2.1658687591552734, 2.3366336822509766, 2.5073986053466797, 2.678163528442383, 2.848928451538086, 3.019693613052368, 3.1904585361480713, 3.3612234592437744, 3.5319886207580566, 3.7027535438537598, 3.873518466949463, 4.044283866882324, 4.215048789978027, 4.3858137130737305, 4.556578636169434, 4.727344036102295, 4.898108959197998, 5.068873882293701, 5.239638805389404, 5.410403728485107, 5.5811686515808105, 5.751933574676514, 5.922698974609375, 6.093463897705078, 6.264228820800781, 6.434993743896484, 6.6057586669921875, 6.776523590087891]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 6.0, 3.0, 4.0, 1.0, 5.0, 11.0, 7.0, 13.0, 12.0, 23.0, 31.0, 35.0, 36.0, 48.0, 44.0, 44.0, 52.0, 49.0, 57.0, 59.0, 60.0, 51.0, 53.0, 48.0, 35.0, 40.0, 33.0, 43.0, 14.0, 20.0, 19.0, 12.0, 9.0, 7.0, 2.0, 7.0, 6.0, 4.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-3.3887202739715576, -3.2974400520324707, -3.206159830093384, -3.114879608154297, -3.023599624633789, -2.932319402694702, -2.8410391807556152, -2.7497589588165283, -2.6584787368774414, -2.5671985149383545, -2.4759182929992676, -2.3846383094787598, -2.293358087539673, -2.202077865600586, -2.110797643661499, -2.019517421722412, -1.9282374382019043, -1.8369572162628174, -1.74567711353302, -1.654396891593933, -1.5631167888641357, -1.4718365669250488, -1.380556344985962, -1.289276123046875, -1.1979960203170776, -1.1067157983779907, -1.0154356956481934, -0.9241554737091064, -0.8328753113746643, -0.7415951490402222, -0.6503149271011353, -0.5590347647666931, -0.4677543640136719, -0.37647420167922974, -0.2851940095424652, -0.19391381740570068, -0.10263365507125854, -0.011353492736816406, 0.07992672920227051, 0.17120689153671265, 0.2624870538711548, 0.3537672162055969, 0.44504740834236145, 0.536327600479126, 0.6276077628135681, 0.7188879251480103, 0.8101681470870972, 0.9014483094215393, 0.9927284717559814, 1.0840086936950684, 1.1752887964248657, 1.2665690183639526, 1.35784912109375, 1.449129343032837, 1.5404095649719238, 1.6316897869110107, 1.722969889640808, 1.814250111579895, 1.9055302143096924, 1.9968104362487793, 2.088090658187866, 2.179370880126953, 2.270650863647461, 2.361931085586548, 2.4532113075256348]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 12.0, 9.0, 13.0, 24.0, 26.0, 48.0, 105.0, 179.0, 342.0, 832.0, 2472.0, 8889.0, 45698.0, 293943.0, 552096.0, 117193.0, 19543.0, 4565.0, 1496.0, 526.0, 250.0, 125.0, 71.0, 35.0, 24.0, 16.0, 9.0, 6.0, 7.0, 5.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7626953125, -1.7024383544921875, -1.642181396484375, -1.5819244384765625, -1.52166748046875, -1.4614105224609375, -1.401153564453125, -1.3408966064453125, -1.2806396484375, -1.2203826904296875, -1.160125732421875, -1.0998687744140625, -1.03961181640625, -0.9793548583984375, -0.919097900390625, -0.8588409423828125, -0.798583984375, -0.7383270263671875, -0.678070068359375, -0.6178131103515625, -0.55755615234375, -0.4972991943359375, -0.437042236328125, -0.3767852783203125, -0.3165283203125, -0.2562713623046875, -0.196014404296875, -0.1357574462890625, -0.07550048828125, -0.0152435302734375, 0.045013427734375, 0.1052703857421875, 0.16552734375, 0.2257843017578125, 0.286041259765625, 0.3462982177734375, 0.40655517578125, 0.4668121337890625, 0.527069091796875, 0.5873260498046875, 0.6475830078125, 0.7078399658203125, 0.768096923828125, 0.8283538818359375, 0.88861083984375, 0.9488677978515625, 1.009124755859375, 1.0693817138671875, 1.129638671875, 1.1898956298828125, 1.250152587890625, 1.3104095458984375, 1.37066650390625, 1.4309234619140625, 1.491180419921875, 1.5514373779296875, 1.6116943359375, 1.6719512939453125, 1.732208251953125, 1.7924652099609375, 1.85272216796875, 1.9129791259765625, 1.973236083984375, 2.0334930419921875, 2.09375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 7.0, 4.0, 11.0, 11.0, 18.0, 19.0, 45.0, 69.0, 77.0, 95.0, 87.0, 105.0, 100.0, 82.0, 70.0, 52.0, 40.0, 38.0, 25.0, 14.0, 11.0, 7.0, 3.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.6337890625, -1.5943832397460938, -1.5549774169921875, -1.5155715942382812, -1.476165771484375, -1.4367599487304688, -1.3973541259765625, -1.3579483032226562, -1.31854248046875, -1.2791366577148438, -1.2397308349609375, -1.2003250122070312, -1.160919189453125, -1.1215133666992188, -1.0821075439453125, -1.0427017211914062, -1.0032958984375, -0.9638900756835938, -0.9244842529296875, -0.8850784301757812, -0.845672607421875, -0.8062667846679688, -0.7668609619140625, -0.7274551391601562, -0.68804931640625, -0.6486434936523438, -0.6092376708984375, -0.5698318481445312, -0.530426025390625, -0.49102020263671875, -0.4516143798828125, -0.41220855712890625, -0.372802734375, -0.33339691162109375, -0.2939910888671875, -0.25458526611328125, -0.215179443359375, -0.17577362060546875, -0.1363677978515625, -0.09696197509765625, -0.05755615234375, -0.01815032958984375, 0.0212554931640625, 0.06066131591796875, 0.100067138671875, 0.13947296142578125, 0.1788787841796875, 0.21828460693359375, 0.2576904296875, 0.29709625244140625, 0.3365020751953125, 0.37590789794921875, 0.415313720703125, 0.45471954345703125, 0.4941253662109375, 0.5335311889648438, 0.57293701171875, 0.6123428344726562, 0.6517486572265625, 0.6911544799804688, 0.730560302734375, 0.7699661254882812, 0.8093719482421875, 0.8487777709960938, 0.88818359375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 11.0, 9.0, 23.0, 30.0, 56.0, 111.0, 190.0, 466.0, 1088.0, 3779.0, 28844.0, 576589.0, 411475.0, 20935.0, 3183.0, 958.0, 397.0, 187.0, 102.0, 51.0, 33.0, 20.0, 9.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.30859375, -3.219024658203125, -3.12945556640625, -3.039886474609375, -2.9503173828125, -2.860748291015625, -2.77117919921875, -2.681610107421875, -2.592041015625, -2.502471923828125, -2.41290283203125, -2.323333740234375, -2.2337646484375, -2.144195556640625, -2.05462646484375, -1.965057373046875, -1.87548828125, -1.785919189453125, -1.69635009765625, -1.606781005859375, -1.5172119140625, -1.427642822265625, -1.33807373046875, -1.248504638671875, -1.158935546875, -1.069366455078125, -0.97979736328125, -0.890228271484375, -0.8006591796875, -0.711090087890625, -0.62152099609375, -0.531951904296875, -0.4423828125, -0.352813720703125, -0.26324462890625, -0.173675537109375, -0.0841064453125, 0.005462646484375, 0.09503173828125, 0.184600830078125, 0.274169921875, 0.363739013671875, 0.45330810546875, 0.542877197265625, 0.6324462890625, 0.722015380859375, 0.81158447265625, 0.901153564453125, 0.99072265625, 1.080291748046875, 1.16986083984375, 1.259429931640625, 1.3489990234375, 1.438568115234375, 1.52813720703125, 1.617706298828125, 1.707275390625, 1.796844482421875, 1.88641357421875, 1.975982666015625, 2.0655517578125, 2.155120849609375, 2.24468994140625, 2.334259033203125, 2.423828125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 8.0, 10.0, 13.0, 12.0, 12.0, 20.0, 17.0, 22.0, 39.0, 38.0, 54.0, 49.0, 60.0, 46.0, 59.0, 64.0, 59.0, 53.0, 64.0, 45.0, 42.0, 37.0, 43.0, 31.0, 28.0, 19.0, 10.0, 12.0, 12.0, 8.0, 7.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-4.12890625, -4.028045654296875, -3.92718505859375, -3.826324462890625, -3.7254638671875, -3.624603271484375, -3.52374267578125, -3.422882080078125, -3.322021484375, -3.221160888671875, -3.12030029296875, -3.019439697265625, -2.9185791015625, -2.817718505859375, -2.71685791015625, -2.615997314453125, -2.51513671875, -2.414276123046875, -2.31341552734375, -2.212554931640625, -2.1116943359375, -2.010833740234375, -1.90997314453125, -1.809112548828125, -1.708251953125, -1.607391357421875, -1.50653076171875, -1.405670166015625, -1.3048095703125, -1.203948974609375, -1.10308837890625, -1.002227783203125, -0.9013671875, -0.800506591796875, -0.69964599609375, -0.598785400390625, -0.4979248046875, -0.397064208984375, -0.29620361328125, -0.195343017578125, -0.094482421875, 0.006378173828125, 0.10723876953125, 0.208099365234375, 0.3089599609375, 0.409820556640625, 0.51068115234375, 0.611541748046875, 0.71240234375, 0.813262939453125, 0.91412353515625, 1.014984130859375, 1.1158447265625, 1.216705322265625, 1.31756591796875, 1.418426513671875, 1.519287109375, 1.620147705078125, 1.72100830078125, 1.821868896484375, 1.9227294921875, 2.023590087890625, 2.12445068359375, 2.225311279296875, 2.326171875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 6.0, 1.0, 5.0, 8.0, 6.0, 5.0, 16.0, 13.0, 31.0, 39.0, 54.0, 113.0, 258.0, 438.0, 1113.0, 3643.0, 20107.0, 304879.0, 666572.0, 42646.0, 5718.0, 1593.0, 608.0, 295.0, 167.0, 80.0, 38.0, 30.0, 26.0, 18.0, 8.0, 4.0, 7.0, 7.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.0048828125, -0.98046875, -0.9560546875, -0.931640625, -0.9072265625, -0.8828125, -0.8583984375, -0.833984375, -0.8095703125, -0.78515625, -0.7607421875, -0.736328125, -0.7119140625, -0.6875, -0.6630859375, -0.638671875, -0.6142578125, -0.58984375, -0.5654296875, -0.541015625, -0.5166015625, -0.4921875, -0.4677734375, -0.443359375, -0.4189453125, -0.39453125, -0.3701171875, -0.345703125, -0.3212890625, -0.296875, -0.2724609375, -0.248046875, -0.2236328125, -0.19921875, -0.1748046875, -0.150390625, -0.1259765625, -0.1015625, -0.0771484375, -0.052734375, -0.0283203125, -0.00390625, 0.0205078125, 0.044921875, 0.0693359375, 0.09375, 0.1181640625, 0.142578125, 0.1669921875, 0.19140625, 0.2158203125, 0.240234375, 0.2646484375, 0.2890625, 0.3134765625, 0.337890625, 0.3623046875, 0.38671875, 0.4111328125, 0.435546875, 0.4599609375, 0.484375, 0.5087890625, 0.533203125, 0.5576171875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 5.0, 4.0, 9.0, 23.0, 21.0, 22.0, 33.0, 51.0, 73.0, 57.0, 116.0, 110.0, 97.0, 103.0, 66.0, 61.0, 39.0, 26.0, 28.0, 24.0, 10.0, 5.0, 9.0, 3.0, 5.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.00015366077423095703, -0.0001497967168688774, -0.0001459326595067978, -0.00014206860214471817, -0.00013820454478263855, -0.00013434048742055893, -0.0001304764300584793, -0.0001266123726963997, -0.00012274831533432007, -0.00011888425797224045, -0.00011502020061016083, -0.00011115614324808121, -0.00010729208588600159, -0.00010342802852392197, -9.956397116184235e-05, -9.569991379976273e-05, -9.18358564376831e-05, -8.797179907560349e-05, -8.410774171352386e-05, -8.024368435144424e-05, -7.637962698936462e-05, -7.2515569627285e-05, -6.865151226520538e-05, -6.478745490312576e-05, -6.092339754104614e-05, -5.705934017896652e-05, -5.31952828168869e-05, -4.933122545480728e-05, -4.546716809272766e-05, -4.160311073064804e-05, -3.773905336856842e-05, -3.38749960064888e-05, -3.001093864440918e-05, -2.614688128232956e-05, -2.228282392024994e-05, -1.841876655817032e-05, -1.4554709196090698e-05, -1.0690651834011078e-05, -6.8265944719314575e-06, -2.962537109851837e-06, 9.015202522277832e-07, 4.7655776143074036e-06, 8.629634976387024e-06, 1.2493692338466644e-05, 1.6357749700546265e-05, 2.0221807062625885e-05, 2.4085864424705505e-05, 2.7949921786785126e-05, 3.1813979148864746e-05, 3.5678036510944366e-05, 3.954209387302399e-05, 4.340615123510361e-05, 4.727020859718323e-05, 5.113426595926285e-05, 5.499832332134247e-05, 5.886238068342209e-05, 6.272643804550171e-05, 6.659049540758133e-05, 7.045455276966095e-05, 7.431861013174057e-05, 7.818266749382019e-05, 8.204672485589981e-05, 8.591078221797943e-05, 8.977483958005905e-05, 9.363889694213867e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 9.0, 4.0, 10.0, 14.0, 20.0, 36.0, 65.0, 114.0, 245.0, 605.0, 1566.0, 5650.0, 36874.0, 648435.0, 328270.0, 20547.0, 3946.0, 1183.0, 487.0, 198.0, 105.0, 54.0, 47.0, 23.0, 11.0, 15.0, 10.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.97802734375, -0.9491500854492188, -0.9202728271484375, -0.8913955688476562, -0.862518310546875, -0.8336410522460938, -0.8047637939453125, -0.7758865356445312, -0.74700927734375, -0.7181320190429688, -0.6892547607421875, -0.6603775024414062, -0.631500244140625, -0.6026229858398438, -0.5737457275390625, -0.5448684692382812, -0.5159912109375, -0.48711395263671875, -0.4582366943359375, -0.42935943603515625, -0.400482177734375, -0.37160491943359375, -0.3427276611328125, -0.31385040283203125, -0.28497314453125, -0.25609588623046875, -0.2272186279296875, -0.19834136962890625, -0.169464111328125, -0.14058685302734375, -0.1117095947265625, -0.08283233642578125, -0.053955078125, -0.02507781982421875, 0.0037994384765625, 0.03267669677734375, 0.061553955078125, 0.09043121337890625, 0.1193084716796875, 0.14818572998046875, 0.17706298828125, 0.20594024658203125, 0.2348175048828125, 0.26369476318359375, 0.292572021484375, 0.32144927978515625, 0.3503265380859375, 0.37920379638671875, 0.4080810546875, 0.43695831298828125, 0.4658355712890625, 0.49471282958984375, 0.523590087890625, 0.5524673461914062, 0.5813446044921875, 0.6102218627929688, 0.63909912109375, 0.6679763793945312, 0.6968536376953125, 0.7257308959960938, 0.754608154296875, 0.7834854125976562, 0.8123626708984375, 0.8412399291992188, 0.8701171875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 4.0, 3.0, 3.0, 7.0, 8.0, 12.0, 10.0, 22.0, 34.0, 25.0, 39.0, 48.0, 50.0, 88.0, 74.0, 86.0, 99.0, 80.0, 68.0, 50.0, 53.0, 47.0, 29.0, 17.0, 15.0, 13.0, 3.0, 6.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.8037109375, -0.7822647094726562, -0.7608184814453125, -0.7393722534179688, -0.717926025390625, -0.6964797973632812, -0.6750335693359375, -0.6535873413085938, -0.63214111328125, -0.6106948852539062, -0.5892486572265625, -0.5678024291992188, -0.546356201171875, -0.5249099731445312, -0.5034637451171875, -0.48201751708984375, -0.4605712890625, -0.43912506103515625, -0.4176788330078125, -0.39623260498046875, -0.374786376953125, -0.35334014892578125, -0.3318939208984375, -0.31044769287109375, -0.28900146484375, -0.26755523681640625, -0.2461090087890625, -0.22466278076171875, -0.203216552734375, -0.18177032470703125, -0.1603240966796875, -0.13887786865234375, -0.117431640625, -0.09598541259765625, -0.0745391845703125, -0.05309295654296875, -0.031646728515625, -0.01020050048828125, 0.0112457275390625, 0.03269195556640625, 0.05413818359375, 0.07558441162109375, 0.0970306396484375, 0.11847686767578125, 0.139923095703125, 0.16136932373046875, 0.1828155517578125, 0.20426177978515625, 0.2257080078125, 0.24715423583984375, 0.2686004638671875, 0.29004669189453125, 0.311492919921875, 0.33293914794921875, 0.3543853759765625, 0.37583160400390625, 0.39727783203125, 0.41872406005859375, 0.4401702880859375, 0.46161651611328125, 0.483062744140625, 0.5045089721679688, 0.5259552001953125, 0.5474014282226562, 0.56884765625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 7.0, 24.0, 55.0, 143.0, 266.0, 232.0, 148.0, 78.0, 35.0, 14.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.696379661560059, -11.946297645568848, -11.196216583251953, -10.446134567260742, -9.696052551269531, -8.94597053527832, -8.195889472961426, -7.445807456970215, -6.695725917816162, -5.945644378662109, -5.195562362670898, -4.445480823516846, -3.695399045944214, -2.945317268371582, -2.1952357292175293, -1.4451537132263184, -0.6950721740722656, 0.055009543895721436, 0.8050912618637085, 1.5551729202270508, 2.3052546977996826, 3.0553364753723145, 3.805418014526367, 4.555500030517578, 5.305581569671631, 6.055663108825684, 6.8057451248168945, 7.555826663970947, 8.305908203125, 9.055990219116211, 9.806072235107422, 10.556154251098633, 11.306234359741211, 12.056316375732422, 12.806397438049316, 13.556479454040527, 14.306561470031738, 15.056642532348633, 15.806724548339844, 16.556806564331055, 17.306888580322266, 18.056970596313477, 18.807052612304688, 19.557132720947266, 20.307214736938477, 21.057296752929688, 21.8073787689209, 22.55746078491211, 23.307540893554688, 24.0576229095459, 24.80770492553711, 25.557785034179688, 26.3078670501709, 27.05794906616211, 27.80803108215332, 28.55811309814453, 29.308195114135742, 30.058277130126953, 30.808359146118164, 31.558441162109375, 32.30852127075195, 33.0586051940918, 33.808685302734375, 34.55876922607422, 35.3088493347168]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 1.0, 11.0, 15.0, 12.0, 24.0, 20.0, 32.0, 38.0, 43.0, 52.0, 52.0, 63.0, 71.0, 63.0, 85.0, 60.0, 49.0, 52.0, 35.0, 49.0, 29.0, 25.0, 27.0, 28.0, 14.0, 12.0, 6.0, 5.0, 10.0, 7.0, 6.0, 4.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.054407119750977, -13.55333137512207, -13.052255630493164, -12.551179885864258, -12.050104141235352, -11.549028396606445, -11.047952651977539, -10.546876907348633, -10.045801162719727, -9.54472541809082, -9.043649673461914, -8.542573928833008, -8.041498184204102, -7.540422439575195, -7.039346694946289, -6.538270950317383, -6.037195205688477, -5.53611946105957, -5.035043716430664, -4.533967971801758, -4.032892227172852, -3.5318164825439453, -3.030740737915039, -2.529664993286133, -2.0285892486572266, -1.5275135040283203, -1.026437759399414, -0.5253620147705078, -0.024286270141601562, 0.4767894744873047, 0.9778652191162109, 1.4789409637451172, 1.9800148010253906, 2.481090545654297, 2.982166290283203, 3.4832420349121094, 3.9843177795410156, 4.485393524169922, 4.986469268798828, 5.487545013427734, 5.988620758056641, 6.489696502685547, 6.990772247314453, 7.491847991943359, 7.992923736572266, 8.493999481201172, 8.995075225830078, 9.496150970458984, 9.99722671508789, 10.498302459716797, 10.999378204345703, 11.50045394897461, 12.001529693603516, 12.502605438232422, 13.003681182861328, 13.504756927490234, 14.00583267211914, 14.506908416748047, 15.007984161376953, 15.50905990600586, 16.010135650634766, 16.511211395263672, 17.012287139892578, 17.513362884521484, 18.01443862915039]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 8.0, 11.0, 10.0, 12.0, 18.0, 19.0, 37.0, 50.0, 77.0, 124.0, 168.0, 259.0, 389.0, 652.0, 1178.0, 2065.0, 3675.0, 7618.0, 16978.0, 45377.0, 184570.0, 1886594.0, 1791380.0, 175690.0, 44730.0, 16656.0, 7203.0, 3677.0, 1982.0, 1171.0, 682.0, 412.0, 276.0, 182.0, 111.0, 73.0, 70.0, 39.0, 17.0, 13.0, 11.0, 7.0, 6.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.7802734375, -0.7558822631835938, -0.7314910888671875, -0.7070999145507812, -0.682708740234375, -0.6583175659179688, -0.6339263916015625, -0.6095352172851562, -0.58514404296875, -0.5607528686523438, -0.5363616943359375, -0.5119705200195312, -0.487579345703125, -0.46318817138671875, -0.4387969970703125, -0.41440582275390625, -0.3900146484375, -0.36562347412109375, -0.3412322998046875, -0.31684112548828125, -0.292449951171875, -0.26805877685546875, -0.2436676025390625, -0.21927642822265625, -0.19488525390625, -0.17049407958984375, -0.1461029052734375, -0.12171173095703125, -0.097320556640625, -0.07292938232421875, -0.0485382080078125, -0.02414703369140625, 0.000244140625, 0.02463531494140625, 0.0490264892578125, 0.07341766357421875, 0.097808837890625, 0.12220001220703125, 0.1465911865234375, 0.17098236083984375, 0.19537353515625, 0.21976470947265625, 0.2441558837890625, 0.26854705810546875, 0.292938232421875, 0.31732940673828125, 0.3417205810546875, 0.36611175537109375, 0.3905029296875, 0.41489410400390625, 0.4392852783203125, 0.46367645263671875, 0.488067626953125, 0.5124588012695312, 0.5368499755859375, 0.5612411499023438, 0.58563232421875, 0.6100234985351562, 0.6344146728515625, 0.6588058471679688, 0.683197021484375, 0.7075881958007812, 0.7319793701171875, 0.7563705444335938, 0.78076171875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 4.0, 7.0, 8.0, 19.0, 16.0, 22.0, 30.0, 36.0, 52.0, 61.0, 54.0, 46.0, 56.0, 74.0, 79.0, 65.0, 56.0, 57.0, 40.0, 38.0, 39.0, 30.0, 23.0, 20.0, 18.0, 9.0, 15.0, 6.0, 6.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.81982421875, -0.795806884765625, -0.77178955078125, -0.747772216796875, -0.7237548828125, -0.699737548828125, -0.67572021484375, -0.651702880859375, -0.627685546875, -0.603668212890625, -0.57965087890625, -0.555633544921875, -0.5316162109375, -0.507598876953125, -0.48358154296875, -0.459564208984375, -0.435546875, -0.411529541015625, -0.38751220703125, -0.363494873046875, -0.3394775390625, -0.315460205078125, -0.29144287109375, -0.267425537109375, -0.243408203125, -0.219390869140625, -0.19537353515625, -0.171356201171875, -0.1473388671875, -0.123321533203125, -0.09930419921875, -0.075286865234375, -0.05126953125, -0.027252197265625, -0.00323486328125, 0.020782470703125, 0.0447998046875, 0.068817138671875, 0.09283447265625, 0.116851806640625, 0.140869140625, 0.164886474609375, 0.18890380859375, 0.212921142578125, 0.2369384765625, 0.260955810546875, 0.28497314453125, 0.308990478515625, 0.3330078125, 0.357025146484375, 0.38104248046875, 0.405059814453125, 0.4290771484375, 0.453094482421875, 0.47711181640625, 0.501129150390625, 0.525146484375, 0.549163818359375, 0.57318115234375, 0.597198486328125, 0.6212158203125, 0.645233154296875, 0.66925048828125, 0.693267822265625, 0.71728515625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 1.0, 2.0, 3.0, 4.0, 16.0, 14.0, 26.0, 42.0, 82.0, 157.0, 389.0, 951.0, 3535.0, 21453.0, 867836.0, 3260075.0, 33426.0, 4448.0, 1106.0, 352.0, 148.0, 70.0, 54.0, 24.0, 23.0, 19.0, 8.0, 6.0, 5.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.697265625, -2.61322021484375, -2.5291748046875, -2.44512939453125, -2.361083984375, -2.27703857421875, -2.1929931640625, -2.10894775390625, -2.02490234375, -1.94085693359375, -1.8568115234375, -1.77276611328125, -1.688720703125, -1.60467529296875, -1.5206298828125, -1.43658447265625, -1.3525390625, -1.26849365234375, -1.1844482421875, -1.10040283203125, -1.016357421875, -0.93231201171875, -0.8482666015625, -0.76422119140625, -0.68017578125, -0.59613037109375, -0.5120849609375, -0.42803955078125, -0.343994140625, -0.25994873046875, -0.1759033203125, -0.09185791015625, -0.0078125, 0.07623291015625, 0.1602783203125, 0.24432373046875, 0.328369140625, 0.41241455078125, 0.4964599609375, 0.58050537109375, 0.66455078125, 0.74859619140625, 0.8326416015625, 0.91668701171875, 1.000732421875, 1.08477783203125, 1.1688232421875, 1.25286865234375, 1.3369140625, 1.42095947265625, 1.5050048828125, 1.58905029296875, 1.673095703125, 1.75714111328125, 1.8411865234375, 1.92523193359375, 2.00927734375, 2.09332275390625, 2.1773681640625, 2.26141357421875, 2.345458984375, 2.42950439453125, 2.5135498046875, 2.59759521484375, 2.681640625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 4.0, 1.0, 12.0, 4.0, 12.0, 6.0, 10.0, 11.0, 15.0, 25.0, 43.0, 45.0, 98.0, 197.0, 432.0, 1009.0, 1057.0, 511.0, 215.0, 129.0, 70.0, 45.0, 28.0, 31.0, 14.0, 14.0, 5.0, 3.0, 7.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.796875, -1.74700927734375, -1.6971435546875, -1.64727783203125, -1.597412109375, -1.54754638671875, -1.4976806640625, -1.44781494140625, -1.39794921875, -1.34808349609375, -1.2982177734375, -1.24835205078125, -1.198486328125, -1.14862060546875, -1.0987548828125, -1.04888916015625, -0.9990234375, -0.94915771484375, -0.8992919921875, -0.84942626953125, -0.799560546875, -0.74969482421875, -0.6998291015625, -0.64996337890625, -0.60009765625, -0.55023193359375, -0.5003662109375, -0.45050048828125, -0.400634765625, -0.35076904296875, -0.3009033203125, -0.25103759765625, -0.201171875, -0.15130615234375, -0.1014404296875, -0.05157470703125, -0.001708984375, 0.04815673828125, 0.0980224609375, 0.14788818359375, 0.19775390625, 0.24761962890625, 0.2974853515625, 0.34735107421875, 0.397216796875, 0.44708251953125, 0.4969482421875, 0.54681396484375, 0.5966796875, 0.64654541015625, 0.6964111328125, 0.74627685546875, 0.796142578125, 0.84600830078125, 0.8958740234375, 0.94573974609375, 0.99560546875, 1.04547119140625, 1.0953369140625, 1.14520263671875, 1.195068359375, 1.24493408203125, 1.2947998046875, 1.34466552734375, 1.39453125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 6.0, 12.0, 24.0, 48.0, 94.0, 128.0, 203.0, 175.0, 133.0, 79.0, 39.0, 19.0, 14.0, 10.0, 1.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.686397552490234, -13.26620864868164, -12.846019744873047, -12.42583179473877, -12.005642890930176, -11.585453987121582, -11.165266036987305, -10.745077133178711, -10.324888229370117, -9.904699325561523, -9.48451042175293, -9.064322471618652, -8.644133567810059, -8.223944664001465, -7.803756237030029, -7.383567810058594, -6.96337890625, -6.543190002441406, -6.123001575469971, -5.702813148498535, -5.282624244689941, -4.862435340881348, -4.442246913909912, -4.022058486938477, -3.601869583129883, -3.181680917739868, -2.7614922523498535, -2.341303586959839, -1.9211149215698242, -1.5009262561798096, -1.080737590789795, -0.6605489253997803, -0.24036026000976562, 0.17982840538024902, 0.6000170707702637, 1.0202057361602783, 1.440394401550293, 1.8605830669403076, 2.2807717323303223, 2.700960397720337, 3.1211490631103516, 3.541337728500366, 3.961526393890381, 4.381714820861816, 4.80190372467041, 5.222092628479004, 5.6422810554504395, 6.062469482421875, 6.482658386230469, 6.9028472900390625, 7.323035717010498, 7.743224143981934, 8.163413047790527, 8.583601951599121, 9.003789901733398, 9.423978805541992, 9.844167709350586, 10.26435661315918, 10.684545516967773, 11.10473346710205, 11.524922370910645, 11.945111274719238, 12.365299224853516, 12.78548812866211, 13.205677032470703]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 6.0, 5.0, 9.0, 11.0, 16.0, 20.0, 21.0, 22.0, 41.0, 42.0, 45.0, 42.0, 43.0, 52.0, 52.0, 63.0, 68.0, 46.0, 51.0, 52.0, 48.0, 49.0, 36.0, 36.0, 27.0, 26.0, 18.0, 13.0, 18.0, 9.0, 7.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.923761367797852, -6.668846607208252, -6.413931846618652, -6.159017086029053, -5.904102325439453, -5.649187088012695, -5.394272327423096, -5.139357566833496, -4.8844428062438965, -4.629528045654297, -4.374613285064697, -4.119698524475098, -3.864783525466919, -3.6098687648773193, -3.3549537658691406, -3.100039005279541, -2.8451242446899414, -2.590209484100342, -2.335294723510742, -2.0803797245025635, -1.8254649639129639, -1.5705502033233643, -1.315635323524475, -1.060720443725586, -0.8058056831359863, -0.5508908629417419, -0.29597604274749756, -0.041061222553253174, 0.2138535976409912, 0.4687683582305908, 0.72368323802948, 0.9785981178283691, 1.2335128784179688, 1.4884276390075684, 1.7433425188064575, 1.9982573986053467, 2.2531721591949463, 2.508086919784546, 2.7630019187927246, 3.017916679382324, 3.272831439971924, 3.5277462005615234, 3.782660961151123, 4.037575721740723, 4.2924909591674805, 4.547405242919922, 4.80232048034668, 5.057235240936279, 5.312150001525879, 5.5670647621154785, 5.821979522705078, 6.076894283294678, 6.331809043884277, 6.586724281311035, 6.841639041900635, 7.096553802490234, 7.351468563079834, 7.606383323669434, 7.861298084259033, 8.116212844848633, 8.37112808227539, 8.626042366027832, 8.88095760345459, 9.135871887207031, 9.390787124633789]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 4.0, 11.0, 11.0, 26.0, 32.0, 45.0, 64.0, 101.0, 155.0, 228.0, 309.0, 638.0, 992.0, 1763.0, 3229.0, 5974.0, 11640.0, 23967.0, 49854.0, 104586.0, 200588.0, 267857.0, 188762.0, 95788.0, 46253.0, 22060.0, 10733.0, 5614.0, 2996.0, 1667.0, 981.0, 584.0, 383.0, 223.0, 143.0, 96.0, 73.0, 40.0, 18.0, 15.0, 11.0, 15.0, 5.0, 2.0, 5.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.64990234375, -0.6285552978515625, -0.607208251953125, -0.5858612060546875, -0.56451416015625, -0.5431671142578125, -0.521820068359375, -0.5004730224609375, -0.4791259765625, -0.4577789306640625, -0.436431884765625, -0.4150848388671875, -0.39373779296875, -0.3723907470703125, -0.351043701171875, -0.3296966552734375, -0.308349609375, -0.2870025634765625, -0.265655517578125, -0.2443084716796875, -0.22296142578125, -0.2016143798828125, -0.180267333984375, -0.1589202880859375, -0.1375732421875, -0.1162261962890625, -0.094879150390625, -0.0735321044921875, -0.05218505859375, -0.0308380126953125, -0.009490966796875, 0.0118560791015625, 0.033203125, 0.0545501708984375, 0.075897216796875, 0.0972442626953125, 0.11859130859375, 0.1399383544921875, 0.161285400390625, 0.1826324462890625, 0.2039794921875, 0.2253265380859375, 0.246673583984375, 0.2680206298828125, 0.28936767578125, 0.3107147216796875, 0.332061767578125, 0.3534088134765625, 0.374755859375, 0.3961029052734375, 0.417449951171875, 0.4387969970703125, 0.46014404296875, 0.4814910888671875, 0.502838134765625, 0.5241851806640625, 0.5455322265625, 0.5668792724609375, 0.588226318359375, 0.6095733642578125, 0.63092041015625, 0.6522674560546875, 0.673614501953125, 0.6949615478515625, 0.71630859375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 5.0, 6.0, 12.0, 16.0, 24.0, 25.0, 30.0, 32.0, 42.0, 55.0, 41.0, 63.0, 62.0, 68.0, 76.0, 63.0, 59.0, 35.0, 54.0, 51.0, 29.0, 45.0, 22.0, 16.0, 17.0, 19.0, 4.0, 6.0, 10.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.82080078125, -0.7968368530273438, -0.7728729248046875, -0.7489089965820312, -0.724945068359375, -0.7009811401367188, -0.6770172119140625, -0.6530532836914062, -0.62908935546875, -0.6051254272460938, -0.5811614990234375, -0.5571975708007812, -0.533233642578125, -0.5092697143554688, -0.4853057861328125, -0.46134185791015625, -0.4373779296875, -0.41341400146484375, -0.3894500732421875, -0.36548614501953125, -0.341522216796875, -0.31755828857421875, -0.2935943603515625, -0.26963043212890625, -0.24566650390625, -0.22170257568359375, -0.1977386474609375, -0.17377471923828125, -0.149810791015625, -0.12584686279296875, -0.1018829345703125, -0.07791900634765625, -0.053955078125, -0.02999114990234375, -0.0060272216796875, 0.01793670654296875, 0.041900634765625, 0.06586456298828125, 0.0898284912109375, 0.11379241943359375, 0.13775634765625, 0.16172027587890625, 0.1856842041015625, 0.20964813232421875, 0.233612060546875, 0.25757598876953125, 0.2815399169921875, 0.30550384521484375, 0.3294677734375, 0.35343170166015625, 0.3773956298828125, 0.40135955810546875, 0.425323486328125, 0.44928741455078125, 0.4732513427734375, 0.49721527099609375, 0.52117919921875, 0.5451431274414062, 0.5691070556640625, 0.5930709838867188, 0.617034912109375, 0.6409988403320312, 0.6649627685546875, 0.6889266967773438, 0.712890625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 5.0, 3.0, 2.0, 4.0, 9.0, 15.0, 25.0, 29.0, 47.0, 79.0, 87.0, 169.0, 311.0, 457.0, 787.0, 1573.0, 3886.0, 15553.0, 120541.0, 696567.0, 178575.0, 21051.0, 4771.0, 1847.0, 880.0, 502.0, 299.0, 172.0, 101.0, 57.0, 50.0, 39.0, 17.0, 14.0, 10.0, 5.0, 7.0, 7.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4521484375, -1.399505615234375, -1.34686279296875, -1.294219970703125, -1.2415771484375, -1.188934326171875, -1.13629150390625, -1.083648681640625, -1.031005859375, -0.978363037109375, -0.92572021484375, -0.873077392578125, -0.8204345703125, -0.767791748046875, -0.71514892578125, -0.662506103515625, -0.60986328125, -0.557220458984375, -0.50457763671875, -0.451934814453125, -0.3992919921875, -0.346649169921875, -0.29400634765625, -0.241363525390625, -0.188720703125, -0.136077880859375, -0.08343505859375, -0.030792236328125, 0.0218505859375, 0.074493408203125, 0.12713623046875, 0.179779052734375, 0.232421875, 0.285064697265625, 0.33770751953125, 0.390350341796875, 0.4429931640625, 0.495635986328125, 0.54827880859375, 0.600921630859375, 0.653564453125, 0.706207275390625, 0.75885009765625, 0.811492919921875, 0.8641357421875, 0.916778564453125, 0.96942138671875, 1.022064208984375, 1.07470703125, 1.127349853515625, 1.17999267578125, 1.232635498046875, 1.2852783203125, 1.337921142578125, 1.39056396484375, 1.443206787109375, 1.495849609375, 1.548492431640625, 1.60113525390625, 1.653778076171875, 1.7064208984375, 1.759063720703125, 1.81170654296875, 1.864349365234375, 1.9169921875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 5.0, 2.0, 4.0, 8.0, 9.0, 11.0, 17.0, 17.0, 15.0, 14.0, 24.0, 19.0, 24.0, 21.0, 39.0, 26.0, 46.0, 37.0, 43.0, 52.0, 42.0, 47.0, 45.0, 42.0, 39.0, 44.0, 42.0, 31.0, 33.0, 36.0, 26.0, 25.0, 18.0, 19.0, 29.0, 13.0, 9.0, 11.0, 5.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.0859375, -2.021209716796875, -1.95648193359375, -1.891754150390625, -1.8270263671875, -1.762298583984375, -1.69757080078125, -1.632843017578125, -1.568115234375, -1.503387451171875, -1.43865966796875, -1.373931884765625, -1.3092041015625, -1.244476318359375, -1.17974853515625, -1.115020751953125, -1.05029296875, -0.985565185546875, -0.92083740234375, -0.856109619140625, -0.7913818359375, -0.726654052734375, -0.66192626953125, -0.597198486328125, -0.532470703125, -0.467742919921875, -0.40301513671875, -0.338287353515625, -0.2735595703125, -0.208831787109375, -0.14410400390625, -0.079376220703125, -0.0146484375, 0.050079345703125, 0.11480712890625, 0.179534912109375, 0.2442626953125, 0.308990478515625, 0.37371826171875, 0.438446044921875, 0.503173828125, 0.567901611328125, 0.63262939453125, 0.697357177734375, 0.7620849609375, 0.826812744140625, 0.89154052734375, 0.956268310546875, 1.02099609375, 1.085723876953125, 1.15045166015625, 1.215179443359375, 1.2799072265625, 1.344635009765625, 1.40936279296875, 1.474090576171875, 1.538818359375, 1.603546142578125, 1.66827392578125, 1.733001708984375, 1.7977294921875, 1.862457275390625, 1.92718505859375, 1.991912841796875, 2.056640625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 7.0, 7.0, 7.0, 6.0, 9.0, 18.0, 33.0, 31.0, 47.0, 87.0, 147.0, 280.0, 492.0, 1145.0, 3215.0, 13427.0, 140813.0, 798159.0, 76683.0, 9281.0, 2556.0, 959.0, 495.0, 239.0, 137.0, 82.0, 53.0, 38.0, 24.0, 19.0, 17.0, 11.0, 7.0, 7.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.7060546875, -0.6828231811523438, -0.6595916748046875, -0.6363601684570312, -0.613128662109375, -0.5898971557617188, -0.5666656494140625, -0.5434341430664062, -0.52020263671875, -0.49697113037109375, -0.4737396240234375, -0.45050811767578125, -0.427276611328125, -0.40404510498046875, -0.3808135986328125, -0.35758209228515625, -0.3343505859375, -0.31111907958984375, -0.2878875732421875, -0.26465606689453125, -0.241424560546875, -0.21819305419921875, -0.1949615478515625, -0.17173004150390625, -0.14849853515625, -0.12526702880859375, -0.1020355224609375, -0.07880401611328125, -0.055572509765625, -0.03234100341796875, -0.0091094970703125, 0.01412200927734375, 0.037353515625, 0.06058502197265625, 0.0838165283203125, 0.10704803466796875, 0.130279541015625, 0.15351104736328125, 0.1767425537109375, 0.19997406005859375, 0.22320556640625, 0.24643707275390625, 0.2696685791015625, 0.29290008544921875, 0.316131591796875, 0.33936309814453125, 0.3625946044921875, 0.38582611083984375, 0.4090576171875, 0.43228912353515625, 0.4555206298828125, 0.47875213623046875, 0.501983642578125, 0.5252151489257812, 0.5484466552734375, 0.5716781616210938, 0.59490966796875, 0.6181411743164062, 0.6413726806640625, 0.6646041870117188, 0.687835693359375, 0.7110671997070312, 0.7342987060546875, 0.7575302124023438, 0.78076171875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 2.0, 6.0, 2.0, 7.0, 10.0, 20.0, 32.0, 30.0, 57.0, 86.0, 107.0, 139.0, 140.0, 105.0, 71.0, 58.0, 46.0, 24.0, 22.0, 14.0, 11.0, 6.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00016045570373535156, -0.0001554153859615326, -0.00015037506818771362, -0.00014533475041389465, -0.00014029443264007568, -0.00013525411486625671, -0.00013021379709243774, -0.00012517347931861877, -0.0001201331615447998, -0.00011509284377098083, -0.00011005252599716187, -0.0001050122082233429, -9.997189044952393e-05, -9.493157267570496e-05, -8.989125490188599e-05, -8.485093712806702e-05, -7.981061935424805e-05, -7.477030158042908e-05, -6.972998380661011e-05, -6.468966603279114e-05, -5.964934825897217e-05, -5.46090304851532e-05, -4.956871271133423e-05, -4.452839493751526e-05, -3.948807716369629e-05, -3.444775938987732e-05, -2.940744161605835e-05, -2.436712384223938e-05, -1.932680606842041e-05, -1.428648829460144e-05, -9.24617052078247e-06, -4.205852746963501e-06, 8.344650268554688e-07, 5.8747828006744385e-06, 1.0915100574493408e-05, 1.5955418348312378e-05, 2.0995736122131348e-05, 2.6036053895950317e-05, 3.107637166976929e-05, 3.611668944358826e-05, 4.1157007217407227e-05, 4.6197324991226196e-05, 5.1237642765045166e-05, 5.6277960538864136e-05, 6.13182783126831e-05, 6.635859608650208e-05, 7.139891386032104e-05, 7.643923163414001e-05, 8.147954940795898e-05, 8.651986718177795e-05, 9.156018495559692e-05, 9.66005027294159e-05, 0.00010164082050323486, 0.00010668113827705383, 0.0001117214560508728, 0.00011676177382469177, 0.00012180209159851074, 0.0001268424093723297, 0.00013188272714614868, 0.00013692304491996765, 0.00014196336269378662, 0.0001470036804676056, 0.00015204399824142456, 0.00015708431601524353, 0.0001621246337890625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 4.0, 4.0, 4.0, 6.0, 6.0, 8.0, 15.0, 20.0, 30.0, 60.0, 97.0, 195.0, 400.0, 992.0, 2995.0, 14116.0, 168068.0, 783142.0, 67098.0, 7829.0, 2049.0, 762.0, 297.0, 132.0, 74.0, 41.0, 33.0, 25.0, 20.0, 9.0, 6.0, 5.0, 6.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.91357421875, -0.8884353637695312, -0.8632965087890625, -0.8381576538085938, -0.813018798828125, -0.7878799438476562, -0.7627410888671875, -0.7376022338867188, -0.71246337890625, -0.6873245239257812, -0.6621856689453125, -0.6370468139648438, -0.611907958984375, -0.5867691040039062, -0.5616302490234375, -0.5364913940429688, -0.5113525390625, -0.48621368408203125, -0.4610748291015625, -0.43593597412109375, -0.410797119140625, -0.38565826416015625, -0.3605194091796875, -0.33538055419921875, -0.31024169921875, -0.28510284423828125, -0.2599639892578125, -0.23482513427734375, -0.209686279296875, -0.18454742431640625, -0.1594085693359375, -0.13426971435546875, -0.109130859375, -0.08399200439453125, -0.0588531494140625, -0.03371429443359375, -0.008575439453125, 0.01656341552734375, 0.0417022705078125, 0.06684112548828125, 0.09197998046875, 0.11711883544921875, 0.1422576904296875, 0.16739654541015625, 0.192535400390625, 0.21767425537109375, 0.2428131103515625, 0.26795196533203125, 0.2930908203125, 0.31822967529296875, 0.3433685302734375, 0.36850738525390625, 0.393646240234375, 0.41878509521484375, 0.4439239501953125, 0.46906280517578125, 0.49420166015625, 0.5193405151367188, 0.5444793701171875, 0.5696182250976562, 0.594757080078125, 0.6198959350585938, 0.6450347900390625, 0.6701736450195312, 0.6953125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 6.0, 7.0, 6.0, 12.0, 19.0, 20.0, 36.0, 34.0, 54.0, 45.0, 62.0, 71.0, 90.0, 103.0, 74.0, 87.0, 58.0, 47.0, 50.0, 26.0, 19.0, 26.0, 13.0, 11.0, 5.0, 7.0, 1.0, 4.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.74169921875, -0.7213058471679688, -0.7009124755859375, -0.6805191040039062, -0.660125732421875, -0.6397323608398438, -0.6193389892578125, -0.5989456176757812, -0.57855224609375, -0.5581588745117188, -0.5377655029296875, -0.5173721313476562, -0.496978759765625, -0.47658538818359375, -0.4561920166015625, -0.43579864501953125, -0.4154052734375, -0.39501190185546875, -0.3746185302734375, -0.35422515869140625, -0.333831787109375, -0.31343841552734375, -0.2930450439453125, -0.27265167236328125, -0.25225830078125, -0.23186492919921875, -0.2114715576171875, -0.19107818603515625, -0.170684814453125, -0.15029144287109375, -0.1298980712890625, -0.10950469970703125, -0.089111328125, -0.06871795654296875, -0.0483245849609375, -0.02793121337890625, -0.007537841796875, 0.01285552978515625, 0.0332489013671875, 0.05364227294921875, 0.07403564453125, 0.09442901611328125, 0.1148223876953125, 0.13521575927734375, 0.155609130859375, 0.17600250244140625, 0.1963958740234375, 0.21678924560546875, 0.2371826171875, 0.25757598876953125, 0.2779693603515625, 0.29836273193359375, 0.318756103515625, 0.33914947509765625, 0.3595428466796875, 0.37993621826171875, 0.40032958984375, 0.42072296142578125, 0.4411163330078125, 0.46150970458984375, 0.481903076171875, 0.5022964477539062, 0.5226898193359375, 0.5430831909179688, 0.5634765625]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 3.0, 1.0, 8.0, 19.0, 81.0, 267.0, 394.0, 186.0, 36.0, 9.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.449127197265625, -26.548717498779297, -25.64830780029297, -24.74789810180664, -23.847488403320312, -22.947078704833984, -22.046667098999023, -21.146257400512695, -20.245847702026367, -19.34543800354004, -18.44502830505371, -17.544618606567383, -16.644207000732422, -15.74379825592041, -14.843387603759766, -13.942977905273438, -13.04256820678711, -12.142158508300781, -11.241748809814453, -10.341338157653809, -9.44092845916748, -8.540518760681152, -7.640108585357666, -6.73969841003418, -5.839288711547852, -4.938879013061523, -4.038468837738037, -3.13805890083313, -2.2376489639282227, -1.3372392654418945, -0.4368290901184082, 0.4635810852050781, 1.3639888763427734, 2.2643988132476807, 3.164808750152588, 4.065218925476074, 4.965628623962402, 5.8660383224487305, 6.766448497772217, 7.666858673095703, 8.567268371582031, 9.46767807006836, 10.368087768554688, 11.268498420715332, 12.16890811920166, 13.069317817687988, 13.969728469848633, 14.870138168334961, 15.770547866821289, 16.670957565307617, 17.571367263793945, 18.471776962280273, 19.372188568115234, 20.272598266601562, 21.17300796508789, 22.07341766357422, 22.973827362060547, 23.874237060546875, 24.774646759033203, 25.67505645751953, 26.57546615600586, 27.475875854492188, 28.37628746032715, 29.276697158813477, 30.177106857299805]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 5.0, 6.0, 7.0, 11.0, 15.0, 14.0, 29.0, 30.0, 34.0, 39.0, 54.0, 64.0, 55.0, 68.0, 82.0, 82.0, 59.0, 61.0, 55.0, 56.0, 39.0, 25.0, 25.0, 21.0, 18.0, 18.0, 13.0, 9.0, 4.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.986358642578125, -11.588202476501465, -11.190046310424805, -10.791890144348145, -10.393733978271484, -9.995576858520508, -9.597420692443848, -9.199264526367188, -8.801108360290527, -8.402952194213867, -8.004796028137207, -7.606639385223389, -7.2084832191467285, -6.810327053070068, -6.41217041015625, -6.01401424407959, -5.61585807800293, -5.2177019119262695, -4.819545745849609, -4.421389102935791, -4.023232936859131, -3.6250767707824707, -3.2269203662872314, -2.828763961791992, -2.430607795715332, -2.032451629638672, -1.6342952251434326, -1.236138939857483, -0.8379826545715332, -0.4398263692855835, -0.04167008399963379, 0.35648632049560547, 0.7546424865722656, 1.1527987718582153, 1.550955057144165, 1.9491113424301147, 2.3472676277160645, 2.7454237937927246, 3.143580198287964, 3.541736602783203, 3.9398927688598633, 4.338048934936523, 4.736205101013184, 5.134361743927002, 5.532517910003662, 5.930674076080322, 6.328830718994141, 6.726986885070801, 7.125143051147461, 7.523299217224121, 7.921455383300781, 8.319611549377441, 8.717767715454102, 9.115924835205078, 9.514081001281738, 9.912237167358398, 10.310393333435059, 10.708549499511719, 11.106705665588379, 11.504861831665039, 11.903018951416016, 12.301175117492676, 12.699331283569336, 13.097487449645996, 13.495643615722656]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 3.0, 4.0, 4.0, 10.0, 12.0, 15.0, 22.0, 34.0, 41.0, 77.0, 100.0, 168.0, 412.0, 1442.0, 9941.0, 1197001.0, 2969394.0, 13019.0, 1610.0, 449.0, 178.0, 114.0, 69.0, 44.0, 35.0, 20.0, 18.0, 13.0, 12.0, 9.0, 1.0, 2.0, 7.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.123046875, -3.033935546875, -2.94482421875, -2.855712890625, -2.7666015625, -2.677490234375, -2.58837890625, -2.499267578125, -2.41015625, -2.321044921875, -2.23193359375, -2.142822265625, -2.0537109375, -1.964599609375, -1.87548828125, -1.786376953125, -1.697265625, -1.608154296875, -1.51904296875, -1.429931640625, -1.3408203125, -1.251708984375, -1.16259765625, -1.073486328125, -0.984375, -0.895263671875, -0.80615234375, -0.717041015625, -0.6279296875, -0.538818359375, -0.44970703125, -0.360595703125, -0.271484375, -0.182373046875, -0.09326171875, -0.004150390625, 0.0849609375, 0.174072265625, 0.26318359375, 0.352294921875, 0.44140625, 0.530517578125, 0.61962890625, 0.708740234375, 0.7978515625, 0.886962890625, 0.97607421875, 1.065185546875, 1.154296875, 1.243408203125, 1.33251953125, 1.421630859375, 1.5107421875, 1.599853515625, 1.68896484375, 1.778076171875, 1.8671875, 1.956298828125, 2.04541015625, 2.134521484375, 2.2236328125, 2.312744140625, 2.40185546875, 2.490966796875, 2.580078125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 7.0, 7.0, 23.0, 21.0, 35.0, 56.0, 71.0, 73.0, 88.0, 122.0, 104.0, 78.0, 87.0, 73.0, 50.0, 46.0, 20.0, 20.0, 11.0, 7.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3134765625, -1.277099609375, -1.24072265625, -1.204345703125, -1.16796875, -1.131591796875, -1.09521484375, -1.058837890625, -1.0224609375, -0.986083984375, -0.94970703125, -0.913330078125, -0.876953125, -0.840576171875, -0.80419921875, -0.767822265625, -0.7314453125, -0.695068359375, -0.65869140625, -0.622314453125, -0.5859375, -0.549560546875, -0.51318359375, -0.476806640625, -0.4404296875, -0.404052734375, -0.36767578125, -0.331298828125, -0.294921875, -0.258544921875, -0.22216796875, -0.185791015625, -0.1494140625, -0.113037109375, -0.07666015625, -0.040283203125, -0.00390625, 0.032470703125, 0.06884765625, 0.105224609375, 0.1416015625, 0.177978515625, 0.21435546875, 0.250732421875, 0.287109375, 0.323486328125, 0.35986328125, 0.396240234375, 0.4326171875, 0.468994140625, 0.50537109375, 0.541748046875, 0.578125, 0.614501953125, 0.65087890625, 0.687255859375, 0.7236328125, 0.760009765625, 0.79638671875, 0.832763671875, 0.869140625, 0.905517578125, 0.94189453125, 0.978271484375, 1.0146484375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 6.0, 2.0, 5.0, 7.0, 14.0, 25.0, 47.0, 94.0, 153.0, 317.0, 667.0, 1472.0, 3827.0, 11879.0, 49447.0, 546451.0, 3406183.0, 140589.0, 23033.0, 6169.0, 2186.0, 900.0, 382.0, 216.0, 87.0, 57.0, 27.0, 12.0, 9.0, 8.0, 3.0, 5.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.53125, -1.491241455078125, -1.45123291015625, -1.411224365234375, -1.3712158203125, -1.331207275390625, -1.29119873046875, -1.251190185546875, -1.211181640625, -1.171173095703125, -1.13116455078125, -1.091156005859375, -1.0511474609375, -1.011138916015625, -0.97113037109375, -0.931121826171875, -0.89111328125, -0.851104736328125, -0.81109619140625, -0.771087646484375, -0.7310791015625, -0.691070556640625, -0.65106201171875, -0.611053466796875, -0.571044921875, -0.531036376953125, -0.49102783203125, -0.451019287109375, -0.4110107421875, -0.371002197265625, -0.33099365234375, -0.290985107421875, -0.2509765625, -0.210968017578125, -0.17095947265625, -0.130950927734375, -0.0909423828125, -0.050933837890625, -0.01092529296875, 0.029083251953125, 0.069091796875, 0.109100341796875, 0.14910888671875, 0.189117431640625, 0.2291259765625, 0.269134521484375, 0.30914306640625, 0.349151611328125, 0.38916015625, 0.429168701171875, 0.46917724609375, 0.509185791015625, 0.5491943359375, 0.589202880859375, 0.62921142578125, 0.669219970703125, 0.709228515625, 0.749237060546875, 0.78924560546875, 0.829254150390625, 0.8692626953125, 0.909271240234375, 0.94927978515625, 0.989288330078125, 1.029296875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 3.0, 5.0, 0.0, 3.0, 3.0, 10.0, 11.0, 14.0, 5.0, 27.0, 37.0, 43.0, 70.0, 124.0, 268.0, 554.0, 1159.0, 941.0, 371.0, 172.0, 85.0, 63.0, 40.0, 22.0, 19.0, 6.0, 9.0, 5.0, 5.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.51953125, -1.4782257080078125, -1.436920166015625, -1.3956146240234375, -1.35430908203125, -1.3130035400390625, -1.271697998046875, -1.2303924560546875, -1.1890869140625, -1.1477813720703125, -1.106475830078125, -1.0651702880859375, -1.02386474609375, -0.9825592041015625, -0.941253662109375, -0.8999481201171875, -0.858642578125, -0.8173370361328125, -0.776031494140625, -0.7347259521484375, -0.69342041015625, -0.6521148681640625, -0.610809326171875, -0.5695037841796875, -0.5281982421875, -0.4868927001953125, -0.445587158203125, -0.4042816162109375, -0.36297607421875, -0.3216705322265625, -0.280364990234375, -0.2390594482421875, -0.19775390625, -0.1564483642578125, -0.115142822265625, -0.0738372802734375, -0.03253173828125, 0.0087738037109375, 0.050079345703125, 0.0913848876953125, 0.1326904296875, 0.1739959716796875, 0.215301513671875, 0.2566070556640625, 0.29791259765625, 0.3392181396484375, 0.380523681640625, 0.4218292236328125, 0.463134765625, 0.5044403076171875, 0.545745849609375, 0.5870513916015625, 0.62835693359375, 0.6696624755859375, 0.710968017578125, 0.7522735595703125, 0.7935791015625, 0.8348846435546875, 0.876190185546875, 0.9174957275390625, 0.95880126953125, 1.0001068115234375, 1.041412353515625, 1.0827178955078125, 1.1240234375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 11.0, 21.0, 59.0, 128.0, 256.0, 260.0, 138.0, 72.0, 25.0, 7.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.50623321533203, -17.10053825378418, -16.694843292236328, -16.289148330688477, -15.883453369140625, -15.477758407592773, -15.072062492370605, -14.666367530822754, -14.260672569274902, -13.85497760772705, -13.4492826461792, -13.043587684631348, -12.63789176940918, -12.232196807861328, -11.826501846313477, -11.420806884765625, -11.015111923217773, -10.609416961669922, -10.20372200012207, -9.798027038574219, -9.392332077026367, -8.986637115478516, -8.580941200256348, -8.175246238708496, -7.7695512771606445, -7.363856315612793, -6.958161354064941, -6.552465915679932, -6.14677095413208, -5.7410759925842285, -5.335380554199219, -4.929685592651367, -4.523990631103516, -4.118295669555664, -3.7126004695892334, -3.3069052696228027, -2.901210308074951, -2.4955153465270996, -2.089820146560669, -1.6841249465942383, -1.2784299850463867, -0.8727349042892456, -0.4670398235321045, -0.06134474277496338, 0.34435033798217773, 0.7500452995300293, 1.15574049949646, 1.5614356994628906, 1.9671306610107422, 2.3728256225585938, 2.7785208225250244, 3.184216022491455, 3.5899109840393066, 3.995605945587158, 4.401301383972168, 4.8069963455200195, 5.212691307067871, 5.618386268615723, 6.024081230163574, 6.429776668548584, 6.8354716300964355, 7.241166591644287, 7.646862030029297, 8.052556991577148, 8.458251953125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 5.0, 3.0, 3.0, 2.0, 6.0, 8.0, 14.0, 15.0, 18.0, 22.0, 22.0, 23.0, 34.0, 42.0, 41.0, 41.0, 42.0, 43.0, 66.0, 47.0, 51.0, 60.0, 48.0, 54.0, 49.0, 36.0, 39.0, 35.0, 23.0, 28.0, 14.0, 18.0, 10.0, 12.0, 12.0, 5.0, 5.0, 5.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 3.0], "bins": [-5.527782440185547, -5.3810014724731445, -5.234220504760742, -5.087440013885498, -4.940659046173096, -4.793878078460693, -4.647097587585449, -4.500316619873047, -4.3535356521606445, -4.206754684448242, -4.05997371673584, -3.9131932258605957, -3.7664122581481934, -3.619631290435791, -3.4728505611419678, -3.3260698318481445, -3.179288864135742, -3.03250789642334, -2.8857271671295166, -2.7389464378356934, -2.592165470123291, -2.4453845024108887, -2.2986037731170654, -2.151823043823242, -2.00504207611084, -1.858261227607727, -1.7114803791046143, -1.5646995306015015, -1.4179186820983887, -1.2711378335952759, -1.124356985092163, -0.9775761365890503, -0.8307948112487793, -0.6840139627456665, -0.5372331142425537, -0.3904522657394409, -0.24367141723632812, -0.09689056873321533, 0.04989027976989746, 0.19667112827301025, 0.34345197677612305, 0.49023282527923584, 0.6370136737823486, 0.7837945222854614, 0.9305753707885742, 1.077356219291687, 1.2241370677947998, 1.3709179162979126, 1.5176987648010254, 1.6644796133041382, 1.811260461807251, 1.9580413103103638, 2.1048221588134766, 2.251603126525879, 2.398383855819702, 2.5451645851135254, 2.6919455528259277, 2.83872652053833, 2.9855072498321533, 3.1322879791259766, 3.279068946838379, 3.4258499145507812, 3.5726306438446045, 3.7194113731384277, 3.86619234085083]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 8.0, 4.0, 14.0, 22.0, 21.0, 41.0, 49.0, 107.0, 122.0, 194.0, 322.0, 573.0, 1061.0, 1778.0, 3593.0, 7244.0, 15533.0, 35319.0, 83785.0, 198201.0, 323872.0, 213127.0, 92010.0, 38641.0, 16803.0, 7733.0, 3800.0, 1951.0, 1019.0, 602.0, 399.0, 222.0, 137.0, 88.0, 47.0, 33.0, 24.0, 17.0, 18.0, 7.0, 4.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.861328125, -0.8356552124023438, -0.8099822998046875, -0.7843093872070312, -0.758636474609375, -0.7329635620117188, -0.7072906494140625, -0.6816177368164062, -0.65594482421875, -0.6302719116210938, -0.6045989990234375, -0.5789260864257812, -0.553253173828125, -0.5275802612304688, -0.5019073486328125, -0.47623443603515625, -0.4505615234375, -0.42488861083984375, -0.3992156982421875, -0.37354278564453125, -0.347869873046875, -0.32219696044921875, -0.2965240478515625, -0.27085113525390625, -0.24517822265625, -0.21950531005859375, -0.1938323974609375, -0.16815948486328125, -0.142486572265625, -0.11681365966796875, -0.0911407470703125, -0.06546783447265625, -0.039794921875, -0.01412200927734375, 0.0115509033203125, 0.03722381591796875, 0.062896728515625, 0.08856964111328125, 0.1142425537109375, 0.13991546630859375, 0.16558837890625, 0.19126129150390625, 0.2169342041015625, 0.24260711669921875, 0.268280029296875, 0.29395294189453125, 0.3196258544921875, 0.34529876708984375, 0.3709716796875, 0.39664459228515625, 0.4223175048828125, 0.44799041748046875, 0.473663330078125, 0.49933624267578125, 0.5250091552734375, 0.5506820678710938, 0.57635498046875, 0.6020278930664062, 0.6277008056640625, 0.6533737182617188, 0.679046630859375, 0.7047195434570312, 0.7303924560546875, 0.7560653686523438, 0.78173828125]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 5.0, 9.0, 4.0, 14.0, 18.0, 18.0, 32.0, 37.0, 46.0, 56.0, 48.0, 71.0, 79.0, 93.0, 88.0, 68.0, 63.0, 54.0, 51.0, 36.0, 32.0, 26.0, 14.0, 14.0, 13.0, 8.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.87646484375, -0.8496780395507812, -0.8228912353515625, -0.7961044311523438, -0.769317626953125, -0.7425308227539062, -0.7157440185546875, -0.6889572143554688, -0.66217041015625, -0.6353836059570312, -0.6085968017578125, -0.5818099975585938, -0.555023193359375, -0.5282363891601562, -0.5014495849609375, -0.47466278076171875, -0.4478759765625, -0.42108917236328125, -0.3943023681640625, -0.36751556396484375, -0.340728759765625, -0.31394195556640625, -0.2871551513671875, -0.26036834716796875, -0.23358154296875, -0.20679473876953125, -0.1800079345703125, -0.15322113037109375, -0.126434326171875, -0.09964752197265625, -0.0728607177734375, -0.04607391357421875, -0.019287109375, 0.00749969482421875, 0.0342864990234375, 0.06107330322265625, 0.087860107421875, 0.11464691162109375, 0.1414337158203125, 0.16822052001953125, 0.19500732421875, 0.22179412841796875, 0.2485809326171875, 0.27536773681640625, 0.302154541015625, 0.32894134521484375, 0.3557281494140625, 0.38251495361328125, 0.4093017578125, 0.43608856201171875, 0.4628753662109375, 0.48966217041015625, 0.516448974609375, 0.5432357788085938, 0.5700225830078125, 0.5968093872070312, 0.62359619140625, 0.6503829956054688, 0.6771697998046875, 0.7039566040039062, 0.730743408203125, 0.7575302124023438, 0.7843170166015625, 0.8111038208007812, 0.837890625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 5.0, 3.0, 5.0, 14.0, 14.0, 18.0, 26.0, 25.0, 52.0, 103.0, 152.0, 275.0, 538.0, 1275.0, 3899.0, 18414.0, 143086.0, 716730.0, 139751.0, 17751.0, 3820.0, 1297.0, 546.0, 308.0, 177.0, 81.0, 53.0, 42.0, 19.0, 12.0, 18.0, 14.0, 4.0, 8.0, 6.0, 2.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.10546875, -2.0477752685546875, -1.990081787109375, -1.9323883056640625, -1.87469482421875, -1.8170013427734375, -1.759307861328125, -1.7016143798828125, -1.6439208984375, -1.5862274169921875, -1.528533935546875, -1.4708404541015625, -1.41314697265625, -1.3554534912109375, -1.297760009765625, -1.2400665283203125, -1.182373046875, -1.1246795654296875, -1.066986083984375, -1.0092926025390625, -0.95159912109375, -0.8939056396484375, -0.836212158203125, -0.7785186767578125, -0.7208251953125, -0.6631317138671875, -0.605438232421875, -0.5477447509765625, -0.49005126953125, -0.4323577880859375, -0.374664306640625, -0.3169708251953125, -0.25927734375, -0.2015838623046875, -0.143890380859375, -0.0861968994140625, -0.02850341796875, 0.0291900634765625, 0.086883544921875, 0.1445770263671875, 0.2022705078125, 0.2599639892578125, 0.317657470703125, 0.3753509521484375, 0.43304443359375, 0.4907379150390625, 0.548431396484375, 0.6061248779296875, 0.663818359375, 0.7215118408203125, 0.779205322265625, 0.8368988037109375, 0.89459228515625, 0.9522857666015625, 1.009979248046875, 1.0676727294921875, 1.1253662109375, 1.1830596923828125, 1.240753173828125, 1.2984466552734375, 1.35614013671875, 1.4138336181640625, 1.471527099609375, 1.5292205810546875, 1.5869140625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 1.0, 1.0, 6.0, 3.0, 7.0, 7.0, 12.0, 12.0, 15.0, 16.0, 19.0, 18.0, 19.0, 30.0, 25.0, 37.0, 35.0, 40.0, 43.0, 44.0, 44.0, 32.0, 54.0, 50.0, 37.0, 26.0, 58.0, 37.0, 34.0, 35.0, 27.0, 26.0, 21.0, 19.0, 24.0, 16.0, 13.0, 15.0, 12.0, 7.0, 4.0, 5.0, 7.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.7890625, -1.7338409423828125, -1.678619384765625, -1.6233978271484375, -1.56817626953125, -1.5129547119140625, -1.457733154296875, -1.4025115966796875, -1.3472900390625, -1.2920684814453125, -1.236846923828125, -1.1816253662109375, -1.12640380859375, -1.0711822509765625, -1.015960693359375, -0.9607391357421875, -0.905517578125, -0.8502960205078125, -0.795074462890625, -0.7398529052734375, -0.68463134765625, -0.6294097900390625, -0.574188232421875, -0.5189666748046875, -0.4637451171875, -0.4085235595703125, -0.353302001953125, -0.2980804443359375, -0.24285888671875, -0.1876373291015625, -0.132415771484375, -0.0771942138671875, -0.02197265625, 0.0332489013671875, 0.088470458984375, 0.1436920166015625, 0.19891357421875, 0.2541351318359375, 0.309356689453125, 0.3645782470703125, 0.4197998046875, 0.4750213623046875, 0.530242919921875, 0.5854644775390625, 0.64068603515625, 0.6959075927734375, 0.751129150390625, 0.8063507080078125, 0.861572265625, 0.9167938232421875, 0.972015380859375, 1.0272369384765625, 1.08245849609375, 1.1376800537109375, 1.192901611328125, 1.2481231689453125, 1.3033447265625, 1.3585662841796875, 1.413787841796875, 1.4690093994140625, 1.52423095703125, 1.5794525146484375, 1.634674072265625, 1.6898956298828125, 1.7451171875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 9.0, 11.0, 16.0, 13.0, 19.0, 42.0, 55.0, 77.0, 183.0, 417.0, 1026.0, 4067.0, 42637.0, 914960.0, 77521.0, 5287.0, 1284.0, 447.0, 209.0, 103.0, 51.0, 29.0, 27.0, 18.0, 14.0, 13.0, 4.0, 6.0, 2.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.248046875, -1.208526611328125, -1.16900634765625, -1.129486083984375, -1.0899658203125, -1.050445556640625, -1.01092529296875, -0.971405029296875, -0.931884765625, -0.892364501953125, -0.85284423828125, -0.813323974609375, -0.7738037109375, -0.734283447265625, -0.69476318359375, -0.655242919921875, -0.61572265625, -0.576202392578125, -0.53668212890625, -0.497161865234375, -0.4576416015625, -0.418121337890625, -0.37860107421875, -0.339080810546875, -0.299560546875, -0.260040283203125, -0.22052001953125, -0.180999755859375, -0.1414794921875, -0.101959228515625, -0.06243896484375, -0.022918701171875, 0.0166015625, 0.056121826171875, 0.09564208984375, 0.135162353515625, 0.1746826171875, 0.214202880859375, 0.25372314453125, 0.293243408203125, 0.332763671875, 0.372283935546875, 0.41180419921875, 0.451324462890625, 0.4908447265625, 0.530364990234375, 0.56988525390625, 0.609405517578125, 0.64892578125, 0.688446044921875, 0.72796630859375, 0.767486572265625, 0.8070068359375, 0.846527099609375, 0.88604736328125, 0.925567626953125, 0.965087890625, 1.004608154296875, 1.04412841796875, 1.083648681640625, 1.1231689453125, 1.162689208984375, 1.20220947265625, 1.241729736328125, 1.28125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 7.0, 10.0, 41.0, 162.0, 325.0, 292.0, 102.0, 31.0, 16.0, 5.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002665519714355469, -0.00025072693824768066, -0.00023490190505981445, -0.00021907687187194824, -0.00020325183868408203, -0.00018742680549621582, -0.0001716017723083496, -0.0001557767391204834, -0.0001399517059326172, -0.00012412667274475098, -0.00010830163955688477, -9.247660636901855e-05, -7.665157318115234e-05, -6.082653999328613e-05, -4.500150680541992e-05, -2.917647361755371e-05, -1.33514404296875e-05, 2.473592758178711e-06, 1.8298625946044922e-05, 3.412365913391113e-05, 4.9948692321777344e-05, 6.577372550964355e-05, 8.159875869750977e-05, 9.742379188537598e-05, 0.00011324882507324219, 0.0001290738582611084, 0.0001448988914489746, 0.00016072392463684082, 0.00017654895782470703, 0.00019237399101257324, 0.00020819902420043945, 0.00022402405738830566, 0.00023984909057617188, 0.0002556741237640381, 0.0002714991569519043, 0.0002873241901397705, 0.0003031492233276367, 0.00031897425651550293, 0.00033479928970336914, 0.00035062432289123535, 0.00036644935607910156, 0.0003822743892669678, 0.000398099422454834, 0.0004139244556427002, 0.0004297494888305664, 0.0004455745220184326, 0.00046139955520629883, 0.00047722458839416504, 0.0004930496215820312, 0.0005088746547698975, 0.0005246996879577637, 0.0005405247211456299, 0.0005563497543334961, 0.0005721747875213623, 0.0005879998207092285, 0.0006038248538970947, 0.0006196498870849609, 0.0006354749202728271, 0.0006512999534606934, 0.0006671249866485596, 0.0006829500198364258, 0.000698775053024292, 0.0007146000862121582, 0.0007304251194000244, 0.0007462501525878906]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 6.0, 3.0, 9.0, 11.0, 8.0, 15.0, 25.0, 24.0, 41.0, 59.0, 119.0, 172.0, 320.0, 623.0, 1757.0, 5642.0, 29543.0, 306421.0, 635779.0, 55128.0, 8712.0, 2359.0, 891.0, 378.0, 195.0, 104.0, 63.0, 44.0, 28.0, 29.0, 16.0, 12.0, 8.0, 5.0, 2.0, 6.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.671875, -0.6488265991210938, -0.6257781982421875, -0.6027297973632812, -0.579681396484375, -0.5566329956054688, -0.5335845947265625, -0.5105361938476562, -0.48748779296875, -0.46443939208984375, -0.4413909912109375, -0.41834259033203125, -0.395294189453125, -0.37224578857421875, -0.3491973876953125, -0.32614898681640625, -0.3031005859375, -0.28005218505859375, -0.2570037841796875, -0.23395538330078125, -0.210906982421875, -0.18785858154296875, -0.1648101806640625, -0.14176177978515625, -0.11871337890625, -0.09566497802734375, -0.0726165771484375, -0.04956817626953125, -0.026519775390625, -0.00347137451171875, 0.0195770263671875, 0.04262542724609375, 0.065673828125, 0.08872222900390625, 0.1117706298828125, 0.13481903076171875, 0.157867431640625, 0.18091583251953125, 0.2039642333984375, 0.22701263427734375, 0.25006103515625, 0.27310943603515625, 0.2961578369140625, 0.31920623779296875, 0.342254638671875, 0.36530303955078125, 0.3883514404296875, 0.41139984130859375, 0.4344482421875, 0.45749664306640625, 0.4805450439453125, 0.5035934448242188, 0.526641845703125, 0.5496902465820312, 0.5727386474609375, 0.5957870483398438, 0.61883544921875, 0.6418838500976562, 0.6649322509765625, 0.6879806518554688, 0.711029052734375, 0.7340774536132812, 0.7571258544921875, 0.7801742553710938, 0.80322265625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 10.0, 2.0, 9.0, 10.0, 19.0, 19.0, 48.0, 48.0, 77.0, 92.0, 122.0, 123.0, 108.0, 97.0, 90.0, 55.0, 33.0, 18.0, 12.0, 4.0, 3.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2431640625, -1.2163543701171875, -1.189544677734375, -1.1627349853515625, -1.13592529296875, -1.1091156005859375, -1.082305908203125, -1.0554962158203125, -1.0286865234375, -1.0018768310546875, -0.975067138671875, -0.9482574462890625, -0.92144775390625, -0.8946380615234375, -0.867828369140625, -0.8410186767578125, -0.814208984375, -0.7873992919921875, -0.760589599609375, -0.7337799072265625, -0.70697021484375, -0.6801605224609375, -0.653350830078125, -0.6265411376953125, -0.5997314453125, -0.5729217529296875, -0.546112060546875, -0.5193023681640625, -0.49249267578125, -0.4656829833984375, -0.438873291015625, -0.4120635986328125, -0.38525390625, -0.3584442138671875, -0.331634521484375, -0.3048248291015625, -0.27801513671875, -0.2512054443359375, -0.224395751953125, -0.1975860595703125, -0.1707763671875, -0.1439666748046875, -0.117156982421875, -0.0903472900390625, -0.06353759765625, -0.0367279052734375, -0.009918212890625, 0.0168914794921875, 0.043701171875, 0.0705108642578125, 0.097320556640625, 0.1241302490234375, 0.15093994140625, 0.1777496337890625, 0.204559326171875, 0.2313690185546875, 0.2581787109375, 0.2849884033203125, 0.311798095703125, 0.3386077880859375, 0.36541748046875, 0.3922271728515625, 0.419036865234375, 0.4458465576171875, 0.47265625]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 6.0, 13.0, 28.0, 70.0, 131.0, 245.0, 225.0, 153.0, 72.0, 24.0, 17.0, 7.0, 2.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.205233097076416, -6.692345142364502, -6.179457664489746, -5.666569709777832, -5.153681755065918, -4.640794277191162, -4.127906322479248, -3.615018606185913, -3.102130889892578, -2.589243173599243, -2.076355457305908, -1.5634675025939941, -1.0505797863006592, -0.5376920700073242, -0.024804115295410156, 0.4880836009979248, 1.0009713172912598, 1.5138590335845947, 2.0267467498779297, 2.5396347045898438, 3.0525224208831787, 3.5654101371765137, 4.078298091888428, 4.591185569763184, 5.104073524475098, 5.616961479187012, 6.129848957061768, 6.642736911773682, 7.1556243896484375, 7.668512344360352, 8.181400299072266, 8.69428825378418, 9.207174301147461, 9.720062255859375, 10.232950210571289, 10.745838165283203, 11.2587251663208, 11.771613121032715, 12.284501075744629, 12.797389030456543, 13.31027603149414, 13.823163986206055, 14.336051940917969, 14.848939895629883, 15.36182689666748, 15.874714851379395, 16.387603759765625, 16.900489807128906, 17.413379669189453, 17.926267623901367, 18.43915557861328, 18.952043533325195, 19.46493148803711, 19.97781753540039, 20.490707397460938, 21.00359344482422, 21.516481399536133, 22.029369354248047, 22.54225730895996, 23.055145263671875, 23.56803321838379, 24.080921173095703, 24.593807220458984, 25.1066951751709, 25.619583129882812]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 6.0, 4.0, 6.0, 7.0, 6.0, 6.0, 10.0, 13.0, 18.0, 24.0, 24.0, 25.0, 24.0, 30.0, 35.0, 45.0, 46.0, 46.0, 40.0, 58.0, 60.0, 64.0, 51.0, 45.0, 50.0, 37.0, 37.0, 34.0, 23.0, 15.0, 18.0, 19.0, 13.0, 18.0, 11.0, 9.0, 4.0, 10.0, 2.0, 5.0, 5.0, 4.0, 1.0, 2.0, 1.0], "bins": [-10.110296249389648, -9.855095863342285, -9.599895477294922, -9.344694137573242, -9.089493751525879, -8.834293365478516, -8.579092979431152, -8.323892593383789, -8.06869125366211, -7.813490867614746, -7.558290004730225, -7.303089618682861, -7.04788875579834, -6.792688369750977, -6.537487983703613, -6.28228759765625, -6.027087211608887, -5.771886825561523, -5.516685962677002, -5.261485576629639, -5.006284713745117, -4.751084327697754, -4.495883941650391, -4.240683555603027, -3.985482692718506, -3.7302820682525635, -3.475081443786621, -3.219881057739258, -2.9646804332733154, -2.709479808807373, -2.4542794227600098, -2.1990787982940674, -1.943878173828125, -1.6886775493621826, -1.4334770441055298, -1.178276538848877, -0.9230759143829346, -0.6678752899169922, -0.41267478466033936, -0.15747427940368652, 0.09772634506225586, 0.35292690992355347, 0.6081274747848511, 0.8633280396461487, 1.1185286045074463, 1.3737292289733887, 1.6289297342300415, 1.8841302394866943, 2.1393308639526367, 2.394531488418579, 2.6497321128845215, 2.9049324989318848, 3.160133123397827, 3.4153337478637695, 3.670534133911133, 3.925734758377075, 4.180935382843018, 4.436135768890381, 4.691336631774902, 4.946537017822266, 5.201737403869629, 5.45693826675415, 5.712138652801514, 5.967339515686035, 6.222539901733398]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 5.0, 3.0, 9.0, 11.0, 23.0, 35.0, 59.0, 114.0, 156.0, 274.0, 572.0, 1079.0, 2473.0, 6352.0, 21016.0, 112675.0, 1808041.0, 2081785.0, 125901.0, 22088.0, 6550.0, 2594.0, 1150.0, 608.0, 292.0, 163.0, 97.0, 66.0, 41.0, 18.0, 10.0, 12.0, 4.0, 3.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.99853515625, -0.9682998657226562, -0.9380645751953125, -0.9078292846679688, -0.877593994140625, -0.8473587036132812, -0.8171234130859375, -0.7868881225585938, -0.75665283203125, -0.7264175415039062, -0.6961822509765625, -0.6659469604492188, -0.635711669921875, -0.6054763793945312, -0.5752410888671875, -0.5450057983398438, -0.5147705078125, -0.48453521728515625, -0.4542999267578125, -0.42406463623046875, -0.393829345703125, -0.36359405517578125, -0.3333587646484375, -0.30312347412109375, -0.27288818359375, -0.24265289306640625, -0.2124176025390625, -0.18218231201171875, -0.151947021484375, -0.12171173095703125, -0.0914764404296875, -0.06124114990234375, -0.031005859375, -0.00077056884765625, 0.0294647216796875, 0.05970001220703125, 0.089935302734375, 0.12017059326171875, 0.1504058837890625, 0.18064117431640625, 0.21087646484375, 0.24111175537109375, 0.2713470458984375, 0.30158233642578125, 0.331817626953125, 0.36205291748046875, 0.3922882080078125, 0.42252349853515625, 0.4527587890625, 0.48299407958984375, 0.5132293701171875, 0.5434646606445312, 0.573699951171875, 0.6039352416992188, 0.6341705322265625, 0.6644058227539062, 0.69464111328125, 0.7248764038085938, 0.7551116943359375, 0.7853469848632812, 0.815582275390625, 0.8458175659179688, 0.8760528564453125, 0.9062881469726562, 0.9365234375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 10.0, 7.0, 6.0, 18.0, 27.0, 32.0, 33.0, 44.0, 47.0, 50.0, 64.0, 65.0, 100.0, 91.0, 58.0, 57.0, 78.0, 43.0, 34.0, 38.0, 28.0, 22.0, 9.0, 18.0, 7.0, 5.0, 7.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.78271484375, -0.759674072265625, -0.73663330078125, -0.713592529296875, -0.6905517578125, -0.667510986328125, -0.64447021484375, -0.621429443359375, -0.598388671875, -0.575347900390625, -0.55230712890625, -0.529266357421875, -0.5062255859375, -0.483184814453125, -0.46014404296875, -0.437103271484375, -0.4140625, -0.391021728515625, -0.36798095703125, -0.344940185546875, -0.3218994140625, -0.298858642578125, -0.27581787109375, -0.252777099609375, -0.229736328125, -0.206695556640625, -0.18365478515625, -0.160614013671875, -0.1375732421875, -0.114532470703125, -0.09149169921875, -0.068450927734375, -0.04541015625, -0.022369384765625, 0.00067138671875, 0.023712158203125, 0.0467529296875, 0.069793701171875, 0.09283447265625, 0.115875244140625, 0.138916015625, 0.161956787109375, 0.18499755859375, 0.208038330078125, 0.2310791015625, 0.254119873046875, 0.27716064453125, 0.300201416015625, 0.3232421875, 0.346282958984375, 0.36932373046875, 0.392364501953125, 0.4154052734375, 0.438446044921875, 0.46148681640625, 0.484527587890625, 0.507568359375, 0.530609130859375, 0.55364990234375, 0.576690673828125, 0.5997314453125, 0.622772216796875, 0.64581298828125, 0.668853759765625, 0.69189453125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 7.0, 9.0, 12.0, 13.0, 19.0, 35.0, 39.0, 83.0, 122.0, 249.0, 513.0, 1377.0, 4646.0, 27905.0, 667185.0, 3407092.0, 72685.0, 8958.0, 2079.0, 687.0, 267.0, 142.0, 64.0, 28.0, 27.0, 16.0, 9.0, 4.0, 6.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.796875, -1.7392425537109375, -1.681610107421875, -1.6239776611328125, -1.56634521484375, -1.5087127685546875, -1.451080322265625, -1.3934478759765625, -1.3358154296875, -1.2781829833984375, -1.220550537109375, -1.1629180908203125, -1.10528564453125, -1.0476531982421875, -0.990020751953125, -0.9323883056640625, -0.874755859375, -0.8171234130859375, -0.759490966796875, -0.7018585205078125, -0.64422607421875, -0.5865936279296875, -0.528961181640625, -0.4713287353515625, -0.4136962890625, -0.3560638427734375, -0.298431396484375, -0.2407989501953125, -0.18316650390625, -0.1255340576171875, -0.067901611328125, -0.0102691650390625, 0.04736328125, 0.1049957275390625, 0.162628173828125, 0.2202606201171875, 0.27789306640625, 0.3355255126953125, 0.393157958984375, 0.4507904052734375, 0.5084228515625, 0.5660552978515625, 0.623687744140625, 0.6813201904296875, 0.73895263671875, 0.7965850830078125, 0.854217529296875, 0.9118499755859375, 0.969482421875, 1.0271148681640625, 1.084747314453125, 1.1423797607421875, 1.20001220703125, 1.2576446533203125, 1.315277099609375, 1.3729095458984375, 1.4305419921875, 1.4881744384765625, 1.545806884765625, 1.6034393310546875, 1.66107177734375, 1.7187042236328125, 1.776336669921875, 1.8339691162109375, 1.8916015625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 4.0, 8.0, 7.0, 7.0, 15.0, 17.0, 45.0, 76.0, 123.0, 291.0, 702.0, 1283.0, 796.0, 297.0, 163.0, 87.0, 50.0, 40.0, 19.0, 15.0, 17.0, 7.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.345703125, -2.28790283203125, -2.2301025390625, -2.17230224609375, -2.114501953125, -2.05670166015625, -1.9989013671875, -1.94110107421875, -1.88330078125, -1.82550048828125, -1.7677001953125, -1.70989990234375, -1.652099609375, -1.59429931640625, -1.5364990234375, -1.47869873046875, -1.4208984375, -1.36309814453125, -1.3052978515625, -1.24749755859375, -1.189697265625, -1.13189697265625, -1.0740966796875, -1.01629638671875, -0.95849609375, -0.90069580078125, -0.8428955078125, -0.78509521484375, -0.727294921875, -0.66949462890625, -0.6116943359375, -0.55389404296875, -0.49609375, -0.43829345703125, -0.3804931640625, -0.32269287109375, -0.264892578125, -0.20709228515625, -0.1492919921875, -0.09149169921875, -0.03369140625, 0.02410888671875, 0.0819091796875, 0.13970947265625, 0.197509765625, 0.25531005859375, 0.3131103515625, 0.37091064453125, 0.4287109375, 0.48651123046875, 0.5443115234375, 0.60211181640625, 0.659912109375, 0.71771240234375, 0.7755126953125, 0.83331298828125, 0.89111328125, 0.94891357421875, 1.0067138671875, 1.06451416015625, 1.122314453125, 1.18011474609375, 1.2379150390625, 1.29571533203125, 1.353515625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 11.0, 20.0, 47.0, 107.0, 212.0, 272.0, 172.0, 83.0, 34.0, 15.0, 10.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.645408630371094, -15.1768159866333, -14.708223342895508, -14.239630699157715, -13.771038055419922, -13.302445411682129, -12.833852767944336, -12.365259170532227, -11.89666748046875, -11.428074836730957, -10.959482192993164, -10.490889549255371, -10.022296905517578, -9.553704261779785, -9.085111618041992, -8.616518020629883, -8.14792537689209, -7.679332733154297, -7.210740089416504, -6.742147445678711, -6.273554801940918, -5.804962158203125, -5.336369037628174, -4.867776393890381, -4.399183750152588, -3.930591106414795, -3.461998462677002, -2.99340558052063, -2.524812936782837, -2.056220293045044, -1.5876274108886719, -1.119034767150879, -0.6504421234130859, -0.1818494200706482, 0.28674328327178955, 0.7553360462188721, 1.223928689956665, 1.692521333694458, 2.16111421585083, 2.629706859588623, 3.098299503326416, 3.566892147064209, 4.035484790802002, 4.504077911376953, 4.972670555114746, 5.441263198852539, 5.909855842590332, 6.378448486328125, 6.847041130065918, 7.315633773803711, 7.784226417541504, 8.252819061279297, 8.72141170501709, 9.190004348754883, 9.658597946166992, 10.127189636230469, 10.595783233642578, 11.064375877380371, 11.532968521118164, 12.001561164855957, 12.47015380859375, 12.938746452331543, 13.407339096069336, 13.875932693481445, 14.344524383544922]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 2.0, 2.0, 9.0, 8.0, 10.0, 16.0, 11.0, 19.0, 26.0, 17.0, 23.0, 26.0, 34.0, 30.0, 32.0, 41.0, 41.0, 46.0, 52.0, 46.0, 46.0, 49.0, 37.0, 50.0, 44.0, 42.0, 29.0, 32.0, 28.0, 31.0, 22.0, 18.0, 19.0, 13.0, 10.0, 11.0, 6.0, 9.0, 6.0, 4.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-5.679101467132568, -5.513421535491943, -5.347741603851318, -5.182061672210693, -5.016382217407227, -4.850702285766602, -4.685022354125977, -4.519342422485352, -4.353662490844727, -4.187982559204102, -4.022302627563477, -3.8566229343414307, -3.6909430027008057, -3.5252630710601807, -3.3595833778381348, -3.1939034461975098, -3.0282235145568848, -2.8625435829162598, -2.6968636512756348, -2.531183958053589, -2.365504026412964, -2.199824094772339, -2.034144401550293, -1.868464469909668, -1.702784538269043, -1.537104606628418, -1.3714247941970825, -1.205744981765747, -1.040065050125122, -0.8743851780891418, -0.7087053060531616, -0.5430254936218262, -0.37734508514404297, -0.21166521310806274, -0.04598534107208252, 0.1196945309638977, 0.28537440299987793, 0.45105427503585815, 0.6167341470718384, 0.7824139595031738, 0.9480938911437988, 1.1137738227844238, 1.2794536352157593, 1.4451334476470947, 1.6108133792877197, 1.7764933109283447, 1.9421731233596802, 2.1078529357910156, 2.2735328674316406, 2.4392127990722656, 2.6048927307128906, 2.7705724239349365, 2.9362523555755615, 3.1019322872161865, 3.2676119804382324, 3.4332919120788574, 3.5989718437194824, 3.7646517753601074, 3.9303317070007324, 4.096011638641357, 4.261691093444824, 4.427371025085449, 4.593050956726074, 4.758730888366699, 4.924410820007324]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 7.0, 16.0, 17.0, 29.0, 44.0, 54.0, 85.0, 187.0, 274.0, 547.0, 960.0, 1936.0, 4011.0, 9435.0, 23336.0, 59498.0, 149121.0, 307547.0, 280766.0, 126135.0, 49941.0, 19292.0, 8114.0, 3556.0, 1651.0, 872.0, 461.0, 269.0, 134.0, 89.0, 75.0, 36.0, 27.0, 16.0, 4.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.88134765625, -0.8553543090820312, -0.8293609619140625, -0.8033676147460938, -0.777374267578125, -0.7513809204101562, -0.7253875732421875, -0.6993942260742188, -0.67340087890625, -0.6474075317382812, -0.6214141845703125, -0.5954208374023438, -0.569427490234375, -0.5434341430664062, -0.5174407958984375, -0.49144744873046875, -0.4654541015625, -0.43946075439453125, -0.4134674072265625, -0.38747406005859375, -0.361480712890625, -0.33548736572265625, -0.3094940185546875, -0.28350067138671875, -0.25750732421875, -0.23151397705078125, -0.2055206298828125, -0.17952728271484375, -0.153533935546875, -0.12754058837890625, -0.1015472412109375, -0.07555389404296875, -0.049560546875, -0.02356719970703125, 0.0024261474609375, 0.02841949462890625, 0.054412841796875, 0.08040618896484375, 0.1063995361328125, 0.13239288330078125, 0.15838623046875, 0.18437957763671875, 0.2103729248046875, 0.23636627197265625, 0.262359619140625, 0.28835296630859375, 0.3143463134765625, 0.34033966064453125, 0.3663330078125, 0.39232635498046875, 0.4183197021484375, 0.44431304931640625, 0.470306396484375, 0.49629974365234375, 0.5222930908203125, 0.5482864379882812, 0.57427978515625, 0.6002731323242188, 0.6262664794921875, 0.6522598266601562, 0.678253173828125, 0.7042465209960938, 0.7302398681640625, 0.7562332153320312, 0.7822265625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 11.0, 8.0, 12.0, 23.0, 20.0, 34.0, 42.0, 49.0, 51.0, 59.0, 74.0, 83.0, 88.0, 77.0, 69.0, 63.0, 61.0, 45.0, 37.0, 29.0, 17.0, 14.0, 11.0, 8.0, 4.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.83642578125, -0.811981201171875, -0.78753662109375, -0.763092041015625, -0.7386474609375, -0.714202880859375, -0.68975830078125, -0.665313720703125, -0.640869140625, -0.616424560546875, -0.59197998046875, -0.567535400390625, -0.5430908203125, -0.518646240234375, -0.49420166015625, -0.469757080078125, -0.4453125, -0.420867919921875, -0.39642333984375, -0.371978759765625, -0.3475341796875, -0.323089599609375, -0.29864501953125, -0.274200439453125, -0.249755859375, -0.225311279296875, -0.20086669921875, -0.176422119140625, -0.1519775390625, -0.127532958984375, -0.10308837890625, -0.078643798828125, -0.05419921875, -0.029754638671875, -0.00531005859375, 0.019134521484375, 0.0435791015625, 0.068023681640625, 0.09246826171875, 0.116912841796875, 0.141357421875, 0.165802001953125, 0.19024658203125, 0.214691162109375, 0.2391357421875, 0.263580322265625, 0.28802490234375, 0.312469482421875, 0.3369140625, 0.361358642578125, 0.38580322265625, 0.410247802734375, 0.4346923828125, 0.459136962890625, 0.48358154296875, 0.508026123046875, 0.532470703125, 0.556915283203125, 0.58135986328125, 0.605804443359375, 0.6302490234375, 0.654693603515625, 0.67913818359375, 0.703582763671875, 0.72802734375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 4.0, 6.0, 2.0, 9.0, 11.0, 11.0, 11.0, 15.0, 28.0, 46.0, 55.0, 77.0, 86.0, 115.0, 175.0, 218.0, 353.0, 521.0, 818.0, 1395.0, 2811.0, 7787.0, 29062.0, 149717.0, 618599.0, 185060.0, 35310.0, 8971.0, 3121.0, 1536.0, 797.0, 528.0, 362.0, 268.0, 162.0, 123.0, 115.0, 74.0, 50.0, 39.0, 36.0, 26.0, 10.0, 7.0, 14.0, 8.0, 4.0, 6.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.208984375, -1.166656494140625, -1.12432861328125, -1.082000732421875, -1.0396728515625, -0.997344970703125, -0.95501708984375, -0.912689208984375, -0.870361328125, -0.828033447265625, -0.78570556640625, -0.743377685546875, -0.7010498046875, -0.658721923828125, -0.61639404296875, -0.574066162109375, -0.53173828125, -0.489410400390625, -0.44708251953125, -0.404754638671875, -0.3624267578125, -0.320098876953125, -0.27777099609375, -0.235443115234375, -0.193115234375, -0.150787353515625, -0.10845947265625, -0.066131591796875, -0.0238037109375, 0.018524169921875, 0.06085205078125, 0.103179931640625, 0.1455078125, 0.187835693359375, 0.23016357421875, 0.272491455078125, 0.3148193359375, 0.357147216796875, 0.39947509765625, 0.441802978515625, 0.484130859375, 0.526458740234375, 0.56878662109375, 0.611114501953125, 0.6534423828125, 0.695770263671875, 0.73809814453125, 0.780426025390625, 0.82275390625, 0.865081787109375, 0.90740966796875, 0.949737548828125, 0.9920654296875, 1.034393310546875, 1.07672119140625, 1.119049072265625, 1.161376953125, 1.203704833984375, 1.24603271484375, 1.288360595703125, 1.3306884765625, 1.373016357421875, 1.41534423828125, 1.457672119140625, 1.5]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 7.0, 3.0, 3.0, 3.0, 4.0, 9.0, 8.0, 14.0, 15.0, 25.0, 26.0, 18.0, 30.0, 33.0, 29.0, 28.0, 43.0, 31.0, 46.0, 48.0, 46.0, 62.0, 55.0, 46.0, 37.0, 47.0, 40.0, 42.0, 35.0, 25.0, 19.0, 17.0, 18.0, 20.0, 13.0, 18.0, 10.0, 7.0, 7.0, 5.0, 4.0, 6.0, 1.0, 2.0, 0.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.318359375, -2.248809814453125, -2.17926025390625, -2.109710693359375, -2.0401611328125, -1.970611572265625, -1.90106201171875, -1.831512451171875, -1.761962890625, -1.692413330078125, -1.62286376953125, -1.553314208984375, -1.4837646484375, -1.414215087890625, -1.34466552734375, -1.275115966796875, -1.20556640625, -1.136016845703125, -1.06646728515625, -0.996917724609375, -0.9273681640625, -0.857818603515625, -0.78826904296875, -0.718719482421875, -0.649169921875, -0.579620361328125, -0.51007080078125, -0.440521240234375, -0.3709716796875, -0.301422119140625, -0.23187255859375, -0.162322998046875, -0.0927734375, -0.023223876953125, 0.04632568359375, 0.115875244140625, 0.1854248046875, 0.254974365234375, 0.32452392578125, 0.394073486328125, 0.463623046875, 0.533172607421875, 0.60272216796875, 0.672271728515625, 0.7418212890625, 0.811370849609375, 0.88092041015625, 0.950469970703125, 1.02001953125, 1.089569091796875, 1.15911865234375, 1.228668212890625, 1.2982177734375, 1.367767333984375, 1.43731689453125, 1.506866455078125, 1.576416015625, 1.645965576171875, 1.71551513671875, 1.785064697265625, 1.8546142578125, 1.924163818359375, 1.99371337890625, 2.063262939453125, 2.1328125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 4.0, 6.0, 8.0, 21.0, 23.0, 32.0, 45.0, 105.0, 208.0, 534.0, 1429.0, 5334.0, 44471.0, 887868.0, 97309.0, 8014.0, 1946.0, 670.0, 264.0, 111.0, 64.0, 32.0, 19.0, 13.0, 9.0, 9.0, 5.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.138671875, -1.1057815551757812, -1.0728912353515625, -1.0400009155273438, -1.007110595703125, -0.9742202758789062, -0.9413299560546875, -0.9084396362304688, -0.87554931640625, -0.8426589965820312, -0.8097686767578125, -0.7768783569335938, -0.743988037109375, -0.7110977172851562, -0.6782073974609375, -0.6453170776367188, -0.6124267578125, -0.5795364379882812, -0.5466461181640625, -0.5137557983398438, -0.480865478515625, -0.44797515869140625, -0.4150848388671875, -0.38219451904296875, -0.34930419921875, -0.31641387939453125, -0.2835235595703125, -0.25063323974609375, -0.217742919921875, -0.18485260009765625, -0.1519622802734375, -0.11907196044921875, -0.086181640625, -0.05329132080078125, -0.0204010009765625, 0.01248931884765625, 0.045379638671875, 0.07826995849609375, 0.1111602783203125, 0.14405059814453125, 0.17694091796875, 0.20983123779296875, 0.2427215576171875, 0.27561187744140625, 0.308502197265625, 0.34139251708984375, 0.3742828369140625, 0.40717315673828125, 0.4400634765625, 0.47295379638671875, 0.5058441162109375, 0.5387344360351562, 0.571624755859375, 0.6045150756835938, 0.6374053955078125, 0.6702957153320312, 0.70318603515625, 0.7360763549804688, 0.7689666748046875, 0.8018569946289062, 0.834747314453125, 0.8676376342773438, 0.9005279541015625, 0.9334182739257812, 0.96630859375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 5.0, 16.0, 14.0, 16.0, 29.0, 46.0, 57.0, 73.0, 99.0, 109.0, 137.0, 110.0, 85.0, 60.0, 45.0, 29.0, 20.0, 12.0, 5.0, 6.0, 8.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00022518634796142578, -0.00021913275122642517, -0.00021307915449142456, -0.00020702555775642395, -0.00020097196102142334, -0.00019491836428642273, -0.00018886476755142212, -0.0001828111708164215, -0.0001767575740814209, -0.0001707039773464203, -0.00016465038061141968, -0.00015859678387641907, -0.00015254318714141846, -0.00014648959040641785, -0.00014043599367141724, -0.00013438239693641663, -0.00012832880020141602, -0.0001222752034664154, -0.0001162216067314148, -0.00011016800999641418, -0.00010411441326141357, -9.806081652641296e-05, -9.200721979141235e-05, -8.595362305641174e-05, -7.990002632141113e-05, -7.384642958641052e-05, -6.779283285140991e-05, -6.17392361164093e-05, -5.568563938140869e-05, -4.963204264640808e-05, -4.357844591140747e-05, -3.752484917640686e-05, -3.147125244140625e-05, -2.541765570640564e-05, -1.936405897140503e-05, -1.3310462236404419e-05, -7.256865501403809e-06, -1.2032687664031982e-06, 4.850327968597412e-06, 1.0903924703598022e-05, 1.6957521438598633e-05, 2.3011118173599243e-05, 2.9064714908599854e-05, 3.5118311643600464e-05, 4.1171908378601074e-05, 4.7225505113601685e-05, 5.3279101848602295e-05, 5.9332698583602905e-05, 6.538629531860352e-05, 7.143989205360413e-05, 7.749348878860474e-05, 8.354708552360535e-05, 8.960068225860596e-05, 9.565427899360657e-05, 0.00010170787572860718, 0.00010776147246360779, 0.0001138150691986084, 0.00011986866593360901, 0.00012592226266860962, 0.00013197585940361023, 0.00013802945613861084, 0.00014408305287361145, 0.00015013664960861206, 0.00015619024634361267, 0.00016224384307861328]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 4.0, 4.0, 10.0, 6.0, 11.0, 10.0, 14.0, 29.0, 23.0, 45.0, 66.0, 131.0, 203.0, 305.0, 646.0, 1310.0, 3517.0, 12085.0, 78135.0, 776079.0, 150084.0, 17771.0, 4584.0, 1799.0, 763.0, 386.0, 210.0, 103.0, 79.0, 47.0, 29.0, 17.0, 16.0, 9.0, 12.0, 5.0, 3.0, 4.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.8388671875, -0.8159637451171875, -0.793060302734375, -0.7701568603515625, -0.74725341796875, -0.7243499755859375, -0.701446533203125, -0.6785430908203125, -0.6556396484375, -0.6327362060546875, -0.609832763671875, -0.5869293212890625, -0.56402587890625, -0.5411224365234375, -0.518218994140625, -0.4953155517578125, -0.472412109375, -0.4495086669921875, -0.426605224609375, -0.4037017822265625, -0.38079833984375, -0.3578948974609375, -0.334991455078125, -0.3120880126953125, -0.2891845703125, -0.2662811279296875, -0.243377685546875, -0.2204742431640625, -0.19757080078125, -0.1746673583984375, -0.151763916015625, -0.1288604736328125, -0.10595703125, -0.0830535888671875, -0.060150146484375, -0.0372467041015625, -0.01434326171875, 0.0085601806640625, 0.031463623046875, 0.0543670654296875, 0.0772705078125, 0.1001739501953125, 0.123077392578125, 0.1459808349609375, 0.16888427734375, 0.1917877197265625, 0.214691162109375, 0.2375946044921875, 0.260498046875, 0.2834014892578125, 0.306304931640625, 0.3292083740234375, 0.35211181640625, 0.3750152587890625, 0.397918701171875, 0.4208221435546875, 0.4437255859375, 0.4666290283203125, 0.489532470703125, 0.5124359130859375, 0.53533935546875, 0.5582427978515625, 0.581146240234375, 0.6040496826171875, 0.626953125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 4.0, 11.0, 10.0, 12.0, 18.0, 27.0, 38.0, 58.0, 77.0, 96.0, 99.0, 110.0, 94.0, 75.0, 61.0, 64.0, 43.0, 26.0, 26.0, 13.0, 11.0, 6.0, 1.0, 7.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.73388671875, -0.7111282348632812, -0.6883697509765625, -0.6656112670898438, -0.642852783203125, -0.6200942993164062, -0.5973358154296875, -0.5745773315429688, -0.55181884765625, -0.5290603637695312, -0.5063018798828125, -0.48354339599609375, -0.460784912109375, -0.43802642822265625, -0.4152679443359375, -0.39250946044921875, -0.3697509765625, -0.34699249267578125, -0.3242340087890625, -0.30147552490234375, -0.278717041015625, -0.25595855712890625, -0.2332000732421875, -0.21044158935546875, -0.18768310546875, -0.16492462158203125, -0.1421661376953125, -0.11940765380859375, -0.096649169921875, -0.07389068603515625, -0.0511322021484375, -0.02837371826171875, -0.005615234375, 0.01714324951171875, 0.0399017333984375, 0.06266021728515625, 0.085418701171875, 0.10817718505859375, 0.1309356689453125, 0.15369415283203125, 0.17645263671875, 0.19921112060546875, 0.2219696044921875, 0.24472808837890625, 0.267486572265625, 0.29024505615234375, 0.3130035400390625, 0.33576202392578125, 0.3585205078125, 0.38127899169921875, 0.4040374755859375, 0.42679595947265625, 0.449554443359375, 0.47231292724609375, 0.4950714111328125, 0.5178298950195312, 0.54058837890625, 0.5633468627929688, 0.5861053466796875, 0.6088638305664062, 0.631622314453125, 0.6543807983398438, 0.6771392822265625, 0.6998977661132812, 0.72265625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 7.0, 9.0, 14.0, 30.0, 74.0, 142.0, 275.0, 255.0, 110.0, 52.0, 25.0, 9.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.005552291870117, -20.43624496459961, -19.86693572998047, -19.29762840270996, -18.728321075439453, -18.159013748168945, -17.589706420898438, -17.020397186279297, -16.45108985900879, -15.881782531738281, -15.312474250793457, -14.743165969848633, -14.173858642578125, -13.604551315307617, -13.035243034362793, -12.465934753417969, -11.896627426147461, -11.327320098876953, -10.758011817932129, -10.188703536987305, -9.619396209716797, -9.050088882446289, -8.480780601501465, -7.911472797393799, -7.342164993286133, -6.772857189178467, -6.203549385070801, -5.634241580963135, -5.064933776855469, -4.495625972747803, -3.9263181686401367, -3.3570103645324707, -2.787700653076172, -2.218392848968506, -1.6490850448608398, -1.0797772407531738, -0.5104694366455078, 0.0588383674621582, 0.6281461715698242, 1.1974539756774902, 1.7667617797851562, 2.3360695838928223, 2.9053773880004883, 3.4746851921081543, 4.04399299621582, 4.613300800323486, 5.182608604431152, 5.751916408538818, 6.321224212646484, 6.89053201675415, 7.459839820861816, 8.02914810180664, 8.598455429077148, 9.167762756347656, 9.73707103729248, 10.306379318237305, 10.875686645507812, 11.44499397277832, 12.014302253723145, 12.583610534667969, 13.152917861938477, 13.722225189208984, 14.291533470153809, 14.860841751098633, 15.43014907836914]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 3.0, 2.0, 4.0, 4.0, 2.0, 9.0, 6.0, 15.0, 5.0, 15.0, 14.0, 21.0, 32.0, 27.0, 22.0, 21.0, 37.0, 31.0, 44.0, 44.0, 51.0, 55.0, 84.0, 68.0, 47.0, 45.0, 37.0, 31.0, 33.0, 29.0, 22.0, 20.0, 18.0, 13.0, 20.0, 20.0, 13.0, 6.0, 10.0, 6.0, 11.0, 6.0, 1.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.886995315551758, -9.6072416305542, -9.327488899230957, -9.047735214233398, -8.767982482910156, -8.488228797912598, -8.208475112915039, -7.928721904754639, -7.648968696594238, -7.369215488433838, -7.0894622802734375, -6.809708595275879, -6.5299553871154785, -6.250202178955078, -5.9704484939575195, -5.690695285797119, -5.410942077636719, -5.131188869476318, -4.851435661315918, -4.571681976318359, -4.291928768157959, -4.012175559997559, -3.732422113418579, -3.4526686668395996, -3.172915458679199, -2.893162250518799, -2.6134088039398193, -2.33365535736084, -2.0539021492004395, -1.7741488218307495, -1.4943954944610596, -1.2146421670913696, -0.9348888397216797, -0.6551355123519897, -0.3753821849822998, -0.09562885761260986, 0.18412446975708008, 0.46387779712677, 0.74363112449646, 1.02338445186615, 1.3031377792358398, 1.5828911066055298, 1.8626444339752197, 2.142397880554199, 2.4221510887145996, 2.701904296875, 2.9816577434539795, 3.261411190032959, 3.5411643981933594, 3.8209176063537598, 4.10067081451416, 4.380424499511719, 4.660177707672119, 4.9399309158325195, 5.219684600830078, 5.4994378089904785, 5.779191017150879, 6.058944225311279, 6.33869743347168, 6.618451118469238, 6.898204326629639, 7.177957534790039, 7.457711219787598, 7.737464427947998, 8.017217636108398]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 1.0, 1.0, 6.0, 6.0, 7.0, 10.0, 15.0, 14.0, 18.0, 37.0, 48.0, 92.0, 112.0, 154.0, 230.0, 329.0, 576.0, 803.0, 1432.0, 2611.0, 5187.0, 11558.0, 29692.0, 99908.0, 469829.0, 2118270.0, 1153260.0, 210292.0, 54098.0, 18737.0, 7952.0, 3885.0, 1985.0, 1163.0, 673.0, 435.0, 277.0, 182.0, 118.0, 97.0, 61.0, 37.0, 24.0, 24.0, 8.0, 9.0, 9.0, 2.0, 6.0, 3.0, 3.0, 3.0, 2.0], "bins": [-0.57421875, -0.5585975646972656, -0.5429763793945312, -0.5273551940917969, -0.5117340087890625, -0.4961128234863281, -0.48049163818359375, -0.4648704528808594, -0.449249267578125, -0.4336280822753906, -0.41800689697265625, -0.4023857116699219, -0.3867645263671875, -0.3711433410644531, -0.35552215576171875, -0.3399009704589844, -0.32427978515625, -0.3086585998535156, -0.29303741455078125, -0.2774162292480469, -0.2617950439453125, -0.24617385864257812, -0.23055267333984375, -0.21493148803710938, -0.199310302734375, -0.18368911743164062, -0.16806793212890625, -0.15244674682617188, -0.1368255615234375, -0.12120437622070312, -0.10558319091796875, -0.08996200561523438, -0.0743408203125, -0.058719635009765625, -0.04309844970703125, -0.027477264404296875, -0.0118560791015625, 0.003765106201171875, 0.01938629150390625, 0.035007476806640625, 0.050628662109375, 0.06624984741210938, 0.08187103271484375, 0.09749221801757812, 0.1131134033203125, 0.12873458862304688, 0.14435577392578125, 0.15997695922851562, 0.17559814453125, 0.19121932983398438, 0.20684051513671875, 0.22246170043945312, 0.2380828857421875, 0.2537040710449219, 0.26932525634765625, 0.2849464416503906, 0.300567626953125, 0.3161888122558594, 0.33180999755859375, 0.3474311828613281, 0.3630523681640625, 0.3786735534667969, 0.39429473876953125, 0.4099159240722656, 0.425537109375]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 13.0, 20.0, 21.0, 18.0, 32.0, 33.0, 40.0, 64.0, 71.0, 91.0, 86.0, 87.0, 72.0, 66.0, 60.0, 43.0, 45.0, 37.0, 29.0, 21.0, 7.0, 9.0, 8.0, 11.0, 7.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.9248046875, -0.8998641967773438, -0.8749237060546875, -0.8499832153320312, -0.825042724609375, -0.8001022338867188, -0.7751617431640625, -0.7502212524414062, -0.72528076171875, -0.7003402709960938, -0.6753997802734375, -0.6504592895507812, -0.625518798828125, -0.6005783081054688, -0.5756378173828125, -0.5506973266601562, -0.5257568359375, -0.5008163452148438, -0.4758758544921875, -0.45093536376953125, -0.425994873046875, -0.40105438232421875, -0.3761138916015625, -0.35117340087890625, -0.32623291015625, -0.30129241943359375, -0.2763519287109375, -0.25141143798828125, -0.226470947265625, -0.20153045654296875, -0.1765899658203125, -0.15164947509765625, -0.126708984375, -0.10176849365234375, -0.0768280029296875, -0.05188751220703125, -0.026947021484375, -0.00200653076171875, 0.0229339599609375, 0.04787445068359375, 0.07281494140625, 0.09775543212890625, 0.1226959228515625, 0.14763641357421875, 0.172576904296875, 0.19751739501953125, 0.2224578857421875, 0.24739837646484375, 0.2723388671875, 0.29727935791015625, 0.3222198486328125, 0.34716033935546875, 0.372100830078125, 0.39704132080078125, 0.4219818115234375, 0.44692230224609375, 0.47186279296875, 0.49680328369140625, 0.5217437744140625, 0.5466842651367188, 0.571624755859375, 0.5965652465820312, 0.6215057373046875, 0.6464462280273438, 0.67138671875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 11.0, 6.0, 14.0, 18.0, 27.0, 38.0, 46.0, 65.0, 133.0, 157.0, 252.0, 470.0, 976.0, 2367.0, 7928.0, 41141.0, 712388.0, 3282073.0, 120849.0, 18187.0, 4379.0, 1415.0, 574.0, 306.0, 175.0, 106.0, 52.0, 44.0, 27.0, 11.0, 14.0, 10.0, 6.0, 7.0, 6.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.2900390625, -1.25, -1.2099609375, -1.169921875, -1.1298828125, -1.08984375, -1.0498046875, -1.009765625, -0.9697265625, -0.9296875, -0.8896484375, -0.849609375, -0.8095703125, -0.76953125, -0.7294921875, -0.689453125, -0.6494140625, -0.609375, -0.5693359375, -0.529296875, -0.4892578125, -0.44921875, -0.4091796875, -0.369140625, -0.3291015625, -0.2890625, -0.2490234375, -0.208984375, -0.1689453125, -0.12890625, -0.0888671875, -0.048828125, -0.0087890625, 0.03125, 0.0712890625, 0.111328125, 0.1513671875, 0.19140625, 0.2314453125, 0.271484375, 0.3115234375, 0.3515625, 0.3916015625, 0.431640625, 0.4716796875, 0.51171875, 0.5517578125, 0.591796875, 0.6318359375, 0.671875, 0.7119140625, 0.751953125, 0.7919921875, 0.83203125, 0.8720703125, 0.912109375, 0.9521484375, 0.9921875, 1.0322265625, 1.072265625, 1.1123046875, 1.15234375, 1.1923828125, 1.232421875, 1.2724609375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 6.0, 3.0, 10.0, 9.0, 9.0, 23.0, 29.0, 26.0, 57.0, 88.0, 196.0, 385.0, 684.0, 846.0, 731.0, 369.0, 208.0, 122.0, 77.0, 48.0, 45.0, 33.0, 25.0, 10.0, 6.0, 11.0, 6.0, 6.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.451171875, -1.4125518798828125, -1.373931884765625, -1.3353118896484375, -1.29669189453125, -1.2580718994140625, -1.219451904296875, -1.1808319091796875, -1.1422119140625, -1.1035919189453125, -1.064971923828125, -1.0263519287109375, -0.98773193359375, -0.9491119384765625, -0.910491943359375, -0.8718719482421875, -0.833251953125, -0.7946319580078125, -0.756011962890625, -0.7173919677734375, -0.67877197265625, -0.6401519775390625, -0.601531982421875, -0.5629119873046875, -0.5242919921875, -0.4856719970703125, -0.447052001953125, -0.4084320068359375, -0.36981201171875, -0.3311920166015625, -0.292572021484375, -0.2539520263671875, -0.21533203125, -0.1767120361328125, -0.138092041015625, -0.0994720458984375, -0.06085205078125, -0.0222320556640625, 0.016387939453125, 0.0550079345703125, 0.0936279296875, 0.1322479248046875, 0.170867919921875, 0.2094879150390625, 0.24810791015625, 0.2867279052734375, 0.325347900390625, 0.3639678955078125, 0.402587890625, 0.4412078857421875, 0.479827880859375, 0.5184478759765625, 0.55706787109375, 0.5956878662109375, 0.634307861328125, 0.6729278564453125, 0.7115478515625, 0.7501678466796875, 0.788787841796875, 0.8274078369140625, 0.86602783203125, 0.9046478271484375, 0.943267822265625, 0.9818878173828125, 1.0205078125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 0.0, 25.0, 88.0, 265.0, 340.0, 180.0, 65.0, 18.0, 7.0, 1.0, 4.0, 2.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.717849731445312, -15.069784164428711, -14.42171859741211, -13.773653030395508, -13.12558650970459, -12.477520942687988, -11.829455375671387, -11.181388854980469, -10.533323287963867, -9.885257720947266, -9.237192153930664, -8.589126586914062, -7.9410600662231445, -7.292994499206543, -6.644928932189941, -5.996862888336182, -5.348797798156738, -4.700732231140137, -4.052666187286377, -3.4046006202697754, -2.7565348148345947, -2.108469009399414, -1.4604034423828125, -0.8123373985290527, -0.16427183151245117, 0.4837939143180847, 1.1318596601486206, 1.7799253463745117, 2.4279911518096924, 3.076056957244873, 3.7241225242614746, 4.372188568115234, 5.020254135131836, 5.6683197021484375, 6.316385746002197, 6.964451313018799, 7.612517356872559, 8.26058292388916, 8.908648490905762, 9.55671501159668, 10.204780578613281, 10.852846145629883, 11.500911712646484, 12.148977279663086, 12.797043800354004, 13.445109367370605, 14.093174934387207, 14.741241455078125, 15.38930606842041, 16.037372589111328, 16.68543815612793, 17.33350372314453, 17.981569290161133, 18.629634857177734, 19.277700424194336, 19.925765991210938, 20.57383155822754, 21.22189712524414, 21.869962692260742, 22.518028259277344, 23.166093826293945, 23.814159393310547, 24.46222686767578, 25.110292434692383, 25.758358001708984]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 6.0, 4.0, 2.0, 5.0, 7.0, 3.0, 8.0, 6.0, 20.0, 16.0, 25.0, 41.0, 27.0, 45.0, 41.0, 48.0, 63.0, 66.0, 53.0, 59.0, 56.0, 46.0, 51.0, 54.0, 39.0, 31.0, 32.0, 30.0, 20.0, 23.0, 20.0, 19.0, 10.0, 13.0, 5.0, 6.0, 2.0, 3.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.452091217041016, -5.278045654296875, -5.104000091552734, -4.929954528808594, -4.755908966064453, -4.581862926483154, -4.407817363739014, -4.233771800994873, -4.059726238250732, -3.885680675506592, -3.711635112762451, -3.5375893115997314, -3.363543748855591, -3.18949818611145, -3.0154523849487305, -2.84140682220459, -2.667361259460449, -2.4933156967163086, -2.319270133972168, -2.1452243328094482, -1.9711787700653076, -1.797133207321167, -1.6230875253677368, -1.4490418434143066, -1.274996280670166, -1.1009507179260254, -0.9269050359725952, -0.7528594136238098, -0.5788137912750244, -0.404768168926239, -0.2307225465774536, -0.05667686462402344, 0.11736869812011719, 0.2914143204689026, 0.465459942817688, 0.6395055651664734, 0.8135511875152588, 0.9875968098640442, 1.1616424322128296, 1.3356881141662598, 1.5097336769104004, 1.683779239654541, 1.8578249216079712, 2.0318706035614014, 2.205916166305542, 2.3799617290496826, 2.5540075302124023, 2.728053092956543, 2.9020986557006836, 3.076144218444824, 3.250189781188965, 3.4242355823516846, 3.598281145095825, 3.772326707839966, 3.9463725090026855, 4.120418071746826, 4.294463634490967, 4.468509197235107, 4.642554759979248, 4.816600322723389, 4.9906463623046875, 5.164691925048828, 5.338737487792969, 5.512783050537109, 5.68682861328125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 4.0, 20.0, 4.0, 16.0, 29.0, 26.0, 64.0, 91.0, 134.0, 221.0, 324.0, 512.0, 859.0, 1397.0, 2296.0, 4122.0, 7519.0, 14305.0, 27524.0, 55244.0, 113443.0, 223348.0, 272271.0, 163133.0, 79110.0, 39086.0, 19640.0, 10175.0, 5677.0, 3166.0, 1784.0, 1099.0, 695.0, 401.0, 267.0, 174.0, 130.0, 79.0, 53.0, 40.0, 22.0, 15.0, 9.0, 10.0, 9.0, 5.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.67431640625, -0.652740478515625, -0.63116455078125, -0.609588623046875, -0.5880126953125, -0.566436767578125, -0.54486083984375, -0.523284912109375, -0.501708984375, -0.480133056640625, -0.45855712890625, -0.436981201171875, -0.4154052734375, -0.393829345703125, -0.37225341796875, -0.350677490234375, -0.3291015625, -0.307525634765625, -0.28594970703125, -0.264373779296875, -0.2427978515625, -0.221221923828125, -0.19964599609375, -0.178070068359375, -0.156494140625, -0.134918212890625, -0.11334228515625, -0.091766357421875, -0.0701904296875, -0.048614501953125, -0.02703857421875, -0.005462646484375, 0.01611328125, 0.037689208984375, 0.05926513671875, 0.080841064453125, 0.1024169921875, 0.123992919921875, 0.14556884765625, 0.167144775390625, 0.188720703125, 0.210296630859375, 0.23187255859375, 0.253448486328125, 0.2750244140625, 0.296600341796875, 0.31817626953125, 0.339752197265625, 0.361328125, 0.382904052734375, 0.40447998046875, 0.426055908203125, 0.4476318359375, 0.469207763671875, 0.49078369140625, 0.512359619140625, 0.533935546875, 0.555511474609375, 0.57708740234375, 0.598663330078125, 0.6202392578125, 0.641815185546875, 0.66339111328125, 0.684967041015625, 0.70654296875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 7.0, 16.0, 13.0, 26.0, 26.0, 34.0, 56.0, 49.0, 81.0, 68.0, 75.0, 67.0, 75.0, 80.0, 66.0, 61.0, 57.0, 35.0, 29.0, 25.0, 12.0, 11.0, 10.0, 7.0, 6.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8974609375, -0.8722152709960938, -0.8469696044921875, -0.8217239379882812, -0.796478271484375, -0.7712326049804688, -0.7459869384765625, -0.7207412719726562, -0.69549560546875, -0.6702499389648438, -0.6450042724609375, -0.6197586059570312, -0.594512939453125, -0.5692672729492188, -0.5440216064453125, -0.5187759399414062, -0.4935302734375, -0.46828460693359375, -0.4430389404296875, -0.41779327392578125, -0.392547607421875, -0.36730194091796875, -0.3420562744140625, -0.31681060791015625, -0.29156494140625, -0.26631927490234375, -0.2410736083984375, -0.21582794189453125, -0.190582275390625, -0.16533660888671875, -0.1400909423828125, -0.11484527587890625, -0.089599609375, -0.06435394287109375, -0.0391082763671875, -0.01386260986328125, 0.011383056640625, 0.03662872314453125, 0.0618743896484375, 0.08712005615234375, 0.11236572265625, 0.13761138916015625, 0.1628570556640625, 0.18810272216796875, 0.213348388671875, 0.23859405517578125, 0.2638397216796875, 0.28908538818359375, 0.3143310546875, 0.33957672119140625, 0.3648223876953125, 0.39006805419921875, 0.415313720703125, 0.44055938720703125, 0.4658050537109375, 0.49105072021484375, 0.51629638671875, 0.5415420532226562, 0.5667877197265625, 0.5920333862304688, 0.617279052734375, 0.6425247192382812, 0.6677703857421875, 0.6930160522460938, 0.71826171875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 6.0, 5.0, 5.0, 16.0, 14.0, 29.0, 39.0, 50.0, 77.0, 130.0, 196.0, 298.0, 472.0, 785.0, 1654.0, 4112.0, 17896.0, 119542.0, 700552.0, 169199.0, 24164.0, 5064.0, 1812.0, 905.0, 551.0, 328.0, 196.0, 149.0, 98.0, 59.0, 44.0, 31.0, 30.0, 16.0, 11.0, 4.0, 2.0, 8.0, 1.0, 2.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5, -1.443572998046875, -1.38714599609375, -1.330718994140625, -1.2742919921875, -1.217864990234375, -1.16143798828125, -1.105010986328125, -1.048583984375, -0.992156982421875, -0.93572998046875, -0.879302978515625, -0.8228759765625, -0.766448974609375, -0.71002197265625, -0.653594970703125, -0.59716796875, -0.540740966796875, -0.48431396484375, -0.427886962890625, -0.3714599609375, -0.315032958984375, -0.25860595703125, -0.202178955078125, -0.145751953125, -0.089324951171875, -0.03289794921875, 0.023529052734375, 0.0799560546875, 0.136383056640625, 0.19281005859375, 0.249237060546875, 0.3056640625, 0.362091064453125, 0.41851806640625, 0.474945068359375, 0.5313720703125, 0.587799072265625, 0.64422607421875, 0.700653076171875, 0.757080078125, 0.813507080078125, 0.86993408203125, 0.926361083984375, 0.9827880859375, 1.039215087890625, 1.09564208984375, 1.152069091796875, 1.20849609375, 1.264923095703125, 1.32135009765625, 1.377777099609375, 1.4342041015625, 1.490631103515625, 1.54705810546875, 1.603485107421875, 1.659912109375, 1.716339111328125, 1.77276611328125, 1.829193115234375, 1.8856201171875, 1.942047119140625, 1.99847412109375, 2.054901123046875, 2.111328125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 6.0, 1.0, 2.0, 6.0, 5.0, 7.0, 6.0, 11.0, 9.0, 18.0, 17.0, 18.0, 37.0, 30.0, 25.0, 39.0, 38.0, 37.0, 35.0, 60.0, 48.0, 49.0, 50.0, 65.0, 42.0, 49.0, 41.0, 41.0, 30.0, 25.0, 23.0, 19.0, 23.0, 13.0, 20.0, 16.0, 13.0, 10.0, 5.0, 3.0, 4.0, 3.0, 2.0, 4.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.755859375, -1.696136474609375, -1.63641357421875, -1.576690673828125, -1.5169677734375, -1.457244873046875, -1.39752197265625, -1.337799072265625, -1.278076171875, -1.218353271484375, -1.15863037109375, -1.098907470703125, -1.0391845703125, -0.979461669921875, -0.91973876953125, -0.860015869140625, -0.80029296875, -0.740570068359375, -0.68084716796875, -0.621124267578125, -0.5614013671875, -0.501678466796875, -0.44195556640625, -0.382232666015625, -0.322509765625, -0.262786865234375, -0.20306396484375, -0.143341064453125, -0.0836181640625, -0.023895263671875, 0.03582763671875, 0.095550537109375, 0.1552734375, 0.214996337890625, 0.27471923828125, 0.334442138671875, 0.3941650390625, 0.453887939453125, 0.51361083984375, 0.573333740234375, 0.633056640625, 0.692779541015625, 0.75250244140625, 0.812225341796875, 0.8719482421875, 0.931671142578125, 0.99139404296875, 1.051116943359375, 1.11083984375, 1.170562744140625, 1.23028564453125, 1.290008544921875, 1.3497314453125, 1.409454345703125, 1.46917724609375, 1.528900146484375, 1.588623046875, 1.648345947265625, 1.70806884765625, 1.767791748046875, 1.8275146484375, 1.887237548828125, 1.94696044921875, 2.006683349609375, 2.06640625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 2.0, 3.0, 11.0, 17.0, 20.0, 20.0, 25.0, 49.0, 94.0, 150.0, 287.0, 621.0, 1442.0, 3840.0, 12478.0, 50227.0, 306122.0, 579971.0, 68855.0, 16158.0, 4892.0, 1694.0, 786.0, 344.0, 157.0, 106.0, 61.0, 38.0, 26.0, 16.0, 13.0, 12.0, 6.0, 4.0, 6.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.564453125, -0.5463027954101562, -0.5281524658203125, -0.5100021362304688, -0.491851806640625, -0.47370147705078125, -0.4555511474609375, -0.43740081787109375, -0.41925048828125, -0.40110015869140625, -0.3829498291015625, -0.36479949951171875, -0.346649169921875, -0.32849884033203125, -0.3103485107421875, -0.29219818115234375, -0.2740478515625, -0.25589752197265625, -0.2377471923828125, -0.21959686279296875, -0.201446533203125, -0.18329620361328125, -0.1651458740234375, -0.14699554443359375, -0.12884521484375, -0.11069488525390625, -0.0925445556640625, -0.07439422607421875, -0.056243896484375, -0.03809356689453125, -0.0199432373046875, -0.00179290771484375, 0.016357421875, 0.03450775146484375, 0.0526580810546875, 0.07080841064453125, 0.088958740234375, 0.10710906982421875, 0.1252593994140625, 0.14340972900390625, 0.16156005859375, 0.17971038818359375, 0.1978607177734375, 0.21601104736328125, 0.234161376953125, 0.25231170654296875, 0.2704620361328125, 0.28861236572265625, 0.3067626953125, 0.32491302490234375, 0.3430633544921875, 0.36121368408203125, 0.379364013671875, 0.39751434326171875, 0.4156646728515625, 0.43381500244140625, 0.45196533203125, 0.47011566162109375, 0.4882659912109375, 0.5064163208007812, 0.524566650390625, 0.5427169799804688, 0.5608673095703125, 0.5790176391601562, 0.59716796875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 7.0, 1.0, 0.0, 4.0, 5.0, 7.0, 8.0, 8.0, 12.0, 18.0, 27.0, 36.0, 40.0, 62.0, 95.0, 120.0, 128.0, 123.0, 72.0, 53.0, 39.0, 24.0, 23.0, 21.0, 16.0, 7.0, 10.0, 4.0, 8.0, 4.0, 2.0, 6.0, 2.0, 3.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0002028942108154297, -0.00019639357924461365, -0.0001898929476737976, -0.00018339231610298157, -0.00017689168453216553, -0.0001703910529613495, -0.00016389042139053345, -0.0001573897898197174, -0.00015088915824890137, -0.00014438852667808533, -0.0001378878951072693, -0.00013138726353645325, -0.0001248866319656372, -0.00011838600039482117, -0.00011188536882400513, -0.00010538473725318909, -9.888410568237305e-05, -9.238347411155701e-05, -8.588284254074097e-05, -7.938221096992493e-05, -7.288157939910889e-05, -6.638094782829285e-05, -5.988031625747681e-05, -5.3379684686660767e-05, -4.6879053115844727e-05, -4.0378421545028687e-05, -3.3877789974212646e-05, -2.7377158403396606e-05, -2.0876526832580566e-05, -1.4375895261764526e-05, -7.875263690948486e-06, -1.3746321201324463e-06, 5.125999450683594e-06, 1.1626631021499634e-05, 1.8127262592315674e-05, 2.4627894163131714e-05, 3.1128525733947754e-05, 3.7629157304763794e-05, 4.4129788875579834e-05, 5.0630420446395874e-05, 5.7131052017211914e-05, 6.363168358802795e-05, 7.0132315158844e-05, 7.663294672966003e-05, 8.313357830047607e-05, 8.963420987129211e-05, 9.613484144210815e-05, 0.0001026354730129242, 0.00010913610458374023, 0.00011563673615455627, 0.00012213736772537231, 0.00012863799929618835, 0.0001351386308670044, 0.00014163926243782043, 0.00014813989400863647, 0.00015464052557945251, 0.00016114115715026855, 0.0001676417887210846, 0.00017414242029190063, 0.00018064305186271667, 0.00018714368343353271, 0.00019364431500434875, 0.0002001449465751648, 0.00020664557814598083, 0.00021314620971679688]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 7.0, 5.0, 6.0, 7.0, 8.0, 20.0, 16.0, 32.0, 51.0, 80.0, 134.0, 249.0, 494.0, 955.0, 2302.0, 6379.0, 25159.0, 162554.0, 707979.0, 113626.0, 19323.0, 5338.0, 1953.0, 862.0, 430.0, 252.0, 121.0, 86.0, 39.0, 19.0, 15.0, 18.0, 11.0, 7.0, 10.0, 2.0, 0.0, 4.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6513671875, -0.6318740844726562, -0.6123809814453125, -0.5928878784179688, -0.573394775390625, -0.5539016723632812, -0.5344085693359375, -0.5149154663085938, -0.49542236328125, -0.47592926025390625, -0.4564361572265625, -0.43694305419921875, -0.417449951171875, -0.39795684814453125, -0.3784637451171875, -0.35897064208984375, -0.3394775390625, -0.31998443603515625, -0.3004913330078125, -0.28099822998046875, -0.261505126953125, -0.24201202392578125, -0.2225189208984375, -0.20302581787109375, -0.18353271484375, -0.16403961181640625, -0.1445465087890625, -0.12505340576171875, -0.105560302734375, -0.08606719970703125, -0.0665740966796875, -0.04708099365234375, -0.027587890625, -0.00809478759765625, 0.0113983154296875, 0.03089141845703125, 0.050384521484375, 0.06987762451171875, 0.0893707275390625, 0.10886383056640625, 0.12835693359375, 0.14785003662109375, 0.1673431396484375, 0.18683624267578125, 0.206329345703125, 0.22582244873046875, 0.2453155517578125, 0.26480865478515625, 0.2843017578125, 0.30379486083984375, 0.3232879638671875, 0.34278106689453125, 0.362274169921875, 0.38176727294921875, 0.4012603759765625, 0.42075347900390625, 0.44024658203125, 0.45973968505859375, 0.4792327880859375, 0.49872589111328125, 0.518218994140625, 0.5377120971679688, 0.5572052001953125, 0.5766983032226562, 0.59619140625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 6.0, 7.0, 7.0, 13.0, 13.0, 21.0, 34.0, 47.0, 72.0, 83.0, 109.0, 118.0, 109.0, 92.0, 84.0, 61.0, 35.0, 19.0, 26.0, 19.0, 11.0, 7.0, 6.0, 5.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.88671875, -0.8646240234375, -0.842529296875, -0.8204345703125, -0.79833984375, -0.7762451171875, -0.754150390625, -0.7320556640625, -0.7099609375, -0.6878662109375, -0.665771484375, -0.6436767578125, -0.62158203125, -0.5994873046875, -0.577392578125, -0.5552978515625, -0.533203125, -0.5111083984375, -0.489013671875, -0.4669189453125, -0.44482421875, -0.4227294921875, -0.400634765625, -0.3785400390625, -0.3564453125, -0.3343505859375, -0.312255859375, -0.2901611328125, -0.26806640625, -0.2459716796875, -0.223876953125, -0.2017822265625, -0.1796875, -0.1575927734375, -0.135498046875, -0.1134033203125, -0.09130859375, -0.0692138671875, -0.047119140625, -0.0250244140625, -0.0029296875, 0.0191650390625, 0.041259765625, 0.0633544921875, 0.08544921875, 0.1075439453125, 0.129638671875, 0.1517333984375, 0.173828125, 0.1959228515625, 0.218017578125, 0.2401123046875, 0.26220703125, 0.2843017578125, 0.306396484375, 0.3284912109375, 0.3505859375, 0.3726806640625, 0.394775390625, 0.4168701171875, 0.43896484375, 0.4610595703125, 0.483154296875, 0.5052490234375, 0.52734375]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 0.0, 1.0, 5.0, 3.0, 9.0, 24.0, 37.0, 89.0, 144.0, 274.0, 182.0, 113.0, 60.0, 27.0, 16.0, 7.0, 4.0, 2.0, 2.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-16.544530868530273, -16.093183517456055, -15.641834259033203, -15.190485954284668, -14.739137649536133, -14.287790298461914, -13.836441040039062, -13.385093688964844, -12.933745384216309, -12.482397079467773, -12.031048774719238, -11.579700469970703, -11.128352165222168, -10.677003860473633, -10.225656509399414, -9.774308204650879, -9.322959899902344, -8.871611595153809, -8.420263290405273, -7.968914985656738, -7.517567157745361, -7.066218852996826, -6.614870548248291, -6.163522720336914, -5.7121734619140625, -5.260825157165527, -4.809476852416992, -4.358128547668457, -3.90678071975708, -3.455432415008545, -3.0040841102600098, -2.5527360439300537, -2.1013879776000977, -1.650039792060852, -1.1986916065216064, -0.7473433017730713, -0.2959951162338257, 0.15535306930541992, 0.6067013740539551, 1.0580494403839111, 1.5093977451324463, 1.960745930671692, 2.4120941162109375, 2.8634424209594727, 3.314790725708008, 3.766138792037964, 4.217487335205078, 4.668835163116455, 5.12018346786499, 5.571531772613525, 6.0228800773620605, 6.4742279052734375, 6.925576210021973, 7.376924514770508, 7.828272819519043, 8.279621124267578, 8.730969429016113, 9.182317733764648, 9.633666038513184, 10.085014343261719, 10.536362648010254, 10.987710952758789, 11.439058303833008, 11.890406608581543, 12.341754913330078]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 3.0, 4.0, 2.0, 6.0, 3.0, 11.0, 11.0, 10.0, 15.0, 15.0, 13.0, 16.0, 15.0, 23.0, 17.0, 22.0, 34.0, 36.0, 36.0, 45.0, 45.0, 75.0, 69.0, 71.0, 55.0, 37.0, 49.0, 24.0, 33.0, 42.0, 30.0, 13.0, 24.0, 18.0, 20.0, 12.0, 12.0, 8.0, 9.0, 12.0, 8.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.604677677154541, -7.371061325073242, -7.137444496154785, -6.903828144073486, -6.6702117919921875, -6.436595439910889, -6.20297908782959, -5.969362258911133, -5.735745906829834, -5.502129554748535, -5.268512725830078, -5.034896373748779, -4.8012800216674805, -4.567663669586182, -4.334047317504883, -4.100430488586426, -3.866814136505127, -3.633197784423828, -3.39958119392395, -3.1659646034240723, -2.9323482513427734, -2.6987318992614746, -2.4651153087615967, -2.2314987182617188, -1.99788236618042, -1.7642658948898315, -1.5306494235992432, -1.2970329523086548, -1.0634164810180664, -0.829800009727478, -0.5961835384368896, -0.36256706714630127, -0.1289501190185547, 0.10466635227203369, 0.33828282356262207, 0.5718992948532104, 0.8055157661437988, 1.0391322374343872, 1.2727487087249756, 1.506365180015564, 1.7399816513061523, 1.9735981225967407, 2.207214593887329, 2.440831184387207, 2.674447536468506, 2.9080638885498047, 3.1416804790496826, 3.3752970695495605, 3.6089134216308594, 3.842529773712158, 4.076146125793457, 4.309762954711914, 4.543379306793213, 4.776995658874512, 5.010612487792969, 5.244228839874268, 5.477845191955566, 5.711461544036865, 5.945077896118164, 6.178694725036621, 6.41231107711792, 6.645927429199219, 6.879544258117676, 7.113160610198975, 7.346776962280273]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 8.0, 11.0, 14.0, 9.0, 14.0, 23.0, 33.0, 39.0, 64.0, 77.0, 96.0, 125.0, 205.0, 300.0, 437.0, 727.0, 1124.0, 1924.0, 4051.0, 10384.0, 33555.0, 162232.0, 1198844.0, 2320689.0, 371189.0, 59688.0, 15744.0, 6034.0, 2710.0, 1430.0, 785.0, 505.0, 377.0, 240.0, 169.0, 113.0, 100.0, 70.0, 41.0, 30.0, 21.0, 18.0, 9.0, 14.0, 11.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.6845703125, -0.665130615234375, -0.64569091796875, -0.626251220703125, -0.6068115234375, -0.587371826171875, -0.56793212890625, -0.548492431640625, -0.529052734375, -0.509613037109375, -0.49017333984375, -0.470733642578125, -0.4512939453125, -0.431854248046875, -0.41241455078125, -0.392974853515625, -0.37353515625, -0.354095458984375, -0.33465576171875, -0.315216064453125, -0.2957763671875, -0.276336669921875, -0.25689697265625, -0.237457275390625, -0.218017578125, -0.198577880859375, -0.17913818359375, -0.159698486328125, -0.1402587890625, -0.120819091796875, -0.10137939453125, -0.081939697265625, -0.0625, -0.043060302734375, -0.02362060546875, -0.004180908203125, 0.0152587890625, 0.034698486328125, 0.05413818359375, 0.073577880859375, 0.093017578125, 0.112457275390625, 0.13189697265625, 0.151336669921875, 0.1707763671875, 0.190216064453125, 0.20965576171875, 0.229095458984375, 0.24853515625, 0.267974853515625, 0.28741455078125, 0.306854248046875, 0.3262939453125, 0.345733642578125, 0.36517333984375, 0.384613037109375, 0.404052734375, 0.423492431640625, 0.44293212890625, 0.462371826171875, 0.4818115234375, 0.501251220703125, 0.52069091796875, 0.540130615234375, 0.5595703125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 5.0, 4.0, 4.0, 12.0, 13.0, 19.0, 28.0, 39.0, 50.0, 56.0, 66.0, 72.0, 65.0, 86.0, 82.0, 79.0, 71.0, 51.0, 46.0, 37.0, 36.0, 19.0, 23.0, 11.0, 10.0, 11.0, 7.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.912109375, -0.8873443603515625, -0.862579345703125, -0.8378143310546875, -0.81304931640625, -0.7882843017578125, -0.763519287109375, -0.7387542724609375, -0.7139892578125, -0.6892242431640625, -0.664459228515625, -0.6396942138671875, -0.61492919921875, -0.5901641845703125, -0.565399169921875, -0.5406341552734375, -0.515869140625, -0.4911041259765625, -0.466339111328125, -0.4415740966796875, -0.41680908203125, -0.3920440673828125, -0.367279052734375, -0.3425140380859375, -0.3177490234375, -0.2929840087890625, -0.268218994140625, -0.2434539794921875, -0.21868896484375, -0.1939239501953125, -0.169158935546875, -0.1443939208984375, -0.11962890625, -0.0948638916015625, -0.070098876953125, -0.0453338623046875, -0.02056884765625, 0.0041961669921875, 0.028961181640625, 0.0537261962890625, 0.0784912109375, 0.1032562255859375, 0.128021240234375, 0.1527862548828125, 0.17755126953125, 0.2023162841796875, 0.227081298828125, 0.2518463134765625, 0.276611328125, 0.3013763427734375, 0.326141357421875, 0.3509063720703125, 0.37567138671875, 0.4004364013671875, 0.425201416015625, 0.4499664306640625, 0.4747314453125, 0.4994964599609375, 0.524261474609375, 0.5490264892578125, 0.57379150390625, 0.5985565185546875, 0.623321533203125, 0.6480865478515625, 0.6728515625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 4.0, 4.0, 5.0, 16.0, 14.0, 14.0, 22.0, 30.0, 54.0, 68.0, 80.0, 135.0, 231.0, 361.0, 770.0, 1747.0, 4928.0, 25187.0, 674290.0, 3408030.0, 65555.0, 8628.0, 2277.0, 874.0, 396.0, 207.0, 130.0, 70.0, 63.0, 27.0, 18.0, 15.0, 7.0, 8.0, 7.0, 7.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.630859375, -1.5802001953125, -1.529541015625, -1.4788818359375, -1.42822265625, -1.3775634765625, -1.326904296875, -1.2762451171875, -1.2255859375, -1.1749267578125, -1.124267578125, -1.0736083984375, -1.02294921875, -0.9722900390625, -0.921630859375, -0.8709716796875, -0.8203125, -0.7696533203125, -0.718994140625, -0.6683349609375, -0.61767578125, -0.5670166015625, -0.516357421875, -0.4656982421875, -0.4150390625, -0.3643798828125, -0.313720703125, -0.2630615234375, -0.21240234375, -0.1617431640625, -0.111083984375, -0.0604248046875, -0.009765625, 0.0408935546875, 0.091552734375, 0.1422119140625, 0.19287109375, 0.2435302734375, 0.294189453125, 0.3448486328125, 0.3955078125, 0.4461669921875, 0.496826171875, 0.5474853515625, 0.59814453125, 0.6488037109375, 0.699462890625, 0.7501220703125, 0.80078125, 0.8514404296875, 0.902099609375, 0.9527587890625, 1.00341796875, 1.0540771484375, 1.104736328125, 1.1553955078125, 1.2060546875, 1.2567138671875, 1.307373046875, 1.3580322265625, 1.40869140625, 1.4593505859375, 1.510009765625, 1.5606689453125, 1.611328125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 5.0, 8.0, 12.0, 9.0, 30.0, 24.0, 42.0, 78.0, 135.0, 237.0, 460.0, 752.0, 858.0, 606.0, 345.0, 182.0, 98.0, 62.0, 38.0, 22.0, 13.0, 15.0, 11.0, 3.0, 3.0, 4.0, 3.0, 4.0, 3.0, 2.0, 5.0, 0.0, 2.0, 2.0], "bins": [-1.623046875, -1.5846176147460938, -1.5461883544921875, -1.5077590942382812, -1.469329833984375, -1.4309005737304688, -1.3924713134765625, -1.3540420532226562, -1.31561279296875, -1.2771835327148438, -1.2387542724609375, -1.2003250122070312, -1.161895751953125, -1.1234664916992188, -1.0850372314453125, -1.0466079711914062, -1.0081787109375, -0.9697494506835938, -0.9313201904296875, -0.8928909301757812, -0.854461669921875, -0.8160324096679688, -0.7776031494140625, -0.7391738891601562, -0.70074462890625, -0.6623153686523438, -0.6238861083984375, -0.5854568481445312, -0.547027587890625, -0.5085983276367188, -0.4701690673828125, -0.43173980712890625, -0.393310546875, -0.35488128662109375, -0.3164520263671875, -0.27802276611328125, -0.239593505859375, -0.20116424560546875, -0.1627349853515625, -0.12430572509765625, -0.08587646484375, -0.04744720458984375, -0.0090179443359375, 0.02941131591796875, 0.067840576171875, 0.10626983642578125, 0.1446990966796875, 0.18312835693359375, 0.2215576171875, 0.25998687744140625, 0.2984161376953125, 0.33684539794921875, 0.375274658203125, 0.41370391845703125, 0.4521331787109375, 0.49056243896484375, 0.52899169921875, 0.5674209594726562, 0.6058502197265625, 0.6442794799804688, 0.682708740234375, 0.7211380004882812, 0.7595672607421875, 0.7979965209960938, 0.83642578125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 6.0, 9.0, 13.0, 17.0, 54.0, 110.0, 165.0, 173.0, 193.0, 115.0, 70.0, 29.0, 19.0, 12.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.369527816772461, -12.996055603027344, -12.62258243560791, -12.249110221862793, -11.87563705444336, -11.502164840698242, -11.128692626953125, -10.755219459533691, -10.381746292114258, -10.00827407836914, -9.634800910949707, -9.26132869720459, -8.887855529785156, -8.514383316040039, -8.140911102294922, -7.767437934875488, -7.393965721130371, -7.020493030548096, -6.64702033996582, -6.273548126220703, -5.9000749588012695, -5.526602745056152, -5.153130054473877, -4.779657363891602, -4.406184673309326, -4.032711982727051, -3.6592392921447754, -3.285766839981079, -2.9122941493988037, -2.5388214588165283, -2.165349006652832, -1.7918763160705566, -1.4184045791625977, -1.0449318885803223, -0.6714593172073364, -0.2979867458343506, 0.0754859447479248, 0.4489586353302002, 0.8224310874938965, 1.1959037780761719, 1.5693764686584473, 1.9428491592407227, 2.316321849822998, 2.6897943019866943, 3.0632669925689697, 3.436739683151245, 3.8102121353149414, 4.183684825897217, 4.557157516479492, 4.930630207061768, 5.304102897644043, 5.67757511138916, 6.051048278808594, 6.424520492553711, 6.797993183135986, 7.171465873718262, 7.544938564300537, 7.9184112548828125, 8.29188346862793, 8.665356636047363, 9.03882884979248, 9.412302017211914, 9.785774230957031, 10.159246444702148, 10.532719612121582]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 4.0, 0.0, 3.0, 4.0, 2.0, 8.0, 7.0, 10.0, 13.0, 8.0, 22.0, 18.0, 20.0, 18.0, 30.0, 35.0, 39.0, 43.0, 37.0, 49.0, 59.0, 47.0, 52.0, 49.0, 43.0, 39.0, 37.0, 43.0, 40.0, 36.0, 25.0, 25.0, 27.0, 16.0, 14.0, 15.0, 17.0, 8.0, 10.0, 11.0, 8.0, 7.0, 4.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.286811828613281, -5.130206108093262, -4.973600387573242, -4.816994667053223, -4.660388946533203, -4.503783226013184, -4.347177505493164, -4.1905717849731445, -4.033966064453125, -3.8773603439331055, -3.720754623413086, -3.5641489028930664, -3.407543182373047, -3.2509374618530273, -3.094331979751587, -2.9377262592315674, -2.781120777130127, -2.6245150566101074, -2.467909336090088, -2.3113036155700684, -2.154697895050049, -1.9980922937393188, -1.8414866924285889, -1.6848809719085693, -1.5282752513885498, -1.3716695308685303, -1.2150638103485107, -1.0584582090377808, -0.9018524885177612, -0.7452467679977417, -0.5886411070823669, -0.4320354461669922, -0.27542972564697266, -0.11882403492927551, 0.03778165578842163, 0.19438734650611877, 0.3509930372238159, 0.5075987577438354, 0.6642044186592102, 0.820810079574585, 0.9774158000946045, 1.134021520614624, 1.2906272411346436, 1.4472328424453735, 1.603838562965393, 1.7604442834854126, 1.9170498847961426, 2.073655605316162, 2.2302613258361816, 2.386867046356201, 2.5434727668762207, 2.7000784873962402, 2.8566842079162598, 3.0132899284362793, 3.1698954105377197, 3.3265011310577393, 3.483106851577759, 3.6397125720977783, 3.796318292617798, 3.9529240131378174, 4.109529495239258, 4.266135215759277, 4.422740936279297, 4.579346656799316, 4.735952377319336]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 5.0, 6.0, 10.0, 14.0, 16.0, 35.0, 42.0, 58.0, 78.0, 145.0, 234.0, 351.0, 577.0, 892.0, 1608.0, 2834.0, 5284.0, 10934.0, 23501.0, 54898.0, 129465.0, 258400.0, 281321.0, 155530.0, 66614.0, 28608.0, 13009.0, 6476.0, 3163.0, 1803.0, 990.0, 604.0, 359.0, 217.0, 164.0, 91.0, 68.0, 42.0, 40.0, 26.0, 11.0, 10.0, 12.0, 6.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.7626953125, -0.7381820678710938, -0.7136688232421875, -0.6891555786132812, -0.664642333984375, -0.6401290893554688, -0.6156158447265625, -0.5911026000976562, -0.56658935546875, -0.5420761108398438, -0.5175628662109375, -0.49304962158203125, -0.468536376953125, -0.44402313232421875, -0.4195098876953125, -0.39499664306640625, -0.3704833984375, -0.34597015380859375, -0.3214569091796875, -0.29694366455078125, -0.272430419921875, -0.24791717529296875, -0.2234039306640625, -0.19889068603515625, -0.17437744140625, -0.14986419677734375, -0.1253509521484375, -0.10083770751953125, -0.076324462890625, -0.05181121826171875, -0.0272979736328125, -0.00278472900390625, 0.021728515625, 0.04624176025390625, 0.0707550048828125, 0.09526824951171875, 0.119781494140625, 0.14429473876953125, 0.1688079833984375, 0.19332122802734375, 0.21783447265625, 0.24234771728515625, 0.2668609619140625, 0.29137420654296875, 0.315887451171875, 0.34040069580078125, 0.3649139404296875, 0.38942718505859375, 0.4139404296875, 0.43845367431640625, 0.4629669189453125, 0.48748016357421875, 0.511993408203125, 0.5365066528320312, 0.5610198974609375, 0.5855331420898438, 0.61004638671875, 0.6345596313476562, 0.6590728759765625, 0.6835861206054688, 0.708099365234375, 0.7326126098632812, 0.7571258544921875, 0.7816390991210938, 0.80615234375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 2.0, 1.0, 3.0, 8.0, 17.0, 9.0, 14.0, 21.0, 38.0, 45.0, 43.0, 55.0, 59.0, 86.0, 77.0, 77.0, 86.0, 60.0, 77.0, 50.0, 35.0, 34.0, 32.0, 19.0, 19.0, 11.0, 11.0, 7.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.93408203125, -0.9090118408203125, -0.883941650390625, -0.8588714599609375, -0.83380126953125, -0.8087310791015625, -0.783660888671875, -0.7585906982421875, -0.7335205078125, -0.7084503173828125, -0.683380126953125, -0.6583099365234375, -0.63323974609375, -0.6081695556640625, -0.583099365234375, -0.5580291748046875, -0.532958984375, -0.5078887939453125, -0.482818603515625, -0.4577484130859375, -0.43267822265625, -0.4076080322265625, -0.382537841796875, -0.3574676513671875, -0.3323974609375, -0.3073272705078125, -0.282257080078125, -0.2571868896484375, -0.23211669921875, -0.2070465087890625, -0.181976318359375, -0.1569061279296875, -0.1318359375, -0.1067657470703125, -0.081695556640625, -0.0566253662109375, -0.03155517578125, -0.0064849853515625, 0.018585205078125, 0.0436553955078125, 0.0687255859375, 0.0937957763671875, 0.118865966796875, 0.1439361572265625, 0.16900634765625, 0.1940765380859375, 0.219146728515625, 0.2442169189453125, 0.269287109375, 0.2943572998046875, 0.319427490234375, 0.3444976806640625, 0.36956787109375, 0.3946380615234375, 0.419708251953125, 0.4447784423828125, 0.4698486328125, 0.4949188232421875, 0.519989013671875, 0.5450592041015625, 0.57012939453125, 0.5951995849609375, 0.620269775390625, 0.6453399658203125, 0.67041015625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 3.0, 5.0, 13.0, 8.0, 9.0, 12.0, 17.0, 29.0, 38.0, 31.0, 61.0, 78.0, 124.0, 184.0, 305.0, 648.0, 1367.0, 3675.0, 10977.0, 40248.0, 173655.0, 599504.0, 163013.0, 37750.0, 10456.0, 3493.0, 1294.0, 612.0, 344.0, 194.0, 95.0, 77.0, 53.0, 45.0, 35.0, 27.0, 14.0, 15.0, 9.0, 9.0, 11.0, 3.0, 5.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.390625, -1.347808837890625, -1.30499267578125, -1.262176513671875, -1.2193603515625, -1.176544189453125, -1.13372802734375, -1.090911865234375, -1.048095703125, -1.005279541015625, -0.96246337890625, -0.919647216796875, -0.8768310546875, -0.834014892578125, -0.79119873046875, -0.748382568359375, -0.70556640625, -0.662750244140625, -0.61993408203125, -0.577117919921875, -0.5343017578125, -0.491485595703125, -0.44866943359375, -0.405853271484375, -0.363037109375, -0.320220947265625, -0.27740478515625, -0.234588623046875, -0.1917724609375, -0.148956298828125, -0.10614013671875, -0.063323974609375, -0.0205078125, 0.022308349609375, 0.06512451171875, 0.107940673828125, 0.1507568359375, 0.193572998046875, 0.23638916015625, 0.279205322265625, 0.322021484375, 0.364837646484375, 0.40765380859375, 0.450469970703125, 0.4932861328125, 0.536102294921875, 0.57891845703125, 0.621734619140625, 0.66455078125, 0.707366943359375, 0.75018310546875, 0.792999267578125, 0.8358154296875, 0.878631591796875, 0.92144775390625, 0.964263916015625, 1.007080078125, 1.049896240234375, 1.09271240234375, 1.135528564453125, 1.1783447265625, 1.221160888671875, 1.26397705078125, 1.306793212890625, 1.349609375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 3.0, 4.0, 3.0, 9.0, 7.0, 10.0, 10.0, 16.0, 27.0, 26.0, 34.0, 41.0, 43.0, 43.0, 44.0, 52.0, 55.0, 85.0, 67.0, 73.0, 62.0, 47.0, 41.0, 42.0, 25.0, 27.0, 18.0, 29.0, 10.0, 6.0, 8.0, 7.0, 10.0, 4.0, 5.0, 6.0, 2.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.88671875, -2.81036376953125, -2.7340087890625, -2.65765380859375, -2.581298828125, -2.50494384765625, -2.4285888671875, -2.35223388671875, -2.27587890625, -2.19952392578125, -2.1231689453125, -2.04681396484375, -1.970458984375, -1.89410400390625, -1.8177490234375, -1.74139404296875, -1.6650390625, -1.58868408203125, -1.5123291015625, -1.43597412109375, -1.359619140625, -1.28326416015625, -1.2069091796875, -1.13055419921875, -1.05419921875, -0.97784423828125, -0.9014892578125, -0.82513427734375, -0.748779296875, -0.67242431640625, -0.5960693359375, -0.51971435546875, -0.443359375, -0.36700439453125, -0.2906494140625, -0.21429443359375, -0.137939453125, -0.06158447265625, 0.0147705078125, 0.09112548828125, 0.16748046875, 0.24383544921875, 0.3201904296875, 0.39654541015625, 0.472900390625, 0.54925537109375, 0.6256103515625, 0.70196533203125, 0.7783203125, 0.85467529296875, 0.9310302734375, 1.00738525390625, 1.083740234375, 1.16009521484375, 1.2364501953125, 1.31280517578125, 1.38916015625, 1.46551513671875, 1.5418701171875, 1.61822509765625, 1.694580078125, 1.77093505859375, 1.8472900390625, 1.92364501953125, 2.0]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 7.0, 2.0, 9.0, 8.0, 15.0, 25.0, 27.0, 57.0, 102.0, 157.0, 399.0, 892.0, 2477.0, 8181.0, 32605.0, 172537.0, 682252.0, 115642.0, 23456.0, 6344.0, 1901.0, 778.0, 302.0, 167.0, 85.0, 46.0, 25.0, 20.0, 12.0, 4.0, 11.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6943359375, -0.6757659912109375, -0.657196044921875, -0.6386260986328125, -0.62005615234375, -0.6014862060546875, -0.582916259765625, -0.5643463134765625, -0.5457763671875, -0.5272064208984375, -0.508636474609375, -0.4900665283203125, -0.47149658203125, -0.4529266357421875, -0.434356689453125, -0.4157867431640625, -0.397216796875, -0.3786468505859375, -0.360076904296875, -0.3415069580078125, -0.32293701171875, -0.3043670654296875, -0.285797119140625, -0.2672271728515625, -0.2486572265625, -0.2300872802734375, -0.211517333984375, -0.1929473876953125, -0.17437744140625, -0.1558074951171875, -0.137237548828125, -0.1186676025390625, -0.10009765625, -0.0815277099609375, -0.062957763671875, -0.0443878173828125, -0.02581787109375, -0.0072479248046875, 0.011322021484375, 0.0298919677734375, 0.0484619140625, 0.0670318603515625, 0.085601806640625, 0.1041717529296875, 0.12274169921875, 0.1413116455078125, 0.159881591796875, 0.1784515380859375, 0.197021484375, 0.2155914306640625, 0.234161376953125, 0.2527313232421875, 0.27130126953125, 0.2898712158203125, 0.308441162109375, 0.3270111083984375, 0.3455810546875, 0.3641510009765625, 0.382720947265625, 0.4012908935546875, 0.41986083984375, 0.4384307861328125, 0.457000732421875, 0.4755706787109375, 0.494140625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 4.0, 4.0, 4.0, 4.0, 9.0, 13.0, 8.0, 5.0, 20.0, 20.0, 22.0, 36.0, 46.0, 63.0, 90.0, 105.0, 87.0, 93.0, 72.0, 61.0, 39.0, 41.0, 28.0, 25.0, 20.0, 13.0, 5.0, 10.0, 8.0, 8.0, 4.0, 8.0, 8.0, 0.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.0001709461212158203, -0.00016579777002334595, -0.00016064941883087158, -0.00015550106763839722, -0.00015035271644592285, -0.00014520436525344849, -0.00014005601406097412, -0.00013490766286849976, -0.0001297593116760254, -0.00012461096048355103, -0.00011946260929107666, -0.0001143142580986023, -0.00010916590690612793, -0.00010401755571365356, -9.88692045211792e-05, -9.372085332870483e-05, -8.857250213623047e-05, -8.34241509437561e-05, -7.827579975128174e-05, -7.312744855880737e-05, -6.797909736633301e-05, -6.283074617385864e-05, -5.768239498138428e-05, -5.253404378890991e-05, -4.738569259643555e-05, -4.223734140396118e-05, -3.7088990211486816e-05, -3.194063901901245e-05, -2.6792287826538086e-05, -2.164393663406372e-05, -1.6495585441589355e-05, -1.134723424911499e-05, -6.198883056640625e-06, -1.0505318641662598e-06, 4.0978193283081055e-06, 9.24617052078247e-06, 1.4394521713256836e-05, 1.95428729057312e-05, 2.4691224098205566e-05, 2.983957529067993e-05, 3.49879264831543e-05, 4.013627767562866e-05, 4.528462886810303e-05, 5.043298006057739e-05, 5.558133125305176e-05, 6.072968244552612e-05, 6.587803363800049e-05, 7.102638483047485e-05, 7.617473602294922e-05, 8.132308721542358e-05, 8.647143840789795e-05, 9.161978960037231e-05, 9.676814079284668e-05, 0.00010191649198532104, 0.00010706484317779541, 0.00011221319437026978, 0.00011736154556274414, 0.0001225098967552185, 0.00012765824794769287, 0.00013280659914016724, 0.0001379549503326416, 0.00014310330152511597, 0.00014825165271759033, 0.0001534000039100647, 0.00015854835510253906]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 7.0, 9.0, 7.0, 25.0, 39.0, 72.0, 121.0, 399.0, 1332.0, 7417.0, 68262.0, 780280.0, 172290.0, 15141.0, 2233.0, 537.0, 205.0, 74.0, 51.0, 24.0, 18.0, 10.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.1083984375, -1.0818023681640625, -1.055206298828125, -1.0286102294921875, -1.00201416015625, -0.9754180908203125, -0.948822021484375, -0.9222259521484375, -0.8956298828125, -0.8690338134765625, -0.842437744140625, -0.8158416748046875, -0.78924560546875, -0.7626495361328125, -0.736053466796875, -0.7094573974609375, -0.682861328125, -0.6562652587890625, -0.629669189453125, -0.6030731201171875, -0.57647705078125, -0.5498809814453125, -0.523284912109375, -0.4966888427734375, -0.4700927734375, -0.4434967041015625, -0.416900634765625, -0.3903045654296875, -0.36370849609375, -0.3371124267578125, -0.310516357421875, -0.2839202880859375, -0.25732421875, -0.2307281494140625, -0.204132080078125, -0.1775360107421875, -0.15093994140625, -0.1243438720703125, -0.097747802734375, -0.0711517333984375, -0.0445556640625, -0.0179595947265625, 0.008636474609375, 0.0352325439453125, 0.06182861328125, 0.0884246826171875, 0.115020751953125, 0.1416168212890625, 0.168212890625, 0.1948089599609375, 0.221405029296875, 0.2480010986328125, 0.27459716796875, 0.3011932373046875, 0.327789306640625, 0.3543853759765625, 0.3809814453125, 0.4075775146484375, 0.434173583984375, 0.4607696533203125, 0.48736572265625, 0.5139617919921875, 0.540557861328125, 0.5671539306640625, 0.59375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 9.0, 5.0, 7.0, 21.0, 28.0, 51.0, 72.0, 82.0, 145.0, 128.0, 112.0, 116.0, 77.0, 51.0, 41.0, 25.0, 16.0, 7.0, 7.0, 4.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.2216796875, -1.1960372924804688, -1.1703948974609375, -1.1447525024414062, -1.119110107421875, -1.0934677124023438, -1.0678253173828125, -1.0421829223632812, -1.01654052734375, -0.9908981323242188, -0.9652557373046875, -0.9396133422851562, -0.913970947265625, -0.8883285522460938, -0.8626861572265625, -0.8370437622070312, -0.8114013671875, -0.7857589721679688, -0.7601165771484375, -0.7344741821289062, -0.708831787109375, -0.6831893920898438, -0.6575469970703125, -0.6319046020507812, -0.60626220703125, -0.5806198120117188, -0.5549774169921875, -0.5293350219726562, -0.503692626953125, -0.47805023193359375, -0.4524078369140625, -0.42676544189453125, -0.401123046875, -0.37548065185546875, -0.3498382568359375, -0.32419586181640625, -0.298553466796875, -0.27291107177734375, -0.2472686767578125, -0.22162628173828125, -0.19598388671875, -0.17034149169921875, -0.1446990966796875, -0.11905670166015625, -0.093414306640625, -0.06777191162109375, -0.0421295166015625, -0.01648712158203125, 0.0091552734375, 0.03479766845703125, 0.0604400634765625, 0.08608245849609375, 0.111724853515625, 0.13736724853515625, 0.1630096435546875, 0.18865203857421875, 0.21429443359375, 0.23993682861328125, 0.2655792236328125, 0.29122161865234375, 0.316864013671875, 0.34250640869140625, 0.3681488037109375, 0.39379119873046875, 0.41943359375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 7.0, 4.0, 6.0, 20.0, 23.0, 71.0, 138.0, 241.0, 277.0, 117.0, 56.0, 29.0, 9.0, 9.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.208133697509766, -26.675291061401367, -26.14244842529297, -25.60960578918457, -25.076763153076172, -24.54391860961914, -24.011077880859375, -23.478233337402344, -22.945390701293945, -22.412548065185547, -21.87970542907715, -21.34686279296875, -20.81402015686035, -20.281177520751953, -19.748332977294922, -19.215490341186523, -18.682647705078125, -18.149805068969727, -17.616962432861328, -17.08411979675293, -16.55127716064453, -16.0184326171875, -15.485590934753418, -14.95274829864502, -14.419906616210938, -13.887063980102539, -13.35422134399414, -12.821378707885742, -12.288535118103027, -11.755692481994629, -11.22284984588623, -10.690007209777832, -10.157164573669434, -9.624321937561035, -9.091479301452637, -8.558635711669922, -8.025793075561523, -7.492950439453125, -6.960107803344727, -6.427265167236328, -5.8944220542907715, -5.361579418182373, -4.828736305236816, -4.295893669128418, -3.7630507946014404, -3.230207920074463, -2.6973652839660645, -2.164522409439087, -1.6316795349121094, -1.0988366603851318, -0.5659939050674438, -0.03315114974975586, 0.4996917247772217, 1.0325345993041992, 1.5653772354125977, 2.098220109939575, 2.6310629844665527, 3.1639058589935303, 3.696748733520508, 4.229591369628906, 4.762434005737305, 5.295277118682861, 5.82811975479126, 6.360962867736816, 6.893805503845215]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 4.0, 4.0, 3.0, 8.0, 9.0, 9.0, 14.0, 16.0, 14.0, 15.0, 20.0, 17.0, 25.0, 37.0, 30.0, 38.0, 33.0, 41.0, 50.0, 59.0, 84.0, 78.0, 60.0, 39.0, 33.0, 30.0, 43.0, 28.0, 25.0, 26.0, 17.0, 17.0, 11.0, 8.0, 10.0, 8.0, 10.0, 7.0, 3.0, 7.0, 8.0, 4.0, 4.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.202334880828857, -6.960450172424316, -6.718564987182617, -6.476679801940918, -6.234795093536377, -5.992910385131836, -5.751025199890137, -5.5091400146484375, -5.2672553062438965, -5.0253705978393555, -4.783485412597656, -4.541600227355957, -4.299715518951416, -4.057830810546875, -3.815945625305176, -3.5740606784820557, -3.3321757316589355, -3.0902907848358154, -2.8484058380126953, -2.606520891189575, -2.364635944366455, -2.122750997543335, -1.8808660507202148, -1.6389811038970947, -1.3970961570739746, -1.1552112102508545, -0.9133262634277344, -0.6714413166046143, -0.42955636978149414, -0.18767142295837402, 0.054213523864746094, 0.2960984706878662, 0.5379829406738281, 0.7798678874969482, 1.0217528343200684, 1.2636377811431885, 1.5055227279663086, 1.7474076747894287, 1.9892926216125488, 2.231177568435669, 2.473062515258789, 2.714947462081909, 2.9568324089050293, 3.1987173557281494, 3.4406023025512695, 3.6824872493743896, 3.9243721961975098, 4.166256904602051, 4.40814208984375, 4.650027275085449, 4.89191198348999, 5.133796691894531, 5.3756818771362305, 5.61756706237793, 5.859451770782471, 6.101336479187012, 6.343221664428711, 6.58510684967041, 6.826991558074951, 7.068876266479492, 7.310761451721191, 7.552646636962891, 7.794531345367432, 8.036416053771973, 8.278301239013672]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 6.0, 9.0, 11.0, 8.0, 21.0, 21.0, 19.0, 31.0, 37.0, 55.0, 74.0, 134.0, 167.0, 252.0, 387.0, 657.0, 1172.0, 2405.0, 7155.0, 34762.0, 306157.0, 2744876.0, 989648.0, 84770.0, 13414.0, 4044.0, 1642.0, 827.0, 494.0, 321.0, 201.0, 147.0, 98.0, 50.0, 45.0, 32.0, 19.0, 23.0, 17.0, 15.0, 13.0, 13.0, 8.0, 5.0, 5.0, 2.0, 1.0, 4.0, 2.0, 2.0, 3.0], "bins": [-0.89892578125, -0.8730392456054688, -0.8471527099609375, -0.8212661743164062, -0.795379638671875, -0.7694931030273438, -0.7436065673828125, -0.7177200317382812, -0.69183349609375, -0.6659469604492188, -0.6400604248046875, -0.6141738891601562, -0.588287353515625, -0.5624008178710938, -0.5365142822265625, -0.5106277465820312, -0.4847412109375, -0.45885467529296875, -0.4329681396484375, -0.40708160400390625, -0.381195068359375, -0.35530853271484375, -0.3294219970703125, -0.30353546142578125, -0.27764892578125, -0.25176239013671875, -0.2258758544921875, -0.19998931884765625, -0.174102783203125, -0.14821624755859375, -0.1223297119140625, -0.09644317626953125, -0.070556640625, -0.04467010498046875, -0.0187835693359375, 0.00710296630859375, 0.032989501953125, 0.05887603759765625, 0.0847625732421875, 0.11064910888671875, 0.13653564453125, 0.16242218017578125, 0.1883087158203125, 0.21419525146484375, 0.240081787109375, 0.26596832275390625, 0.2918548583984375, 0.31774139404296875, 0.3436279296875, 0.36951446533203125, 0.3954010009765625, 0.42128753662109375, 0.447174072265625, 0.47306060791015625, 0.4989471435546875, 0.5248336791992188, 0.55072021484375, 0.5766067504882812, 0.6024932861328125, 0.6283798217773438, 0.654266357421875, 0.6801528930664062, 0.7060394287109375, 0.7319259643554688, 0.7578125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 12.0, 6.0, 17.0, 11.0, 16.0, 33.0, 30.0, 50.0, 46.0, 62.0, 66.0, 74.0, 86.0, 81.0, 61.0, 72.0, 61.0, 52.0, 43.0, 28.0, 31.0, 18.0, 19.0, 10.0, 3.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.93994140625, -0.914459228515625, -0.88897705078125, -0.863494873046875, -0.8380126953125, -0.812530517578125, -0.78704833984375, -0.761566162109375, -0.736083984375, -0.710601806640625, -0.68511962890625, -0.659637451171875, -0.6341552734375, -0.608673095703125, -0.58319091796875, -0.557708740234375, -0.5322265625, -0.506744384765625, -0.48126220703125, -0.455780029296875, -0.4302978515625, -0.404815673828125, -0.37933349609375, -0.353851318359375, -0.328369140625, -0.302886962890625, -0.27740478515625, -0.251922607421875, -0.2264404296875, -0.200958251953125, -0.17547607421875, -0.149993896484375, -0.12451171875, -0.099029541015625, -0.07354736328125, -0.048065185546875, -0.0225830078125, 0.002899169921875, 0.02838134765625, 0.053863525390625, 0.079345703125, 0.104827880859375, 0.13031005859375, 0.155792236328125, 0.1812744140625, 0.206756591796875, 0.23223876953125, 0.257720947265625, 0.283203125, 0.308685302734375, 0.33416748046875, 0.359649658203125, 0.3851318359375, 0.410614013671875, 0.43609619140625, 0.461578369140625, 0.487060546875, 0.512542724609375, 0.53802490234375, 0.563507080078125, 0.5889892578125, 0.614471435546875, 0.63995361328125, 0.665435791015625, 0.69091796875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 7.0, 14.0, 26.0, 37.0, 71.0, 162.0, 335.0, 712.0, 2044.0, 11246.0, 812771.0, 3342145.0, 20659.0, 2597.0, 807.0, 306.0, 151.0, 100.0, 54.0, 13.0, 11.0, 5.0, 3.0, 1.0, 4.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.443359375, -2.367279052734375, -2.29119873046875, -2.215118408203125, -2.1390380859375, -2.062957763671875, -1.98687744140625, -1.910797119140625, -1.834716796875, -1.758636474609375, -1.68255615234375, -1.606475830078125, -1.5303955078125, -1.454315185546875, -1.37823486328125, -1.302154541015625, -1.22607421875, -1.149993896484375, -1.07391357421875, -0.997833251953125, -0.9217529296875, -0.845672607421875, -0.76959228515625, -0.693511962890625, -0.617431640625, -0.541351318359375, -0.46527099609375, -0.389190673828125, -0.3131103515625, -0.237030029296875, -0.16094970703125, -0.084869384765625, -0.0087890625, 0.067291259765625, 0.14337158203125, 0.219451904296875, 0.2955322265625, 0.371612548828125, 0.44769287109375, 0.523773193359375, 0.599853515625, 0.675933837890625, 0.75201416015625, 0.828094482421875, 0.9041748046875, 0.980255126953125, 1.05633544921875, 1.132415771484375, 1.20849609375, 1.284576416015625, 1.36065673828125, 1.436737060546875, 1.5128173828125, 1.588897705078125, 1.66497802734375, 1.741058349609375, 1.817138671875, 1.893218994140625, 1.96929931640625, 2.045379638671875, 2.1214599609375, 2.197540283203125, 2.27362060546875, 2.349700927734375, 2.42578125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 5.0, 6.0, 10.0, 11.0, 16.0, 24.0, 30.0, 59.0, 107.0, 219.0, 444.0, 734.0, 932.0, 664.0, 366.0, 169.0, 111.0, 63.0, 41.0, 19.0, 16.0, 8.0, 7.0, 8.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5146484375, -1.470611572265625, -1.42657470703125, -1.382537841796875, -1.3385009765625, -1.294464111328125, -1.25042724609375, -1.206390380859375, -1.162353515625, -1.118316650390625, -1.07427978515625, -1.030242919921875, -0.9862060546875, -0.942169189453125, -0.89813232421875, -0.854095458984375, -0.81005859375, -0.766021728515625, -0.72198486328125, -0.677947998046875, -0.6339111328125, -0.589874267578125, -0.54583740234375, -0.501800537109375, -0.457763671875, -0.413726806640625, -0.36968994140625, -0.325653076171875, -0.2816162109375, -0.237579345703125, -0.19354248046875, -0.149505615234375, -0.10546875, -0.061431884765625, -0.01739501953125, 0.026641845703125, 0.0706787109375, 0.114715576171875, 0.15875244140625, 0.202789306640625, 0.246826171875, 0.290863037109375, 0.33489990234375, 0.378936767578125, 0.4229736328125, 0.467010498046875, 0.51104736328125, 0.555084228515625, 0.59912109375, 0.643157958984375, 0.68719482421875, 0.731231689453125, 0.7752685546875, 0.819305419921875, 0.86334228515625, 0.907379150390625, 0.951416015625, 0.995452880859375, 1.03948974609375, 1.083526611328125, 1.1275634765625, 1.171600341796875, 1.21563720703125, 1.259674072265625, 1.3037109375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 7.0, 10.0, 35.0, 53.0, 88.0, 148.0, 160.0, 163.0, 114.0, 92.0, 48.0, 32.0, 15.0, 13.0, 9.0, 5.0, 5.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.978214263916016, -5.6743268966674805, -5.370439529418945, -5.06655216217041, -4.762664794921875, -4.45877742767334, -4.154890537261963, -3.8510031700134277, -3.5471158027648926, -3.2432284355163574, -2.9393410682678223, -2.635453939437866, -2.331566572189331, -2.027679204940796, -1.7237919569015503, -1.4199047088623047, -1.1160173416137695, -0.8121300339698792, -0.5082427263259888, -0.2043554186820984, 0.09953188896179199, 0.40341925621032715, 0.7073065042495728, 1.0111937522888184, 1.3150811195373535, 1.6189684867858887, 1.9228557348251343, 2.22674298286438, 2.530630350112915, 2.83451771736145, 3.1384048461914062, 3.4422922134399414, 3.7461795806884766, 4.050066947937012, 4.353954315185547, 4.657841682434082, 4.961729049682617, 5.265616416931152, 5.569503307342529, 5.8733906745910645, 6.1772780418396, 6.481165409088135, 6.78505277633667, 7.088940143585205, 7.392827033996582, 7.696714401245117, 8.000601768493652, 8.304489135742188, 8.608376502990723, 8.912263870239258, 9.216151237487793, 9.520038604736328, 9.823925971984863, 10.127813339233398, 10.431700706481934, 10.735588073730469, 11.039474487304688, 11.343361854553223, 11.647249221801758, 11.951136589050293, 12.255023956298828, 12.558911323547363, 12.862798690795898, 13.166685104370117, 13.470573425292969]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 4.0, 3.0, 7.0, 5.0, 14.0, 12.0, 13.0, 20.0, 18.0, 22.0, 19.0, 39.0, 31.0, 31.0, 41.0, 35.0, 50.0, 48.0, 41.0, 61.0, 40.0, 45.0, 56.0, 37.0, 28.0, 42.0, 41.0, 21.0, 23.0, 27.0, 22.0, 18.0, 22.0, 10.0, 14.0, 9.0, 9.0, 8.0, 3.0, 3.0, 1.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.281271457672119, -4.141806602478027, -4.002341270446777, -3.8628764152526855, -3.7234115600585938, -3.583946704864502, -3.444481611251831, -3.30501651763916, -3.1655516624450684, -3.0260868072509766, -2.8866217136383057, -2.7471566200256348, -2.607691764831543, -2.468226909637451, -2.3287618160247803, -2.1892967224121094, -2.0498318672180176, -1.9103668928146362, -1.7709019184112549, -1.6314369440078735, -1.4919719696044922, -1.3525069952011108, -1.2130420207977295, -1.0735770463943481, -0.9341120719909668, -0.7946470975875854, -0.6551821231842041, -0.5157171487808228, -0.3762521743774414, -0.23678719997406006, -0.09732222557067871, 0.04214274883270264, 0.1816082000732422, 0.32107317447662354, 0.4605381488800049, 0.6000031232833862, 0.7394680976867676, 0.8789330720901489, 1.0183980464935303, 1.1578630208969116, 1.297327995300293, 1.4367929697036743, 1.5762579441070557, 1.715722918510437, 1.8551878929138184, 1.9946528673171997, 2.134117841720581, 2.273582935333252, 2.4130477905273438, 2.5525126457214355, 2.6919777393341064, 2.8314428329467773, 2.970907688140869, 3.110372543334961, 3.249837636947632, 3.3893027305603027, 3.5287675857543945, 3.6682324409484863, 3.8076975345611572, 3.947162628173828, 4.08662748336792, 4.226092338562012, 4.365557670593262, 4.5050225257873535, 4.644487380981445]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 9.0, 4.0, 14.0, 15.0, 20.0, 27.0, 38.0, 44.0, 68.0, 94.0, 123.0, 176.0, 286.0, 537.0, 876.0, 1542.0, 2897.0, 5504.0, 11310.0, 24102.0, 53421.0, 120178.0, 247896.0, 287459.0, 159706.0, 70853.0, 31478.0, 14529.0, 7050.0, 3534.0, 1943.0, 1064.0, 611.0, 385.0, 248.0, 149.0, 109.0, 75.0, 62.0, 40.0, 11.0, 22.0, 15.0, 9.0, 8.0, 8.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 4.0], "bins": [-0.72412109375, -0.7022933959960938, -0.6804656982421875, -0.6586380004882812, -0.636810302734375, -0.6149826049804688, -0.5931549072265625, -0.5713272094726562, -0.54949951171875, -0.5276718139648438, -0.5058441162109375, -0.48401641845703125, -0.462188720703125, -0.44036102294921875, -0.4185333251953125, -0.39670562744140625, -0.3748779296875, -0.35305023193359375, -0.3312225341796875, -0.30939483642578125, -0.287567138671875, -0.26573944091796875, -0.2439117431640625, -0.22208404541015625, -0.20025634765625, -0.17842864990234375, -0.1566009521484375, -0.13477325439453125, -0.112945556640625, -0.09111785888671875, -0.0692901611328125, -0.04746246337890625, -0.025634765625, -0.00380706787109375, 0.0180206298828125, 0.03984832763671875, 0.061676025390625, 0.08350372314453125, 0.1053314208984375, 0.12715911865234375, 0.14898681640625, 0.17081451416015625, 0.1926422119140625, 0.21446990966796875, 0.236297607421875, 0.25812530517578125, 0.2799530029296875, 0.30178070068359375, 0.3236083984375, 0.34543609619140625, 0.3672637939453125, 0.38909149169921875, 0.410919189453125, 0.43274688720703125, 0.4545745849609375, 0.47640228271484375, 0.49822998046875, 0.5200576782226562, 0.5418853759765625, 0.5637130737304688, 0.585540771484375, 0.6073684692382812, 0.6291961669921875, 0.6510238647460938, 0.6728515625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 3.0, 3.0, 8.0, 5.0, 8.0, 12.0, 11.0, 25.0, 26.0, 36.0, 31.0, 48.0, 70.0, 57.0, 79.0, 85.0, 56.0, 71.0, 72.0, 63.0, 49.0, 59.0, 32.0, 33.0, 16.0, 13.0, 9.0, 12.0, 6.0, 5.0, 4.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.95556640625, -0.9297943115234375, -0.904022216796875, -0.8782501220703125, -0.85247802734375, -0.8267059326171875, -0.800933837890625, -0.7751617431640625, -0.7493896484375, -0.7236175537109375, -0.697845458984375, -0.6720733642578125, -0.64630126953125, -0.6205291748046875, -0.594757080078125, -0.5689849853515625, -0.543212890625, -0.5174407958984375, -0.491668701171875, -0.4658966064453125, -0.44012451171875, -0.4143524169921875, -0.388580322265625, -0.3628082275390625, -0.3370361328125, -0.3112640380859375, -0.285491943359375, -0.2597198486328125, -0.23394775390625, -0.2081756591796875, -0.182403564453125, -0.1566314697265625, -0.130859375, -0.1050872802734375, -0.079315185546875, -0.0535430908203125, -0.02777099609375, -0.0019989013671875, 0.023773193359375, 0.0495452880859375, 0.0753173828125, 0.1010894775390625, 0.126861572265625, 0.1526336669921875, 0.17840576171875, 0.2041778564453125, 0.229949951171875, 0.2557220458984375, 0.281494140625, 0.3072662353515625, 0.333038330078125, 0.3588104248046875, 0.38458251953125, 0.4103546142578125, 0.436126708984375, 0.4618988037109375, 0.4876708984375, 0.5134429931640625, 0.539215087890625, 0.5649871826171875, 0.59075927734375, 0.6165313720703125, 0.642303466796875, 0.6680755615234375, 0.69384765625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 6.0, 8.0, 3.0, 16.0, 19.0, 48.0, 60.0, 85.0, 162.0, 221.0, 421.0, 779.0, 1727.0, 5233.0, 24527.0, 169281.0, 720611.0, 102326.0, 16216.0, 3839.0, 1332.0, 639.0, 388.0, 217.0, 132.0, 89.0, 52.0, 30.0, 21.0, 21.0, 10.0, 7.0, 10.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.572265625, -1.5205078125, -1.46875, -1.4169921875, -1.365234375, -1.3134765625, -1.26171875, -1.2099609375, -1.158203125, -1.1064453125, -1.0546875, -1.0029296875, -0.951171875, -0.8994140625, -0.84765625, -0.7958984375, -0.744140625, -0.6923828125, -0.640625, -0.5888671875, -0.537109375, -0.4853515625, -0.43359375, -0.3818359375, -0.330078125, -0.2783203125, -0.2265625, -0.1748046875, -0.123046875, -0.0712890625, -0.01953125, 0.0322265625, 0.083984375, 0.1357421875, 0.1875, 0.2392578125, 0.291015625, 0.3427734375, 0.39453125, 0.4462890625, 0.498046875, 0.5498046875, 0.6015625, 0.6533203125, 0.705078125, 0.7568359375, 0.80859375, 0.8603515625, 0.912109375, 0.9638671875, 1.015625, 1.0673828125, 1.119140625, 1.1708984375, 1.22265625, 1.2744140625, 1.326171875, 1.3779296875, 1.4296875, 1.4814453125, 1.533203125, 1.5849609375, 1.63671875, 1.6884765625, 1.740234375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 6.0, 14.0, 17.0, 17.0, 24.0, 33.0, 42.0, 42.0, 66.0, 71.0, 67.0, 66.0, 77.0, 72.0, 73.0, 67.0, 53.0, 48.0, 26.0, 27.0, 29.0, 22.0, 10.0, 12.0, 9.0, 3.0, 6.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.314453125, -2.21923828125, -2.1240234375, -2.02880859375, -1.93359375, -1.83837890625, -1.7431640625, -1.64794921875, -1.552734375, -1.45751953125, -1.3623046875, -1.26708984375, -1.171875, -1.07666015625, -0.9814453125, -0.88623046875, -0.791015625, -0.69580078125, -0.6005859375, -0.50537109375, -0.41015625, -0.31494140625, -0.2197265625, -0.12451171875, -0.029296875, 0.06591796875, 0.1611328125, 0.25634765625, 0.3515625, 0.44677734375, 0.5419921875, 0.63720703125, 0.732421875, 0.82763671875, 0.9228515625, 1.01806640625, 1.11328125, 1.20849609375, 1.3037109375, 1.39892578125, 1.494140625, 1.58935546875, 1.6845703125, 1.77978515625, 1.875, 1.97021484375, 2.0654296875, 2.16064453125, 2.255859375, 2.35107421875, 2.4462890625, 2.54150390625, 2.63671875, 2.73193359375, 2.8271484375, 2.92236328125, 3.017578125, 3.11279296875, 3.2080078125, 3.30322265625, 3.3984375, 3.49365234375, 3.5888671875, 3.68408203125, 3.779296875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 8.0, 11.0, 13.0, 8.0, 12.0, 23.0, 26.0, 49.0, 53.0, 92.0, 127.0, 233.0, 376.0, 592.0, 1124.0, 2331.0, 5333.0, 13626.0, 39447.0, 131230.0, 606508.0, 169447.0, 48942.0, 16620.0, 6423.0, 2784.0, 1369.0, 645.0, 414.0, 220.0, 151.0, 96.0, 63.0, 43.0, 29.0, 21.0, 15.0, 20.0, 8.0, 7.0, 5.0, 5.0, 6.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.319091796875, -0.30866241455078125, -0.2982330322265625, -0.28780364990234375, -0.277374267578125, -0.26694488525390625, -0.2565155029296875, -0.24608612060546875, -0.23565673828125, -0.22522735595703125, -0.2147979736328125, -0.20436859130859375, -0.193939208984375, -0.18350982666015625, -0.1730804443359375, -0.16265106201171875, -0.1522216796875, -0.14179229736328125, -0.1313629150390625, -0.12093353271484375, -0.110504150390625, -0.10007476806640625, -0.0896453857421875, -0.07921600341796875, -0.06878662109375, -0.05835723876953125, -0.0479278564453125, -0.03749847412109375, -0.027069091796875, -0.01663970947265625, -0.0062103271484375, 0.00421905517578125, 0.0146484375, 0.02507781982421875, 0.0355072021484375, 0.04593658447265625, 0.056365966796875, 0.06679534912109375, 0.0772247314453125, 0.08765411376953125, 0.09808349609375, 0.10851287841796875, 0.1189422607421875, 0.12937164306640625, 0.139801025390625, 0.15023040771484375, 0.1606597900390625, 0.17108917236328125, 0.1815185546875, 0.19194793701171875, 0.2023773193359375, 0.21280670166015625, 0.223236083984375, 0.23366546630859375, 0.2440948486328125, 0.25452423095703125, 0.26495361328125, 0.27538299560546875, 0.2858123779296875, 0.29624176025390625, 0.306671142578125, 0.31710052490234375, 0.3275299072265625, 0.33795928955078125, 0.348388671875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 6.0, 5.0, 4.0, 6.0, 6.0, 15.0, 14.0, 19.0, 38.0, 28.0, 49.0, 56.0, 87.0, 109.0, 128.0, 116.0, 71.0, 47.0, 50.0, 26.0, 33.0, 23.0, 11.0, 19.0, 9.0, 9.0, 6.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.00016832351684570312, -0.00016340985894203186, -0.0001584962010383606, -0.00015358254313468933, -0.00014866888523101807, -0.0001437552273273468, -0.00013884156942367554, -0.00013392791152000427, -0.000129014253616333, -0.00012410059571266174, -0.00011918693780899048, -0.00011427327990531921, -0.00010935962200164795, -0.00010444596409797668, -9.953230619430542e-05, -9.461864829063416e-05, -8.970499038696289e-05, -8.479133248329163e-05, -7.987767457962036e-05, -7.49640166759491e-05, -7.005035877227783e-05, -6.513670086860657e-05, -6.02230429649353e-05, -5.530938506126404e-05, -5.0395727157592773e-05, -4.548206925392151e-05, -4.0568411350250244e-05, -3.565475344657898e-05, -3.0741095542907715e-05, -2.582743763923645e-05, -2.0913779735565186e-05, -1.600012183189392e-05, -1.1086463928222656e-05, -6.172806024551392e-06, -1.259148120880127e-06, 3.6545097827911377e-06, 8.568167686462402e-06, 1.3481825590133667e-05, 1.839548349380493e-05, 2.3309141397476196e-05, 2.822279930114746e-05, 3.3136457204818726e-05, 3.805011510848999e-05, 4.2963773012161255e-05, 4.787743091583252e-05, 5.2791088819503784e-05, 5.770474672317505e-05, 6.261840462684631e-05, 6.753206253051758e-05, 7.244572043418884e-05, 7.735937833786011e-05, 8.227303624153137e-05, 8.718669414520264e-05, 9.21003520488739e-05, 9.701400995254517e-05, 0.00010192766785621643, 0.0001068413257598877, 0.00011175498366355896, 0.00011666864156723022, 0.00012158229947090149, 0.00012649595737457275, 0.00013140961527824402, 0.00013632327318191528, 0.00014123693108558655, 0.0001461505889892578]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 7.0, 6.0, 7.0, 13.0, 8.0, 34.0, 40.0, 83.0, 97.0, 225.0, 468.0, 964.0, 2544.0, 8834.0, 36810.0, 220415.0, 674906.0, 79503.0, 16410.0, 4376.0, 1519.0, 600.0, 287.0, 162.0, 91.0, 58.0, 35.0, 23.0, 10.0, 4.0, 6.0, 8.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.40283203125, -0.38747406005859375, -0.3721160888671875, -0.35675811767578125, -0.341400146484375, -0.32604217529296875, -0.3106842041015625, -0.29532623291015625, -0.27996826171875, -0.26461029052734375, -0.2492523193359375, -0.23389434814453125, -0.218536376953125, -0.20317840576171875, -0.1878204345703125, -0.17246246337890625, -0.1571044921875, -0.14174652099609375, -0.1263885498046875, -0.11103057861328125, -0.095672607421875, -0.08031463623046875, -0.0649566650390625, -0.04959869384765625, -0.03424072265625, -0.01888275146484375, -0.0035247802734375, 0.01183319091796875, 0.027191162109375, 0.04254913330078125, 0.0579071044921875, 0.07326507568359375, 0.088623046875, 0.10398101806640625, 0.1193389892578125, 0.13469696044921875, 0.150054931640625, 0.16541290283203125, 0.1807708740234375, 0.19612884521484375, 0.21148681640625, 0.22684478759765625, 0.2422027587890625, 0.25756072998046875, 0.272918701171875, 0.28827667236328125, 0.3036346435546875, 0.31899261474609375, 0.3343505859375, 0.34970855712890625, 0.3650665283203125, 0.38042449951171875, 0.395782470703125, 0.41114044189453125, 0.4264984130859375, 0.44185638427734375, 0.45721435546875, 0.47257232666015625, 0.4879302978515625, 0.5032882690429688, 0.518646240234375, 0.5340042114257812, 0.5493621826171875, 0.5647201538085938, 0.580078125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 6.0, 3.0, 8.0, 11.0, 15.0, 24.0, 31.0, 23.0, 45.0, 56.0, 96.0, 126.0, 118.0, 124.0, 88.0, 67.0, 52.0, 37.0, 21.0, 21.0, 9.0, 14.0, 2.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5546875, -0.5359420776367188, -0.5171966552734375, -0.49845123291015625, -0.479705810546875, -0.46096038818359375, -0.4422149658203125, -0.42346954345703125, -0.40472412109375, -0.38597869873046875, -0.3672332763671875, -0.34848785400390625, -0.329742431640625, -0.31099700927734375, -0.2922515869140625, -0.27350616455078125, -0.2547607421875, -0.23601531982421875, -0.2172698974609375, -0.19852447509765625, -0.179779052734375, -0.16103363037109375, -0.1422882080078125, -0.12354278564453125, -0.10479736328125, -0.08605194091796875, -0.0673065185546875, -0.04856109619140625, -0.029815673828125, -0.01107025146484375, 0.0076751708984375, 0.02642059326171875, 0.045166015625, 0.06391143798828125, 0.0826568603515625, 0.10140228271484375, 0.120147705078125, 0.13889312744140625, 0.1576385498046875, 0.17638397216796875, 0.19512939453125, 0.21387481689453125, 0.2326202392578125, 0.25136566162109375, 0.270111083984375, 0.28885650634765625, 0.3076019287109375, 0.32634735107421875, 0.3450927734375, 0.36383819580078125, 0.3825836181640625, 0.40132904052734375, 0.420074462890625, 0.43881988525390625, 0.4575653076171875, 0.47631072998046875, 0.49505615234375, 0.5138015747070312, 0.5325469970703125, 0.5512924194335938, 0.570037841796875, 0.5887832641601562, 0.6075286865234375, 0.6262741088867188, 0.64501953125]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 4.0, 6.0, 11.0, 17.0, 29.0, 89.0, 156.0, 374.0, 174.0, 85.0, 35.0, 16.0, 5.0, 2.0, 0.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.33283519744873, -14.846481323242188, -14.360127449035645, -13.873773574829102, -13.387419700622559, -12.901065826416016, -12.414711952209473, -11.92835807800293, -11.442004203796387, -10.955650329589844, -10.4692964553833, -9.982942581176758, -9.496588706970215, -9.010234832763672, -8.523880958557129, -8.037527084350586, -7.551173210144043, -7.0648193359375, -6.578465461730957, -6.092111587524414, -5.605757713317871, -5.119403839111328, -4.633049964904785, -4.146696090698242, -3.660342216491699, -3.1739883422851562, -2.6876344680786133, -2.2012805938720703, -1.7149267196655273, -1.2285728454589844, -0.7422189712524414, -0.25586509704589844, 0.23048877716064453, 0.7168426513671875, 1.2031965255737305, 1.6895503997802734, 2.1759042739868164, 2.6622581481933594, 3.1486120223999023, 3.6349658966064453, 4.121319770812988, 4.607673645019531, 5.094027519226074, 5.580381393432617, 6.06673526763916, 6.553089141845703, 7.039443016052246, 7.525796890258789, 8.012150764465332, 8.498504638671875, 8.984858512878418, 9.471212387084961, 9.957566261291504, 10.443920135498047, 10.93027400970459, 11.416627883911133, 11.902981758117676, 12.389335632324219, 12.875689506530762, 13.362043380737305, 13.848397254943848, 14.33475112915039, 14.821105003356934, 15.307458877563477, 15.79381275177002]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 6.0, 6.0, 7.0, 8.0, 8.0, 13.0, 7.0, 15.0, 18.0, 24.0, 25.0, 27.0, 30.0, 39.0, 43.0, 40.0, 92.0, 138.0, 105.0, 55.0, 48.0, 57.0, 26.0, 31.0, 25.0, 16.0, 23.0, 11.0, 11.0, 10.0, 10.0, 9.0, 9.0, 5.0, 4.0, 2.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.881823539733887, -8.582170486450195, -8.282517433166504, -7.982863903045654, -7.683210849761963, -7.383557319641113, -7.083904266357422, -6.7842512130737305, -6.484598159790039, -6.184945106506348, -5.885291576385498, -5.585638523101807, -5.285985469818115, -4.986331939697266, -4.686678886413574, -4.387025833129883, -4.087372303009033, -3.7877190113067627, -3.4880659580230713, -3.188412666320801, -2.8887596130371094, -2.589106321334839, -2.2894530296325684, -1.989799976348877, -1.6901466846466064, -1.3904935121536255, -1.0908403396606445, -0.791187047958374, -0.49153387546539307, -0.1918807029724121, 0.1077725887298584, 0.4074256420135498, 0.7070789337158203, 1.0067321062088013, 1.3063852787017822, 1.6060385704040527, 1.9056917428970337, 2.2053449153900146, 2.504998207092285, 2.8046512603759766, 3.104304552078247, 3.4039578437805176, 3.703610897064209, 4.003264427185059, 4.30291748046875, 4.602570533752441, 4.902223587036133, 5.201876640319824, 5.501530170440674, 5.801183223724365, 6.100836753845215, 6.400489807128906, 6.700142860412598, 6.999795913696289, 7.299449443817139, 7.59910249710083, 7.89875602722168, 8.198409080505371, 8.498062133789062, 8.79771614074707, 9.097369194030762, 9.397022247314453, 9.696675300598145, 9.996328353881836, 10.295981407165527]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 1.0, 9.0, 2.0, 5.0, 5.0, 3.0, 4.0, 11.0, 16.0, 10.0, 14.0, 35.0, 30.0, 43.0, 52.0, 62.0, 98.0, 118.0, 128.0, 164.0, 204.0, 330.0, 463.0, 842.0, 2018.0, 9324.0, 92975.0, 2053423.0, 1934745.0, 85450.0, 9251.0, 1964.0, 752.0, 430.0, 291.0, 227.0, 169.0, 122.0, 103.0, 97.0, 72.0, 52.0, 33.0, 41.0, 23.0, 25.0, 15.0, 11.0, 8.0, 8.0, 8.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.2724609375, -1.2326812744140625, -1.192901611328125, -1.1531219482421875, -1.11334228515625, -1.0735626220703125, -1.033782958984375, -0.9940032958984375, -0.9542236328125, -0.9144439697265625, -0.874664306640625, -0.8348846435546875, -0.79510498046875, -0.7553253173828125, -0.715545654296875, -0.6757659912109375, -0.635986328125, -0.5962066650390625, -0.556427001953125, -0.5166473388671875, -0.47686767578125, -0.4370880126953125, -0.397308349609375, -0.3575286865234375, -0.3177490234375, -0.2779693603515625, -0.238189697265625, -0.1984100341796875, -0.15863037109375, -0.1188507080078125, -0.079071044921875, -0.0392913818359375, 0.00048828125, 0.0402679443359375, 0.080047607421875, 0.1198272705078125, 0.15960693359375, 0.1993865966796875, 0.239166259765625, 0.2789459228515625, 0.3187255859375, 0.3585052490234375, 0.398284912109375, 0.4380645751953125, 0.47784423828125, 0.5176239013671875, 0.557403564453125, 0.5971832275390625, 0.636962890625, 0.6767425537109375, 0.716522216796875, 0.7563018798828125, 0.79608154296875, 0.8358612060546875, 0.875640869140625, 0.9154205322265625, 0.9552001953125, 0.9949798583984375, 1.034759521484375, 1.0745391845703125, 1.11431884765625, 1.1540985107421875, 1.193878173828125, 1.2336578369140625, 1.2734375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 4.0, 0.0, 5.0, 7.0, 8.0, 13.0, 8.0, 21.0, 24.0, 30.0, 47.0, 58.0, 63.0, 51.0, 91.0, 79.0, 67.0, 74.0, 81.0, 48.0, 53.0, 48.0, 26.0, 37.0, 15.0, 15.0, 12.0, 7.0, 6.0, 1.0, 3.0, 4.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.94775390625, -0.922149658203125, -0.89654541015625, -0.870941162109375, -0.8453369140625, -0.819732666015625, -0.79412841796875, -0.768524169921875, -0.742919921875, -0.717315673828125, -0.69171142578125, -0.666107177734375, -0.6405029296875, -0.614898681640625, -0.58929443359375, -0.563690185546875, -0.5380859375, -0.512481689453125, -0.48687744140625, -0.461273193359375, -0.4356689453125, -0.410064697265625, -0.38446044921875, -0.358856201171875, -0.333251953125, -0.307647705078125, -0.28204345703125, -0.256439208984375, -0.2308349609375, -0.205230712890625, -0.17962646484375, -0.154022216796875, -0.12841796875, -0.102813720703125, -0.07720947265625, -0.051605224609375, -0.0260009765625, -0.000396728515625, 0.02520751953125, 0.050811767578125, 0.076416015625, 0.102020263671875, 0.12762451171875, 0.153228759765625, 0.1788330078125, 0.204437255859375, 0.23004150390625, 0.255645751953125, 0.28125, 0.306854248046875, 0.33245849609375, 0.358062744140625, 0.3836669921875, 0.409271240234375, 0.43487548828125, 0.460479736328125, 0.486083984375, 0.511688232421875, 0.53729248046875, 0.562896728515625, 0.5885009765625, 0.614105224609375, 0.63970947265625, 0.665313720703125, 0.69091796875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 13.0, 9.0, 13.0, 16.0, 33.0, 59.0, 94.0, 96.0, 239.0, 493.0, 1563.0, 9043.0, 278146.0, 3842428.0, 55996.0, 4290.0, 965.0, 336.0, 176.0, 92.0, 73.0, 44.0, 21.0, 14.0, 16.0, 5.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8779296875, -1.8037567138671875, -1.729583740234375, -1.6554107666015625, -1.58123779296875, -1.5070648193359375, -1.432891845703125, -1.3587188720703125, -1.2845458984375, -1.2103729248046875, -1.136199951171875, -1.0620269775390625, -0.98785400390625, -0.9136810302734375, -0.839508056640625, -0.7653350830078125, -0.691162109375, -0.6169891357421875, -0.542816162109375, -0.4686431884765625, -0.39447021484375, -0.3202972412109375, -0.246124267578125, -0.1719512939453125, -0.0977783203125, -0.0236053466796875, 0.050567626953125, 0.1247406005859375, 0.19891357421875, 0.2730865478515625, 0.347259521484375, 0.4214324951171875, 0.49560546875, 0.5697784423828125, 0.643951416015625, 0.7181243896484375, 0.79229736328125, 0.8664703369140625, 0.940643310546875, 1.0148162841796875, 1.0889892578125, 1.1631622314453125, 1.237335205078125, 1.3115081787109375, 1.38568115234375, 1.4598541259765625, 1.534027099609375, 1.6082000732421875, 1.682373046875, 1.7565460205078125, 1.830718994140625, 1.9048919677734375, 1.97906494140625, 2.0532379150390625, 2.127410888671875, 2.2015838623046875, 2.2757568359375, 2.3499298095703125, 2.424102783203125, 2.4982757568359375, 2.57244873046875, 2.6466217041015625, 2.720794677734375, 2.7949676513671875, 2.869140625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 10.0, 24.0, 32.0, 54.0, 123.0, 291.0, 688.0, 1196.0, 925.0, 431.0, 150.0, 79.0, 44.0, 12.0, 6.0, 4.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.29296875, -3.2158050537109375, -3.138641357421875, -3.0614776611328125, -2.98431396484375, -2.9071502685546875, -2.829986572265625, -2.7528228759765625, -2.6756591796875, -2.5984954833984375, -2.521331787109375, -2.4441680908203125, -2.36700439453125, -2.2898406982421875, -2.212677001953125, -2.1355133056640625, -2.058349609375, -1.9811859130859375, -1.904022216796875, -1.8268585205078125, -1.74969482421875, -1.6725311279296875, -1.595367431640625, -1.5182037353515625, -1.4410400390625, -1.3638763427734375, -1.286712646484375, -1.2095489501953125, -1.13238525390625, -1.0552215576171875, -0.978057861328125, -0.9008941650390625, -0.82373046875, -0.7465667724609375, -0.669403076171875, -0.5922393798828125, -0.51507568359375, -0.4379119873046875, -0.360748291015625, -0.2835845947265625, -0.2064208984375, -0.1292572021484375, -0.052093505859375, 0.0250701904296875, 0.10223388671875, 0.1793975830078125, 0.256561279296875, 0.3337249755859375, 0.410888671875, 0.4880523681640625, 0.565216064453125, 0.6423797607421875, 0.71954345703125, 0.7967071533203125, 0.873870849609375, 0.9510345458984375, 1.0281982421875, 1.1053619384765625, 1.182525634765625, 1.2596893310546875, 1.33685302734375, 1.4140167236328125, 1.491180419921875, 1.5683441162109375, 1.6455078125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 9.0, 32.0, 38.0, 88.0, 159.0, 223.0, 192.0, 115.0, 68.0, 35.0, 10.0, 12.0, 8.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.97688102722168, -17.535297393798828, -17.093713760375977, -16.652128219604492, -16.21054458618164, -15.768960952758789, -15.327377319335938, -14.88579273223877, -14.444209098815918, -14.002625465393066, -13.561040878295898, -13.119457244873047, -12.677872657775879, -12.236289024353027, -11.79470443725586, -11.353120803833008, -10.911537170410156, -10.469953536987305, -10.028368949890137, -9.586785316467285, -9.145200729370117, -8.703617095947266, -8.262033462524414, -7.820448875427246, -7.378864288330078, -6.937280178070068, -6.495696067810059, -6.054112434387207, -5.612528324127197, -5.1709442138671875, -4.729360103607178, -4.287775993347168, -3.8461923599243164, -3.4046082496643066, -2.963024377822876, -2.521440267562866, -2.0798563957214355, -1.6382722854614258, -1.196688175201416, -0.7551043033599854, -0.3135201930999756, 0.12806382775306702, 0.5696478486061096, 1.0112318992614746, 1.4528158903121948, 1.894399881362915, 2.335983991622925, 2.7775678634643555, 3.2191519737243652, 3.660736083984375, 4.102320194244385, 4.5439043045043945, 4.985487937927246, 5.427072048187256, 5.868656158447266, 6.310239791870117, 6.751824378967285, 7.193408489227295, 7.634992599487305, 8.076576232910156, 8.518160820007324, 8.959744453430176, 9.401329040527344, 9.842912673950195, 10.284496307373047]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 3.0, 6.0, 12.0, 12.0, 15.0, 18.0, 27.0, 23.0, 37.0, 47.0, 48.0, 54.0, 70.0, 102.0, 107.0, 71.0, 74.0, 56.0, 46.0, 41.0, 37.0, 30.0, 17.0, 22.0, 12.0, 13.0, 5.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.853775978088379, -4.56828498840332, -4.28279447555542, -3.9973034858703613, -3.711812734603882, -3.4263219833374023, -3.1408309936523438, -2.8553402423858643, -2.5698494911193848, -2.2843587398529053, -1.9988678693771362, -1.7133769989013672, -1.4278862476348877, -1.1423954963684082, -0.8569046258926392, -0.5714137554168701, -0.2859230041503906, -0.0004321932792663574, 0.2850586175918579, 0.5705494284629822, 0.8560402393341064, 1.141530990600586, 1.427021861076355, 1.712512731552124, 1.9980034828186035, 2.283494234085083, 2.5689849853515625, 2.854475975036621, 3.1399667263031006, 3.42545747756958, 3.7109484672546387, 3.996439218521118, 4.281930923461914, 4.567421913146973, 4.852912425994873, 5.138403415679932, 5.423893928527832, 5.709384918212891, 5.994875907897949, 6.280366897583008, 6.565857410430908, 6.851348400115967, 7.136838912963867, 7.422329902648926, 7.707820892333984, 7.993311405181885, 8.278801918029785, 8.564292907714844, 8.849783897399902, 9.135274887084961, 9.42076587677002, 9.706255912780762, 9.99174690246582, 10.277237892150879, 10.562728881835938, 10.848219871520996, 11.133710861206055, 11.419201850891113, 11.704692840576172, 11.990182876586914, 12.275673866271973, 12.561164855957031, 12.84665584564209, 13.132146835327148, 13.41763687133789]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 2.0, 8.0, 6.0, 13.0, 11.0, 16.0, 27.0, 46.0, 58.0, 74.0, 135.0, 192.0, 294.0, 485.0, 844.0, 1500.0, 2744.0, 4879.0, 9612.0, 19926.0, 44741.0, 110006.0, 273733.0, 327787.0, 144203.0, 56991.0, 24819.0, 11969.0, 5986.0, 3161.0, 1719.0, 968.0, 594.0, 344.0, 221.0, 126.0, 100.0, 69.0, 43.0, 34.0, 24.0, 13.0, 8.0, 9.0, 7.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.82470703125, -0.7982254028320312, -0.7717437744140625, -0.7452621459960938, -0.718780517578125, -0.6922988891601562, -0.6658172607421875, -0.6393356323242188, -0.61285400390625, -0.5863723754882812, -0.5598907470703125, -0.5334091186523438, -0.506927490234375, -0.48044586181640625, -0.4539642333984375, -0.42748260498046875, -0.4010009765625, -0.37451934814453125, -0.3480377197265625, -0.32155609130859375, -0.295074462890625, -0.26859283447265625, -0.2421112060546875, -0.21562957763671875, -0.18914794921875, -0.16266632080078125, -0.1361846923828125, -0.10970306396484375, -0.083221435546875, -0.05673980712890625, -0.0302581787109375, -0.00377655029296875, 0.022705078125, 0.04918670654296875, 0.0756683349609375, 0.10214996337890625, 0.128631591796875, 0.15511322021484375, 0.1815948486328125, 0.20807647705078125, 0.23455810546875, 0.26103973388671875, 0.2875213623046875, 0.31400299072265625, 0.340484619140625, 0.36696624755859375, 0.3934478759765625, 0.41992950439453125, 0.4464111328125, 0.47289276123046875, 0.4993743896484375, 0.5258560180664062, 0.552337646484375, 0.5788192749023438, 0.6053009033203125, 0.6317825317382812, 0.65826416015625, 0.6847457885742188, 0.7112274169921875, 0.7377090454101562, 0.764190673828125, 0.7906723022460938, 0.8171539306640625, 0.8436355590820312, 0.8701171875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 6.0, 1.0, 6.0, 5.0, 16.0, 13.0, 14.0, 27.0, 31.0, 31.0, 46.0, 55.0, 66.0, 70.0, 73.0, 64.0, 73.0, 76.0, 48.0, 66.0, 50.0, 34.0, 27.0, 29.0, 24.0, 16.0, 13.0, 6.0, 7.0, 3.0, 5.0, 1.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.97607421875, -0.9494476318359375, -0.922821044921875, -0.8961944580078125, -0.86956787109375, -0.8429412841796875, -0.816314697265625, -0.7896881103515625, -0.7630615234375, -0.7364349365234375, -0.709808349609375, -0.6831817626953125, -0.65655517578125, -0.6299285888671875, -0.603302001953125, -0.5766754150390625, -0.550048828125, -0.5234222412109375, -0.496795654296875, -0.4701690673828125, -0.44354248046875, -0.4169158935546875, -0.390289306640625, -0.3636627197265625, -0.3370361328125, -0.3104095458984375, -0.283782958984375, -0.2571563720703125, -0.23052978515625, -0.2039031982421875, -0.177276611328125, -0.1506500244140625, -0.1240234375, -0.0973968505859375, -0.070770263671875, -0.0441436767578125, -0.01751708984375, 0.0091094970703125, 0.035736083984375, 0.0623626708984375, 0.0889892578125, 0.1156158447265625, 0.142242431640625, 0.1688690185546875, 0.19549560546875, 0.2221221923828125, 0.248748779296875, 0.2753753662109375, 0.302001953125, 0.3286285400390625, 0.355255126953125, 0.3818817138671875, 0.40850830078125, 0.4351348876953125, 0.461761474609375, 0.4883880615234375, 0.5150146484375, 0.5416412353515625, 0.568267822265625, 0.5948944091796875, 0.62152099609375, 0.6481475830078125, 0.674774169921875, 0.7014007568359375, 0.72802734375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 5.0, 11.0, 9.0, 22.0, 27.0, 41.0, 54.0, 95.0, 141.0, 238.0, 407.0, 677.0, 1267.0, 3477.0, 17797.0, 262444.0, 724222.0, 29489.0, 4669.0, 1580.0, 757.0, 419.0, 229.0, 165.0, 95.0, 64.0, 53.0, 23.0, 33.0, 15.0, 9.0, 7.0, 4.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.5546875, -2.47979736328125, -2.4049072265625, -2.33001708984375, -2.255126953125, -2.18023681640625, -2.1053466796875, -2.03045654296875, -1.95556640625, -1.88067626953125, -1.8057861328125, -1.73089599609375, -1.656005859375, -1.58111572265625, -1.5062255859375, -1.43133544921875, -1.3564453125, -1.28155517578125, -1.2066650390625, -1.13177490234375, -1.056884765625, -0.98199462890625, -0.9071044921875, -0.83221435546875, -0.75732421875, -0.68243408203125, -0.6075439453125, -0.53265380859375, -0.457763671875, -0.38287353515625, -0.3079833984375, -0.23309326171875, -0.158203125, -0.08331298828125, -0.0084228515625, 0.06646728515625, 0.141357421875, 0.21624755859375, 0.2911376953125, 0.36602783203125, 0.44091796875, 0.51580810546875, 0.5906982421875, 0.66558837890625, 0.740478515625, 0.81536865234375, 0.8902587890625, 0.96514892578125, 1.0400390625, 1.11492919921875, 1.1898193359375, 1.26470947265625, 1.339599609375, 1.41448974609375, 1.4893798828125, 1.56427001953125, 1.63916015625, 1.71405029296875, 1.7889404296875, 1.86383056640625, 1.938720703125, 2.01361083984375, 2.0885009765625, 2.16339111328125, 2.23828125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 6.0, 8.0, 7.0, 13.0, 23.0, 25.0, 27.0, 38.0, 56.0, 73.0, 88.0, 113.0, 100.0, 97.0, 83.0, 64.0, 43.0, 45.0, 27.0, 20.0, 11.0, 13.0, 4.0, 8.0, 7.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.6875, -4.559356689453125, -4.43121337890625, -4.303070068359375, -4.1749267578125, -4.046783447265625, -3.91864013671875, -3.790496826171875, -3.662353515625, -3.534210205078125, -3.40606689453125, -3.277923583984375, -3.1497802734375, -3.021636962890625, -2.89349365234375, -2.765350341796875, -2.63720703125, -2.509063720703125, -2.38092041015625, -2.252777099609375, -2.1246337890625, -1.996490478515625, -1.86834716796875, -1.740203857421875, -1.612060546875, -1.483917236328125, -1.35577392578125, -1.227630615234375, -1.0994873046875, -0.971343994140625, -0.84320068359375, -0.715057373046875, -0.5869140625, -0.458770751953125, -0.33062744140625, -0.202484130859375, -0.0743408203125, 0.053802490234375, 0.18194580078125, 0.310089111328125, 0.438232421875, 0.566375732421875, 0.69451904296875, 0.822662353515625, 0.9508056640625, 1.078948974609375, 1.20709228515625, 1.335235595703125, 1.46337890625, 1.591522216796875, 1.71966552734375, 1.847808837890625, 1.9759521484375, 2.104095458984375, 2.23223876953125, 2.360382080078125, 2.488525390625, 2.616668701171875, 2.74481201171875, 2.872955322265625, 3.0010986328125, 3.129241943359375, 3.25738525390625, 3.385528564453125, 3.513671875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 6.0, 8.0, 10.0, 19.0, 27.0, 38.0, 52.0, 74.0, 107.0, 230.0, 409.0, 741.0, 1521.0, 3986.0, 12256.0, 51274.0, 307829.0, 591733.0, 57025.0, 13599.0, 4266.0, 1545.0, 774.0, 412.0, 219.0, 145.0, 86.0, 52.0, 29.0, 18.0, 20.0, 11.0, 9.0, 9.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.38818359375, -0.3756752014160156, -0.36316680908203125, -0.3506584167480469, -0.3381500244140625, -0.3256416320800781, -0.31313323974609375, -0.3006248474121094, -0.288116455078125, -0.2756080627441406, -0.26309967041015625, -0.2505912780761719, -0.2380828857421875, -0.22557449340820312, -0.21306610107421875, -0.20055770874023438, -0.18804931640625, -0.17554092407226562, -0.16303253173828125, -0.15052413940429688, -0.1380157470703125, -0.12550735473632812, -0.11299896240234375, -0.10049057006835938, -0.087982177734375, -0.07547378540039062, -0.06296539306640625, -0.050457000732421875, -0.0379486083984375, -0.025440216064453125, -0.01293182373046875, -0.000423431396484375, 0.0120849609375, 0.024593353271484375, 0.03710174560546875, 0.049610137939453125, 0.0621185302734375, 0.07462692260742188, 0.08713531494140625, 0.09964370727539062, 0.112152099609375, 0.12466049194335938, 0.13716888427734375, 0.14967727661132812, 0.1621856689453125, 0.17469406127929688, 0.18720245361328125, 0.19971084594726562, 0.21221923828125, 0.22472763061523438, 0.23723602294921875, 0.24974441528320312, 0.2622528076171875, 0.2747611999511719, 0.28726959228515625, 0.2997779846191406, 0.312286376953125, 0.3247947692871094, 0.33730316162109375, 0.3498115539550781, 0.3623199462890625, 0.3748283386230469, 0.38733673095703125, 0.3998451232910156, 0.412353515625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 3.0, 9.0, 5.0, 5.0, 9.0, 13.0, 8.0, 13.0, 15.0, 16.0, 21.0, 36.0, 60.0, 63.0, 71.0, 97.0, 106.0, 104.0, 73.0, 53.0, 47.0, 36.0, 29.0, 28.0, 24.0, 8.0, 13.0, 6.0, 4.0, 5.0, 8.0, 2.0, 1.0, 4.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0001575946807861328, -0.00015300512313842773, -0.00014841556549072266, -0.00014382600784301758, -0.0001392364501953125, -0.00013464689254760742, -0.00013005733489990234, -0.00012546777725219727, -0.00012087821960449219, -0.00011628866195678711, -0.00011169910430908203, -0.00010710954666137695, -0.00010251998901367188, -9.79304313659668e-05, -9.334087371826172e-05, -8.875131607055664e-05, -8.416175842285156e-05, -7.957220077514648e-05, -7.49826431274414e-05, -7.039308547973633e-05, -6.580352783203125e-05, -6.121397018432617e-05, -5.6624412536621094e-05, -5.2034854888916016e-05, -4.744529724121094e-05, -4.285573959350586e-05, -3.826618194580078e-05, -3.36766242980957e-05, -2.9087066650390625e-05, -2.4497509002685547e-05, -1.990795135498047e-05, -1.531839370727539e-05, -1.0728836059570312e-05, -6.139278411865234e-06, -1.5497207641601562e-06, 3.039836883544922e-06, 7.62939453125e-06, 1.2218952178955078e-05, 1.6808509826660156e-05, 2.1398067474365234e-05, 2.5987625122070312e-05, 3.057718276977539e-05, 3.516674041748047e-05, 3.975629806518555e-05, 4.4345855712890625e-05, 4.89354133605957e-05, 5.352497100830078e-05, 5.811452865600586e-05, 6.270408630371094e-05, 6.729364395141602e-05, 7.18832015991211e-05, 7.647275924682617e-05, 8.106231689453125e-05, 8.565187454223633e-05, 9.02414321899414e-05, 9.483098983764648e-05, 9.942054748535156e-05, 0.00010401010513305664, 0.00010859966278076172, 0.0001131892204284668, 0.00011777877807617188, 0.00012236833572387695, 0.00012695789337158203, 0.0001315474510192871, 0.0001361370086669922]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 5.0, 7.0, 7.0, 9.0, 19.0, 18.0, 33.0, 47.0, 76.0, 88.0, 180.0, 268.0, 529.0, 1114.0, 2380.0, 7066.0, 28533.0, 162430.0, 722866.0, 95574.0, 18382.0, 5120.0, 1864.0, 861.0, 454.0, 235.0, 117.0, 81.0, 64.0, 35.0, 38.0, 16.0, 16.0, 9.0, 8.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.397216796875, -0.38494110107421875, -0.3726654052734375, -0.36038970947265625, -0.348114013671875, -0.33583831787109375, -0.3235626220703125, -0.31128692626953125, -0.29901123046875, -0.28673553466796875, -0.2744598388671875, -0.26218414306640625, -0.249908447265625, -0.23763275146484375, -0.2253570556640625, -0.21308135986328125, -0.2008056640625, -0.18852996826171875, -0.1762542724609375, -0.16397857666015625, -0.151702880859375, -0.13942718505859375, -0.1271514892578125, -0.11487579345703125, -0.10260009765625, -0.09032440185546875, -0.0780487060546875, -0.06577301025390625, -0.053497314453125, -0.04122161865234375, -0.0289459228515625, -0.01667022705078125, -0.00439453125, 0.00788116455078125, 0.0201568603515625, 0.03243255615234375, 0.044708251953125, 0.05698394775390625, 0.0692596435546875, 0.08153533935546875, 0.09381103515625, 0.10608673095703125, 0.1183624267578125, 0.13063812255859375, 0.142913818359375, 0.15518951416015625, 0.1674652099609375, 0.17974090576171875, 0.1920166015625, 0.20429229736328125, 0.2165679931640625, 0.22884368896484375, 0.241119384765625, 0.25339508056640625, 0.2656707763671875, 0.27794647216796875, 0.29022216796875, 0.30249786376953125, 0.3147735595703125, 0.32704925537109375, 0.339324951171875, 0.35160064697265625, 0.3638763427734375, 0.37615203857421875, 0.388427734375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 3.0, 8.0, 15.0, 10.0, 8.0, 27.0, 32.0, 39.0, 82.0, 90.0, 114.0, 111.0, 113.0, 92.0, 65.0, 55.0, 39.0, 31.0, 22.0, 17.0, 3.0, 5.0, 6.0, 3.0, 2.0, 0.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.6279296875, -0.612213134765625, -0.59649658203125, -0.580780029296875, -0.5650634765625, -0.549346923828125, -0.53363037109375, -0.517913818359375, -0.502197265625, -0.486480712890625, -0.47076416015625, -0.455047607421875, -0.4393310546875, -0.423614501953125, -0.40789794921875, -0.392181396484375, -0.37646484375, -0.360748291015625, -0.34503173828125, -0.329315185546875, -0.3135986328125, -0.297882080078125, -0.28216552734375, -0.266448974609375, -0.250732421875, -0.235015869140625, -0.21929931640625, -0.203582763671875, -0.1878662109375, -0.172149658203125, -0.15643310546875, -0.140716552734375, -0.125, -0.109283447265625, -0.09356689453125, -0.077850341796875, -0.0621337890625, -0.046417236328125, -0.03070068359375, -0.014984130859375, 0.000732421875, 0.016448974609375, 0.03216552734375, 0.047882080078125, 0.0635986328125, 0.079315185546875, 0.09503173828125, 0.110748291015625, 0.12646484375, 0.142181396484375, 0.15789794921875, 0.173614501953125, 0.1893310546875, 0.205047607421875, 0.22076416015625, 0.236480712890625, 0.252197265625, 0.267913818359375, 0.28363037109375, 0.299346923828125, 0.3150634765625, 0.330780029296875, 0.34649658203125, 0.362213134765625, 0.3779296875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 4.0, 12.0, 15.0, 43.0, 94.0, 153.0, 429.0, 144.0, 57.0, 27.0, 14.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.384563446044922, -21.88277816772461, -21.380992889404297, -20.879207611083984, -20.377422332763672, -19.875635147094727, -19.373849868774414, -18.8720645904541, -18.37027931213379, -17.868494033813477, -17.366708755493164, -16.86492347717285, -16.363136291503906, -15.86135196685791, -15.359565734863281, -14.857780456542969, -14.355995178222656, -13.854209899902344, -13.352424621582031, -12.850638389587402, -12.34885311126709, -11.847067832946777, -11.345281600952148, -10.843496322631836, -10.341711044311523, -9.839925765991211, -9.338140487670898, -8.83635425567627, -8.334568977355957, -7.8327836990356445, -7.330997943878174, -6.829212188720703, -6.327426910400391, -5.825641632080078, -5.323855876922607, -4.822070121765137, -4.320284843444824, -3.8184993267059326, -3.316713809967041, -2.8149282932281494, -2.313142776489258, -1.8113572597503662, -1.3095717430114746, -0.807786226272583, -0.3060007095336914, 0.1957848072052002, 0.6975703239440918, 1.1993558406829834, 1.701141357421875, 2.2029268741607666, 2.704712390899658, 3.20649790763855, 3.7082834243774414, 4.210068702697754, 4.711854457855225, 5.213640213012695, 5.715425491333008, 6.21721076965332, 6.718996524810791, 7.220782279968262, 7.722567558288574, 8.224352836608887, 8.726139068603516, 9.227924346923828, 9.72970962524414]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 1.0, 2.0, 0.0, 5.0, 6.0, 7.0, 5.0, 10.0, 8.0, 11.0, 7.0, 16.0, 13.0, 21.0, 22.0, 20.0, 30.0, 22.0, 30.0, 27.0, 37.0, 67.0, 137.0, 136.0, 59.0, 43.0, 32.0, 29.0, 27.0, 26.0, 25.0, 22.0, 13.0, 18.0, 13.0, 13.0, 13.0, 7.0, 5.0, 5.0, 7.0, 2.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.575469017028809, -8.307669639587402, -8.039871215820312, -7.772071838378906, -7.5042724609375, -7.236473560333252, -6.968674659729004, -6.700875282287598, -6.43307638168335, -6.165277481079102, -5.897478103637695, -5.629679203033447, -5.361880302429199, -5.094080924987793, -4.826282024383545, -4.558483123779297, -4.290683746337891, -4.022884845733643, -3.7550854682922363, -3.4872865676879883, -3.219487428665161, -2.951688289642334, -2.683889389038086, -2.416090250015259, -2.1482911109924316, -1.8804919719696045, -1.612692952156067, -1.3448939323425293, -1.0770947933197021, -0.809295654296875, -0.5414966344833374, -0.2736976146697998, -0.005898475646972656, 0.2619006037712097, 0.5296996831893921, 0.7974987626075745, 1.0652978420257568, 1.333096981048584, 1.6008960008621216, 1.8686950206756592, 2.1364941596984863, 2.4042932987213135, 2.6720924377441406, 2.9398913383483887, 3.207690477371216, 3.475489616394043, 3.743288516998291, 4.011087417602539, 4.278886795043945, 4.546685695648193, 4.8144850730896, 5.082283973693848, 5.350083351135254, 5.617882251739502, 5.88568115234375, 6.153480529785156, 6.421279430389404, 6.689078330993652, 6.956877708435059, 7.224676609039307, 7.492475509643555, 7.760274887084961, 8.028074264526367, 8.295872688293457, 8.563672065734863]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 0.0, 6.0, 11.0, 5.0, 17.0, 19.0, 26.0, 30.0, 50.0, 73.0, 101.0, 142.0, 211.0, 350.0, 566.0, 961.0, 1751.0, 3350.0, 7161.0, 19857.0, 69576.0, 293016.0, 1089307.0, 1762328.0, 704586.0, 171265.0, 43800.0, 13659.0, 5722.0, 2645.0, 1430.0, 769.0, 528.0, 319.0, 197.0, 141.0, 92.0, 63.0, 52.0, 29.0, 28.0, 11.0, 7.0, 7.0, 5.0, 7.0, 4.0, 3.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.841796875, -0.817962646484375, -0.79412841796875, -0.770294189453125, -0.7464599609375, -0.722625732421875, -0.69879150390625, -0.674957275390625, -0.651123046875, -0.627288818359375, -0.60345458984375, -0.579620361328125, -0.5557861328125, -0.531951904296875, -0.50811767578125, -0.484283447265625, -0.46044921875, -0.436614990234375, -0.41278076171875, -0.388946533203125, -0.3651123046875, -0.341278076171875, -0.31744384765625, -0.293609619140625, -0.269775390625, -0.245941162109375, -0.22210693359375, -0.198272705078125, -0.1744384765625, -0.150604248046875, -0.12677001953125, -0.102935791015625, -0.0791015625, -0.055267333984375, -0.03143310546875, -0.007598876953125, 0.0162353515625, 0.040069580078125, 0.06390380859375, 0.087738037109375, 0.111572265625, 0.135406494140625, 0.15924072265625, 0.183074951171875, 0.2069091796875, 0.230743408203125, 0.25457763671875, 0.278411865234375, 0.30224609375, 0.326080322265625, 0.34991455078125, 0.373748779296875, 0.3975830078125, 0.421417236328125, 0.44525146484375, 0.469085693359375, 0.492919921875, 0.516754150390625, 0.54058837890625, 0.564422607421875, 0.5882568359375, 0.612091064453125, 0.63592529296875, 0.659759521484375, 0.68359375]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 1.0, 2.0, 0.0, 7.0, 14.0, 13.0, 8.0, 20.0, 34.0, 47.0, 42.0, 43.0, 65.0, 69.0, 73.0, 68.0, 62.0, 72.0, 67.0, 64.0, 49.0, 49.0, 29.0, 25.0, 16.0, 15.0, 19.0, 11.0, 5.0, 7.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.98046875, -0.9552688598632812, -0.9300689697265625, -0.9048690795898438, -0.879669189453125, -0.8544692993164062, -0.8292694091796875, -0.8040695190429688, -0.77886962890625, -0.7536697387695312, -0.7284698486328125, -0.7032699584960938, -0.678070068359375, -0.6528701782226562, -0.6276702880859375, -0.6024703979492188, -0.5772705078125, -0.5520706176757812, -0.5268707275390625, -0.5016708374023438, -0.476470947265625, -0.45127105712890625, -0.4260711669921875, -0.40087127685546875, -0.37567138671875, -0.35047149658203125, -0.3252716064453125, -0.30007171630859375, -0.274871826171875, -0.24967193603515625, -0.2244720458984375, -0.19927215576171875, -0.174072265625, -0.14887237548828125, -0.1236724853515625, -0.09847259521484375, -0.073272705078125, -0.04807281494140625, -0.0228729248046875, 0.00232696533203125, 0.02752685546875, 0.05272674560546875, 0.0779266357421875, 0.10312652587890625, 0.128326416015625, 0.15352630615234375, 0.1787261962890625, 0.20392608642578125, 0.2291259765625, 0.25432586669921875, 0.2795257568359375, 0.30472564697265625, 0.329925537109375, 0.35512542724609375, 0.3803253173828125, 0.40552520751953125, 0.43072509765625, 0.45592498779296875, 0.4811248779296875, 0.5063247680664062, 0.531524658203125, 0.5567245483398438, 0.5819244384765625, 0.6071243286132812, 0.63232421875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 3.0, 3.0, 6.0, 11.0, 17.0, 14.0, 28.0, 39.0, 47.0, 103.0, 152.0, 282.0, 515.0, 1065.0, 3236.0, 24509.0, 3801719.0, 351352.0, 7671.0, 1786.0, 811.0, 357.0, 217.0, 136.0, 62.0, 40.0, 30.0, 20.0, 21.0, 8.0, 9.0, 6.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.75, -3.628173828125, -3.50634765625, -3.384521484375, -3.2626953125, -3.140869140625, -3.01904296875, -2.897216796875, -2.775390625, -2.653564453125, -2.53173828125, -2.409912109375, -2.2880859375, -2.166259765625, -2.04443359375, -1.922607421875, -1.80078125, -1.678955078125, -1.55712890625, -1.435302734375, -1.3134765625, -1.191650390625, -1.06982421875, -0.947998046875, -0.826171875, -0.704345703125, -0.58251953125, -0.460693359375, -0.3388671875, -0.217041015625, -0.09521484375, 0.026611328125, 0.1484375, 0.270263671875, 0.39208984375, 0.513916015625, 0.6357421875, 0.757568359375, 0.87939453125, 1.001220703125, 1.123046875, 1.244873046875, 1.36669921875, 1.488525390625, 1.6103515625, 1.732177734375, 1.85400390625, 1.975830078125, 2.09765625, 2.219482421875, 2.34130859375, 2.463134765625, 2.5849609375, 2.706787109375, 2.82861328125, 2.950439453125, 3.072265625, 3.194091796875, 3.31591796875, 3.437744140625, 3.5595703125, 3.681396484375, 3.80322265625, 3.925048828125, 4.046875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 8.0, 7.0, 23.0, 24.0, 38.0, 63.0, 97.0, 159.0, 276.0, 436.0, 647.0, 778.0, 602.0, 375.0, 198.0, 120.0, 75.0, 57.0, 40.0, 24.0, 10.0, 7.0, 5.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.400390625, -3.31402587890625, -3.2276611328125, -3.14129638671875, -3.054931640625, -2.96856689453125, -2.8822021484375, -2.79583740234375, -2.70947265625, -2.62310791015625, -2.5367431640625, -2.45037841796875, -2.364013671875, -2.27764892578125, -2.1912841796875, -2.10491943359375, -2.0185546875, -1.93218994140625, -1.8458251953125, -1.75946044921875, -1.673095703125, -1.58673095703125, -1.5003662109375, -1.41400146484375, -1.32763671875, -1.24127197265625, -1.1549072265625, -1.06854248046875, -0.982177734375, -0.89581298828125, -0.8094482421875, -0.72308349609375, -0.63671875, -0.55035400390625, -0.4639892578125, -0.37762451171875, -0.291259765625, -0.20489501953125, -0.1185302734375, -0.03216552734375, 0.05419921875, 0.14056396484375, 0.2269287109375, 0.31329345703125, 0.399658203125, 0.48602294921875, 0.5723876953125, 0.65875244140625, 0.7451171875, 0.83148193359375, 0.9178466796875, 1.00421142578125, 1.090576171875, 1.17694091796875, 1.2633056640625, 1.34967041015625, 1.43603515625, 1.52239990234375, 1.6087646484375, 1.69512939453125, 1.781494140625, 1.86785888671875, 1.9542236328125, 2.04058837890625, 2.126953125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 6.0, 7.0, 3.0, 0.0, 1.0, 8.0, 16.0, 22.0, 68.0, 153.0, 295.0, 255.0, 92.0, 45.0, 23.0, 12.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-55.16006088256836, -53.98428726196289, -52.808509826660156, -51.63273620605469, -50.45696258544922, -49.28118896484375, -48.105411529541016, -46.92963790893555, -45.75386047363281, -44.578086853027344, -43.40230941772461, -42.22653579711914, -41.05076217651367, -39.87498474121094, -38.69921112060547, -37.5234375, -36.34766387939453, -35.17189025878906, -33.99611282348633, -32.82033920288086, -31.64456558227539, -30.46879005432129, -29.293014526367188, -28.11724090576172, -26.941465377807617, -25.765689849853516, -24.589916229248047, -23.414140701293945, -22.238365173339844, -21.062591552734375, -19.886816024780273, -18.711040496826172, -17.53527069091797, -16.359495162963867, -15.183721542358398, -14.007946014404297, -12.832171440124512, -11.656396865844727, -10.480621337890625, -9.30484676361084, -8.129072189331055, -6.9532976150512695, -5.777522563934326, -4.601747512817383, -3.4259729385375977, -2.2501983642578125, -1.0744233131408691, 0.10135173797607422, 1.2771263122558594, 2.4529011249542236, 3.628675937652588, 4.804450988769531, 5.980225563049316, 7.156000137329102, 8.331775665283203, 9.507550239562988, 10.683324813842773, 11.859099388122559, 13.034873962402344, 14.210649490356445, 15.38642406463623, 16.562198638916016, 17.737974166870117, 18.91374969482422, 20.089523315429688]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 9.0, 11.0, 16.0, 16.0, 39.0, 27.0, 61.0, 68.0, 79.0, 100.0, 127.0, 91.0, 79.0, 49.0, 47.0, 52.0, 37.0, 31.0, 19.0, 15.0, 15.0, 5.0, 5.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.348106384277344, -17.676523208618164, -17.00493812561035, -16.333354949951172, -15.66176986694336, -14.99018669128418, -14.318602561950684, -13.647018432617188, -12.975434303283691, -12.303850173950195, -11.6322660446167, -10.960681915283203, -10.289098739624023, -9.617513656616211, -8.945930480957031, -8.274346351623535, -7.602762222290039, -6.931178092956543, -6.259593963623047, -5.588010311126709, -4.916426181793213, -4.244842052459717, -3.573258399963379, -2.901674270629883, -2.2300901412963867, -1.5585061311721802, -0.8869221210479736, -0.21533823013305664, 0.45624589920043945, 1.1278300285339355, 1.7994136810302734, 2.4709978103637695, 3.1425819396972656, 3.8141660690307617, 4.485750198364258, 5.157333850860596, 5.828917980194092, 6.500502109527588, 7.172085762023926, 7.843669891357422, 8.515254020690918, 9.186838150024414, 9.85842227935791, 10.530006408691406, 11.201589584350586, 11.873174667358398, 12.544757843017578, 13.216341972351074, 13.88792610168457, 14.559510231018066, 15.231094360351562, 15.902677536010742, 16.574262619018555, 17.245845794677734, 17.917430877685547, 18.589014053344727, 19.260597229003906, 19.932180404663086, 20.6037654876709, 21.275348663330078, 21.94693374633789, 22.61851692199707, 23.29010009765625, 23.961685180664062, 24.633270263671875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 5.0, 10.0, 9.0, 11.0, 17.0, 25.0, 30.0, 54.0, 81.0, 153.0, 241.0, 620.0, 1531.0, 5992.0, 33942.0, 485991.0, 477474.0, 33594.0, 6008.0, 1573.0, 584.0, 261.0, 129.0, 69.0, 52.0, 29.0, 22.0, 13.0, 9.0, 9.0, 3.0, 4.0, 10.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.150390625, -2.078704833984375, -2.00701904296875, -1.935333251953125, -1.8636474609375, -1.791961669921875, -1.72027587890625, -1.648590087890625, -1.576904296875, -1.505218505859375, -1.43353271484375, -1.361846923828125, -1.2901611328125, -1.218475341796875, -1.14678955078125, -1.075103759765625, -1.00341796875, -0.931732177734375, -0.86004638671875, -0.788360595703125, -0.7166748046875, -0.644989013671875, -0.57330322265625, -0.501617431640625, -0.429931640625, -0.358245849609375, -0.28656005859375, -0.214874267578125, -0.1431884765625, -0.071502685546875, 0.00018310546875, 0.071868896484375, 0.1435546875, 0.215240478515625, 0.28692626953125, 0.358612060546875, 0.4302978515625, 0.501983642578125, 0.57366943359375, 0.645355224609375, 0.717041015625, 0.788726806640625, 0.86041259765625, 0.932098388671875, 1.0037841796875, 1.075469970703125, 1.14715576171875, 1.218841552734375, 1.29052734375, 1.362213134765625, 1.43389892578125, 1.505584716796875, 1.5772705078125, 1.648956298828125, 1.72064208984375, 1.792327880859375, 1.864013671875, 1.935699462890625, 2.00738525390625, 2.079071044921875, 2.1507568359375, 2.222442626953125, 2.29412841796875, 2.365814208984375, 2.4375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 9.0, 6.0, 18.0, 34.0, 61.0, 66.0, 106.0, 134.0, 144.0, 132.0, 103.0, 69.0, 52.0, 30.0, 24.0, 11.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7998046875, -1.7365264892578125, -1.673248291015625, -1.6099700927734375, -1.54669189453125, -1.4834136962890625, -1.420135498046875, -1.3568572998046875, -1.2935791015625, -1.2303009033203125, -1.167022705078125, -1.1037445068359375, -1.04046630859375, -0.9771881103515625, -0.913909912109375, -0.8506317138671875, -0.787353515625, -0.7240753173828125, -0.660797119140625, -0.5975189208984375, -0.53424072265625, -0.4709625244140625, -0.407684326171875, -0.3444061279296875, -0.2811279296875, -0.2178497314453125, -0.154571533203125, -0.0912933349609375, -0.02801513671875, 0.0352630615234375, 0.098541259765625, 0.1618194580078125, 0.22509765625, 0.2883758544921875, 0.351654052734375, 0.4149322509765625, 0.47821044921875, 0.5414886474609375, 0.604766845703125, 0.6680450439453125, 0.7313232421875, 0.7946014404296875, 0.857879638671875, 0.9211578369140625, 0.98443603515625, 1.0477142333984375, 1.110992431640625, 1.1742706298828125, 1.237548828125, 1.3008270263671875, 1.364105224609375, 1.4273834228515625, 1.49066162109375, 1.5539398193359375, 1.617218017578125, 1.6804962158203125, 1.7437744140625, 1.8070526123046875, 1.870330810546875, 1.9336090087890625, 1.99688720703125, 2.0601654052734375, 2.123443603515625, 2.1867218017578125, 2.25]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 7.0, 8.0, 3.0, 8.0, 13.0, 13.0, 17.0, 20.0, 35.0, 46.0, 56.0, 82.0, 111.0, 176.0, 303.0, 467.0, 988.0, 2311.0, 7858.0, 47991.0, 877114.0, 93031.0, 11987.0, 3126.0, 1202.0, 589.0, 353.0, 188.0, 125.0, 90.0, 52.0, 46.0, 38.0, 28.0, 19.0, 15.0, 11.0, 5.0, 7.0, 8.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.9072265625, -1.8537139892578125, -1.800201416015625, -1.7466888427734375, -1.69317626953125, -1.6396636962890625, -1.586151123046875, -1.5326385498046875, -1.4791259765625, -1.4256134033203125, -1.372100830078125, -1.3185882568359375, -1.26507568359375, -1.2115631103515625, -1.158050537109375, -1.1045379638671875, -1.051025390625, -0.9975128173828125, -0.944000244140625, -0.8904876708984375, -0.83697509765625, -0.7834625244140625, -0.729949951171875, -0.6764373779296875, -0.6229248046875, -0.5694122314453125, -0.515899658203125, -0.4623870849609375, -0.40887451171875, -0.3553619384765625, -0.301849365234375, -0.2483367919921875, -0.19482421875, -0.1413116455078125, -0.087799072265625, -0.0342864990234375, 0.01922607421875, 0.0727386474609375, 0.126251220703125, 0.1797637939453125, 0.2332763671875, 0.2867889404296875, 0.340301513671875, 0.3938140869140625, 0.44732666015625, 0.5008392333984375, 0.554351806640625, 0.6078643798828125, 0.661376953125, 0.7148895263671875, 0.768402099609375, 0.8219146728515625, 0.87542724609375, 0.9289398193359375, 0.982452392578125, 1.0359649658203125, 1.0894775390625, 1.1429901123046875, 1.196502685546875, 1.2500152587890625, 1.30352783203125, 1.3570404052734375, 1.410552978515625, 1.4640655517578125, 1.517578125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 3.0, 6.0, 15.0, 3.0, 8.0, 10.0, 12.0, 19.0, 21.0, 29.0, 30.0, 35.0, 51.0, 73.0, 73.0, 70.0, 113.0, 76.0, 56.0, 58.0, 42.0, 38.0, 31.0, 22.0, 23.0, 26.0, 12.0, 7.0, 8.0, 8.0, 4.0, 5.0, 2.0, 6.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.40234375, -4.29046630859375, -4.1785888671875, -4.06671142578125, -3.954833984375, -3.84295654296875, -3.7310791015625, -3.61920166015625, -3.50732421875, -3.39544677734375, -3.2835693359375, -3.17169189453125, -3.059814453125, -2.94793701171875, -2.8360595703125, -2.72418212890625, -2.6123046875, -2.50042724609375, -2.3885498046875, -2.27667236328125, -2.164794921875, -2.05291748046875, -1.9410400390625, -1.82916259765625, -1.71728515625, -1.60540771484375, -1.4935302734375, -1.38165283203125, -1.269775390625, -1.15789794921875, -1.0460205078125, -0.93414306640625, -0.822265625, -0.71038818359375, -0.5985107421875, -0.48663330078125, -0.374755859375, -0.26287841796875, -0.1510009765625, -0.03912353515625, 0.07275390625, 0.18463134765625, 0.2965087890625, 0.40838623046875, 0.520263671875, 0.63214111328125, 0.7440185546875, 0.85589599609375, 0.9677734375, 1.07965087890625, 1.1915283203125, 1.30340576171875, 1.415283203125, 1.52716064453125, 1.6390380859375, 1.75091552734375, 1.86279296875, 1.97467041015625, 2.0865478515625, 2.19842529296875, 2.310302734375, 2.42218017578125, 2.5340576171875, 2.64593505859375, 2.7578125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 3.0, 8.0, 4.0, 10.0, 12.0, 21.0, 31.0, 38.0, 71.0, 93.0, 106.0, 215.0, 357.0, 688.0, 1572.0, 3936.0, 12765.0, 56429.0, 848122.0, 96493.0, 18363.0, 5257.0, 1965.0, 896.0, 421.0, 240.0, 165.0, 80.0, 54.0, 42.0, 37.0, 19.0, 11.0, 11.0, 6.0, 8.0, 6.0, 0.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.391357421875, -0.3803749084472656, -0.36939239501953125, -0.3584098815917969, -0.3474273681640625, -0.3364448547363281, -0.32546234130859375, -0.3144798278808594, -0.303497314453125, -0.2925148010253906, -0.28153228759765625, -0.2705497741699219, -0.2595672607421875, -0.24858474731445312, -0.23760223388671875, -0.22661972045898438, -0.21563720703125, -0.20465469360351562, -0.19367218017578125, -0.18268966674804688, -0.1717071533203125, -0.16072463989257812, -0.14974212646484375, -0.13875961303710938, -0.127777099609375, -0.11679458618164062, -0.10581207275390625, -0.09482955932617188, -0.0838470458984375, -0.07286453247070312, -0.06188201904296875, -0.050899505615234375, -0.0399169921875, -0.028934478759765625, -0.01795196533203125, -0.006969451904296875, 0.0040130615234375, 0.014995574951171875, 0.02597808837890625, 0.036960601806640625, 0.047943115234375, 0.058925628662109375, 0.06990814208984375, 0.08089065551757812, 0.0918731689453125, 0.10285568237304688, 0.11383819580078125, 0.12482070922851562, 0.13580322265625, 0.14678573608398438, 0.15776824951171875, 0.16875076293945312, 0.1797332763671875, 0.19071578979492188, 0.20169830322265625, 0.21268081665039062, 0.223663330078125, 0.23464584350585938, 0.24562835693359375, 0.2566108703613281, 0.2675933837890625, 0.2785758972167969, 0.28955841064453125, 0.3005409240722656, 0.3115234375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 5.0, 5.0, 5.0, 9.0, 7.0, 7.0, 9.0, 12.0, 10.0, 22.0, 27.0, 43.0, 36.0, 69.0, 108.0, 133.0, 141.0, 100.0, 65.0, 45.0, 34.0, 31.0, 20.0, 9.0, 10.0, 8.0, 8.0, 5.0, 8.0, 4.0, 4.0, 2.0, 1.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.0001628398895263672, -0.00015853624790906906, -0.00015423260629177094, -0.0001499289646744728, -0.00014562532305717468, -0.00014132168143987656, -0.00013701803982257843, -0.0001327143982052803, -0.00012841075658798218, -0.00012410711497068405, -0.00011980347335338593, -0.0001154998317360878, -0.00011119619011878967, -0.00010689254850149155, -0.00010258890688419342, -9.82852652668953e-05, -9.398162364959717e-05, -8.967798203229904e-05, -8.537434041500092e-05, -8.107069879770279e-05, -7.676705718040466e-05, -7.246341556310654e-05, -6.815977394580841e-05, -6.385613232851028e-05, -5.955249071121216e-05, -5.524884909391403e-05, -5.0945207476615906e-05, -4.664156585931778e-05, -4.233792424201965e-05, -3.803428262472153e-05, -3.37306410074234e-05, -2.9426999390125275e-05, -2.512335777282715e-05, -2.0819716155529022e-05, -1.6516074538230896e-05, -1.221243292093277e-05, -7.908791303634644e-06, -3.6051496863365173e-06, 6.984919309616089e-07, 5.002133548259735e-06, 9.305775165557861e-06, 1.3609416782855988e-05, 1.7913058400154114e-05, 2.221670001745224e-05, 2.6520341634750366e-05, 3.082398325204849e-05, 3.512762486934662e-05, 3.9431266486644745e-05, 4.373490810394287e-05, 4.8038549721241e-05, 5.2342191338539124e-05, 5.664583295583725e-05, 6.0949474573135376e-05, 6.52531161904335e-05, 6.955675780773163e-05, 7.386039942502975e-05, 7.816404104232788e-05, 8.246768265962601e-05, 8.677132427692413e-05, 9.107496589422226e-05, 9.537860751152039e-05, 9.968224912881851e-05, 0.00010398589074611664, 0.00010828953236341476, 0.00011259317398071289]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 7.0, 10.0, 13.0, 7.0, 21.0, 17.0, 26.0, 53.0, 59.0, 120.0, 181.0, 303.0, 499.0, 990.0, 1972.0, 4321.0, 10786.0, 33436.0, 192392.0, 733436.0, 46088.0, 13759.0, 5236.0, 2262.0, 1141.0, 617.0, 315.0, 207.0, 124.0, 48.0, 30.0, 29.0, 18.0, 12.0, 7.0, 3.0, 8.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.189208984375, -0.18167495727539062, -0.17414093017578125, -0.16660690307617188, -0.1590728759765625, -0.15153884887695312, -0.14400482177734375, -0.13647079467773438, -0.128936767578125, -0.12140274047851562, -0.11386871337890625, -0.10633468627929688, -0.0988006591796875, -0.09126663208007812, -0.08373260498046875, -0.07619857788085938, -0.06866455078125, -0.061130523681640625, -0.05359649658203125, -0.046062469482421875, -0.0385284423828125, -0.030994415283203125, -0.02346038818359375, -0.015926361083984375, -0.008392333984375, -0.000858306884765625, 0.00667572021484375, 0.014209747314453125, 0.0217437744140625, 0.029277801513671875, 0.03681182861328125, 0.044345855712890625, 0.0518798828125, 0.059413909912109375, 0.06694793701171875, 0.07448196411132812, 0.0820159912109375, 0.08955001831054688, 0.09708404541015625, 0.10461807250976562, 0.112152099609375, 0.11968612670898438, 0.12722015380859375, 0.13475418090820312, 0.1422882080078125, 0.14982223510742188, 0.15735626220703125, 0.16489028930664062, 0.17242431640625, 0.17995834350585938, 0.18749237060546875, 0.19502639770507812, 0.2025604248046875, 0.21009445190429688, 0.21762847900390625, 0.22516250610351562, 0.232696533203125, 0.24023056030273438, 0.24776458740234375, 0.2552986145019531, 0.2628326416015625, 0.2703666687011719, 0.27790069580078125, 0.2854347229003906, 0.29296875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 5.0, 6.0, 3.0, 4.0, 6.0, 1.0, 3.0, 9.0, 7.0, 9.0, 11.0, 13.0, 18.0, 18.0, 25.0, 30.0, 45.0, 41.0, 77.0, 94.0, 116.0, 86.0, 92.0, 67.0, 45.0, 48.0, 21.0, 20.0, 9.0, 14.0, 6.0, 16.0, 9.0, 8.0, 3.0, 4.0, 2.0, 11.0, 2.0, 3.0, 0.0, 1.0, 3.0], "bins": [-0.3974609375, -0.3878898620605469, -0.37831878662109375, -0.3687477111816406, -0.3591766357421875, -0.3496055603027344, -0.34003448486328125, -0.3304634094238281, -0.320892333984375, -0.3113212585449219, -0.30175018310546875, -0.2921791076660156, -0.2826080322265625, -0.2730369567871094, -0.26346588134765625, -0.2538948059082031, -0.24432373046875, -0.23475265502929688, -0.22518157958984375, -0.21561050415039062, -0.2060394287109375, -0.19646835327148438, -0.18689727783203125, -0.17732620239257812, -0.167755126953125, -0.15818405151367188, -0.14861297607421875, -0.13904190063476562, -0.1294708251953125, -0.11989974975585938, -0.11032867431640625, -0.10075759887695312, -0.0911865234375, -0.08161544799804688, -0.07204437255859375, -0.062473297119140625, -0.0529022216796875, -0.043331146240234375, -0.03376007080078125, -0.024188995361328125, -0.014617919921875, -0.005046844482421875, 0.00452423095703125, 0.014095306396484375, 0.0236663818359375, 0.033237457275390625, 0.04280853271484375, 0.052379608154296875, 0.06195068359375, 0.07152175903320312, 0.08109283447265625, 0.09066390991210938, 0.1002349853515625, 0.10980606079101562, 0.11937713623046875, 0.12894821166992188, 0.138519287109375, 0.14809036254882812, 0.15766143798828125, 0.16723251342773438, 0.1768035888671875, 0.18637466430664062, 0.19594573974609375, 0.20551681518554688, 0.215087890625]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 3.0, 3.0, 8.0, 18.0, 32.0, 74.0, 197.0, 479.0, 68.0, 63.0, 29.0, 6.0, 9.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.75851058959961, -15.283124923706055, -14.807740211486816, -14.332355499267578, -13.856969833374023, -13.381584167480469, -12.90619945526123, -12.430814743041992, -11.955429077148438, -11.480043411254883, -11.004658699035645, -10.529273986816406, -10.053888320922852, -9.578502655029297, -9.103117942810059, -8.62773323059082, -8.152347564697266, -7.676962375640869, -7.201577186584473, -6.726191997528076, -6.25080680847168, -5.775421619415283, -5.300036430358887, -4.82465124130249, -4.349266052246094, -3.8738808631896973, -3.398495674133301, -2.9231104850769043, -2.447725296020508, -1.9723401069641113, -1.4969549179077148, -1.0215697288513184, -0.5461854934692383, -0.0708003044128418, 0.4045848846435547, 0.8799700736999512, 1.3553552627563477, 1.8307404518127441, 2.3061256408691406, 2.781510829925537, 3.2568960189819336, 3.73228120803833, 4.207666397094727, 4.683051586151123, 5.1584367752075195, 5.633821964263916, 6.1092071533203125, 6.584592342376709, 7.0599775314331055, 7.535362720489502, 8.010747909545898, 8.486133575439453, 8.961518287658691, 9.43690299987793, 9.912288665771484, 10.387674331665039, 10.863059043884277, 11.338443756103516, 11.81382942199707, 12.289215087890625, 12.764599800109863, 13.239984512329102, 13.715370178222656, 14.190755844116211, 14.66614055633545]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 4.0, 5.0, 3.0, 4.0, 8.0, 12.0, 8.0, 12.0, 11.0, 13.0, 23.0, 19.0, 33.0, 31.0, 33.0, 139.0, 338.0, 73.0, 37.0, 25.0, 30.0, 24.0, 24.0, 28.0, 25.0, 10.0, 10.0, 8.0, 3.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.105731964111328, -10.80048656463623, -10.495241165161133, -10.189995765686035, -9.884750366210938, -9.57950496673584, -9.274259567260742, -8.969014167785645, -8.663768768310547, -8.35852336883545, -8.053277969360352, -7.748032569885254, -7.442787170410156, -7.137541770935059, -6.832296371459961, -6.527050971984863, -6.221806049346924, -5.916560649871826, -5.6113152503967285, -5.306069850921631, -5.000824451446533, -4.6955790519714355, -4.390334129333496, -4.085088729858398, -3.7798430919647217, -3.474597692489624, -3.1693522930145264, -2.864107131958008, -2.55886173248291, -2.2536163330078125, -1.9483709335327148, -1.6431255340576172, -1.3378801345825195, -1.0326347351074219, -0.727389395236969, -0.4221440553665161, -0.11689865589141846, 0.1883467435836792, 0.4935920238494873, 0.798837423324585, 1.1040828227996826, 1.4093282222747803, 1.714573621749878, 2.0198187828063965, 2.325064182281494, 2.630309581756592, 2.9355549812316895, 3.240800380706787, 3.5460457801818848, 3.8512911796569824, 4.15653657913208, 4.461781978607178, 4.767027378082275, 5.072272777557373, 5.3775177001953125, 5.68276309967041, 5.988008499145508, 6.2932538986206055, 6.598499298095703, 6.903744697570801, 7.208990097045898, 7.514235496520996, 7.819480895996094, 8.124726295471191, 8.429971694946289]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 3.0, 6.0, 6.0, 13.0, 21.0, 9.0, 27.0, 17.0, 32.0, 27.0, 49.0, 50.0, 66.0, 218.0, 146.0, 48.0, 42.0, 34.0, 26.0, 22.0, 21.0, 15.0, 17.0, 15.0, 11.0, 12.0, 10.0, 8.0, 2.0, 3.0, 2.0, 4.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.740234375, -0.7168350219726562, -0.6934356689453125, -0.6700363159179688, -0.646636962890625, -0.6232376098632812, -0.5998382568359375, -0.5764389038085938, -0.55303955078125, -0.5296401977539062, -0.5062408447265625, -0.48284149169921875, -0.459442138671875, -0.43604278564453125, -0.4126434326171875, -0.38924407958984375, -0.3658447265625, -0.34244537353515625, -0.3190460205078125, -0.29564666748046875, -0.272247314453125, -0.24884796142578125, -0.2254486083984375, -0.20204925537109375, -0.17864990234375, -0.15525054931640625, -0.1318511962890625, -0.10845184326171875, -0.085052490234375, -0.06165313720703125, -0.0382537841796875, -0.01485443115234375, 0.008544921875, 0.03194427490234375, 0.0553436279296875, 0.07874298095703125, 0.102142333984375, 0.12554168701171875, 0.1489410400390625, 0.17234039306640625, 0.19573974609375, 0.21913909912109375, 0.2425384521484375, 0.26593780517578125, 0.289337158203125, 0.31273651123046875, 0.3361358642578125, 0.35953521728515625, 0.3829345703125, 0.40633392333984375, 0.4297332763671875, 0.45313262939453125, 0.476531982421875, 0.49993133544921875, 0.5233306884765625, 0.5467300415039062, 0.57012939453125, 0.5935287475585938, 0.6169281005859375, 0.6403274536132812, 0.663726806640625, 0.6871261596679688, 0.7105255126953125, 0.7339248657226562, 0.75732421875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 6.0, 11.0, 6.0, 4.0, 13.0, 27.0, 38.0, 63.0, 58.0, 132.0, 230.0, 606.0, 2136.0, 10770.0, 8347408.0, 22437.0, 3119.0, 814.0, 285.0, 145.0, 105.0, 56.0, 24.0, 19.0, 20.0, 14.0, 7.0, 3.0, 1.0, 3.0, 4.0, 4.0, 5.0, 7.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-6.430327415466309, -6.197672367095947, -5.965016841888428, -5.732361793518066, -5.499706745147705, -5.267051696777344, -5.034396171569824, -4.801741123199463, -4.569086074829102, -4.33643102645874, -4.103775501251221, -3.8711204528808594, -3.638465404510498, -3.4058101177215576, -3.173154830932617, -2.940499782562256, -2.7078444957733154, -2.475189208984375, -2.2425341606140137, -2.0098788738250732, -1.777223825454712, -1.5445685386657715, -1.3119133710861206, -1.0792582035064697, -0.8466030359268188, -0.613947868347168, -0.3812926709651947, -0.14863747358322144, 0.08401769399642944, 0.3166729211807251, 0.549328088760376, 0.7819832563400269, 1.0146384239196777, 1.2472935914993286, 1.4799487590789795, 1.71260404586792, 1.9452590942382812, 2.1779143810272217, 2.410569667816162, 2.6432247161865234, 2.8758797645568848, 3.108535051345825, 3.3411900997161865, 3.573845386505127, 3.8065004348754883, 4.039155960083008, 4.271811008453369, 4.5044660568237305, 4.73712158203125, 4.969776630401611, 5.202432155609131, 5.435087203979492, 5.6677422523498535, 5.900397300720215, 6.133052825927734, 6.365707874298096, 6.598362922668457, 6.831017971038818, 7.063673496246338, 7.296328544616699, 7.5289835929870605, 7.761638641357422, 7.994294166564941, 8.226949691772461, 8.459604263305664]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 0.0, 3.0, 2.0, 5.0, 3.0, 1.0, 1.0, 11.0, 5.0, 0.0, 4.0, 3.0, 4.0, 7.0, 10.0, 2.0, 4.0, 4.0, 2.0, 7.0, 4.0, 2.0, 2.0, 1.0, 3.0, 3.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.243095874786377, -5.058807373046875, -4.874518394470215, -4.690229892730713, -4.505941390991211, -4.321652889251709, -4.137364387512207, -3.953075408935547, -3.768786907196045, -3.584498405456543, -3.400209665298462, -3.215920925140381, -3.031632423400879, -2.847343921661377, -2.663055181503296, -2.478766441345215, -2.294477939605713, -2.110189437866211, -1.9259006977081299, -1.7416120767593384, -1.5573234558105469, -1.3730348348617554, -1.1887462139129639, -1.0044575929641724, -0.8201689720153809, -0.6358803510665894, -0.45159173011779785, -0.26730310916900635, -0.08301448822021484, 0.10127413272857666, 0.28556275367736816, 0.46985137462615967, 0.6541399955749512, 0.8384286165237427, 1.0227172374725342, 1.2070058584213257, 1.3912944793701172, 1.5755831003189087, 1.7598717212677002, 1.9441603422164917, 2.128448963165283, 2.312737464904785, 2.497026205062866, 2.6813149452209473, 2.865603446960449, 3.049891948699951, 3.2341806888580322, 3.4184694290161133, 3.6027579307556152, 3.787046432495117, 3.9713351726531982, 4.155623912811279, 4.339912414550781, 4.524200916290283, 4.708489418029785, 4.892778396606445, 5.077066898345947, 5.261355400085449, 5.445644378662109, 5.629932880401611, 5.814221382141113, 5.998509883880615, 6.182798385620117, 6.367087364196777, 6.551375865936279]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 10.0, 5.0, 12.0, 14.0, 18.0, 15.0, 28.0, 40.0, 50.0, 96.0, 115.0, 216.0, 289.0, 619.0, 1277.0, 3117.0, 8882.0, 27000.0, 91343.0, 226016.0, 114665.0, 33315.0, 10358.0, 3566.0, 1409.0, 677.0, 352.0, 215.0, 151.0, 102.0, 82.0, 47.0, 51.0, 26.0, 25.0, 15.0, 13.0, 7.0, 9.0, 4.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.984375, -5.79498291015625, -5.6055908203125, -5.41619873046875, -5.226806640625, -5.03741455078125, -4.8480224609375, -4.65863037109375, -4.46923828125, -4.27984619140625, -4.0904541015625, -3.90106201171875, -3.711669921875, -3.52227783203125, -3.3328857421875, -3.14349365234375, -2.9541015625, -2.76470947265625, -2.5753173828125, -2.38592529296875, -2.196533203125, -2.00714111328125, -1.8177490234375, -1.62835693359375, -1.43896484375, -1.24957275390625, -1.0601806640625, -0.87078857421875, -0.681396484375, -0.49200439453125, -0.3026123046875, -0.11322021484375, 0.076171875, 0.26556396484375, 0.4549560546875, 0.64434814453125, 0.833740234375, 1.02313232421875, 1.2125244140625, 1.40191650390625, 1.59130859375, 1.78070068359375, 1.9700927734375, 2.15948486328125, 2.348876953125, 2.53826904296875, 2.7276611328125, 2.91705322265625, 3.1064453125, 3.29583740234375, 3.4852294921875, 3.67462158203125, 3.864013671875, 4.05340576171875, 4.2427978515625, 4.43218994140625, 4.62158203125, 4.81097412109375, 5.0003662109375, 5.18975830078125, 5.379150390625, 5.56854248046875, 5.7579345703125, 5.94732666015625, 6.13671875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 8.0, 15.0, 34.0, 39.0, 76.0, 119.0, 163.0, 160.0, 145.0, 111.0, 60.0, 33.0, 31.0, 13.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.95703125, -1.888214111328125, -1.81939697265625, -1.750579833984375, -1.6817626953125, -1.612945556640625, -1.54412841796875, -1.475311279296875, -1.406494140625, -1.337677001953125, -1.26885986328125, -1.200042724609375, -1.1312255859375, -1.062408447265625, -0.99359130859375, -0.924774169921875, -0.85595703125, -0.787139892578125, -0.71832275390625, -0.649505615234375, -0.5806884765625, -0.511871337890625, -0.44305419921875, -0.374237060546875, -0.305419921875, -0.236602783203125, -0.16778564453125, -0.098968505859375, -0.0301513671875, 0.038665771484375, 0.10748291015625, 0.176300048828125, 0.2451171875, 0.313934326171875, 0.38275146484375, 0.451568603515625, 0.5203857421875, 0.589202880859375, 0.65802001953125, 0.726837158203125, 0.795654296875, 0.864471435546875, 0.93328857421875, 1.002105712890625, 1.0709228515625, 1.139739990234375, 1.20855712890625, 1.277374267578125, 1.34619140625, 1.415008544921875, 1.48382568359375, 1.552642822265625, 1.6214599609375, 1.690277099609375, 1.75909423828125, 1.827911376953125, 1.896728515625, 1.965545654296875, 2.03436279296875, 2.103179931640625, 2.1719970703125, 2.240814208984375, 2.30963134765625, 2.378448486328125, 2.447265625]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 3.0, 3.0, 7.0, 5.0, 5.0, 9.0, 17.0, 34.0, 45.0, 82.0, 77.0, 75.0, 43.0, 24.0, 12.0, 12.0, 6.0, 5.0, 7.0, 6.0, 3.0, 4.0, 3.0, 4.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.181715488433838, -5.986423015594482, -5.791130542755127, -5.5958380699157715, -5.400545597076416, -5.2052531242370605, -5.009961128234863, -4.814668655395508, -4.619376182556152, -4.424083709716797, -4.228791236877441, -4.033498764038086, -3.8382062911987305, -3.642913818359375, -3.4476215839385986, -3.252329111099243, -3.0570363998413086, -2.861743927001953, -2.6664514541625977, -2.471158981323242, -2.2758665084838867, -2.0805740356445312, -1.8852818012237549, -1.6899893283843994, -1.494696855545044, -1.2994043827056885, -1.104111909866333, -0.9088195562362671, -0.7135270833969116, -0.5182346105575562, -0.32294225692749023, -0.12764978408813477, 0.0676422119140625, 0.2629346549510956, 0.45822709798812866, 0.6535195112228394, 0.8488119840621948, 1.0441044569015503, 1.2393968105316162, 1.4346892833709717, 1.6299817562103271, 1.8252742290496826, 2.020566701889038, 2.2158589363098145, 2.41115140914917, 2.6064438819885254, 2.801736354827881, 2.9970288276672363, 3.192321300506592, 3.3876137733459473, 3.5829062461853027, 3.778198719024658, 3.9734911918640137, 4.168783664703369, 4.364075660705566, 4.559368133544922, 4.754660606384277, 4.949953079223633, 5.145245552062988, 5.340538024902344, 5.535830497741699, 5.731122970581055, 5.92641544342041, 6.121707916259766, 6.317000389099121]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 1.0, 4.0, 3.0, 5.0, 5.0, 9.0, 13.0, 33.0, 68.0, 102.0, 89.0, 55.0, 26.0, 10.0, 7.0, 7.0, 5.0, 5.0, 2.0, 3.0, 1.0, 5.0, 3.0, 6.0, 2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7101640701293945, -4.532390117645264, -4.354616641998291, -4.17684268951416, -3.9990689754486084, -3.8212952613830566, -3.643521547317505, -3.465747833251953, -3.2879738807678223, -3.1102001667022705, -2.9324264526367188, -2.754652500152588, -2.576878786087036, -2.3991050720214844, -2.2213313579559326, -2.043557643890381, -1.865783929824829, -1.6880102157592773, -1.510236382484436, -1.3324626684188843, -1.154688835144043, -0.9769151210784912, -0.7991414070129395, -0.6213675737380981, -0.4435938596725464, -0.26582008600234985, -0.08804634213447571, 0.08972740173339844, 0.26750117540359497, 0.4452749490737915, 0.6230486631393433, 0.8008224964141846, 0.9785962104797363, 1.156369924545288, 1.3341437578201294, 1.5119174718856812, 1.6896913051605225, 1.8674650192260742, 2.045238733291626, 2.2230124473571777, 2.4007863998413086, 2.5785601139068604, 2.756333827972412, 2.934107780456543, 3.1118814945220947, 3.2896552085876465, 3.4674289226531982, 3.64520263671875, 3.8229763507843018, 4.0007500648498535, 4.178524017333984, 4.356297492980957, 4.534071445465088, 4.711845397949219, 4.889618873596191, 5.067392826080322, 5.245166301727295, 5.422940254211426, 5.600713729858398, 5.778487682342529, 5.956261157989502, 6.134035110473633, 6.3118085861206055, 6.489582538604736, 6.667356491088867]}, "eval/loss": 4.671250343322754, "eval/wer": 1.9355811186037286, "eval/runtime": 785.3163, "eval/samples_per_second": 3.364, "eval/steps_per_second": 0.281} \ No newline at end of file