{"train/loss": 5.5014, "train/learning_rate": 9.94e-05, "train/epoch": 0.49, "train/global_step": 500, "_runtime": 2323, "_timestamp": 1646202879, "_step": 499, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 12.0, 14.0, 54.0, 159.0, 427.0, 210.0, 70.0, 34.0, 18.0, 9.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-137.7477569580078, -119.74454498291016, -101.7413330078125, -83.73812103271484, -65.73490905761719, -47.73169708251953, -29.728485107421875, -11.725273132324219, 6.2779388427734375, 24.281150817871094, 42.28436279296875, 60.287574768066406, 78.29078674316406, 96.29399871826172, 114.29721069335938, 132.3004150390625, 150.3036346435547, 168.30685424804688, 186.31005859375, 204.31326293945312, 222.3164825439453, 240.3197021484375, 258.3229064941406, 276.32611083984375, 294.329345703125, 312.3325500488281, 330.33575439453125, 348.3389892578125, 366.3421936035156, 384.34539794921875, 402.3486328125, 420.3518371582031, 438.35498046875, 456.3581848144531, 474.36138916015625, 492.3646240234375, 510.3678283691406, 528.3710327148438, 546.374267578125, 564.37744140625, 582.3806762695312, 600.3839111328125, 618.3870849609375, 636.3903198242188, 654.3935546875, 672.396728515625, 690.3999633789062, 708.4031372070312, 726.4063720703125, 744.4096069335938, 762.4127807617188, 780.416015625, 798.419189453125, 816.4224243164062, 834.4256591796875, 852.4288330078125, 870.4320678710938, 888.435302734375, 906.4384765625, 924.4417114257812, 942.4449462890625, 960.4481201171875, 978.4513549804688, 996.4545288085938, 1014.457763671875]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 5.0, 2.0, 2.0, 2.0, 6.0, 8.0, 10.0, 5.0, 11.0, 21.0, 15.0, 15.0, 22.0, 24.0, 27.0, 19.0, 40.0, 26.0, 29.0, 35.0, 34.0, 38.0, 44.0, 27.0, 54.0, 50.0, 46.0, 40.0, 39.0, 29.0, 34.0, 30.0, 31.0, 22.0, 18.0, 23.0, 24.0, 12.0, 17.0, 18.0, 9.0, 7.0, 13.0, 6.0, 7.0, 1.0, 2.0, 3.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-428.36077880859375, -414.86602783203125, -401.3713073730469, -387.8765563964844, -374.3818054199219, -360.8870849609375, -347.392333984375, -333.8975830078125, -320.40283203125, -306.9080810546875, -293.4133605957031, -279.9186096191406, -266.4238586425781, -252.9291229248047, -239.43438720703125, -225.93963623046875, -212.44491577148438, -198.95018005371094, -185.45542907714844, -171.960693359375, -158.4659423828125, -144.97120666503906, -131.47647094726562, -117.98172760009766, -104.48698425292969, -90.99224090576172, -77.49749755859375, -64.00276184082031, -50.508018493652344, -37.013275146484375, -23.518539428710938, -10.023796081542969, 3.470916748046875, 16.96565818786621, 30.460399627685547, 43.95513916015625, 57.44988250732422, 70.94462585449219, 84.43936157226562, 97.9341049194336, 111.42884826660156, 124.92359161376953, 138.4183349609375, 151.91307067871094, 165.40780639648438, 178.90255737304688, 192.3972930908203, 205.89202880859375, 219.38677978515625, 232.8815155029297, 246.3762664794922, 259.8710021972656, 273.3657531738281, 286.8604736328125, 300.355224609375, 313.8499755859375, 327.3447265625, 340.8394775390625, 354.3341979980469, 367.8289489746094, 381.3236999511719, 394.81842041015625, 408.31317138671875, 421.80792236328125, 435.3026428222656]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 7.0, 3.0, 7.0, 10.0, 18.0, 17.0, 23.0, 20.0, 32.0, 32.0, 28.0, 48.0, 42.0, 43.0, 51.0, 56.0, 41.0, 70.0, 63.0, 50.0, 40.0, 51.0, 38.0, 39.0, 22.0, 32.0, 31.0, 17.0, 12.0, 14.0, 15.0, 6.0, 7.0, 5.0, 4.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-26.6875, -25.923828125, -25.16015625, -24.396484375, -23.6328125, -22.869140625, -22.10546875, -21.341796875, -20.578125, -19.814453125, -19.05078125, -18.287109375, -17.5234375, -16.759765625, -15.99609375, -15.232421875, -14.46875, -13.705078125, -12.94140625, -12.177734375, -11.4140625, -10.650390625, -9.88671875, -9.123046875, -8.359375, -7.595703125, -6.83203125, -6.068359375, -5.3046875, -4.541015625, -3.77734375, -3.013671875, -2.25, -1.486328125, -0.72265625, 0.041015625, 0.8046875, 1.568359375, 2.33203125, 3.095703125, 3.859375, 4.623046875, 5.38671875, 6.150390625, 6.9140625, 7.677734375, 8.44140625, 9.205078125, 9.96875, 10.732421875, 11.49609375, 12.259765625, 13.0234375, 13.787109375, 14.55078125, 15.314453125, 16.078125, 16.841796875, 17.60546875, 18.369140625, 19.1328125, 19.896484375, 20.66015625, 21.423828125, 22.1875]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 1.0, 5.0, 6.0, 8.0, 11.0, 19.0, 18.0, 23.0, 40.0, 43.0, 79.0, 79.0, 163.0, 211.0, 281.0, 448.0, 692.0, 1070.0, 1834.0, 3454.0, 7373.0, 17263.0, 55457.0, 2888956.0, 1146331.0, 42617.0, 14359.0, 6125.0, 3010.0, 1564.0, 958.0, 551.0, 396.0, 252.0, 180.0, 111.0, 94.0, 54.0, 46.0, 27.0, 21.0, 16.0, 14.0, 8.0, 4.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 3.0, 2.0], "bins": [-123.375, -119.83984375, -116.3046875, -112.76953125, -109.234375, -105.69921875, -102.1640625, -98.62890625, -95.09375, -91.55859375, -88.0234375, -84.48828125, -80.953125, -77.41796875, -73.8828125, -70.34765625, -66.8125, -63.27734375, -59.7421875, -56.20703125, -52.671875, -49.13671875, -45.6015625, -42.06640625, -38.53125, -34.99609375, -31.4609375, -27.92578125, -24.390625, -20.85546875, -17.3203125, -13.78515625, -10.25, -6.71484375, -3.1796875, 0.35546875, 3.890625, 7.42578125, 10.9609375, 14.49609375, 18.03125, 21.56640625, 25.1015625, 28.63671875, 32.171875, 35.70703125, 39.2421875, 42.77734375, 46.3125, 49.84765625, 53.3828125, 56.91796875, 60.453125, 63.98828125, 67.5234375, 71.05859375, 74.59375, 78.12890625, 81.6640625, 85.19921875, 88.734375, 92.26953125, 95.8046875, 99.33984375, 102.875]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 8.0, 2.0, 11.0, 8.0, 7.0, 9.0, 12.0, 22.0, 36.0, 50.0, 77.0, 120.0, 298.0, 962.0, 1501.0, 504.0, 159.0, 71.0, 69.0, 43.0, 27.0, 27.0, 10.0, 18.0, 10.0, 5.0, 6.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-133.625, -129.341796875, -125.05859375, -120.775390625, -116.4921875, -112.208984375, -107.92578125, -103.642578125, -99.359375, -95.076171875, -90.79296875, -86.509765625, -82.2265625, -77.943359375, -73.66015625, -69.376953125, -65.09375, -60.810546875, -56.52734375, -52.244140625, -47.9609375, -43.677734375, -39.39453125, -35.111328125, -30.828125, -26.544921875, -22.26171875, -17.978515625, -13.6953125, -9.412109375, -5.12890625, -0.845703125, 3.4375, 7.720703125, 12.00390625, 16.287109375, 20.5703125, 24.853515625, 29.13671875, 33.419921875, 37.703125, 41.986328125, 46.26953125, 50.552734375, 54.8359375, 59.119140625, 63.40234375, 67.685546875, 71.96875, 76.251953125, 80.53515625, 84.818359375, 89.1015625, 93.384765625, 97.66796875, 101.951171875, 106.234375, 110.517578125, 114.80078125, 119.083984375, 123.3671875, 127.650390625, 131.93359375, 136.216796875, 140.5]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 3.0, 5.0, 11.0, 9.0, 14.0, 22.0, 23.0, 21.0, 31.0, 62.0, 101.0, 154.0, 349.0, 1082.0, 6044.0, 89072.0, 4053568.0, 38605.0, 3558.0, 789.0, 303.0, 152.0, 88.0, 54.0, 51.0, 36.0, 25.0, 16.0, 10.0, 6.0, 4.0, 7.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-434.25, -420.41015625, -406.5703125, -392.73046875, -378.890625, -365.05078125, -351.2109375, -337.37109375, -323.53125, -309.69140625, -295.8515625, -282.01171875, -268.171875, -254.33203125, -240.4921875, -226.65234375, -212.8125, -198.97265625, -185.1328125, -171.29296875, -157.453125, -143.61328125, -129.7734375, -115.93359375, -102.09375, -88.25390625, -74.4140625, -60.57421875, -46.734375, -32.89453125, -19.0546875, -5.21484375, 8.625, 22.46484375, 36.3046875, 50.14453125, 63.984375, 77.82421875, 91.6640625, 105.50390625, 119.34375, 133.18359375, 147.0234375, 160.86328125, 174.703125, 188.54296875, 202.3828125, 216.22265625, 230.0625, 243.90234375, 257.7421875, 271.58203125, 285.421875, 299.26171875, 313.1015625, 326.94140625, 340.78125, 354.62109375, 368.4609375, 382.30078125, 396.140625, 409.98046875, 423.8203125, 437.66015625, 451.5]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 13.0, 43.0, 178.0, 660.0, 94.0, 19.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1595.5902099609375, -1559.6495361328125, -1523.7088623046875, -1487.768310546875, -1451.82763671875, -1415.886962890625, -1379.9462890625, -1344.005615234375, -1308.06494140625, -1272.124267578125, -1236.18359375, -1200.2430419921875, -1164.3023681640625, -1128.3616943359375, -1092.4210205078125, -1056.4803466796875, -1020.539794921875, -984.59912109375, -948.6585083007812, -912.7178344726562, -876.7772216796875, -840.8365478515625, -804.8958740234375, -768.9552001953125, -733.0145874023438, -697.0739135742188, -661.13330078125, -625.192626953125, -589.251953125, -553.3113403320312, -517.3706665039062, -481.4300231933594, -445.489501953125, -409.5488586425781, -373.60821533203125, -337.66754150390625, -301.7268981933594, -265.7862548828125, -229.84559631347656, -193.90493774414062, -157.96429443359375, -122.02364349365234, -86.08299255371094, -50.14234161376953, -14.201690673828125, 21.73895263671875, 57.67961120605469, 93.62026977539062, 129.5609130859375, 165.50155639648438, 201.4422149658203, 237.38287353515625, 273.3235168457031, 309.26416015625, 345.204833984375, 381.1454772949219, 417.08612060546875, 453.0267639160156, 488.9674072265625, 524.9080810546875, 560.8487548828125, 596.7893676757812, 632.7300415039062, 668.670654296875, 704.611328125]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 6.0, 5.0, 4.0, 7.0, 7.0, 13.0, 10.0, 16.0, 18.0, 25.0, 22.0, 24.0, 24.0, 36.0, 33.0, 30.0, 40.0, 47.0, 49.0, 61.0, 40.0, 43.0, 49.0, 50.0, 40.0, 45.0, 33.0, 28.0, 31.0, 20.0, 22.0, 24.0, 19.0, 14.0, 7.0, 10.0, 13.0, 6.0, 11.0, 13.0, 5.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-306.07330322265625, -296.5806579589844, -287.0880126953125, -277.59539794921875, -268.1027526855469, -258.610107421875, -249.1174774169922, -239.62484741210938, -230.1322021484375, -220.63955688476562, -211.1469268798828, -201.654296875, -192.16165161132812, -182.66900634765625, -173.17637634277344, -163.68374633789062, -154.19110107421875, -144.69845581054688, -135.20582580566406, -125.71318817138672, -116.22055053710938, -106.72791290283203, -97.23527526855469, -87.74263763427734, -78.25, -68.75736236572266, -59.26472473144531, -49.77208709716797, -40.279449462890625, -30.78681182861328, -21.294174194335938, -11.801536560058594, -2.308868408203125, 7.183769226074219, 16.676406860351562, 26.169044494628906, 35.66168212890625, 45.154319763183594, 54.64695739746094, 64.13959503173828, 73.63223266601562, 83.12487030029297, 92.61750793457031, 102.11014556884766, 111.602783203125, 121.09542083740234, 130.5880584716797, 140.0806884765625, 149.57333374023438, 159.06597900390625, 168.55860900878906, 178.05123901367188, 187.54388427734375, 197.03652954101562, 206.52915954589844, 216.02178955078125, 225.51443481445312, 235.007080078125, 244.4997100830078, 253.99234008789062, 263.4849853515625, 272.9776306152344, 282.47027587890625, 291.962890625, 301.4555358886719]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 7.0, 6.0, 5.0, 13.0, 8.0, 22.0, 16.0, 20.0, 21.0, 31.0, 28.0, 33.0, 41.0, 48.0, 49.0, 69.0, 47.0, 60.0, 43.0, 52.0, 47.0, 45.0, 55.0, 42.0, 35.0, 27.0, 26.0, 15.0, 24.0, 17.0, 7.0, 14.0, 9.0, 7.0, 6.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-29.671875, -28.8642578125, -28.056640625, -27.2490234375, -26.44140625, -25.6337890625, -24.826171875, -24.0185546875, -23.2109375, -22.4033203125, -21.595703125, -20.7880859375, -19.98046875, -19.1728515625, -18.365234375, -17.5576171875, -16.75, -15.9423828125, -15.134765625, -14.3271484375, -13.51953125, -12.7119140625, -11.904296875, -11.0966796875, -10.2890625, -9.4814453125, -8.673828125, -7.8662109375, -7.05859375, -6.2509765625, -5.443359375, -4.6357421875, -3.828125, -3.0205078125, -2.212890625, -1.4052734375, -0.59765625, 0.2099609375, 1.017578125, 1.8251953125, 2.6328125, 3.4404296875, 4.248046875, 5.0556640625, 5.86328125, 6.6708984375, 7.478515625, 8.2861328125, 9.09375, 9.9013671875, 10.708984375, 11.5166015625, 12.32421875, 13.1318359375, 13.939453125, 14.7470703125, 15.5546875, 16.3623046875, 17.169921875, 17.9775390625, 18.78515625, 19.5927734375, 20.400390625, 21.2080078125, 22.015625]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 5.0, 9.0, 10.0, 19.0, 17.0, 24.0, 31.0, 50.0, 75.0, 90.0, 152.0, 218.0, 383.0, 550.0, 986.0, 1489.0, 2417.0, 3966.0, 6795.0, 11216.0, 19512.0, 35146.0, 68001.0, 148036.0, 323843.0, 221834.0, 95431.0, 46596.0, 25463.0, 14614.0, 8438.0, 4941.0, 3020.0, 1893.0, 1145.0, 735.0, 468.0, 295.0, 219.0, 147.0, 86.0, 65.0, 37.0, 23.0, 19.0, 10.0, 7.0, 12.0, 4.0, 4.0, 2.0, 6.0, 2.0, 2.0], "bins": [-1.3671875, -1.32781982421875, -1.2884521484375, -1.24908447265625, -1.209716796875, -1.17034912109375, -1.1309814453125, -1.09161376953125, -1.05224609375, -1.01287841796875, -0.9735107421875, -0.93414306640625, -0.894775390625, -0.85540771484375, -0.8160400390625, -0.77667236328125, -0.7373046875, -0.69793701171875, -0.6585693359375, -0.61920166015625, -0.579833984375, -0.54046630859375, -0.5010986328125, -0.46173095703125, -0.42236328125, -0.38299560546875, -0.3436279296875, -0.30426025390625, -0.264892578125, -0.22552490234375, -0.1861572265625, -0.14678955078125, -0.107421875, -0.06805419921875, -0.0286865234375, 0.01068115234375, 0.050048828125, 0.08941650390625, 0.1287841796875, 0.16815185546875, 0.20751953125, 0.24688720703125, 0.2862548828125, 0.32562255859375, 0.364990234375, 0.40435791015625, 0.4437255859375, 0.48309326171875, 0.5224609375, 0.56182861328125, 0.6011962890625, 0.64056396484375, 0.679931640625, 0.71929931640625, 0.7586669921875, 0.79803466796875, 0.83740234375, 0.87677001953125, 0.9161376953125, 0.95550537109375, 0.994873046875, 1.03424072265625, 1.0736083984375, 1.11297607421875, 1.15234375]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 0.0, 1.0, 4.0, 2.0, 10.0, 4.0, 4.0, 7.0, 8.0, 11.0, 14.0, 15.0, 20.0, 16.0, 11.0, 20.0, 31.0, 27.0, 24.0, 29.0, 28.0, 37.0, 28.0, 35.0, 45.0, 37.0, 43.0, 1054.0, 40.0, 32.0, 37.0, 41.0, 29.0, 22.0, 26.0, 37.0, 31.0, 23.0, 19.0, 28.0, 11.0, 9.0, 14.0, 20.0, 11.0, 12.0, 3.0, 7.0, 7.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-12.421875, -12.01904296875, -11.6162109375, -11.21337890625, -10.810546875, -10.40771484375, -10.0048828125, -9.60205078125, -9.19921875, -8.79638671875, -8.3935546875, -7.99072265625, -7.587890625, -7.18505859375, -6.7822265625, -6.37939453125, -5.9765625, -5.57373046875, -5.1708984375, -4.76806640625, -4.365234375, -3.96240234375, -3.5595703125, -3.15673828125, -2.75390625, -2.35107421875, -1.9482421875, -1.54541015625, -1.142578125, -0.73974609375, -0.3369140625, 0.06591796875, 0.46875, 0.87158203125, 1.2744140625, 1.67724609375, 2.080078125, 2.48291015625, 2.8857421875, 3.28857421875, 3.69140625, 4.09423828125, 4.4970703125, 4.89990234375, 5.302734375, 5.70556640625, 6.1083984375, 6.51123046875, 6.9140625, 7.31689453125, 7.7197265625, 8.12255859375, 8.525390625, 8.92822265625, 9.3310546875, 9.73388671875, 10.13671875, 10.53955078125, 10.9423828125, 11.34521484375, 11.748046875, 12.15087890625, 12.5537109375, 12.95654296875, 13.359375]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 6.0, 5.0, 8.0, 15.0, 15.0, 26.0, 29.0, 44.0, 71.0, 96.0, 163.0, 225.0, 324.0, 448.0, 694.0, 1029.0, 1628.0, 2482.0, 3821.0, 5799.0, 9377.0, 14857.0, 24339.0, 40531.0, 73002.0, 145234.0, 1327772.0, 214938.0, 96798.0, 52180.0, 30687.0, 18316.0, 11561.0, 7386.0, 4648.0, 2899.0, 1949.0, 1271.0, 834.0, 549.0, 353.0, 243.0, 157.0, 110.0, 77.0, 38.0, 38.0, 21.0, 11.0, 16.0, 11.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.0537109375, -1.0194091796875, -0.985107421875, -0.9508056640625, -0.91650390625, -0.8822021484375, -0.847900390625, -0.8135986328125, -0.779296875, -0.7449951171875, -0.710693359375, -0.6763916015625, -0.64208984375, -0.6077880859375, -0.573486328125, -0.5391845703125, -0.5048828125, -0.4705810546875, -0.436279296875, -0.4019775390625, -0.36767578125, -0.3333740234375, -0.299072265625, -0.2647705078125, -0.23046875, -0.1961669921875, -0.161865234375, -0.1275634765625, -0.09326171875, -0.0589599609375, -0.024658203125, 0.0096435546875, 0.0439453125, 0.0782470703125, 0.112548828125, 0.1468505859375, 0.18115234375, 0.2154541015625, 0.249755859375, 0.2840576171875, 0.318359375, 0.3526611328125, 0.386962890625, 0.4212646484375, 0.45556640625, 0.4898681640625, 0.524169921875, 0.5584716796875, 0.5927734375, 0.6270751953125, 0.661376953125, 0.6956787109375, 0.72998046875, 0.7642822265625, 0.798583984375, 0.8328857421875, 0.8671875, 0.9014892578125, 0.935791015625, 0.9700927734375, 1.00439453125, 1.0386962890625, 1.072998046875, 1.1072998046875, 1.1416015625]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 7.0, 5.0, 5.0, 7.0, 8.0, 14.0, 17.0, 10.0, 22.0, 29.0, 39.0, 41.0, 48.0, 62.0, 51.0, 65.0, 71.0, 81.0, 84.0, 58.0, 55.0, 45.0, 44.0, 30.0, 19.0, 25.0, 15.0, 7.0, 10.0, 6.0, 6.0, 4.0, 10.0, 5.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.015716552734375, -0.015219926834106445, -0.01472330093383789, -0.014226675033569336, -0.013730049133300781, -0.013233423233032227, -0.012736797332763672, -0.012240171432495117, -0.011743545532226562, -0.011246919631958008, -0.010750293731689453, -0.010253667831420898, -0.009757041931152344, -0.009260416030883789, -0.008763790130615234, -0.00826716423034668, -0.007770538330078125, -0.00727391242980957, -0.006777286529541016, -0.006280660629272461, -0.005784034729003906, -0.0052874088287353516, -0.004790782928466797, -0.004294157028198242, -0.0037975311279296875, -0.003300905227661133, -0.002804279327392578, -0.0023076534271240234, -0.0018110275268554688, -0.001314401626586914, -0.0008177757263183594, -0.0003211498260498047, 0.00017547607421875, 0.0006721019744873047, 0.0011687278747558594, 0.001665353775024414, 0.0021619796752929688, 0.0026586055755615234, 0.003155231475830078, 0.003651857376098633, 0.0041484832763671875, 0.004645109176635742, 0.005141735076904297, 0.0056383609771728516, 0.006134986877441406, 0.006631612777709961, 0.007128238677978516, 0.00762486457824707, 0.008121490478515625, 0.00861811637878418, 0.009114742279052734, 0.009611368179321289, 0.010107994079589844, 0.010604619979858398, 0.011101245880126953, 0.011597871780395508, 0.012094497680664062, 0.012591123580932617, 0.013087749481201172, 0.013584375381469727, 0.014081001281738281, 0.014577627182006836, 0.01507425308227539, 0.015570878982543945, 0.0160675048828125]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 4.0, 4.0, 9.0, 10.0, 13.0, 14.0, 16.0, 33.0, 35.0, 38.0, 42.0, 65.0, 102.0, 118.0, 140.0, 194.0, 265.0, 797.0, 668427.0, 376337.0, 773.0, 258.0, 212.0, 152.0, 130.0, 75.0, 67.0, 65.0, 33.0, 28.0, 21.0, 14.0, 15.0, 14.0, 15.0, 9.0, 5.0, 2.0, 4.0, 0.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.302001953125, -0.2922554016113281, -0.28250885009765625, -0.2727622985839844, -0.2630157470703125, -0.2532691955566406, -0.24352264404296875, -0.23377609252929688, -0.224029541015625, -0.21428298950195312, -0.20453643798828125, -0.19478988647460938, -0.1850433349609375, -0.17529678344726562, -0.16555023193359375, -0.15580368041992188, -0.14605712890625, -0.13631057739257812, -0.12656402587890625, -0.11681747436523438, -0.1070709228515625, -0.09732437133789062, -0.08757781982421875, -0.07783126831054688, -0.068084716796875, -0.058338165283203125, -0.04859161376953125, -0.038845062255859375, -0.0290985107421875, -0.019351959228515625, -0.00960540771484375, 0.000141143798828125, 0.0098876953125, 0.019634246826171875, 0.02938079833984375, 0.039127349853515625, 0.0488739013671875, 0.058620452880859375, 0.06836700439453125, 0.07811355590820312, 0.087860107421875, 0.09760665893554688, 0.10735321044921875, 0.11709976196289062, 0.1268463134765625, 0.13659286499023438, 0.14633941650390625, 0.15608596801757812, 0.16583251953125, 0.17557907104492188, 0.18532562255859375, 0.19507217407226562, 0.2048187255859375, 0.21456527709960938, 0.22431182861328125, 0.23405838012695312, 0.243804931640625, 0.2535514831542969, 0.26329803466796875, 0.2730445861816406, 0.2827911376953125, 0.2925376892089844, 0.30228424072265625, 0.3120307922363281, 0.32177734375]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 844.0, 170.0], "bins": [-0.2517983019351959, -0.24779370427131653, -0.24378910660743713, -0.23978449404239655, -0.23577989637851715, -0.23177529871463776, -0.22777068614959717, -0.22376608848571777, -0.21976149082183838, -0.21575689315795898, -0.2117522954940796, -0.207747682929039, -0.2037430852651596, -0.1997384876012802, -0.19573387503623962, -0.19172927737236023, -0.18772467970848083, -0.18372008204460144, -0.17971548438072205, -0.17571087181568146, -0.17170627415180206, -0.16770167648792267, -0.16369706392288208, -0.15969246625900269, -0.1556878685951233, -0.1516832709312439, -0.1476786732673645, -0.1436740607023239, -0.13966946303844452, -0.13566486537456512, -0.13166025280952454, -0.12765565514564514, -0.12365106493234634, -0.11964645981788635, -0.11564186215400696, -0.11163726449012756, -0.10763265937566757, -0.10362805426120758, -0.09962345659732819, -0.09561885893344879, -0.0916142538189888, -0.08760964870452881, -0.08360505104064941, -0.07960045337677002, -0.07559584826231003, -0.07159124314785004, -0.06758664548397064, -0.06358204782009125, -0.059577446430921555, -0.05557284504175186, -0.05156824365258217, -0.047563642263412476, -0.04355904087424278, -0.03955443948507309, -0.0355498380959034, -0.031545236706733704, -0.02754063531756401, -0.023536033928394318, -0.019531432539224625, -0.015526831150054932, -0.011522229760885239, -0.007517628371715546, -0.0035130269825458527, 0.0004915744066238403, 0.004496176727116108]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 9.0, 9.0, 7.0, 18.0, 17.0, 30.0, 54.0, 51.0, 53.0, 59.0, 72.0, 88.0, 79.0, 83.0, 83.0, 68.0, 53.0, 40.0, 49.0, 27.0, 25.0, 15.0, 11.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.013592243194580078, -0.013156288303434849, -0.01272033341228962, -0.01228437852114439, -0.01184842362999916, -0.011412468738853931, -0.010976513847708702, -0.010540558956563473, -0.010104604065418243, -0.009668649174273014, -0.009232694283127785, -0.008796739391982555, -0.008360784500837326, -0.007924829609692097, -0.007488874718546867, -0.007052919827401638, -0.006616964936256409, -0.006181010045111179, -0.00574505515396595, -0.005309100262820721, -0.004873145371675491, -0.004437190480530262, -0.004001235589385033, -0.0035652806982398033, -0.003129325807094574, -0.0026933709159493446, -0.0022574160248041153, -0.001821461133658886, -0.0013855062425136566, -0.0009495513513684273, -0.0005135964602231979, -7.76415690779686e-05, 0.00035831332206726074, 0.0007942682132124901, 0.0012302231043577194, 0.0016661779955029488, 0.002102132886648178, 0.0025380877777934074, 0.0029740426689386368, 0.003409997560083866, 0.0038459524512290955, 0.004281907342374325, 0.004717862233519554, 0.0051538171246647835, 0.005589772015810013, 0.006025726906955242, 0.0064616817981004715, 0.006897636689245701, 0.00733359158039093, 0.0077695464715361595, 0.008205501362681389, 0.008641456253826618, 0.009077411144971848, 0.009513366036117077, 0.009949320927262306, 0.010385275818407536, 0.010821230709552765, 0.011257185600697994, 0.011693140491843224, 0.012129095382988453, 0.012565050274133682, 0.013001005165278912, 0.013436960056424141, 0.01387291494756937, 0.0143088698387146]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 7.0, 6.0, 5.0, 13.0, 8.0, 22.0, 16.0, 20.0, 21.0, 31.0, 28.0, 33.0, 41.0, 48.0, 49.0, 69.0, 47.0, 60.0, 43.0, 52.0, 47.0, 45.0, 55.0, 42.0, 35.0, 27.0, 26.0, 15.0, 24.0, 17.0, 7.0, 14.0, 9.0, 7.0, 6.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-29.671875, -28.8642578125, -28.056640625, -27.2490234375, -26.44140625, -25.6337890625, -24.826171875, -24.0185546875, -23.2109375, -22.4033203125, -21.595703125, -20.7880859375, -19.98046875, -19.1728515625, -18.365234375, -17.5576171875, -16.75, -15.9423828125, -15.134765625, -14.3271484375, -13.51953125, -12.7119140625, -11.904296875, -11.0966796875, -10.2890625, -9.4814453125, -8.673828125, -7.8662109375, -7.05859375, -6.2509765625, -5.443359375, -4.6357421875, -3.828125, -3.0205078125, -2.212890625, -1.4052734375, -0.59765625, 0.2099609375, 1.017578125, 1.8251953125, 2.6328125, 3.4404296875, 4.248046875, 5.0556640625, 5.86328125, 6.6708984375, 7.478515625, 8.2861328125, 9.09375, 9.9013671875, 10.708984375, 11.5166015625, 12.32421875, 13.1318359375, 13.939453125, 14.7470703125, 15.5546875, 16.3623046875, 17.169921875, 17.9775390625, 18.78515625, 19.5927734375, 20.400390625, 21.2080078125, 22.015625]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 7.0, 4.0, 6.0, 12.0, 9.0, 15.0, 19.0, 29.0, 43.0, 72.0, 115.0, 173.0, 287.0, 444.0, 767.0, 1151.0, 1951.0, 3351.0, 6262.0, 13005.0, 35173.0, 171646.0, 673034.0, 94029.0, 24467.0, 10167.0, 5077.0, 2874.0, 1697.0, 981.0, 595.0, 400.0, 236.0, 143.0, 99.0, 63.0, 42.0, 39.0, 25.0, 16.0, 15.0, 11.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-86.3125, -83.9375, -81.5625, -79.1875, -76.8125, -74.4375, -72.0625, -69.6875, -67.3125, -64.9375, -62.5625, -60.1875, -57.8125, -55.4375, -53.0625, -50.6875, -48.3125, -45.9375, -43.5625, -41.1875, -38.8125, -36.4375, -34.0625, -31.6875, -29.3125, -26.9375, -24.5625, -22.1875, -19.8125, -17.4375, -15.0625, -12.6875, -10.3125, -7.9375, -5.5625, -3.1875, -0.8125, 1.5625, 3.9375, 6.3125, 8.6875, 11.0625, 13.4375, 15.8125, 18.1875, 20.5625, 22.9375, 25.3125, 27.6875, 30.0625, 32.4375, 34.8125, 37.1875, 39.5625, 41.9375, 44.3125, 46.6875, 49.0625, 51.4375, 53.8125, 56.1875, 58.5625, 60.9375, 63.3125, 65.6875]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 7.0, 7.0, 11.0, 9.0, 3.0, 17.0, 20.0, 17.0, 26.0, 29.0, 32.0, 36.0, 33.0, 56.0, 39.0, 67.0, 78.0, 312.0, 1675.0, 128.0, 48.0, 56.0, 44.0, 48.0, 37.0, 34.0, 27.0, 23.0, 20.0, 26.0, 19.0, 12.0, 10.0, 14.0, 11.0, 4.0, 3.0, 2.0, 7.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-86.0, -83.5537109375, -81.107421875, -78.6611328125, -76.21484375, -73.7685546875, -71.322265625, -68.8759765625, -66.4296875, -63.9833984375, -61.537109375, -59.0908203125, -56.64453125, -54.1982421875, -51.751953125, -49.3056640625, -46.859375, -44.4130859375, -41.966796875, -39.5205078125, -37.07421875, -34.6279296875, -32.181640625, -29.7353515625, -27.2890625, -24.8427734375, -22.396484375, -19.9501953125, -17.50390625, -15.0576171875, -12.611328125, -10.1650390625, -7.71875, -5.2724609375, -2.826171875, -0.3798828125, 2.06640625, 4.5126953125, 6.958984375, 9.4052734375, 11.8515625, 14.2978515625, 16.744140625, 19.1904296875, 21.63671875, 24.0830078125, 26.529296875, 28.9755859375, 31.421875, 33.8681640625, 36.314453125, 38.7607421875, 41.20703125, 43.6533203125, 46.099609375, 48.5458984375, 50.9921875, 53.4384765625, 55.884765625, 58.3310546875, 60.77734375, 63.2236328125, 65.669921875, 68.1162109375, 70.5625]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 8.0, 2.0, 5.0, 3.0, 7.0, 11.0, 10.0, 13.0, 19.0, 20.0, 18.0, 20.0, 28.0, 32.0, 48.0, 73.0, 84.0, 172.0, 567.0, 6762.0, 3123705.0, 12929.0, 632.0, 172.0, 89.0, 69.0, 33.0, 40.0, 22.0, 21.0, 21.0, 13.0, 18.0, 9.0, 5.0, 10.0, 9.0, 3.0, 3.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-331.25, -319.6484375, -308.046875, -296.4453125, -284.84375, -273.2421875, -261.640625, -250.0390625, -238.4375, -226.8359375, -215.234375, -203.6328125, -192.03125, -180.4296875, -168.828125, -157.2265625, -145.625, -134.0234375, -122.421875, -110.8203125, -99.21875, -87.6171875, -76.015625, -64.4140625, -52.8125, -41.2109375, -29.609375, -18.0078125, -6.40625, 5.1953125, 16.796875, 28.3984375, 40.0, 51.6015625, 63.203125, 74.8046875, 86.40625, 98.0078125, 109.609375, 121.2109375, 132.8125, 144.4140625, 156.015625, 167.6171875, 179.21875, 190.8203125, 202.421875, 214.0234375, 225.625, 237.2265625, 248.828125, 260.4296875, 272.03125, 283.6328125, 295.234375, 306.8359375, 318.4375, 330.0390625, 341.640625, 353.2421875, 364.84375, 376.4453125, 388.046875, 399.6484375, 411.25]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [969.0, 50.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.86767578125, 15.905780792236328, 76.67923736572266, 137.45269775390625, 198.2261505126953, 258.9996032714844, 319.7730712890625, 380.5465087890625, 441.3199768066406, 502.09344482421875, 562.8668823242188, 623.640380859375, 684.413818359375, 745.187255859375, 805.960693359375, 866.734130859375, 927.5076293945312, 988.2810668945312, 1049.0545654296875, 1109.8280029296875, 1170.6014404296875, 1231.3748779296875, 1292.1484375, 1352.921875, 1413.6953125, 1474.46875, 1535.2421875, 1596.015625, 1656.7891845703125, 1717.5626220703125, 1778.3360595703125, 1839.1094970703125, 1899.8829345703125, 1960.6563720703125, 2021.4298095703125, 2082.203369140625, 2142.976806640625, 2203.750244140625, 2264.523681640625, 2325.297119140625, 2386.070556640625, 2446.843994140625, 2507.617431640625, 2568.390869140625, 2629.164306640625, 2689.937744140625, 2750.71142578125, 2811.48486328125, 2872.25830078125, 2933.03173828125, 2993.80517578125, 3054.57861328125, 3115.35205078125, 3176.12548828125, 3236.89892578125, 3297.67236328125, 3358.44580078125, 3419.21923828125, 3479.99267578125, 3540.76611328125, 3601.53955078125, 3662.31298828125, 3723.08642578125, 3783.85986328125, 3844.633544921875]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 5.0, 8.0, 5.0, 6.0, 11.0, 5.0, 13.0, 23.0, 17.0, 23.0, 16.0, 28.0, 25.0, 28.0, 28.0, 25.0, 30.0, 40.0, 36.0, 45.0, 37.0, 39.0, 42.0, 37.0, 45.0, 41.0, 36.0, 49.0, 30.0, 31.0, 28.0, 26.0, 33.0, 21.0, 19.0, 16.0, 12.0, 12.0, 6.0, 7.0, 8.0, 6.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-228.02313232421875, -220.68858337402344, -213.35401916503906, -206.01947021484375, -198.68492126464844, -191.35037231445312, -184.01580810546875, -176.68125915527344, -169.34671020507812, -162.0121612548828, -154.67759704589844, -147.34304809570312, -140.0084991455078, -132.6739501953125, -125.33938598632812, -118.00483703613281, -110.67028045654297, -103.33572387695312, -96.00117492675781, -88.66661834716797, -81.33206939697266, -73.99751281738281, -66.6629638671875, -59.328407287597656, -51.99385452270508, -44.6593017578125, -37.32474899291992, -29.99019432067871, -22.655641555786133, -15.321086883544922, -7.986534118652344, -0.6519813537597656, 6.6825714111328125, 14.01712417602539, 21.35167694091797, 28.68623161315918, 36.020782470703125, 43.35533905029297, 50.68989181518555, 58.024444580078125, 65.35899353027344, 72.69355010986328, 80.0280990600586, 87.36265563964844, 94.69720458984375, 102.0317611694336, 109.36631774902344, 116.70086669921875, 124.0354232788086, 131.36997985839844, 138.70452880859375, 146.03907775878906, 153.37364196777344, 160.70819091796875, 168.04273986816406, 175.37728881835938, 182.71185302734375, 190.04640197753906, 197.38096618652344, 204.71551513671875, 212.05006408691406, 219.38461303710938, 226.71917724609375, 234.05372619628906, 241.38827514648438]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 7.0, 5.0, 10.0, 7.0, 12.0, 18.0, 25.0, 21.0, 25.0, 21.0, 37.0, 31.0, 36.0, 52.0, 56.0, 57.0, 40.0, 70.0, 39.0, 47.0, 51.0, 58.0, 43.0, 44.0, 29.0, 25.0, 25.0, 26.0, 17.0, 14.0, 15.0, 11.0, 10.0, 1.0, 6.0, 5.0, 1.0, 5.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-31.515625, -30.655029296875, -29.79443359375, -28.933837890625, -28.0732421875, -27.212646484375, -26.35205078125, -25.491455078125, -24.630859375, -23.770263671875, -22.90966796875, -22.049072265625, -21.1884765625, -20.327880859375, -19.46728515625, -18.606689453125, -17.74609375, -16.885498046875, -16.02490234375, -15.164306640625, -14.3037109375, -13.443115234375, -12.58251953125, -11.721923828125, -10.861328125, -10.000732421875, -9.14013671875, -8.279541015625, -7.4189453125, -6.558349609375, -5.69775390625, -4.837158203125, -3.9765625, -3.115966796875, -2.25537109375, -1.394775390625, -0.5341796875, 0.326416015625, 1.18701171875, 2.047607421875, 2.908203125, 3.768798828125, 4.62939453125, 5.489990234375, 6.3505859375, 7.211181640625, 8.07177734375, 8.932373046875, 9.79296875, 10.653564453125, 11.51416015625, 12.374755859375, 13.2353515625, 14.095947265625, 14.95654296875, 15.817138671875, 16.677734375, 17.538330078125, 18.39892578125, 19.259521484375, 20.1201171875, 20.980712890625, 21.84130859375, 22.701904296875, 23.5625]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 6.0, 5.0, 9.0, 8.0, 12.0, 14.0, 22.0, 25.0, 46.0, 79.0, 89.0, 154.0, 219.0, 382.0, 614.0, 1211.0, 3015.0, 8990.0, 56148.0, 4038779.0, 68760.0, 9634.0, 3113.0, 1288.0, 634.0, 354.0, 222.0, 133.0, 93.0, 68.0, 45.0, 35.0, 20.0, 18.0, 13.0, 9.0, 8.0, 2.0, 4.0, 2.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-195.875, -190.51171875, -185.1484375, -179.78515625, -174.421875, -169.05859375, -163.6953125, -158.33203125, -152.96875, -147.60546875, -142.2421875, -136.87890625, -131.515625, -126.15234375, -120.7890625, -115.42578125, -110.0625, -104.69921875, -99.3359375, -93.97265625, -88.609375, -83.24609375, -77.8828125, -72.51953125, -67.15625, -61.79296875, -56.4296875, -51.06640625, -45.703125, -40.33984375, -34.9765625, -29.61328125, -24.25, -18.88671875, -13.5234375, -8.16015625, -2.796875, 2.56640625, 7.9296875, 13.29296875, 18.65625, 24.01953125, 29.3828125, 34.74609375, 40.109375, 45.47265625, 50.8359375, 56.19921875, 61.5625, 66.92578125, 72.2890625, 77.65234375, 83.015625, 88.37890625, 93.7421875, 99.10546875, 104.46875, 109.83203125, 115.1953125, 120.55859375, 125.921875, 131.28515625, 136.6484375, 142.01171875, 147.375]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 4.0, 6.0, 7.0, 12.0, 12.0, 24.0, 32.0, 41.0, 85.0, 304.0, 1334.0, 1515.0, 388.0, 113.0, 72.0, 27.0, 40.0, 18.0, 13.0, 11.0, 9.0, 3.0, 8.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-214.375, -209.71875, -205.0625, -200.40625, -195.75, -191.09375, -186.4375, -181.78125, -177.125, -172.46875, -167.8125, -163.15625, -158.5, -153.84375, -149.1875, -144.53125, -139.875, -135.21875, -130.5625, -125.90625, -121.25, -116.59375, -111.9375, -107.28125, -102.625, -97.96875, -93.3125, -88.65625, -84.0, -79.34375, -74.6875, -70.03125, -65.375, -60.71875, -56.0625, -51.40625, -46.75, -42.09375, -37.4375, -32.78125, -28.125, -23.46875, -18.8125, -14.15625, -9.5, -4.84375, -0.1875, 4.46875, 9.125, 13.78125, 18.4375, 23.09375, 27.75, 32.40625, 37.0625, 41.71875, 46.375, 51.03125, 55.6875, 60.34375, 65.0, 69.65625, 74.3125, 78.96875, 83.625]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 4.0, 5.0, 4.0, 8.0, 10.0, 19.0, 21.0, 23.0, 24.0, 31.0, 57.0, 96.0, 170.0, 343.0, 799.0, 1953.0, 5621.0, 19156.0, 110234.0, 3896952.0, 128354.0, 20801.0, 5966.0, 2029.0, 824.0, 327.0, 162.0, 85.0, 64.0, 33.0, 28.0, 16.0, 15.0, 12.0, 11.0, 0.0, 8.0, 6.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-181.75, -174.8984375, -168.046875, -161.1953125, -154.34375, -147.4921875, -140.640625, -133.7890625, -126.9375, -120.0859375, -113.234375, -106.3828125, -99.53125, -92.6796875, -85.828125, -78.9765625, -72.125, -65.2734375, -58.421875, -51.5703125, -44.71875, -37.8671875, -31.015625, -24.1640625, -17.3125, -10.4609375, -3.609375, 3.2421875, 10.09375, 16.9453125, 23.796875, 30.6484375, 37.5, 44.3515625, 51.203125, 58.0546875, 64.90625, 71.7578125, 78.609375, 85.4609375, 92.3125, 99.1640625, 106.015625, 112.8671875, 119.71875, 126.5703125, 133.421875, 140.2734375, 147.125, 153.9765625, 160.828125, 167.6796875, 174.53125, 181.3828125, 188.234375, 195.0859375, 201.9375, 208.7890625, 215.640625, 222.4921875, 229.34375, 236.1953125, 243.046875, 249.8984375, 256.75]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 25.0, 126.0, 610.0, 192.0, 46.0, 8.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1158.3404541015625, -1119.2901611328125, -1080.2398681640625, -1041.189453125, -1002.13916015625, -963.0888671875, -924.03857421875, -884.98828125, -845.9379272460938, -806.8876342773438, -767.8372802734375, -728.7869873046875, -689.7366943359375, -650.6863403320312, -611.6360473632812, -572.585693359375, -533.535400390625, -494.4850769042969, -455.43475341796875, -416.38446044921875, -377.3341369628906, -338.2838134765625, -299.2335205078125, -260.1831970214844, -221.13287353515625, -182.08255004882812, -143.03224182128906, -103.98192596435547, -64.93161010742188, -25.88128662109375, 13.169021606445312, 52.219329833984375, 91.269775390625, 130.32009887695312, 169.3704071044922, 208.42071533203125, 247.47103881835938, 286.5213623046875, 325.5716552734375, 364.6219787597656, 403.67230224609375, 442.7226257324219, 481.77294921875, 520.8232421875, 559.87353515625, 598.9238891601562, 637.9741821289062, 677.0245361328125, 716.0748291015625, 755.1251220703125, 794.1754760742188, 833.2257690429688, 872.276123046875, 911.326416015625, 950.376708984375, 989.427001953125, 1028.477294921875, 1067.527587890625, 1106.577880859375, 1145.6282958984375, 1184.6785888671875, 1223.7288818359375, 1262.7791748046875, 1301.8294677734375, 1340.8798828125]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 3.0, 7.0, 5.0, 10.0, 7.0, 15.0, 11.0, 13.0, 15.0, 27.0, 35.0, 33.0, 40.0, 42.0, 38.0, 48.0, 40.0, 42.0, 36.0, 51.0, 43.0, 51.0, 45.0, 44.0, 43.0, 41.0, 38.0, 31.0, 22.0, 27.0, 13.0, 15.0, 15.0, 12.0, 12.0, 7.0, 8.0, 6.0, 6.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-227.433837890625, -219.14378356933594, -210.8537139892578, -202.56365966796875, -194.27359008789062, -185.98353576660156, -177.6934814453125, -169.40341186523438, -161.11334228515625, -152.8232879638672, -144.53321838378906, -136.2431640625, -127.95309448242188, -119.66304016113281, -111.37297821044922, -103.08291625976562, -94.79286193847656, -86.50279998779297, -78.21273803710938, -69.92268371582031, -61.63261795043945, -53.34255599975586, -45.05249786376953, -36.76243591308594, -28.472373962402344, -20.18231201171875, -11.892251968383789, -3.602191925048828, 4.687870025634766, 12.97793197631836, 21.267990112304688, 29.55805206298828, 37.848114013671875, 46.13817596435547, 54.42823791503906, 62.71829605102539, 71.00836181640625, 79.29841613769531, 87.5884780883789, 95.8785400390625, 104.1686019897461, 112.45866394042969, 120.74872589111328, 129.03878784179688, 137.32884216308594, 145.61891174316406, 153.90896606445312, 162.19903564453125, 170.4890899658203, 178.77914428710938, 187.0692138671875, 195.35926818847656, 203.6493377685547, 211.93939208984375, 220.22946166992188, 228.51951599121094, 236.8095703125, 245.09962463378906, 253.3896942138672, 261.67974853515625, 269.9698181152344, 278.2598876953125, 286.5499267578125, 294.8399963378906, 303.13006591796875]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 7.0, 14.0, 7.0, 23.0, 17.0, 14.0, 23.0, 22.0, 40.0, 43.0, 36.0, 41.0, 43.0, 50.0, 58.0, 48.0, 54.0, 59.0, 56.0, 48.0, 48.0, 33.0, 46.0, 28.0, 25.0, 22.0, 25.0, 12.0, 15.0, 13.0, 8.0, 9.0, 3.0, 2.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.75, -32.788818359375, -31.82763671875, -30.866455078125, -29.9052734375, -28.944091796875, -27.98291015625, -27.021728515625, -26.060546875, -25.099365234375, -24.13818359375, -23.177001953125, -22.2158203125, -21.254638671875, -20.29345703125, -19.332275390625, -18.37109375, -17.409912109375, -16.44873046875, -15.487548828125, -14.5263671875, -13.565185546875, -12.60400390625, -11.642822265625, -10.681640625, -9.720458984375, -8.75927734375, -7.798095703125, -6.8369140625, -5.875732421875, -4.91455078125, -3.953369140625, -2.9921875, -2.031005859375, -1.06982421875, -0.108642578125, 0.8525390625, 1.813720703125, 2.77490234375, 3.736083984375, 4.697265625, 5.658447265625, 6.61962890625, 7.580810546875, 8.5419921875, 9.503173828125, 10.46435546875, 11.425537109375, 12.38671875, 13.347900390625, 14.30908203125, 15.270263671875, 16.2314453125, 17.192626953125, 18.15380859375, 19.114990234375, 20.076171875, 21.037353515625, 21.99853515625, 22.959716796875, 23.9208984375, 24.882080078125, 25.84326171875, 26.804443359375, 27.765625]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 4.0, 6.0, 13.0, 19.0, 31.0, 32.0, 42.0, 69.0, 86.0, 126.0, 183.0, 296.0, 419.0, 661.0, 1106.0, 1813.0, 3138.0, 5270.0, 8793.0, 15012.0, 26838.0, 49970.0, 100179.0, 233324.0, 318161.0, 137384.0, 65255.0, 34164.0, 19064.0, 10901.0, 6391.0, 3716.0, 2314.0, 1372.0, 848.0, 524.0, 345.0, 226.0, 130.0, 106.0, 65.0, 46.0, 37.0, 29.0, 9.0, 14.0, 7.0, 7.0, 5.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.474609375, -1.42578125, -1.376953125, -1.328125, -1.279296875, -1.23046875, -1.181640625, -1.1328125, -1.083984375, -1.03515625, -0.986328125, -0.9375, -0.888671875, -0.83984375, -0.791015625, -0.7421875, -0.693359375, -0.64453125, -0.595703125, -0.546875, -0.498046875, -0.44921875, -0.400390625, -0.3515625, -0.302734375, -0.25390625, -0.205078125, -0.15625, -0.107421875, -0.05859375, -0.009765625, 0.0390625, 0.087890625, 0.13671875, 0.185546875, 0.234375, 0.283203125, 0.33203125, 0.380859375, 0.4296875, 0.478515625, 0.52734375, 0.576171875, 0.625, 0.673828125, 0.72265625, 0.771484375, 0.8203125, 0.869140625, 0.91796875, 0.966796875, 1.015625, 1.064453125, 1.11328125, 1.162109375, 1.2109375, 1.259765625, 1.30859375, 1.357421875, 1.40625, 1.455078125, 1.50390625, 1.552734375, 1.6015625, 1.650390625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 6.0, 3.0, 6.0, 9.0, 7.0, 17.0, 12.0, 19.0, 26.0, 34.0, 27.0, 32.0, 25.0, 42.0, 38.0, 56.0, 45.0, 31.0, 42.0, 34.0, 1070.0, 46.0, 44.0, 41.0, 33.0, 40.0, 29.0, 35.0, 36.0, 22.0, 24.0, 23.0, 15.0, 17.0, 10.0, 11.0, 3.0, 12.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.65625, -16.1025390625, -15.548828125, -14.9951171875, -14.44140625, -13.8876953125, -13.333984375, -12.7802734375, -12.2265625, -11.6728515625, -11.119140625, -10.5654296875, -10.01171875, -9.4580078125, -8.904296875, -8.3505859375, -7.796875, -7.2431640625, -6.689453125, -6.1357421875, -5.58203125, -5.0283203125, -4.474609375, -3.9208984375, -3.3671875, -2.8134765625, -2.259765625, -1.7060546875, -1.15234375, -0.5986328125, -0.044921875, 0.5087890625, 1.0625, 1.6162109375, 2.169921875, 2.7236328125, 3.27734375, 3.8310546875, 4.384765625, 4.9384765625, 5.4921875, 6.0458984375, 6.599609375, 7.1533203125, 7.70703125, 8.2607421875, 8.814453125, 9.3681640625, 9.921875, 10.4755859375, 11.029296875, 11.5830078125, 12.13671875, 12.6904296875, 13.244140625, 13.7978515625, 14.3515625, 14.9052734375, 15.458984375, 16.0126953125, 16.56640625, 17.1201171875, 17.673828125, 18.2275390625, 18.78125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 9.0, 7.0, 7.0, 15.0, 18.0, 34.0, 48.0, 57.0, 97.0, 170.0, 265.0, 393.0, 660.0, 1038.0, 1743.0, 2916.0, 5142.0, 8879.0, 15756.0, 28804.0, 54168.0, 109825.0, 311440.0, 1296276.0, 125653.0, 60718.0, 31820.0, 17644.0, 9825.0, 5581.0, 3280.0, 1854.0, 1147.0, 667.0, 428.0, 282.0, 174.0, 99.0, 63.0, 41.0, 37.0, 24.0, 5.0, 10.0, 8.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.455078125, -1.40826416015625, -1.3614501953125, -1.31463623046875, -1.267822265625, -1.22100830078125, -1.1741943359375, -1.12738037109375, -1.08056640625, -1.03375244140625, -0.9869384765625, -0.94012451171875, -0.893310546875, -0.84649658203125, -0.7996826171875, -0.75286865234375, -0.7060546875, -0.65924072265625, -0.6124267578125, -0.56561279296875, -0.518798828125, -0.47198486328125, -0.4251708984375, -0.37835693359375, -0.33154296875, -0.28472900390625, -0.2379150390625, -0.19110107421875, -0.144287109375, -0.09747314453125, -0.0506591796875, -0.00384521484375, 0.04296875, 0.08978271484375, 0.1365966796875, 0.18341064453125, 0.230224609375, 0.27703857421875, 0.3238525390625, 0.37066650390625, 0.41748046875, 0.46429443359375, 0.5111083984375, 0.55792236328125, 0.604736328125, 0.65155029296875, 0.6983642578125, 0.74517822265625, 0.7919921875, 0.83880615234375, 0.8856201171875, 0.93243408203125, 0.979248046875, 1.02606201171875, 1.0728759765625, 1.11968994140625, 1.16650390625, 1.21331787109375, 1.2601318359375, 1.30694580078125, 1.353759765625, 1.40057373046875, 1.4473876953125, 1.49420166015625, 1.541015625]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 6.0, 4.0, 4.0, 5.0, 4.0, 16.0, 13.0, 14.0, 21.0, 22.0, 32.0, 40.0, 79.0, 87.0, 126.0, 132.0, 107.0, 66.0, 44.0, 31.0, 21.0, 25.0, 16.0, 15.0, 9.0, 9.0, 14.0, 12.0, 11.0, 5.0, 7.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0174102783203125, -0.016900181770324707, -0.016390085220336914, -0.01587998867034912, -0.015369892120361328, -0.014859795570373535, -0.014349699020385742, -0.01383960247039795, -0.013329505920410156, -0.012819409370422363, -0.01230931282043457, -0.011799216270446777, -0.011289119720458984, -0.010779023170471191, -0.010268926620483398, -0.009758830070495605, -0.009248733520507812, -0.00873863697052002, -0.008228540420532227, -0.007718443870544434, -0.007208347320556641, -0.006698250770568848, -0.006188154220581055, -0.005678057670593262, -0.005167961120605469, -0.004657864570617676, -0.004147768020629883, -0.00363767147064209, -0.003127574920654297, -0.002617478370666504, -0.002107381820678711, -0.001597285270690918, -0.001087188720703125, -0.000577092170715332, -6.699562072753906e-05, 0.0004431009292602539, 0.0009531974792480469, 0.0014632940292358398, 0.001973390579223633, 0.0024834871292114258, 0.0029935836791992188, 0.0035036802291870117, 0.004013776779174805, 0.004523873329162598, 0.005033969879150391, 0.005544066429138184, 0.0060541629791259766, 0.0065642595291137695, 0.0070743560791015625, 0.0075844526290893555, 0.008094549179077148, 0.008604645729064941, 0.009114742279052734, 0.009624838829040527, 0.01013493537902832, 0.010645031929016113, 0.011155128479003906, 0.0116652250289917, 0.012175321578979492, 0.012685418128967285, 0.013195514678955078, 0.013705611228942871, 0.014215707778930664, 0.014725804328918457, 0.01523590087890625]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 3.0, 5.0, 6.0, 14.0, 16.0, 21.0, 21.0, 27.0, 41.0, 33.0, 47.0, 64.0, 87.0, 126.0, 217.0, 531.0, 5361.0, 998082.0, 41921.0, 1047.0, 280.0, 131.0, 94.0, 73.0, 59.0, 49.0, 30.0, 29.0, 34.0, 29.0, 20.0, 16.0, 9.0, 8.0, 4.0, 4.0, 5.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.290283203125, -0.28167724609375, -0.2730712890625, -0.26446533203125, -0.255859375, -0.24725341796875, -0.2386474609375, -0.23004150390625, -0.221435546875, -0.21282958984375, -0.2042236328125, -0.19561767578125, -0.18701171875, -0.17840576171875, -0.1697998046875, -0.16119384765625, -0.152587890625, -0.14398193359375, -0.1353759765625, -0.12677001953125, -0.1181640625, -0.10955810546875, -0.1009521484375, -0.09234619140625, -0.083740234375, -0.07513427734375, -0.0665283203125, -0.05792236328125, -0.04931640625, -0.04071044921875, -0.0321044921875, -0.02349853515625, -0.014892578125, -0.00628662109375, 0.0023193359375, 0.01092529296875, 0.01953125, 0.02813720703125, 0.0367431640625, 0.04534912109375, 0.053955078125, 0.06256103515625, 0.0711669921875, 0.07977294921875, 0.08837890625, 0.09698486328125, 0.1055908203125, 0.11419677734375, 0.122802734375, 0.13140869140625, 0.1400146484375, 0.14862060546875, 0.1572265625, 0.16583251953125, 0.1744384765625, 0.18304443359375, 0.191650390625, 0.20025634765625, 0.2088623046875, 0.21746826171875, 0.22607421875, 0.23468017578125, 0.2432861328125, 0.25189208984375, 0.260498046875]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 33.0, 794.0, 183.0, 8.0], "bins": [-0.15262740850448608, -0.15015652775764465, -0.14768564701080322, -0.1452147662639618, -0.14274387061595917, -0.14027298986911774, -0.1378021091222763, -0.13533122837543488, -0.13286034762859344, -0.13038946688175201, -0.12791858613491058, -0.12544770538806915, -0.12297681719064713, -0.1205059289932251, -0.11803504824638367, -0.11556416749954224, -0.11309327930212021, -0.11062239855527878, -0.10815151035785675, -0.10568062961101532, -0.10320974886417389, -0.10073886811733246, -0.09826797991991043, -0.095797099173069, -0.09332621097564697, -0.09085533022880554, -0.08838444203138351, -0.08591356128454208, -0.08344268053770065, -0.08097179234027863, -0.0785009115934372, -0.07603003084659576, -0.07355915755033493, -0.0710882768034935, -0.06861738860607147, -0.06614650785923004, -0.06367562711238861, -0.06120474264025688, -0.05873385816812515, -0.05626297742128372, -0.053792089223861694, -0.051321204751729965, -0.048850324004888535, -0.046379439532756805, -0.043908558785915375, -0.041437674313783646, -0.038966789841651917, -0.036495909094810486, -0.03402502462267876, -0.03155414015054703, -0.029083259403705597, -0.026612374931573868, -0.024141492322087288, -0.021670609712600708, -0.01919972524046898, -0.0167288426309824, -0.014257960021495819, -0.01178707741200924, -0.009316193871200085, -0.0068453107960522175, -0.00437442772090435, -0.0019035451114177704, 0.0005673384293913841, 0.0030382219702005386, 0.005509104114025831]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 4.0, 3.0, 3.0, 9.0, 12.0, 12.0, 16.0, 18.0, 19.0, 25.0, 24.0, 32.0, 33.0, 36.0, 50.0, 45.0, 48.0, 47.0, 47.0, 49.0, 56.0, 42.0, 48.0, 43.0, 33.0, 37.0, 40.0, 35.0, 18.0, 28.0, 23.0, 18.0, 13.0, 12.0, 7.0, 7.0, 8.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.009079039096832275, -0.008834026753902435, -0.008589014410972595, -0.008344002068042755, -0.008098989725112915, -0.007853977382183075, -0.007608965039253235, -0.007363952696323395, -0.007118940353393555, -0.006873928010463715, -0.0066289156675338745, -0.006383903324604034, -0.006138890981674194, -0.005893878638744354, -0.005648866295814514, -0.005403853952884674, -0.005158841609954834, -0.004913829267024994, -0.004668816924095154, -0.004423804581165314, -0.004178792238235474, -0.0039337798953056335, -0.0036887675523757935, -0.0034437552094459534, -0.0031987428665161133, -0.002953730523586273, -0.002708718180656433, -0.002463705837726593, -0.002218693494796753, -0.001973681151866913, -0.0017286688089370728, -0.0014836564660072327, -0.0012386441230773926, -0.0009936317801475525, -0.0007486194372177124, -0.0005036070942878723, -0.0002585947513580322, -1.3582408428192139e-05, 0.00023142993450164795, 0.00047644227743148804, 0.0007214546203613281, 0.0009664669632911682, 0.0012114793062210083, 0.0014564916491508484, 0.0017015039920806885, 0.0019465163350105286, 0.0021915286779403687, 0.0024365410208702087, 0.002681553363800049, 0.002926565706729889, 0.003171578049659729, 0.003416590392589569, 0.003661602735519409, 0.003906615078449249, 0.004151627421379089, 0.0043966397643089294, 0.0046416521072387695, 0.00488666445016861, 0.00513167679309845, 0.00537668913602829, 0.00562170147895813, 0.00586671382188797, 0.00611172616481781, 0.00635673850774765, 0.00660175085067749]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 7.0, 14.0, 7.0, 23.0, 17.0, 14.0, 23.0, 22.0, 40.0, 43.0, 36.0, 41.0, 43.0, 50.0, 58.0, 48.0, 54.0, 59.0, 56.0, 48.0, 48.0, 33.0, 46.0, 28.0, 25.0, 22.0, 25.0, 12.0, 15.0, 13.0, 8.0, 9.0, 3.0, 2.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.75, -32.788818359375, -31.82763671875, -30.866455078125, -29.9052734375, -28.944091796875, -27.98291015625, -27.021728515625, -26.060546875, -25.099365234375, -24.13818359375, -23.177001953125, -22.2158203125, -21.254638671875, -20.29345703125, -19.332275390625, -18.37109375, -17.409912109375, -16.44873046875, -15.487548828125, -14.5263671875, -13.565185546875, -12.60400390625, -11.642822265625, -10.681640625, -9.720458984375, -8.75927734375, -7.798095703125, -6.8369140625, -5.875732421875, -4.91455078125, -3.953369140625, -2.9921875, -2.031005859375, -1.06982421875, -0.108642578125, 0.8525390625, 1.813720703125, 2.77490234375, 3.736083984375, 4.697265625, 5.658447265625, 6.61962890625, 7.580810546875, 8.5419921875, 9.503173828125, 10.46435546875, 11.425537109375, 12.38671875, 13.347900390625, 14.30908203125, 15.270263671875, 16.2314453125, 17.192626953125, 18.15380859375, 19.114990234375, 20.076171875, 21.037353515625, 21.99853515625, 22.959716796875, 23.9208984375, 24.882080078125, 25.84326171875, 26.804443359375, 27.765625]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 2.0, 3.0, 4.0, 9.0, 7.0, 12.0, 13.0, 22.0, 37.0, 46.0, 76.0, 122.0, 142.0, 234.0, 308.0, 540.0, 929.0, 1822.0, 4150.0, 11245.0, 35205.0, 154908.0, 663081.0, 126878.0, 31118.0, 9872.0, 3769.0, 1602.0, 872.0, 532.0, 291.0, 213.0, 142.0, 96.0, 66.0, 60.0, 35.0, 28.0, 16.0, 17.0, 10.0, 7.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-30.03125, -29.13330078125, -28.2353515625, -27.33740234375, -26.439453125, -25.54150390625, -24.6435546875, -23.74560546875, -22.84765625, -21.94970703125, -21.0517578125, -20.15380859375, -19.255859375, -18.35791015625, -17.4599609375, -16.56201171875, -15.6640625, -14.76611328125, -13.8681640625, -12.97021484375, -12.072265625, -11.17431640625, -10.2763671875, -9.37841796875, -8.48046875, -7.58251953125, -6.6845703125, -5.78662109375, -4.888671875, -3.99072265625, -3.0927734375, -2.19482421875, -1.296875, -0.39892578125, 0.4990234375, 1.39697265625, 2.294921875, 3.19287109375, 4.0908203125, 4.98876953125, 5.88671875, 6.78466796875, 7.6826171875, 8.58056640625, 9.478515625, 10.37646484375, 11.2744140625, 12.17236328125, 13.0703125, 13.96826171875, 14.8662109375, 15.76416015625, 16.662109375, 17.56005859375, 18.4580078125, 19.35595703125, 20.25390625, 21.15185546875, 22.0498046875, 22.94775390625, 23.845703125, 24.74365234375, 25.6416015625, 26.53955078125, 27.4375]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 2.0, 4.0, 6.0, 4.0, 8.0, 9.0, 15.0, 10.0, 14.0, 17.0, 19.0, 29.0, 35.0, 25.0, 37.0, 33.0, 33.0, 52.0, 42.0, 56.0, 168.0, 1954.0, 52.0, 30.0, 37.0, 51.0, 56.0, 32.0, 29.0, 32.0, 27.0, 24.0, 15.0, 24.0, 18.0, 5.0, 11.0, 8.0, 7.0, 4.0, 5.0, 4.0, 6.0, 4.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-104.8125, -101.6513671875, -98.490234375, -95.3291015625, -92.16796875, -89.0068359375, -85.845703125, -82.6845703125, -79.5234375, -76.3623046875, -73.201171875, -70.0400390625, -66.87890625, -63.7177734375, -60.556640625, -57.3955078125, -54.234375, -51.0732421875, -47.912109375, -44.7509765625, -41.58984375, -38.4287109375, -35.267578125, -32.1064453125, -28.9453125, -25.7841796875, -22.623046875, -19.4619140625, -16.30078125, -13.1396484375, -9.978515625, -6.8173828125, -3.65625, -0.4951171875, 2.666015625, 5.8271484375, 8.98828125, 12.1494140625, 15.310546875, 18.4716796875, 21.6328125, 24.7939453125, 27.955078125, 31.1162109375, 34.27734375, 37.4384765625, 40.599609375, 43.7607421875, 46.921875, 50.0830078125, 53.244140625, 56.4052734375, 59.56640625, 62.7275390625, 65.888671875, 69.0498046875, 72.2109375, 75.3720703125, 78.533203125, 81.6943359375, 84.85546875, 88.0166015625, 91.177734375, 94.3388671875, 97.5]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 5.0, 5.0, 5.0, 4.0, 4.0, 4.0, 8.0, 9.0, 8.0, 13.0, 15.0, 23.0, 23.0, 20.0, 50.0, 34.0, 46.0, 59.0, 115.0, 156.0, 256.0, 690.0, 2779.0, 3130698.0, 8954.0, 821.0, 323.0, 170.0, 88.0, 61.0, 53.0, 40.0, 33.0, 36.0, 16.0, 18.0, 12.0, 12.0, 15.0, 9.0, 6.0, 4.0, 6.0, 5.0, 2.0, 2.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-225.5, -218.1328125, -210.765625, -203.3984375, -196.03125, -188.6640625, -181.296875, -173.9296875, -166.5625, -159.1953125, -151.828125, -144.4609375, -137.09375, -129.7265625, -122.359375, -114.9921875, -107.625, -100.2578125, -92.890625, -85.5234375, -78.15625, -70.7890625, -63.421875, -56.0546875, -48.6875, -41.3203125, -33.953125, -26.5859375, -19.21875, -11.8515625, -4.484375, 2.8828125, 10.25, 17.6171875, 24.984375, 32.3515625, 39.71875, 47.0859375, 54.453125, 61.8203125, 69.1875, 76.5546875, 83.921875, 91.2890625, 98.65625, 106.0234375, 113.390625, 120.7578125, 128.125, 135.4921875, 142.859375, 150.2265625, 157.59375, 164.9609375, 172.328125, 179.6953125, 187.0625, 194.4296875, 201.796875, 209.1640625, 216.53125, 223.8984375, 231.265625, 238.6328125, 246.0]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [615.0, 405.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.915279388427734, 1.1850128173828125, 21.28530502319336, 41.385597229003906, 61.48588943481445, 81.586181640625, 101.68647766113281, 121.78675842285156, 141.88705444335938, 161.9873504638672, 182.087646484375, 202.18792724609375, 222.28822326660156, 242.38851928710938, 262.4888000488281, 282.589111328125, 302.68939208984375, 322.7896728515625, 342.8899841308594, 362.9902648925781, 383.090576171875, 403.19085693359375, 423.2911376953125, 443.39141845703125, 463.4917297363281, 483.5920104980469, 503.69232177734375, 523.7926025390625, 543.8928833007812, 563.9931640625, 584.093505859375, 604.1937866210938, 624.2940673828125, 644.3943481445312, 664.49462890625, 684.594970703125, 704.6952514648438, 724.7955322265625, 744.8958129882812, 764.99609375, 785.096435546875, 805.1967163085938, 825.2969970703125, 845.3973388671875, 865.4976196289062, 885.597900390625, 905.6981811523438, 925.7984619140625, 945.8987426757812, 965.9990234375, 986.0993041992188, 1006.1996459960938, 1026.2999267578125, 1046.400146484375, 1066.50048828125, 1086.600830078125, 1106.7010498046875, 1126.8013916015625, 1146.901611328125, 1167.001953125, 1187.1021728515625, 1207.2025146484375, 1227.3028564453125, 1247.403076171875, 1267.50341796875]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 5.0, 6.0, 14.0, 8.0, 9.0, 15.0, 14.0, 28.0, 18.0, 33.0, 21.0, 37.0, 37.0, 28.0, 26.0, 35.0, 37.0, 24.0, 31.0, 40.0, 35.0, 44.0, 45.0, 47.0, 36.0, 40.0, 38.0, 25.0, 27.0, 31.0, 20.0, 28.0, 13.0, 14.0, 22.0, 9.0, 9.0, 9.0, 9.0, 5.0, 5.0, 7.0, 5.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-281.6238708496094, -272.5931396484375, -263.56243896484375, -254.53170776367188, -245.50099182128906, -236.47027587890625, -227.43954467773438, -218.40882873535156, -209.37811279296875, -200.34739685058594, -191.31668090820312, -182.28594970703125, -173.25523376464844, -164.22451782226562, -155.19378662109375, -146.16307067871094, -137.13235473632812, -128.1016387939453, -119.07091522216797, -110.04019165039062, -101.00947570800781, -91.978759765625, -82.94803619384766, -73.91731262207031, -64.8865966796875, -55.85587692260742, -46.825157165527344, -37.794437408447266, -28.763717651367188, -19.73299789428711, -10.702278137207031, -1.6715583801269531, 7.35919189453125, 16.389911651611328, 25.420631408691406, 34.451351165771484, 43.48207092285156, 52.51279067993164, 61.54351043701172, 70.57423400878906, 79.60494995117188, 88.63566589355469, 97.66638946533203, 106.69711303710938, 115.72782897949219, 124.758544921875, 133.78927612304688, 142.8199920654297, 151.8507080078125, 160.8814239501953, 169.91213989257812, 178.94287109375, 187.9735870361328, 197.00430297851562, 206.0350341796875, 215.0657501220703, 224.09646606445312, 233.12718200683594, 242.15789794921875, 251.18862915039062, 260.2193603515625, 269.25006103515625, 278.2807922363281, 287.3114929199219, 296.34222412109375]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 9.0, 11.0, 16.0, 17.0, 14.0, 20.0, 18.0, 31.0, 30.0, 47.0, 35.0, 40.0, 42.0, 47.0, 56.0, 52.0, 48.0, 55.0, 61.0, 46.0, 49.0, 39.0, 33.0, 32.0, 27.0, 25.0, 23.0, 15.0, 15.0, 10.0, 10.0, 10.0, 3.0, 3.0, 4.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-33.71875, -32.759033203125, -31.79931640625, -30.839599609375, -29.8798828125, -28.920166015625, -27.96044921875, -27.000732421875, -26.041015625, -25.081298828125, -24.12158203125, -23.161865234375, -22.2021484375, -21.242431640625, -20.28271484375, -19.322998046875, -18.36328125, -17.403564453125, -16.44384765625, -15.484130859375, -14.5244140625, -13.564697265625, -12.60498046875, -11.645263671875, -10.685546875, -9.725830078125, -8.76611328125, -7.806396484375, -6.8466796875, -5.886962890625, -4.92724609375, -3.967529296875, -3.0078125, -2.048095703125, -1.08837890625, -0.128662109375, 0.8310546875, 1.790771484375, 2.75048828125, 3.710205078125, 4.669921875, 5.629638671875, 6.58935546875, 7.549072265625, 8.5087890625, 9.468505859375, 10.42822265625, 11.387939453125, 12.34765625, 13.307373046875, 14.26708984375, 15.226806640625, 16.1865234375, 17.146240234375, 18.10595703125, 19.065673828125, 20.025390625, 20.985107421875, 21.94482421875, 22.904541015625, 23.8642578125, 24.823974609375, 25.78369140625, 26.743408203125, 27.703125]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 6.0, 2.0, 13.0, 14.0, 14.0, 17.0, 22.0, 23.0, 51.0, 71.0, 110.0, 170.0, 288.0, 665.0, 1917.0, 6761.0, 75707.0, 4076109.0, 25335.0, 4400.0, 1395.0, 493.0, 284.0, 130.0, 94.0, 42.0, 44.0, 28.0, 20.0, 15.0, 10.0, 13.0, 10.0, 2.0, 3.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-241.875, -235.033203125, -228.19140625, -221.349609375, -214.5078125, -207.666015625, -200.82421875, -193.982421875, -187.140625, -180.298828125, -173.45703125, -166.615234375, -159.7734375, -152.931640625, -146.08984375, -139.248046875, -132.40625, -125.564453125, -118.72265625, -111.880859375, -105.0390625, -98.197265625, -91.35546875, -84.513671875, -77.671875, -70.830078125, -63.98828125, -57.146484375, -50.3046875, -43.462890625, -36.62109375, -29.779296875, -22.9375, -16.095703125, -9.25390625, -2.412109375, 4.4296875, 11.271484375, 18.11328125, 24.955078125, 31.796875, 38.638671875, 45.48046875, 52.322265625, 59.1640625, 66.005859375, 72.84765625, 79.689453125, 86.53125, 93.373046875, 100.21484375, 107.056640625, 113.8984375, 120.740234375, 127.58203125, 134.423828125, 141.265625, 148.107421875, 154.94921875, 161.791015625, 168.6328125, 175.474609375, 182.31640625, 189.158203125, 196.0]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 4.0, 1.0, 2.0, 9.0, 12.0, 8.0, 8.0, 6.0, 8.0, 17.0, 17.0, 34.0, 41.0, 83.0, 237.0, 857.0, 1607.0, 686.0, 205.0, 77.0, 47.0, 25.0, 21.0, 16.0, 16.0, 12.0, 3.0, 6.0, 4.0, 4.0, 3.0, 2.0, 1.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.3125, -67.6376953125, -63.962890625, -60.2880859375, -56.61328125, -52.9384765625, -49.263671875, -45.5888671875, -41.9140625, -38.2392578125, -34.564453125, -30.8896484375, -27.21484375, -23.5400390625, -19.865234375, -16.1904296875, -12.515625, -8.8408203125, -5.166015625, -1.4912109375, 2.18359375, 5.8583984375, 9.533203125, 13.2080078125, 16.8828125, 20.5576171875, 24.232421875, 27.9072265625, 31.58203125, 35.2568359375, 38.931640625, 42.6064453125, 46.28125, 49.9560546875, 53.630859375, 57.3056640625, 60.98046875, 64.6552734375, 68.330078125, 72.0048828125, 75.6796875, 79.3544921875, 83.029296875, 86.7041015625, 90.37890625, 94.0537109375, 97.728515625, 101.4033203125, 105.078125, 108.7529296875, 112.427734375, 116.1025390625, 119.77734375, 123.4521484375, 127.126953125, 130.8017578125, 134.4765625, 138.1513671875, 141.826171875, 145.5009765625, 149.17578125, 152.8505859375, 156.525390625, 160.2001953125, 163.875]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 7.0, 3.0, 4.0, 7.0, 5.0, 8.0, 10.0, 14.0, 17.0, 36.0, 49.0, 58.0, 83.0, 195.0, 324.0, 578.0, 1196.0, 2455.0, 5371.0, 12405.0, 36755.0, 379472.0, 3640501.0, 79306.0, 20238.0, 8031.0, 3499.0, 1757.0, 847.0, 417.0, 261.0, 135.0, 79.0, 52.0, 25.0, 24.0, 19.0, 15.0, 9.0, 8.0, 5.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-191.625, -186.029296875, -180.43359375, -174.837890625, -169.2421875, -163.646484375, -158.05078125, -152.455078125, -146.859375, -141.263671875, -135.66796875, -130.072265625, -124.4765625, -118.880859375, -113.28515625, -107.689453125, -102.09375, -96.498046875, -90.90234375, -85.306640625, -79.7109375, -74.115234375, -68.51953125, -62.923828125, -57.328125, -51.732421875, -46.13671875, -40.541015625, -34.9453125, -29.349609375, -23.75390625, -18.158203125, -12.5625, -6.966796875, -1.37109375, 4.224609375, 9.8203125, 15.416015625, 21.01171875, 26.607421875, 32.203125, 37.798828125, 43.39453125, 48.990234375, 54.5859375, 60.181640625, 65.77734375, 71.373046875, 76.96875, 82.564453125, 88.16015625, 93.755859375, 99.3515625, 104.947265625, 110.54296875, 116.138671875, 121.734375, 127.330078125, 132.92578125, 138.521484375, 144.1171875, 149.712890625, 155.30859375, 160.904296875, 166.5]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 12.0, 14.0, 27.0, 57.0, 114.0, 237.0, 273.0, 133.0, 64.0, 28.0, 23.0, 12.0, 7.0, 2.0, 3.0, 4.0, 1.0, 2.0], "bins": [-894.5339965820312, -877.389404296875, -860.2448120117188, -843.1002197265625, -825.9556274414062, -808.81103515625, -791.6664428710938, -774.5218505859375, -757.377197265625, -740.2326049804688, -723.0880126953125, -705.9434204101562, -688.798828125, -671.6542358398438, -654.5096435546875, -637.364990234375, -620.220458984375, -603.0758666992188, -585.9312744140625, -568.7866821289062, -551.64208984375, -534.4974975585938, -517.3529052734375, -500.2082824707031, -483.0636901855469, -465.9190979003906, -448.7745056152344, -431.6299133300781, -414.48529052734375, -397.3406982421875, -380.19610595703125, -363.051513671875, -345.906982421875, -328.76239013671875, -311.6177978515625, -294.47320556640625, -277.32861328125, -260.18402099609375, -243.03939819335938, -225.89480590820312, -208.75021362304688, -191.60562133789062, -174.46102905273438, -157.31642150878906, -140.1718292236328, -123.02723693847656, -105.88263702392578, -88.738037109375, -71.59344482421875, -54.448848724365234, -37.30425262451172, -20.159656524658203, -3.0150604248046875, 14.129531860351562, 31.274131774902344, 48.418731689453125, 65.56332397460938, 82.70791625976562, 99.8525161743164, 116.99711608886719, 134.14170837402344, 151.2863006591797, 168.430908203125, 185.57550048828125, 202.7200927734375]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 3.0, 6.0, 5.0, 7.0, 9.0, 11.0, 13.0, 17.0, 19.0, 19.0, 25.0, 29.0, 27.0, 17.0, 42.0, 40.0, 52.0, 44.0, 37.0, 55.0, 41.0, 55.0, 42.0, 43.0, 45.0, 53.0, 31.0, 34.0, 31.0, 23.0, 23.0, 20.0, 18.0, 14.0, 12.0, 16.0, 5.0, 14.0, 7.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-255.06039428710938, -247.67257690429688, -240.28475952148438, -232.89694213867188, -225.50912475585938, -218.12130737304688, -210.73348999023438, -203.34568786621094, -195.95787048339844, -188.57005310058594, -181.18223571777344, -173.79441833496094, -166.40660095214844, -159.018798828125, -151.6309814453125, -144.2431640625, -136.8553466796875, -129.467529296875, -122.0797119140625, -114.69189453125, -107.30408477783203, -99.91626739501953, -92.52845001220703, -85.14064025878906, -77.7528076171875, -70.364990234375, -62.977176666259766, -55.589359283447266, -48.20154571533203, -40.81372833251953, -33.42591094970703, -26.038097381591797, -18.650283813476562, -11.262468338012695, -3.8746519088745117, 3.513164520263672, 10.900979995727539, 18.288795471191406, 25.676612854003906, 33.06442642211914, 40.45224380493164, 47.84006118774414, 55.227874755859375, 62.615692138671875, 70.00350952148438, 77.39132690429688, 84.77914428710938, 92.16695404052734, 99.55477142333984, 106.94258880615234, 114.33040618896484, 121.71821594238281, 129.1060333251953, 136.4938507080078, 143.8816680908203, 151.2694854736328, 158.6573028564453, 166.0451202392578, 173.4329376220703, 180.8207550048828, 188.2085723876953, 195.59637451171875, 202.98419189453125, 210.37200927734375, 217.75982666015625]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 3.0, 5.0, 6.0, 6.0, 8.0, 15.0, 13.0, 13.0, 14.0, 18.0, 25.0, 30.0, 34.0, 39.0, 32.0, 38.0, 33.0, 40.0, 45.0, 49.0, 58.0, 52.0, 46.0, 52.0, 44.0, 34.0, 47.0, 32.0, 32.0, 16.0, 23.0, 20.0, 18.0, 12.0, 12.0, 6.0, 6.0, 9.0, 5.0, 7.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-33.21875, -32.30615234375, -31.3935546875, -30.48095703125, -29.568359375, -28.65576171875, -27.7431640625, -26.83056640625, -25.91796875, -25.00537109375, -24.0927734375, -23.18017578125, -22.267578125, -21.35498046875, -20.4423828125, -19.52978515625, -18.6171875, -17.70458984375, -16.7919921875, -15.87939453125, -14.966796875, -14.05419921875, -13.1416015625, -12.22900390625, -11.31640625, -10.40380859375, -9.4912109375, -8.57861328125, -7.666015625, -6.75341796875, -5.8408203125, -4.92822265625, -4.015625, -3.10302734375, -2.1904296875, -1.27783203125, -0.365234375, 0.54736328125, 1.4599609375, 2.37255859375, 3.28515625, 4.19775390625, 5.1103515625, 6.02294921875, 6.935546875, 7.84814453125, 8.7607421875, 9.67333984375, 10.5859375, 11.49853515625, 12.4111328125, 13.32373046875, 14.236328125, 15.14892578125, 16.0615234375, 16.97412109375, 17.88671875, 18.79931640625, 19.7119140625, 20.62451171875, 21.537109375, 22.44970703125, 23.3623046875, 24.27490234375, 25.1875]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 3.0, 4.0, 4.0, 4.0, 8.0, 10.0, 17.0, 26.0, 39.0, 53.0, 78.0, 123.0, 145.0, 251.0, 419.0, 636.0, 942.0, 1537.0, 2419.0, 3889.0, 6219.0, 10307.0, 16984.0, 29091.0, 51045.0, 95703.0, 204148.0, 305142.0, 146948.0, 72931.0, 39874.0, 23456.0, 13850.0, 8392.0, 5122.0, 3199.0, 2026.0, 1193.0, 835.0, 486.0, 328.0, 231.0, 138.0, 105.0, 71.0, 32.0, 37.0, 14.0, 18.0, 8.0, 11.0, 7.0, 5.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.40625, -1.3613128662109375, -1.316375732421875, -1.2714385986328125, -1.22650146484375, -1.1815643310546875, -1.136627197265625, -1.0916900634765625, -1.0467529296875, -1.0018157958984375, -0.956878662109375, -0.9119415283203125, -0.86700439453125, -0.8220672607421875, -0.777130126953125, -0.7321929931640625, -0.687255859375, -0.6423187255859375, -0.597381591796875, -0.5524444580078125, -0.50750732421875, -0.4625701904296875, -0.417633056640625, -0.3726959228515625, -0.3277587890625, -0.2828216552734375, -0.237884521484375, -0.1929473876953125, -0.14801025390625, -0.1030731201171875, -0.058135986328125, -0.0131988525390625, 0.03173828125, 0.0766754150390625, 0.121612548828125, 0.1665496826171875, 0.21148681640625, 0.2564239501953125, 0.301361083984375, 0.3462982177734375, 0.3912353515625, 0.4361724853515625, 0.481109619140625, 0.5260467529296875, 0.57098388671875, 0.6159210205078125, 0.660858154296875, 0.7057952880859375, 0.750732421875, 0.7956695556640625, 0.840606689453125, 0.8855438232421875, 0.93048095703125, 0.9754180908203125, 1.020355224609375, 1.0652923583984375, 1.1102294921875, 1.1551666259765625, 1.200103759765625, 1.2450408935546875, 1.28997802734375, 1.3349151611328125, 1.379852294921875, 1.4247894287109375, 1.4697265625]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 11.0, 7.0, 14.0, 7.0, 11.0, 10.0, 9.0, 14.0, 20.0, 18.0, 15.0, 19.0, 38.0, 33.0, 51.0, 31.0, 38.0, 36.0, 41.0, 38.0, 28.0, 1061.0, 40.0, 45.0, 38.0, 29.0, 35.0, 34.0, 25.0, 29.0, 30.0, 27.0, 14.0, 27.0, 24.0, 18.0, 10.0, 16.0, 10.0, 8.0, 5.0, 6.0, 3.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.953125, -16.41162109375, -15.8701171875, -15.32861328125, -14.787109375, -14.24560546875, -13.7041015625, -13.16259765625, -12.62109375, -12.07958984375, -11.5380859375, -10.99658203125, -10.455078125, -9.91357421875, -9.3720703125, -8.83056640625, -8.2890625, -7.74755859375, -7.2060546875, -6.66455078125, -6.123046875, -5.58154296875, -5.0400390625, -4.49853515625, -3.95703125, -3.41552734375, -2.8740234375, -2.33251953125, -1.791015625, -1.24951171875, -0.7080078125, -0.16650390625, 0.375, 0.91650390625, 1.4580078125, 1.99951171875, 2.541015625, 3.08251953125, 3.6240234375, 4.16552734375, 4.70703125, 5.24853515625, 5.7900390625, 6.33154296875, 6.873046875, 7.41455078125, 7.9560546875, 8.49755859375, 9.0390625, 9.58056640625, 10.1220703125, 10.66357421875, 11.205078125, 11.74658203125, 12.2880859375, 12.82958984375, 13.37109375, 13.91259765625, 14.4541015625, 14.99560546875, 15.537109375, 16.07861328125, 16.6201171875, 17.16162109375, 17.703125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 2.0, 12.0, 13.0, 21.0, 33.0, 37.0, 54.0, 81.0, 110.0, 166.0, 264.0, 365.0, 589.0, 882.0, 1302.0, 1957.0, 3223.0, 5204.0, 8002.0, 12892.0, 20920.0, 35044.0, 61704.0, 117043.0, 784133.0, 772772.0, 117581.0, 61718.0, 35076.0, 20713.0, 12899.0, 7962.0, 5107.0, 3212.0, 2066.0, 1350.0, 871.0, 613.0, 390.0, 247.0, 168.0, 99.0, 72.0, 59.0, 33.0, 25.0, 17.0, 12.0, 9.0, 6.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0], "bins": [-1.3466796875, -1.3032379150390625, -1.259796142578125, -1.2163543701171875, -1.17291259765625, -1.1294708251953125, -1.086029052734375, -1.0425872802734375, -0.9991455078125, -0.9557037353515625, -0.912261962890625, -0.8688201904296875, -0.82537841796875, -0.7819366455078125, -0.738494873046875, -0.6950531005859375, -0.651611328125, -0.6081695556640625, -0.564727783203125, -0.5212860107421875, -0.47784423828125, -0.4344024658203125, -0.390960693359375, -0.3475189208984375, -0.3040771484375, -0.2606353759765625, -0.217193603515625, -0.1737518310546875, -0.13031005859375, -0.0868682861328125, -0.043426513671875, 1.52587890625e-05, 0.04345703125, 0.0868988037109375, 0.130340576171875, 0.1737823486328125, 0.21722412109375, 0.2606658935546875, 0.304107666015625, 0.3475494384765625, 0.3909912109375, 0.4344329833984375, 0.477874755859375, 0.5213165283203125, 0.56475830078125, 0.6082000732421875, 0.651641845703125, 0.6950836181640625, 0.738525390625, 0.7819671630859375, 0.825408935546875, 0.8688507080078125, 0.91229248046875, 0.9557342529296875, 0.999176025390625, 1.0426177978515625, 1.0860595703125, 1.1295013427734375, 1.172943115234375, 1.2163848876953125, 1.25982666015625, 1.3032684326171875, 1.346710205078125, 1.3901519775390625, 1.43359375]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 6.0, 13.0, 16.0, 12.0, 26.0, 26.0, 45.0, 54.0, 74.0, 99.0, 119.0, 138.0, 89.0, 68.0, 48.0, 43.0, 29.0, 22.0, 17.0, 10.0, 11.0, 8.0, 5.0, 4.0, 3.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.03240966796875, -0.031482696533203125, -0.03055572509765625, -0.029628753662109375, -0.0287017822265625, -0.027774810791015625, -0.02684783935546875, -0.025920867919921875, -0.024993896484375, -0.024066925048828125, -0.02313995361328125, -0.022212982177734375, -0.0212860107421875, -0.020359039306640625, -0.01943206787109375, -0.018505096435546875, -0.017578125, -0.016651153564453125, -0.01572418212890625, -0.014797210693359375, -0.0138702392578125, -0.012943267822265625, -0.01201629638671875, -0.011089324951171875, -0.010162353515625, -0.009235382080078125, -0.00830841064453125, -0.007381439208984375, -0.0064544677734375, -0.005527496337890625, -0.00460052490234375, -0.003673553466796875, -0.00274658203125, -0.001819610595703125, -0.00089263916015625, 3.4332275390625e-05, 0.0009613037109375, 0.001888275146484375, 0.00281524658203125, 0.003742218017578125, 0.004669189453125, 0.005596160888671875, 0.00652313232421875, 0.007450103759765625, 0.0083770751953125, 0.009304046630859375, 0.01023101806640625, 0.011157989501953125, 0.0120849609375, 0.013011932373046875, 0.01393890380859375, 0.014865875244140625, 0.0157928466796875, 0.016719818115234375, 0.01764678955078125, 0.018573760986328125, 0.019500732421875, 0.020427703857421875, 0.02135467529296875, 0.022281646728515625, 0.0232086181640625, 0.024135589599609375, 0.02506256103515625, 0.025989532470703125, 0.02691650390625]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 4.0, 4.0, 4.0, 5.0, 6.0, 4.0, 8.0, 7.0, 16.0, 21.0, 31.0, 46.0, 61.0, 72.0, 125.0, 185.0, 381.0, 1565.0, 42731.0, 992914.0, 8735.0, 829.0, 281.0, 156.0, 100.0, 78.0, 50.0, 36.0, 33.0, 17.0, 16.0, 8.0, 6.0, 4.0, 7.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.452880859375, -0.4384193420410156, -0.42395782470703125, -0.4094963073730469, -0.3950347900390625, -0.3805732727050781, -0.36611175537109375, -0.3516502380371094, -0.337188720703125, -0.3227272033691406, -0.30826568603515625, -0.2938041687011719, -0.2793426513671875, -0.2648811340332031, -0.25041961669921875, -0.23595809936523438, -0.22149658203125, -0.20703506469726562, -0.19257354736328125, -0.17811203002929688, -0.1636505126953125, -0.14918899536132812, -0.13472747802734375, -0.12026596069335938, -0.105804443359375, -0.09134292602539062, -0.07688140869140625, -0.062419891357421875, -0.0479583740234375, -0.033496856689453125, -0.01903533935546875, -0.004573822021484375, 0.0098876953125, 0.024349212646484375, 0.03881072998046875, 0.053272247314453125, 0.0677337646484375, 0.08219528198242188, 0.09665679931640625, 0.11111831665039062, 0.125579833984375, 0.14004135131835938, 0.15450286865234375, 0.16896438598632812, 0.1834259033203125, 0.19788742065429688, 0.21234893798828125, 0.22681045532226562, 0.24127197265625, 0.2557334899902344, 0.27019500732421875, 0.2846565246582031, 0.2991180419921875, 0.3135795593261719, 0.32804107666015625, 0.3425025939941406, 0.356964111328125, 0.3714256286621094, 0.38588714599609375, 0.4003486633300781, 0.4148101806640625, 0.4292716979980469, 0.44373321533203125, 0.4581947326660156, 0.47265625]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 27.0, 145.0, 671.0, 143.0, 24.0, 4.0], "bins": [-0.16430501639842987, -0.1615900844335556, -0.15887513756752014, -0.15616020560264587, -0.1534452587366104, -0.15073032677173615, -0.14801537990570068, -0.14530044794082642, -0.14258550107479095, -0.1398705691099167, -0.13715562224388123, -0.13444069027900696, -0.1317257434129715, -0.12901081144809723, -0.12629586458206177, -0.1235809326171875, -0.12086600065231323, -0.11815106123685837, -0.1154361218214035, -0.11272118240594864, -0.11000624299049377, -0.1072913110256195, -0.10457636415958405, -0.10186143219470978, -0.09914648532867432, -0.09643154591321945, -0.09371660649776459, -0.09100166708230972, -0.08828672766685486, -0.08557179570198059, -0.08285684883594513, -0.08014191687107086, -0.077426977455616, -0.07471203804016113, -0.07199709862470627, -0.0692821592092514, -0.06656721979379654, -0.06385228037834167, -0.06113734468817711, -0.05842240899801254, -0.05570746958255768, -0.052992530167102814, -0.05027759075164795, -0.047562651336193085, -0.04484771564602852, -0.042132776230573654, -0.03941783681511879, -0.036702901124954224, -0.03398795798420906, -0.031273018568754196, -0.02855808101594448, -0.025843141600489616, -0.0231282040476799, -0.020413264632225037, -0.017698325216770172, -0.014983387663960457, -0.012268448248505592, -0.009553509764373302, -0.006838570814579725, -0.004123631864786148, -0.0014086933806538582, 0.0013062451034784317, 0.004021184518933296, 0.0067361220717430115, 0.009451061487197876]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 2.0, 6.0, 7.0, 7.0, 4.0, 15.0, 10.0, 22.0, 19.0, 17.0, 22.0, 20.0, 23.0, 28.0, 37.0, 25.0, 40.0, 46.0, 38.0, 40.0, 34.0, 44.0, 34.0, 35.0, 36.0, 35.0, 49.0, 34.0, 27.0, 37.0, 25.0, 29.0, 25.0, 27.0, 25.0, 18.0, 12.0, 12.0, 9.0, 4.0, 9.0, 8.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.012568652629852295, -0.01219777762889862, -0.011826902627944946, -0.011456027626991272, -0.011085152626037598, -0.010714277625083923, -0.010343402624130249, -0.009972527623176575, -0.0096016526222229, -0.009230777621269226, -0.008859902620315552, -0.008489027619361877, -0.008118152618408203, -0.007747277617454529, -0.0073764026165008545, -0.00700552761554718, -0.006634652614593506, -0.0062637776136398315, -0.005892902612686157, -0.005522027611732483, -0.005151152610778809, -0.004780277609825134, -0.00440940260887146, -0.004038527607917786, -0.0036676526069641113, -0.003296777606010437, -0.0029259026050567627, -0.0025550276041030884, -0.002184152603149414, -0.0018132776021957397, -0.0014424026012420654, -0.0010715276002883911, -0.0007006525993347168, -0.0003297775983810425, 4.1097402572631836e-05, 0.00041197240352630615, 0.0007828474044799805, 0.0011537224054336548, 0.001524597406387329, 0.0018954724073410034, 0.0022663474082946777, 0.002637222409248352, 0.0030080974102020264, 0.0033789724111557007, 0.003749847412109375, 0.004120722413063049, 0.004491597414016724, 0.004862472414970398, 0.005233347415924072, 0.005604222416877747, 0.005975097417831421, 0.006345972418785095, 0.0067168474197387695, 0.007087722420692444, 0.007458597421646118, 0.007829472422599792, 0.008200347423553467, 0.008571222424507141, 0.008942097425460815, 0.00931297242641449, 0.009683847427368164, 0.010054722428321838, 0.010425597429275513, 0.010796472430229187, 0.011167347431182861]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 3.0, 5.0, 6.0, 6.0, 8.0, 15.0, 13.0, 13.0, 14.0, 18.0, 25.0, 30.0, 34.0, 39.0, 32.0, 38.0, 33.0, 40.0, 45.0, 49.0, 58.0, 52.0, 46.0, 52.0, 44.0, 34.0, 47.0, 32.0, 32.0, 16.0, 23.0, 20.0, 18.0, 12.0, 12.0, 6.0, 6.0, 9.0, 5.0, 7.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-33.21875, -32.30615234375, -31.3935546875, -30.48095703125, -29.568359375, -28.65576171875, -27.7431640625, -26.83056640625, -25.91796875, -25.00537109375, -24.0927734375, -23.18017578125, -22.267578125, -21.35498046875, -20.4423828125, -19.52978515625, -18.6171875, -17.70458984375, -16.7919921875, -15.87939453125, -14.966796875, -14.05419921875, -13.1416015625, -12.22900390625, -11.31640625, -10.40380859375, -9.4912109375, -8.57861328125, -7.666015625, -6.75341796875, -5.8408203125, -4.92822265625, -4.015625, -3.10302734375, -2.1904296875, -1.27783203125, -0.365234375, 0.54736328125, 1.4599609375, 2.37255859375, 3.28515625, 4.19775390625, 5.1103515625, 6.02294921875, 6.935546875, 7.84814453125, 8.7607421875, 9.67333984375, 10.5859375, 11.49853515625, 12.4111328125, 13.32373046875, 14.236328125, 15.14892578125, 16.0615234375, 16.97412109375, 17.88671875, 18.79931640625, 19.7119140625, 20.62451171875, 21.537109375, 22.44970703125, 23.3623046875, 24.27490234375, 25.1875]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 4.0, 7.0, 9.0, 8.0, 9.0, 25.0, 29.0, 32.0, 60.0, 102.0, 161.0, 303.0, 496.0, 971.0, 1903.0, 4013.0, 9328.0, 23480.0, 66954.0, 270755.0, 500695.0, 110130.0, 34638.0, 13357.0, 5827.0, 2472.0, 1248.0, 676.0, 316.0, 181.0, 112.0, 90.0, 42.0, 35.0, 24.0, 17.0, 9.0, 12.0, 8.0, 8.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-19.53125, -18.99169921875, -18.4521484375, -17.91259765625, -17.373046875, -16.83349609375, -16.2939453125, -15.75439453125, -15.21484375, -14.67529296875, -14.1357421875, -13.59619140625, -13.056640625, -12.51708984375, -11.9775390625, -11.43798828125, -10.8984375, -10.35888671875, -9.8193359375, -9.27978515625, -8.740234375, -8.20068359375, -7.6611328125, -7.12158203125, -6.58203125, -6.04248046875, -5.5029296875, -4.96337890625, -4.423828125, -3.88427734375, -3.3447265625, -2.80517578125, -2.265625, -1.72607421875, -1.1865234375, -0.64697265625, -0.107421875, 0.43212890625, 0.9716796875, 1.51123046875, 2.05078125, 2.59033203125, 3.1298828125, 3.66943359375, 4.208984375, 4.74853515625, 5.2880859375, 5.82763671875, 6.3671875, 6.90673828125, 7.4462890625, 7.98583984375, 8.525390625, 9.06494140625, 9.6044921875, 10.14404296875, 10.68359375, 11.22314453125, 11.7626953125, 12.30224609375, 12.841796875, 13.38134765625, 13.9208984375, 14.46044921875, 15.0]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 4.0, 1.0, 6.0, 3.0, 6.0, 13.0, 12.0, 12.0, 17.0, 16.0, 26.0, 22.0, 14.0, 28.0, 36.0, 42.0, 41.0, 42.0, 56.0, 50.0, 68.0, 2008.0, 77.0, 68.0, 42.0, 44.0, 37.0, 28.0, 36.0, 40.0, 23.0, 37.0, 22.0, 20.0, 19.0, 15.0, 5.0, 7.0, 11.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-107.875, -104.5751953125, -101.275390625, -97.9755859375, -94.67578125, -91.3759765625, -88.076171875, -84.7763671875, -81.4765625, -78.1767578125, -74.876953125, -71.5771484375, -68.27734375, -64.9775390625, -61.677734375, -58.3779296875, -55.078125, -51.7783203125, -48.478515625, -45.1787109375, -41.87890625, -38.5791015625, -35.279296875, -31.9794921875, -28.6796875, -25.3798828125, -22.080078125, -18.7802734375, -15.48046875, -12.1806640625, -8.880859375, -5.5810546875, -2.28125, 1.0185546875, 4.318359375, 7.6181640625, 10.91796875, 14.2177734375, 17.517578125, 20.8173828125, 24.1171875, 27.4169921875, 30.716796875, 34.0166015625, 37.31640625, 40.6162109375, 43.916015625, 47.2158203125, 50.515625, 53.8154296875, 57.115234375, 60.4150390625, 63.71484375, 67.0146484375, 70.314453125, 73.6142578125, 76.9140625, 80.2138671875, 83.513671875, 86.8134765625, 90.11328125, 93.4130859375, 96.712890625, 100.0126953125, 103.3125]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 11.0, 5.0, 5.0, 14.0, 22.0, 19.0, 18.0, 47.0, 28.0, 43.0, 53.0, 61.0, 142.0, 306.0, 619.0, 1741.0, 24816.0, 3108507.0, 6756.0, 1342.0, 447.0, 229.0, 132.0, 87.0, 57.0, 32.0, 28.0, 21.0, 28.0, 19.0, 14.0, 14.0, 11.0, 12.0, 7.0, 4.0, 7.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-180.375, -174.62109375, -168.8671875, -163.11328125, -157.359375, -151.60546875, -145.8515625, -140.09765625, -134.34375, -128.58984375, -122.8359375, -117.08203125, -111.328125, -105.57421875, -99.8203125, -94.06640625, -88.3125, -82.55859375, -76.8046875, -71.05078125, -65.296875, -59.54296875, -53.7890625, -48.03515625, -42.28125, -36.52734375, -30.7734375, -25.01953125, -19.265625, -13.51171875, -7.7578125, -2.00390625, 3.75, 9.50390625, 15.2578125, 21.01171875, 26.765625, 32.51953125, 38.2734375, 44.02734375, 49.78125, 55.53515625, 61.2890625, 67.04296875, 72.796875, 78.55078125, 84.3046875, 90.05859375, 95.8125, 101.56640625, 107.3203125, 113.07421875, 118.828125, 124.58203125, 130.3359375, 136.08984375, 141.84375, 147.59765625, 153.3515625, 159.10546875, 164.859375, 170.61328125, 176.3671875, 182.12109375, 187.875]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 26.0, 580.0, 367.0, 40.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-663.2680053710938, -650.4867553710938, -637.7055053710938, -624.9241943359375, -612.1429443359375, -599.3616943359375, -586.5804443359375, -573.7991943359375, -561.0178833007812, -548.2366333007812, -535.4553833007812, -522.674072265625, -509.892822265625, -497.111572265625, -484.330322265625, -471.5490417480469, -458.767822265625, -445.986572265625, -433.2052917480469, -420.4240417480469, -407.64276123046875, -394.86151123046875, -382.08026123046875, -369.2989807128906, -356.5177001953125, -343.7364501953125, -330.9551696777344, -318.1739196777344, -305.39263916015625, -292.61138916015625, -279.83013916015625, -267.0488586425781, -254.2676239013672, -241.48635864257812, -228.70509338378906, -215.923828125, -203.142578125, -190.36131286621094, -177.58004760742188, -164.79879760742188, -152.01751708984375, -139.2362518310547, -126.45499420166016, -113.6737289428711, -100.89247131347656, -88.1112060546875, -75.32994079589844, -62.548683166503906, -49.767425537109375, -36.98616409301758, -24.20490074157715, -11.423637390136719, 1.3576240539550781, 14.138885498046875, 26.920150756835938, 39.70140838623047, 52.48267364501953, 65.2639389038086, 78.04519653320312, 90.82646179199219, 103.60772705078125, 116.38898468017578, 129.17025756835938, 141.95150756835938, 154.73277282714844]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 6.0, 2.0, 6.0, 8.0, 12.0, 8.0, 13.0, 16.0, 20.0, 19.0, 16.0, 24.0, 22.0, 34.0, 35.0, 32.0, 37.0, 36.0, 37.0, 39.0, 43.0, 51.0, 40.0, 45.0, 39.0, 37.0, 31.0, 33.0, 30.0, 34.0, 22.0, 39.0, 19.0, 25.0, 17.0, 14.0, 11.0, 11.0, 5.0, 2.0, 7.0, 8.0, 4.0, 5.0, 3.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-301.5364074707031, -291.8893737792969, -282.2423400878906, -272.5953063964844, -262.94830322265625, -253.30125427246094, -243.65423583984375, -234.0072021484375, -224.36016845703125, -214.713134765625, -205.06610107421875, -195.41908264160156, -185.7720489501953, -176.12501525878906, -166.47799682617188, -156.83096313476562, -147.18392944335938, -137.53689575195312, -127.8898696899414, -118.24284362792969, -108.59580993652344, -98.94877624511719, -89.30175018310547, -79.65472412109375, -70.0076904296875, -60.360660552978516, -50.71363067626953, -41.06660079956055, -31.419570922851562, -21.772541046142578, -12.125511169433594, -2.478485107421875, 7.168548583984375, 16.81557846069336, 26.462608337402344, 36.10963821411133, 45.75666809082031, 55.4036979675293, 65.05072784423828, 74.69775390625, 84.34478759765625, 93.9918212890625, 103.63884735107422, 113.28587341308594, 122.93290710449219, 132.57994079589844, 142.22695922851562, 151.87399291992188, 161.52102661132812, 171.16806030273438, 180.81509399414062, 190.4621124267578, 200.10914611816406, 209.7561798095703, 219.4031982421875, 229.05023193359375, 238.697265625, 248.34429931640625, 257.9913330078125, 267.63836669921875, 277.285400390625, 286.9324035644531, 296.5794372558594, 306.2264709472656, 315.8735046386719]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 6.0, 6.0, 4.0, 10.0, 14.0, 11.0, 13.0, 15.0, 18.0, 28.0, 21.0, 29.0, 34.0, 37.0, 32.0, 40.0, 35.0, 43.0, 54.0, 45.0, 52.0, 58.0, 45.0, 51.0, 33.0, 36.0, 42.0, 35.0, 22.0, 16.0, 21.0, 21.0, 11.0, 13.0, 7.0, 13.0, 6.0, 6.0, 5.0, 4.0, 9.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-32.75, -31.835205078125, -30.92041015625, -30.005615234375, -29.0908203125, -28.176025390625, -27.26123046875, -26.346435546875, -25.431640625, -24.516845703125, -23.60205078125, -22.687255859375, -21.7724609375, -20.857666015625, -19.94287109375, -19.028076171875, -18.11328125, -17.198486328125, -16.28369140625, -15.368896484375, -14.4541015625, -13.539306640625, -12.62451171875, -11.709716796875, -10.794921875, -9.880126953125, -8.96533203125, -8.050537109375, -7.1357421875, -6.220947265625, -5.30615234375, -4.391357421875, -3.4765625, -2.561767578125, -1.64697265625, -0.732177734375, 0.1826171875, 1.097412109375, 2.01220703125, 2.927001953125, 3.841796875, 4.756591796875, 5.67138671875, 6.586181640625, 7.5009765625, 8.415771484375, 9.33056640625, 10.245361328125, 11.16015625, 12.074951171875, 12.98974609375, 13.904541015625, 14.8193359375, 15.734130859375, 16.64892578125, 17.563720703125, 18.478515625, 19.393310546875, 20.30810546875, 21.222900390625, 22.1376953125, 23.052490234375, 23.96728515625, 24.882080078125, 25.796875]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 8.0, 3.0, 9.0, 14.0, 11.0, 13.0, 15.0, 26.0, 22.0, 43.0, 48.0, 73.0, 129.0, 227.0, 470.0, 1047.0, 2765.0, 9541.0, 415606.0, 3739322.0, 18018.0, 4127.0, 1389.0, 620.0, 270.0, 164.0, 102.0, 46.0, 29.0, 22.0, 20.0, 16.0, 13.0, 8.0, 14.0, 5.0, 8.0, 4.0, 5.0, 8.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-207.375, -201.642578125, -195.91015625, -190.177734375, -184.4453125, -178.712890625, -172.98046875, -167.248046875, -161.515625, -155.783203125, -150.05078125, -144.318359375, -138.5859375, -132.853515625, -127.12109375, -121.388671875, -115.65625, -109.923828125, -104.19140625, -98.458984375, -92.7265625, -86.994140625, -81.26171875, -75.529296875, -69.796875, -64.064453125, -58.33203125, -52.599609375, -46.8671875, -41.134765625, -35.40234375, -29.669921875, -23.9375, -18.205078125, -12.47265625, -6.740234375, -1.0078125, 4.724609375, 10.45703125, 16.189453125, 21.921875, 27.654296875, 33.38671875, 39.119140625, 44.8515625, 50.583984375, 56.31640625, 62.048828125, 67.78125, 73.513671875, 79.24609375, 84.978515625, 90.7109375, 96.443359375, 102.17578125, 107.908203125, 113.640625, 119.373046875, 125.10546875, 130.837890625, 136.5703125, 142.302734375, 148.03515625, 153.767578125, 159.5]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 5.0, 5.0, 11.0, 10.0, 8.0, 9.0, 15.0, 13.0, 14.0, 24.0, 27.0, 74.0, 160.0, 362.0, 817.0, 1247.0, 664.0, 292.0, 112.0, 48.0, 29.0, 19.0, 24.0, 11.0, 16.0, 9.0, 9.0, 2.0, 3.0, 2.0, 8.0, 3.0, 7.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-95.5, -92.873046875, -90.24609375, -87.619140625, -84.9921875, -82.365234375, -79.73828125, -77.111328125, -74.484375, -71.857421875, -69.23046875, -66.603515625, -63.9765625, -61.349609375, -58.72265625, -56.095703125, -53.46875, -50.841796875, -48.21484375, -45.587890625, -42.9609375, -40.333984375, -37.70703125, -35.080078125, -32.453125, -29.826171875, -27.19921875, -24.572265625, -21.9453125, -19.318359375, -16.69140625, -14.064453125, -11.4375, -8.810546875, -6.18359375, -3.556640625, -0.9296875, 1.697265625, 4.32421875, 6.951171875, 9.578125, 12.205078125, 14.83203125, 17.458984375, 20.0859375, 22.712890625, 25.33984375, 27.966796875, 30.59375, 33.220703125, 35.84765625, 38.474609375, 41.1015625, 43.728515625, 46.35546875, 48.982421875, 51.609375, 54.236328125, 56.86328125, 59.490234375, 62.1171875, 64.744140625, 67.37109375, 69.998046875, 72.625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 9.0, 12.0, 13.0, 23.0, 37.0, 60.0, 105.0, 175.0, 302.0, 507.0, 892.0, 1653.0, 3171.0, 6540.0, 14430.0, 42757.0, 739559.0, 3279486.0, 68900.0, 19250.0, 8083.0, 3843.0, 1973.0, 997.0, 628.0, 352.0, 197.0, 126.0, 76.0, 42.0, 30.0, 16.0, 12.0, 6.0, 4.0, 6.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-138.375, -133.458984375, -128.54296875, -123.626953125, -118.7109375, -113.794921875, -108.87890625, -103.962890625, -99.046875, -94.130859375, -89.21484375, -84.298828125, -79.3828125, -74.466796875, -69.55078125, -64.634765625, -59.71875, -54.802734375, -49.88671875, -44.970703125, -40.0546875, -35.138671875, -30.22265625, -25.306640625, -20.390625, -15.474609375, -10.55859375, -5.642578125, -0.7265625, 4.189453125, 9.10546875, 14.021484375, 18.9375, 23.853515625, 28.76953125, 33.685546875, 38.6015625, 43.517578125, 48.43359375, 53.349609375, 58.265625, 63.181640625, 68.09765625, 73.013671875, 77.9296875, 82.845703125, 87.76171875, 92.677734375, 97.59375, 102.509765625, 107.42578125, 112.341796875, 117.2578125, 122.173828125, 127.08984375, 132.005859375, 136.921875, 141.837890625, 146.75390625, 151.669921875, 156.5859375, 161.501953125, 166.41796875, 171.333984375, 176.25]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 7.0, 5.0, 7.0, 6.0, 7.0, 21.0, 14.0, 19.0, 56.0, 78.0, 154.0, 202.0, 179.0, 109.0, 47.0, 32.0, 28.0, 12.0, 8.0, 8.0, 4.0, 2.0, 2.0, 5.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-483.0494384765625, -470.2247009277344, -457.3999328613281, -444.5751953125, -431.7504577636719, -418.92572021484375, -406.1009521484375, -393.2762145996094, -380.45147705078125, -367.6267395019531, -354.8019714355469, -341.97723388671875, -329.1524963378906, -316.3277587890625, -303.50299072265625, -290.6782531738281, -277.8534851074219, -265.02874755859375, -252.20399475097656, -239.37924194335938, -226.55450439453125, -213.72975158691406, -200.90499877929688, -188.08026123046875, -175.25550842285156, -162.43075561523438, -149.60601806640625, -136.78126525878906, -123.9565200805664, -111.13177490234375, -98.30702209472656, -85.4822769165039, -72.65756225585938, -59.83281707763672, -47.0080680847168, -34.183319091796875, -21.35857391357422, -8.533828735351562, 4.290924072265625, 17.11566925048828, 29.940414428710938, 42.765159606933594, 55.589908599853516, 68.41465759277344, 81.2394027709961, 94.06414794921875, 106.88890075683594, 119.7136459350586, 132.53839111328125, 145.36314392089844, 158.18788146972656, 171.01263427734375, 183.83737182617188, 196.66212463378906, 209.48687744140625, 222.31161499023438, 235.13636779785156, 247.96112060546875, 260.7858581542969, 273.610595703125, 286.43536376953125, 299.2601013183594, 312.0848388671875, 324.90960693359375, 337.7343444824219]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 5.0, 1.0, 0.0, 3.0, 3.0, 8.0, 1.0, 9.0, 13.0, 10.0, 12.0, 12.0, 14.0, 18.0, 28.0, 30.0, 27.0, 34.0, 27.0, 29.0, 38.0, 33.0, 41.0, 33.0, 30.0, 40.0, 53.0, 42.0, 31.0, 34.0, 31.0, 24.0, 32.0, 35.0, 29.0, 28.0, 25.0, 28.0, 19.0, 18.0, 11.0, 18.0, 13.0, 8.0, 6.0, 10.0, 2.0, 4.0, 3.0, 2.0, 2.0, 4.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-173.11122131347656, -167.31906127929688, -161.52688598632812, -155.73472595214844, -149.94256591796875, -144.150390625, -138.3582305908203, -132.56607055664062, -126.7739028930664, -120.98173522949219, -115.1895751953125, -109.39740753173828, -103.60523986816406, -97.81307983398438, -92.02091217041016, -86.22874450683594, -80.43658447265625, -74.64441680908203, -68.85225677490234, -63.060089111328125, -57.26792526245117, -51.47576141357422, -45.68359375, -39.89142990112305, -34.099266052246094, -28.30710220336914, -22.514936447143555, -16.72277069091797, -10.930606842041016, -5.1384429931640625, 0.6537246704101562, 6.445888519287109, 12.238067626953125, 18.030231475830078, 23.822397232055664, 29.61456298828125, 35.4067268371582, 41.198890686035156, 46.991058349609375, 52.78322219848633, 58.57538604736328, 64.3675537109375, 70.15971374511719, 75.9518814086914, 81.74404907226562, 87.53620910644531, 93.32837677001953, 99.12054443359375, 104.91270446777344, 110.70487213134766, 116.49703216552734, 122.28919982910156, 128.08135986328125, 133.87353515625, 139.6656951904297, 145.45785522460938, 151.25003051757812, 157.0421905517578, 162.83436584472656, 168.62652587890625, 174.41868591308594, 180.21084594726562, 186.00302124023438, 191.79518127441406, 197.58734130859375]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 5.0, 4.0, 5.0, 2.0, 12.0, 10.0, 7.0, 12.0, 20.0, 15.0, 14.0, 28.0, 20.0, 32.0, 31.0, 33.0, 30.0, 49.0, 54.0, 43.0, 50.0, 52.0, 57.0, 39.0, 32.0, 39.0, 43.0, 29.0, 33.0, 23.0, 33.0, 29.0, 18.0, 20.0, 12.0, 9.0, 12.0, 5.0, 7.0, 10.0, 7.0, 9.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0], "bins": [-32.4375, -31.529052734375, -30.62060546875, -29.712158203125, -28.8037109375, -27.895263671875, -26.98681640625, -26.078369140625, -25.169921875, -24.261474609375, -23.35302734375, -22.444580078125, -21.5361328125, -20.627685546875, -19.71923828125, -18.810791015625, -17.90234375, -16.993896484375, -16.08544921875, -15.177001953125, -14.2685546875, -13.360107421875, -12.45166015625, -11.543212890625, -10.634765625, -9.726318359375, -8.81787109375, -7.909423828125, -7.0009765625, -6.092529296875, -5.18408203125, -4.275634765625, -3.3671875, -2.458740234375, -1.55029296875, -0.641845703125, 0.2666015625, 1.175048828125, 2.08349609375, 2.991943359375, 3.900390625, 4.808837890625, 5.71728515625, 6.625732421875, 7.5341796875, 8.442626953125, 9.35107421875, 10.259521484375, 11.16796875, 12.076416015625, 12.98486328125, 13.893310546875, 14.8017578125, 15.710205078125, 16.61865234375, 17.527099609375, 18.435546875, 19.343994140625, 20.25244140625, 21.160888671875, 22.0693359375, 22.977783203125, 23.88623046875, 24.794677734375, 25.703125]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 0.0, 4.0, 4.0, 3.0, 8.0, 6.0, 17.0, 11.0, 21.0, 37.0, 60.0, 75.0, 87.0, 147.0, 231.0, 326.0, 488.0, 702.0, 1021.0, 1410.0, 2154.0, 3198.0, 4752.0, 7444.0, 11118.0, 17603.0, 27838.0, 45911.0, 81538.0, 162298.0, 291364.0, 173409.0, 85885.0, 47776.0, 29010.0, 18201.0, 11629.0, 7431.0, 4977.0, 3379.0, 2209.0, 1491.0, 1050.0, 667.0, 483.0, 332.0, 222.0, 149.0, 125.0, 80.0, 55.0, 35.0, 34.0, 19.0, 21.0, 10.0, 5.0, 0.0, 1.0, 5.0, 4.0], "bins": [-1.4140625, -1.3719024658203125, -1.329742431640625, -1.2875823974609375, -1.24542236328125, -1.2032623291015625, -1.161102294921875, -1.1189422607421875, -1.0767822265625, -1.0346221923828125, -0.992462158203125, -0.9503021240234375, -0.90814208984375, -0.8659820556640625, -0.823822021484375, -0.7816619873046875, -0.739501953125, -0.6973419189453125, -0.655181884765625, -0.6130218505859375, -0.57086181640625, -0.5287017822265625, -0.486541748046875, -0.4443817138671875, -0.4022216796875, -0.3600616455078125, -0.317901611328125, -0.2757415771484375, -0.23358154296875, -0.1914215087890625, -0.149261474609375, -0.1071014404296875, -0.06494140625, -0.0227813720703125, 0.019378662109375, 0.0615386962890625, 0.10369873046875, 0.1458587646484375, 0.188018798828125, 0.2301788330078125, 0.2723388671875, 0.3144989013671875, 0.356658935546875, 0.3988189697265625, 0.44097900390625, 0.4831390380859375, 0.525299072265625, 0.5674591064453125, 0.609619140625, 0.6517791748046875, 0.693939208984375, 0.7360992431640625, 0.77825927734375, 0.8204193115234375, 0.862579345703125, 0.9047393798828125, 0.9468994140625, 0.9890594482421875, 1.031219482421875, 1.0733795166015625, 1.11553955078125, 1.1576995849609375, 1.199859619140625, 1.2420196533203125, 1.2841796875]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 6.0, 3.0, 7.0, 6.0, 5.0, 18.0, 12.0, 12.0, 13.0, 24.0, 17.0, 27.0, 22.0, 20.0, 33.0, 28.0, 33.0, 28.0, 37.0, 45.0, 30.0, 39.0, 36.0, 1055.0, 30.0, 49.0, 38.0, 35.0, 30.0, 40.0, 27.0, 28.0, 30.0, 24.0, 18.0, 18.0, 20.0, 14.0, 9.0, 11.0, 14.0, 8.0, 9.0, 10.0, 2.0, 4.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0], "bins": [-18.515625, -17.96337890625, -17.4111328125, -16.85888671875, -16.306640625, -15.75439453125, -15.2021484375, -14.64990234375, -14.09765625, -13.54541015625, -12.9931640625, -12.44091796875, -11.888671875, -11.33642578125, -10.7841796875, -10.23193359375, -9.6796875, -9.12744140625, -8.5751953125, -8.02294921875, -7.470703125, -6.91845703125, -6.3662109375, -5.81396484375, -5.26171875, -4.70947265625, -4.1572265625, -3.60498046875, -3.052734375, -2.50048828125, -1.9482421875, -1.39599609375, -0.84375, -0.29150390625, 0.2607421875, 0.81298828125, 1.365234375, 1.91748046875, 2.4697265625, 3.02197265625, 3.57421875, 4.12646484375, 4.6787109375, 5.23095703125, 5.783203125, 6.33544921875, 6.8876953125, 7.43994140625, 7.9921875, 8.54443359375, 9.0966796875, 9.64892578125, 10.201171875, 10.75341796875, 11.3056640625, 11.85791015625, 12.41015625, 12.96240234375, 13.5146484375, 14.06689453125, 14.619140625, 15.17138671875, 15.7236328125, 16.27587890625, 16.828125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 2.0, 7.0, 10.0, 21.0, 30.0, 39.0, 50.0, 79.0, 110.0, 162.0, 239.0, 324.0, 534.0, 796.0, 1212.0, 1704.0, 2677.0, 4266.0, 6551.0, 10283.0, 16507.0, 26783.0, 45244.0, 80609.0, 167190.0, 1347251.0, 177579.0, 84948.0, 46759.0, 27901.0, 17206.0, 10764.0, 6790.0, 4331.0, 2763.0, 1806.0, 1222.0, 789.0, 504.0, 344.0, 242.0, 140.0, 118.0, 77.0, 63.0, 36.0, 26.0, 14.0, 9.0, 7.0, 0.0, 6.0, 7.0, 2.0, 3.0], "bins": [-1.5703125, -1.52484130859375, -1.4793701171875, -1.43389892578125, -1.388427734375, -1.34295654296875, -1.2974853515625, -1.25201416015625, -1.20654296875, -1.16107177734375, -1.1156005859375, -1.07012939453125, -1.024658203125, -0.97918701171875, -0.9337158203125, -0.88824462890625, -0.8427734375, -0.79730224609375, -0.7518310546875, -0.70635986328125, -0.660888671875, -0.61541748046875, -0.5699462890625, -0.52447509765625, -0.47900390625, -0.43353271484375, -0.3880615234375, -0.34259033203125, -0.297119140625, -0.25164794921875, -0.2061767578125, -0.16070556640625, -0.115234375, -0.06976318359375, -0.0242919921875, 0.02117919921875, 0.066650390625, 0.11212158203125, 0.1575927734375, 0.20306396484375, 0.24853515625, 0.29400634765625, 0.3394775390625, 0.38494873046875, 0.430419921875, 0.47589111328125, 0.5213623046875, 0.56683349609375, 0.6123046875, 0.65777587890625, 0.7032470703125, 0.74871826171875, 0.794189453125, 0.83966064453125, 0.8851318359375, 0.93060302734375, 0.97607421875, 1.02154541015625, 1.0670166015625, 1.11248779296875, 1.157958984375, 1.20343017578125, 1.2489013671875, 1.29437255859375, 1.33984375]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 6.0, 2.0, 5.0, 10.0, 10.0, 10.0, 10.0, 18.0, 18.0, 28.0, 24.0, 39.0, 40.0, 50.0, 73.0, 81.0, 118.0, 90.0, 77.0, 60.0, 32.0, 49.0, 26.0, 28.0, 12.0, 17.0, 11.0, 16.0, 8.0, 7.0, 4.0, 7.0, 3.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0196990966796875, -0.019016027450561523, -0.018332958221435547, -0.01764988899230957, -0.016966819763183594, -0.016283750534057617, -0.01560068130493164, -0.014917612075805664, -0.014234542846679688, -0.013551473617553711, -0.012868404388427734, -0.012185335159301758, -0.011502265930175781, -0.010819196701049805, -0.010136127471923828, -0.009453058242797852, -0.008769989013671875, -0.008086919784545898, -0.007403850555419922, -0.006720781326293945, -0.006037712097167969, -0.005354642868041992, -0.004671573638916016, -0.003988504409790039, -0.0033054351806640625, -0.002622365951538086, -0.0019392967224121094, -0.0012562274932861328, -0.0005731582641601562, 0.00010991096496582031, 0.0007929801940917969, 0.0014760494232177734, 0.00215911865234375, 0.0028421878814697266, 0.003525257110595703, 0.00420832633972168, 0.004891395568847656, 0.005574464797973633, 0.006257534027099609, 0.006940603256225586, 0.0076236724853515625, 0.008306741714477539, 0.008989810943603516, 0.009672880172729492, 0.010355949401855469, 0.011039018630981445, 0.011722087860107422, 0.012405157089233398, 0.013088226318359375, 0.013771295547485352, 0.014454364776611328, 0.015137434005737305, 0.01582050323486328, 0.016503572463989258, 0.017186641693115234, 0.01786971092224121, 0.018552780151367188, 0.019235849380493164, 0.01991891860961914, 0.020601987838745117, 0.021285057067871094, 0.02196812629699707, 0.022651195526123047, 0.023334264755249023, 0.024017333984375]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 3.0, 8.0, 10.0, 5.0, 11.0, 11.0, 23.0, 28.0, 32.0, 41.0, 49.0, 70.0, 91.0, 127.0, 182.0, 340.0, 1235.0, 12500.0, 865461.0, 161229.0, 5449.0, 750.0, 263.0, 161.0, 110.0, 87.0, 66.0, 44.0, 43.0, 25.0, 23.0, 21.0, 11.0, 12.0, 4.0, 10.0, 5.0, 4.0, 2.0, 4.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.352783203125, -0.34265899658203125, -0.3325347900390625, -0.32241058349609375, -0.312286376953125, -0.30216217041015625, -0.2920379638671875, -0.28191375732421875, -0.27178955078125, -0.26166534423828125, -0.2515411376953125, -0.24141693115234375, -0.231292724609375, -0.22116851806640625, -0.2110443115234375, -0.20092010498046875, -0.1907958984375, -0.18067169189453125, -0.1705474853515625, -0.16042327880859375, -0.150299072265625, -0.14017486572265625, -0.1300506591796875, -0.11992645263671875, -0.10980224609375, -0.09967803955078125, -0.0895538330078125, -0.07942962646484375, -0.069305419921875, -0.05918121337890625, -0.0490570068359375, -0.03893280029296875, -0.02880859375, -0.01868438720703125, -0.0085601806640625, 0.00156402587890625, 0.011688232421875, 0.02181243896484375, 0.0319366455078125, 0.04206085205078125, 0.05218505859375, 0.06230926513671875, 0.0724334716796875, 0.08255767822265625, 0.092681884765625, 0.10280609130859375, 0.1129302978515625, 0.12305450439453125, 0.1331787109375, 0.14330291748046875, 0.1534271240234375, 0.16355133056640625, 0.173675537109375, 0.18379974365234375, 0.1939239501953125, 0.20404815673828125, 0.21417236328125, 0.22429656982421875, 0.2344207763671875, 0.24454498291015625, 0.254669189453125, 0.26479339599609375, 0.2749176025390625, 0.28504180908203125, 0.295166015625]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 11.0, 56.0, 537.0, 371.0, 36.0, 1.0, 3.0], "bins": [-0.20111361145973206, -0.19775904715061188, -0.1944044828414917, -0.19104990363121033, -0.18769533932209015, -0.18434077501296997, -0.1809862107038498, -0.17763164639472961, -0.17427708208560944, -0.17092251777648926, -0.16756795346736908, -0.1642133891582489, -0.16085880994796753, -0.15750424563884735, -0.15414968132972717, -0.150795117020607, -0.14744055271148682, -0.14408598840236664, -0.14073142409324646, -0.1373768448829651, -0.1340222805738449, -0.13066771626472473, -0.12731315195560455, -0.12395858764648438, -0.120604008436203, -0.11724944412708282, -0.11389487236738205, -0.11054030805826187, -0.1071857437491417, -0.10383117198944092, -0.10047660768032074, -0.09712204337120056, -0.09376747161149979, -0.09041290730237961, -0.08705833554267883, -0.08370377123355865, -0.08034920692443848, -0.0769946426153183, -0.07364007085561752, -0.07028550654649734, -0.06693094223737717, -0.06357637792825699, -0.06022180989384651, -0.056867241859436035, -0.05351267755031586, -0.05015810951590538, -0.046803541481494904, -0.043448977172374725, -0.04009440541267395, -0.036739837378263474, -0.033385273069143295, -0.03003070503473282, -0.02667613886296749, -0.023321572691202164, -0.019967004656791687, -0.01661243848502636, -0.013257873244583607, -0.009903306141495705, -0.006548739969730377, -0.003194172866642475, 0.00016039330512285233, 0.0035149594768881798, 0.0068695275112986565, 0.010224093683063984, 0.013578659854829311]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 5.0, 4.0, 7.0, 9.0, 13.0, 5.0, 15.0, 24.0, 17.0, 23.0, 28.0, 34.0, 36.0, 47.0, 46.0, 51.0, 50.0, 37.0, 52.0, 42.0, 48.0, 55.0, 31.0, 44.0, 33.0, 28.0, 46.0, 29.0, 26.0, 13.0, 22.0, 15.0, 16.0, 11.0, 11.0, 7.0, 7.0, 10.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.012270510196685791, -0.011865060776472092, -0.011459611356258392, -0.011054161936044693, -0.010648712515830994, -0.010243263095617294, -0.009837813675403595, -0.009432364255189896, -0.009026914834976196, -0.008621465414762497, -0.008216015994548798, -0.007810566574335098, -0.007405117154121399, -0.0069996677339077, -0.006594218313694, -0.006188768893480301, -0.0057833194732666016, -0.005377870053052902, -0.004972420632839203, -0.0045669712126255035, -0.004161521792411804, -0.003756072372198105, -0.0033506229519844055, -0.002945173531770706, -0.002539724111557007, -0.0021342746913433075, -0.0017288252711296082, -0.0013233758509159088, -0.0009179264307022095, -0.0005124770104885101, -0.00010702759027481079, 0.00029842182993888855, 0.0007038712501525879, 0.0011093206703662872, 0.0015147700905799866, 0.001920219510793686, 0.0023256689310073853, 0.0027311183512210846, 0.003136567771434784, 0.0035420171916484833, 0.003947466611862183, 0.004352916032075882, 0.004758365452289581, 0.005163814872503281, 0.00556926429271698, 0.005974713712930679, 0.006380163133144379, 0.006785612553358078, 0.007191061973571777, 0.007596511393785477, 0.008001960813999176, 0.008407410234212875, 0.008812859654426575, 0.009218309074640274, 0.009623758494853973, 0.010029207915067673, 0.010434657335281372, 0.010840106755495071, 0.01124555617570877, 0.01165100559592247, 0.01205645501613617, 0.012461904436349869, 0.012867353856563568, 0.013272803276777267, 0.013678252696990967]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 5.0, 4.0, 5.0, 2.0, 12.0, 10.0, 7.0, 12.0, 20.0, 15.0, 14.0, 28.0, 20.0, 32.0, 31.0, 33.0, 30.0, 49.0, 54.0, 44.0, 51.0, 51.0, 56.0, 39.0, 34.0, 37.0, 43.0, 29.0, 33.0, 23.0, 33.0, 30.0, 17.0, 20.0, 12.0, 9.0, 12.0, 5.0, 7.0, 10.0, 7.0, 10.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0], "bins": [-32.4375, -31.52880859375, -30.6201171875, -29.71142578125, -28.802734375, -27.89404296875, -26.9853515625, -26.07666015625, -25.16796875, -24.25927734375, -23.3505859375, -22.44189453125, -21.533203125, -20.62451171875, -19.7158203125, -18.80712890625, -17.8984375, -16.98974609375, -16.0810546875, -15.17236328125, -14.263671875, -13.35498046875, -12.4462890625, -11.53759765625, -10.62890625, -9.72021484375, -8.8115234375, -7.90283203125, -6.994140625, -6.08544921875, -5.1767578125, -4.26806640625, -3.359375, -2.45068359375, -1.5419921875, -0.63330078125, 0.275390625, 1.18408203125, 2.0927734375, 3.00146484375, 3.91015625, 4.81884765625, 5.7275390625, 6.63623046875, 7.544921875, 8.45361328125, 9.3623046875, 10.27099609375, 11.1796875, 12.08837890625, 12.9970703125, 13.90576171875, 14.814453125, 15.72314453125, 16.6318359375, 17.54052734375, 18.44921875, 19.35791015625, 20.2666015625, 21.17529296875, 22.083984375, 22.99267578125, 23.9013671875, 24.81005859375, 25.71875]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 1.0, 6.0, 4.0, 7.0, 6.0, 14.0, 22.0, 25.0, 31.0, 47.0, 56.0, 71.0, 101.0, 125.0, 201.0, 281.0, 420.0, 605.0, 807.0, 1193.0, 1891.0, 3117.0, 6968.0, 50173.0, 885533.0, 78888.0, 8439.0, 3295.0, 1981.0, 1320.0, 840.0, 592.0, 423.0, 303.0, 239.0, 136.0, 108.0, 83.0, 54.0, 49.0, 32.0, 20.0, 16.0, 14.0, 7.0, 4.0, 9.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-48.15625, -46.470703125, -44.78515625, -43.099609375, -41.4140625, -39.728515625, -38.04296875, -36.357421875, -34.671875, -32.986328125, -31.30078125, -29.615234375, -27.9296875, -26.244140625, -24.55859375, -22.873046875, -21.1875, -19.501953125, -17.81640625, -16.130859375, -14.4453125, -12.759765625, -11.07421875, -9.388671875, -7.703125, -6.017578125, -4.33203125, -2.646484375, -0.9609375, 0.724609375, 2.41015625, 4.095703125, 5.78125, 7.466796875, 9.15234375, 10.837890625, 12.5234375, 14.208984375, 15.89453125, 17.580078125, 19.265625, 20.951171875, 22.63671875, 24.322265625, 26.0078125, 27.693359375, 29.37890625, 31.064453125, 32.75, 34.435546875, 36.12109375, 37.806640625, 39.4921875, 41.177734375, 42.86328125, 44.548828125, 46.234375, 47.919921875, 49.60546875, 51.291015625, 52.9765625, 54.662109375, 56.34765625, 58.033203125, 59.71875]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 6.0, 4.0, 5.0, 9.0, 12.0, 15.0, 15.0, 20.0, 20.0, 29.0, 20.0, 33.0, 32.0, 39.0, 32.0, 29.0, 44.0, 50.0, 60.0, 1988.0, 122.0, 52.0, 47.0, 37.0, 42.0, 34.0, 39.0, 25.0, 34.0, 26.0, 15.0, 23.0, 20.0, 13.0, 12.0, 10.0, 13.0, 8.0, 5.0, 4.0, 4.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-108.75, -105.525390625, -102.30078125, -99.076171875, -95.8515625, -92.626953125, -89.40234375, -86.177734375, -82.953125, -79.728515625, -76.50390625, -73.279296875, -70.0546875, -66.830078125, -63.60546875, -60.380859375, -57.15625, -53.931640625, -50.70703125, -47.482421875, -44.2578125, -41.033203125, -37.80859375, -34.583984375, -31.359375, -28.134765625, -24.91015625, -21.685546875, -18.4609375, -15.236328125, -12.01171875, -8.787109375, -5.5625, -2.337890625, 0.88671875, 4.111328125, 7.3359375, 10.560546875, 13.78515625, 17.009765625, 20.234375, 23.458984375, 26.68359375, 29.908203125, 33.1328125, 36.357421875, 39.58203125, 42.806640625, 46.03125, 49.255859375, 52.48046875, 55.705078125, 58.9296875, 62.154296875, 65.37890625, 68.603515625, 71.828125, 75.052734375, 78.27734375, 81.501953125, 84.7265625, 87.951171875, 91.17578125, 94.400390625, 97.625]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 5.0, 4.0, 6.0, 7.0, 14.0, 14.0, 12.0, 13.0, 23.0, 25.0, 17.0, 35.0, 55.0, 53.0, 88.0, 133.0, 219.0, 385.0, 1084.0, 3748.0, 56607.0, 3071513.0, 8362.0, 1776.0, 672.0, 278.0, 157.0, 99.0, 68.0, 54.0, 32.0, 33.0, 19.0, 20.0, 18.0, 19.0, 9.0, 12.0, 5.0, 2.0, 7.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-156.75, -151.56640625, -146.3828125, -141.19921875, -136.015625, -130.83203125, -125.6484375, -120.46484375, -115.28125, -110.09765625, -104.9140625, -99.73046875, -94.546875, -89.36328125, -84.1796875, -78.99609375, -73.8125, -68.62890625, -63.4453125, -58.26171875, -53.078125, -47.89453125, -42.7109375, -37.52734375, -32.34375, -27.16015625, -21.9765625, -16.79296875, -11.609375, -6.42578125, -1.2421875, 3.94140625, 9.125, 14.30859375, 19.4921875, 24.67578125, 29.859375, 35.04296875, 40.2265625, 45.41015625, 50.59375, 55.77734375, 60.9609375, 66.14453125, 71.328125, 76.51171875, 81.6953125, 86.87890625, 92.0625, 97.24609375, 102.4296875, 107.61328125, 112.796875, 117.98046875, 123.1640625, 128.34765625, 133.53125, 138.71484375, 143.8984375, 149.08203125, 154.265625, 159.44921875, 164.6328125, 169.81640625, 175.0]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 8.0, 68.0, 658.0, 271.0, 14.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.49669647216797, -68.96754455566406, -54.43840026855469, -39.90924835205078, -25.38010025024414, -10.8509521484375, 3.6781997680664062, 18.20734405517578, 32.73649597167969, 47.26564407348633, 61.79479217529297, 76.32394409179688, 90.85308837890625, 105.38224029541016, 119.91139221191406, 134.44053649902344, 148.96969604492188, 163.49884033203125, 178.0279998779297, 192.55714416503906, 207.08628845214844, 221.61544799804688, 236.14459228515625, 250.67373657226562, 265.202880859375, 279.7320251464844, 294.26116943359375, 308.79034423828125, 323.3194885253906, 337.8486328125, 352.3777770996094, 366.90692138671875, 381.4360656738281, 395.9652099609375, 410.4943542480469, 425.02349853515625, 439.55267333984375, 454.0818176269531, 468.6109619140625, 483.1401062011719, 497.66925048828125, 512.1984252929688, 526.7275390625, 541.2567138671875, 555.7858276367188, 570.3150024414062, 584.8441162109375, 599.373291015625, 613.9024658203125, 628.431640625, 642.9607543945312, 657.4899291992188, 672.01904296875, 686.5482177734375, 701.077392578125, 715.6065063476562, 730.1356201171875, 744.664794921875, 759.1939086914062, 773.7230834960938, 788.252197265625, 802.7813720703125, 817.310546875, 831.8396606445312, 846.3688354492188]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 3.0, 9.0, 11.0, 11.0, 14.0, 16.0, 19.0, 24.0, 25.0, 24.0, 40.0, 35.0, 42.0, 40.0, 49.0, 55.0, 55.0, 50.0, 60.0, 58.0, 38.0, 34.0, 40.0, 33.0, 32.0, 38.0, 28.0, 13.0, 19.0, 16.0, 7.0, 14.0, 11.0, 8.0, 9.0, 6.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-377.87835693359375, -367.0213928222656, -356.1644287109375, -345.3074645996094, -334.45050048828125, -323.5935363769531, -312.736572265625, -301.8796081542969, -291.02264404296875, -280.1656799316406, -269.3087158203125, -258.4517517089844, -247.59478759765625, -236.73782348632812, -225.880859375, -215.02389526367188, -204.16693115234375, -193.30996704101562, -182.4530029296875, -171.59603881835938, -160.73907470703125, -149.88211059570312, -139.025146484375, -128.16818237304688, -117.31121826171875, -106.45425415039062, -95.5972900390625, -84.74032592773438, -73.88336181640625, -63.026397705078125, -52.16943359375, -41.312469482421875, -30.45550537109375, -19.598541259765625, -8.7415771484375, 2.115386962890625, 12.97235107421875, 23.829315185546875, 34.686279296875, 45.543243408203125, 56.40020751953125, 67.25717163085938, 78.1141357421875, 88.97109985351562, 99.82806396484375, 110.68502807617188, 121.5419921875, 132.39895629882812, 143.25592041015625, 154.11288452148438, 164.9698486328125, 175.82681274414062, 186.68377685546875, 197.54074096679688, 208.397705078125, 219.25466918945312, 230.11163330078125, 240.96859741210938, 251.8255615234375, 262.6825256347656, 273.53948974609375, 284.3964538574219, 295.25341796875, 306.1103820800781, 316.96734619140625]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 4.0, 2.0, 4.0, 3.0, 8.0, 9.0, 10.0, 7.0, 6.0, 23.0, 13.0, 21.0, 13.0, 30.0, 37.0, 28.0, 31.0, 31.0, 44.0, 58.0, 36.0, 51.0, 55.0, 52.0, 46.0, 37.0, 34.0, 40.0, 35.0, 33.0, 35.0, 22.0, 29.0, 22.0, 19.0, 7.0, 12.0, 13.0, 6.0, 5.0, 7.0, 12.0, 6.0, 7.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 4.0], "bins": [-33.03125, -32.108642578125, -31.18603515625, -30.263427734375, -29.3408203125, -28.418212890625, -27.49560546875, -26.572998046875, -25.650390625, -24.727783203125, -23.80517578125, -22.882568359375, -21.9599609375, -21.037353515625, -20.11474609375, -19.192138671875, -18.26953125, -17.346923828125, -16.42431640625, -15.501708984375, -14.5791015625, -13.656494140625, -12.73388671875, -11.811279296875, -10.888671875, -9.966064453125, -9.04345703125, -8.120849609375, -7.1982421875, -6.275634765625, -5.35302734375, -4.430419921875, -3.5078125, -2.585205078125, -1.66259765625, -0.739990234375, 0.1826171875, 1.105224609375, 2.02783203125, 2.950439453125, 3.873046875, 4.795654296875, 5.71826171875, 6.640869140625, 7.5634765625, 8.486083984375, 9.40869140625, 10.331298828125, 11.25390625, 12.176513671875, 13.09912109375, 14.021728515625, 14.9443359375, 15.866943359375, 16.78955078125, 17.712158203125, 18.634765625, 19.557373046875, 20.47998046875, 21.402587890625, 22.3251953125, 23.247802734375, 24.17041015625, 25.093017578125, 26.015625]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 6.0, 4.0, 5.0, 8.0, 13.0, 12.0, 14.0, 26.0, 31.0, 53.0, 67.0, 70.0, 137.0, 203.0, 305.0, 483.0, 777.0, 1252.0, 2219.0, 4188.0, 8243.0, 20241.0, 444759.0, 3565528.0, 115687.0, 14784.0, 6584.0, 3462.0, 1963.0, 1202.0, 669.0, 455.0, 252.0, 178.0, 146.0, 80.0, 49.0, 41.0, 30.0, 21.0, 4.0, 9.0, 16.0, 4.0, 1.0, 4.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0], "bins": [-104.125, -101.177734375, -98.23046875, -95.283203125, -92.3359375, -89.388671875, -86.44140625, -83.494140625, -80.546875, -77.599609375, -74.65234375, -71.705078125, -68.7578125, -65.810546875, -62.86328125, -59.916015625, -56.96875, -54.021484375, -51.07421875, -48.126953125, -45.1796875, -42.232421875, -39.28515625, -36.337890625, -33.390625, -30.443359375, -27.49609375, -24.548828125, -21.6015625, -18.654296875, -15.70703125, -12.759765625, -9.8125, -6.865234375, -3.91796875, -0.970703125, 1.9765625, 4.923828125, 7.87109375, 10.818359375, 13.765625, 16.712890625, 19.66015625, 22.607421875, 25.5546875, 28.501953125, 31.44921875, 34.396484375, 37.34375, 40.291015625, 43.23828125, 46.185546875, 49.1328125, 52.080078125, 55.02734375, 57.974609375, 60.921875, 63.869140625, 66.81640625, 69.763671875, 72.7109375, 75.658203125, 78.60546875, 81.552734375, 84.5]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 0.0, 2.0, 1.0, 5.0, 2.0, 4.0, 5.0, 5.0, 8.0, 10.0, 10.0, 12.0, 20.0, 20.0, 36.0, 60.0, 139.0, 469.0, 1161.0, 1250.0, 496.0, 156.0, 60.0, 33.0, 31.0, 22.0, 7.0, 12.0, 8.0, 7.0, 5.0, 4.0, 3.0, 3.0, 1.0, 2.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.5625, -81.1865234375, -77.810546875, -74.4345703125, -71.05859375, -67.6826171875, -64.306640625, -60.9306640625, -57.5546875, -54.1787109375, -50.802734375, -47.4267578125, -44.05078125, -40.6748046875, -37.298828125, -33.9228515625, -30.546875, -27.1708984375, -23.794921875, -20.4189453125, -17.04296875, -13.6669921875, -10.291015625, -6.9150390625, -3.5390625, -0.1630859375, 3.212890625, 6.5888671875, 9.96484375, 13.3408203125, 16.716796875, 20.0927734375, 23.46875, 26.8447265625, 30.220703125, 33.5966796875, 36.97265625, 40.3486328125, 43.724609375, 47.1005859375, 50.4765625, 53.8525390625, 57.228515625, 60.6044921875, 63.98046875, 67.3564453125, 70.732421875, 74.1083984375, 77.484375, 80.8603515625, 84.236328125, 87.6123046875, 90.98828125, 94.3642578125, 97.740234375, 101.1162109375, 104.4921875, 107.8681640625, 111.244140625, 114.6201171875, 117.99609375, 121.3720703125, 124.748046875, 128.1240234375, 131.5]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 4.0, 3.0, 14.0, 14.0, 18.0, 27.0, 55.0, 59.0, 99.0, 153.0, 216.0, 364.0, 587.0, 995.0, 1495.0, 2614.0, 4201.0, 7870.0, 16151.0, 43033.0, 384658.0, 3558917.0, 117523.0, 27985.0, 11979.0, 6090.0, 3507.0, 2126.0, 1332.0, 809.0, 528.0, 295.0, 202.0, 112.0, 88.0, 46.0, 35.0, 34.0, 19.0, 5.0, 8.0, 3.0, 8.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-147.25, -142.9580078125, -138.666015625, -134.3740234375, -130.08203125, -125.7900390625, -121.498046875, -117.2060546875, -112.9140625, -108.6220703125, -104.330078125, -100.0380859375, -95.74609375, -91.4541015625, -87.162109375, -82.8701171875, -78.578125, -74.2861328125, -69.994140625, -65.7021484375, -61.41015625, -57.1181640625, -52.826171875, -48.5341796875, -44.2421875, -39.9501953125, -35.658203125, -31.3662109375, -27.07421875, -22.7822265625, -18.490234375, -14.1982421875, -9.90625, -5.6142578125, -1.322265625, 2.9697265625, 7.26171875, 11.5537109375, 15.845703125, 20.1376953125, 24.4296875, 28.7216796875, 33.013671875, 37.3056640625, 41.59765625, 45.8896484375, 50.181640625, 54.4736328125, 58.765625, 63.0576171875, 67.349609375, 71.6416015625, 75.93359375, 80.2255859375, 84.517578125, 88.8095703125, 93.1015625, 97.3935546875, 101.685546875, 105.9775390625, 110.26953125, 114.5615234375, 118.853515625, 123.1455078125, 127.4375]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 8.0, 10.0, 25.0, 44.0, 84.0, 199.0, 336.0, 156.0, 58.0, 35.0, 24.0, 16.0, 7.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-383.6897277832031, -361.6182556152344, -339.5467834472656, -317.4753112792969, -295.4038391113281, -273.3323669433594, -251.2609100341797, -229.18943786621094, -207.1179656982422, -185.04649353027344, -162.9750213623047, -140.903564453125, -118.83208465576172, -96.76061248779297, -74.68914794921875, -52.61767578125, -30.54620361328125, -8.474733352661133, 13.596736907958984, 35.66820526123047, 57.73967742919922, 79.81114959716797, 101.88261413574219, 123.95408630371094, 146.0255584716797, 168.09703063964844, 190.1685028076172, 212.23995971679688, 234.31143188476562, 256.3829040527344, 278.4543762207031, 300.5258483886719, 322.59735107421875, 344.6688232421875, 366.74029541015625, 388.811767578125, 410.88323974609375, 432.9547119140625, 455.02618408203125, 477.09765625, 499.16912841796875, 521.2406005859375, 543.3120727539062, 565.383544921875, 587.4550170898438, 609.5264892578125, 631.5979614257812, 653.66943359375, 675.7408447265625, 697.8123168945312, 719.8837890625, 741.9552612304688, 764.0267333984375, 786.0982055664062, 808.169677734375, 830.2411499023438, 852.3126220703125, 874.3840942382812, 896.45556640625, 918.5270385742188, 940.5985107421875, 962.6699829101562, 984.741455078125, 1006.8129272460938, 1028.8843994140625]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 7.0, 3.0, 6.0, 3.0, 12.0, 4.0, 12.0, 16.0, 19.0, 21.0, 28.0, 25.0, 26.0, 30.0, 42.0, 27.0, 42.0, 29.0, 50.0, 40.0, 40.0, 45.0, 48.0, 31.0, 40.0, 52.0, 39.0, 35.0, 37.0, 32.0, 31.0, 28.0, 22.0, 21.0, 14.0, 8.0, 3.0, 10.0, 8.0, 3.0, 4.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-228.30801391601562, -221.19290161132812, -214.07778930664062, -206.96266174316406, -199.84754943847656, -192.73243713378906, -185.6173095703125, -178.502197265625, -171.3870849609375, -164.27197265625, -157.1568603515625, -150.04173278808594, -142.92662048339844, -135.81150817871094, -128.69638061523438, -121.58126831054688, -114.46615600585938, -107.35104370117188, -100.23592376708984, -93.12080383300781, -86.00569152832031, -78.89057922363281, -71.77545928955078, -64.66033935546875, -57.54522705078125, -50.430110931396484, -43.31499481201172, -36.19987869262695, -29.084762573242188, -21.969646453857422, -14.854530334472656, -7.739414215087891, -0.624298095703125, 6.490818023681641, 13.605934143066406, 20.721050262451172, 27.836166381835938, 34.9512825012207, 42.06639862060547, 49.181514739990234, 56.296630859375, 63.411746978759766, 70.52686309814453, 77.64198303222656, 84.75709533691406, 91.87220764160156, 98.9873275756836, 106.10244750976562, 113.21755981445312, 120.33267211914062, 127.44779205322266, 134.5629119873047, 141.6780242919922, 148.7931365966797, 155.90826416015625, 163.02337646484375, 170.13848876953125, 177.25360107421875, 184.36871337890625, 191.4838409423828, 198.5989532470703, 205.7140655517578, 212.82919311523438, 219.94430541992188, 227.05941772460938]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 2.0, 8.0, 5.0, 3.0, 11.0, 16.0, 13.0, 21.0, 15.0, 20.0, 32.0, 27.0, 32.0, 32.0, 33.0, 35.0, 34.0, 46.0, 56.0, 62.0, 57.0, 46.0, 40.0, 34.0, 50.0, 37.0, 34.0, 24.0, 28.0, 25.0, 18.0, 15.0, 18.0, 14.0, 13.0, 10.0, 13.0, 9.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-34.09375, -33.090087890625, -32.08642578125, -31.082763671875, -30.0791015625, -29.075439453125, -28.07177734375, -27.068115234375, -26.064453125, -25.060791015625, -24.05712890625, -23.053466796875, -22.0498046875, -21.046142578125, -20.04248046875, -19.038818359375, -18.03515625, -17.031494140625, -16.02783203125, -15.024169921875, -14.0205078125, -13.016845703125, -12.01318359375, -11.009521484375, -10.005859375, -9.002197265625, -7.99853515625, -6.994873046875, -5.9912109375, -4.987548828125, -3.98388671875, -2.980224609375, -1.9765625, -0.972900390625, 0.03076171875, 1.034423828125, 2.0380859375, 3.041748046875, 4.04541015625, 5.049072265625, 6.052734375, 7.056396484375, 8.06005859375, 9.063720703125, 10.0673828125, 11.071044921875, 12.07470703125, 13.078369140625, 14.08203125, 15.085693359375, 16.08935546875, 17.093017578125, 18.0966796875, 19.100341796875, 20.10400390625, 21.107666015625, 22.111328125, 23.114990234375, 24.11865234375, 25.122314453125, 26.1259765625, 27.129638671875, 28.13330078125, 29.136962890625, 30.140625]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 6.0, 12.0, 12.0, 16.0, 21.0, 39.0, 60.0, 84.0, 100.0, 169.0, 244.0, 348.0, 546.0, 771.0, 1151.0, 1739.0, 2551.0, 3923.0, 5957.0, 8948.0, 14097.0, 22026.0, 35705.0, 59938.0, 110165.0, 232521.0, 255165.0, 121710.0, 65163.0, 38251.0, 23773.0, 15106.0, 9488.0, 6252.0, 4066.0, 2843.0, 1836.0, 1215.0, 806.0, 539.0, 362.0, 274.0, 180.0, 120.0, 75.0, 63.0, 36.0, 29.0, 13.0, 19.0, 9.0, 8.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.5078125, -1.4608001708984375, -1.413787841796875, -1.3667755126953125, -1.31976318359375, -1.2727508544921875, -1.225738525390625, -1.1787261962890625, -1.1317138671875, -1.0847015380859375, -1.037689208984375, -0.9906768798828125, -0.94366455078125, -0.8966522216796875, -0.849639892578125, -0.8026275634765625, -0.755615234375, -0.7086029052734375, -0.661590576171875, -0.6145782470703125, -0.56756591796875, -0.5205535888671875, -0.473541259765625, -0.4265289306640625, -0.3795166015625, -0.3325042724609375, -0.285491943359375, -0.2384796142578125, -0.19146728515625, -0.1444549560546875, -0.097442626953125, -0.0504302978515625, -0.00341796875, 0.0435943603515625, 0.090606689453125, 0.1376190185546875, 0.18463134765625, 0.2316436767578125, 0.278656005859375, 0.3256683349609375, 0.3726806640625, 0.4196929931640625, 0.466705322265625, 0.5137176513671875, 0.56072998046875, 0.6077423095703125, 0.654754638671875, 0.7017669677734375, 0.748779296875, 0.7957916259765625, 0.842803955078125, 0.8898162841796875, 0.93682861328125, 0.9838409423828125, 1.030853271484375, 1.0778656005859375, 1.1248779296875, 1.1718902587890625, 1.218902587890625, 1.2659149169921875, 1.31292724609375, 1.3599395751953125, 1.406951904296875, 1.4539642333984375, 1.5009765625]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 5.0, 2.0, 5.0, 12.0, 7.0, 7.0, 12.0, 14.0, 16.0, 24.0, 22.0, 19.0, 21.0, 24.0, 23.0, 32.0, 36.0, 36.0, 41.0, 46.0, 40.0, 51.0, 36.0, 1063.0, 35.0, 39.0, 33.0, 42.0, 39.0, 30.0, 25.0, 34.0, 35.0, 23.0, 14.0, 14.0, 19.0, 10.0, 11.0, 11.0, 1.0, 5.0, 10.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-18.328125, -17.739501953125, -17.15087890625, -16.562255859375, -15.9736328125, -15.385009765625, -14.79638671875, -14.207763671875, -13.619140625, -13.030517578125, -12.44189453125, -11.853271484375, -11.2646484375, -10.676025390625, -10.08740234375, -9.498779296875, -8.91015625, -8.321533203125, -7.73291015625, -7.144287109375, -6.5556640625, -5.967041015625, -5.37841796875, -4.789794921875, -4.201171875, -3.612548828125, -3.02392578125, -2.435302734375, -1.8466796875, -1.258056640625, -0.66943359375, -0.080810546875, 0.5078125, 1.096435546875, 1.68505859375, 2.273681640625, 2.8623046875, 3.450927734375, 4.03955078125, 4.628173828125, 5.216796875, 5.805419921875, 6.39404296875, 6.982666015625, 7.5712890625, 8.159912109375, 8.74853515625, 9.337158203125, 9.92578125, 10.514404296875, 11.10302734375, 11.691650390625, 12.2802734375, 12.868896484375, 13.45751953125, 14.046142578125, 14.634765625, 15.223388671875, 15.81201171875, 16.400634765625, 16.9892578125, 17.577880859375, 18.16650390625, 18.755126953125, 19.34375]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 4.0, 3.0, 0.0, 2.0, 5.0, 10.0, 11.0, 24.0, 27.0, 31.0, 52.0, 75.0, 106.0, 174.0, 214.0, 378.0, 552.0, 788.0, 1191.0, 1876.0, 3086.0, 4757.0, 7592.0, 13081.0, 21586.0, 38175.0, 69695.0, 143680.0, 1339581.0, 227624.0, 99069.0, 51115.0, 28669.0, 16959.0, 10163.0, 6216.0, 3868.0, 2416.0, 1527.0, 937.0, 621.0, 419.0, 283.0, 178.0, 103.0, 64.0, 47.0, 39.0, 23.0, 18.0, 12.0, 8.0, 2.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.458984375, -1.409942626953125, -1.36090087890625, -1.311859130859375, -1.2628173828125, -1.213775634765625, -1.16473388671875, -1.115692138671875, -1.066650390625, -1.017608642578125, -0.96856689453125, -0.919525146484375, -0.8704833984375, -0.821441650390625, -0.77239990234375, -0.723358154296875, -0.67431640625, -0.625274658203125, -0.57623291015625, -0.527191162109375, -0.4781494140625, -0.429107666015625, -0.38006591796875, -0.331024169921875, -0.281982421875, -0.232940673828125, -0.18389892578125, -0.134857177734375, -0.0858154296875, -0.036773681640625, 0.01226806640625, 0.061309814453125, 0.1103515625, 0.159393310546875, 0.20843505859375, 0.257476806640625, 0.3065185546875, 0.355560302734375, 0.40460205078125, 0.453643798828125, 0.502685546875, 0.551727294921875, 0.60076904296875, 0.649810791015625, 0.6988525390625, 0.747894287109375, 0.79693603515625, 0.845977783203125, 0.89501953125, 0.944061279296875, 0.99310302734375, 1.042144775390625, 1.0911865234375, 1.140228271484375, 1.18927001953125, 1.238311767578125, 1.287353515625, 1.336395263671875, 1.38543701171875, 1.434478759765625, 1.4835205078125, 1.532562255859375, 1.58160400390625, 1.630645751953125, 1.6796875]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 1.0, 4.0, 4.0, 8.0, 8.0, 7.0, 8.0, 16.0, 26.0, 27.0, 25.0, 29.0, 25.0, 44.0, 69.0, 91.0, 108.0, 87.0, 89.0, 69.0, 46.0, 40.0, 31.0, 26.0, 31.0, 21.0, 20.0, 15.0, 13.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0246124267578125, -0.023933887481689453, -0.023255348205566406, -0.02257680892944336, -0.021898269653320312, -0.021219730377197266, -0.02054119110107422, -0.019862651824951172, -0.019184112548828125, -0.018505573272705078, -0.01782703399658203, -0.017148494720458984, -0.016469955444335938, -0.01579141616821289, -0.015112876892089844, -0.014434337615966797, -0.01375579833984375, -0.013077259063720703, -0.012398719787597656, -0.01172018051147461, -0.011041641235351562, -0.010363101959228516, -0.009684562683105469, -0.009006023406982422, -0.008327484130859375, -0.007648944854736328, -0.006970405578613281, -0.006291866302490234, -0.0056133270263671875, -0.004934787750244141, -0.004256248474121094, -0.003577709197998047, -0.002899169921875, -0.002220630645751953, -0.0015420913696289062, -0.0008635520935058594, -0.0001850128173828125, 0.0004935264587402344, 0.0011720657348632812, 0.0018506050109863281, 0.002529144287109375, 0.003207683563232422, 0.0038862228393554688, 0.004564762115478516, 0.0052433013916015625, 0.005921840667724609, 0.006600379943847656, 0.007278919219970703, 0.00795745849609375, 0.008635997772216797, 0.009314537048339844, 0.00999307632446289, 0.010671615600585938, 0.011350154876708984, 0.012028694152832031, 0.012707233428955078, 0.013385772705078125, 0.014064311981201172, 0.014742851257324219, 0.015421390533447266, 0.016099929809570312, 0.01677846908569336, 0.017457008361816406, 0.018135547637939453, 0.0188140869140625]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 7.0, 11.0, 14.0, 17.0, 34.0, 46.0, 48.0, 78.0, 130.0, 176.0, 273.0, 850.0, 11052.0, 890122.0, 140562.0, 3874.0, 549.0, 231.0, 142.0, 92.0, 80.0, 55.0, 33.0, 22.0, 10.0, 10.0, 10.0, 8.0, 3.0, 5.0, 5.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.302490234375, -0.29161834716796875, -0.2807464599609375, -0.26987457275390625, -0.259002685546875, -0.24813079833984375, -0.2372589111328125, -0.22638702392578125, -0.21551513671875, -0.20464324951171875, -0.1937713623046875, -0.18289947509765625, -0.172027587890625, -0.16115570068359375, -0.1502838134765625, -0.13941192626953125, -0.1285400390625, -0.11766815185546875, -0.1067962646484375, -0.09592437744140625, -0.085052490234375, -0.07418060302734375, -0.0633087158203125, -0.05243682861328125, -0.04156494140625, -0.03069305419921875, -0.0198211669921875, -0.00894927978515625, 0.001922607421875, 0.01279449462890625, 0.0236663818359375, 0.03453826904296875, 0.04541015625, 0.05628204345703125, 0.0671539306640625, 0.07802581787109375, 0.088897705078125, 0.09976959228515625, 0.1106414794921875, 0.12151336669921875, 0.13238525390625, 0.14325714111328125, 0.1541290283203125, 0.16500091552734375, 0.175872802734375, 0.18674468994140625, 0.1976165771484375, 0.20848846435546875, 0.2193603515625, 0.23023223876953125, 0.2411041259765625, 0.25197601318359375, 0.262847900390625, 0.27371978759765625, 0.2845916748046875, 0.29546356201171875, 0.30633544921875, 0.31720733642578125, 0.3280792236328125, 0.33895111083984375, 0.349822998046875, 0.36069488525390625, 0.3715667724609375, 0.38243865966796875, 0.393310546875]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 17.0, 16.0, 29.0, 65.0, 239.0, 414.0, 143.0, 51.0, 17.0, 10.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06522466242313385, -0.06387220323085785, -0.06251974403858185, -0.06116728484630585, -0.059814825654029846, -0.058462366461753845, -0.057109907269477844, -0.05575744807720184, -0.05440498888492584, -0.05305252969264984, -0.05170007050037384, -0.05034761130809784, -0.04899515211582184, -0.04764269292354584, -0.046290233731269836, -0.044937774538993835, -0.043585315346717834, -0.042232856154441833, -0.04088039696216583, -0.03952793776988983, -0.03817547857761383, -0.03682301938533783, -0.03547056019306183, -0.03411810100078583, -0.032765645533800125, -0.031413186341524124, -0.030060727149248123, -0.028708267956972122, -0.02735580876469612, -0.02600334957242012, -0.02465089038014412, -0.02329843118786812, -0.021945973858237267, -0.020593514665961266, -0.019241055473685265, -0.017888596281409264, -0.016536137089133263, -0.015183677896857262, -0.013831219635903835, -0.012478760443627834, -0.011126301251351833, -0.009773842059075832, -0.008421382866799831, -0.007068924140185118, -0.005716464947909117, -0.004364005755633116, -0.003011547029018402, -0.0016590878367424011, -0.00030662864446640015, 0.001045830431394279, 0.002398289507254958, 0.0037507484667003155, 0.0051032076589763165, 0.006455666851252317, 0.007808125577867031, 0.009160584770143032, 0.010513043962419033, 0.011865503154695034, 0.013217962346971035, 0.014570420607924461, 0.015922879800200462, 0.017275338992476463, 0.018627798184752464, 0.019980257377028465, 0.021332716569304466]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 5.0, 5.0, 7.0, 7.0, 8.0, 6.0, 6.0, 15.0, 14.0, 25.0, 20.0, 34.0, 26.0, 27.0, 28.0, 33.0, 37.0, 41.0, 39.0, 53.0, 48.0, 42.0, 53.0, 53.0, 42.0, 50.0, 37.0, 32.0, 44.0, 30.0, 29.0, 23.0, 14.0, 12.0, 6.0, 20.0, 9.0, 10.0, 8.0, 6.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.012850642204284668, -0.012486969120800495, -0.012123296037316322, -0.01175962295383215, -0.011395949870347977, -0.011032276786863804, -0.010668603703379631, -0.010304930619895458, -0.009941257536411285, -0.009577584452927113, -0.00921391136944294, -0.008850238285958767, -0.008486565202474594, -0.008122892118990421, -0.0077592190355062485, -0.007395545952022076, -0.007031872868537903, -0.00666819978505373, -0.006304526701569557, -0.005940853618085384, -0.0055771805346012115, -0.005213507451117039, -0.004849834367632866, -0.004486161284148693, -0.00412248820066452, -0.0037588151171803474, -0.0033951420336961746, -0.003031468950212002, -0.002667795866727829, -0.002304122783243656, -0.0019404496997594833, -0.0015767766162753105, -0.0012131035327911377, -0.0008494304493069649, -0.00048575736582279205, -0.00012208428233861923, 0.0002415888011455536, 0.0006052618846297264, 0.0009689349681138992, 0.001332608051598072, 0.0016962811350822449, 0.0020599542185664177, 0.0024236273020505905, 0.0027873003855347633, 0.003150973469018936, 0.003514646552503109, 0.003878319635987282, 0.004241992719471455, 0.0046056658029556274, 0.0049693388864398, 0.005333011969923973, 0.005696685053408146, 0.006060358136892319, 0.0064240312203764915, 0.006787704303860664, 0.007151377387344837, 0.00751505047082901, 0.007878723554313183, 0.008242396637797356, 0.008606069721281528, 0.008969742804765701, 0.009333415888249874, 0.009697088971734047, 0.01006076205521822, 0.010424435138702393]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 2.0, 8.0, 5.0, 3.0, 11.0, 16.0, 13.0, 21.0, 15.0, 20.0, 32.0, 27.0, 32.0, 32.0, 33.0, 35.0, 34.0, 46.0, 56.0, 62.0, 57.0, 46.0, 40.0, 34.0, 50.0, 37.0, 34.0, 24.0, 28.0, 25.0, 18.0, 15.0, 18.0, 14.0, 13.0, 10.0, 13.0, 9.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-34.09375, -33.090087890625, -32.08642578125, -31.082763671875, -30.0791015625, -29.075439453125, -28.07177734375, -27.068115234375, -26.064453125, -25.060791015625, -24.05712890625, -23.053466796875, -22.0498046875, -21.046142578125, -20.04248046875, -19.038818359375, -18.03515625, -17.031494140625, -16.02783203125, -15.024169921875, -14.0205078125, -13.016845703125, -12.01318359375, -11.009521484375, -10.005859375, -9.002197265625, -7.99853515625, -6.994873046875, -5.9912109375, -4.987548828125, -3.98388671875, -2.980224609375, -1.9765625, -0.972900390625, 0.03076171875, 1.034423828125, 2.0380859375, 3.041748046875, 4.04541015625, 5.049072265625, 6.052734375, 7.056396484375, 8.06005859375, 9.063720703125, 10.0673828125, 11.071044921875, 12.07470703125, 13.078369140625, 14.08203125, 15.085693359375, 16.08935546875, 17.093017578125, 18.0966796875, 19.100341796875, 20.10400390625, 21.107666015625, 22.111328125, 23.114990234375, 24.11865234375, 25.122314453125, 26.1259765625, 27.129638671875, 28.13330078125, 29.136962890625, 30.140625]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 3.0, 8.0, 3.0, 6.0, 16.0, 16.0, 22.0, 29.0, 29.0, 56.0, 92.0, 155.0, 268.0, 545.0, 1139.0, 2746.0, 7328.0, 24102.0, 95942.0, 572587.0, 267737.0, 52652.0, 14613.0, 4809.0, 1871.0, 777.0, 409.0, 206.0, 120.0, 87.0, 39.0, 36.0, 23.0, 18.0, 17.0, 9.0, 18.0, 7.0, 6.0, 1.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-21.1875, -20.560546875, -19.93359375, -19.306640625, -18.6796875, -18.052734375, -17.42578125, -16.798828125, -16.171875, -15.544921875, -14.91796875, -14.291015625, -13.6640625, -13.037109375, -12.41015625, -11.783203125, -11.15625, -10.529296875, -9.90234375, -9.275390625, -8.6484375, -8.021484375, -7.39453125, -6.767578125, -6.140625, -5.513671875, -4.88671875, -4.259765625, -3.6328125, -3.005859375, -2.37890625, -1.751953125, -1.125, -0.498046875, 0.12890625, 0.755859375, 1.3828125, 2.009765625, 2.63671875, 3.263671875, 3.890625, 4.517578125, 5.14453125, 5.771484375, 6.3984375, 7.025390625, 7.65234375, 8.279296875, 8.90625, 9.533203125, 10.16015625, 10.787109375, 11.4140625, 12.041015625, 12.66796875, 13.294921875, 13.921875, 14.548828125, 15.17578125, 15.802734375, 16.4296875, 17.056640625, 17.68359375, 18.310546875, 18.9375]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 6.0, 2.0, 5.0, 2.0, 2.0, 3.0, 6.0, 8.0, 11.0, 12.0, 7.0, 16.0, 12.0, 18.0, 16.0, 26.0, 28.0, 24.0, 34.0, 24.0, 30.0, 29.0, 33.0, 37.0, 40.0, 214.0, 1891.0, 54.0, 54.0, 38.0, 41.0, 29.0, 27.0, 36.0, 35.0, 31.0, 23.0, 38.0, 20.0, 19.0, 9.0, 11.0, 14.0, 7.0, 9.0, 5.0, 6.0, 4.0, 5.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-84.25, -81.4541015625, -78.658203125, -75.8623046875, -73.06640625, -70.2705078125, -67.474609375, -64.6787109375, -61.8828125, -59.0869140625, -56.291015625, -53.4951171875, -50.69921875, -47.9033203125, -45.107421875, -42.3115234375, -39.515625, -36.7197265625, -33.923828125, -31.1279296875, -28.33203125, -25.5361328125, -22.740234375, -19.9443359375, -17.1484375, -14.3525390625, -11.556640625, -8.7607421875, -5.96484375, -3.1689453125, -0.373046875, 2.4228515625, 5.21875, 8.0146484375, 10.810546875, 13.6064453125, 16.40234375, 19.1982421875, 21.994140625, 24.7900390625, 27.5859375, 30.3818359375, 33.177734375, 35.9736328125, 38.76953125, 41.5654296875, 44.361328125, 47.1572265625, 49.953125, 52.7490234375, 55.544921875, 58.3408203125, 61.13671875, 63.9326171875, 66.728515625, 69.5244140625, 72.3203125, 75.1162109375, 77.912109375, 80.7080078125, 83.50390625, 86.2998046875, 89.095703125, 91.8916015625, 94.6875]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 3.0, 5.0, 7.0, 4.0, 10.0, 6.0, 12.0, 13.0, 10.0, 23.0, 23.0, 41.0, 34.0, 50.0, 56.0, 75.0, 92.0, 146.0, 223.0, 331.0, 646.0, 2144.0, 3009687.0, 129205.0, 1350.0, 546.0, 278.0, 168.0, 116.0, 80.0, 65.0, 45.0, 42.0, 33.0, 25.0, 19.0, 14.0, 14.0, 10.0, 12.0, 9.0, 8.0, 5.0, 3.0, 3.0, 2.0, 4.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0], "bins": [-157.75, -153.091796875, -148.43359375, -143.775390625, -139.1171875, -134.458984375, -129.80078125, -125.142578125, -120.484375, -115.826171875, -111.16796875, -106.509765625, -101.8515625, -97.193359375, -92.53515625, -87.876953125, -83.21875, -78.560546875, -73.90234375, -69.244140625, -64.5859375, -59.927734375, -55.26953125, -50.611328125, -45.953125, -41.294921875, -36.63671875, -31.978515625, -27.3203125, -22.662109375, -18.00390625, -13.345703125, -8.6875, -4.029296875, 0.62890625, 5.287109375, 9.9453125, 14.603515625, 19.26171875, 23.919921875, 28.578125, 33.236328125, 37.89453125, 42.552734375, 47.2109375, 51.869140625, 56.52734375, 61.185546875, 65.84375, 70.501953125, 75.16015625, 79.818359375, 84.4765625, 89.134765625, 93.79296875, 98.451171875, 103.109375, 107.767578125, 112.42578125, 117.083984375, 121.7421875, 126.400390625, 131.05859375, 135.716796875, 140.375]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 21.0, 893.0, 105.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-85.62777709960938, -67.1789779663086, -48.73017501831055, -30.2813720703125, -11.832572937011719, 6.6162261962890625, 25.065032958984375, 43.513824462890625, 61.96263122558594, 80.41143035888672, 98.8602294921875, 117.30903625488281, 135.75784301757812, 154.20663452148438, 172.6554412841797, 191.10423278808594, 209.55303955078125, 228.00184631347656, 246.4506378173828, 264.8994445800781, 283.3482360839844, 301.79705810546875, 320.245849609375, 338.69464111328125, 357.1434326171875, 375.59222412109375, 394.0410461425781, 412.4898376464844, 430.9386291503906, 449.387451171875, 467.83624267578125, 486.2850341796875, 504.73382568359375, 523.1826171875, 541.6314086914062, 560.0802001953125, 578.529052734375, 596.9778442382812, 615.4266357421875, 633.8754272460938, 652.32421875, 670.7730102539062, 689.2218017578125, 707.670654296875, 726.1194458007812, 744.5682373046875, 763.0170288085938, 781.4658203125, 799.9146728515625, 818.3634643554688, 836.812255859375, 855.2611083984375, 873.7098999023438, 892.15869140625, 910.6074829101562, 929.0562744140625, 947.5050659179688, 965.953857421875, 984.4026489257812, 1002.8514404296875, 1021.30029296875, 1039.7490234375, 1058.1978759765625, 1076.646728515625, 1095.095458984375]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 9.0, 3.0, 9.0, 15.0, 10.0, 15.0, 11.0, 15.0, 17.0, 16.0, 31.0, 25.0, 29.0, 36.0, 28.0, 35.0, 45.0, 38.0, 42.0, 33.0, 45.0, 43.0, 40.0, 35.0, 34.0, 36.0, 39.0, 43.0, 22.0, 28.0, 34.0, 25.0, 17.0, 18.0, 21.0, 10.0, 9.0, 5.0, 9.0, 8.0, 7.0, 3.0, 3.0, 2.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-301.77392578125, -292.3157653808594, -282.8575744628906, -273.3994140625, -263.9412536621094, -254.4830780029297, -245.02490234375, -235.56674194335938, -226.1085662841797, -216.650390625, -207.19223022460938, -197.7340545654297, -188.27587890625, -178.81771850585938, -169.3595428466797, -159.9013671875, -150.44320678710938, -140.9850311279297, -131.52687072753906, -122.06869506835938, -112.61052703857422, -103.15235900878906, -93.69418334960938, -84.23601531982422, -74.77784729003906, -65.3196792602539, -55.861507415771484, -46.40333557128906, -36.945167541503906, -27.48699951171875, -18.028827667236328, -8.570655822753906, 0.887542724609375, 10.345712661743164, 19.803882598876953, 29.262052536010742, 38.72022247314453, 48.17839050292969, 57.63656234741211, 67.09473419189453, 76.55290222167969, 86.01107025146484, 95.46923828125, 104.92741394042969, 114.38558197021484, 123.84375, 133.3019256591797, 142.76010131835938, 152.21826171875, 161.6764373779297, 171.1345977783203, 180.5927734375, 190.05093383789062, 199.5091094970703, 208.96728515625, 218.42544555664062, 227.8836212158203, 237.341796875, 246.79995727539062, 256.25811767578125, 265.71630859375, 275.1744689941406, 284.63262939453125, 294.0908203125, 303.5489807128906]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 2.0, 7.0, 4.0, 4.0, 10.0, 9.0, 16.0, 17.0, 22.0, 15.0, 32.0, 29.0, 32.0, 28.0, 39.0, 36.0, 34.0, 35.0, 58.0, 62.0, 56.0, 48.0, 40.0, 39.0, 50.0, 31.0, 38.0, 27.0, 24.0, 29.0, 19.0, 14.0, 17.0, 18.0, 12.0, 11.0, 10.0, 12.0, 4.0, 7.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-34.625, -33.613525390625, -32.60205078125, -31.590576171875, -30.5791015625, -29.567626953125, -28.55615234375, -27.544677734375, -26.533203125, -25.521728515625, -24.51025390625, -23.498779296875, -22.4873046875, -21.475830078125, -20.46435546875, -19.452880859375, -18.44140625, -17.429931640625, -16.41845703125, -15.406982421875, -14.3955078125, -13.384033203125, -12.37255859375, -11.361083984375, -10.349609375, -9.338134765625, -8.32666015625, -7.315185546875, -6.3037109375, -5.292236328125, -4.28076171875, -3.269287109375, -2.2578125, -1.246337890625, -0.23486328125, 0.776611328125, 1.7880859375, 2.799560546875, 3.81103515625, 4.822509765625, 5.833984375, 6.845458984375, 7.85693359375, 8.868408203125, 9.8798828125, 10.891357421875, 11.90283203125, 12.914306640625, 13.92578125, 14.937255859375, 15.94873046875, 16.960205078125, 17.9716796875, 18.983154296875, 19.99462890625, 21.006103515625, 22.017578125, 23.029052734375, 24.04052734375, 25.052001953125, 26.0634765625, 27.074951171875, 28.08642578125, 29.097900390625, 30.109375]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 3.0, 7.0, 5.0, 14.0, 11.0, 18.0, 23.0, 33.0, 63.0, 59.0, 119.0, 170.0, 286.0, 481.0, 783.0, 1394.0, 2667.0, 5515.0, 13404.0, 163783.0, 3775296.0, 203582.0, 14589.0, 5650.0, 2877.0, 1398.0, 811.0, 432.0, 303.0, 184.0, 107.0, 71.0, 29.0, 34.0, 22.0, 16.0, 19.0, 9.0, 4.0, 9.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-129.0, -125.263671875, -121.52734375, -117.791015625, -114.0546875, -110.318359375, -106.58203125, -102.845703125, -99.109375, -95.373046875, -91.63671875, -87.900390625, -84.1640625, -80.427734375, -76.69140625, -72.955078125, -69.21875, -65.482421875, -61.74609375, -58.009765625, -54.2734375, -50.537109375, -46.80078125, -43.064453125, -39.328125, -35.591796875, -31.85546875, -28.119140625, -24.3828125, -20.646484375, -16.91015625, -13.173828125, -9.4375, -5.701171875, -1.96484375, 1.771484375, 5.5078125, 9.244140625, 12.98046875, 16.716796875, 20.453125, 24.189453125, 27.92578125, 31.662109375, 35.3984375, 39.134765625, 42.87109375, 46.607421875, 50.34375, 54.080078125, 57.81640625, 61.552734375, 65.2890625, 69.025390625, 72.76171875, 76.498046875, 80.234375, 83.970703125, 87.70703125, 91.443359375, 95.1796875, 98.916015625, 102.65234375, 106.388671875, 110.125]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 7.0, 7.0, 9.0, 7.0, 12.0, 13.0, 24.0, 12.0, 28.0, 43.0, 80.0, 190.0, 529.0, 1261.0, 1069.0, 430.0, 152.0, 60.0, 26.0, 22.0, 22.0, 9.0, 14.0, 12.0, 9.0, 4.0, 6.0, 6.0, 7.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-127.375, -124.0986328125, -120.822265625, -117.5458984375, -114.26953125, -110.9931640625, -107.716796875, -104.4404296875, -101.1640625, -97.8876953125, -94.611328125, -91.3349609375, -88.05859375, -84.7822265625, -81.505859375, -78.2294921875, -74.953125, -71.6767578125, -68.400390625, -65.1240234375, -61.84765625, -58.5712890625, -55.294921875, -52.0185546875, -48.7421875, -45.4658203125, -42.189453125, -38.9130859375, -35.63671875, -32.3603515625, -29.083984375, -25.8076171875, -22.53125, -19.2548828125, -15.978515625, -12.7021484375, -9.42578125, -6.1494140625, -2.873046875, 0.4033203125, 3.6796875, 6.9560546875, 10.232421875, 13.5087890625, 16.78515625, 20.0615234375, 23.337890625, 26.6142578125, 29.890625, 33.1669921875, 36.443359375, 39.7197265625, 42.99609375, 46.2724609375, 49.548828125, 52.8251953125, 56.1015625, 59.3779296875, 62.654296875, 65.9306640625, 69.20703125, 72.4833984375, 75.759765625, 79.0361328125, 82.3125]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 7.0, 7.0, 9.0, 9.0, 15.0, 26.0, 31.0, 53.0, 63.0, 101.0, 126.0, 246.0, 362.0, 631.0, 991.0, 1844.0, 3380.0, 6460.0, 13184.0, 31685.0, 134571.0, 3564825.0, 356389.0, 44570.0, 17137.0, 8149.0, 4103.0, 2234.0, 1177.0, 684.0, 413.0, 237.0, 175.0, 117.0, 74.0, 58.0, 38.0, 27.0, 25.0, 16.0, 12.0, 6.0, 4.0, 6.0, 5.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-120.9375, -116.7177734375, -112.498046875, -108.2783203125, -104.05859375, -99.8388671875, -95.619140625, -91.3994140625, -87.1796875, -82.9599609375, -78.740234375, -74.5205078125, -70.30078125, -66.0810546875, -61.861328125, -57.6416015625, -53.421875, -49.2021484375, -44.982421875, -40.7626953125, -36.54296875, -32.3232421875, -28.103515625, -23.8837890625, -19.6640625, -15.4443359375, -11.224609375, -7.0048828125, -2.78515625, 1.4345703125, 5.654296875, 9.8740234375, 14.09375, 18.3134765625, 22.533203125, 26.7529296875, 30.97265625, 35.1923828125, 39.412109375, 43.6318359375, 47.8515625, 52.0712890625, 56.291015625, 60.5107421875, 64.73046875, 68.9501953125, 73.169921875, 77.3896484375, 81.609375, 85.8291015625, 90.048828125, 94.2685546875, 98.48828125, 102.7080078125, 106.927734375, 111.1474609375, 115.3671875, 119.5869140625, 123.806640625, 128.0263671875, 132.24609375, 136.4658203125, 140.685546875, 144.9052734375, 149.125]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 2.0, 4.0, 6.0, 5.0, 13.0, 15.0, 20.0, 35.0, 40.0, 57.0, 95.0, 175.0, 192.0, 126.0, 78.0, 52.0, 36.0, 19.0, 16.0, 8.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-570.85302734375, -557.64697265625, -544.4409790039062, -531.2349243164062, -518.0289306640625, -504.8229064941406, -491.61688232421875, -478.41082763671875, -465.204833984375, -451.9988098144531, -438.79278564453125, -425.5867614746094, -412.3807373046875, -399.1747131347656, -385.96868896484375, -372.76263427734375, -359.5566101074219, -346.3505859375, -333.1445617675781, -319.93853759765625, -306.7325134277344, -293.5264892578125, -280.3204345703125, -267.11444091796875, -253.9084014892578, -240.70237731933594, -227.49635314941406, -214.29031372070312, -201.08428955078125, -187.87826538085938, -174.6722412109375, -161.46621704101562, -148.26019287109375, -135.05416870117188, -121.84814453125, -108.6421127319336, -95.43608856201172, -82.23006439208984, -69.02403259277344, -55.81800842285156, -42.61198425292969, -29.40595817565918, -16.199932098388672, -2.9939041137695312, 10.212120056152344, 23.41814422607422, 36.624176025390625, 49.8302001953125, 63.036224365234375, 76.24224853515625, 89.44827270507812, 102.65430450439453, 115.8603286743164, 129.06634521484375, 142.2723846435547, 155.47840881347656, 168.68443298339844, 181.8904571533203, 195.0964813232422, 208.30252075195312, 221.508544921875, 234.71456909179688, 247.92059326171875, 261.1266174316406, 274.3326416015625]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [2.0, 4.0, 0.0, 3.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 6.0, 8.0, 14.0, 18.0, 12.0, 13.0, 21.0, 24.0, 17.0, 20.0, 31.0, 35.0, 30.0, 30.0, 31.0, 35.0, 48.0, 51.0, 39.0, 36.0, 49.0, 44.0, 30.0, 31.0, 31.0, 32.0, 38.0, 36.0, 16.0, 28.0, 23.0, 22.0, 21.0, 10.0, 14.0, 8.0, 6.0, 9.0, 6.0, 3.0, 5.0, 1.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-190.68612670898438, -184.14071655273438, -177.59530639648438, -171.04989624023438, -164.50448608398438, -157.95907592773438, -151.41366577148438, -144.86825561523438, -138.32284545898438, -131.77743530273438, -125.23202514648438, -118.68661499023438, -112.14120483398438, -105.59579467773438, -99.05038452148438, -92.50497436523438, -85.9595718383789, -79.4141616821289, -72.8687515258789, -66.3233413696289, -59.777931213378906, -53.23252487182617, -46.68711471557617, -40.14170455932617, -33.59629440307617, -27.050884246826172, -20.505474090576172, -13.960065841674805, -7.414655685424805, -0.8692474365234375, 5.6761627197265625, 12.221572875976562, 18.766983032226562, 25.312393188476562, 31.857803344726562, 38.40321350097656, 44.94862365722656, 51.4940299987793, 58.0394401550293, 64.58485412597656, 71.13026428222656, 77.67567443847656, 84.22108459472656, 90.76649475097656, 97.31190490722656, 103.85731506347656, 110.40272521972656, 116.94813537597656, 123.49353790283203, 130.0389404296875, 136.5843505859375, 143.1297607421875, 149.6751708984375, 156.2205810546875, 162.7659912109375, 169.3114013671875, 175.8568115234375, 182.4022216796875, 188.9476318359375, 195.4930419921875, 202.0384521484375, 208.5838623046875, 215.1292724609375, 221.6746826171875, 228.2200927734375]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 6.0, 3.0, 3.0, 10.0, 13.0, 9.0, 16.0, 11.0, 16.0, 27.0, 27.0, 33.0, 18.0, 34.0, 32.0, 40.0, 34.0, 45.0, 37.0, 46.0, 55.0, 46.0, 46.0, 48.0, 39.0, 43.0, 33.0, 40.0, 26.0, 18.0, 24.0, 24.0, 16.0, 12.0, 12.0, 15.0, 9.0, 5.0, 12.0, 3.0, 5.0, 4.0, 4.0, 3.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-32.0, -30.9912109375, -29.982421875, -28.9736328125, -27.96484375, -26.9560546875, -25.947265625, -24.9384765625, -23.9296875, -22.9208984375, -21.912109375, -20.9033203125, -19.89453125, -18.8857421875, -17.876953125, -16.8681640625, -15.859375, -14.8505859375, -13.841796875, -12.8330078125, -11.82421875, -10.8154296875, -9.806640625, -8.7978515625, -7.7890625, -6.7802734375, -5.771484375, -4.7626953125, -3.75390625, -2.7451171875, -1.736328125, -0.7275390625, 0.28125, 1.2900390625, 2.298828125, 3.3076171875, 4.31640625, 5.3251953125, 6.333984375, 7.3427734375, 8.3515625, 9.3603515625, 10.369140625, 11.3779296875, 12.38671875, 13.3955078125, 14.404296875, 15.4130859375, 16.421875, 17.4306640625, 18.439453125, 19.4482421875, 20.45703125, 21.4658203125, 22.474609375, 23.4833984375, 24.4921875, 25.5009765625, 26.509765625, 27.5185546875, 28.52734375, 29.5361328125, 30.544921875, 31.5537109375, 32.5625]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 8.0, 7.0, 11.0, 11.0, 31.0, 31.0, 46.0, 70.0, 122.0, 164.0, 222.0, 321.0, 461.0, 689.0, 1078.0, 1582.0, 2536.0, 3955.0, 6385.0, 10522.0, 18144.0, 32091.0, 58406.0, 116898.0, 273176.0, 270483.0, 115483.0, 58047.0, 31687.0, 17923.0, 10386.0, 6368.0, 3931.0, 2493.0, 1643.0, 1020.0, 678.0, 452.0, 319.0, 209.0, 130.0, 89.0, 75.0, 53.0, 54.0, 25.0, 13.0, 15.0, 9.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.841796875, -1.7842254638671875, -1.726654052734375, -1.6690826416015625, -1.61151123046875, -1.5539398193359375, -1.496368408203125, -1.4387969970703125, -1.3812255859375, -1.3236541748046875, -1.266082763671875, -1.2085113525390625, -1.15093994140625, -1.0933685302734375, -1.035797119140625, -0.9782257080078125, -0.920654296875, -0.8630828857421875, -0.805511474609375, -0.7479400634765625, -0.69036865234375, -0.6327972412109375, -0.575225830078125, -0.5176544189453125, -0.4600830078125, -0.4025115966796875, -0.344940185546875, -0.2873687744140625, -0.22979736328125, -0.1722259521484375, -0.114654541015625, -0.0570831298828125, 0.00048828125, 0.0580596923828125, 0.115631103515625, 0.1732025146484375, 0.23077392578125, 0.2883453369140625, 0.345916748046875, 0.4034881591796875, 0.4610595703125, 0.5186309814453125, 0.576202392578125, 0.6337738037109375, 0.69134521484375, 0.7489166259765625, 0.806488037109375, 0.8640594482421875, 0.921630859375, 0.9792022705078125, 1.036773681640625, 1.0943450927734375, 1.15191650390625, 1.2094879150390625, 1.267059326171875, 1.3246307373046875, 1.3822021484375, 1.4397735595703125, 1.497344970703125, 1.5549163818359375, 1.61248779296875, 1.6700592041015625, 1.727630615234375, 1.7852020263671875, 1.8427734375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 7.0, 0.0, 10.0, 9.0, 18.0, 16.0, 12.0, 18.0, 22.0, 17.0, 32.0, 28.0, 34.0, 42.0, 46.0, 30.0, 44.0, 45.0, 44.0, 1059.0, 39.0, 41.0, 40.0, 40.0, 31.0, 31.0, 33.0, 32.0, 31.0, 19.0, 26.0, 20.0, 18.0, 20.0, 17.0, 13.0, 10.0, 5.0, 6.0, 12.0, 4.0, 2.0, 1.0, 3.0, 3.0, 2.0], "bins": [-24.40625, -23.761962890625, -23.11767578125, -22.473388671875, -21.8291015625, -21.184814453125, -20.54052734375, -19.896240234375, -19.251953125, -18.607666015625, -17.96337890625, -17.319091796875, -16.6748046875, -16.030517578125, -15.38623046875, -14.741943359375, -14.09765625, -13.453369140625, -12.80908203125, -12.164794921875, -11.5205078125, -10.876220703125, -10.23193359375, -9.587646484375, -8.943359375, -8.299072265625, -7.65478515625, -7.010498046875, -6.3662109375, -5.721923828125, -5.07763671875, -4.433349609375, -3.7890625, -3.144775390625, -2.50048828125, -1.856201171875, -1.2119140625, -0.567626953125, 0.07666015625, 0.720947265625, 1.365234375, 2.009521484375, 2.65380859375, 3.298095703125, 3.9423828125, 4.586669921875, 5.23095703125, 5.875244140625, 6.51953125, 7.163818359375, 7.80810546875, 8.452392578125, 9.0966796875, 9.740966796875, 10.38525390625, 11.029541015625, 11.673828125, 12.318115234375, 12.96240234375, 13.606689453125, 14.2509765625, 14.895263671875, 15.53955078125, 16.183837890625, 16.828125]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 7.0, 6.0, 5.0, 11.0, 13.0, 17.0, 37.0, 51.0, 59.0, 112.0, 181.0, 228.0, 367.0, 579.0, 884.0, 1488.0, 2256.0, 3649.0, 6053.0, 9925.0, 16739.0, 28540.0, 50233.0, 94451.0, 220907.0, 1356829.0, 141103.0, 69067.0, 38035.0, 21808.0, 12814.0, 7849.0, 4830.0, 2866.0, 1820.0, 1180.0, 728.0, 449.0, 331.0, 199.0, 131.0, 110.0, 53.0, 53.0, 33.0, 18.0, 5.0, 10.0, 8.0, 4.0, 3.0, 4.0], "bins": [-1.9892578125, -1.9358673095703125, -1.882476806640625, -1.8290863037109375, -1.77569580078125, -1.7223052978515625, -1.668914794921875, -1.6155242919921875, -1.5621337890625, -1.5087432861328125, -1.455352783203125, -1.4019622802734375, -1.34857177734375, -1.2951812744140625, -1.241790771484375, -1.1884002685546875, -1.135009765625, -1.0816192626953125, -1.028228759765625, -0.9748382568359375, -0.92144775390625, -0.8680572509765625, -0.814666748046875, -0.7612762451171875, -0.7078857421875, -0.6544952392578125, -0.601104736328125, -0.5477142333984375, -0.49432373046875, -0.4409332275390625, -0.387542724609375, -0.3341522216796875, -0.28076171875, -0.2273712158203125, -0.173980712890625, -0.1205902099609375, -0.06719970703125, -0.0138092041015625, 0.039581298828125, 0.0929718017578125, 0.1463623046875, 0.1997528076171875, 0.253143310546875, 0.3065338134765625, 0.35992431640625, 0.4133148193359375, 0.466705322265625, 0.5200958251953125, 0.573486328125, 0.6268768310546875, 0.680267333984375, 0.7336578369140625, 0.78704833984375, 0.8404388427734375, 0.893829345703125, 0.9472198486328125, 1.0006103515625, 1.0540008544921875, 1.107391357421875, 1.1607818603515625, 1.21417236328125, 1.2675628662109375, 1.320953369140625, 1.3743438720703125, 1.427734375]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 5.0, 1.0, 6.0, 8.0, 9.0, 7.0, 10.0, 18.0, 31.0, 20.0, 45.0, 45.0, 76.0, 93.0, 107.0, 128.0, 106.0, 89.0, 51.0, 23.0, 24.0, 24.0, 20.0, 11.0, 8.0, 9.0, 8.0, 5.0, 6.0, 5.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0251617431640625, -0.02435159683227539, -0.02354145050048828, -0.022731304168701172, -0.021921157836914062, -0.021111011505126953, -0.020300865173339844, -0.019490718841552734, -0.018680572509765625, -0.017870426177978516, -0.017060279846191406, -0.016250133514404297, -0.015439987182617188, -0.014629840850830078, -0.013819694519042969, -0.01300954818725586, -0.01219940185546875, -0.01138925552368164, -0.010579109191894531, -0.009768962860107422, -0.008958816528320312, -0.008148670196533203, -0.007338523864746094, -0.006528377532958984, -0.005718231201171875, -0.004908084869384766, -0.004097938537597656, -0.003287792205810547, -0.0024776458740234375, -0.0016674995422363281, -0.0008573532104492188, -4.7206878662109375e-05, 0.000762939453125, 0.0015730857849121094, 0.0023832321166992188, 0.003193378448486328, 0.0040035247802734375, 0.004813671112060547, 0.005623817443847656, 0.006433963775634766, 0.007244110107421875, 0.008054256439208984, 0.008864402770996094, 0.009674549102783203, 0.010484695434570312, 0.011294841766357422, 0.012104988098144531, 0.01291513442993164, 0.01372528076171875, 0.01453542709350586, 0.015345573425292969, 0.016155719757080078, 0.016965866088867188, 0.017776012420654297, 0.018586158752441406, 0.019396305084228516, 0.020206451416015625, 0.021016597747802734, 0.021826744079589844, 0.022636890411376953, 0.023447036743164062, 0.024257183074951172, 0.02506732940673828, 0.02587747573852539, 0.0266876220703125]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 7.0, 8.0, 6.0, 6.0, 12.0, 8.0, 27.0, 26.0, 58.0, 57.0, 84.0, 163.0, 462.0, 2433.0, 52710.0, 979013.0, 11665.0, 1114.0, 282.0, 133.0, 86.0, 53.0, 50.0, 26.0, 9.0, 17.0, 10.0, 10.0, 3.0, 6.0, 3.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42578125, -0.412994384765625, -0.40020751953125, -0.387420654296875, -0.3746337890625, -0.361846923828125, -0.34906005859375, -0.336273193359375, -0.323486328125, -0.310699462890625, -0.29791259765625, -0.285125732421875, -0.2723388671875, -0.259552001953125, -0.24676513671875, -0.233978271484375, -0.22119140625, -0.208404541015625, -0.19561767578125, -0.182830810546875, -0.1700439453125, -0.157257080078125, -0.14447021484375, -0.131683349609375, -0.118896484375, -0.106109619140625, -0.09332275390625, -0.080535888671875, -0.0677490234375, -0.054962158203125, -0.04217529296875, -0.029388427734375, -0.0166015625, -0.003814697265625, 0.00897216796875, 0.021759033203125, 0.0345458984375, 0.047332763671875, 0.06011962890625, 0.072906494140625, 0.085693359375, 0.098480224609375, 0.11126708984375, 0.124053955078125, 0.1368408203125, 0.149627685546875, 0.16241455078125, 0.175201416015625, 0.18798828125, 0.200775146484375, 0.21356201171875, 0.226348876953125, 0.2391357421875, 0.251922607421875, 0.26470947265625, 0.277496337890625, 0.290283203125, 0.303070068359375, 0.31585693359375, 0.328643798828125, 0.3414306640625, 0.354217529296875, 0.36700439453125, 0.379791259765625, 0.392578125]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 7.0, 5.0, 13.0, 33.0, 67.0, 231.0, 453.0, 115.0, 54.0, 21.0, 12.0, 4.0, 0.0, 2.0], "bins": [-0.07912231981754303, -0.07771774381399155, -0.07631316781044006, -0.07490859180688858, -0.0735040158033371, -0.07209943979978561, -0.07069486379623413, -0.06929028779268265, -0.06788571178913116, -0.06648113578557968, -0.0650765597820282, -0.06367198377847672, -0.06226740777492523, -0.06086283177137375, -0.059458255767822266, -0.05805367976427078, -0.0566491037607193, -0.055244527757167816, -0.05383995175361633, -0.05243537575006485, -0.05103079974651337, -0.049626223742961884, -0.0482216477394104, -0.04681707173585892, -0.045412495732307434, -0.04400791972875595, -0.04260334372520447, -0.041198767721652985, -0.0397941917181015, -0.03838961571455002, -0.036985039710998535, -0.03558046370744705, -0.03417588397860527, -0.03277130797505379, -0.031366731971502304, -0.02996215596795082, -0.028557579964399338, -0.027153003960847855, -0.02574842795729637, -0.02434385195374489, -0.022939275950193405, -0.021534699946641922, -0.02013012394309044, -0.018725547939538956, -0.017320971935987473, -0.01591639593243599, -0.014511819928884506, -0.013107243925333023, -0.01170266792178154, -0.010298091918230057, -0.008893515914678574, -0.0074889399111270905, -0.006084363907575607, -0.004679787904024124, -0.003275211900472641, -0.0018706358969211578, -0.0004660598933696747, 0.0009385161101818085, 0.0023430921137332916, 0.0037476681172847748, 0.005152244120836258, 0.006556820124387741, 0.007961396127939224, 0.009365972131490707, 0.01077054813504219]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 1.0, 6.0, 3.0, 5.0, 3.0, 12.0, 14.0, 13.0, 19.0, 26.0, 25.0, 27.0, 14.0, 28.0, 46.0, 37.0, 34.0, 40.0, 49.0, 38.0, 52.0, 35.0, 48.0, 41.0, 39.0, 31.0, 34.0, 25.0, 36.0, 24.0, 32.0, 32.0, 22.0, 14.0, 15.0, 15.0, 9.0, 7.0, 10.0, 9.0, 7.0, 11.0, 4.0, 4.0, 7.0, 4.0, 1.0, 1.0, 1.0], "bins": [-0.0127488374710083, -0.012401076965034008, -0.012053316459059715, -0.011705555953085423, -0.01135779544711113, -0.011010034941136837, -0.010662274435162544, -0.010314513929188251, -0.009966753423213959, -0.009618992917239666, -0.009271232411265373, -0.00892347190529108, -0.008575711399316788, -0.008227950893342495, -0.007880190387368202, -0.0075324298813939095, -0.007184669375419617, -0.006836908869445324, -0.006489148363471031, -0.0061413878574967384, -0.005793627351522446, -0.005445866845548153, -0.00509810633957386, -0.004750345833599567, -0.004402585327625275, -0.004054824821650982, -0.003707064315676689, -0.0033593038097023964, -0.0030115433037281036, -0.002663782797753811, -0.002316022291779518, -0.0019682617858052254, -0.0016205012798309326, -0.0012727407738566399, -0.0009249802678823471, -0.0005772197619080544, -0.0002294592559337616, 0.00011830125004053116, 0.0004660617560148239, 0.0008138222619891167, 0.0011615827679634094, 0.0015093432739377022, 0.001857103779911995, 0.0022048642858862877, 0.0025526247918605804, 0.002900385297834873, 0.003248145803809166, 0.0035959063097834587, 0.0039436668157577515, 0.004291427321732044, 0.004639187827706337, 0.00498694833368063, 0.0053347088396549225, 0.005682469345629215, 0.006030229851603508, 0.006377990357577801, 0.0067257508635520935, 0.007073511369526386, 0.007421271875500679, 0.007769032381474972, 0.008116792887449265, 0.008464553393423557, 0.00881231389939785, 0.009160074405372143, 0.009507834911346436]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 6.0, 4.0, 2.0, 10.0, 13.0, 9.0, 16.0, 11.0, 16.0, 27.0, 27.0, 33.0, 18.0, 34.0, 32.0, 40.0, 34.0, 45.0, 37.0, 46.0, 55.0, 46.0, 46.0, 48.0, 39.0, 43.0, 33.0, 40.0, 26.0, 18.0, 24.0, 24.0, 16.0, 12.0, 12.0, 15.0, 9.0, 5.0, 12.0, 3.0, 5.0, 4.0, 4.0, 3.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-32.0, -30.9912109375, -29.982421875, -28.9736328125, -27.96484375, -26.9560546875, -25.947265625, -24.9384765625, -23.9296875, -22.9208984375, -21.912109375, -20.9033203125, -19.89453125, -18.8857421875, -17.876953125, -16.8681640625, -15.859375, -14.8505859375, -13.841796875, -12.8330078125, -11.82421875, -10.8154296875, -9.806640625, -8.7978515625, -7.7890625, -6.7802734375, -5.771484375, -4.7626953125, -3.75390625, -2.7451171875, -1.736328125, -0.7275390625, 0.28125, 1.2900390625, 2.298828125, 3.3076171875, 4.31640625, 5.3251953125, 6.333984375, 7.3427734375, 8.3515625, 9.3603515625, 10.369140625, 11.3779296875, 12.38671875, 13.3955078125, 14.404296875, 15.4130859375, 16.421875, 17.4306640625, 18.439453125, 19.4482421875, 20.45703125, 21.4658203125, 22.474609375, 23.4833984375, 24.4921875, 25.5009765625, 26.509765625, 27.5185546875, 28.52734375, 29.5361328125, 30.544921875, 31.5537109375, 32.5625]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 2.0, 5.0, 5.0, 6.0, 4.0, 8.0, 9.0, 17.0, 20.0, 27.0, 30.0, 47.0, 51.0, 62.0, 113.0, 120.0, 152.0, 201.0, 284.0, 396.0, 469.0, 630.0, 933.0, 1343.0, 2186.0, 3760.0, 8127.0, 25861.0, 181847.0, 715203.0, 76104.0, 15505.0, 5751.0, 3058.0, 1811.0, 1206.0, 777.0, 637.0, 426.0, 339.0, 233.0, 187.0, 140.0, 114.0, 74.0, 62.0, 56.0, 33.0, 35.0, 20.0, 19.0, 16.0, 10.0, 11.0, 7.0, 5.0, 5.0, 3.0, 3.0, 3.0, 1.0], "bins": [-38.96875, -37.7626953125, -36.556640625, -35.3505859375, -34.14453125, -32.9384765625, -31.732421875, -30.5263671875, -29.3203125, -28.1142578125, -26.908203125, -25.7021484375, -24.49609375, -23.2900390625, -22.083984375, -20.8779296875, -19.671875, -18.4658203125, -17.259765625, -16.0537109375, -14.84765625, -13.6416015625, -12.435546875, -11.2294921875, -10.0234375, -8.8173828125, -7.611328125, -6.4052734375, -5.19921875, -3.9931640625, -2.787109375, -1.5810546875, -0.375, 0.8310546875, 2.037109375, 3.2431640625, 4.44921875, 5.6552734375, 6.861328125, 8.0673828125, 9.2734375, 10.4794921875, 11.685546875, 12.8916015625, 14.09765625, 15.3037109375, 16.509765625, 17.7158203125, 18.921875, 20.1279296875, 21.333984375, 22.5400390625, 23.74609375, 24.9521484375, 26.158203125, 27.3642578125, 28.5703125, 29.7763671875, 30.982421875, 32.1884765625, 33.39453125, 34.6005859375, 35.806640625, 37.0126953125, 38.21875]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 6.0, 1.0, 2.0, 7.0, 5.0, 6.0, 9.0, 9.0, 9.0, 17.0, 20.0, 14.0, 16.0, 27.0, 23.0, 25.0, 29.0, 39.0, 32.0, 48.0, 52.0, 53.0, 70.0, 386.0, 1639.0, 71.0, 58.0, 42.0, 37.0, 49.0, 34.0, 39.0, 19.0, 22.0, 30.0, 22.0, 14.0, 15.0, 8.0, 9.0, 4.0, 8.0, 5.0, 5.0, 4.0, 5.0, 5.0, 2.0, 2.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.9375, -81.912109375, -78.88671875, -75.861328125, -72.8359375, -69.810546875, -66.78515625, -63.759765625, -60.734375, -57.708984375, -54.68359375, -51.658203125, -48.6328125, -45.607421875, -42.58203125, -39.556640625, -36.53125, -33.505859375, -30.48046875, -27.455078125, -24.4296875, -21.404296875, -18.37890625, -15.353515625, -12.328125, -9.302734375, -6.27734375, -3.251953125, -0.2265625, 2.798828125, 5.82421875, 8.849609375, 11.875, 14.900390625, 17.92578125, 20.951171875, 23.9765625, 27.001953125, 30.02734375, 33.052734375, 36.078125, 39.103515625, 42.12890625, 45.154296875, 48.1796875, 51.205078125, 54.23046875, 57.255859375, 60.28125, 63.306640625, 66.33203125, 69.357421875, 72.3828125, 75.408203125, 78.43359375, 81.458984375, 84.484375, 87.509765625, 90.53515625, 93.560546875, 96.5859375, 99.611328125, 102.63671875, 105.662109375, 108.6875]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 5.0, 4.0, 5.0, 6.0, 6.0, 9.0, 9.0, 11.0, 14.0, 17.0, 21.0, 39.0, 57.0, 62.0, 89.0, 169.0, 332.0, 829.0, 3311.0, 32280.0, 3078066.0, 25917.0, 2834.0, 723.0, 358.0, 165.0, 98.0, 67.0, 55.0, 33.0, 28.0, 28.0, 13.0, 10.0, 7.0, 11.0, 6.0, 2.0, 7.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-226.75, -219.54296875, -212.3359375, -205.12890625, -197.921875, -190.71484375, -183.5078125, -176.30078125, -169.09375, -161.88671875, -154.6796875, -147.47265625, -140.265625, -133.05859375, -125.8515625, -118.64453125, -111.4375, -104.23046875, -97.0234375, -89.81640625, -82.609375, -75.40234375, -68.1953125, -60.98828125, -53.78125, -46.57421875, -39.3671875, -32.16015625, -24.953125, -17.74609375, -10.5390625, -3.33203125, 3.875, 11.08203125, 18.2890625, 25.49609375, 32.703125, 39.91015625, 47.1171875, 54.32421875, 61.53125, 68.73828125, 75.9453125, 83.15234375, 90.359375, 97.56640625, 104.7734375, 111.98046875, 119.1875, 126.39453125, 133.6015625, 140.80859375, 148.015625, 155.22265625, 162.4296875, 169.63671875, 176.84375, 184.05078125, 191.2578125, 198.46484375, 205.671875, 212.87890625, 220.0859375, 227.29296875, 234.5]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 8.0, 6.0, 21.0, 48.0, 89.0, 162.0, 227.0, 170.0, 120.0, 65.0, 42.0, 29.0, 7.0, 6.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-287.5108337402344, -281.60833740234375, -275.70587158203125, -269.8033752441406, -263.9009094238281, -257.9984130859375, -252.09593200683594, -246.19345092773438, -240.29095458984375, -234.3884735107422, -228.48599243164062, -222.58349609375, -216.68101501464844, -210.77853393554688, -204.8760528564453, -198.97357177734375, -193.0710906982422, -187.16860961914062, -181.26612854003906, -175.3636474609375, -169.46115112304688, -163.5586700439453, -157.65618896484375, -151.7537078857422, -145.85122680664062, -139.94874572753906, -134.0462646484375, -128.14376831054688, -122.24128723144531, -116.33880615234375, -110.43632507324219, -104.53384399414062, -98.63134002685547, -92.7288589477539, -86.82637023925781, -80.92388916015625, -75.02140808105469, -69.1189193725586, -63.21643829345703, -57.3139533996582, -51.411468505859375, -45.50898361206055, -39.60649871826172, -33.704017639160156, -27.801532745361328, -21.8990478515625, -15.996566772460938, -10.09408187866211, -4.191596984863281, 1.7108869552612305, 7.613370895385742, 13.515853881835938, 19.418338775634766, 25.320823669433594, 31.223304748535156, 37.125789642333984, 43.02827453613281, 48.93075942993164, 54.83324432373047, 60.73572540283203, 66.63821411132812, 72.54069519042969, 78.44317626953125, 84.34565734863281, 90.2481460571289]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 4.0, 2.0, 5.0, 8.0, 10.0, 9.0, 11.0, 10.0, 17.0, 20.0, 23.0, 27.0, 23.0, 24.0, 18.0, 28.0, 46.0, 43.0, 32.0, 35.0, 52.0, 38.0, 48.0, 36.0, 35.0, 44.0, 33.0, 30.0, 26.0, 30.0, 23.0, 34.0, 25.0, 22.0, 18.0, 17.0, 16.0, 13.0, 12.0, 5.0, 8.0, 8.0, 7.0, 2.0, 8.0, 3.0, 7.0, 2.0, 2.0, 0.0, 0.0, 6.0, 3.0], "bins": [-278.3049621582031, -269.94921875, -261.59344482421875, -253.23768615722656, -244.88192749023438, -236.52618408203125, -228.17042541503906, -219.81466674804688, -211.4589080810547, -203.1031494140625, -194.7473907470703, -186.39163208007812, -178.035888671875, -169.68011474609375, -161.32437133789062, -152.96861267089844, -144.61285400390625, -136.25709533691406, -127.90133666992188, -119.54558563232422, -111.18982696533203, -102.83406829833984, -94.47831726074219, -86.12255859375, -77.76679992675781, -69.41104125976562, -61.0552864074707, -52.69953155517578, -44.343772888183594, -35.988014221191406, -27.632259368896484, -19.276504516601562, -10.920745849609375, -2.5649890899658203, 5.790767669677734, 14.146524429321289, 22.502281188964844, 30.85803985595703, 39.21379470825195, 47.569549560546875, 55.92530822753906, 64.28106689453125, 72.63682556152344, 80.9925765991211, 89.34833526611328, 97.70409393310547, 106.05984497070312, 114.41560363769531, 122.7713623046875, 131.1271209716797, 139.48287963867188, 147.83863830566406, 156.19439697265625, 164.55014038085938, 172.90589904785156, 181.26165771484375, 189.61741638183594, 197.97317504882812, 206.3289337158203, 214.6846923828125, 223.04043579101562, 231.39620971679688, 239.751953125, 248.1077117919922, 256.4634704589844]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 4.0, 1.0, 5.0, 4.0, 8.0, 9.0, 8.0, 13.0, 19.0, 17.0, 25.0, 19.0, 27.0, 21.0, 24.0, 35.0, 46.0, 33.0, 42.0, 35.0, 54.0, 44.0, 49.0, 47.0, 51.0, 50.0, 40.0, 30.0, 37.0, 37.0, 22.0, 17.0, 22.0, 20.0, 16.0, 9.0, 15.0, 11.0, 9.0, 9.0, 7.0, 4.0, 4.0, 3.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-33.15625, -32.12353515625, -31.0908203125, -30.05810546875, -29.025390625, -27.99267578125, -26.9599609375, -25.92724609375, -24.89453125, -23.86181640625, -22.8291015625, -21.79638671875, -20.763671875, -19.73095703125, -18.6982421875, -17.66552734375, -16.6328125, -15.60009765625, -14.5673828125, -13.53466796875, -12.501953125, -11.46923828125, -10.4365234375, -9.40380859375, -8.37109375, -7.33837890625, -6.3056640625, -5.27294921875, -4.240234375, -3.20751953125, -2.1748046875, -1.14208984375, -0.109375, 0.92333984375, 1.9560546875, 2.98876953125, 4.021484375, 5.05419921875, 6.0869140625, 7.11962890625, 8.15234375, 9.18505859375, 10.2177734375, 11.25048828125, 12.283203125, 13.31591796875, 14.3486328125, 15.38134765625, 16.4140625, 17.44677734375, 18.4794921875, 19.51220703125, 20.544921875, 21.57763671875, 22.6103515625, 23.64306640625, 24.67578125, 25.70849609375, 26.7412109375, 27.77392578125, 28.806640625, 29.83935546875, 30.8720703125, 31.90478515625, 32.9375]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 6.0, 5.0, 6.0, 12.0, 26.0, 30.0, 37.0, 50.0, 78.0, 112.0, 164.0, 225.0, 364.0, 562.0, 879.0, 1479.0, 2468.0, 4379.0, 8417.0, 25250.0, 399412.0, 3415528.0, 295265.0, 21600.0, 7760.0, 3986.0, 2297.0, 1318.0, 892.0, 537.0, 362.0, 239.0, 157.0, 106.0, 73.0, 58.0, 43.0, 30.0, 18.0, 9.0, 15.0, 6.0, 6.0, 5.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-93.8125, -91.0078125, -88.203125, -85.3984375, -82.59375, -79.7890625, -76.984375, -74.1796875, -71.375, -68.5703125, -65.765625, -62.9609375, -60.15625, -57.3515625, -54.546875, -51.7421875, -48.9375, -46.1328125, -43.328125, -40.5234375, -37.71875, -34.9140625, -32.109375, -29.3046875, -26.5, -23.6953125, -20.890625, -18.0859375, -15.28125, -12.4765625, -9.671875, -6.8671875, -4.0625, -1.2578125, 1.546875, 4.3515625, 7.15625, 9.9609375, 12.765625, 15.5703125, 18.375, 21.1796875, 23.984375, 26.7890625, 29.59375, 32.3984375, 35.203125, 38.0078125, 40.8125, 43.6171875, 46.421875, 49.2265625, 52.03125, 54.8359375, 57.640625, 60.4453125, 63.25, 66.0546875, 68.859375, 71.6640625, 74.46875, 77.2734375, 80.078125, 82.8828125, 85.6875]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 3.0, 2.0, 3.0, 4.0, 6.0, 6.0, 12.0, 6.0, 10.0, 12.0, 16.0, 18.0, 25.0, 36.0, 69.0, 116.0, 358.0, 831.0, 1250.0, 696.0, 275.0, 125.0, 47.0, 27.0, 26.0, 21.0, 9.0, 13.0, 13.0, 11.0, 8.0, 5.0, 5.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-108.625, -105.466796875, -102.30859375, -99.150390625, -95.9921875, -92.833984375, -89.67578125, -86.517578125, -83.359375, -80.201171875, -77.04296875, -73.884765625, -70.7265625, -67.568359375, -64.41015625, -61.251953125, -58.09375, -54.935546875, -51.77734375, -48.619140625, -45.4609375, -42.302734375, -39.14453125, -35.986328125, -32.828125, -29.669921875, -26.51171875, -23.353515625, -20.1953125, -17.037109375, -13.87890625, -10.720703125, -7.5625, -4.404296875, -1.24609375, 1.912109375, 5.0703125, 8.228515625, 11.38671875, 14.544921875, 17.703125, 20.861328125, 24.01953125, 27.177734375, 30.3359375, 33.494140625, 36.65234375, 39.810546875, 42.96875, 46.126953125, 49.28515625, 52.443359375, 55.6015625, 58.759765625, 61.91796875, 65.076171875, 68.234375, 71.392578125, 74.55078125, 77.708984375, 80.8671875, 84.025390625, 87.18359375, 90.341796875, 93.5]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 4.0, 6.0, 9.0, 20.0, 23.0, 27.0, 36.0, 54.0, 76.0, 100.0, 140.0, 211.0, 323.0, 475.0, 708.0, 963.0, 1516.0, 2255.0, 3859.0, 6191.0, 10559.0, 19235.0, 41458.0, 173536.0, 3251033.0, 558261.0, 63885.0, 25858.0, 13056.0, 7649.0, 4465.0, 2720.0, 1774.0, 1171.0, 819.0, 550.0, 365.0, 267.0, 191.0, 123.0, 79.0, 81.0, 41.0, 35.0, 29.0, 15.0, 12.0, 6.0, 8.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-99.125, -95.896484375, -92.66796875, -89.439453125, -86.2109375, -82.982421875, -79.75390625, -76.525390625, -73.296875, -70.068359375, -66.83984375, -63.611328125, -60.3828125, -57.154296875, -53.92578125, -50.697265625, -47.46875, -44.240234375, -41.01171875, -37.783203125, -34.5546875, -31.326171875, -28.09765625, -24.869140625, -21.640625, -18.412109375, -15.18359375, -11.955078125, -8.7265625, -5.498046875, -2.26953125, 0.958984375, 4.1875, 7.416015625, 10.64453125, 13.873046875, 17.1015625, 20.330078125, 23.55859375, 26.787109375, 30.015625, 33.244140625, 36.47265625, 39.701171875, 42.9296875, 46.158203125, 49.38671875, 52.615234375, 55.84375, 59.072265625, 62.30078125, 65.529296875, 68.7578125, 71.986328125, 75.21484375, 78.443359375, 81.671875, 84.900390625, 88.12890625, 91.357421875, 94.5859375, 97.814453125, 101.04296875, 104.271484375, 107.5]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 7.0, 13.0, 21.0, 48.0, 58.0, 98.0, 248.0, 266.0, 121.0, 56.0, 22.0, 19.0, 22.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-311.68115234375, -289.49346923828125, -267.3057861328125, -245.1180877685547, -222.93038940429688, -200.74270629882812, -178.55502319335938, -156.36732482910156, -134.1796417236328, -111.99195098876953, -89.80426025390625, -67.6165771484375, -45.42888641357422, -23.241195678710938, -1.0535125732421875, 21.134185791015625, 43.321868896484375, 65.50955963134766, 87.69725036621094, 109.88493347167969, 132.0726318359375, 154.26031494140625, 176.447998046875, 198.6356964111328, 220.82337951660156, 243.0110626220703, 265.1987609863281, 287.3864440917969, 309.5741271972656, 331.7618408203125, 353.94952392578125, 376.13720703125, 398.32489013671875, 420.5125732421875, 442.70025634765625, 464.887939453125, 487.0756530761719, 509.2633361816406, 531.4510498046875, 553.6387329101562, 575.826416015625, 598.0140991210938, 620.2017822265625, 642.3894653320312, 664.5771484375, 686.764892578125, 708.9525146484375, 731.1402587890625, 753.327880859375, 775.5155639648438, 797.7032470703125, 819.8909301757812, 842.07861328125, 864.266357421875, 886.4539794921875, 908.6417236328125, 930.8294067382812, 953.01708984375, 975.2047729492188, 997.3924560546875, 1019.5801391601562, 1041.767822265625, 1063.95556640625, 1086.1431884765625, 1108.3309326171875]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 6.0, 6.0, 4.0, 6.0, 3.0, 14.0, 10.0, 5.0, 11.0, 15.0, 30.0, 18.0, 26.0, 29.0, 22.0, 25.0, 36.0, 33.0, 30.0, 22.0, 40.0, 36.0, 33.0, 29.0, 37.0, 40.0, 31.0, 37.0, 37.0, 43.0, 22.0, 25.0, 29.0, 28.0, 24.0, 31.0, 18.0, 21.0, 13.0, 6.0, 10.0, 11.0, 14.0, 6.0, 8.0, 4.0, 10.0, 2.0, 2.0, 8.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-197.08865356445312, -190.61080932617188, -184.1329803466797, -177.65513610839844, -171.1772918701172, -164.699462890625, -158.22161865234375, -151.7437744140625, -145.26593017578125, -138.7880859375, -132.3102569580078, -125.83241271972656, -119.35456848144531, -112.8767318725586, -106.39889526367188, -99.92105102539062, -93.4432144165039, -86.96537780761719, -80.48753356933594, -74.00969696044922, -67.53185272216797, -61.05401611328125, -54.576175689697266, -48.09833526611328, -41.6204948425293, -35.14265441894531, -28.664813995361328, -22.186975479125977, -15.709135055541992, -9.23129653930664, -2.7534561157226562, 3.724384307861328, 10.202224731445312, 16.680065155029297, 23.15790557861328, 29.635744094848633, 36.11358642578125, 42.59142303466797, 49.06926345825195, 55.54710388183594, 62.02494430541992, 68.5027847290039, 74.98062133789062, 81.45846557617188, 87.9363021850586, 94.41413879394531, 100.89198303222656, 107.36982727050781, 113.84766387939453, 120.32550048828125, 126.8033447265625, 133.28118896484375, 139.75901794433594, 146.2368621826172, 152.71470642089844, 159.19253540039062, 165.67037963867188, 172.14822387695312, 178.6260528564453, 185.10389709472656, 191.5817413330078, 198.0595703125, 204.53741455078125, 211.0152587890625, 217.49310302734375]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 4.0, 2.0, 5.0, 10.0, 12.0, 9.0, 9.0, 15.0, 18.0, 22.0, 25.0, 30.0, 28.0, 25.0, 30.0, 35.0, 36.0, 44.0, 34.0, 45.0, 46.0, 53.0, 52.0, 49.0, 38.0, 25.0, 43.0, 36.0, 28.0, 33.0, 32.0, 18.0, 17.0, 14.0, 14.0, 11.0, 14.0, 10.0, 8.0, 7.0, 6.0, 5.0, 2.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-36.75, -35.676513671875, -34.60302734375, -33.529541015625, -32.4560546875, -31.382568359375, -30.30908203125, -29.235595703125, -28.162109375, -27.088623046875, -26.01513671875, -24.941650390625, -23.8681640625, -22.794677734375, -21.72119140625, -20.647705078125, -19.57421875, -18.500732421875, -17.42724609375, -16.353759765625, -15.2802734375, -14.206787109375, -13.13330078125, -12.059814453125, -10.986328125, -9.912841796875, -8.83935546875, -7.765869140625, -6.6923828125, -5.618896484375, -4.54541015625, -3.471923828125, -2.3984375, -1.324951171875, -0.25146484375, 0.822021484375, 1.8955078125, 2.968994140625, 4.04248046875, 5.115966796875, 6.189453125, 7.262939453125, 8.33642578125, 9.409912109375, 10.4833984375, 11.556884765625, 12.63037109375, 13.703857421875, 14.77734375, 15.850830078125, 16.92431640625, 17.997802734375, 19.0712890625, 20.144775390625, 21.21826171875, 22.291748046875, 23.365234375, 24.438720703125, 25.51220703125, 26.585693359375, 27.6591796875, 28.732666015625, 29.80615234375, 30.879638671875, 31.953125]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 7.0, 20.0, 20.0, 36.0, 52.0, 64.0, 144.0, 191.0, 298.0, 447.0, 737.0, 1156.0, 1850.0, 2948.0, 4915.0, 8095.0, 13425.0, 22826.0, 39408.0, 72810.0, 150662.0, 326391.0, 197865.0, 89212.0, 47613.0, 27302.0, 15703.0, 9341.0, 5737.0, 3458.0, 2102.0, 1400.0, 880.0, 523.0, 323.0, 209.0, 128.0, 95.0, 56.0, 31.0, 22.0, 19.0, 10.0, 8.0, 8.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-2.134765625, -2.0731658935546875, -2.011566162109375, -1.9499664306640625, -1.88836669921875, -1.8267669677734375, -1.765167236328125, -1.7035675048828125, -1.6419677734375, -1.5803680419921875, -1.518768310546875, -1.4571685791015625, -1.39556884765625, -1.3339691162109375, -1.272369384765625, -1.2107696533203125, -1.149169921875, -1.0875701904296875, -1.025970458984375, -0.9643707275390625, -0.90277099609375, -0.8411712646484375, -0.779571533203125, -0.7179718017578125, -0.6563720703125, -0.5947723388671875, -0.533172607421875, -0.4715728759765625, -0.40997314453125, -0.3483734130859375, -0.286773681640625, -0.2251739501953125, -0.16357421875, -0.1019744873046875, -0.040374755859375, 0.0212249755859375, 0.08282470703125, 0.1444244384765625, 0.206024169921875, 0.2676239013671875, 0.3292236328125, 0.3908233642578125, 0.452423095703125, 0.5140228271484375, 0.57562255859375, 0.6372222900390625, 0.698822021484375, 0.7604217529296875, 0.822021484375, 0.8836212158203125, 0.945220947265625, 1.0068206787109375, 1.06842041015625, 1.1300201416015625, 1.191619873046875, 1.2532196044921875, 1.3148193359375, 1.3764190673828125, 1.438018798828125, 1.4996185302734375, 1.56121826171875, 1.6228179931640625, 1.684417724609375, 1.7460174560546875, 1.8076171875]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 2.0, 5.0, 4.0, 6.0, 6.0, 11.0, 14.0, 17.0, 20.0, 20.0, 24.0, 28.0, 24.0, 31.0, 33.0, 35.0, 34.0, 39.0, 37.0, 41.0, 52.0, 1063.0, 31.0, 43.0, 27.0, 51.0, 24.0, 37.0, 32.0, 28.0, 27.0, 26.0, 26.0, 25.0, 16.0, 20.0, 10.0, 10.0, 14.0, 10.0, 7.0, 2.0, 3.0, 7.0, 4.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.890625, -21.21728515625, -20.5439453125, -19.87060546875, -19.197265625, -18.52392578125, -17.8505859375, -17.17724609375, -16.50390625, -15.83056640625, -15.1572265625, -14.48388671875, -13.810546875, -13.13720703125, -12.4638671875, -11.79052734375, -11.1171875, -10.44384765625, -9.7705078125, -9.09716796875, -8.423828125, -7.75048828125, -7.0771484375, -6.40380859375, -5.73046875, -5.05712890625, -4.3837890625, -3.71044921875, -3.037109375, -2.36376953125, -1.6904296875, -1.01708984375, -0.34375, 0.32958984375, 1.0029296875, 1.67626953125, 2.349609375, 3.02294921875, 3.6962890625, 4.36962890625, 5.04296875, 5.71630859375, 6.3896484375, 7.06298828125, 7.736328125, 8.40966796875, 9.0830078125, 9.75634765625, 10.4296875, 11.10302734375, 11.7763671875, 12.44970703125, 13.123046875, 13.79638671875, 14.4697265625, 15.14306640625, 15.81640625, 16.48974609375, 17.1630859375, 17.83642578125, 18.509765625, 19.18310546875, 19.8564453125, 20.52978515625, 21.203125]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 7.0, 10.0, 13.0, 17.0, 23.0, 25.0, 56.0, 67.0, 111.0, 155.0, 260.0, 379.0, 607.0, 952.0, 1425.0, 2349.0, 3761.0, 6117.0, 10216.0, 17241.0, 29579.0, 52700.0, 100934.0, 253500.0, 1333392.0, 130802.0, 64690.0, 35883.0, 20623.0, 11997.0, 7352.0, 4335.0, 2704.0, 1673.0, 1106.0, 695.0, 462.0, 283.0, 216.0, 131.0, 94.0, 70.0, 35.0, 34.0, 16.0, 14.0, 11.0, 10.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.853515625, -1.7958984375, -1.73828125, -1.6806640625, -1.623046875, -1.5654296875, -1.5078125, -1.4501953125, -1.392578125, -1.3349609375, -1.27734375, -1.2197265625, -1.162109375, -1.1044921875, -1.046875, -0.9892578125, -0.931640625, -0.8740234375, -0.81640625, -0.7587890625, -0.701171875, -0.6435546875, -0.5859375, -0.5283203125, -0.470703125, -0.4130859375, -0.35546875, -0.2978515625, -0.240234375, -0.1826171875, -0.125, -0.0673828125, -0.009765625, 0.0478515625, 0.10546875, 0.1630859375, 0.220703125, 0.2783203125, 0.3359375, 0.3935546875, 0.451171875, 0.5087890625, 0.56640625, 0.6240234375, 0.681640625, 0.7392578125, 0.796875, 0.8544921875, 0.912109375, 0.9697265625, 1.02734375, 1.0849609375, 1.142578125, 1.2001953125, 1.2578125, 1.3154296875, 1.373046875, 1.4306640625, 1.48828125, 1.5458984375, 1.603515625, 1.6611328125, 1.71875, 1.7763671875, 1.833984375]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 6.0, 0.0, 7.0, 5.0, 6.0, 4.0, 9.0, 11.0, 15.0, 20.0, 20.0, 22.0, 32.0, 47.0, 40.0, 44.0, 63.0, 83.0, 113.0, 89.0, 45.0, 54.0, 34.0, 40.0, 28.0, 39.0, 22.0, 20.0, 14.0, 14.0, 14.0, 12.0, 2.0, 8.0, 4.0, 4.0, 6.0, 3.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0248870849609375, -0.024206876754760742, -0.023526668548583984, -0.022846460342407227, -0.02216625213623047, -0.02148604393005371, -0.020805835723876953, -0.020125627517700195, -0.019445419311523438, -0.01876521110534668, -0.018085002899169922, -0.017404794692993164, -0.016724586486816406, -0.01604437828063965, -0.01536417007446289, -0.014683961868286133, -0.014003753662109375, -0.013323545455932617, -0.01264333724975586, -0.011963129043579102, -0.011282920837402344, -0.010602712631225586, -0.009922504425048828, -0.00924229621887207, -0.008562088012695312, -0.007881879806518555, -0.007201671600341797, -0.006521463394165039, -0.005841255187988281, -0.0051610469818115234, -0.004480838775634766, -0.003800630569458008, -0.00312042236328125, -0.002440214157104492, -0.0017600059509277344, -0.0010797977447509766, -0.00039958953857421875, 0.00028061866760253906, 0.0009608268737792969, 0.0016410350799560547, 0.0023212432861328125, 0.0030014514923095703, 0.003681659698486328, 0.004361867904663086, 0.005042076110839844, 0.0057222843170166016, 0.006402492523193359, 0.007082700729370117, 0.007762908935546875, 0.008443117141723633, 0.00912332534790039, 0.009803533554077148, 0.010483741760253906, 0.011163949966430664, 0.011844158172607422, 0.01252436637878418, 0.013204574584960938, 0.013884782791137695, 0.014564990997314453, 0.015245199203491211, 0.01592540740966797, 0.016605615615844727, 0.017285823822021484, 0.017966032028198242, 0.018646240234375]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 7.0, 2.0, 4.0, 9.0, 5.0, 4.0, 6.0, 11.0, 15.0, 22.0, 27.0, 32.0, 44.0, 56.0, 70.0, 102.0, 161.0, 250.0, 829.0, 6108.0, 141603.0, 878285.0, 18278.0, 1587.0, 410.0, 185.0, 126.0, 95.0, 51.0, 47.0, 32.0, 26.0, 20.0, 16.0, 8.0, 5.0, 7.0, 5.0, 6.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2939453125, -0.2835235595703125, -0.273101806640625, -0.2626800537109375, -0.25225830078125, -0.2418365478515625, -0.231414794921875, -0.2209930419921875, -0.2105712890625, -0.2001495361328125, -0.189727783203125, -0.1793060302734375, -0.16888427734375, -0.1584625244140625, -0.148040771484375, -0.1376190185546875, -0.127197265625, -0.1167755126953125, -0.106353759765625, -0.0959320068359375, -0.08551025390625, -0.0750885009765625, -0.064666748046875, -0.0542449951171875, -0.0438232421875, -0.0334014892578125, -0.022979736328125, -0.0125579833984375, -0.00213623046875, 0.0082855224609375, 0.018707275390625, 0.0291290283203125, 0.03955078125, 0.0499725341796875, 0.060394287109375, 0.0708160400390625, 0.08123779296875, 0.0916595458984375, 0.102081298828125, 0.1125030517578125, 0.1229248046875, 0.1333465576171875, 0.143768310546875, 0.1541900634765625, 0.16461181640625, 0.1750335693359375, 0.185455322265625, 0.1958770751953125, 0.206298828125, 0.2167205810546875, 0.227142333984375, 0.2375640869140625, 0.24798583984375, 0.2584075927734375, 0.268829345703125, 0.2792510986328125, 0.2896728515625, 0.3000946044921875, 0.310516357421875, 0.3209381103515625, 0.33135986328125, 0.3417816162109375, 0.352203369140625, 0.3626251220703125, 0.373046875]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 25.0, 72.0, 260.0, 540.0, 81.0, 26.0, 5.0, 4.0], "bins": [-0.1447385996580124, -0.14229464530944824, -0.1398507058620453, -0.13740675151348114, -0.134962797164917, -0.13251885771751404, -0.1300749033689499, -0.12763094902038574, -0.1251869946718216, -0.12274304777383804, -0.1202990934252739, -0.11785514652729034, -0.1154111921787262, -0.11296724528074265, -0.1105232983827591, -0.10807934403419495, -0.10563540458679199, -0.10319145768880844, -0.1007475033402443, -0.09830355644226074, -0.0958596020936966, -0.09341565519571304, -0.09097170829772949, -0.08852775394916534, -0.0860837996006012, -0.08363985270261765, -0.0811958983540535, -0.07875195145606995, -0.0763079971075058, -0.07386405020952225, -0.0714201033115387, -0.06897614896297455, -0.0665321946144104, -0.06408824771642685, -0.0616442933678627, -0.05920034646987915, -0.0567563958466053, -0.05431244522333145, -0.0518684946000576, -0.04942454397678375, -0.0469805970788002, -0.04453664645552635, -0.0420926958322525, -0.03964874893426895, -0.0372047983109951, -0.03476084768772125, -0.0323168970644474, -0.029872948303818703, -0.027428999543190002, -0.024985048919916153, -0.022541100159287453, -0.020097149536013603, -0.017653200775384903, -0.015209250152111053, -0.012765299528837204, -0.010321350768208504, -0.007877400144934654, -0.005433450452983379, -0.002989500295370817, -0.000545550137758255, 0.0018983995541930199, 0.004342349246144295, 0.006786299869418144, 0.009230248630046844, 0.011674199253320694]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 5.0, 4.0, 3.0, 4.0, 6.0, 4.0, 15.0, 10.0, 9.0, 18.0, 19.0, 17.0, 25.0, 22.0, 34.0, 32.0, 34.0, 41.0, 48.0, 41.0, 26.0, 55.0, 58.0, 45.0, 53.0, 35.0, 49.0, 45.0, 36.0, 33.0, 34.0, 24.0, 16.0, 25.0, 16.0, 21.0, 11.0, 11.0, 13.0, 2.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.016730785369873047, -0.016304954886436462, -0.01587912254035473, -0.01545329112559557, -0.01502745971083641, -0.014601628296077251, -0.014175796881318092, -0.013749965466558933, -0.013324134051799774, -0.012898302637040615, -0.012472471222281456, -0.012046639807522297, -0.011620808392763138, -0.011194976978003979, -0.01076914556324482, -0.01034331414848566, -0.009917482733726501, -0.009491651318967342, -0.009065819904208183, -0.008639988489449024, -0.008214157074689865, -0.007788325659930706, -0.007362494245171547, -0.006936662830412388, -0.006510831415653229, -0.00608500000089407, -0.005659168586134911, -0.0052333371713757515, -0.004807505756616592, -0.004381674341857433, -0.003955842927098274, -0.003530011512339115, -0.003104180097579956, -0.002678348682820797, -0.002252517268061638, -0.0018266858533024788, -0.0014008544385433197, -0.0009750230237841606, -0.0005491916090250015, -0.00012336019426584244, 0.00030247122049331665, 0.0007283026352524757, 0.0011541340500116348, 0.001579965464770794, 0.002005796879529953, 0.002431628294289112, 0.002857459709048271, 0.0032832911238074303, 0.0037091225385665894, 0.0041349539533257484, 0.0045607853680849075, 0.004986616782844067, 0.005412448197603226, 0.005838279612362385, 0.006264111027121544, 0.006689942441880703, 0.007115773856639862, 0.007541605271399021, 0.00796743668615818, 0.00839326810091734, 0.008819099515676498, 0.009244930930435658, 0.009670762345194817, 0.010096593759953976, 0.010522425174713135]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 4.0, 2.0, 5.0, 10.0, 12.0, 9.0, 9.0, 15.0, 18.0, 22.0, 25.0, 30.0, 28.0, 25.0, 30.0, 35.0, 36.0, 44.0, 34.0, 45.0, 46.0, 53.0, 52.0, 49.0, 38.0, 25.0, 43.0, 36.0, 28.0, 33.0, 32.0, 18.0, 17.0, 14.0, 14.0, 11.0, 14.0, 10.0, 8.0, 7.0, 6.0, 5.0, 2.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-36.75, -35.676513671875, -34.60302734375, -33.529541015625, -32.4560546875, -31.382568359375, -30.30908203125, -29.235595703125, -28.162109375, -27.088623046875, -26.01513671875, -24.941650390625, -23.8681640625, -22.794677734375, -21.72119140625, -20.647705078125, -19.57421875, -18.500732421875, -17.42724609375, -16.353759765625, -15.2802734375, -14.206787109375, -13.13330078125, -12.059814453125, -10.986328125, -9.912841796875, -8.83935546875, -7.765869140625, -6.6923828125, -5.618896484375, -4.54541015625, -3.471923828125, -2.3984375, -1.324951171875, -0.25146484375, 0.822021484375, 1.8955078125, 2.968994140625, 4.04248046875, 5.115966796875, 6.189453125, 7.262939453125, 8.33642578125, 9.409912109375, 10.4833984375, 11.556884765625, 12.63037109375, 13.703857421875, 14.77734375, 15.850830078125, 16.92431640625, 17.997802734375, 19.0712890625, 20.144775390625, 21.21826171875, 22.291748046875, 23.365234375, 24.438720703125, 25.51220703125, 26.585693359375, 27.6591796875, 28.732666015625, 29.80615234375, 30.879638671875, 31.953125]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 7.0, 3.0, 5.0, 11.0, 16.0, 22.0, 32.0, 25.0, 51.0, 71.0, 98.0, 163.0, 248.0, 348.0, 576.0, 944.0, 1756.0, 3195.0, 6523.0, 14515.0, 39111.0, 132827.0, 513970.0, 234452.0, 60439.0, 20710.0, 8832.0, 4191.0, 2243.0, 1204.0, 746.0, 414.0, 249.0, 159.0, 103.0, 76.0, 56.0, 38.0, 35.0, 27.0, 16.0, 23.0, 8.0, 7.0, 8.0, 8.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-21.234375, -20.622314453125, -20.01025390625, -19.398193359375, -18.7861328125, -18.174072265625, -17.56201171875, -16.949951171875, -16.337890625, -15.725830078125, -15.11376953125, -14.501708984375, -13.8896484375, -13.277587890625, -12.66552734375, -12.053466796875, -11.44140625, -10.829345703125, -10.21728515625, -9.605224609375, -8.9931640625, -8.381103515625, -7.76904296875, -7.156982421875, -6.544921875, -5.932861328125, -5.32080078125, -4.708740234375, -4.0966796875, -3.484619140625, -2.87255859375, -2.260498046875, -1.6484375, -1.036376953125, -0.42431640625, 0.187744140625, 0.7998046875, 1.411865234375, 2.02392578125, 2.635986328125, 3.248046875, 3.860107421875, 4.47216796875, 5.084228515625, 5.6962890625, 6.308349609375, 6.92041015625, 7.532470703125, 8.14453125, 8.756591796875, 9.36865234375, 9.980712890625, 10.5927734375, 11.204833984375, 11.81689453125, 12.428955078125, 13.041015625, 13.653076171875, 14.26513671875, 14.877197265625, 15.4892578125, 16.101318359375, 16.71337890625, 17.325439453125, 17.9375]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 0.0, 4.0, 3.0, 6.0, 8.0, 9.0, 9.0, 16.0, 11.0, 16.0, 21.0, 29.0, 16.0, 36.0, 30.0, 42.0, 51.0, 36.0, 34.0, 71.0, 144.0, 1897.0, 100.0, 43.0, 56.0, 33.0, 37.0, 45.0, 30.0, 37.0, 27.0, 25.0, 20.0, 17.0, 25.0, 14.0, 16.0, 9.0, 8.0, 10.0, 3.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0], "bins": [-123.75, -120.2509765625, -116.751953125, -113.2529296875, -109.75390625, -106.2548828125, -102.755859375, -99.2568359375, -95.7578125, -92.2587890625, -88.759765625, -85.2607421875, -81.76171875, -78.2626953125, -74.763671875, -71.2646484375, -67.765625, -64.2666015625, -60.767578125, -57.2685546875, -53.76953125, -50.2705078125, -46.771484375, -43.2724609375, -39.7734375, -36.2744140625, -32.775390625, -29.2763671875, -25.77734375, -22.2783203125, -18.779296875, -15.2802734375, -11.78125, -8.2822265625, -4.783203125, -1.2841796875, 2.21484375, 5.7138671875, 9.212890625, 12.7119140625, 16.2109375, 19.7099609375, 23.208984375, 26.7080078125, 30.20703125, 33.7060546875, 37.205078125, 40.7041015625, 44.203125, 47.7021484375, 51.201171875, 54.7001953125, 58.19921875, 61.6982421875, 65.197265625, 68.6962890625, 72.1953125, 75.6943359375, 79.193359375, 82.6923828125, 86.19140625, 89.6904296875, 93.189453125, 96.6884765625, 100.1875]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 4.0, 2.0, 14.0, 3.0, 11.0, 10.0, 13.0, 19.0, 31.0, 22.0, 36.0, 45.0, 77.0, 65.0, 104.0, 145.0, 175.0, 290.0, 669.0, 2367.0, 520663.0, 2616517.0, 2691.0, 737.0, 272.0, 185.0, 140.0, 91.0, 82.0, 46.0, 29.0, 43.0, 23.0, 14.0, 12.0, 16.0, 9.0, 11.0, 8.0, 4.0, 2.0, 3.0, 1.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-194.0, -187.08203125, -180.1640625, -173.24609375, -166.328125, -159.41015625, -152.4921875, -145.57421875, -138.65625, -131.73828125, -124.8203125, -117.90234375, -110.984375, -104.06640625, -97.1484375, -90.23046875, -83.3125, -76.39453125, -69.4765625, -62.55859375, -55.640625, -48.72265625, -41.8046875, -34.88671875, -27.96875, -21.05078125, -14.1328125, -7.21484375, -0.296875, 6.62109375, 13.5390625, 20.45703125, 27.375, 34.29296875, 41.2109375, 48.12890625, 55.046875, 61.96484375, 68.8828125, 75.80078125, 82.71875, 89.63671875, 96.5546875, 103.47265625, 110.390625, 117.30859375, 124.2265625, 131.14453125, 138.0625, 144.98046875, 151.8984375, 158.81640625, 165.734375, 172.65234375, 179.5703125, 186.48828125, 193.40625, 200.32421875, 207.2421875, 214.16015625, 221.078125, 227.99609375, 234.9140625, 241.83203125, 248.75]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [983.0, 34.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.62297058105469, 16.221084594726562, 67.06513977050781, 117.90919494628906, 168.7532501220703, 219.59730529785156, 270.44134521484375, 321.285400390625, 372.12945556640625, 422.9735107421875, 473.81756591796875, 524.66162109375, 575.5056762695312, 626.3497314453125, 677.1937866210938, 728.037841796875, 778.8818969726562, 829.7259521484375, 880.5700073242188, 931.4140625, 982.2581176757812, 1033.1021728515625, 1083.9462890625, 1134.790283203125, 1185.6343994140625, 1236.478515625, 1287.322509765625, 1338.16650390625, 1389.0106201171875, 1439.854736328125, 1490.69873046875, 1541.542724609375, 1592.38671875, 1643.230712890625, 1694.0748291015625, 1744.9189453125, 1795.762939453125, 1846.60693359375, 1897.4510498046875, 1948.295166015625, 1999.13916015625, 2049.983154296875, 2100.8271484375, 2151.67138671875, 2202.515380859375, 2253.359375, 2304.20361328125, 2355.047607421875, 2405.8916015625, 2456.735595703125, 2507.57958984375, 2558.423828125, 2609.267822265625, 2660.11181640625, 2710.9560546875, 2761.800048828125, 2812.64404296875, 2863.488037109375, 2914.33203125, 2965.17626953125, 3016.020263671875, 3066.8642578125, 3117.70849609375, 3168.552490234375, 3219.396484375]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 3.0, 1.0, 2.0, 6.0, 5.0, 2.0, 11.0, 14.0, 17.0, 28.0, 13.0, 20.0, 28.0, 24.0, 32.0, 36.0, 38.0, 34.0, 37.0, 52.0, 34.0, 45.0, 48.0, 43.0, 43.0, 41.0, 44.0, 30.0, 42.0, 30.0, 28.0, 36.0, 22.0, 21.0, 20.0, 11.0, 13.0, 12.0, 8.0, 10.0, 5.0, 5.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-289.0094909667969, -279.8565673828125, -270.70361328125, -261.5506896972656, -252.39776611328125, -243.2448272705078, -234.09188842773438, -224.93896484375, -215.78602600097656, -206.63308715820312, -197.48016357421875, -188.3272247314453, -179.17428588867188, -170.0213623046875, -160.86842346191406, -151.71548461914062, -142.56256103515625, -133.4096221923828, -124.25669860839844, -115.103759765625, -105.9508285522461, -96.79789733886719, -87.64495849609375, -78.49202728271484, -69.33909606933594, -60.18616485595703, -51.03322982788086, -41.88029479980469, -32.72736358642578, -23.574432373046875, -14.421497344970703, -5.268562316894531, 3.884368896484375, 13.037302017211914, 22.190235137939453, 31.343168258666992, 40.49610137939453, 49.64903259277344, 58.80196762084961, 67.95490264892578, 77.10783386230469, 86.2607650756836, 95.4136962890625, 104.56663513183594, 113.71956634521484, 122.87249755859375, 132.0254364013672, 141.17837524414062, 150.331298828125, 159.48423767089844, 168.6371612548828, 177.79010009765625, 186.94302368164062, 196.09596252441406, 205.2489013671875, 214.40182495117188, 223.5547637939453, 232.70770263671875, 241.86062622070312, 251.01356506347656, 260.16650390625, 269.3194274902344, 278.47235107421875, 287.62530517578125, 296.7782287597656]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 4.0, 6.0, 10.0, 8.0, 11.0, 10.0, 14.0, 16.0, 21.0, 20.0, 33.0, 28.0, 20.0, 29.0, 33.0, 33.0, 45.0, 38.0, 44.0, 45.0, 41.0, 53.0, 59.0, 33.0, 27.0, 39.0, 44.0, 28.0, 37.0, 26.0, 26.0, 17.0, 16.0, 11.0, 10.0, 14.0, 10.0, 11.0, 8.0, 7.0, 6.0, 2.0, 4.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-35.53125, -34.4736328125, -33.416015625, -32.3583984375, -31.30078125, -30.2431640625, -29.185546875, -28.1279296875, -27.0703125, -26.0126953125, -24.955078125, -23.8974609375, -22.83984375, -21.7822265625, -20.724609375, -19.6669921875, -18.609375, -17.5517578125, -16.494140625, -15.4365234375, -14.37890625, -13.3212890625, -12.263671875, -11.2060546875, -10.1484375, -9.0908203125, -8.033203125, -6.9755859375, -5.91796875, -4.8603515625, -3.802734375, -2.7451171875, -1.6875, -0.6298828125, 0.427734375, 1.4853515625, 2.54296875, 3.6005859375, 4.658203125, 5.7158203125, 6.7734375, 7.8310546875, 8.888671875, 9.9462890625, 11.00390625, 12.0615234375, 13.119140625, 14.1767578125, 15.234375, 16.2919921875, 17.349609375, 18.4072265625, 19.46484375, 20.5224609375, 21.580078125, 22.6376953125, 23.6953125, 24.7529296875, 25.810546875, 26.8681640625, 27.92578125, 28.9833984375, 30.041015625, 31.0986328125, 32.15625]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 5.0, 4.0, 6.0, 8.0, 11.0, 16.0, 11.0, 19.0, 31.0, 27.0, 53.0, 87.0, 95.0, 166.0, 282.0, 504.0, 850.0, 1555.0, 3049.0, 6586.0, 15913.0, 323769.0, 3690491.0, 126693.0, 12672.0, 5446.0, 2606.0, 1411.0, 735.0, 427.0, 262.0, 160.0, 106.0, 65.0, 32.0, 27.0, 22.0, 21.0, 9.0, 17.0, 6.0, 12.0, 5.0, 5.0, 1.0, 4.0, 2.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-129.5, -125.501953125, -121.50390625, -117.505859375, -113.5078125, -109.509765625, -105.51171875, -101.513671875, -97.515625, -93.517578125, -89.51953125, -85.521484375, -81.5234375, -77.525390625, -73.52734375, -69.529296875, -65.53125, -61.533203125, -57.53515625, -53.537109375, -49.5390625, -45.541015625, -41.54296875, -37.544921875, -33.546875, -29.548828125, -25.55078125, -21.552734375, -17.5546875, -13.556640625, -9.55859375, -5.560546875, -1.5625, 2.435546875, 6.43359375, 10.431640625, 14.4296875, 18.427734375, 22.42578125, 26.423828125, 30.421875, 34.419921875, 38.41796875, 42.416015625, 46.4140625, 50.412109375, 54.41015625, 58.408203125, 62.40625, 66.404296875, 70.40234375, 74.400390625, 78.3984375, 82.396484375, 86.39453125, 90.392578125, 94.390625, 98.388671875, 102.38671875, 106.384765625, 110.3828125, 114.380859375, 118.37890625, 122.376953125, 126.375]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 3.0, 6.0, 3.0, 9.0, 4.0, 9.0, 15.0, 18.0, 27.0, 63.0, 149.0, 504.0, 1241.0, 1242.0, 427.0, 131.0, 59.0, 36.0, 20.0, 26.0, 21.0, 10.0, 15.0, 8.0, 11.0, 5.0, 1.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-120.0625, -116.0576171875, -112.052734375, -108.0478515625, -104.04296875, -100.0380859375, -96.033203125, -92.0283203125, -88.0234375, -84.0185546875, -80.013671875, -76.0087890625, -72.00390625, -67.9990234375, -63.994140625, -59.9892578125, -55.984375, -51.9794921875, -47.974609375, -43.9697265625, -39.96484375, -35.9599609375, -31.955078125, -27.9501953125, -23.9453125, -19.9404296875, -15.935546875, -11.9306640625, -7.92578125, -3.9208984375, 0.083984375, 4.0888671875, 8.09375, 12.0986328125, 16.103515625, 20.1083984375, 24.11328125, 28.1181640625, 32.123046875, 36.1279296875, 40.1328125, 44.1376953125, 48.142578125, 52.1474609375, 56.15234375, 60.1572265625, 64.162109375, 68.1669921875, 72.171875, 76.1767578125, 80.181640625, 84.1865234375, 88.19140625, 92.1962890625, 96.201171875, 100.2060546875, 104.2109375, 108.2158203125, 112.220703125, 116.2255859375, 120.23046875, 124.2353515625, 128.240234375, 132.2451171875, 136.25]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 5.0, 4.0, 3.0, 5.0, 13.0, 20.0, 29.0, 42.0, 96.0, 170.0, 320.0, 745.0, 1798.0, 4836.0, 15441.0, 80991.0, 3948966.0, 113932.0, 17921.0, 5494.0, 1970.0, 774.0, 359.0, 158.0, 93.0, 43.0, 18.0, 16.0, 9.0, 7.0, 7.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-286.0, -277.4765625, -268.953125, -260.4296875, -251.90625, -243.3828125, -234.859375, -226.3359375, -217.8125, -209.2890625, -200.765625, -192.2421875, -183.71875, -175.1953125, -166.671875, -158.1484375, -149.625, -141.1015625, -132.578125, -124.0546875, -115.53125, -107.0078125, -98.484375, -89.9609375, -81.4375, -72.9140625, -64.390625, -55.8671875, -47.34375, -38.8203125, -30.296875, -21.7734375, -13.25, -4.7265625, 3.796875, 12.3203125, 20.84375, 29.3671875, 37.890625, 46.4140625, 54.9375, 63.4609375, 71.984375, 80.5078125, 89.03125, 97.5546875, 106.078125, 114.6015625, 123.125, 131.6484375, 140.171875, 148.6953125, 157.21875, 165.7421875, 174.265625, 182.7890625, 191.3125, 199.8359375, 208.359375, 216.8828125, 225.40625, 233.9296875, 242.453125, 250.9765625, 259.5]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 5.0, 5.0, 3.0, 26.0, 23.0, 25.0, 48.0, 89.0, 154.0, 242.0, 153.0, 66.0, 63.0, 34.0, 23.0, 11.0, 17.0, 4.0, 11.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-526.2769165039062, -507.6903991699219, -489.1039123535156, -470.51739501953125, -451.930908203125, -433.3443908691406, -414.75787353515625, -396.17138671875, -377.5848693847656, -358.99835205078125, -340.411865234375, -321.8253479003906, -303.23883056640625, -284.65234375, -266.0658264160156, -247.4793243408203, -228.892822265625, -210.3063201904297, -191.71981811523438, -173.13330078125, -154.5467987060547, -135.96029663085938, -117.37378692626953, -98.78727722167969, -80.20077514648438, -61.6142692565918, -43.02776336669922, -24.44125747680664, -5.8547515869140625, 12.73175048828125, 31.318260192871094, 49.90476989746094, 68.4913330078125, 87.07783508300781, 105.66434478759766, 124.2508544921875, 142.8373565673828, 161.42385864257812, 180.0103759765625, 198.5968780517578, 217.18338012695312, 235.76988220214844, 254.35638427734375, 272.9429016113281, 291.5294189453125, 310.11590576171875, 328.7024230957031, 347.2889404296875, 365.87542724609375, 384.4619445800781, 403.0484313964844, 421.63494873046875, 440.221435546875, 458.8079528808594, 477.39447021484375, 495.98095703125, 514.5675048828125, 533.1539916992188, 551.7405395507812, 570.3270263671875, 588.9135131835938, 607.5, 626.0865478515625, 644.6730346679688, 663.259521484375]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 6.0, 1.0, 3.0, 6.0, 8.0, 15.0, 9.0, 7.0, 15.0, 15.0, 27.0, 24.0, 28.0, 29.0, 34.0, 39.0, 49.0, 39.0, 47.0, 51.0, 47.0, 55.0, 45.0, 48.0, 48.0, 35.0, 41.0, 33.0, 37.0, 29.0, 23.0, 26.0, 18.0, 16.0, 15.0, 7.0, 9.0, 7.0, 6.0, 5.0, 3.0, 1.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-267.3556213378906, -258.1657409667969, -248.97589111328125, -239.7860107421875, -230.5961456298828, -221.40628051757812, -212.21641540527344, -203.02655029296875, -193.836669921875, -184.6468048095703, -175.45693969726562, -166.26705932617188, -157.0771942138672, -147.8873291015625, -138.6974639892578, -129.50759887695312, -120.31773376464844, -111.12786865234375, -101.93799591064453, -92.74813079833984, -83.55825805664062, -74.36839294433594, -65.17852783203125, -55.98865509033203, -46.798789978027344, -37.60892105102539, -28.41905403137207, -19.22918701171875, -10.039318084716797, -0.8494491577148438, 8.340415954589844, 17.530288696289062, 26.72015380859375, 35.9100227355957, 45.099891662597656, 54.289756774902344, 63.4796257019043, 72.66949462890625, 81.85935974121094, 91.04923248291016, 100.23909759521484, 109.42896270751953, 118.61883544921875, 127.80870056152344, 136.99856567382812, 146.18844604492188, 155.3782958984375, 164.56817626953125, 173.75804138183594, 182.94790649414062, 192.1377716064453, 201.32763671875, 210.51751708984375, 219.70738220214844, 228.89724731445312, 238.08712768554688, 247.2769775390625, 256.46685791015625, 265.6567077636719, 274.8465881347656, 284.03643798828125, 293.226318359375, 302.41619873046875, 311.6060485839844, 320.7959289550781]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 7.0, 6.0, 6.0, 6.0, 6.0, 5.0, 15.0, 12.0, 24.0, 22.0, 19.0, 32.0, 39.0, 27.0, 28.0, 28.0, 39.0, 41.0, 50.0, 55.0, 35.0, 49.0, 51.0, 45.0, 48.0, 50.0, 38.0, 29.0, 30.0, 29.0, 28.0, 24.0, 20.0, 11.0, 11.0, 12.0, 9.0, 4.0, 9.0, 5.0, 2.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.5, -39.2998046875, -38.099609375, -36.8994140625, -35.69921875, -34.4990234375, -33.298828125, -32.0986328125, -30.8984375, -29.6982421875, -28.498046875, -27.2978515625, -26.09765625, -24.8974609375, -23.697265625, -22.4970703125, -21.296875, -20.0966796875, -18.896484375, -17.6962890625, -16.49609375, -15.2958984375, -14.095703125, -12.8955078125, -11.6953125, -10.4951171875, -9.294921875, -8.0947265625, -6.89453125, -5.6943359375, -4.494140625, -3.2939453125, -2.09375, -0.8935546875, 0.306640625, 1.5068359375, 2.70703125, 3.9072265625, 5.107421875, 6.3076171875, 7.5078125, 8.7080078125, 9.908203125, 11.1083984375, 12.30859375, 13.5087890625, 14.708984375, 15.9091796875, 17.109375, 18.3095703125, 19.509765625, 20.7099609375, 21.91015625, 23.1103515625, 24.310546875, 25.5107421875, 26.7109375, 27.9111328125, 29.111328125, 30.3115234375, 31.51171875, 32.7119140625, 33.912109375, 35.1123046875, 36.3125]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 11.0, 7.0, 11.0, 15.0, 34.0, 42.0, 55.0, 108.0, 162.0, 223.0, 329.0, 491.0, 750.0, 1096.0, 1769.0, 2492.0, 3895.0, 6036.0, 9192.0, 14599.0, 22901.0, 36243.0, 61083.0, 112519.0, 233094.0, 249141.0, 122071.0, 64665.0, 38417.0, 23810.0, 15137.0, 9812.0, 6207.0, 4144.0, 2778.0, 1724.0, 1175.0, 749.0, 488.0, 385.0, 207.0, 151.0, 101.0, 76.0, 52.0, 32.0, 25.0, 12.0, 14.0, 10.0, 4.0, 5.0, 2.0, 4.0, 2.0, 2.0], "bins": [-1.806640625, -1.751983642578125, -1.69732666015625, -1.642669677734375, -1.5880126953125, -1.533355712890625, -1.47869873046875, -1.424041748046875, -1.369384765625, -1.314727783203125, -1.26007080078125, -1.205413818359375, -1.1507568359375, -1.096099853515625, -1.04144287109375, -0.986785888671875, -0.93212890625, -0.877471923828125, -0.82281494140625, -0.768157958984375, -0.7135009765625, -0.658843994140625, -0.60418701171875, -0.549530029296875, -0.494873046875, -0.440216064453125, -0.38555908203125, -0.330902099609375, -0.2762451171875, -0.221588134765625, -0.16693115234375, -0.112274169921875, -0.0576171875, -0.002960205078125, 0.05169677734375, 0.106353759765625, 0.1610107421875, 0.215667724609375, 0.27032470703125, 0.324981689453125, 0.379638671875, 0.434295654296875, 0.48895263671875, 0.543609619140625, 0.5982666015625, 0.652923583984375, 0.70758056640625, 0.762237548828125, 0.81689453125, 0.871551513671875, 0.92620849609375, 0.980865478515625, 1.0355224609375, 1.090179443359375, 1.14483642578125, 1.199493408203125, 1.254150390625, 1.308807373046875, 1.36346435546875, 1.418121337890625, 1.4727783203125, 1.527435302734375, 1.58209228515625, 1.636749267578125, 1.69140625]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 5.0, 5.0, 7.0, 9.0, 19.0, 12.0, 10.0, 17.0, 13.0, 19.0, 19.0, 23.0, 29.0, 30.0, 36.0, 40.0, 45.0, 36.0, 35.0, 42.0, 42.0, 1065.0, 51.0, 28.0, 38.0, 40.0, 45.0, 41.0, 28.0, 27.0, 19.0, 24.0, 24.0, 18.0, 15.0, 14.0, 7.0, 10.0, 9.0, 6.0, 7.0, 5.0, 9.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-22.953125, -22.239501953125, -21.52587890625, -20.812255859375, -20.0986328125, -19.385009765625, -18.67138671875, -17.957763671875, -17.244140625, -16.530517578125, -15.81689453125, -15.103271484375, -14.3896484375, -13.676025390625, -12.96240234375, -12.248779296875, -11.53515625, -10.821533203125, -10.10791015625, -9.394287109375, -8.6806640625, -7.967041015625, -7.25341796875, -6.539794921875, -5.826171875, -5.112548828125, -4.39892578125, -3.685302734375, -2.9716796875, -2.258056640625, -1.54443359375, -0.830810546875, -0.1171875, 0.596435546875, 1.31005859375, 2.023681640625, 2.7373046875, 3.450927734375, 4.16455078125, 4.878173828125, 5.591796875, 6.305419921875, 7.01904296875, 7.732666015625, 8.4462890625, 9.159912109375, 9.87353515625, 10.587158203125, 11.30078125, 12.014404296875, 12.72802734375, 13.441650390625, 14.1552734375, 14.868896484375, 15.58251953125, 16.296142578125, 17.009765625, 17.723388671875, 18.43701171875, 19.150634765625, 19.8642578125, 20.577880859375, 21.29150390625, 22.005126953125, 22.71875]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 7.0, 5.0, 15.0, 9.0, 18.0, 17.0, 40.0, 53.0, 83.0, 115.0, 163.0, 273.0, 414.0, 602.0, 866.0, 1388.0, 2226.0, 3448.0, 5536.0, 8795.0, 14297.0, 24064.0, 42479.0, 78699.0, 169873.0, 1368688.0, 182401.0, 83465.0, 44085.0, 25066.0, 14966.0, 9129.0, 5701.0, 3652.0, 2296.0, 1446.0, 950.0, 612.0, 394.0, 262.0, 177.0, 127.0, 70.0, 50.0, 40.0, 25.0, 19.0, 14.0, 9.0, 5.0, 6.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0], "bins": [-1.9189453125, -1.8599700927734375, -1.800994873046875, -1.7420196533203125, -1.68304443359375, -1.6240692138671875, -1.565093994140625, -1.5061187744140625, -1.4471435546875, -1.3881683349609375, -1.329193115234375, -1.2702178955078125, -1.21124267578125, -1.1522674560546875, -1.093292236328125, -1.0343170166015625, -0.975341796875, -0.9163665771484375, -0.857391357421875, -0.7984161376953125, -0.73944091796875, -0.6804656982421875, -0.621490478515625, -0.5625152587890625, -0.5035400390625, -0.4445648193359375, -0.385589599609375, -0.3266143798828125, -0.26763916015625, -0.2086639404296875, -0.149688720703125, -0.0907135009765625, -0.03173828125, 0.0272369384765625, 0.086212158203125, 0.1451873779296875, 0.20416259765625, 0.2631378173828125, 0.322113037109375, 0.3810882568359375, 0.4400634765625, 0.4990386962890625, 0.558013916015625, 0.6169891357421875, 0.67596435546875, 0.7349395751953125, 0.793914794921875, 0.8528900146484375, 0.911865234375, 0.9708404541015625, 1.029815673828125, 1.0887908935546875, 1.14776611328125, 1.2067413330078125, 1.265716552734375, 1.3246917724609375, 1.3836669921875, 1.4426422119140625, 1.501617431640625, 1.5605926513671875, 1.61956787109375, 1.6785430908203125, 1.737518310546875, 1.7964935302734375, 1.85546875]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 5.0, 2.0, 2.0, 5.0, 6.0, 8.0, 9.0, 13.0, 16.0, 20.0, 23.0, 25.0, 34.0, 49.0, 64.0, 69.0, 78.0, 79.0, 82.0, 71.0, 62.0, 53.0, 42.0, 33.0, 24.0, 19.0, 18.0, 19.0, 16.0, 13.0, 9.0, 4.0, 14.0, 5.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0274658203125, -0.02664923667907715, -0.025832653045654297, -0.025016069412231445, -0.024199485778808594, -0.023382902145385742, -0.02256631851196289, -0.02174973487854004, -0.020933151245117188, -0.020116567611694336, -0.019299983978271484, -0.018483400344848633, -0.01766681671142578, -0.01685023307800293, -0.016033649444580078, -0.015217065811157227, -0.014400482177734375, -0.013583898544311523, -0.012767314910888672, -0.01195073127746582, -0.011134147644042969, -0.010317564010620117, -0.009500980377197266, -0.008684396743774414, -0.007867813110351562, -0.007051229476928711, -0.006234645843505859, -0.005418062210083008, -0.004601478576660156, -0.0037848949432373047, -0.002968311309814453, -0.0021517276763916016, -0.00133514404296875, -0.0005185604095458984, 0.0002980232238769531, 0.0011146068572998047, 0.0019311904907226562, 0.002747774124145508, 0.0035643577575683594, 0.004380941390991211, 0.0051975250244140625, 0.006014108657836914, 0.006830692291259766, 0.007647275924682617, 0.008463859558105469, 0.00928044319152832, 0.010097026824951172, 0.010913610458374023, 0.011730194091796875, 0.012546777725219727, 0.013363361358642578, 0.01417994499206543, 0.014996528625488281, 0.015813112258911133, 0.016629695892333984, 0.017446279525756836, 0.018262863159179688, 0.01907944679260254, 0.01989603042602539, 0.020712614059448242, 0.021529197692871094, 0.022345781326293945, 0.023162364959716797, 0.02397894859313965, 0.0247955322265625]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 5.0, 8.0, 12.0, 5.0, 9.0, 17.0, 19.0, 37.0, 39.0, 54.0, 51.0, 77.0, 108.0, 178.0, 481.0, 2820.0, 45435.0, 952243.0, 43156.0, 2723.0, 467.0, 203.0, 116.0, 73.0, 62.0, 39.0, 28.0, 20.0, 16.0, 11.0, 10.0, 7.0, 7.0, 3.0, 5.0, 4.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.382568359375, -0.3700218200683594, -0.35747528076171875, -0.3449287414550781, -0.3323822021484375, -0.3198356628417969, -0.30728912353515625, -0.2947425842285156, -0.282196044921875, -0.2696495056152344, -0.25710296630859375, -0.24455642700195312, -0.2320098876953125, -0.21946334838867188, -0.20691680908203125, -0.19437026977539062, -0.18182373046875, -0.16927719116210938, -0.15673065185546875, -0.14418411254882812, -0.1316375732421875, -0.11909103393554688, -0.10654449462890625, -0.09399795532226562, -0.081451416015625, -0.06890487670898438, -0.05635833740234375, -0.043811798095703125, -0.0312652587890625, -0.018718719482421875, -0.00617218017578125, 0.006374359130859375, 0.0189208984375, 0.031467437744140625, 0.04401397705078125, 0.056560516357421875, 0.0691070556640625, 0.08165359497070312, 0.09420013427734375, 0.10674667358398438, 0.119293212890625, 0.13183975219726562, 0.14438629150390625, 0.15693283081054688, 0.1694793701171875, 0.18202590942382812, 0.19457244873046875, 0.20711898803710938, 0.21966552734375, 0.23221206665039062, 0.24475860595703125, 0.2573051452636719, 0.2698516845703125, 0.2823982238769531, 0.29494476318359375, 0.3074913024902344, 0.320037841796875, 0.3325843811035156, 0.34513092041015625, 0.3576774597167969, 0.3702239990234375, 0.3827705383300781, 0.39531707763671875, 0.4078636169433594, 0.42041015625]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 8.0, 46.0, 239.0, 616.0, 87.0, 13.0, 6.0], "bins": [-0.20605339109897614, -0.20263195037841797, -0.1992105096578598, -0.19578906893730164, -0.19236762821674347, -0.1889461874961853, -0.18552473187446594, -0.18210329115390778, -0.1786818504333496, -0.17526040971279144, -0.17183896899223328, -0.1684175282716751, -0.16499608755111694, -0.16157463192939758, -0.15815319120883942, -0.15473175048828125, -0.15131030976772308, -0.14788886904716492, -0.14446742832660675, -0.14104598760604858, -0.13762454688549042, -0.13420310616493225, -0.1307816505432129, -0.12736020982265472, -0.12393877655267715, -0.12051733583211899, -0.11709589511156082, -0.11367444694042206, -0.11025300621986389, -0.10683156549930573, -0.10341012477874756, -0.09998868405818939, -0.09656722843647003, -0.09314578771591187, -0.0897243469953537, -0.08630289882421494, -0.08288145810365677, -0.0794600173830986, -0.07603857666254044, -0.07261712849140167, -0.0691956952214241, -0.06577425450086594, -0.06235281005501747, -0.058931369334459305, -0.05550992488861084, -0.05208848416805267, -0.04866704344749451, -0.04524559900164604, -0.04182415455579758, -0.03840271383523941, -0.034981269389390945, -0.03155982866883278, -0.028138384222984314, -0.024716943502426147, -0.02129550091922283, -0.017874058336019516, -0.0144526157528162, -0.011031173169612885, -0.007609731052070856, -0.004188288934528828, -0.0007668463513255119, 0.002654595300555229, 0.006076037883758545, 0.00949748046696186, 0.012918923050165176]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 4.0, 4.0, 8.0, 9.0, 10.0, 14.0, 13.0, 18.0, 20.0, 25.0, 20.0, 23.0, 26.0, 29.0, 34.0, 36.0, 47.0, 46.0, 54.0, 38.0, 54.0, 48.0, 31.0, 35.0, 37.0, 31.0, 39.0, 38.0, 27.0, 36.0, 26.0, 24.0, 25.0, 18.0, 11.0, 16.0, 12.0, 6.0, 5.0, 4.0, 0.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.014981687068939209, -0.014536437578499317, -0.014091188088059425, -0.013645938597619534, -0.013200689107179642, -0.01275543961673975, -0.012310190126299858, -0.011864940635859966, -0.011419691145420074, -0.010974441654980183, -0.01052919216454029, -0.010083942674100399, -0.009638693183660507, -0.009193443693220615, -0.008748194202780724, -0.008302944712340832, -0.00785769522190094, -0.007412445731461048, -0.006967196241021156, -0.0065219467505812645, -0.006076697260141373, -0.005631447769701481, -0.005186198279261589, -0.004740948788821697, -0.004295699298381805, -0.0038504498079419136, -0.003405200317502022, -0.00295995082706213, -0.002514701336622238, -0.0020694518461823463, -0.0016242023557424545, -0.0011789528653025627, -0.0007337033748626709, -0.0002884538844227791, 0.00015679560601711273, 0.0006020450964570045, 0.0010472945868968964, 0.0014925440773367882, 0.00193779356777668, 0.002383043058216572, 0.0028282925486564636, 0.0032735420390963554, 0.0037187915295362473, 0.004164041019976139, 0.004609290510416031, 0.005054540000855923, 0.0054997894912958145, 0.005945038981735706, 0.006390288472175598, 0.00683553796261549, 0.007280787453055382, 0.007726036943495274, 0.008171286433935165, 0.008616535924375057, 0.009061785414814949, 0.00950703490525484, 0.009952284395694733, 0.010397533886134624, 0.010842783376574516, 0.011288032867014408, 0.0117332823574543, 0.012178531847894192, 0.012623781338334084, 0.013069030828773975, 0.013514280319213867]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 7.0, 6.0, 6.0, 6.0, 6.0, 5.0, 15.0, 12.0, 24.0, 22.0, 19.0, 32.0, 39.0, 27.0, 28.0, 28.0, 39.0, 41.0, 50.0, 55.0, 35.0, 49.0, 51.0, 45.0, 48.0, 50.0, 38.0, 29.0, 30.0, 29.0, 28.0, 24.0, 20.0, 11.0, 11.0, 12.0, 9.0, 4.0, 9.0, 5.0, 2.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.5, -39.2998046875, -38.099609375, -36.8994140625, -35.69921875, -34.4990234375, -33.298828125, -32.0986328125, -30.8984375, -29.6982421875, -28.498046875, -27.2978515625, -26.09765625, -24.8974609375, -23.697265625, -22.4970703125, -21.296875, -20.0966796875, -18.896484375, -17.6962890625, -16.49609375, -15.2958984375, -14.095703125, -12.8955078125, -11.6953125, -10.4951171875, -9.294921875, -8.0947265625, -6.89453125, -5.6943359375, -4.494140625, -3.2939453125, -2.09375, -0.8935546875, 0.306640625, 1.5068359375, 2.70703125, 3.9072265625, 5.107421875, 6.3076171875, 7.5078125, 8.7080078125, 9.908203125, 11.1083984375, 12.30859375, 13.5087890625, 14.708984375, 15.9091796875, 17.109375, 18.3095703125, 19.509765625, 20.7099609375, 21.91015625, 23.1103515625, 24.310546875, 25.5107421875, 26.7109375, 27.9111328125, 29.111328125, 30.3115234375, 31.51171875, 32.7119140625, 33.912109375, 35.1123046875, 36.3125]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 3.0, 6.0, 7.0, 9.0, 12.0, 10.0, 23.0, 35.0, 45.0, 63.0, 106.0, 119.0, 192.0, 235.0, 413.0, 573.0, 778.0, 1129.0, 1648.0, 2573.0, 4523.0, 10602.0, 96319.0, 859261.0, 50058.0, 8480.0, 3936.0, 2405.0, 1548.0, 1062.0, 725.0, 494.0, 333.0, 244.0, 186.0, 107.0, 92.0, 66.0, 39.0, 24.0, 24.0, 24.0, 13.0, 6.0, 5.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-55.375, -53.76513671875, -52.1552734375, -50.54541015625, -48.935546875, -47.32568359375, -45.7158203125, -44.10595703125, -42.49609375, -40.88623046875, -39.2763671875, -37.66650390625, -36.056640625, -34.44677734375, -32.8369140625, -31.22705078125, -29.6171875, -28.00732421875, -26.3974609375, -24.78759765625, -23.177734375, -21.56787109375, -19.9580078125, -18.34814453125, -16.73828125, -15.12841796875, -13.5185546875, -11.90869140625, -10.298828125, -8.68896484375, -7.0791015625, -5.46923828125, -3.859375, -2.24951171875, -0.6396484375, 0.97021484375, 2.580078125, 4.18994140625, 5.7998046875, 7.40966796875, 9.01953125, 10.62939453125, 12.2392578125, 13.84912109375, 15.458984375, 17.06884765625, 18.6787109375, 20.28857421875, 21.8984375, 23.50830078125, 25.1181640625, 26.72802734375, 28.337890625, 29.94775390625, 31.5576171875, 33.16748046875, 34.77734375, 36.38720703125, 37.9970703125, 39.60693359375, 41.216796875, 42.82666015625, 44.4365234375, 46.04638671875, 47.65625]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 7.0, 8.0, 7.0, 16.0, 10.0, 15.0, 19.0, 21.0, 30.0, 26.0, 32.0, 34.0, 48.0, 40.0, 41.0, 33.0, 51.0, 61.0, 171.0, 1823.0, 114.0, 54.0, 44.0, 36.0, 39.0, 29.0, 38.0, 33.0, 16.0, 27.0, 18.0, 14.0, 12.0, 11.0, 16.0, 9.0, 12.0, 11.0, 8.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-104.9375, -101.4912109375, -98.044921875, -94.5986328125, -91.15234375, -87.7060546875, -84.259765625, -80.8134765625, -77.3671875, -73.9208984375, -70.474609375, -67.0283203125, -63.58203125, -60.1357421875, -56.689453125, -53.2431640625, -49.796875, -46.3505859375, -42.904296875, -39.4580078125, -36.01171875, -32.5654296875, -29.119140625, -25.6728515625, -22.2265625, -18.7802734375, -15.333984375, -11.8876953125, -8.44140625, -4.9951171875, -1.548828125, 1.8974609375, 5.34375, 8.7900390625, 12.236328125, 15.6826171875, 19.12890625, 22.5751953125, 26.021484375, 29.4677734375, 32.9140625, 36.3603515625, 39.806640625, 43.2529296875, 46.69921875, 50.1455078125, 53.591796875, 57.0380859375, 60.484375, 63.9306640625, 67.376953125, 70.8232421875, 74.26953125, 77.7158203125, 81.162109375, 84.6083984375, 88.0546875, 91.5009765625, 94.947265625, 98.3935546875, 101.83984375, 105.2861328125, 108.732421875, 112.1787109375, 115.625]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 2.0, 3.0, 6.0, 8.0, 12.0, 28.0, 52.0, 73.0, 276.0, 1141.0, 11141.0, 3123284.0, 8209.0, 1016.0, 251.0, 88.0, 49.0, 21.0, 17.0, 7.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-542.5, -522.734375, -502.96875, -483.203125, -463.4375, -443.671875, -423.90625, -404.140625, -384.375, -364.609375, -344.84375, -325.078125, -305.3125, -285.546875, -265.78125, -246.015625, -226.25, -206.484375, -186.71875, -166.953125, -147.1875, -127.421875, -107.65625, -87.890625, -68.125, -48.359375, -28.59375, -8.828125, 10.9375, 30.703125, 50.46875, 70.234375, 90.0, 109.765625, 129.53125, 149.296875, 169.0625, 188.828125, 208.59375, 228.359375, 248.125, 267.890625, 287.65625, 307.421875, 327.1875, 346.953125, 366.71875, 386.484375, 406.25, 426.015625, 445.78125, 465.546875, 485.3125, 505.078125, 524.84375, 544.609375, 564.375, 584.140625, 603.90625, 623.671875, 643.4375, 663.203125, 682.96875, 702.734375, 722.5]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 20.0, 877.0, 123.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-417.8130187988281, -363.2269592285156, -308.64093017578125, -254.05487060546875, -199.4688262939453, -144.88278198242188, -90.29672241210938, -35.710693359375, 18.8753662109375, 73.46141052246094, 128.04745483398438, 182.63351440429688, 237.2195587158203, 291.80560302734375, 346.39166259765625, 400.9776916503906, 455.5637512207031, 510.1498107910156, 564.73583984375, 619.3218994140625, 673.907958984375, 728.4940185546875, 783.080078125, 837.6660766601562, 892.2521362304688, 946.8381958007812, 1001.4242553710938, 1056.01025390625, 1110.5963134765625, 1165.182373046875, 1219.7684326171875, 1274.3544921875, 1328.9405517578125, 1383.526611328125, 1438.1126708984375, 1492.69873046875, 1547.2847900390625, 1601.870849609375, 1656.456787109375, 1711.0428466796875, 1765.62890625, 1820.2149658203125, 1874.801025390625, 1929.3870849609375, 1983.97314453125, 2038.55908203125, 2093.145263671875, 2147.731201171875, 2202.3173828125, 2256.9033203125, 2311.489501953125, 2366.075439453125, 2420.66162109375, 2475.24755859375, 2529.833740234375, 2584.419677734375, 2639.005615234375, 2693.591552734375, 2748.177734375, 2802.763671875, 2857.349853515625, 2911.935791015625, 2966.52197265625, 3021.10791015625, 3075.694091796875]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 5.0, 5.0, 6.0, 5.0, 14.0, 9.0, 12.0, 18.0, 18.0, 18.0, 21.0, 14.0, 27.0, 19.0, 31.0, 31.0, 28.0, 29.0, 39.0, 34.0, 41.0, 43.0, 49.0, 37.0, 37.0, 52.0, 44.0, 43.0, 35.0, 31.0, 24.0, 24.0, 22.0, 15.0, 21.0, 20.0, 14.0, 9.0, 15.0, 7.0, 12.0, 8.0, 9.0, 9.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0], "bins": [-350.0292663574219, -340.3514099121094, -330.67352294921875, -320.99566650390625, -311.31781005859375, -301.6399230957031, -291.9620666503906, -282.2841796875, -272.6063232421875, -262.928466796875, -253.25057983398438, -243.57272338867188, -233.8948516845703, -224.21697998046875, -214.53912353515625, -204.8612518310547, -195.18338012695312, -185.50550842285156, -175.82763671875, -166.1497802734375, -156.47190856933594, -146.79403686523438, -137.11618041992188, -127.43830871582031, -117.76043701171875, -108.08256530761719, -98.40470123291016, -88.72683715820312, -79.04896545410156, -69.37109375, -59.69322967529297, -50.01536560058594, -40.33746337890625, -30.659595489501953, -20.981727600097656, -11.30385971069336, -1.6259918212890625, 8.051876068115234, 17.72974395751953, 27.407608032226562, 37.085479736328125, 46.76334762573242, 56.44121551513672, 66.11907958984375, 75.79695129394531, 85.47482299804688, 95.1526870727539, 104.83055114746094, 114.5084228515625, 124.18629455566406, 133.86416625976562, 143.54202270507812, 153.2198944091797, 162.89776611328125, 172.57562255859375, 182.2534942626953, 191.93136596679688, 201.60923767089844, 211.287109375, 220.9649658203125, 230.64283752441406, 240.32070922851562, 249.99856567382812, 259.67645263671875, 269.35430908203125]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 7.0, 2.0, 3.0, 11.0, 6.0, 11.0, 14.0, 20.0, 19.0, 24.0, 18.0, 33.0, 35.0, 23.0, 32.0, 29.0, 44.0, 41.0, 48.0, 52.0, 51.0, 38.0, 49.0, 51.0, 43.0, 48.0, 32.0, 38.0, 29.0, 27.0, 17.0, 28.0, 18.0, 11.0, 11.0, 10.0, 10.0, 7.0, 5.0, 4.0, 1.0, 7.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.3125, -40.07666015625, -38.8408203125, -37.60498046875, -36.369140625, -35.13330078125, -33.8974609375, -32.66162109375, -31.42578125, -30.18994140625, -28.9541015625, -27.71826171875, -26.482421875, -25.24658203125, -24.0107421875, -22.77490234375, -21.5390625, -20.30322265625, -19.0673828125, -17.83154296875, -16.595703125, -15.35986328125, -14.1240234375, -12.88818359375, -11.65234375, -10.41650390625, -9.1806640625, -7.94482421875, -6.708984375, -5.47314453125, -4.2373046875, -3.00146484375, -1.765625, -0.52978515625, 0.7060546875, 1.94189453125, 3.177734375, 4.41357421875, 5.6494140625, 6.88525390625, 8.12109375, 9.35693359375, 10.5927734375, 11.82861328125, 13.064453125, 14.30029296875, 15.5361328125, 16.77197265625, 18.0078125, 19.24365234375, 20.4794921875, 21.71533203125, 22.951171875, 24.18701171875, 25.4228515625, 26.65869140625, 27.89453125, 29.13037109375, 30.3662109375, 31.60205078125, 32.837890625, 34.07373046875, 35.3095703125, 36.54541015625, 37.78125]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 6.0, 7.0, 8.0, 16.0, 14.0, 20.0, 29.0, 33.0, 54.0, 86.0, 97.0, 168.0, 211.0, 292.0, 432.0, 694.0, 1043.0, 1636.0, 2586.0, 4173.0, 7133.0, 14357.0, 91166.0, 1513143.0, 2366608.0, 150959.0, 19254.0, 7899.0, 4458.0, 2733.0, 1743.0, 1069.0, 720.0, 453.0, 301.0, 203.0, 144.0, 92.0, 81.0, 42.0, 44.0, 14.0, 21.0, 13.0, 4.0, 11.0, 4.0, 4.0, 2.0, 4.0, 0.0, 4.0], "bins": [-95.1875, -92.5498046875, -89.912109375, -87.2744140625, -84.63671875, -81.9990234375, -79.361328125, -76.7236328125, -74.0859375, -71.4482421875, -68.810546875, -66.1728515625, -63.53515625, -60.8974609375, -58.259765625, -55.6220703125, -52.984375, -50.3466796875, -47.708984375, -45.0712890625, -42.43359375, -39.7958984375, -37.158203125, -34.5205078125, -31.8828125, -29.2451171875, -26.607421875, -23.9697265625, -21.33203125, -18.6943359375, -16.056640625, -13.4189453125, -10.78125, -8.1435546875, -5.505859375, -2.8681640625, -0.23046875, 2.4072265625, 5.044921875, 7.6826171875, 10.3203125, 12.9580078125, 15.595703125, 18.2333984375, 20.87109375, 23.5087890625, 26.146484375, 28.7841796875, 31.421875, 34.0595703125, 36.697265625, 39.3349609375, 41.97265625, 44.6103515625, 47.248046875, 49.8857421875, 52.5234375, 55.1611328125, 57.798828125, 60.4365234375, 63.07421875, 65.7119140625, 68.349609375, 70.9873046875, 73.625]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 5.0, 4.0, 6.0, 11.0, 12.0, 7.0, 19.0, 15.0, 24.0, 55.0, 70.0, 155.0, 380.0, 951.0, 1246.0, 589.0, 221.0, 108.0, 50.0, 34.0, 21.0, 23.0, 16.0, 4.0, 12.0, 10.0, 6.0, 5.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-120.625, -116.884765625, -113.14453125, -109.404296875, -105.6640625, -101.923828125, -98.18359375, -94.443359375, -90.703125, -86.962890625, -83.22265625, -79.482421875, -75.7421875, -72.001953125, -68.26171875, -64.521484375, -60.78125, -57.041015625, -53.30078125, -49.560546875, -45.8203125, -42.080078125, -38.33984375, -34.599609375, -30.859375, -27.119140625, -23.37890625, -19.638671875, -15.8984375, -12.158203125, -8.41796875, -4.677734375, -0.9375, 2.802734375, 6.54296875, 10.283203125, 14.0234375, 17.763671875, 21.50390625, 25.244140625, 28.984375, 32.724609375, 36.46484375, 40.205078125, 43.9453125, 47.685546875, 51.42578125, 55.166015625, 58.90625, 62.646484375, 66.38671875, 70.126953125, 73.8671875, 77.607421875, 81.34765625, 85.087890625, 88.828125, 92.568359375, 96.30859375, 100.048828125, 103.7890625, 107.529296875, 111.26953125, 115.009765625, 118.75]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 11.0, 12.0, 18.0, 38.0, 39.0, 60.0, 111.0, 157.0, 241.0, 329.0, 584.0, 961.0, 1704.0, 3098.0, 5944.0, 12259.0, 31327.0, 136399.0, 3565833.0, 357119.0, 45715.0, 16172.0, 7416.0, 3700.0, 1996.0, 1103.0, 686.0, 438.0, 255.0, 183.0, 116.0, 95.0, 48.0, 33.0, 26.0, 21.0, 13.0, 10.0, 4.0, 3.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-160.25, -155.34375, -150.4375, -145.53125, -140.625, -135.71875, -130.8125, -125.90625, -121.0, -116.09375, -111.1875, -106.28125, -101.375, -96.46875, -91.5625, -86.65625, -81.75, -76.84375, -71.9375, -67.03125, -62.125, -57.21875, -52.3125, -47.40625, -42.5, -37.59375, -32.6875, -27.78125, -22.875, -17.96875, -13.0625, -8.15625, -3.25, 1.65625, 6.5625, 11.46875, 16.375, 21.28125, 26.1875, 31.09375, 36.0, 40.90625, 45.8125, 50.71875, 55.625, 60.53125, 65.4375, 70.34375, 75.25, 80.15625, 85.0625, 89.96875, 94.875, 99.78125, 104.6875, 109.59375, 114.5, 119.40625, 124.3125, 129.21875, 134.125, 139.03125, 143.9375, 148.84375, 153.75]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 7.0, 14.0, 25.0, 48.0, 84.0, 169.0, 268.0, 190.0, 79.0, 47.0, 41.0, 15.0, 11.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-299.8214111328125, -276.0696716308594, -252.31793212890625, -228.56619262695312, -204.814453125, -181.06271362304688, -157.3109588623047, -133.55921936035156, -109.80747985839844, -86.05574035644531, -62.30399703979492, -38.55225372314453, -14.800514221191406, 8.951225280761719, 32.702972412109375, 56.4547119140625, 80.20645141601562, 103.95819091796875, 127.70993041992188, 151.461669921875, 175.21340942382812, 198.96514892578125, 222.71690368652344, 246.46864318847656, 270.22039794921875, 293.9721374511719, 317.723876953125, 341.4756164550781, 365.22735595703125, 388.9790954589844, 412.7308349609375, 436.48260498046875, 460.23431396484375, 483.9860534667969, 507.73779296875, 531.4895629882812, 555.2412719726562, 578.9930419921875, 602.7447509765625, 626.4965209960938, 650.2482299804688, 674.0, 697.751708984375, 721.5034790039062, 745.2551879882812, 769.0069580078125, 792.7586669921875, 816.5104370117188, 840.26220703125, 864.0139770507812, 887.7656860351562, 911.5174560546875, 935.2691650390625, 959.0209350585938, 982.7726440429688, 1006.5244140625, 1030.276123046875, 1054.02783203125, 1077.7796630859375, 1101.5313720703125, 1125.2830810546875, 1149.0347900390625, 1172.78662109375, 1196.538330078125, 1220.2900390625]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 4.0, 12.0, 9.0, 12.0, 13.0, 11.0, 14.0, 15.0, 15.0, 20.0, 26.0, 17.0, 34.0, 30.0, 35.0, 31.0, 36.0, 31.0, 39.0, 30.0, 40.0, 38.0, 39.0, 40.0, 42.0, 36.0, 37.0, 32.0, 31.0, 32.0, 19.0, 20.0, 21.0, 18.0, 21.0, 17.0, 18.0, 10.0, 19.0, 6.0, 8.0, 4.0, 5.0, 6.0, 6.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-227.4165802001953, -220.11477661132812, -212.81298828125, -205.5111846923828, -198.20938110351562, -190.90757751464844, -183.60577392578125, -176.30398559570312, -169.00218200683594, -161.70037841796875, -154.39859008789062, -147.09678649902344, -139.79498291015625, -132.49317932128906, -125.1913833618164, -117.88958740234375, -110.58778381347656, -103.28598022460938, -95.98418426513672, -88.68238830566406, -81.38058471679688, -74.07878112792969, -66.77698516845703, -59.47518539428711, -52.17338562011719, -44.871585845947266, -37.569786071777344, -30.267986297607422, -22.9661865234375, -15.664386749267578, -8.362586975097656, -1.0607872009277344, 6.24102783203125, 13.542827606201172, 20.844627380371094, 28.146427154541016, 35.44822692871094, 42.75002670288086, 50.05182647705078, 57.3536262512207, 64.65542602539062, 71.95722961425781, 79.25902557373047, 86.56082153320312, 93.86262512207031, 101.1644287109375, 108.46622467041016, 115.76802062988281, 123.06982421875, 130.3716278076172, 137.67343139648438, 144.9752197265625, 152.2770233154297, 159.57882690429688, 166.880615234375, 174.1824188232422, 181.48422241210938, 188.78602600097656, 196.08782958984375, 203.38961791992188, 210.69142150878906, 217.99322509765625, 225.29501342773438, 232.59681701660156, 239.89862060546875]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 6.0, 4.0, 9.0, 6.0, 7.0, 8.0, 9.0, 16.0, 16.0, 15.0, 15.0, 13.0, 25.0, 27.0, 29.0, 26.0, 45.0, 35.0, 30.0, 37.0, 39.0, 31.0, 43.0, 37.0, 55.0, 46.0, 43.0, 33.0, 46.0, 28.0, 31.0, 23.0, 26.0, 27.0, 27.0, 17.0, 11.0, 15.0, 14.0, 7.0, 7.0, 5.0, 5.0, 5.0, 2.0, 0.0, 3.0, 4.0, 1.0, 1.0, 2.0], "bins": [-40.21875, -39.09228515625, -37.9658203125, -36.83935546875, -35.712890625, -34.58642578125, -33.4599609375, -32.33349609375, -31.20703125, -30.08056640625, -28.9541015625, -27.82763671875, -26.701171875, -25.57470703125, -24.4482421875, -23.32177734375, -22.1953125, -21.06884765625, -19.9423828125, -18.81591796875, -17.689453125, -16.56298828125, -15.4365234375, -14.31005859375, -13.18359375, -12.05712890625, -10.9306640625, -9.80419921875, -8.677734375, -7.55126953125, -6.4248046875, -5.29833984375, -4.171875, -3.04541015625, -1.9189453125, -0.79248046875, 0.333984375, 1.46044921875, 2.5869140625, 3.71337890625, 4.83984375, 5.96630859375, 7.0927734375, 8.21923828125, 9.345703125, 10.47216796875, 11.5986328125, 12.72509765625, 13.8515625, 14.97802734375, 16.1044921875, 17.23095703125, 18.357421875, 19.48388671875, 20.6103515625, 21.73681640625, 22.86328125, 23.98974609375, 25.1162109375, 26.24267578125, 27.369140625, 28.49560546875, 29.6220703125, 30.74853515625, 31.875]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 6.0, 1.0, 16.0, 8.0, 10.0, 22.0, 34.0, 68.0, 101.0, 144.0, 214.0, 336.0, 450.0, 692.0, 1015.0, 1506.0, 2404.0, 3497.0, 5333.0, 8157.0, 12610.0, 19990.0, 32515.0, 54584.0, 97890.0, 189910.0, 266712.0, 150307.0, 78757.0, 45322.0, 27566.0, 16976.0, 10794.0, 7053.0, 4587.0, 2944.0, 2002.0, 1311.0, 866.0, 622.0, 395.0, 272.0, 163.0, 130.0, 100.0, 50.0, 41.0, 21.0, 22.0, 15.0, 9.0, 9.0, 4.0, 5.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.5849609375, -1.5290069580078125, -1.473052978515625, -1.4170989990234375, -1.36114501953125, -1.3051910400390625, -1.249237060546875, -1.1932830810546875, -1.1373291015625, -1.0813751220703125, -1.025421142578125, -0.9694671630859375, -0.91351318359375, -0.8575592041015625, -0.801605224609375, -0.7456512451171875, -0.689697265625, -0.6337432861328125, -0.577789306640625, -0.5218353271484375, -0.46588134765625, -0.4099273681640625, -0.353973388671875, -0.2980194091796875, -0.2420654296875, -0.1861114501953125, -0.130157470703125, -0.0742034912109375, -0.01824951171875, 0.0377044677734375, 0.093658447265625, 0.1496124267578125, 0.20556640625, 0.2615203857421875, 0.317474365234375, 0.3734283447265625, 0.42938232421875, 0.4853363037109375, 0.541290283203125, 0.5972442626953125, 0.6531982421875, 0.7091522216796875, 0.765106201171875, 0.8210601806640625, 0.87701416015625, 0.9329681396484375, 0.988922119140625, 1.0448760986328125, 1.100830078125, 1.1567840576171875, 1.212738037109375, 1.2686920166015625, 1.32464599609375, 1.3805999755859375, 1.436553955078125, 1.4925079345703125, 1.5484619140625, 1.6044158935546875, 1.660369873046875, 1.7163238525390625, 1.77227783203125, 1.8282318115234375, 1.884185791015625, 1.9401397705078125, 1.99609375]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 3.0, 4.0, 6.0, 4.0, 8.0, 9.0, 10.0, 13.0, 9.0, 13.0, 18.0, 16.0, 30.0, 23.0, 24.0, 32.0, 35.0, 25.0, 31.0, 40.0, 33.0, 41.0, 33.0, 1061.0, 51.0, 41.0, 34.0, 45.0, 38.0, 36.0, 32.0, 29.0, 24.0, 17.0, 20.0, 24.0, 16.0, 15.0, 12.0, 14.0, 7.0, 12.0, 6.0, 6.0, 7.0, 3.0, 6.0, 2.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-20.671875, -19.974365234375, -19.27685546875, -18.579345703125, -17.8818359375, -17.184326171875, -16.48681640625, -15.789306640625, -15.091796875, -14.394287109375, -13.69677734375, -12.999267578125, -12.3017578125, -11.604248046875, -10.90673828125, -10.209228515625, -9.51171875, -8.814208984375, -8.11669921875, -7.419189453125, -6.7216796875, -6.024169921875, -5.32666015625, -4.629150390625, -3.931640625, -3.234130859375, -2.53662109375, -1.839111328125, -1.1416015625, -0.444091796875, 0.25341796875, 0.950927734375, 1.6484375, 2.345947265625, 3.04345703125, 3.740966796875, 4.4384765625, 5.135986328125, 5.83349609375, 6.531005859375, 7.228515625, 7.926025390625, 8.62353515625, 9.321044921875, 10.0185546875, 10.716064453125, 11.41357421875, 12.111083984375, 12.80859375, 13.506103515625, 14.20361328125, 14.901123046875, 15.5986328125, 16.296142578125, 16.99365234375, 17.691162109375, 18.388671875, 19.086181640625, 19.78369140625, 20.481201171875, 21.1787109375, 21.876220703125, 22.57373046875, 23.271240234375, 23.96875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 14.0, 9.0, 14.0, 13.0, 35.0, 50.0, 80.0, 105.0, 179.0, 223.0, 328.0, 519.0, 713.0, 1101.0, 1704.0, 2592.0, 3885.0, 6018.0, 9601.0, 15128.0, 25070.0, 43006.0, 80086.0, 172986.0, 1365798.0, 175979.0, 80386.0, 43733.0, 25210.0, 15388.0, 9541.0, 6082.0, 3873.0, 2546.0, 1701.0, 1112.0, 745.0, 476.0, 343.0, 222.0, 164.0, 121.0, 86.0, 52.0, 34.0, 23.0, 17.0, 14.0, 10.0, 8.0, 3.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-1.818359375, -1.758758544921875, -1.69915771484375, -1.639556884765625, -1.5799560546875, -1.520355224609375, -1.46075439453125, -1.401153564453125, -1.341552734375, -1.281951904296875, -1.22235107421875, -1.162750244140625, -1.1031494140625, -1.043548583984375, -0.98394775390625, -0.924346923828125, -0.86474609375, -0.805145263671875, -0.74554443359375, -0.685943603515625, -0.6263427734375, -0.566741943359375, -0.50714111328125, -0.447540283203125, -0.387939453125, -0.328338623046875, -0.26873779296875, -0.209136962890625, -0.1495361328125, -0.089935302734375, -0.03033447265625, 0.029266357421875, 0.0888671875, 0.148468017578125, 0.20806884765625, 0.267669677734375, 0.3272705078125, 0.386871337890625, 0.44647216796875, 0.506072998046875, 0.565673828125, 0.625274658203125, 0.68487548828125, 0.744476318359375, 0.8040771484375, 0.863677978515625, 0.92327880859375, 0.982879638671875, 1.04248046875, 1.102081298828125, 1.16168212890625, 1.221282958984375, 1.2808837890625, 1.340484619140625, 1.40008544921875, 1.459686279296875, 1.519287109375, 1.578887939453125, 1.63848876953125, 1.698089599609375, 1.7576904296875, 1.817291259765625, 1.87689208984375, 1.936492919921875, 1.99609375]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 7.0, 5.0, 10.0, 12.0, 10.0, 9.0, 10.0, 24.0, 24.0, 35.0, 41.0, 49.0, 46.0, 50.0, 83.0, 76.0, 91.0, 66.0, 71.0, 53.0, 37.0, 44.0, 31.0, 22.0, 17.0, 12.0, 9.0, 8.0, 8.0, 5.0, 8.0, 5.0, 4.0, 4.0, 6.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0217742919921875, -0.021062612533569336, -0.020350933074951172, -0.019639253616333008, -0.018927574157714844, -0.01821589469909668, -0.017504215240478516, -0.01679253578186035, -0.016080856323242188, -0.015369176864624023, -0.01465749740600586, -0.013945817947387695, -0.013234138488769531, -0.012522459030151367, -0.011810779571533203, -0.011099100112915039, -0.010387420654296875, -0.009675741195678711, -0.008964061737060547, -0.008252382278442383, -0.007540702819824219, -0.006829023361206055, -0.006117343902587891, -0.0054056644439697266, -0.0046939849853515625, -0.0039823055267333984, -0.0032706260681152344, -0.0025589466094970703, -0.0018472671508789062, -0.0011355876922607422, -0.0004239082336425781, 0.00028777122497558594, 0.00099945068359375, 0.001711130142211914, 0.002422809600830078, 0.003134489059448242, 0.0038461685180664062, 0.00455784797668457, 0.005269527435302734, 0.0059812068939208984, 0.0066928863525390625, 0.0074045658111572266, 0.00811624526977539, 0.008827924728393555, 0.009539604187011719, 0.010251283645629883, 0.010962963104248047, 0.011674642562866211, 0.012386322021484375, 0.013098001480102539, 0.013809680938720703, 0.014521360397338867, 0.015233039855957031, 0.015944719314575195, 0.01665639877319336, 0.017368078231811523, 0.018079757690429688, 0.01879143714904785, 0.019503116607666016, 0.02021479606628418, 0.020926475524902344, 0.021638154983520508, 0.022349834442138672, 0.023061513900756836, 0.023773193359375]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 6.0, 5.0, 4.0, 9.0, 9.0, 7.0, 14.0, 11.0, 14.0, 19.0, 33.0, 37.0, 51.0, 65.0, 99.0, 172.0, 516.0, 3303.0, 59391.0, 953349.0, 28517.0, 2069.0, 358.0, 156.0, 90.0, 75.0, 50.0, 28.0, 24.0, 16.0, 16.0, 10.0, 11.0, 4.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.39697265625, -0.3850860595703125, -0.373199462890625, -0.3613128662109375, -0.34942626953125, -0.3375396728515625, -0.325653076171875, -0.3137664794921875, -0.3018798828125, -0.2899932861328125, -0.278106689453125, -0.2662200927734375, -0.25433349609375, -0.2424468994140625, -0.230560302734375, -0.2186737060546875, -0.206787109375, -0.1949005126953125, -0.183013916015625, -0.1711273193359375, -0.15924072265625, -0.1473541259765625, -0.135467529296875, -0.1235809326171875, -0.1116943359375, -0.0998077392578125, -0.087921142578125, -0.0760345458984375, -0.06414794921875, -0.0522613525390625, -0.040374755859375, -0.0284881591796875, -0.0166015625, -0.0047149658203125, 0.007171630859375, 0.0190582275390625, 0.03094482421875, 0.0428314208984375, 0.054718017578125, 0.0666046142578125, 0.0784912109375, 0.0903778076171875, 0.102264404296875, 0.1141510009765625, 0.12603759765625, 0.1379241943359375, 0.149810791015625, 0.1616973876953125, 0.173583984375, 0.1854705810546875, 0.197357177734375, 0.2092437744140625, 0.22113037109375, 0.2330169677734375, 0.244903564453125, 0.2567901611328125, 0.2686767578125, 0.2805633544921875, 0.292449951171875, 0.3043365478515625, 0.31622314453125, 0.3281097412109375, 0.339996337890625, 0.3518829345703125, 0.36376953125]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 47.0, 608.0, 317.0, 40.0, 7.0], "bins": [-0.2597496807575226, -0.2554858922958374, -0.2512221038341522, -0.24695831537246704, -0.24269452691078186, -0.23843073844909668, -0.2341669499874115, -0.22990316152572632, -0.22563937306404114, -0.22137558460235596, -0.21711179614067078, -0.2128480076789856, -0.20858421921730042, -0.20432043075561523, -0.20005664229393005, -0.19579285383224487, -0.1915290653705597, -0.1872652769088745, -0.18300148844718933, -0.17873769998550415, -0.17447391152381897, -0.1702101230621338, -0.1659463346004486, -0.16168254613876343, -0.15741875767707825, -0.15315496921539307, -0.14889118075370789, -0.1446273922920227, -0.14036360383033752, -0.13609981536865234, -0.13183602690696716, -0.12757223844528198, -0.1233084499835968, -0.11904466152191162, -0.11478087306022644, -0.11051708459854126, -0.10625329613685608, -0.1019895076751709, -0.09772571921348572, -0.09346193075180054, -0.08919814229011536, -0.08493435382843018, -0.080670565366745, -0.07640677690505981, -0.07214298844337463, -0.06787919998168945, -0.06361541152000427, -0.05935162305831909, -0.05508783459663391, -0.05082404613494873, -0.04656025767326355, -0.04229646921157837, -0.03803268074989319, -0.03376889228820801, -0.029505103826522827, -0.025241315364837646, -0.020977528765797615, -0.016713740304112434, -0.012449951842427254, -0.008186163380742073, -0.003922374919056892, 0.00034141354262828827, 0.004605202004313469, 0.00886899046599865, 0.01313277892768383]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 5.0, 0.0, 6.0, 6.0, 7.0, 11.0, 10.0, 17.0, 21.0, 22.0, 28.0, 26.0, 30.0, 31.0, 29.0, 35.0, 40.0, 45.0, 58.0, 45.0, 44.0, 51.0, 36.0, 59.0, 46.0, 38.0, 32.0, 38.0, 24.0, 27.0, 24.0, 17.0, 19.0, 20.0, 12.0, 9.0, 8.0, 7.0, 5.0, 6.0, 5.0, 3.0, 5.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.011905908584594727, -0.01147399190813303, -0.011042075231671333, -0.010610158555209637, -0.01017824187874794, -0.009746325202286243, -0.009314408525824547, -0.00888249184936285, -0.008450575172901154, -0.008018658496439457, -0.00758674181997776, -0.007154825143516064, -0.006722908467054367, -0.0062909917905926704, -0.005859075114130974, -0.005427158437669277, -0.004995241761207581, -0.004563325084745884, -0.004131408408284187, -0.0036994917318224907, -0.003267575055360794, -0.0028356583788990974, -0.002403741702437401, -0.001971825025975704, -0.0015399083495140076, -0.001107991673052311, -0.0006760749965906143, -0.0002441583201289177, 0.00018775835633277893, 0.0006196750327944756, 0.0010515917092561722, 0.0014835083857178688, 0.0019154250621795654, 0.002347341738641262, 0.0027792584151029587, 0.0032111750915646553, 0.003643091768026352, 0.0040750084444880486, 0.004506925120949745, 0.004938841797411442, 0.005370758473873138, 0.005802675150334835, 0.006234591826796532, 0.006666508503258228, 0.007098425179719925, 0.0075303418561816216, 0.007962258532643318, 0.008394175209105015, 0.008826091885566711, 0.009258008562028408, 0.009689925238490105, 0.010121841914951801, 0.010553758591413498, 0.010985675267875195, 0.011417591944336891, 0.011849508620798588, 0.012281425297260284, 0.012713341973721981, 0.013145258650183678, 0.013577175326645374, 0.014009092003107071, 0.014441008679568768, 0.014872925356030464, 0.01530484203249216, 0.015736758708953857]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 6.0, 4.0, 9.0, 6.0, 7.0, 8.0, 9.0, 16.0, 16.0, 15.0, 15.0, 13.0, 25.0, 26.0, 30.0, 26.0, 45.0, 35.0, 30.0, 37.0, 39.0, 31.0, 43.0, 37.0, 55.0, 46.0, 43.0, 33.0, 46.0, 27.0, 31.0, 24.0, 26.0, 27.0, 27.0, 17.0, 11.0, 15.0, 14.0, 7.0, 7.0, 5.0, 5.0, 5.0, 2.0, 0.0, 3.0, 4.0, 1.0, 1.0, 2.0], "bins": [-40.21875, -39.092529296875, -37.96630859375, -36.840087890625, -35.7138671875, -34.587646484375, -33.46142578125, -32.335205078125, -31.208984375, -30.082763671875, -28.95654296875, -27.830322265625, -26.7041015625, -25.577880859375, -24.45166015625, -23.325439453125, -22.19921875, -21.072998046875, -19.94677734375, -18.820556640625, -17.6943359375, -16.568115234375, -15.44189453125, -14.315673828125, -13.189453125, -12.063232421875, -10.93701171875, -9.810791015625, -8.6845703125, -7.558349609375, -6.43212890625, -5.305908203125, -4.1796875, -3.053466796875, -1.92724609375, -0.801025390625, 0.3251953125, 1.451416015625, 2.57763671875, 3.703857421875, 4.830078125, 5.956298828125, 7.08251953125, 8.208740234375, 9.3349609375, 10.461181640625, 11.58740234375, 12.713623046875, 13.83984375, 14.966064453125, 16.09228515625, 17.218505859375, 18.3447265625, 19.470947265625, 20.59716796875, 21.723388671875, 22.849609375, 23.975830078125, 25.10205078125, 26.228271484375, 27.3544921875, 28.480712890625, 29.60693359375, 30.733154296875, 31.859375]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 3.0, 2.0, 5.0, 9.0, 10.0, 8.0, 12.0, 19.0, 39.0, 53.0, 67.0, 76.0, 117.0, 132.0, 182.0, 279.0, 402.0, 519.0, 786.0, 1100.0, 1701.0, 2450.0, 3908.0, 6707.0, 12651.0, 29148.0, 89096.0, 392241.0, 363800.0, 84681.0, 27832.0, 12348.0, 6614.0, 3751.0, 2454.0, 1587.0, 1146.0, 736.0, 500.0, 380.0, 238.0, 223.0, 154.0, 108.0, 77.0, 59.0, 49.0, 31.0, 27.0, 18.0, 4.0, 8.0, 8.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0], "bins": [-25.46875, -24.619140625, -23.76953125, -22.919921875, -22.0703125, -21.220703125, -20.37109375, -19.521484375, -18.671875, -17.822265625, -16.97265625, -16.123046875, -15.2734375, -14.423828125, -13.57421875, -12.724609375, -11.875, -11.025390625, -10.17578125, -9.326171875, -8.4765625, -7.626953125, -6.77734375, -5.927734375, -5.078125, -4.228515625, -3.37890625, -2.529296875, -1.6796875, -0.830078125, 0.01953125, 0.869140625, 1.71875, 2.568359375, 3.41796875, 4.267578125, 5.1171875, 5.966796875, 6.81640625, 7.666015625, 8.515625, 9.365234375, 10.21484375, 11.064453125, 11.9140625, 12.763671875, 13.61328125, 14.462890625, 15.3125, 16.162109375, 17.01171875, 17.861328125, 18.7109375, 19.560546875, 20.41015625, 21.259765625, 22.109375, 22.958984375, 23.80859375, 24.658203125, 25.5078125, 26.357421875, 27.20703125, 28.056640625, 28.90625]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 5.0, 7.0, 5.0, 3.0, 6.0, 13.0, 16.0, 12.0, 22.0, 11.0, 22.0, 20.0, 27.0, 22.0, 32.0, 31.0, 44.0, 43.0, 37.0, 61.0, 158.0, 1790.0, 165.0, 75.0, 59.0, 39.0, 30.0, 32.0, 26.0, 25.0, 35.0, 32.0, 25.0, 20.0, 17.0, 12.0, 10.0, 16.0, 10.0, 8.0, 13.0, 8.0, 4.0, 1.0, 0.0, 2.0, 3.0, 2.0], "bins": [-132.875, -129.33203125, -125.7890625, -122.24609375, -118.703125, -115.16015625, -111.6171875, -108.07421875, -104.53125, -100.98828125, -97.4453125, -93.90234375, -90.359375, -86.81640625, -83.2734375, -79.73046875, -76.1875, -72.64453125, -69.1015625, -65.55859375, -62.015625, -58.47265625, -54.9296875, -51.38671875, -47.84375, -44.30078125, -40.7578125, -37.21484375, -33.671875, -30.12890625, -26.5859375, -23.04296875, -19.5, -15.95703125, -12.4140625, -8.87109375, -5.328125, -1.78515625, 1.7578125, 5.30078125, 8.84375, 12.38671875, 15.9296875, 19.47265625, 23.015625, 26.55859375, 30.1015625, 33.64453125, 37.1875, 40.73046875, 44.2734375, 47.81640625, 51.359375, 54.90234375, 58.4453125, 61.98828125, 65.53125, 69.07421875, 72.6171875, 76.16015625, 79.703125, 83.24609375, 86.7890625, 90.33203125, 93.875]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 8.0, 9.0, 10.0, 15.0, 19.0, 23.0, 23.0, 29.0, 51.0, 66.0, 78.0, 97.0, 117.0, 164.0, 186.0, 315.0, 1070.0, 10068.0, 3056477.0, 72470.0, 2884.0, 583.0, 236.0, 144.0, 122.0, 113.0, 74.0, 50.0, 31.0, 24.0, 41.0, 25.0, 27.0, 16.0, 11.0, 5.0, 8.0, 5.0, 4.0, 3.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-262.25, -253.4375, -244.625, -235.8125, -227.0, -218.1875, -209.375, -200.5625, -191.75, -182.9375, -174.125, -165.3125, -156.5, -147.6875, -138.875, -130.0625, -121.25, -112.4375, -103.625, -94.8125, -86.0, -77.1875, -68.375, -59.5625, -50.75, -41.9375, -33.125, -24.3125, -15.5, -6.6875, 2.125, 10.9375, 19.75, 28.5625, 37.375, 46.1875, 55.0, 63.8125, 72.625, 81.4375, 90.25, 99.0625, 107.875, 116.6875, 125.5, 134.3125, 143.125, 151.9375, 160.75, 169.5625, 178.375, 187.1875, 196.0, 204.8125, 213.625, 222.4375, 231.25, 240.0625, 248.875, 257.6875, 266.5, 275.3125, 284.125, 292.9375, 301.75]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 7.0, 258.0, 727.0, 29.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-132.9928436279297, -91.32991027832031, -49.666969299316406, -8.0040283203125, 33.658905029296875, 75.32183837890625, 116.98478698730469, 158.64772033691406, 200.31065368652344, 241.9735870361328, 283.63653564453125, 325.2994689941406, 366.96240234375, 408.6253356933594, 450.28826904296875, 491.95123291015625, 533.6141357421875, 575.277099609375, 616.9400024414062, 658.6029663085938, 700.265869140625, 741.9288330078125, 783.591796875, 825.2546997070312, 866.9176635742188, 908.5806274414062, 950.2435302734375, 991.906494140625, 1033.5694580078125, 1075.2322998046875, 1116.895263671875, 1158.5582275390625, 1200.2210693359375, 1241.884033203125, 1283.5469970703125, 1325.2098388671875, 1366.872802734375, 1408.5357666015625, 1450.19873046875, 1491.861572265625, 1533.5245361328125, 1575.1875, 1616.8504638671875, 1658.5133056640625, 1700.17626953125, 1741.8392333984375, 1783.502197265625, 1825.1650390625, 1866.828125, 1908.4910888671875, 1950.154052734375, 1991.81689453125, 2033.4798583984375, 2075.142822265625, 2116.8056640625, 2158.46875, 2200.131591796875, 2241.79443359375, 2283.45751953125, 2325.120361328125, 2366.783447265625, 2408.4462890625, 2450.109130859375, 2491.772216796875, 2533.43505859375]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 6.0, 16.0, 10.0, 13.0, 17.0, 22.0, 18.0, 25.0, 18.0, 28.0, 33.0, 47.0, 36.0, 33.0, 33.0, 41.0, 32.0, 45.0, 47.0, 42.0, 45.0, 38.0, 43.0, 50.0, 39.0, 28.0, 28.0, 34.0, 14.0, 29.0, 17.0, 10.0, 11.0, 5.0, 8.0, 9.0, 9.0, 3.0, 3.0, 0.0, 5.0, 6.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-322.0838623046875, -312.42578125, -302.7677001953125, -293.1096496582031, -283.4515686035156, -273.7934875488281, -264.13543701171875, -254.47735595703125, -244.81927490234375, -235.16119384765625, -225.5031280517578, -215.84506225585938, -206.18698120117188, -196.52890014648438, -186.87083435058594, -177.2127685546875, -167.5546875, -157.8966064453125, -148.23854064941406, -138.58047485351562, -128.92239379882812, -119.26432037353516, -109.60624694824219, -99.94817352294922, -90.29010009765625, -80.63202667236328, -70.97395324707031, -61.315879821777344, -51.657806396484375, -41.999732971191406, -32.34165954589844, -22.68358612060547, -13.0255126953125, -3.3674392700195312, 6.2906341552734375, 15.948707580566406, 25.606781005859375, 35.264854431152344, 44.92292785644531, 54.58100128173828, 64.23907470703125, 73.89714813232422, 83.55522155761719, 93.21329498291016, 102.87136840820312, 112.5294418334961, 122.18751525878906, 131.8455810546875, 141.503662109375, 151.1617431640625, 160.81980895996094, 170.47787475585938, 180.13595581054688, 189.79403686523438, 199.4521026611328, 209.11016845703125, 218.76824951171875, 228.42633056640625, 238.0843963623047, 247.74246215820312, 257.4005432128906, 267.0586242675781, 276.7166748046875, 286.374755859375, 296.0328369140625]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 7.0, 4.0, 4.0, 4.0, 7.0, 3.0, 10.0, 13.0, 9.0, 8.0, 14.0, 14.0, 18.0, 6.0, 22.0, 24.0, 29.0, 26.0, 35.0, 26.0, 37.0, 34.0, 43.0, 41.0, 27.0, 34.0, 39.0, 45.0, 45.0, 45.0, 35.0, 30.0, 36.0, 28.0, 32.0, 25.0, 25.0, 21.0, 20.0, 14.0, 16.0, 10.0, 14.0, 4.0, 11.0, 5.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 5.0, 0.0, 2.0], "bins": [-38.25, -37.146484375, -36.04296875, -34.939453125, -33.8359375, -32.732421875, -31.62890625, -30.525390625, -29.421875, -28.318359375, -27.21484375, -26.111328125, -25.0078125, -23.904296875, -22.80078125, -21.697265625, -20.59375, -19.490234375, -18.38671875, -17.283203125, -16.1796875, -15.076171875, -13.97265625, -12.869140625, -11.765625, -10.662109375, -9.55859375, -8.455078125, -7.3515625, -6.248046875, -5.14453125, -4.041015625, -2.9375, -1.833984375, -0.73046875, 0.373046875, 1.4765625, 2.580078125, 3.68359375, 4.787109375, 5.890625, 6.994140625, 8.09765625, 9.201171875, 10.3046875, 11.408203125, 12.51171875, 13.615234375, 14.71875, 15.822265625, 16.92578125, 18.029296875, 19.1328125, 20.236328125, 21.33984375, 22.443359375, 23.546875, 24.650390625, 25.75390625, 26.857421875, 27.9609375, 29.064453125, 30.16796875, 31.271484375, 32.375]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 7.0, 4.0, 8.0, 3.0, 9.0, 6.0, 17.0, 13.0, 24.0, 19.0, 21.0, 40.0, 45.0, 76.0, 116.0, 150.0, 269.0, 428.0, 744.0, 1308.0, 2207.0, 4389.0, 10823.0, 198203.0, 3775138.0, 180526.0, 10414.0, 4339.0, 2140.0, 1127.0, 668.0, 347.0, 212.0, 129.0, 81.0, 58.0, 45.0, 25.0, 29.0, 14.0, 14.0, 12.0, 10.0, 13.0, 4.0, 4.0, 4.0, 0.0, 0.0, 3.0, 3.0, 1.0, 4.0], "bins": [-165.875, -161.19921875, -156.5234375, -151.84765625, -147.171875, -142.49609375, -137.8203125, -133.14453125, -128.46875, -123.79296875, -119.1171875, -114.44140625, -109.765625, -105.08984375, -100.4140625, -95.73828125, -91.0625, -86.38671875, -81.7109375, -77.03515625, -72.359375, -67.68359375, -63.0078125, -58.33203125, -53.65625, -48.98046875, -44.3046875, -39.62890625, -34.953125, -30.27734375, -25.6015625, -20.92578125, -16.25, -11.57421875, -6.8984375, -2.22265625, 2.453125, 7.12890625, 11.8046875, 16.48046875, 21.15625, 25.83203125, 30.5078125, 35.18359375, 39.859375, 44.53515625, 49.2109375, 53.88671875, 58.5625, 63.23828125, 67.9140625, 72.58984375, 77.265625, 81.94140625, 86.6171875, 91.29296875, 95.96875, 100.64453125, 105.3203125, 109.99609375, 114.671875, 119.34765625, 124.0234375, 128.69921875, 133.375]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 10.0, 9.0, 6.0, 18.0, 19.0, 24.0, 50.0, 72.0, 264.0, 832.0, 1595.0, 737.0, 249.0, 75.0, 43.0, 19.0, 14.0, 10.0, 16.0, 6.0, 6.0, 0.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-158.625, -154.1494140625, -149.673828125, -145.1982421875, -140.72265625, -136.2470703125, -131.771484375, -127.2958984375, -122.8203125, -118.3447265625, -113.869140625, -109.3935546875, -104.91796875, -100.4423828125, -95.966796875, -91.4912109375, -87.015625, -82.5400390625, -78.064453125, -73.5888671875, -69.11328125, -64.6376953125, -60.162109375, -55.6865234375, -51.2109375, -46.7353515625, -42.259765625, -37.7841796875, -33.30859375, -28.8330078125, -24.357421875, -19.8818359375, -15.40625, -10.9306640625, -6.455078125, -1.9794921875, 2.49609375, 6.9716796875, 11.447265625, 15.9228515625, 20.3984375, 24.8740234375, 29.349609375, 33.8251953125, 38.30078125, 42.7763671875, 47.251953125, 51.7275390625, 56.203125, 60.6787109375, 65.154296875, 69.6298828125, 74.10546875, 78.5810546875, 83.056640625, 87.5322265625, 92.0078125, 96.4833984375, 100.958984375, 105.4345703125, 109.91015625, 114.3857421875, 118.861328125, 123.3369140625, 127.8125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 6.0, 8.0, 10.0, 19.0, 36.0, 51.0, 65.0, 130.0, 183.0, 283.0, 550.0, 1107.0, 2953.0, 9966.0, 49287.0, 3708275.0, 388220.0, 23374.0, 5977.0, 1943.0, 808.0, 412.0, 226.0, 149.0, 94.0, 65.0, 43.0, 19.0, 10.0, 8.0, 3.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-209.0, -201.48046875, -193.9609375, -186.44140625, -178.921875, -171.40234375, -163.8828125, -156.36328125, -148.84375, -141.32421875, -133.8046875, -126.28515625, -118.765625, -111.24609375, -103.7265625, -96.20703125, -88.6875, -81.16796875, -73.6484375, -66.12890625, -58.609375, -51.08984375, -43.5703125, -36.05078125, -28.53125, -21.01171875, -13.4921875, -5.97265625, 1.546875, 9.06640625, 16.5859375, 24.10546875, 31.625, 39.14453125, 46.6640625, 54.18359375, 61.703125, 69.22265625, 76.7421875, 84.26171875, 91.78125, 99.30078125, 106.8203125, 114.33984375, 121.859375, 129.37890625, 136.8984375, 144.41796875, 151.9375, 159.45703125, 166.9765625, 174.49609375, 182.015625, 189.53515625, 197.0546875, 204.57421875, 212.09375, 219.61328125, 227.1328125, 234.65234375, 242.171875, 249.69140625, 257.2109375, 264.73046875, 272.25]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 2.0, 2.0, 8.0, 18.0, 20.0, 29.0, 40.0, 52.0, 93.0, 187.0, 216.0, 125.0, 71.0, 48.0, 32.0, 34.0, 10.0, 8.0, 4.0, 5.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-285.93731689453125, -270.15240478515625, -254.36749267578125, -238.58258056640625, -222.79766845703125, -207.01275634765625, -191.2278594970703, -175.4429473876953, -159.6580352783203, -143.8731231689453, -128.0882110595703, -112.30330657958984, -96.51839447021484, -80.73348236083984, -64.94857788085938, -49.163665771484375, -33.378753662109375, -17.593843460083008, -1.8089332580566406, 13.975975036621094, 29.760887145996094, 45.545799255371094, 61.33070373535156, 77.11561584472656, 92.90052795410156, 108.68544006347656, 124.47035217285156, 140.2552490234375, 156.0401611328125, 171.8250732421875, 187.6099853515625, 203.3948974609375, 219.1798095703125, 234.9647216796875, 250.7496337890625, 266.5345458984375, 282.3194580078125, 298.1043701171875, 313.8892822265625, 329.6741943359375, 345.4591064453125, 361.2440185546875, 377.0289306640625, 392.8138427734375, 408.5987548828125, 424.3836669921875, 440.1685791015625, 455.9534912109375, 471.7383728027344, 487.5232849121094, 503.3081970214844, 519.0930786132812, 534.8779907226562, 550.6629028320312, 566.4478149414062, 582.2327270507812, 598.0176391601562, 613.8025512695312, 629.5874633789062, 645.3723754882812, 661.1572875976562, 676.9421997070312, 692.7271118164062, 708.5120239257812, 724.2969360351562]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 2.0, 8.0, 2.0, 1.0, 3.0, 8.0, 5.0, 10.0, 9.0, 15.0, 15.0, 6.0, 14.0, 13.0, 23.0, 17.0, 25.0, 25.0, 21.0, 34.0, 30.0, 38.0, 23.0, 38.0, 34.0, 36.0, 43.0, 37.0, 44.0, 25.0, 38.0, 33.0, 32.0, 29.0, 23.0, 34.0, 23.0, 26.0, 15.0, 18.0, 21.0, 13.0, 13.0, 9.0, 18.0, 11.0, 13.0, 7.0, 5.0, 3.0, 9.0, 4.0, 3.0, 1.0, 1.0, 8.0, 1.0, 1.0, 1.0, 2.0], "bins": [-193.8929443359375, -187.69061279296875, -181.48826599121094, -175.28591918945312, -169.08358764648438, -162.88125610351562, -156.6789093017578, -150.4765625, -144.27423095703125, -138.0718994140625, -131.8695526123047, -125.6672134399414, -119.46487426757812, -113.26253509521484, -107.06019592285156, -100.85785675048828, -94.655517578125, -88.45317840576172, -82.25083923339844, -76.04850006103516, -69.84616088867188, -63.643821716308594, -57.44148254394531, -51.23914337158203, -45.03680419921875, -38.83446502685547, -32.63212585449219, -26.429786682128906, -20.227447509765625, -14.025108337402344, -7.8227691650390625, -1.6204299926757812, 4.5819091796875, 10.784248352050781, 16.986587524414062, 23.188926696777344, 29.391265869140625, 35.593605041503906, 41.79594421386719, 47.99828338623047, 54.20062255859375, 60.40296173095703, 66.60530090332031, 72.8076400756836, 79.00997924804688, 85.21231842041016, 91.41465759277344, 97.61699676513672, 103.8193359375, 110.02167510986328, 116.22401428222656, 122.42635345458984, 128.62869262695312, 134.83102416992188, 141.0333709716797, 147.2357177734375, 153.43804931640625, 159.640380859375, 165.8427276611328, 172.04507446289062, 178.24740600585938, 184.44973754882812, 190.65208435058594, 196.85443115234375, 203.0567626953125]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 5.0, 5.0, 10.0, 4.0, 10.0, 11.0, 7.0, 20.0, 12.0, 18.0, 13.0, 18.0, 32.0, 25.0, 26.0, 30.0, 31.0, 23.0, 39.0, 34.0, 37.0, 35.0, 44.0, 46.0, 37.0, 45.0, 35.0, 25.0, 34.0, 36.0, 35.0, 25.0, 25.0, 27.0, 26.0, 17.0, 10.0, 22.0, 19.0, 14.0, 4.0, 9.0, 5.0, 8.0, 2.0, 0.0, 5.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-37.96875, -36.81591796875, -35.6630859375, -34.51025390625, -33.357421875, -32.20458984375, -31.0517578125, -29.89892578125, -28.74609375, -27.59326171875, -26.4404296875, -25.28759765625, -24.134765625, -22.98193359375, -21.8291015625, -20.67626953125, -19.5234375, -18.37060546875, -17.2177734375, -16.06494140625, -14.912109375, -13.75927734375, -12.6064453125, -11.45361328125, -10.30078125, -9.14794921875, -7.9951171875, -6.84228515625, -5.689453125, -4.53662109375, -3.3837890625, -2.23095703125, -1.078125, 0.07470703125, 1.2275390625, 2.38037109375, 3.533203125, 4.68603515625, 5.8388671875, 6.99169921875, 8.14453125, 9.29736328125, 10.4501953125, 11.60302734375, 12.755859375, 13.90869140625, 15.0615234375, 16.21435546875, 17.3671875, 18.52001953125, 19.6728515625, 20.82568359375, 21.978515625, 23.13134765625, 24.2841796875, 25.43701171875, 26.58984375, 27.74267578125, 28.8955078125, 30.04833984375, 31.201171875, 32.35400390625, 33.5068359375, 34.65966796875, 35.8125]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [5.0, 4.0, 1.0, 6.0, 8.0, 13.0, 27.0, 25.0, 45.0, 44.0, 84.0, 110.0, 169.0, 284.0, 385.0, 610.0, 847.0, 1297.0, 1921.0, 2880.0, 4366.0, 6684.0, 10336.0, 15740.0, 24483.0, 40249.0, 66002.0, 116280.0, 221712.0, 230145.0, 120664.0, 68375.0, 41729.0, 25832.0, 16384.0, 10569.0, 6903.0, 4536.0, 2981.0, 1992.0, 1311.0, 832.0, 559.0, 374.0, 217.0, 192.0, 128.0, 74.0, 46.0, 40.0, 28.0, 12.0, 4.0, 10.0, 8.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.720703125, -1.66143798828125, -1.6021728515625, -1.54290771484375, -1.483642578125, -1.42437744140625, -1.3651123046875, -1.30584716796875, -1.24658203125, -1.18731689453125, -1.1280517578125, -1.06878662109375, -1.009521484375, -0.95025634765625, -0.8909912109375, -0.83172607421875, -0.7724609375, -0.71319580078125, -0.6539306640625, -0.59466552734375, -0.535400390625, -0.47613525390625, -0.4168701171875, -0.35760498046875, -0.29833984375, -0.23907470703125, -0.1798095703125, -0.12054443359375, -0.061279296875, -0.00201416015625, 0.0572509765625, 0.11651611328125, 0.17578125, 0.23504638671875, 0.2943115234375, 0.35357666015625, 0.412841796875, 0.47210693359375, 0.5313720703125, 0.59063720703125, 0.64990234375, 0.70916748046875, 0.7684326171875, 0.82769775390625, 0.886962890625, 0.94622802734375, 1.0054931640625, 1.06475830078125, 1.1240234375, 1.18328857421875, 1.2425537109375, 1.30181884765625, 1.361083984375, 1.42034912109375, 1.4796142578125, 1.53887939453125, 1.59814453125, 1.65740966796875, 1.7166748046875, 1.77593994140625, 1.835205078125, 1.89447021484375, 1.9537353515625, 2.01300048828125, 2.072265625]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 7.0, 2.0, 2.0, 3.0, 2.0, 5.0, 13.0, 10.0, 6.0, 13.0, 7.0, 13.0, 17.0, 16.0, 21.0, 24.0, 29.0, 31.0, 31.0, 18.0, 38.0, 34.0, 34.0, 37.0, 46.0, 35.0, 35.0, 1062.0, 35.0, 33.0, 31.0, 30.0, 30.0, 27.0, 25.0, 29.0, 24.0, 18.0, 29.0, 18.0, 19.0, 13.0, 18.0, 13.0, 12.0, 12.0, 8.0, 3.0, 3.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-22.875, -22.16552734375, -21.4560546875, -20.74658203125, -20.037109375, -19.32763671875, -18.6181640625, -17.90869140625, -17.19921875, -16.48974609375, -15.7802734375, -15.07080078125, -14.361328125, -13.65185546875, -12.9423828125, -12.23291015625, -11.5234375, -10.81396484375, -10.1044921875, -9.39501953125, -8.685546875, -7.97607421875, -7.2666015625, -6.55712890625, -5.84765625, -5.13818359375, -4.4287109375, -3.71923828125, -3.009765625, -2.30029296875, -1.5908203125, -0.88134765625, -0.171875, 0.53759765625, 1.2470703125, 1.95654296875, 2.666015625, 3.37548828125, 4.0849609375, 4.79443359375, 5.50390625, 6.21337890625, 6.9228515625, 7.63232421875, 8.341796875, 9.05126953125, 9.7607421875, 10.47021484375, 11.1796875, 11.88916015625, 12.5986328125, 13.30810546875, 14.017578125, 14.72705078125, 15.4365234375, 16.14599609375, 16.85546875, 17.56494140625, 18.2744140625, 18.98388671875, 19.693359375, 20.40283203125, 21.1123046875, 21.82177734375, 22.53125]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 4.0, 9.0, 10.0, 12.0, 15.0, 28.0, 47.0, 61.0, 88.0, 114.0, 187.0, 235.0, 382.0, 502.0, 850.0, 1266.0, 1949.0, 2876.0, 4501.0, 7308.0, 11339.0, 18113.0, 29836.0, 50003.0, 89841.0, 192041.0, 1343434.0, 152114.0, 76408.0, 43436.0, 26135.0, 15890.0, 9994.0, 6312.0, 4045.0, 2659.0, 1689.0, 1146.0, 762.0, 489.0, 314.0, 228.0, 153.0, 106.0, 80.0, 37.0, 26.0, 25.0, 15.0, 6.0, 6.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.9599609375, -1.8993988037109375, -1.838836669921875, -1.7782745361328125, -1.71771240234375, -1.6571502685546875, -1.596588134765625, -1.5360260009765625, -1.4754638671875, -1.4149017333984375, -1.354339599609375, -1.2937774658203125, -1.23321533203125, -1.1726531982421875, -1.112091064453125, -1.0515289306640625, -0.990966796875, -0.9304046630859375, -0.869842529296875, -0.8092803955078125, -0.74871826171875, -0.6881561279296875, -0.627593994140625, -0.5670318603515625, -0.5064697265625, -0.4459075927734375, -0.385345458984375, -0.3247833251953125, -0.26422119140625, -0.2036590576171875, -0.143096923828125, -0.0825347900390625, -0.02197265625, 0.0385894775390625, 0.099151611328125, 0.1597137451171875, 0.22027587890625, 0.2808380126953125, 0.341400146484375, 0.4019622802734375, 0.4625244140625, 0.5230865478515625, 0.583648681640625, 0.6442108154296875, 0.70477294921875, 0.7653350830078125, 0.825897216796875, 0.8864593505859375, 0.947021484375, 1.0075836181640625, 1.068145751953125, 1.1287078857421875, 1.18927001953125, 1.2498321533203125, 1.310394287109375, 1.3709564208984375, 1.4315185546875, 1.4920806884765625, 1.552642822265625, 1.6132049560546875, 1.67376708984375, 1.7343292236328125, 1.794891357421875, 1.8554534912109375, 1.916015625]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 4.0, 4.0, 7.0, 3.0, 12.0, 7.0, 11.0, 13.0, 13.0, 21.0, 15.0, 27.0, 33.0, 43.0, 58.0, 54.0, 53.0, 72.0, 54.0, 60.0, 52.0, 71.0, 44.0, 49.0, 32.0, 30.0, 21.0, 28.0, 25.0, 14.0, 18.0, 14.0, 9.0, 9.0, 8.0, 2.0, 1.0, 6.0, 2.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0215606689453125, -0.02093338966369629, -0.020306110382080078, -0.019678831100463867, -0.019051551818847656, -0.018424272537231445, -0.017796993255615234, -0.017169713973999023, -0.016542434692382812, -0.0159151554107666, -0.01528787612915039, -0.01466059684753418, -0.014033317565917969, -0.013406038284301758, -0.012778759002685547, -0.012151479721069336, -0.011524200439453125, -0.010896921157836914, -0.010269641876220703, -0.009642362594604492, -0.009015083312988281, -0.00838780403137207, -0.007760524749755859, -0.0071332454681396484, -0.0065059661865234375, -0.0058786869049072266, -0.005251407623291016, -0.004624128341674805, -0.003996849060058594, -0.003369569778442383, -0.002742290496826172, -0.002115011215209961, -0.00148773193359375, -0.0008604526519775391, -0.00023317337036132812, 0.0003941059112548828, 0.0010213851928710938, 0.0016486644744873047, 0.0022759437561035156, 0.0029032230377197266, 0.0035305023193359375, 0.0041577816009521484, 0.004785060882568359, 0.00541234016418457, 0.006039619445800781, 0.006666898727416992, 0.007294178009033203, 0.007921457290649414, 0.008548736572265625, 0.009176015853881836, 0.009803295135498047, 0.010430574417114258, 0.011057853698730469, 0.01168513298034668, 0.01231241226196289, 0.012939691543579102, 0.013566970825195312, 0.014194250106811523, 0.014821529388427734, 0.015448808670043945, 0.016076087951660156, 0.016703367233276367, 0.017330646514892578, 0.01795792579650879, 0.018585205078125]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 3.0, 6.0, 3.0, 4.0, 7.0, 8.0, 13.0, 19.0, 18.0, 28.0, 30.0, 45.0, 49.0, 55.0, 99.0, 124.0, 275.0, 886.0, 6600.0, 95201.0, 891067.0, 48541.0, 4014.0, 709.0, 240.0, 146.0, 81.0, 58.0, 46.0, 32.0, 30.0, 25.0, 23.0, 16.0, 9.0, 15.0, 6.0, 9.0, 3.0, 6.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.288330078125, -0.2788429260253906, -0.26935577392578125, -0.2598686218261719, -0.2503814697265625, -0.24089431762695312, -0.23140716552734375, -0.22192001342773438, -0.212432861328125, -0.20294570922851562, -0.19345855712890625, -0.18397140502929688, -0.1744842529296875, -0.16499710083007812, -0.15550994873046875, -0.14602279663085938, -0.13653564453125, -0.12704849243164062, -0.11756134033203125, -0.10807418823242188, -0.0985870361328125, -0.08909988403320312, -0.07961273193359375, -0.07012557983398438, -0.060638427734375, -0.051151275634765625, -0.04166412353515625, -0.032176971435546875, -0.0226898193359375, -0.013202667236328125, -0.00371551513671875, 0.005771636962890625, 0.0152587890625, 0.024745941162109375, 0.03423309326171875, 0.043720245361328125, 0.0532073974609375, 0.06269454956054688, 0.07218170166015625, 0.08166885375976562, 0.091156005859375, 0.10064315795898438, 0.11013031005859375, 0.11961746215820312, 0.1291046142578125, 0.13859176635742188, 0.14807891845703125, 0.15756607055664062, 0.16705322265625, 0.17654037475585938, 0.18602752685546875, 0.19551467895507812, 0.2050018310546875, 0.21448898315429688, 0.22397613525390625, 0.23346328735351562, 0.242950439453125, 0.2524375915527344, 0.26192474365234375, 0.2714118957519531, 0.2808990478515625, 0.2903861999511719, 0.29987335205078125, 0.3093605041503906, 0.31884765625]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 14.0, 51.0, 463.0, 411.0, 64.0, 9.0, 4.0], "bins": [-0.220830500125885, -0.2171487957239151, -0.21346710622310638, -0.20978540182113647, -0.20610369741916656, -0.20242200791835785, -0.19874030351638794, -0.19505859911441803, -0.19137690961360931, -0.1876952052116394, -0.1840135157108307, -0.18033181130886078, -0.17665010690689087, -0.17296841740608215, -0.16928671300411224, -0.16560500860214233, -0.16192330420017242, -0.15824159979820251, -0.1545599102973938, -0.1508782058954239, -0.14719650149345398, -0.14351481199264526, -0.13983310759067535, -0.13615140318870544, -0.13246971368789673, -0.12878800928592682, -0.1251063197851181, -0.1214246153831482, -0.11774291843175888, -0.11406121402978897, -0.11037951707839966, -0.10669781267642975, -0.10301612317562103, -0.09933442622423172, -0.09565272182226181, -0.0919710248708725, -0.08828932791948318, -0.08460762351751328, -0.08092592656612396, -0.07724422216415405, -0.07356252521276474, -0.06988082826137543, -0.06619912385940552, -0.0625174269080162, -0.058835726231336594, -0.05515402555465698, -0.05147232860326767, -0.04779062792658806, -0.04410892724990845, -0.040427226573228836, -0.03674552962183952, -0.03306382894515991, -0.0293821282684803, -0.02570042945444584, -0.022018730640411377, -0.018337029963731766, -0.014655332081019878, -0.010973632335662842, -0.0072919330559670925, -0.0036102337762713432, 7.146596908569336e-05, 0.00375316571444273, 0.007434864528477192, 0.011116565205156803, 0.014798264019191265]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 1.0, 4.0, 7.0, 10.0, 8.0, 8.0, 13.0, 17.0, 24.0, 24.0, 33.0, 36.0, 26.0, 42.0, 36.0, 49.0, 47.0, 39.0, 56.0, 49.0, 51.0, 55.0, 43.0, 44.0, 37.0, 33.0, 34.0, 39.0, 24.0, 19.0, 23.0, 25.0, 14.0, 10.0, 8.0, 6.0, 4.0, 7.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01298147439956665, -0.012542663142085075, -0.0121038518846035, -0.011665040627121925, -0.01122622936964035, -0.010787418112158775, -0.0103486068546772, -0.009909795597195625, -0.00947098433971405, -0.009032173082232475, -0.0085933618247509, -0.008154550567269325, -0.00771573930978775, -0.007276928052306175, -0.0068381167948246, -0.006399305537343025, -0.00596049427986145, -0.005521683022379875, -0.0050828717648983, -0.004644060507416725, -0.00420524924993515, -0.003766437992453575, -0.003327626734972, -0.002888815477490425, -0.00245000422000885, -0.002011192962527275, -0.0015723817050457, -0.001133570447564125, -0.00069475919008255, -0.00025594793260097504, 0.00018286332488059998, 0.000621674582362175, 0.00106048583984375, 0.001499297097325325, 0.0019381083548069, 0.002376919612288475, 0.00281573086977005, 0.003254542127251625, 0.0036933533847332, 0.004132164642214775, 0.00457097589969635, 0.005009787157177925, 0.0054485984146595, 0.005887409672141075, 0.00632622092962265, 0.006765032187104225, 0.0072038434445858, 0.007642654702067375, 0.00808146595954895, 0.008520277217030525, 0.0089590884745121, 0.009397899731993675, 0.00983671098947525, 0.010275522246956825, 0.0107143335044384, 0.011153144761919975, 0.01159195601940155, 0.012030767276883125, 0.0124695785343647, 0.012908389791846275, 0.01334720104932785, 0.013786012306809425, 0.014224823564291, 0.014663634821772575, 0.01510244607925415]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 5.0, 5.0, 10.0, 4.0, 10.0, 11.0, 7.0, 20.0, 12.0, 18.0, 13.0, 18.0, 32.0, 25.0, 26.0, 30.0, 31.0, 23.0, 39.0, 34.0, 37.0, 35.0, 44.0, 46.0, 37.0, 45.0, 35.0, 25.0, 34.0, 36.0, 35.0, 25.0, 25.0, 27.0, 26.0, 17.0, 10.0, 22.0, 19.0, 14.0, 4.0, 9.0, 5.0, 8.0, 2.0, 0.0, 5.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-37.96875, -36.81591796875, -35.6630859375, -34.51025390625, -33.357421875, -32.20458984375, -31.0517578125, -29.89892578125, -28.74609375, -27.59326171875, -26.4404296875, -25.28759765625, -24.134765625, -22.98193359375, -21.8291015625, -20.67626953125, -19.5234375, -18.37060546875, -17.2177734375, -16.06494140625, -14.912109375, -13.75927734375, -12.6064453125, -11.45361328125, -10.30078125, -9.14794921875, -7.9951171875, -6.84228515625, -5.689453125, -4.53662109375, -3.3837890625, -2.23095703125, -1.078125, 0.07470703125, 1.2275390625, 2.38037109375, 3.533203125, 4.68603515625, 5.8388671875, 6.99169921875, 8.14453125, 9.29736328125, 10.4501953125, 11.60302734375, 12.755859375, 13.90869140625, 15.0615234375, 16.21435546875, 17.3671875, 18.52001953125, 19.6728515625, 20.82568359375, 21.978515625, 23.13134765625, 24.2841796875, 25.43701171875, 26.58984375, 27.74267578125, 28.8955078125, 30.04833984375, 31.201171875, 32.35400390625, 33.5068359375, 34.65966796875, 35.8125]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 2.0, 6.0, 8.0, 15.0, 28.0, 20.0, 34.0, 42.0, 54.0, 87.0, 140.0, 131.0, 222.0, 269.0, 392.0, 534.0, 688.0, 1075.0, 1435.0, 2146.0, 3291.0, 5122.0, 9000.0, 19208.0, 64079.0, 387403.0, 437002.0, 69812.0, 20580.0, 9405.0, 5442.0, 3360.0, 2241.0, 1453.0, 1076.0, 776.0, 523.0, 369.0, 321.0, 184.0, 168.0, 117.0, 97.0, 55.0, 36.0, 29.0, 20.0, 21.0, 16.0, 15.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0], "bins": [-32.71875, -31.697265625, -30.67578125, -29.654296875, -28.6328125, -27.611328125, -26.58984375, -25.568359375, -24.546875, -23.525390625, -22.50390625, -21.482421875, -20.4609375, -19.439453125, -18.41796875, -17.396484375, -16.375, -15.353515625, -14.33203125, -13.310546875, -12.2890625, -11.267578125, -10.24609375, -9.224609375, -8.203125, -7.181640625, -6.16015625, -5.138671875, -4.1171875, -3.095703125, -2.07421875, -1.052734375, -0.03125, 0.990234375, 2.01171875, 3.033203125, 4.0546875, 5.076171875, 6.09765625, 7.119140625, 8.140625, 9.162109375, 10.18359375, 11.205078125, 12.2265625, 13.248046875, 14.26953125, 15.291015625, 16.3125, 17.333984375, 18.35546875, 19.376953125, 20.3984375, 21.419921875, 22.44140625, 23.462890625, 24.484375, 25.505859375, 26.52734375, 27.548828125, 28.5703125, 29.591796875, 30.61328125, 31.634765625, 32.65625]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 6.0, 4.0, 8.0, 4.0, 6.0, 8.0, 10.0, 18.0, 23.0, 25.0, 31.0, 38.0, 32.0, 34.0, 49.0, 55.0, 52.0, 76.0, 73.0, 360.0, 1578.0, 103.0, 59.0, 37.0, 52.0, 47.0, 40.0, 42.0, 31.0, 20.0, 21.0, 25.0, 13.0, 16.0, 10.0, 10.0, 8.0, 6.0, 6.0, 7.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-153.875, -149.724609375, -145.57421875, -141.423828125, -137.2734375, -133.123046875, -128.97265625, -124.822265625, -120.671875, -116.521484375, -112.37109375, -108.220703125, -104.0703125, -99.919921875, -95.76953125, -91.619140625, -87.46875, -83.318359375, -79.16796875, -75.017578125, -70.8671875, -66.716796875, -62.56640625, -58.416015625, -54.265625, -50.115234375, -45.96484375, -41.814453125, -37.6640625, -33.513671875, -29.36328125, -25.212890625, -21.0625, -16.912109375, -12.76171875, -8.611328125, -4.4609375, -0.310546875, 3.83984375, 7.990234375, 12.140625, 16.291015625, 20.44140625, 24.591796875, 28.7421875, 32.892578125, 37.04296875, 41.193359375, 45.34375, 49.494140625, 53.64453125, 57.794921875, 61.9453125, 66.095703125, 70.24609375, 74.396484375, 78.546875, 82.697265625, 86.84765625, 90.998046875, 95.1484375, 99.298828125, 103.44921875, 107.599609375, 111.75]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 5.0, 9.0, 10.0, 16.0, 9.0, 18.0, 23.0, 35.0, 41.0, 63.0, 68.0, 127.0, 189.0, 420.0, 1523.0, 8626.0, 297282.0, 2822346.0, 11783.0, 1953.0, 481.0, 210.0, 136.0, 99.0, 69.0, 50.0, 26.0, 18.0, 14.0, 8.0, 13.0, 5.0, 11.0, 4.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-416.25, -404.03515625, -391.8203125, -379.60546875, -367.390625, -355.17578125, -342.9609375, -330.74609375, -318.53125, -306.31640625, -294.1015625, -281.88671875, -269.671875, -257.45703125, -245.2421875, -233.02734375, -220.8125, -208.59765625, -196.3828125, -184.16796875, -171.953125, -159.73828125, -147.5234375, -135.30859375, -123.09375, -110.87890625, -98.6640625, -86.44921875, -74.234375, -62.01953125, -49.8046875, -37.58984375, -25.375, -13.16015625, -0.9453125, 11.26953125, 23.484375, 35.69921875, 47.9140625, 60.12890625, 72.34375, 84.55859375, 96.7734375, 108.98828125, 121.203125, 133.41796875, 145.6328125, 157.84765625, 170.0625, 182.27734375, 194.4921875, 206.70703125, 218.921875, 231.13671875, 243.3515625, 255.56640625, 267.78125, 279.99609375, 292.2109375, 304.42578125, 316.640625, 328.85546875, 341.0703125, 353.28515625, 365.5]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 6.0, 7.0, 12.0, 20.0, 39.0, 58.0, 156.0, 185.0, 227.0, 140.0, 78.0, 40.0, 22.0, 18.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-126.31800842285156, -115.85316467285156, -105.38831329345703, -94.9234619140625, -84.4586181640625, -73.9937744140625, -63.52892303466797, -53.06407165527344, -42.59922790527344, -32.13438034057617, -21.669532775878906, -11.20468521118164, -0.739837646484375, 9.72500991821289, 20.189857482910156, 30.654708862304688, 41.11955261230469, 51.58440017700195, 62.04924774169922, 72.51409912109375, 82.97894287109375, 93.44378662109375, 103.90863800048828, 114.37348937988281, 124.83833312988281, 135.3031768798828, 145.76803588867188, 156.23287963867188, 166.69772338867188, 177.16256713867188, 187.62741088867188, 198.09226989746094, 208.55712890625, 219.02197265625, 229.48681640625, 239.95167541503906, 250.41651916503906, 260.8813781738281, 271.3462219238281, 281.8110656738281, 292.2759094238281, 302.7407531738281, 313.2055969238281, 323.6704406738281, 334.13531494140625, 344.60015869140625, 355.06500244140625, 365.52984619140625, 375.99468994140625, 386.45953369140625, 396.92437744140625, 407.38922119140625, 417.85406494140625, 428.3189392089844, 438.7837829589844, 449.2486267089844, 459.7134704589844, 470.1783142089844, 480.6431579589844, 491.1080017089844, 501.5728759765625, 512.0377197265625, 522.5025634765625, 532.9674072265625, 543.4322509765625]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 6.0, 2.0, 6.0, 8.0, 9.0, 10.0, 16.0, 8.0, 13.0, 21.0, 23.0, 18.0, 23.0, 29.0, 28.0, 31.0, 45.0, 49.0, 49.0, 45.0, 40.0, 40.0, 42.0, 38.0, 38.0, 50.0, 33.0, 29.0, 37.0, 33.0, 26.0, 29.0, 21.0, 24.0, 23.0, 13.0, 8.0, 7.0, 10.0, 10.0, 3.0, 4.0, 2.0, 4.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-312.5811767578125, -300.86993408203125, -289.15869140625, -277.44744873046875, -265.7362060546875, -254.0249786376953, -242.31375122070312, -230.60250854492188, -218.89126586914062, -207.18002319335938, -195.46878051757812, -183.75755310058594, -172.0463104248047, -160.33506774902344, -148.62384033203125, -136.91259765625, -125.20135498046875, -113.4901123046875, -101.77887725830078, -90.06764221191406, -78.35639953613281, -66.64515686035156, -54.933921813964844, -43.222686767578125, -31.511444091796875, -19.80020523071289, -8.088966369628906, 3.622272491455078, 15.333511352539062, 27.044750213623047, 38.75598907470703, 50.46722412109375, 62.178466796875, 73.88970947265625, 85.60094451904297, 97.31217956542969, 109.02342224121094, 120.73466491699219, 132.44589233398438, 144.15713500976562, 155.86837768554688, 167.57962036132812, 179.29086303710938, 191.00209045410156, 202.7133331298828, 214.42457580566406, 226.13580322265625, 237.8470458984375, 249.55828857421875, 261.26953125, 272.98077392578125, 284.6920166015625, 296.40325927734375, 308.1144714355469, 319.8257141113281, 331.5369567871094, 343.2481994628906, 354.9594421386719, 366.6706848144531, 378.3819274902344, 390.0931396484375, 401.80438232421875, 413.515625, 425.22686767578125, 436.9381103515625]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 9.0, 2.0, 7.0, 6.0, 13.0, 9.0, 10.0, 8.0, 19.0, 13.0, 18.0, 16.0, 20.0, 38.0, 22.0, 23.0, 30.0, 31.0, 46.0, 40.0, 38.0, 37.0, 39.0, 33.0, 51.0, 38.0, 38.0, 32.0, 35.0, 40.0, 30.0, 30.0, 28.0, 27.0, 21.0, 18.0, 15.0, 9.0, 17.0, 12.0, 13.0, 5.0, 4.0, 10.0, 3.0, 0.0, 3.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-41.15625, -39.90966796875, -38.6630859375, -37.41650390625, -36.169921875, -34.92333984375, -33.6767578125, -32.43017578125, -31.18359375, -29.93701171875, -28.6904296875, -27.44384765625, -26.197265625, -24.95068359375, -23.7041015625, -22.45751953125, -21.2109375, -19.96435546875, -18.7177734375, -17.47119140625, -16.224609375, -14.97802734375, -13.7314453125, -12.48486328125, -11.23828125, -9.99169921875, -8.7451171875, -7.49853515625, -6.251953125, -5.00537109375, -3.7587890625, -2.51220703125, -1.265625, -0.01904296875, 1.2275390625, 2.47412109375, 3.720703125, 4.96728515625, 6.2138671875, 7.46044921875, 8.70703125, 9.95361328125, 11.2001953125, 12.44677734375, 13.693359375, 14.93994140625, 16.1865234375, 17.43310546875, 18.6796875, 19.92626953125, 21.1728515625, 22.41943359375, 23.666015625, 24.91259765625, 26.1591796875, 27.40576171875, 28.65234375, 29.89892578125, 31.1455078125, 32.39208984375, 33.638671875, 34.88525390625, 36.1318359375, 37.37841796875, 38.625]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 7.0, 5.0, 8.0, 9.0, 14.0, 11.0, 18.0, 20.0, 26.0, 44.0, 53.0, 78.0, 142.0, 206.0, 286.0, 506.0, 783.0, 1494.0, 2898.0, 6436.0, 17677.0, 339433.0, 3621109.0, 177573.0, 14699.0, 5399.0, 2372.0, 1234.0, 670.0, 379.0, 241.0, 137.0, 97.0, 57.0, 42.0, 24.0, 25.0, 14.0, 19.0, 13.0, 4.0, 5.0, 9.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-158.375, -153.634765625, -148.89453125, -144.154296875, -139.4140625, -134.673828125, -129.93359375, -125.193359375, -120.453125, -115.712890625, -110.97265625, -106.232421875, -101.4921875, -96.751953125, -92.01171875, -87.271484375, -82.53125, -77.791015625, -73.05078125, -68.310546875, -63.5703125, -58.830078125, -54.08984375, -49.349609375, -44.609375, -39.869140625, -35.12890625, -30.388671875, -25.6484375, -20.908203125, -16.16796875, -11.427734375, -6.6875, -1.947265625, 2.79296875, 7.533203125, 12.2734375, 17.013671875, 21.75390625, 26.494140625, 31.234375, 35.974609375, 40.71484375, 45.455078125, 50.1953125, 54.935546875, 59.67578125, 64.416015625, 69.15625, 73.896484375, 78.63671875, 83.376953125, 88.1171875, 92.857421875, 97.59765625, 102.337890625, 107.078125, 111.818359375, 116.55859375, 121.298828125, 126.0390625, 130.779296875, 135.51953125, 140.259765625, 145.0]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 4.0, 3.0, 7.0, 1.0, 6.0, 7.0, 8.0, 9.0, 16.0, 8.0, 19.0, 23.0, 26.0, 34.0, 38.0, 76.0, 157.0, 311.0, 663.0, 941.0, 781.0, 384.0, 224.0, 99.0, 58.0, 36.0, 25.0, 20.0, 21.0, 16.0, 14.0, 9.0, 6.0, 6.0, 2.0, 4.0, 2.0, 0.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-75.4375, -72.6083984375, -69.779296875, -66.9501953125, -64.12109375, -61.2919921875, -58.462890625, -55.6337890625, -52.8046875, -49.9755859375, -47.146484375, -44.3173828125, -41.48828125, -38.6591796875, -35.830078125, -33.0009765625, -30.171875, -27.3427734375, -24.513671875, -21.6845703125, -18.85546875, -16.0263671875, -13.197265625, -10.3681640625, -7.5390625, -4.7099609375, -1.880859375, 0.9482421875, 3.77734375, 6.6064453125, 9.435546875, 12.2646484375, 15.09375, 17.9228515625, 20.751953125, 23.5810546875, 26.41015625, 29.2392578125, 32.068359375, 34.8974609375, 37.7265625, 40.5556640625, 43.384765625, 46.2138671875, 49.04296875, 51.8720703125, 54.701171875, 57.5302734375, 60.359375, 63.1884765625, 66.017578125, 68.8466796875, 71.67578125, 74.5048828125, 77.333984375, 80.1630859375, 82.9921875, 85.8212890625, 88.650390625, 91.4794921875, 94.30859375, 97.1376953125, 99.966796875, 102.7958984375, 105.625]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 2.0, 2.0, 7.0, 17.0, 12.0, 17.0, 29.0, 59.0, 117.0, 255.0, 512.0, 1196.0, 3126.0, 9439.0, 37184.0, 887756.0, 3183914.0, 52289.0, 11761.0, 3899.0, 1491.0, 593.0, 265.0, 141.0, 66.0, 35.0, 21.0, 18.0, 15.0, 5.0, 4.0, 4.0, 6.0, 4.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-283.75, -276.1015625, -268.453125, -260.8046875, -253.15625, -245.5078125, -237.859375, -230.2109375, -222.5625, -214.9140625, -207.265625, -199.6171875, -191.96875, -184.3203125, -176.671875, -169.0234375, -161.375, -153.7265625, -146.078125, -138.4296875, -130.78125, -123.1328125, -115.484375, -107.8359375, -100.1875, -92.5390625, -84.890625, -77.2421875, -69.59375, -61.9453125, -54.296875, -46.6484375, -39.0, -31.3515625, -23.703125, -16.0546875, -8.40625, -0.7578125, 6.890625, 14.5390625, 22.1875, 29.8359375, 37.484375, 45.1328125, 52.78125, 60.4296875, 68.078125, 75.7265625, 83.375, 91.0234375, 98.671875, 106.3203125, 113.96875, 121.6171875, 129.265625, 136.9140625, 144.5625, 152.2109375, 159.859375, 167.5078125, 175.15625, 182.8046875, 190.453125, 198.1015625, 205.75]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 15.0, 13.0, 30.0, 62.0, 112.0, 219.0, 273.0, 145.0, 67.0, 26.0, 16.0, 8.0, 7.0, 3.0, 6.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-453.4952087402344, -429.783447265625, -406.07171630859375, -382.3599853515625, -358.6482238769531, -334.93646240234375, -311.2247314453125, -287.51300048828125, -263.8012390136719, -240.08949279785156, -216.37774658203125, -192.66600036621094, -168.95425415039062, -145.2425079345703, -121.53076171875, -97.81901550292969, -74.10726928710938, -50.39552307128906, -26.68377685546875, -2.9720306396484375, 20.739715576171875, 44.45146179199219, 68.1632080078125, 91.87495422363281, 115.58670043945312, 139.29844665527344, 163.01019287109375, 186.72193908691406, 210.43368530273438, 234.1454315185547, 257.857177734375, 281.56890869140625, 305.2806396484375, 328.99237060546875, 352.7041320800781, 376.4158935546875, 400.12762451171875, 423.83935546875, 447.5511169433594, 471.26287841796875, 494.974609375, 518.6863403320312, 542.3980712890625, 566.10986328125, 589.8215942382812, 613.5333251953125, 637.2451171875, 660.9568481445312, 684.6685791015625, 708.3803100585938, 732.092041015625, 755.8038330078125, 779.5155639648438, 803.227294921875, 826.9390869140625, 850.6508178710938, 874.362548828125, 898.0742797851562, 921.7860107421875, 945.497802734375, 969.2095336914062, 992.9212646484375, 1016.633056640625, 1040.3447265625, 1064.0565185546875]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 5.0, 7.0, 3.0, 9.0, 4.0, 4.0, 4.0, 11.0, 17.0, 18.0, 22.0, 12.0, 27.0, 21.0, 16.0, 26.0, 37.0, 33.0, 34.0, 38.0, 42.0, 41.0, 33.0, 46.0, 25.0, 37.0, 37.0, 38.0, 35.0, 34.0, 33.0, 29.0, 24.0, 27.0, 25.0, 15.0, 15.0, 14.0, 21.0, 16.0, 10.0, 10.0, 5.0, 16.0, 3.0, 5.0, 7.0, 3.0, 6.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-201.67822265625, -194.50619506835938, -187.33416748046875, -180.16213989257812, -172.9901123046875, -165.81808471679688, -158.64605712890625, -151.47402954101562, -144.302001953125, -137.12997436523438, -129.95794677734375, -122.78591918945312, -115.6138916015625, -108.44186401367188, -101.26984405517578, -94.09781646728516, -86.92579650878906, -79.75376892089844, -72.58174133300781, -65.40971374511719, -58.23768997192383, -51.0656623840332, -43.893638610839844, -36.72161102294922, -29.549583435058594, -22.37755584716797, -15.205530166625977, -8.033504486083984, -0.8614768981933594, 6.310550689697266, 13.482574462890625, 20.65460205078125, 27.826629638671875, 34.9986572265625, 42.170684814453125, 49.342708587646484, 56.51473617553711, 63.686763763427734, 70.8587875366211, 78.03081512451172, 85.20284271240234, 92.37487030029297, 99.5468978881836, 106.71891784667969, 113.89094543457031, 121.06297302246094, 128.23500061035156, 135.4070281982422, 142.5790557861328, 149.75108337402344, 156.92311096191406, 164.0951385498047, 171.2671661376953, 178.43919372558594, 185.6112060546875, 192.78323364257812, 199.95526123046875, 207.12728881835938, 214.29931640625, 221.47134399414062, 228.64337158203125, 235.81539916992188, 242.9874267578125, 250.15945434570312, 257.33148193359375]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 3.0, 6.0, 8.0, 8.0, 12.0, 7.0, 12.0, 20.0, 14.0, 17.0, 33.0, 17.0, 21.0, 32.0, 47.0, 34.0, 35.0, 35.0, 54.0, 53.0, 40.0, 40.0, 39.0, 39.0, 45.0, 33.0, 36.0, 42.0, 27.0, 20.0, 27.0, 20.0, 30.0, 19.0, 11.0, 19.0, 8.0, 8.0, 6.0, 8.0, 7.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.65625, -40.3125, -38.96875, -37.625, -36.28125, -34.9375, -33.59375, -32.25, -30.90625, -29.5625, -28.21875, -26.875, -25.53125, -24.1875, -22.84375, -21.5, -20.15625, -18.8125, -17.46875, -16.125, -14.78125, -13.4375, -12.09375, -10.75, -9.40625, -8.0625, -6.71875, -5.375, -4.03125, -2.6875, -1.34375, 0.0, 1.34375, 2.6875, 4.03125, 5.375, 6.71875, 8.0625, 9.40625, 10.75, 12.09375, 13.4375, 14.78125, 16.125, 17.46875, 18.8125, 20.15625, 21.5, 22.84375, 24.1875, 25.53125, 26.875, 28.21875, 29.5625, 30.90625, 32.25, 33.59375, 34.9375, 36.28125, 37.625, 38.96875, 40.3125, 41.65625, 43.0, 44.34375]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 9.0, 7.0, 13.0, 18.0, 40.0, 56.0, 72.0, 100.0, 188.0, 254.0, 408.0, 600.0, 955.0, 1429.0, 2124.0, 3193.0, 4885.0, 7631.0, 11363.0, 18204.0, 28725.0, 46942.0, 81079.0, 152183.0, 263424.0, 184616.0, 95283.0, 54125.0, 32682.0, 20405.0, 12951.0, 8398.0, 5440.0, 3670.0, 2420.0, 1571.0, 1092.0, 679.0, 440.0, 317.0, 183.0, 133.0, 88.0, 55.0, 45.0, 25.0, 14.0, 9.0, 10.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.103515625, -2.0390625, -1.974609375, -1.91015625, -1.845703125, -1.78125, -1.716796875, -1.65234375, -1.587890625, -1.5234375, -1.458984375, -1.39453125, -1.330078125, -1.265625, -1.201171875, -1.13671875, -1.072265625, -1.0078125, -0.943359375, -0.87890625, -0.814453125, -0.75, -0.685546875, -0.62109375, -0.556640625, -0.4921875, -0.427734375, -0.36328125, -0.298828125, -0.234375, -0.169921875, -0.10546875, -0.041015625, 0.0234375, 0.087890625, 0.15234375, 0.216796875, 0.28125, 0.345703125, 0.41015625, 0.474609375, 0.5390625, 0.603515625, 0.66796875, 0.732421875, 0.796875, 0.861328125, 0.92578125, 0.990234375, 1.0546875, 1.119140625, 1.18359375, 1.248046875, 1.3125, 1.376953125, 1.44140625, 1.505859375, 1.5703125, 1.634765625, 1.69921875, 1.763671875, 1.828125, 1.892578125, 1.95703125, 2.021484375]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 6.0, 6.0, 4.0, 7.0, 6.0, 18.0, 14.0, 17.0, 21.0, 21.0, 29.0, 24.0, 30.0, 27.0, 36.0, 35.0, 35.0, 38.0, 46.0, 35.0, 1079.0, 52.0, 48.0, 52.0, 45.0, 41.0, 33.0, 33.0, 30.0, 24.0, 32.0, 22.0, 19.0, 20.0, 15.0, 8.0, 9.0, 8.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-33.875, -32.9111328125, -31.947265625, -30.9833984375, -30.01953125, -29.0556640625, -28.091796875, -27.1279296875, -26.1640625, -25.2001953125, -24.236328125, -23.2724609375, -22.30859375, -21.3447265625, -20.380859375, -19.4169921875, -18.453125, -17.4892578125, -16.525390625, -15.5615234375, -14.59765625, -13.6337890625, -12.669921875, -11.7060546875, -10.7421875, -9.7783203125, -8.814453125, -7.8505859375, -6.88671875, -5.9228515625, -4.958984375, -3.9951171875, -3.03125, -2.0673828125, -1.103515625, -0.1396484375, 0.82421875, 1.7880859375, 2.751953125, 3.7158203125, 4.6796875, 5.6435546875, 6.607421875, 7.5712890625, 8.53515625, 9.4990234375, 10.462890625, 11.4267578125, 12.390625, 13.3544921875, 14.318359375, 15.2822265625, 16.24609375, 17.2099609375, 18.173828125, 19.1376953125, 20.1015625, 21.0654296875, 22.029296875, 22.9931640625, 23.95703125, 24.9208984375, 25.884765625, 26.8486328125, 27.8125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 8.0, 9.0, 6.0, 16.0, 17.0, 25.0, 38.0, 45.0, 79.0, 118.0, 198.0, 272.0, 436.0, 705.0, 1176.0, 1915.0, 3347.0, 5663.0, 10158.0, 18011.0, 32771.0, 62186.0, 136582.0, 1378053.0, 245368.0, 94487.0, 46788.0, 25194.0, 14037.0, 8060.0, 4569.0, 2569.0, 1588.0, 981.0, 578.0, 373.0, 237.0, 148.0, 105.0, 72.0, 47.0, 33.0, 24.0, 12.0, 9.0, 12.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.853515625, -2.771484375, -2.689453125, -2.607421875, -2.525390625, -2.443359375, -2.361328125, -2.279296875, -2.197265625, -2.115234375, -2.033203125, -1.951171875, -1.869140625, -1.787109375, -1.705078125, -1.623046875, -1.541015625, -1.458984375, -1.376953125, -1.294921875, -1.212890625, -1.130859375, -1.048828125, -0.966796875, -0.884765625, -0.802734375, -0.720703125, -0.638671875, -0.556640625, -0.474609375, -0.392578125, -0.310546875, -0.228515625, -0.146484375, -0.064453125, 0.017578125, 0.099609375, 0.181640625, 0.263671875, 0.345703125, 0.427734375, 0.509765625, 0.591796875, 0.673828125, 0.755859375, 0.837890625, 0.919921875, 1.001953125, 1.083984375, 1.166015625, 1.248046875, 1.330078125, 1.412109375, 1.494140625, 1.576171875, 1.658203125, 1.740234375, 1.822265625, 1.904296875, 1.986328125, 2.068359375, 2.150390625, 2.232421875, 2.314453125, 2.396484375]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 3.0, 5.0, 4.0, 4.0, 2.0, 4.0, 3.0, 4.0, 6.0, 12.0, 6.0, 16.0, 18.0, 9.0, 15.0, 19.0, 26.0, 35.0, 59.0, 78.0, 93.0, 101.0, 86.0, 87.0, 52.0, 53.0, 35.0, 17.0, 30.0, 13.0, 17.0, 14.0, 14.0, 7.0, 5.0, 6.0, 7.0, 5.0, 10.0, 7.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.0289154052734375, -0.02808070182800293, -0.02724599838256836, -0.02641129493713379, -0.02557659149169922, -0.02474188804626465, -0.023907184600830078, -0.023072481155395508, -0.022237777709960938, -0.021403074264526367, -0.020568370819091797, -0.019733667373657227, -0.018898963928222656, -0.018064260482788086, -0.017229557037353516, -0.016394853591918945, -0.015560150146484375, -0.014725446701049805, -0.013890743255615234, -0.013056039810180664, -0.012221336364746094, -0.011386632919311523, -0.010551929473876953, -0.009717226028442383, -0.008882522583007812, -0.008047819137573242, -0.007213115692138672, -0.0063784122467041016, -0.005543708801269531, -0.004709005355834961, -0.0038743019104003906, -0.0030395984649658203, -0.00220489501953125, -0.0013701915740966797, -0.0005354881286621094, 0.00029921531677246094, 0.0011339187622070312, 0.0019686222076416016, 0.002803325653076172, 0.003638029098510742, 0.0044727325439453125, 0.005307435989379883, 0.006142139434814453, 0.0069768428802490234, 0.007811546325683594, 0.008646249771118164, 0.009480953216552734, 0.010315656661987305, 0.011150360107421875, 0.011985063552856445, 0.012819766998291016, 0.013654470443725586, 0.014489173889160156, 0.015323877334594727, 0.016158580780029297, 0.016993284225463867, 0.017827987670898438, 0.018662691116333008, 0.019497394561767578, 0.02033209800720215, 0.02116680145263672, 0.02200150489807129, 0.02283620834350586, 0.02367091178894043, 0.024505615234375]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 7.0, 10.0, 11.0, 7.0, 14.0, 9.0, 11.0, 22.0, 25.0, 15.0, 33.0, 41.0, 59.0, 70.0, 120.0, 253.0, 1030.0, 10481.0, 814777.0, 213919.0, 6295.0, 729.0, 220.0, 97.0, 59.0, 46.0, 28.0, 22.0, 23.0, 14.0, 17.0, 15.0, 12.0, 8.0, 12.0, 3.0, 5.0, 8.0, 6.0, 5.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.403076171875, -0.389129638671875, -0.37518310546875, -0.361236572265625, -0.3472900390625, -0.333343505859375, -0.31939697265625, -0.305450439453125, -0.29150390625, -0.277557373046875, -0.26361083984375, -0.249664306640625, -0.2357177734375, -0.221771240234375, -0.20782470703125, -0.193878173828125, -0.179931640625, -0.165985107421875, -0.15203857421875, -0.138092041015625, -0.1241455078125, -0.110198974609375, -0.09625244140625, -0.082305908203125, -0.068359375, -0.054412841796875, -0.04046630859375, -0.026519775390625, -0.0125732421875, 0.001373291015625, 0.01531982421875, 0.029266357421875, 0.043212890625, 0.057159423828125, 0.07110595703125, 0.085052490234375, 0.0989990234375, 0.112945556640625, 0.12689208984375, 0.140838623046875, 0.15478515625, 0.168731689453125, 0.18267822265625, 0.196624755859375, 0.2105712890625, 0.224517822265625, 0.23846435546875, 0.252410888671875, 0.266357421875, 0.280303955078125, 0.29425048828125, 0.308197021484375, 0.3221435546875, 0.336090087890625, 0.35003662109375, 0.363983154296875, 0.3779296875, 0.391876220703125, 0.40582275390625, 0.419769287109375, 0.4337158203125, 0.447662353515625, 0.46160888671875, 0.475555419921875, 0.489501953125]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 9.0, 473.0, 530.0, 5.0], "bins": [-0.5342034101486206, -0.5255879163742065, -0.5169724225997925, -0.5083569288253784, -0.49974146485328674, -0.4911259710788727, -0.482510507106781, -0.47389501333236694, -0.4652795195579529, -0.4566640257835388, -0.44804853200912476, -0.4394330680370331, -0.430817574262619, -0.42220208048820496, -0.4135866165161133, -0.4049711227416992, -0.39635562896728516, -0.3877401351928711, -0.37912464141845703, -0.37050917744636536, -0.3618936836719513, -0.35327818989753723, -0.34466272592544556, -0.3360472321510315, -0.32743173837661743, -0.31881624460220337, -0.3102007508277893, -0.30158528685569763, -0.29296979308128357, -0.2843542993068695, -0.27573883533477783, -0.26712334156036377, -0.2585078775882721, -0.24989238381385803, -0.24127690494060516, -0.2326614260673523, -0.22404593229293823, -0.21543043851852417, -0.2068149596452713, -0.19819948077201843, -0.18958397209644318, -0.1809684932231903, -0.17235299944877625, -0.16373750567436218, -0.15512202680110931, -0.14650654792785645, -0.13789105415344238, -0.12927556037902832, -0.12066008150577545, -0.11204459518194199, -0.10342910885810852, -0.09481362253427505, -0.08619813621044159, -0.07758264988660812, -0.06896716356277466, -0.06035167723894119, -0.05173619091510773, -0.04312070459127426, -0.034505218267440796, -0.02588973194360733, -0.017274245619773865, -0.0086587592959404, -4.3272972106933594e-05, 0.008572213351726532, 0.01718769781291485]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 12.0, 15.0, 13.0, 14.0, 33.0, 33.0, 49.0, 61.0, 65.0, 57.0, 63.0, 82.0, 55.0, 71.0, 69.0, 52.0, 47.0, 51.0, 38.0, 30.0, 23.0, 19.0, 14.0, 12.0, 7.0, 6.0, 5.0, 1.0, 6.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01769155263900757, -0.01692652888596058, -0.01616150513291359, -0.0153964813798666, -0.01463145762681961, -0.013866433873772621, -0.013101410120725632, -0.012336386367678642, -0.011571362614631653, -0.010806338861584663, -0.010041315108537674, -0.009276291355490685, -0.008511267602443695, -0.007746243849396706, -0.006981220096349716, -0.006216196343302727, -0.005451172590255737, -0.004686148837208748, -0.003921125084161758, -0.003156101331114769, -0.0023910775780677795, -0.00162605382502079, -0.0008610300719738007, -9.600631892681122e-05, 0.0006690174341201782, 0.0014340411871671677, 0.002199064940214157, 0.0029640886932611465, 0.003729112446308136, 0.004494136199355125, 0.005259159952402115, 0.006024183705449104, 0.006789207458496094, 0.007554231211543083, 0.008319254964590073, 0.009084278717637062, 0.009849302470684052, 0.010614326223731041, 0.01137934997677803, 0.01214437372982502, 0.01290939748287201, 0.013674421235918999, 0.014439444988965988, 0.015204468742012978, 0.015969492495059967, 0.016734516248106956, 0.017499540001153946, 0.018264563754200935, 0.019029587507247925, 0.019794611260294914, 0.020559635013341904, 0.021324658766388893, 0.022089682519435883, 0.022854706272482872, 0.02361973002552986, 0.02438475377857685, 0.02514977753162384, 0.02591480128467083, 0.02667982503771782, 0.02744484879076481, 0.028209872543811798, 0.028974896296858788, 0.029739920049905777, 0.030504943802952766, 0.031269967555999756]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 3.0, 6.0, 8.0, 8.0, 12.0, 7.0, 12.0, 20.0, 14.0, 17.0, 33.0, 17.0, 21.0, 32.0, 47.0, 34.0, 35.0, 35.0, 54.0, 53.0, 40.0, 40.0, 39.0, 38.0, 46.0, 33.0, 36.0, 42.0, 27.0, 20.0, 27.0, 20.0, 30.0, 19.0, 11.0, 19.0, 8.0, 8.0, 6.0, 8.0, 7.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.65625, -40.3125, -38.96875, -37.625, -36.28125, -34.9375, -33.59375, -32.25, -30.90625, -29.5625, -28.21875, -26.875, -25.53125, -24.1875, -22.84375, -21.5, -20.15625, -18.8125, -17.46875, -16.125, -14.78125, -13.4375, -12.09375, -10.75, -9.40625, -8.0625, -6.71875, -5.375, -4.03125, -2.6875, -1.34375, 0.0, 1.34375, 2.6875, 4.03125, 5.375, 6.71875, 8.0625, 9.40625, 10.75, 12.09375, 13.4375, 14.78125, 16.125, 17.46875, 18.8125, 20.15625, 21.5, 22.84375, 24.1875, 25.53125, 26.875, 28.21875, 29.5625, 30.90625, 32.25, 33.59375, 34.9375, 36.28125, 37.625, 38.96875, 40.3125, 41.65625, 43.0, 44.34375]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 4.0, 3.0, 4.0, 8.0, 6.0, 11.0, 18.0, 17.0, 23.0, 41.0, 43.0, 47.0, 85.0, 110.0, 151.0, 161.0, 263.0, 356.0, 509.0, 694.0, 958.0, 1473.0, 2065.0, 3256.0, 4960.0, 8238.0, 17341.0, 63448.0, 635039.0, 242740.0, 34467.0, 12441.0, 6603.0, 4164.0, 2676.0, 1808.0, 1257.0, 812.0, 647.0, 444.0, 311.0, 198.0, 157.0, 126.0, 102.0, 76.0, 51.0, 47.0, 34.0, 18.0, 9.0, 20.0, 8.0, 7.0, 6.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0], "bins": [-42.40625, -41.07275390625, -39.7392578125, -38.40576171875, -37.072265625, -35.73876953125, -34.4052734375, -33.07177734375, -31.73828125, -30.40478515625, -29.0712890625, -27.73779296875, -26.404296875, -25.07080078125, -23.7373046875, -22.40380859375, -21.0703125, -19.73681640625, -18.4033203125, -17.06982421875, -15.736328125, -14.40283203125, -13.0693359375, -11.73583984375, -10.40234375, -9.06884765625, -7.7353515625, -6.40185546875, -5.068359375, -3.73486328125, -2.4013671875, -1.06787109375, 0.265625, 1.59912109375, 2.9326171875, 4.26611328125, 5.599609375, 6.93310546875, 8.2666015625, 9.60009765625, 10.93359375, 12.26708984375, 13.6005859375, 14.93408203125, 16.267578125, 17.60107421875, 18.9345703125, 20.26806640625, 21.6015625, 22.93505859375, 24.2685546875, 25.60205078125, 26.935546875, 28.26904296875, 29.6025390625, 30.93603515625, 32.26953125, 33.60302734375, 34.9365234375, 36.27001953125, 37.603515625, 38.93701171875, 40.2705078125, 41.60400390625, 42.9375]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 6.0, 7.0, 7.0, 7.0, 10.0, 11.0, 21.0, 22.0, 35.0, 29.0, 34.0, 43.0, 29.0, 41.0, 45.0, 52.0, 60.0, 88.0, 1733.0, 252.0, 78.0, 58.0, 45.0, 53.0, 54.0, 33.0, 29.0, 34.0, 23.0, 12.0, 14.0, 12.0, 24.0, 7.0, 5.0, 7.0, 4.0, 4.0, 6.0, 6.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-138.75, -134.525390625, -130.30078125, -126.076171875, -121.8515625, -117.626953125, -113.40234375, -109.177734375, -104.953125, -100.728515625, -96.50390625, -92.279296875, -88.0546875, -83.830078125, -79.60546875, -75.380859375, -71.15625, -66.931640625, -62.70703125, -58.482421875, -54.2578125, -50.033203125, -45.80859375, -41.583984375, -37.359375, -33.134765625, -28.91015625, -24.685546875, -20.4609375, -16.236328125, -12.01171875, -7.787109375, -3.5625, 0.662109375, 4.88671875, 9.111328125, 13.3359375, 17.560546875, 21.78515625, 26.009765625, 30.234375, 34.458984375, 38.68359375, 42.908203125, 47.1328125, 51.357421875, 55.58203125, 59.806640625, 64.03125, 68.255859375, 72.48046875, 76.705078125, 80.9296875, 85.154296875, 89.37890625, 93.603515625, 97.828125, 102.052734375, 106.27734375, 110.501953125, 114.7265625, 118.951171875, 123.17578125, 127.400390625, 131.625]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 3.0, 13.0, 10.0, 21.0, 29.0, 32.0, 70.0, 92.0, 151.0, 360.0, 1429.0, 19687.0, 3112163.0, 9813.0, 1063.0, 325.0, 171.0, 114.0, 54.0, 32.0, 25.0, 15.0, 8.0, 5.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-570.0, -550.6171875, -531.234375, -511.8515625, -492.46875, -473.0859375, -453.703125, -434.3203125, -414.9375, -395.5546875, -376.171875, -356.7890625, -337.40625, -318.0234375, -298.640625, -279.2578125, -259.875, -240.4921875, -221.109375, -201.7265625, -182.34375, -162.9609375, -143.578125, -124.1953125, -104.8125, -85.4296875, -66.046875, -46.6640625, -27.28125, -7.8984375, 11.484375, 30.8671875, 50.25, 69.6328125, 89.015625, 108.3984375, 127.78125, 147.1640625, 166.546875, 185.9296875, 205.3125, 224.6953125, 244.078125, 263.4609375, 282.84375, 302.2265625, 321.609375, 340.9921875, 360.375, 379.7578125, 399.140625, 418.5234375, 437.90625, 457.2890625, 476.671875, 496.0546875, 515.4375, 534.8203125, 554.203125, 573.5859375, 592.96875, 612.3515625, 631.734375, 651.1171875, 670.5]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 563.0, 448.0, 3.0], "bins": [-5059.2060546875, -4977.53857421875, -4895.87109375, -4814.20361328125, -4732.53564453125, -4650.8681640625, -4569.20068359375, -4487.533203125, -4405.86572265625, -4324.1982421875, -4242.53076171875, -4160.86328125, -4079.195556640625, -3997.528076171875, -3915.8603515625, -3834.19287109375, -3752.525390625, -3670.85791015625, -3589.190185546875, -3507.522705078125, -3425.855224609375, -3344.187744140625, -3262.52001953125, -3180.8525390625, -3099.184814453125, -3017.517333984375, -2935.849609375, -2854.18212890625, -2772.5146484375, -2690.84716796875, -2609.179443359375, -2527.511962890625, -2445.844482421875, -2364.177001953125, -2282.50927734375, -2200.841796875, -2119.17431640625, -2037.5067138671875, -1955.839111328125, -1874.171630859375, -1792.504150390625, -1710.8365478515625, -1629.1690673828125, -1547.50146484375, -1465.833984375, -1384.1663818359375, -1302.498779296875, -1220.831298828125, -1139.1636962890625, -1057.49609375, -975.82861328125, -894.1610107421875, -812.4935302734375, -730.825927734375, -649.1583862304688, -567.4908447265625, -485.8233642578125, -404.15582275390625, -322.48828125, -240.82070922851562, -159.15316772460938, -77.48562622070312, 4.18194580078125, 85.8494873046875, 167.5170440673828]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 6.0, 5.0, 6.0, 5.0, 14.0, 10.0, 13.0, 10.0, 16.0, 25.0, 18.0, 28.0, 25.0, 26.0, 27.0, 29.0, 26.0, 39.0, 43.0, 45.0, 42.0, 46.0, 42.0, 47.0, 37.0, 38.0, 36.0, 39.0, 38.0, 25.0, 24.0, 29.0, 17.0, 22.0, 20.0, 15.0, 14.0, 13.0, 9.0, 9.0, 4.0, 5.0, 7.0, 2.0, 3.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-334.1227111816406, -323.0453796386719, -311.96807861328125, -300.8907470703125, -289.81341552734375, -278.7361145019531, -267.6587829589844, -256.58148193359375, -245.504150390625, -234.4268341064453, -223.34951782226562, -212.27218627929688, -201.1948699951172, -190.1175537109375, -179.04022216796875, -167.96290588378906, -156.88558959960938, -145.8082733154297, -134.73095703125, -123.65362548828125, -112.57630920410156, -101.49899291992188, -90.42166900634766, -79.34434509277344, -68.26702880859375, -57.1897087097168, -46.112388610839844, -35.03506851196289, -23.957748413085938, -12.880428314208984, -1.8031082153320312, 9.274215698242188, 20.351531982421875, 31.428852081298828, 42.50617218017578, 53.583492279052734, 64.66081237792969, 75.73812866210938, 86.8154525756836, 97.89277648925781, 108.9700927734375, 120.04740905761719, 131.12472534179688, 142.20205688476562, 153.2793731689453, 164.356689453125, 175.43402099609375, 186.51133728027344, 197.58865356445312, 208.6659698486328, 219.7432861328125, 230.82061767578125, 241.89793395996094, 252.97525024414062, 264.0525817871094, 275.1298828125, 286.20721435546875, 297.2845458984375, 308.3618469238281, 319.4391784667969, 330.5164794921875, 341.59381103515625, 352.671142578125, 363.74847412109375, 374.8257751464844]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 4.0, 0.0, 2.0, 4.0, 6.0, 4.0, 6.0, 7.0, 9.0, 9.0, 12.0, 21.0, 9.0, 15.0, 24.0, 23.0, 23.0, 26.0, 25.0, 39.0, 40.0, 30.0, 45.0, 48.0, 38.0, 36.0, 47.0, 46.0, 38.0, 42.0, 36.0, 36.0, 34.0, 28.0, 16.0, 21.0, 22.0, 29.0, 25.0, 14.0, 16.0, 12.0, 13.0, 7.0, 8.0, 5.0, 4.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-40.625, -39.2724609375, -37.919921875, -36.5673828125, -35.21484375, -33.8623046875, -32.509765625, -31.1572265625, -29.8046875, -28.4521484375, -27.099609375, -25.7470703125, -24.39453125, -23.0419921875, -21.689453125, -20.3369140625, -18.984375, -17.6318359375, -16.279296875, -14.9267578125, -13.57421875, -12.2216796875, -10.869140625, -9.5166015625, -8.1640625, -6.8115234375, -5.458984375, -4.1064453125, -2.75390625, -1.4013671875, -0.048828125, 1.3037109375, 2.65625, 4.0087890625, 5.361328125, 6.7138671875, 8.06640625, 9.4189453125, 10.771484375, 12.1240234375, 13.4765625, 14.8291015625, 16.181640625, 17.5341796875, 18.88671875, 20.2392578125, 21.591796875, 22.9443359375, 24.296875, 25.6494140625, 27.001953125, 28.3544921875, 29.70703125, 31.0595703125, 32.412109375, 33.7646484375, 35.1171875, 36.4697265625, 37.822265625, 39.1748046875, 40.52734375, 41.8798828125, 43.232421875, 44.5849609375, 45.9375]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 6.0, 4.0, 11.0, 12.0, 22.0, 21.0, 38.0, 47.0, 68.0, 100.0, 118.0, 171.0, 279.0, 375.0, 560.0, 832.0, 1307.0, 2037.0, 3378.0, 6079.0, 12759.0, 59267.0, 1257652.0, 2670305.0, 144373.0, 16710.0, 7315.0, 3841.0, 2306.0, 1455.0, 927.0, 592.0, 389.0, 274.0, 213.0, 117.0, 95.0, 65.0, 42.0, 33.0, 34.0, 15.0, 15.0, 5.0, 9.0, 2.0, 4.0, 7.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-106.125, -102.6044921875, -99.083984375, -95.5634765625, -92.04296875, -88.5224609375, -85.001953125, -81.4814453125, -77.9609375, -74.4404296875, -70.919921875, -67.3994140625, -63.87890625, -60.3583984375, -56.837890625, -53.3173828125, -49.796875, -46.2763671875, -42.755859375, -39.2353515625, -35.71484375, -32.1943359375, -28.673828125, -25.1533203125, -21.6328125, -18.1123046875, -14.591796875, -11.0712890625, -7.55078125, -4.0302734375, -0.509765625, 3.0107421875, 6.53125, 10.0517578125, 13.572265625, 17.0927734375, 20.61328125, 24.1337890625, 27.654296875, 31.1748046875, 34.6953125, 38.2158203125, 41.736328125, 45.2568359375, 48.77734375, 52.2978515625, 55.818359375, 59.3388671875, 62.859375, 66.3798828125, 69.900390625, 73.4208984375, 76.94140625, 80.4619140625, 83.982421875, 87.5029296875, 91.0234375, 94.5439453125, 98.064453125, 101.5849609375, 105.10546875, 108.6259765625, 112.146484375, 115.6669921875, 119.1875]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 9.0, 6.0, 7.0, 9.0, 6.0, 7.0, 22.0, 33.0, 27.0, 42.0, 62.0, 92.0, 226.0, 637.0, 1186.0, 955.0, 379.0, 177.0, 64.0, 51.0, 26.0, 18.0, 5.0, 9.0, 6.0, 2.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-155.5, -151.681640625, -147.86328125, -144.044921875, -140.2265625, -136.408203125, -132.58984375, -128.771484375, -124.953125, -121.134765625, -117.31640625, -113.498046875, -109.6796875, -105.861328125, -102.04296875, -98.224609375, -94.40625, -90.587890625, -86.76953125, -82.951171875, -79.1328125, -75.314453125, -71.49609375, -67.677734375, -63.859375, -60.041015625, -56.22265625, -52.404296875, -48.5859375, -44.767578125, -40.94921875, -37.130859375, -33.3125, -29.494140625, -25.67578125, -21.857421875, -18.0390625, -14.220703125, -10.40234375, -6.583984375, -2.765625, 1.052734375, 4.87109375, 8.689453125, 12.5078125, 16.326171875, 20.14453125, 23.962890625, 27.78125, 31.599609375, 35.41796875, 39.236328125, 43.0546875, 46.873046875, 50.69140625, 54.509765625, 58.328125, 62.146484375, 65.96484375, 69.783203125, 73.6015625, 77.419921875, 81.23828125, 85.056640625, 88.875]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 7.0, 7.0, 12.0, 27.0, 38.0, 74.0, 124.0, 292.0, 625.0, 1576.0, 4726.0, 20114.0, 301017.0, 3803061.0, 49352.0, 8686.0, 2641.0, 974.0, 401.0, 211.0, 99.0, 78.0, 42.0, 30.0, 16.0, 12.0, 11.0, 11.0, 9.0, 2.0, 4.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-231.125, -221.587890625, -212.05078125, -202.513671875, -192.9765625, -183.439453125, -173.90234375, -164.365234375, -154.828125, -145.291015625, -135.75390625, -126.216796875, -116.6796875, -107.142578125, -97.60546875, -88.068359375, -78.53125, -68.994140625, -59.45703125, -49.919921875, -40.3828125, -30.845703125, -21.30859375, -11.771484375, -2.234375, 7.302734375, 16.83984375, 26.376953125, 35.9140625, 45.451171875, 54.98828125, 64.525390625, 74.0625, 83.599609375, 93.13671875, 102.673828125, 112.2109375, 121.748046875, 131.28515625, 140.822265625, 150.359375, 159.896484375, 169.43359375, 178.970703125, 188.5078125, 198.044921875, 207.58203125, 217.119140625, 226.65625, 236.193359375, 245.73046875, 255.267578125, 264.8046875, 274.341796875, 283.87890625, 293.416015625, 302.953125, 312.490234375, 322.02734375, 331.564453125, 341.1015625, 350.638671875, 360.17578125, 369.712890625, 379.25]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 6.0, 13.0, 30.0, 49.0, 129.0, 281.0, 311.0, 127.0, 35.0, 18.0, 7.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-622.1337890625, -587.7919311523438, -553.4500732421875, -519.1082763671875, -484.76641845703125, -450.424560546875, -416.0827331542969, -381.74090576171875, -347.3990478515625, -313.05718994140625, -278.7153625488281, -244.37351989746094, -210.03167724609375, -175.68983459472656, -141.34799194335938, -107.00614929199219, -72.664306640625, -38.32246398925781, -3.980621337890625, 30.361221313476562, 64.70306396484375, 99.04490661621094, 133.38674926757812, 167.7285919189453, 202.0704345703125, 236.4122772216797, 270.7541198730469, 305.095947265625, 339.43780517578125, 373.7796630859375, 408.1214904785156, 442.46331787109375, 476.80517578125, 511.14703369140625, 545.4888916015625, 579.8306884765625, 614.1725463867188, 648.514404296875, 682.856201171875, 717.1980590820312, 751.5399169921875, 785.8817749023438, 820.2236328125, 854.5654296875, 888.9072875976562, 923.2491455078125, 957.5909423828125, 991.9328002929688, 1026.274658203125, 1060.616455078125, 1094.9583740234375, 1129.3001708984375, 1163.64208984375, 1197.98388671875, 1232.32568359375, 1266.6676025390625, 1301.0093994140625, 1335.3511962890625, 1369.693115234375, 1404.034912109375, 1438.376708984375, 1472.7186279296875, 1507.0604248046875, 1541.40234375, 1575.744140625]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 5.0, 5.0, 9.0, 4.0, 9.0, 10.0, 7.0, 11.0, 17.0, 15.0, 20.0, 17.0, 14.0, 26.0, 28.0, 23.0, 31.0, 28.0, 44.0, 40.0, 44.0, 31.0, 32.0, 45.0, 48.0, 40.0, 47.0, 37.0, 43.0, 38.0, 26.0, 29.0, 33.0, 22.0, 23.0, 22.0, 15.0, 18.0, 14.0, 14.0, 6.0, 3.0, 6.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-277.356201171875, -268.98248291015625, -260.6087951660156, -252.23507690429688, -243.8613739013672, -235.4876708984375, -227.11395263671875, -218.74024963378906, -210.36654663085938, -201.9928436279297, -193.619140625, -185.24542236328125, -176.87171936035156, -168.49801635742188, -160.12429809570312, -151.75059509277344, -143.37689208984375, -135.00318908691406, -126.62947845458984, -118.25576782226562, -109.88206481933594, -101.50836181640625, -93.13465118408203, -84.76094055175781, -76.38723754882812, -68.01353454589844, -59.63982391357422, -51.266117095947266, -42.89241027832031, -34.51870346069336, -26.144996643066406, -17.771289825439453, -9.397552490234375, -1.0238456726074219, 7.349861145019531, 15.723567962646484, 24.097274780273438, 32.47098159790039, 40.844688415527344, 49.2183952331543, 57.59210205078125, 65.96580505371094, 74.33951568603516, 82.71322631835938, 91.08692932128906, 99.46063232421875, 107.83434295654297, 116.20805358886719, 124.58175659179688, 132.95545959472656, 141.32916259765625, 149.702880859375, 158.0765838623047, 166.45028686523438, 174.82400512695312, 183.1977081298828, 191.5714111328125, 199.9451141357422, 208.31881713867188, 216.69253540039062, 225.0662384033203, 233.43994140625, 241.81365966796875, 250.18736267089844, 258.5610656738281]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 2.0, 3.0, 4.0, 3.0, 8.0, 8.0, 9.0, 12.0, 11.0, 16.0, 18.0, 19.0, 8.0, 24.0, 25.0, 37.0, 37.0, 33.0, 39.0, 41.0, 38.0, 48.0, 45.0, 38.0, 30.0, 45.0, 42.0, 35.0, 38.0, 41.0, 27.0, 23.0, 31.0, 25.0, 18.0, 14.0, 20.0, 15.0, 15.0, 10.0, 11.0, 11.0, 7.0, 6.0, 4.0, 3.0, 5.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0], "bins": [-45.96875, -44.64111328125, -43.3134765625, -41.98583984375, -40.658203125, -39.33056640625, -38.0029296875, -36.67529296875, -35.34765625, -34.02001953125, -32.6923828125, -31.36474609375, -30.037109375, -28.70947265625, -27.3818359375, -26.05419921875, -24.7265625, -23.39892578125, -22.0712890625, -20.74365234375, -19.416015625, -18.08837890625, -16.7607421875, -15.43310546875, -14.10546875, -12.77783203125, -11.4501953125, -10.12255859375, -8.794921875, -7.46728515625, -6.1396484375, -4.81201171875, -3.484375, -2.15673828125, -0.8291015625, 0.49853515625, 1.826171875, 3.15380859375, 4.4814453125, 5.80908203125, 7.13671875, 8.46435546875, 9.7919921875, 11.11962890625, 12.447265625, 13.77490234375, 15.1025390625, 16.43017578125, 17.7578125, 19.08544921875, 20.4130859375, 21.74072265625, 23.068359375, 24.39599609375, 25.7236328125, 27.05126953125, 28.37890625, 29.70654296875, 31.0341796875, 32.36181640625, 33.689453125, 35.01708984375, 36.3447265625, 37.67236328125, 39.0]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 10.0, 6.0, 14.0, 14.0, 28.0, 49.0, 69.0, 112.0, 137.0, 220.0, 350.0, 507.0, 762.0, 1089.0, 1652.0, 2457.0, 3539.0, 5072.0, 7427.0, 10698.0, 16244.0, 24136.0, 38476.0, 63145.0, 112598.0, 216212.0, 232621.0, 122840.0, 68075.0, 41154.0, 26008.0, 16933.0, 11378.0, 7555.0, 5336.0, 3722.0, 2546.0, 1687.0, 1188.0, 815.0, 586.0, 340.0, 248.0, 164.0, 115.0, 80.0, 60.0, 33.0, 23.0, 14.0, 8.0, 4.0, 3.0, 2.0, 3.0, 1.0], "bins": [-2.1796875, -2.1157073974609375, -2.051727294921875, -1.9877471923828125, -1.92376708984375, -1.8597869873046875, -1.795806884765625, -1.7318267822265625, -1.6678466796875, -1.6038665771484375, -1.539886474609375, -1.4759063720703125, -1.41192626953125, -1.3479461669921875, -1.283966064453125, -1.2199859619140625, -1.156005859375, -1.0920257568359375, -1.028045654296875, -0.9640655517578125, -0.90008544921875, -0.8361053466796875, -0.772125244140625, -0.7081451416015625, -0.6441650390625, -0.5801849365234375, -0.516204833984375, -0.4522247314453125, -0.38824462890625, -0.3242645263671875, -0.260284423828125, -0.1963043212890625, -0.13232421875, -0.0683441162109375, -0.004364013671875, 0.0596160888671875, 0.12359619140625, 0.1875762939453125, 0.251556396484375, 0.3155364990234375, 0.3795166015625, 0.4434967041015625, 0.507476806640625, 0.5714569091796875, 0.63543701171875, 0.6994171142578125, 0.763397216796875, 0.8273773193359375, 0.891357421875, 0.9553375244140625, 1.019317626953125, 1.0832977294921875, 1.14727783203125, 1.2112579345703125, 1.275238037109375, 1.3392181396484375, 1.4031982421875, 1.4671783447265625, 1.531158447265625, 1.5951385498046875, 1.65911865234375, 1.7230987548828125, 1.787078857421875, 1.8510589599609375, 1.9150390625]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 7.0, 6.0, 3.0, 5.0, 11.0, 15.0, 11.0, 21.0, 24.0, 14.0, 16.0, 21.0, 30.0, 19.0, 34.0, 25.0, 29.0, 41.0, 36.0, 33.0, 40.0, 31.0, 1069.0, 46.0, 32.0, 35.0, 35.0, 27.0, 40.0, 36.0, 24.0, 31.0, 33.0, 19.0, 21.0, 13.0, 23.0, 11.0, 9.0, 8.0, 9.0, 10.0, 6.0, 8.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-25.671875, -24.822509765625, -23.97314453125, -23.123779296875, -22.2744140625, -21.425048828125, -20.57568359375, -19.726318359375, -18.876953125, -18.027587890625, -17.17822265625, -16.328857421875, -15.4794921875, -14.630126953125, -13.78076171875, -12.931396484375, -12.08203125, -11.232666015625, -10.38330078125, -9.533935546875, -8.6845703125, -7.835205078125, -6.98583984375, -6.136474609375, -5.287109375, -4.437744140625, -3.58837890625, -2.739013671875, -1.8896484375, -1.040283203125, -0.19091796875, 0.658447265625, 1.5078125, 2.357177734375, 3.20654296875, 4.055908203125, 4.9052734375, 5.754638671875, 6.60400390625, 7.453369140625, 8.302734375, 9.152099609375, 10.00146484375, 10.850830078125, 11.7001953125, 12.549560546875, 13.39892578125, 14.248291015625, 15.09765625, 15.947021484375, 16.79638671875, 17.645751953125, 18.4951171875, 19.344482421875, 20.19384765625, 21.043212890625, 21.892578125, 22.741943359375, 23.59130859375, 24.440673828125, 25.2900390625, 26.139404296875, 26.98876953125, 27.838134765625, 28.6875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 11.0, 2.0, 10.0, 16.0, 26.0, 23.0, 32.0, 53.0, 100.0, 133.0, 206.0, 294.0, 427.0, 648.0, 979.0, 1480.0, 2390.0, 3669.0, 5748.0, 9197.0, 14738.0, 24132.0, 40065.0, 70070.0, 138718.0, 1329843.0, 223042.0, 96167.0, 52839.0, 30945.0, 18909.0, 11794.0, 7408.0, 4559.0, 2960.0, 1882.0, 1268.0, 761.0, 549.0, 335.0, 244.0, 154.0, 95.0, 70.0, 48.0, 37.0, 20.0, 18.0, 11.0, 6.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.083984375, -2.013946533203125, -1.94390869140625, -1.873870849609375, -1.8038330078125, -1.733795166015625, -1.66375732421875, -1.593719482421875, -1.523681640625, -1.453643798828125, -1.38360595703125, -1.313568115234375, -1.2435302734375, -1.173492431640625, -1.10345458984375, -1.033416748046875, -0.96337890625, -0.893341064453125, -0.82330322265625, -0.753265380859375, -0.6832275390625, -0.613189697265625, -0.54315185546875, -0.473114013671875, -0.403076171875, -0.333038330078125, -0.26300048828125, -0.192962646484375, -0.1229248046875, -0.052886962890625, 0.01715087890625, 0.087188720703125, 0.1572265625, 0.227264404296875, 0.29730224609375, 0.367340087890625, 0.4373779296875, 0.507415771484375, 0.57745361328125, 0.647491455078125, 0.717529296875, 0.787567138671875, 0.85760498046875, 0.927642822265625, 0.9976806640625, 1.067718505859375, 1.13775634765625, 1.207794189453125, 1.27783203125, 1.347869873046875, 1.41790771484375, 1.487945556640625, 1.5579833984375, 1.628021240234375, 1.69805908203125, 1.768096923828125, 1.838134765625, 1.908172607421875, 1.97821044921875, 2.048248291015625, 2.1182861328125, 2.188323974609375, 2.25836181640625, 2.328399658203125, 2.3984375]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 5.0, 4.0, 3.0, 1.0, 5.0, 8.0, 10.0, 16.0, 21.0, 19.0, 26.0, 28.0, 36.0, 34.0, 68.0, 74.0, 66.0, 93.0, 92.0, 66.0, 66.0, 57.0, 47.0, 22.0, 16.0, 27.0, 17.0, 14.0, 21.0, 9.0, 8.0, 8.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.036590576171875, -0.03556513786315918, -0.03453969955444336, -0.03351426124572754, -0.03248882293701172, -0.0314633846282959, -0.030437946319580078, -0.029412508010864258, -0.028387069702148438, -0.027361631393432617, -0.026336193084716797, -0.025310754776000977, -0.024285316467285156, -0.023259878158569336, -0.022234439849853516, -0.021209001541137695, -0.020183563232421875, -0.019158124923706055, -0.018132686614990234, -0.017107248306274414, -0.016081809997558594, -0.015056371688842773, -0.014030933380126953, -0.013005495071411133, -0.011980056762695312, -0.010954618453979492, -0.009929180145263672, -0.008903741836547852, -0.007878303527832031, -0.006852865219116211, -0.005827426910400391, -0.00480198860168457, -0.00377655029296875, -0.0027511119842529297, -0.0017256736755371094, -0.0007002353668212891, 0.00032520294189453125, 0.0013506412506103516, 0.002376079559326172, 0.003401517868041992, 0.0044269561767578125, 0.005452394485473633, 0.006477832794189453, 0.0075032711029052734, 0.008528709411621094, 0.009554147720336914, 0.010579586029052734, 0.011605024337768555, 0.012630462646484375, 0.013655900955200195, 0.014681339263916016, 0.015706777572631836, 0.016732215881347656, 0.017757654190063477, 0.018783092498779297, 0.019808530807495117, 0.020833969116210938, 0.021859407424926758, 0.022884845733642578, 0.0239102840423584, 0.02493572235107422, 0.02596116065979004, 0.02698659896850586, 0.02801203727722168, 0.0290374755859375]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 5.0, 11.0, 8.0, 16.0, 24.0, 20.0, 35.0, 42.0, 44.0, 70.0, 83.0, 162.0, 464.0, 2585.0, 45499.0, 971089.0, 25667.0, 1822.0, 385.0, 152.0, 91.0, 60.0, 49.0, 35.0, 27.0, 25.0, 18.0, 16.0, 9.0, 6.0, 3.0, 3.0, 5.0, 4.0, 5.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.480224609375, -0.4633293151855469, -0.44643402099609375, -0.4295387268066406, -0.4126434326171875, -0.3957481384277344, -0.37885284423828125, -0.3619575500488281, -0.345062255859375, -0.3281669616699219, -0.31127166748046875, -0.2943763732910156, -0.2774810791015625, -0.2605857849121094, -0.24369049072265625, -0.22679519653320312, -0.20989990234375, -0.19300460815429688, -0.17610931396484375, -0.15921401977539062, -0.1423187255859375, -0.12542343139648438, -0.10852813720703125, -0.09163284301757812, -0.074737548828125, -0.057842254638671875, -0.04094696044921875, -0.024051666259765625, -0.0071563720703125, 0.009738922119140625, 0.02663421630859375, 0.043529510498046875, 0.0604248046875, 0.07732009887695312, 0.09421539306640625, 0.11111068725585938, 0.1280059814453125, 0.14490127563476562, 0.16179656982421875, 0.17869186401367188, 0.195587158203125, 0.21248245239257812, 0.22937774658203125, 0.24627304077148438, 0.2631683349609375, 0.2800636291503906, 0.29695892333984375, 0.3138542175292969, 0.33074951171875, 0.3476448059082031, 0.36454010009765625, 0.3814353942871094, 0.3983306884765625, 0.4152259826660156, 0.43212127685546875, 0.4490165710449219, 0.465911865234375, 0.4828071594238281, 0.49970245361328125, 0.5165977478027344, 0.5334930419921875, 0.5503883361816406, 0.5672836303710938, 0.5841789245605469, 0.60107421875]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 21.0, 104.0, 574.0, 261.0, 40.0, 11.0, 4.0], "bins": [-0.23129884898662567, -0.22742971777915955, -0.22356057167053223, -0.2196914404630661, -0.21582230925559998, -0.21195316314697266, -0.20808403193950653, -0.2042149007320404, -0.20034576952457428, -0.19647663831710815, -0.19260749220848083, -0.1887383610010147, -0.18486922979354858, -0.18100008368492126, -0.17713095247745514, -0.173261821269989, -0.1693926751613617, -0.16552354395389557, -0.16165439784526825, -0.15778526663780212, -0.153916135430336, -0.15004700422286987, -0.14617785811424255, -0.14230872690677643, -0.1384395956993103, -0.13457046449184418, -0.13070131838321686, -0.12683218717575073, -0.1229630559682846, -0.11909391731023788, -0.11522477865219116, -0.11135564744472504, -0.10748650878667831, -0.10361737012863159, -0.09974823892116547, -0.09587910026311874, -0.09200996905565262, -0.0881408303976059, -0.08427169919013977, -0.08040256053209305, -0.07653342187404633, -0.0726642832159996, -0.06879515200853348, -0.06492601335048676, -0.06105687841773033, -0.05718774348497391, -0.053318608552217484, -0.04944947361946106, -0.045580342411994934, -0.04171120747923851, -0.037842072546482086, -0.033972933888435364, -0.03010379895567894, -0.026234664022922516, -0.022365529090166092, -0.01849639229476452, -0.014627255499362946, -0.010758119635283947, -0.006888984236866236, -0.0030198488384485245, 0.0008492870256304741, 0.004718422889709473, 0.008587557822465897, 0.01245669461786747, 0.016325829550623894]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 5.0, 5.0, 8.0, 6.0, 13.0, 24.0, 18.0, 25.0, 21.0, 31.0, 30.0, 31.0, 37.0, 31.0, 47.0, 60.0, 53.0, 45.0, 47.0, 33.0, 64.0, 38.0, 53.0, 39.0, 31.0, 30.0, 25.0, 32.0, 21.0, 17.0, 24.0, 15.0, 16.0, 5.0, 7.0, 11.0, 7.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.017859458923339844, -0.017259661108255386, -0.016659865155816078, -0.01606006920337677, -0.015460271388292313, -0.01486047450453043, -0.014260677620768547, -0.013660880737006664, -0.013061083853244781, -0.012461286969482899, -0.011861490085721016, -0.011261693201959133, -0.01066189631819725, -0.010062099434435368, -0.009462302550673485, -0.008862505666911602, -0.00826270878314972, -0.0076629118993878365, -0.007063115015625954, -0.006463318131864071, -0.005863521248102188, -0.005263724364340305, -0.0046639274805784225, -0.00406413059681654, -0.003464333713054657, -0.002864536829292774, -0.0022647399455308914, -0.0016649430617690086, -0.0010651461780071259, -0.00046534929424524307, 0.0001344475895166397, 0.0007342444732785225, 0.0013340413570404053, 0.001933838240802288, 0.002533635124564171, 0.0031334320083260536, 0.0037332288920879364, 0.004333025775849819, 0.004932822659611702, 0.005532619543373585, 0.0061324164271354675, 0.00673221331089735, 0.007332010194659233, 0.007931807078421116, 0.008531603962182999, 0.009131400845944881, 0.009731197729706764, 0.010330994613468647, 0.01093079149723053, 0.011530588380992413, 0.012130385264754295, 0.012730182148516178, 0.013329979032278061, 0.013929775916039944, 0.014529572799801826, 0.01512936968356371, 0.015729166567325592, 0.01632896438241005, 0.016928760334849358, 0.017528556287288666, 0.018128354102373123, 0.01872815191745758, 0.01932794786989689, 0.019927743822336197, 0.020527541637420654]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 2.0, 3.0, 4.0, 3.0, 8.0, 8.0, 9.0, 12.0, 11.0, 16.0, 18.0, 19.0, 8.0, 24.0, 25.0, 37.0, 37.0, 33.0, 39.0, 41.0, 38.0, 48.0, 45.0, 38.0, 30.0, 45.0, 42.0, 35.0, 38.0, 41.0, 27.0, 23.0, 31.0, 25.0, 18.0, 14.0, 20.0, 15.0, 15.0, 10.0, 11.0, 11.0, 7.0, 6.0, 4.0, 3.0, 5.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0], "bins": [-45.96875, -44.64111328125, -43.3134765625, -41.98583984375, -40.658203125, -39.33056640625, -38.0029296875, -36.67529296875, -35.34765625, -34.02001953125, -32.6923828125, -31.36474609375, -30.037109375, -28.70947265625, -27.3818359375, -26.05419921875, -24.7265625, -23.39892578125, -22.0712890625, -20.74365234375, -19.416015625, -18.08837890625, -16.7607421875, -15.43310546875, -14.10546875, -12.77783203125, -11.4501953125, -10.12255859375, -8.794921875, -7.46728515625, -6.1396484375, -4.81201171875, -3.484375, -2.15673828125, -0.8291015625, 0.49853515625, 1.826171875, 3.15380859375, 4.4814453125, 5.80908203125, 7.13671875, 8.46435546875, 9.7919921875, 11.11962890625, 12.447265625, 13.77490234375, 15.1025390625, 16.43017578125, 17.7578125, 19.08544921875, 20.4130859375, 21.74072265625, 23.068359375, 24.39599609375, 25.7236328125, 27.05126953125, 28.37890625, 29.70654296875, 31.0341796875, 32.36181640625, 33.689453125, 35.01708984375, 36.3447265625, 37.67236328125, 39.0]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 6.0, 8.0, 13.0, 22.0, 21.0, 34.0, 50.0, 68.0, 111.0, 145.0, 196.0, 294.0, 405.0, 590.0, 906.0, 1274.0, 2049.0, 3343.0, 6641.0, 17868.0, 86523.0, 784457.0, 106357.0, 19958.0, 7259.0, 3548.0, 2093.0, 1330.0, 912.0, 645.0, 449.0, 278.0, 217.0, 144.0, 102.0, 73.0, 49.0, 28.0, 29.0, 19.0, 13.0, 11.0, 8.0, 9.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-60.78125, -59.0712890625, -57.361328125, -55.6513671875, -53.94140625, -52.2314453125, -50.521484375, -48.8115234375, -47.1015625, -45.3916015625, -43.681640625, -41.9716796875, -40.26171875, -38.5517578125, -36.841796875, -35.1318359375, -33.421875, -31.7119140625, -30.001953125, -28.2919921875, -26.58203125, -24.8720703125, -23.162109375, -21.4521484375, -19.7421875, -18.0322265625, -16.322265625, -14.6123046875, -12.90234375, -11.1923828125, -9.482421875, -7.7724609375, -6.0625, -4.3525390625, -2.642578125, -0.9326171875, 0.77734375, 2.4873046875, 4.197265625, 5.9072265625, 7.6171875, 9.3271484375, 11.037109375, 12.7470703125, 14.45703125, 16.1669921875, 17.876953125, 19.5869140625, 21.296875, 23.0068359375, 24.716796875, 26.4267578125, 28.13671875, 29.8466796875, 31.556640625, 33.2666015625, 34.9765625, 36.6865234375, 38.396484375, 40.1064453125, 41.81640625, 43.5263671875, 45.236328125, 46.9462890625, 48.65625]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 2.0, 4.0, 3.0, 6.0, 5.0, 8.0, 12.0, 18.0, 16.0, 18.0, 22.0, 20.0, 23.0, 30.0, 30.0, 50.0, 33.0, 48.0, 55.0, 57.0, 484.0, 1611.0, 79.0, 51.0, 47.0, 46.0, 36.0, 32.0, 33.0, 29.0, 20.0, 26.0, 18.0, 18.0, 15.0, 14.0, 9.0, 10.0, 5.0, 1.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-136.0, -131.61328125, -127.2265625, -122.83984375, -118.453125, -114.06640625, -109.6796875, -105.29296875, -100.90625, -96.51953125, -92.1328125, -87.74609375, -83.359375, -78.97265625, -74.5859375, -70.19921875, -65.8125, -61.42578125, -57.0390625, -52.65234375, -48.265625, -43.87890625, -39.4921875, -35.10546875, -30.71875, -26.33203125, -21.9453125, -17.55859375, -13.171875, -8.78515625, -4.3984375, -0.01171875, 4.375, 8.76171875, 13.1484375, 17.53515625, 21.921875, 26.30859375, 30.6953125, 35.08203125, 39.46875, 43.85546875, 48.2421875, 52.62890625, 57.015625, 61.40234375, 65.7890625, 70.17578125, 74.5625, 78.94921875, 83.3359375, 87.72265625, 92.109375, 96.49609375, 100.8828125, 105.26953125, 109.65625, 114.04296875, 118.4296875, 122.81640625, 127.203125, 131.58984375, 135.9765625, 140.36328125, 144.75]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 1.0, 7.0, 8.0, 11.0, 19.0, 35.0, 48.0, 73.0, 146.0, 265.0, 866.0, 10245.0, 3126000.0, 6764.0, 655.0, 256.0, 116.0, 64.0, 46.0, 38.0, 16.0, 9.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-472.5, -453.1640625, -433.828125, -414.4921875, -395.15625, -375.8203125, -356.484375, -337.1484375, -317.8125, -298.4765625, -279.140625, -259.8046875, -240.46875, -221.1328125, -201.796875, -182.4609375, -163.125, -143.7890625, -124.453125, -105.1171875, -85.78125, -66.4453125, -47.109375, -27.7734375, -8.4375, 10.8984375, 30.234375, 49.5703125, 68.90625, 88.2421875, 107.578125, 126.9140625, 146.25, 165.5859375, 184.921875, 204.2578125, 223.59375, 242.9296875, 262.265625, 281.6015625, 300.9375, 320.2734375, 339.609375, 358.9453125, 378.28125, 397.6171875, 416.953125, 436.2890625, 455.625, 474.9609375, 494.296875, 513.6328125, 532.96875, 552.3046875, 571.640625, 590.9765625, 610.3125, 629.6484375, 648.984375, 668.3203125, 687.65625, 706.9921875, 726.328125, 745.6640625, 765.0]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 34.0, 366.0, 541.0, 59.0, 13.0], "bins": [-1305.7406005859375, -1284.364501953125, -1262.98828125, -1241.6121826171875, -1220.236083984375, -1198.85986328125, -1177.4837646484375, -1156.107666015625, -1134.7314453125, -1113.3553466796875, -1091.9791259765625, -1070.60302734375, -1049.2269287109375, -1027.8507080078125, -1006.474609375, -985.0984497070312, -963.7223510742188, -942.34619140625, -920.9700927734375, -899.5939331054688, -878.2177734375, -856.8416748046875, -835.4655151367188, -814.08935546875, -792.7132568359375, -771.3370971679688, -749.9609985351562, -728.5848388671875, -707.2086791992188, -685.83251953125, -664.4564208984375, -643.0802612304688, -621.7041015625, -600.3279418945312, -578.9518432617188, -557.57568359375, -536.1995239257812, -514.8233642578125, -493.447265625, -472.07110595703125, -450.6949768066406, -429.31884765625, -407.94268798828125, -386.5665588378906, -365.1904296875, -343.81427001953125, -322.4381408691406, -301.06201171875, -279.68585205078125, -258.3097229003906, -236.93356323242188, -215.55743408203125, -194.18128967285156, -172.80514526367188, -151.42901611328125, -130.05287170410156, -108.67672729492188, -87.30058288574219, -65.92444610595703, -44.548309326171875, -23.172164916992188, -1.7960205078125, 19.580108642578125, 40.95625305175781, 62.332393646240234]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 4.0, 4.0, 5.0, 6.0, 11.0, 10.0, 12.0, 15.0, 18.0, 34.0, 23.0, 29.0, 33.0, 35.0, 31.0, 42.0, 53.0, 57.0, 47.0, 60.0, 50.0, 51.0, 60.0, 39.0, 34.0, 38.0, 34.0, 24.0, 34.0, 21.0, 13.0, 13.0, 13.0, 16.0, 8.0, 7.0, 6.0, 6.0, 5.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-445.086669921875, -432.382080078125, -419.6774597167969, -406.9728698730469, -394.2682800292969, -381.5636901855469, -368.85906982421875, -356.15447998046875, -343.44989013671875, -330.74530029296875, -318.0406799316406, -305.3360900878906, -292.6315002441406, -279.9269104003906, -267.2222900390625, -254.5177001953125, -241.81309509277344, -229.10848999023438, -216.40390014648438, -203.6992950439453, -190.9947052001953, -178.29010009765625, -165.58551025390625, -152.8809051513672, -140.17630004882812, -127.4717025756836, -114.76710510253906, -102.0625, -89.35791015625, -76.65330505371094, -63.948707580566406, -51.244110107421875, -38.539520263671875, -25.834922790527344, -13.13032341003418, -0.4257240295410156, 12.278873443603516, 24.983470916748047, 37.688072204589844, 50.392669677734375, 63.097267150878906, 75.80186462402344, 88.50646209716797, 101.2110595703125, 113.91566467285156, 126.62025451660156, 139.32485961914062, 152.02944946289062, 164.7340545654297, 177.43865966796875, 190.14324951171875, 202.8478546142578, 215.5524444580078, 228.25704956054688, 240.96163940429688, 253.66624450683594, 266.370849609375, 279.075439453125, 291.7800598144531, 304.4846496582031, 317.1892395019531, 329.8938293457031, 342.59844970703125, 355.30303955078125, 368.00762939453125]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 3.0, 3.0, 2.0, 5.0, 6.0, 8.0, 12.0, 6.0, 14.0, 8.0, 18.0, 16.0, 19.0, 18.0, 28.0, 26.0, 30.0, 33.0, 30.0, 26.0, 43.0, 38.0, 41.0, 35.0, 41.0, 36.0, 44.0, 32.0, 40.0, 34.0, 44.0, 22.0, 35.0, 22.0, 23.0, 17.0, 22.0, 20.0, 18.0, 8.0, 9.0, 16.0, 12.0, 9.0, 10.0, 4.0, 6.0, 2.0, 8.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0], "bins": [-43.625, -42.3359375, -41.046875, -39.7578125, -38.46875, -37.1796875, -35.890625, -34.6015625, -33.3125, -32.0234375, -30.734375, -29.4453125, -28.15625, -26.8671875, -25.578125, -24.2890625, -23.0, -21.7109375, -20.421875, -19.1328125, -17.84375, -16.5546875, -15.265625, -13.9765625, -12.6875, -11.3984375, -10.109375, -8.8203125, -7.53125, -6.2421875, -4.953125, -3.6640625, -2.375, -1.0859375, 0.203125, 1.4921875, 2.78125, 4.0703125, 5.359375, 6.6484375, 7.9375, 9.2265625, 10.515625, 11.8046875, 13.09375, 14.3828125, 15.671875, 16.9609375, 18.25, 19.5390625, 20.828125, 22.1171875, 23.40625, 24.6953125, 25.984375, 27.2734375, 28.5625, 29.8515625, 31.140625, 32.4296875, 33.71875, 35.0078125, 36.296875, 37.5859375, 38.875]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 6.0, 6.0, 7.0, 10.0, 9.0, 16.0, 20.0, 21.0, 32.0, 39.0, 63.0, 96.0, 138.0, 188.0, 240.0, 367.0, 580.0, 857.0, 1325.0, 2219.0, 3924.0, 7611.0, 18941.0, 191787.0, 2821387.0, 1057749.0, 60621.0, 12527.0, 5527.0, 2964.0, 1770.0, 1085.0, 654.0, 434.0, 313.0, 207.0, 160.0, 114.0, 74.0, 50.0, 37.0, 30.0, 21.0, 16.0, 14.0, 11.0, 5.0, 7.0, 4.0, 4.0, 1.0, 2.0, 2.0, 2.0], "bins": [-121.5625, -118.068359375, -114.57421875, -111.080078125, -107.5859375, -104.091796875, -100.59765625, -97.103515625, -93.609375, -90.115234375, -86.62109375, -83.126953125, -79.6328125, -76.138671875, -72.64453125, -69.150390625, -65.65625, -62.162109375, -58.66796875, -55.173828125, -51.6796875, -48.185546875, -44.69140625, -41.197265625, -37.703125, -34.208984375, -30.71484375, -27.220703125, -23.7265625, -20.232421875, -16.73828125, -13.244140625, -9.75, -6.255859375, -2.76171875, 0.732421875, 4.2265625, 7.720703125, 11.21484375, 14.708984375, 18.203125, 21.697265625, 25.19140625, 28.685546875, 32.1796875, 35.673828125, 39.16796875, 42.662109375, 46.15625, 49.650390625, 53.14453125, 56.638671875, 60.1328125, 63.626953125, 67.12109375, 70.615234375, 74.109375, 77.603515625, 81.09765625, 84.591796875, 88.0859375, 91.580078125, 95.07421875, 98.568359375, 102.0625]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 6.0, 0.0, 6.0, 3.0, 5.0, 8.0, 6.0, 9.0, 9.0, 15.0, 23.0, 31.0, 35.0, 44.0, 75.0, 106.0, 192.0, 416.0, 786.0, 901.0, 615.0, 303.0, 172.0, 91.0, 46.0, 37.0, 21.0, 24.0, 20.0, 17.0, 16.0, 9.0, 7.0, 5.0, 7.0, 4.0, 4.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-105.9375, -102.93359375, -99.9296875, -96.92578125, -93.921875, -90.91796875, -87.9140625, -84.91015625, -81.90625, -78.90234375, -75.8984375, -72.89453125, -69.890625, -66.88671875, -63.8828125, -60.87890625, -57.875, -54.87109375, -51.8671875, -48.86328125, -45.859375, -42.85546875, -39.8515625, -36.84765625, -33.84375, -30.83984375, -27.8359375, -24.83203125, -21.828125, -18.82421875, -15.8203125, -12.81640625, -9.8125, -6.80859375, -3.8046875, -0.80078125, 2.203125, 5.20703125, 8.2109375, 11.21484375, 14.21875, 17.22265625, 20.2265625, 23.23046875, 26.234375, 29.23828125, 32.2421875, 35.24609375, 38.25, 41.25390625, 44.2578125, 47.26171875, 50.265625, 53.26953125, 56.2734375, 59.27734375, 62.28125, 65.28515625, 68.2890625, 71.29296875, 74.296875, 77.30078125, 80.3046875, 83.30859375, 86.3125]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 6.0, 4.0, 8.0, 10.0, 7.0, 18.0, 24.0, 25.0, 28.0, 39.0, 89.0, 237.0, 700.0, 2369.0, 10624.0, 92774.0, 3975837.0, 97008.0, 10894.0, 2325.0, 719.0, 222.0, 117.0, 55.0, 42.0, 21.0, 17.0, 11.0, 11.0, 8.0, 6.0, 4.0, 4.0, 4.0, 4.0, 4.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-300.0, -289.09375, -278.1875, -267.28125, -256.375, -245.46875, -234.5625, -223.65625, -212.75, -201.84375, -190.9375, -180.03125, -169.125, -158.21875, -147.3125, -136.40625, -125.5, -114.59375, -103.6875, -92.78125, -81.875, -70.96875, -60.0625, -49.15625, -38.25, -27.34375, -16.4375, -5.53125, 5.375, 16.28125, 27.1875, 38.09375, 49.0, 59.90625, 70.8125, 81.71875, 92.625, 103.53125, 114.4375, 125.34375, 136.25, 147.15625, 158.0625, 168.96875, 179.875, 190.78125, 201.6875, 212.59375, 223.5, 234.40625, 245.3125, 256.21875, 267.125, 278.03125, 288.9375, 299.84375, 310.75, 321.65625, 332.5625, 343.46875, 354.375, 365.28125, 376.1875, 387.09375, 398.0]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 6.0, 7.0, 31.0, 62.0, 118.0, 308.0, 266.0, 108.0, 66.0, 19.0, 9.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1017.845458984375, -988.7223510742188, -959.5993041992188, -930.4761962890625, -901.3531494140625, -872.2300415039062, -843.10693359375, -813.98388671875, -784.8607788085938, -755.7376708984375, -726.6146240234375, -697.4915161132812, -668.368408203125, -639.245361328125, -610.1222534179688, -580.9991455078125, -551.8760986328125, -522.7529907226562, -493.62994384765625, -464.5068359375, -435.3837585449219, -406.26068115234375, -377.1375732421875, -348.0144958496094, -318.89141845703125, -289.7683410644531, -260.645263671875, -231.52215576171875, -202.39907836914062, -173.2760009765625, -144.1529083251953, -115.02981567382812, -85.90673828125, -56.783653259277344, -27.660568237304688, 1.4625167846679688, 30.585601806640625, 59.70867919921875, 88.83177185058594, 117.95486450195312, 147.07794189453125, 176.20101928710938, 205.32411193847656, 234.44720458984375, 263.5702819824219, 292.693359375, 321.81646728515625, 350.9395446777344, 380.0626220703125, 409.1856994628906, 438.30877685546875, 467.431884765625, 496.5549621582031, 525.6780395507812, 554.8011474609375, 583.9241943359375, 613.0473022460938, 642.17041015625, 671.29345703125, 700.4165649414062, 729.5396728515625, 758.6627197265625, 787.7858276367188, 816.908935546875, 846.031982421875]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 2.0, 5.0, 7.0, 6.0, 1.0, 5.0, 8.0, 8.0, 9.0, 10.0, 10.0, 14.0, 18.0, 21.0, 29.0, 20.0, 27.0, 27.0, 32.0, 26.0, 30.0, 41.0, 32.0, 43.0, 41.0, 22.0, 45.0, 37.0, 31.0, 35.0, 31.0, 42.0, 33.0, 35.0, 29.0, 32.0, 20.0, 20.0, 26.0, 19.0, 16.0, 13.0, 12.0, 7.0, 10.0, 7.0, 2.0, 4.0, 4.0, 8.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-233.20901489257812, -225.56715393066406, -217.92529296875, -210.283447265625, -202.64158630371094, -194.99972534179688, -187.3578643798828, -179.71600341796875, -172.07415771484375, -164.4322967529297, -156.79043579101562, -149.14859008789062, -141.50672912597656, -133.8648681640625, -126.22300720214844, -118.58114624023438, -110.93928527832031, -103.29742431640625, -95.65557098388672, -88.01371002197266, -80.37185668945312, -72.72999572753906, -65.088134765625, -57.4462776184082, -49.804420471191406, -42.16256332397461, -34.52070617675781, -26.87884521484375, -19.236988067626953, -11.595130920410156, -3.9532699584960938, 3.688587188720703, 11.3304443359375, 18.972301483154297, 26.614160537719727, 34.256019592285156, 41.89787673950195, 49.53973388671875, 57.18159484863281, 64.82345581054688, 72.4653091430664, 80.10717010498047, 87.7490234375, 95.39088439941406, 103.03274536132812, 110.67459869384766, 118.31645965576172, 125.95831298828125, 133.6001739501953, 141.24203491210938, 148.88389587402344, 156.5257568359375, 164.1676025390625, 171.80946350097656, 179.45132446289062, 187.0931854248047, 194.73504638671875, 202.3769073486328, 210.01876831054688, 217.66061401367188, 225.30247497558594, 232.9443359375, 240.58619689941406, 248.22805786132812, 255.86990356445312]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 5.0, 1.0, 5.0, 6.0, 4.0, 3.0, 7.0, 12.0, 10.0, 10.0, 16.0, 11.0, 21.0, 20.0, 18.0, 29.0, 31.0, 23.0, 32.0, 31.0, 40.0, 28.0, 39.0, 44.0, 32.0, 34.0, 44.0, 47.0, 33.0, 30.0, 51.0, 22.0, 27.0, 23.0, 30.0, 16.0, 25.0, 20.0, 18.0, 14.0, 24.0, 15.0, 9.0, 8.0, 9.0, 4.0, 6.0, 6.0, 2.0, 8.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-41.3125, -40.0517578125, -38.791015625, -37.5302734375, -36.26953125, -35.0087890625, -33.748046875, -32.4873046875, -31.2265625, -29.9658203125, -28.705078125, -27.4443359375, -26.18359375, -24.9228515625, -23.662109375, -22.4013671875, -21.140625, -19.8798828125, -18.619140625, -17.3583984375, -16.09765625, -14.8369140625, -13.576171875, -12.3154296875, -11.0546875, -9.7939453125, -8.533203125, -7.2724609375, -6.01171875, -4.7509765625, -3.490234375, -2.2294921875, -0.96875, 0.2919921875, 1.552734375, 2.8134765625, 4.07421875, 5.3349609375, 6.595703125, 7.8564453125, 9.1171875, 10.3779296875, 11.638671875, 12.8994140625, 14.16015625, 15.4208984375, 16.681640625, 17.9423828125, 19.203125, 20.4638671875, 21.724609375, 22.9853515625, 24.24609375, 25.5068359375, 26.767578125, 28.0283203125, 29.2890625, 30.5498046875, 31.810546875, 33.0712890625, 34.33203125, 35.5927734375, 36.853515625, 38.1142578125, 39.375]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 5.0, 3.0, 6.0, 2.0, 10.0, 21.0, 16.0, 23.0, 37.0, 42.0, 74.0, 122.0, 161.0, 234.0, 356.0, 558.0, 828.0, 1315.0, 1971.0, 3161.0, 4967.0, 7870.0, 12397.0, 20025.0, 32723.0, 55238.0, 100907.0, 210616.0, 275045.0, 139147.0, 72229.0, 41328.0, 24892.0, 15607.0, 9596.0, 6053.0, 3900.0, 2459.0, 1605.0, 1010.0, 667.0, 440.0, 265.0, 196.0, 143.0, 94.0, 65.0, 35.0, 43.0, 17.0, 19.0, 10.0, 6.0, 1.0, 6.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-2.3359375, -2.263458251953125, -2.19097900390625, -2.118499755859375, -2.0460205078125, -1.973541259765625, -1.90106201171875, -1.828582763671875, -1.756103515625, -1.683624267578125, -1.61114501953125, -1.538665771484375, -1.4661865234375, -1.393707275390625, -1.32122802734375, -1.248748779296875, -1.17626953125, -1.103790283203125, -1.03131103515625, -0.958831787109375, -0.8863525390625, -0.813873291015625, -0.74139404296875, -0.668914794921875, -0.596435546875, -0.523956298828125, -0.45147705078125, -0.378997802734375, -0.3065185546875, -0.234039306640625, -0.16156005859375, -0.089080810546875, -0.0166015625, 0.055877685546875, 0.12835693359375, 0.200836181640625, 0.2733154296875, 0.345794677734375, 0.41827392578125, 0.490753173828125, 0.563232421875, 0.635711669921875, 0.70819091796875, 0.780670166015625, 0.8531494140625, 0.925628662109375, 0.99810791015625, 1.070587158203125, 1.14306640625, 1.215545654296875, 1.28802490234375, 1.360504150390625, 1.4329833984375, 1.505462646484375, 1.57794189453125, 1.650421142578125, 1.722900390625, 1.795379638671875, 1.86785888671875, 1.940338134765625, 2.0128173828125, 2.085296630859375, 2.15777587890625, 2.230255126953125, 2.302734375]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 7.0, 6.0, 6.0, 10.0, 12.0, 12.0, 11.0, 8.0, 18.0, 23.0, 18.0, 39.0, 31.0, 27.0, 27.0, 34.0, 34.0, 43.0, 39.0, 41.0, 1078.0, 45.0, 38.0, 52.0, 35.0, 51.0, 31.0, 28.0, 32.0, 34.0, 27.0, 18.0, 18.0, 14.0, 13.0, 7.0, 11.0, 15.0, 8.0, 4.0, 7.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.515625, -25.627685546875, -24.73974609375, -23.851806640625, -22.9638671875, -22.075927734375, -21.18798828125, -20.300048828125, -19.412109375, -18.524169921875, -17.63623046875, -16.748291015625, -15.8603515625, -14.972412109375, -14.08447265625, -13.196533203125, -12.30859375, -11.420654296875, -10.53271484375, -9.644775390625, -8.7568359375, -7.868896484375, -6.98095703125, -6.093017578125, -5.205078125, -4.317138671875, -3.42919921875, -2.541259765625, -1.6533203125, -0.765380859375, 0.12255859375, 1.010498046875, 1.8984375, 2.786376953125, 3.67431640625, 4.562255859375, 5.4501953125, 6.338134765625, 7.22607421875, 8.114013671875, 9.001953125, 9.889892578125, 10.77783203125, 11.665771484375, 12.5537109375, 13.441650390625, 14.32958984375, 15.217529296875, 16.10546875, 16.993408203125, 17.88134765625, 18.769287109375, 19.6572265625, 20.545166015625, 21.43310546875, 22.321044921875, 23.208984375, 24.096923828125, 24.98486328125, 25.872802734375, 26.7607421875, 27.648681640625, 28.53662109375, 29.424560546875, 30.3125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 5.0, 6.0, 10.0, 21.0, 26.0, 30.0, 48.0, 62.0, 100.0, 149.0, 197.0, 325.0, 495.0, 728.0, 1151.0, 1756.0, 2771.0, 4339.0, 7182.0, 11650.0, 19891.0, 35203.0, 65807.0, 139829.0, 1357629.0, 235113.0, 96070.0, 48960.0, 26982.0, 15531.0, 9373.0, 5752.0, 3509.0, 2255.0, 1427.0, 936.0, 624.0, 401.0, 246.0, 177.0, 114.0, 84.0, 56.0, 38.0, 24.0, 18.0, 15.0, 8.0, 4.0, 6.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.3203125, -2.244903564453125, -2.16949462890625, -2.094085693359375, -2.0186767578125, -1.943267822265625, -1.86785888671875, -1.792449951171875, -1.717041015625, -1.641632080078125, -1.56622314453125, -1.490814208984375, -1.4154052734375, -1.339996337890625, -1.26458740234375, -1.189178466796875, -1.11376953125, -1.038360595703125, -0.96295166015625, -0.887542724609375, -0.8121337890625, -0.736724853515625, -0.66131591796875, -0.585906982421875, -0.510498046875, -0.435089111328125, -0.35968017578125, -0.284271240234375, -0.2088623046875, -0.133453369140625, -0.05804443359375, 0.017364501953125, 0.0927734375, 0.168182373046875, 0.24359130859375, 0.319000244140625, 0.3944091796875, 0.469818115234375, 0.54522705078125, 0.620635986328125, 0.696044921875, 0.771453857421875, 0.84686279296875, 0.922271728515625, 0.9976806640625, 1.073089599609375, 1.14849853515625, 1.223907470703125, 1.29931640625, 1.374725341796875, 1.45013427734375, 1.525543212890625, 1.6009521484375, 1.676361083984375, 1.75177001953125, 1.827178955078125, 1.902587890625, 1.977996826171875, 2.05340576171875, 2.128814697265625, 2.2042236328125, 2.279632568359375, 2.35504150390625, 2.430450439453125, 2.505859375]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 8.0, 2.0, 6.0, 8.0, 6.0, 11.0, 13.0, 11.0, 10.0, 15.0, 17.0, 33.0, 29.0, 45.0, 40.0, 48.0, 50.0, 77.0, 76.0, 80.0, 56.0, 45.0, 49.0, 46.0, 32.0, 24.0, 32.0, 27.0, 27.0, 13.0, 15.0, 8.0, 10.0, 6.0, 2.0, 4.0, 5.0, 5.0, 1.0, 2.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0279083251953125, -0.02710866928100586, -0.02630901336669922, -0.025509357452392578, -0.024709701538085938, -0.023910045623779297, -0.023110389709472656, -0.022310733795166016, -0.021511077880859375, -0.020711421966552734, -0.019911766052246094, -0.019112110137939453, -0.018312454223632812, -0.017512798309326172, -0.01671314239501953, -0.01591348648071289, -0.01511383056640625, -0.01431417465209961, -0.013514518737792969, -0.012714862823486328, -0.011915206909179688, -0.011115550994873047, -0.010315895080566406, -0.009516239166259766, -0.008716583251953125, -0.007916927337646484, -0.007117271423339844, -0.006317615509033203, -0.0055179595947265625, -0.004718303680419922, -0.003918647766113281, -0.0031189918518066406, -0.0023193359375, -0.0015196800231933594, -0.0007200241088867188, 7.963180541992188e-05, 0.0008792877197265625, 0.0016789436340332031, 0.0024785995483398438, 0.0032782554626464844, 0.004077911376953125, 0.004877567291259766, 0.005677223205566406, 0.006476879119873047, 0.0072765350341796875, 0.008076190948486328, 0.008875846862792969, 0.00967550277709961, 0.01047515869140625, 0.01127481460571289, 0.012074470520019531, 0.012874126434326172, 0.013673782348632812, 0.014473438262939453, 0.015273094177246094, 0.016072750091552734, 0.016872406005859375, 0.017672061920166016, 0.018471717834472656, 0.019271373748779297, 0.020071029663085938, 0.020870685577392578, 0.02167034149169922, 0.02246999740600586, 0.0232696533203125]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 2.0, 8.0, 6.0, 5.0, 6.0, 7.0, 17.0, 15.0, 16.0, 20.0, 29.0, 37.0, 49.0, 75.0, 79.0, 113.0, 185.0, 559.0, 4801.0, 144880.0, 882788.0, 12915.0, 1139.0, 280.0, 129.0, 93.0, 65.0, 46.0, 47.0, 22.0, 24.0, 13.0, 19.0, 19.0, 9.0, 9.0, 5.0, 2.0, 10.0, 3.0, 2.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.4189453125, -0.4045906066894531, -0.39023590087890625, -0.3758811950683594, -0.3615264892578125, -0.3471717834472656, -0.33281707763671875, -0.3184623718261719, -0.304107666015625, -0.2897529602050781, -0.27539825439453125, -0.2610435485839844, -0.2466888427734375, -0.23233413696289062, -0.21797943115234375, -0.20362472534179688, -0.18927001953125, -0.17491531372070312, -0.16056060791015625, -0.14620590209960938, -0.1318511962890625, -0.11749649047851562, -0.10314178466796875, -0.08878707885742188, -0.074432373046875, -0.060077667236328125, -0.04572296142578125, -0.031368255615234375, -0.0170135498046875, -0.002658843994140625, 0.01169586181640625, 0.026050567626953125, 0.0404052734375, 0.054759979248046875, 0.06911468505859375, 0.08346939086914062, 0.0978240966796875, 0.11217880249023438, 0.12653350830078125, 0.14088821411132812, 0.155242919921875, 0.16959762573242188, 0.18395233154296875, 0.19830703735351562, 0.2126617431640625, 0.22701644897460938, 0.24137115478515625, 0.2557258605957031, 0.27008056640625, 0.2844352722167969, 0.29878997802734375, 0.3131446838378906, 0.3274993896484375, 0.3418540954589844, 0.35620880126953125, 0.3705635070800781, 0.384918212890625, 0.3992729187011719, 0.41362762451171875, 0.4279823303222656, 0.4423370361328125, 0.4566917419433594, 0.47104644775390625, 0.4854011535644531, 0.499755859375]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 24.0, 188.0, 725.0, 73.0, 5.0, 2.0, 1.0], "bins": [-0.27860090136528015, -0.27390599250793457, -0.269211083650589, -0.2645161747932434, -0.2598212659358978, -0.25512635707855225, -0.25043144822120667, -0.24573653936386108, -0.2410416305065155, -0.23634672164916992, -0.23165181279182434, -0.22695690393447876, -0.22226199507713318, -0.2175670862197876, -0.21287217736244202, -0.20817726850509644, -0.20348235964775085, -0.19878745079040527, -0.1940925419330597, -0.1893976330757141, -0.18470272421836853, -0.18000781536102295, -0.17531290650367737, -0.1706179976463318, -0.165923073887825, -0.16122816503047943, -0.15653325617313385, -0.15183834731578827, -0.1471434384584427, -0.1424485296010971, -0.13775362074375153, -0.13305871188640594, -0.12836380302906036, -0.12366889417171478, -0.1189739853143692, -0.11427907645702362, -0.10958416759967804, -0.10488925874233246, -0.10019434988498688, -0.0954994410276413, -0.09080452471971512, -0.08610961586236954, -0.08141470700502396, -0.07671979814767838, -0.0720248892903328, -0.06732998043298721, -0.06263506412506104, -0.05794015899300575, -0.05324524641036987, -0.04855033755302429, -0.04385542869567871, -0.03916051983833313, -0.03446561098098755, -0.02977070026099682, -0.025075789541006088, -0.020380880683660507, -0.015685973688960075, -0.010991064831614494, -0.006296155042946339, -0.001601245254278183, 0.003093663603067398, 0.007788572460412979, 0.01248348318040371, 0.01717839203774929, 0.02187330089509487]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 2.0, 1.0, 4.0, 10.0, 10.0, 5.0, 12.0, 8.0, 21.0, 15.0, 17.0, 20.0, 18.0, 18.0, 31.0, 23.0, 33.0, 40.0, 34.0, 36.0, 38.0, 48.0, 41.0, 54.0, 40.0, 42.0, 42.0, 38.0, 38.0, 28.0, 28.0, 25.0, 22.0, 23.0, 27.0, 16.0, 16.0, 13.0, 18.0, 11.0, 10.0, 6.0, 4.0, 5.0, 5.0, 7.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.013894498348236084, -0.013451100327074528, -0.013007702305912971, -0.012564304284751415, -0.012120906263589859, -0.011677508242428303, -0.011234110221266747, -0.01079071220010519, -0.010347314178943634, -0.009903916157782078, -0.009460518136620522, -0.009017120115458965, -0.008573722094297409, -0.008130324073135853, -0.007686926051974297, -0.00724352803081274, -0.006800130009651184, -0.006356731988489628, -0.005913333967328072, -0.005469935946166515, -0.005026537925004959, -0.004583139903843403, -0.004139741882681847, -0.0036963438615202904, -0.003252945840358734, -0.002809547819197178, -0.0023661497980356216, -0.0019227517768740654, -0.0014793537557125092, -0.001035955734550953, -0.0005925577133893967, -0.00014915969222784042, 0.0002942383289337158, 0.0007376363500952721, 0.0011810343712568283, 0.0016244323924183846, 0.002067830413579941, 0.002511228434741497, 0.0029546264559030533, 0.0033980244770646095, 0.0038414224982261658, 0.004284820519387722, 0.004728218540549278, 0.0051716165617108345, 0.005615014582872391, 0.006058412604033947, 0.006501810625195503, 0.0069452086463570595, 0.007388606667518616, 0.007832004688680172, 0.008275402709841728, 0.008718800731003284, 0.00916219875216484, 0.009605596773326397, 0.010048994794487953, 0.01049239281564951, 0.010935790836811066, 0.011379188857972622, 0.011822586879134178, 0.012265984900295734, 0.01270938292145729, 0.013152780942618847, 0.013596178963780403, 0.01403957698494196, 0.014482975006103516]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 5.0, 1.0, 5.0, 6.0, 4.0, 3.0, 8.0, 11.0, 10.0, 10.0, 16.0, 11.0, 21.0, 20.0, 18.0, 29.0, 31.0, 23.0, 32.0, 31.0, 40.0, 28.0, 39.0, 44.0, 32.0, 34.0, 44.0, 47.0, 33.0, 30.0, 51.0, 22.0, 27.0, 23.0, 30.0, 16.0, 25.0, 20.0, 18.0, 14.0, 24.0, 15.0, 9.0, 8.0, 9.0, 4.0, 6.0, 6.0, 2.0, 8.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-41.3125, -40.0517578125, -38.791015625, -37.5302734375, -36.26953125, -35.0087890625, -33.748046875, -32.4873046875, -31.2265625, -29.9658203125, -28.705078125, -27.4443359375, -26.18359375, -24.9228515625, -23.662109375, -22.4013671875, -21.140625, -19.8798828125, -18.619140625, -17.3583984375, -16.09765625, -14.8369140625, -13.576171875, -12.3154296875, -11.0546875, -9.7939453125, -8.533203125, -7.2724609375, -6.01171875, -4.7509765625, -3.490234375, -2.2294921875, -0.96875, 0.2919921875, 1.552734375, 2.8134765625, 4.07421875, 5.3349609375, 6.595703125, 7.8564453125, 9.1171875, 10.3779296875, 11.638671875, 12.8994140625, 14.16015625, 15.4208984375, 16.681640625, 17.9423828125, 19.203125, 20.4638671875, 21.724609375, 22.9853515625, 24.24609375, 25.5068359375, 26.767578125, 28.0283203125, 29.2890625, 30.5498046875, 31.810546875, 33.0712890625, 34.33203125, 35.5927734375, 36.853515625, 38.1142578125, 39.375]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 7.0, 3.0, 12.0, 12.0, 11.0, 12.0, 23.0, 34.0, 41.0, 51.0, 92.0, 125.0, 169.0, 283.0, 467.0, 701.0, 1140.0, 1850.0, 3107.0, 5312.0, 9104.0, 17000.0, 32615.0, 67058.0, 151648.0, 346962.0, 223132.0, 93565.0, 43550.0, 21954.0, 11983.0, 6458.0, 3872.0, 2219.0, 1418.0, 901.0, 552.0, 363.0, 220.0, 154.0, 110.0, 82.0, 46.0, 41.0, 27.0, 13.0, 17.0, 15.0, 6.0, 8.0, 5.0, 4.0, 2.0, 6.0, 1.0, 1.0, 1.0], "bins": [-15.984375, -15.4957275390625, -15.007080078125, -14.5184326171875, -14.02978515625, -13.5411376953125, -13.052490234375, -12.5638427734375, -12.0751953125, -11.5865478515625, -11.097900390625, -10.6092529296875, -10.12060546875, -9.6319580078125, -9.143310546875, -8.6546630859375, -8.166015625, -7.6773681640625, -7.188720703125, -6.7000732421875, -6.21142578125, -5.7227783203125, -5.234130859375, -4.7454833984375, -4.2568359375, -3.7681884765625, -3.279541015625, -2.7908935546875, -2.30224609375, -1.8135986328125, -1.324951171875, -0.8363037109375, -0.34765625, 0.1409912109375, 0.629638671875, 1.1182861328125, 1.60693359375, 2.0955810546875, 2.584228515625, 3.0728759765625, 3.5615234375, 4.0501708984375, 4.538818359375, 5.0274658203125, 5.51611328125, 6.0047607421875, 6.493408203125, 6.9820556640625, 7.470703125, 7.9593505859375, 8.447998046875, 8.9366455078125, 9.42529296875, 9.9139404296875, 10.402587890625, 10.8912353515625, 11.3798828125, 11.8685302734375, 12.357177734375, 12.8458251953125, 13.33447265625, 13.8231201171875, 14.311767578125, 14.8004150390625, 15.2890625]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 1.0, 4.0, 7.0, 5.0, 8.0, 17.0, 11.0, 19.0, 28.0, 29.0, 26.0, 25.0, 25.0, 41.0, 32.0, 42.0, 53.0, 43.0, 57.0, 288.0, 1762.0, 94.0, 57.0, 50.0, 32.0, 43.0, 35.0, 37.0, 30.0, 28.0, 14.0, 19.0, 11.0, 15.0, 14.0, 12.0, 11.0, 6.0, 2.0, 5.0, 3.0, 3.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-113.9375, -109.7509765625, -105.564453125, -101.3779296875, -97.19140625, -93.0048828125, -88.818359375, -84.6318359375, -80.4453125, -76.2587890625, -72.072265625, -67.8857421875, -63.69921875, -59.5126953125, -55.326171875, -51.1396484375, -46.953125, -42.7666015625, -38.580078125, -34.3935546875, -30.20703125, -26.0205078125, -21.833984375, -17.6474609375, -13.4609375, -9.2744140625, -5.087890625, -0.9013671875, 3.28515625, 7.4716796875, 11.658203125, 15.8447265625, 20.03125, 24.2177734375, 28.404296875, 32.5908203125, 36.77734375, 40.9638671875, 45.150390625, 49.3369140625, 53.5234375, 57.7099609375, 61.896484375, 66.0830078125, 70.26953125, 74.4560546875, 78.642578125, 82.8291015625, 87.015625, 91.2021484375, 95.388671875, 99.5751953125, 103.76171875, 107.9482421875, 112.134765625, 116.3212890625, 120.5078125, 124.6943359375, 128.880859375, 133.0673828125, 137.25390625, 141.4404296875, 145.626953125, 149.8134765625, 154.0]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 4.0, 2.0, 4.0, 5.0, 5.0, 5.0, 9.0, 7.0, 15.0, 17.0, 25.0, 24.0, 23.0, 34.0, 43.0, 72.0, 91.0, 93.0, 163.0, 190.0, 307.0, 773.0, 5214.0, 3113589.0, 22488.0, 1154.0, 372.0, 221.0, 185.0, 120.0, 129.0, 67.0, 56.0, 36.0, 38.0, 45.0, 24.0, 13.0, 17.0, 5.0, 8.0, 6.0, 2.0, 5.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0], "bins": [-363.75, -354.08984375, -344.4296875, -334.76953125, -325.109375, -315.44921875, -305.7890625, -296.12890625, -286.46875, -276.80859375, -267.1484375, -257.48828125, -247.828125, -238.16796875, -228.5078125, -218.84765625, -209.1875, -199.52734375, -189.8671875, -180.20703125, -170.546875, -160.88671875, -151.2265625, -141.56640625, -131.90625, -122.24609375, -112.5859375, -102.92578125, -93.265625, -83.60546875, -73.9453125, -64.28515625, -54.625, -44.96484375, -35.3046875, -25.64453125, -15.984375, -6.32421875, 3.3359375, 12.99609375, 22.65625, 32.31640625, 41.9765625, 51.63671875, 61.296875, 70.95703125, 80.6171875, 90.27734375, 99.9375, 109.59765625, 119.2578125, 128.91796875, 138.578125, 148.23828125, 157.8984375, 167.55859375, 177.21875, 186.87890625, 196.5390625, 206.19921875, 215.859375, 225.51953125, 235.1796875, 244.83984375, 254.5]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 126.0, 748.0, 137.0, 3.0, 1.0, 2.0], "bins": [-1179.3955078125, -1159.5711669921875, -1139.746826171875, -1119.9224853515625, -1100.0980224609375, -1080.273681640625, -1060.4493408203125, -1040.625, -1020.8006591796875, -1000.976318359375, -981.1519165039062, -961.3275756835938, -941.5032348632812, -921.6788940429688, -901.8544921875, -882.0301513671875, -862.205810546875, -842.3814697265625, -822.5570678710938, -802.7327270507812, -782.9083862304688, -763.0840454101562, -743.2596435546875, -723.435302734375, -703.6109008789062, -683.7865600585938, -663.962158203125, -644.1378173828125, -624.3134765625, -604.4891357421875, -584.6647338867188, -564.8403930664062, -545.0159912109375, -525.191650390625, -505.3672790527344, -485.54290771484375, -465.71856689453125, -445.8941955566406, -426.06982421875, -406.2454833984375, -386.421142578125, -366.5967712402344, -346.7724304199219, -326.94805908203125, -307.12371826171875, -287.2993469238281, -267.4749755859375, -247.650634765625, -227.8262939453125, -208.00193786621094, -188.17758178710938, -168.35321044921875, -148.52886962890625, -128.70449829101562, -108.88014221191406, -89.0557861328125, -69.23143005371094, -49.407073974609375, -29.582714080810547, -9.758354187011719, 10.066001892089844, 29.890357971191406, 49.7147216796875, 69.53907775878906, 89.36343383789062]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 1.0, 5.0, 6.0, 10.0, 9.0, 20.0, 18.0, 19.0, 18.0, 29.0, 21.0, 34.0, 26.0, 31.0, 41.0, 53.0, 59.0, 49.0, 48.0, 57.0, 42.0, 42.0, 38.0, 35.0, 37.0, 37.0, 34.0, 31.0, 23.0, 23.0, 16.0, 18.0, 14.0, 11.0, 17.0, 8.0, 3.0, 4.0, 6.0, 0.0, 4.0, 0.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-346.5399169921875, -335.1388854980469, -323.7378234863281, -312.3367919921875, -300.9357604980469, -289.53472900390625, -278.1336669921875, -266.7326354980469, -255.3315887451172, -243.9305419921875, -232.52951049804688, -221.1284637451172, -209.7274169921875, -198.32638549804688, -186.9253387451172, -175.5242919921875, -164.12326049804688, -152.7222137451172, -141.32118225097656, -129.92013549804688, -118.51909637451172, -107.11805725097656, -95.71701049804688, -84.31597137451172, -72.91493225097656, -61.513893127441406, -50.112850189208984, -38.71180725097656, -27.310768127441406, -15.90972900390625, -4.5086822509765625, 6.892356872558594, 18.29339599609375, 29.69443702697754, 41.09547805786133, 52.49652099609375, 63.897560119628906, 75.29859924316406, 86.69964599609375, 98.1006851196289, 109.50172424316406, 120.90276336669922, 132.30380249023438, 143.70484924316406, 155.10589599609375, 166.50692749023438, 177.90797424316406, 189.30902099609375, 200.71005249023438, 212.11109924316406, 223.5121307373047, 234.91317749023438, 246.314208984375, 257.71527099609375, 269.1163024902344, 280.517333984375, 291.91839599609375, 303.3194274902344, 314.7204895019531, 326.12152099609375, 337.5225524902344, 348.923583984375, 360.32464599609375, 371.7256774902344, 383.126708984375]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 5.0, 5.0, 4.0, 5.0, 9.0, 5.0, 15.0, 7.0, 13.0, 16.0, 13.0, 19.0, 18.0, 24.0, 32.0, 23.0, 23.0, 37.0, 30.0, 41.0, 33.0, 34.0, 33.0, 45.0, 41.0, 39.0, 31.0, 30.0, 46.0, 43.0, 24.0, 23.0, 20.0, 27.0, 22.0, 14.0, 23.0, 18.0, 14.0, 22.0, 17.0, 14.0, 4.0, 8.0, 5.0, 8.0, 3.0, 3.0, 5.0, 2.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-39.15625, -37.9091796875, -36.662109375, -35.4150390625, -34.16796875, -32.9208984375, -31.673828125, -30.4267578125, -29.1796875, -27.9326171875, -26.685546875, -25.4384765625, -24.19140625, -22.9443359375, -21.697265625, -20.4501953125, -19.203125, -17.9560546875, -16.708984375, -15.4619140625, -14.21484375, -12.9677734375, -11.720703125, -10.4736328125, -9.2265625, -7.9794921875, -6.732421875, -5.4853515625, -4.23828125, -2.9912109375, -1.744140625, -0.4970703125, 0.75, 1.9970703125, 3.244140625, 4.4912109375, 5.73828125, 6.9853515625, 8.232421875, 9.4794921875, 10.7265625, 11.9736328125, 13.220703125, 14.4677734375, 15.71484375, 16.9619140625, 18.208984375, 19.4560546875, 20.703125, 21.9501953125, 23.197265625, 24.4443359375, 25.69140625, 26.9384765625, 28.185546875, 29.4326171875, 30.6796875, 31.9267578125, 33.173828125, 34.4208984375, 35.66796875, 36.9150390625, 38.162109375, 39.4091796875, 40.65625]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [5.0, 2.0, 2.0, 1.0, 8.0, 3.0, 2.0, 6.0, 6.0, 12.0, 16.0, 9.0, 19.0, 30.0, 24.0, 40.0, 82.0, 83.0, 118.0, 141.0, 186.0, 249.0, 382.0, 502.0, 765.0, 1135.0, 1757.0, 2890.0, 5208.0, 11255.0, 76758.0, 1695900.0, 2265230.0, 104036.0, 13062.0, 5722.0, 3035.0, 1836.0, 1145.0, 736.0, 505.0, 343.0, 260.0, 210.0, 134.0, 110.0, 88.0, 48.0, 49.0, 39.0, 25.0, 20.0, 19.0, 12.0, 12.0, 4.0, 6.0, 8.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0], "bins": [-116.8125, -113.16796875, -109.5234375, -105.87890625, -102.234375, -98.58984375, -94.9453125, -91.30078125, -87.65625, -84.01171875, -80.3671875, -76.72265625, -73.078125, -69.43359375, -65.7890625, -62.14453125, -58.5, -54.85546875, -51.2109375, -47.56640625, -43.921875, -40.27734375, -36.6328125, -32.98828125, -29.34375, -25.69921875, -22.0546875, -18.41015625, -14.765625, -11.12109375, -7.4765625, -3.83203125, -0.1875, 3.45703125, 7.1015625, 10.74609375, 14.390625, 18.03515625, 21.6796875, 25.32421875, 28.96875, 32.61328125, 36.2578125, 39.90234375, 43.546875, 47.19140625, 50.8359375, 54.48046875, 58.125, 61.76953125, 65.4140625, 69.05859375, 72.703125, 76.34765625, 79.9921875, 83.63671875, 87.28125, 90.92578125, 94.5703125, 98.21484375, 101.859375, 105.50390625, 109.1484375, 112.79296875, 116.4375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 5.0, 8.0, 14.0, 10.0, 12.0, 11.0, 20.0, 22.0, 34.0, 70.0, 99.0, 184.0, 386.0, 704.0, 966.0, 702.0, 317.0, 183.0, 96.0, 61.0, 32.0, 27.0, 15.0, 17.0, 22.0, 13.0, 6.0, 6.0, 3.0, 7.0, 2.0, 4.0, 3.0, 6.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-106.3125, -103.474609375, -100.63671875, -97.798828125, -94.9609375, -92.123046875, -89.28515625, -86.447265625, -83.609375, -80.771484375, -77.93359375, -75.095703125, -72.2578125, -69.419921875, -66.58203125, -63.744140625, -60.90625, -58.068359375, -55.23046875, -52.392578125, -49.5546875, -46.716796875, -43.87890625, -41.041015625, -38.203125, -35.365234375, -32.52734375, -29.689453125, -26.8515625, -24.013671875, -21.17578125, -18.337890625, -15.5, -12.662109375, -9.82421875, -6.986328125, -4.1484375, -1.310546875, 1.52734375, 4.365234375, 7.203125, 10.041015625, 12.87890625, 15.716796875, 18.5546875, 21.392578125, 24.23046875, 27.068359375, 29.90625, 32.744140625, 35.58203125, 38.419921875, 41.2578125, 44.095703125, 46.93359375, 49.771484375, 52.609375, 55.447265625, 58.28515625, 61.123046875, 63.9609375, 66.798828125, 69.63671875, 72.474609375, 75.3125]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 7.0, 6.0, 1.0, 4.0, 5.0, 3.0, 11.0, 15.0, 20.0, 23.0, 18.0, 46.0, 78.0, 160.0, 380.0, 1161.0, 4721.0, 28290.0, 3214492.0, 918071.0, 21285.0, 3883.0, 948.0, 318.0, 128.0, 75.0, 38.0, 21.0, 13.0, 11.0, 17.0, 14.0, 7.0, 4.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-286.75, -276.1015625, -265.453125, -254.8046875, -244.15625, -233.5078125, -222.859375, -212.2109375, -201.5625, -190.9140625, -180.265625, -169.6171875, -158.96875, -148.3203125, -137.671875, -127.0234375, -116.375, -105.7265625, -95.078125, -84.4296875, -73.78125, -63.1328125, -52.484375, -41.8359375, -31.1875, -20.5390625, -9.890625, 0.7578125, 11.40625, 22.0546875, 32.703125, 43.3515625, 54.0, 64.6484375, 75.296875, 85.9453125, 96.59375, 107.2421875, 117.890625, 128.5390625, 139.1875, 149.8359375, 160.484375, 171.1328125, 181.78125, 192.4296875, 203.078125, 213.7265625, 224.375, 235.0234375, 245.671875, 256.3203125, 266.96875, 277.6171875, 288.265625, 298.9140625, 309.5625, 320.2109375, 330.859375, 341.5078125, 352.15625, 362.8046875, 373.453125, 384.1015625, 394.75]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 6.0, 14.0, 21.0, 35.0, 72.0, 181.0, 269.0, 208.0, 102.0, 39.0, 28.0, 25.0, 9.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-794.7993774414062, -774.7706298828125, -754.7418823242188, -734.713134765625, -714.6843872070312, -694.6556396484375, -674.6268920898438, -654.59814453125, -634.5693969726562, -614.5406494140625, -594.5119018554688, -574.483154296875, -554.4544067382812, -534.4256591796875, -514.3969116210938, -494.3681640625, -474.33941650390625, -454.3106689453125, -434.28192138671875, -414.253173828125, -394.22442626953125, -374.1956787109375, -354.16693115234375, -334.13818359375, -314.10943603515625, -294.0806884765625, -274.05194091796875, -254.023193359375, -233.99444580078125, -213.9656982421875, -193.93695068359375, -173.908203125, -153.87945556640625, -133.8507080078125, -113.82196044921875, -93.793212890625, -73.76446533203125, -53.7357177734375, -33.70697021484375, -13.67822265625, 6.35052490234375, 26.3792724609375, 46.40802001953125, 66.436767578125, 86.46551513671875, 106.4942626953125, 126.52301025390625, 146.5517578125, 166.58050537109375, 186.6092529296875, 206.63800048828125, 226.666748046875, 246.69549560546875, 266.7242431640625, 286.75299072265625, 306.78173828125, 326.81048583984375, 346.8392333984375, 366.86798095703125, 386.896728515625, 406.92547607421875, 426.9542236328125, 446.98297119140625, 467.01171875, 487.04046630859375]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 1.0, 5.0, 11.0, 9.0, 6.0, 5.0, 13.0, 13.0, 16.0, 13.0, 16.0, 18.0, 21.0, 33.0, 30.0, 36.0, 27.0, 33.0, 42.0, 41.0, 37.0, 45.0, 46.0, 40.0, 47.0, 36.0, 44.0, 28.0, 37.0, 29.0, 21.0, 34.0, 21.0, 26.0, 20.0, 16.0, 7.0, 12.0, 17.0, 6.0, 8.0, 9.0, 7.0, 7.0, 8.0, 2.0, 3.0, 1.0, 2.0, 5.0, 2.0], "bins": [-243.2111053466797, -236.49725341796875, -229.7834014892578, -223.06954956054688, -216.35569763183594, -209.641845703125, -202.92799377441406, -196.21414184570312, -189.5002899169922, -182.78643798828125, -176.0725860595703, -169.35873413085938, -162.64488220214844, -155.9310302734375, -149.21717834472656, -142.50332641601562, -135.7894744873047, -129.07562255859375, -122.36177062988281, -115.64791870117188, -108.93406677246094, -102.22021484375, -95.50636291503906, -88.79251098632812, -82.07865905761719, -75.36480712890625, -68.65095520019531, -61.937103271484375, -55.22325134277344, -48.5093994140625, -41.79554748535156, -35.081695556640625, -28.36785888671875, -21.654006958007812, -14.940155029296875, -8.226303100585938, -1.512451171875, 5.2014007568359375, 11.915252685546875, 18.629104614257812, 25.34295654296875, 32.05680847167969, 38.770660400390625, 45.48451232910156, 52.1983642578125, 58.91221618652344, 65.62606811523438, 72.33992004394531, 79.05377197265625, 85.76762390136719, 92.48147583007812, 99.19532775878906, 105.9091796875, 112.62303161621094, 119.33688354492188, 126.05073547363281, 132.76458740234375, 139.4784393310547, 146.19229125976562, 152.90614318847656, 159.6199951171875, 166.33384704589844, 173.04769897460938, 179.7615509033203, 186.47540283203125]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 7.0, 2.0, 4.0, 2.0, 4.0, 5.0, 3.0, 4.0, 9.0, 7.0, 9.0, 12.0, 13.0, 15.0, 20.0, 22.0, 18.0, 33.0, 30.0, 32.0, 27.0, 38.0, 26.0, 41.0, 40.0, 44.0, 42.0, 47.0, 39.0, 35.0, 38.0, 29.0, 33.0, 21.0, 27.0, 34.0, 31.0, 22.0, 18.0, 22.0, 17.0, 17.0, 13.0, 5.0, 13.0, 8.0, 8.0, 12.0, 3.0, 1.0, 8.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-42.8125, -41.48291015625, -40.1533203125, -38.82373046875, -37.494140625, -36.16455078125, -34.8349609375, -33.50537109375, -32.17578125, -30.84619140625, -29.5166015625, -28.18701171875, -26.857421875, -25.52783203125, -24.1982421875, -22.86865234375, -21.5390625, -20.20947265625, -18.8798828125, -17.55029296875, -16.220703125, -14.89111328125, -13.5615234375, -12.23193359375, -10.90234375, -9.57275390625, -8.2431640625, -6.91357421875, -5.583984375, -4.25439453125, -2.9248046875, -1.59521484375, -0.265625, 1.06396484375, 2.3935546875, 3.72314453125, 5.052734375, 6.38232421875, 7.7119140625, 9.04150390625, 10.37109375, 11.70068359375, 13.0302734375, 14.35986328125, 15.689453125, 17.01904296875, 18.3486328125, 19.67822265625, 21.0078125, 22.33740234375, 23.6669921875, 24.99658203125, 26.326171875, 27.65576171875, 28.9853515625, 30.31494140625, 31.64453125, 32.97412109375, 34.3037109375, 35.63330078125, 36.962890625, 38.29248046875, 39.6220703125, 40.95166015625, 42.28125]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 6.0, 4.0, 6.0, 7.0, 19.0, 26.0, 55.0, 68.0, 126.0, 183.0, 230.0, 347.0, 432.0, 719.0, 1036.0, 1388.0, 2077.0, 3016.0, 4437.0, 6469.0, 9719.0, 14537.0, 22377.0, 34614.0, 56526.0, 100057.0, 206923.0, 262389.0, 130142.0, 69405.0, 42132.0, 26830.0, 17175.0, 11251.0, 7532.0, 5037.0, 3454.0, 2405.0, 1678.0, 1071.0, 857.0, 555.0, 403.0, 278.0, 176.0, 115.0, 76.0, 66.0, 45.0, 36.0, 18.0, 12.0, 10.0, 4.0, 7.0, 1.0, 2.0], "bins": [-2.296875, -2.229705810546875, -2.16253662109375, -2.095367431640625, -2.0281982421875, -1.961029052734375, -1.89385986328125, -1.826690673828125, -1.759521484375, -1.692352294921875, -1.62518310546875, -1.558013916015625, -1.4908447265625, -1.423675537109375, -1.35650634765625, -1.289337158203125, -1.22216796875, -1.154998779296875, -1.08782958984375, -1.020660400390625, -0.9534912109375, -0.886322021484375, -0.81915283203125, -0.751983642578125, -0.684814453125, -0.617645263671875, -0.55047607421875, -0.483306884765625, -0.4161376953125, -0.348968505859375, -0.28179931640625, -0.214630126953125, -0.1474609375, -0.080291748046875, -0.01312255859375, 0.054046630859375, 0.1212158203125, 0.188385009765625, 0.25555419921875, 0.322723388671875, 0.389892578125, 0.457061767578125, 0.52423095703125, 0.591400146484375, 0.6585693359375, 0.725738525390625, 0.79290771484375, 0.860076904296875, 0.92724609375, 0.994415283203125, 1.06158447265625, 1.128753662109375, 1.1959228515625, 1.263092041015625, 1.33026123046875, 1.397430419921875, 1.464599609375, 1.531768798828125, 1.59893798828125, 1.666107177734375, 1.7332763671875, 1.800445556640625, 1.86761474609375, 1.934783935546875, 2.001953125]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 2.0, 7.0, 6.0, 4.0, 9.0, 10.0, 16.0, 17.0, 22.0, 24.0, 34.0, 30.0, 32.0, 32.0, 44.0, 36.0, 23.0, 39.0, 49.0, 40.0, 1066.0, 50.0, 40.0, 37.0, 27.0, 42.0, 28.0, 39.0, 29.0, 23.0, 33.0, 25.0, 20.0, 18.0, 15.0, 10.0, 11.0, 12.0, 6.0, 6.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-32.71875, -31.747314453125, -30.77587890625, -29.804443359375, -28.8330078125, -27.861572265625, -26.89013671875, -25.918701171875, -24.947265625, -23.975830078125, -23.00439453125, -22.032958984375, -21.0615234375, -20.090087890625, -19.11865234375, -18.147216796875, -17.17578125, -16.204345703125, -15.23291015625, -14.261474609375, -13.2900390625, -12.318603515625, -11.34716796875, -10.375732421875, -9.404296875, -8.432861328125, -7.46142578125, -6.489990234375, -5.5185546875, -4.547119140625, -3.57568359375, -2.604248046875, -1.6328125, -0.661376953125, 0.31005859375, 1.281494140625, 2.2529296875, 3.224365234375, 4.19580078125, 5.167236328125, 6.138671875, 7.110107421875, 8.08154296875, 9.052978515625, 10.0244140625, 10.995849609375, 11.96728515625, 12.938720703125, 13.91015625, 14.881591796875, 15.85302734375, 16.824462890625, 17.7958984375, 18.767333984375, 19.73876953125, 20.710205078125, 21.681640625, 22.653076171875, 23.62451171875, 24.595947265625, 25.5673828125, 26.538818359375, 27.51025390625, 28.481689453125, 29.453125]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 6.0, 7.0, 12.0, 19.0, 28.0, 33.0, 60.0, 70.0, 111.0, 136.0, 191.0, 321.0, 502.0, 731.0, 1093.0, 1663.0, 2737.0, 4415.0, 7199.0, 12213.0, 20948.0, 36921.0, 67298.0, 135699.0, 1355143.0, 230681.0, 97193.0, 51343.0, 28642.0, 16475.0, 9565.0, 5821.0, 3544.0, 2157.0, 1359.0, 939.0, 610.0, 423.0, 251.0, 174.0, 113.0, 92.0, 65.0, 36.0, 36.0, 22.0, 12.0, 10.0, 5.0, 1.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0], "bins": [-2.640625, -2.56005859375, -2.4794921875, -2.39892578125, -2.318359375, -2.23779296875, -2.1572265625, -2.07666015625, -1.99609375, -1.91552734375, -1.8349609375, -1.75439453125, -1.673828125, -1.59326171875, -1.5126953125, -1.43212890625, -1.3515625, -1.27099609375, -1.1904296875, -1.10986328125, -1.029296875, -0.94873046875, -0.8681640625, -0.78759765625, -0.70703125, -0.62646484375, -0.5458984375, -0.46533203125, -0.384765625, -0.30419921875, -0.2236328125, -0.14306640625, -0.0625, 0.01806640625, 0.0986328125, 0.17919921875, 0.259765625, 0.34033203125, 0.4208984375, 0.50146484375, 0.58203125, 0.66259765625, 0.7431640625, 0.82373046875, 0.904296875, 0.98486328125, 1.0654296875, 1.14599609375, 1.2265625, 1.30712890625, 1.3876953125, 1.46826171875, 1.548828125, 1.62939453125, 1.7099609375, 1.79052734375, 1.87109375, 1.95166015625, 2.0322265625, 2.11279296875, 2.193359375, 2.27392578125, 2.3544921875, 2.43505859375, 2.515625]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 3.0, 3.0, 6.0, 2.0, 10.0, 7.0, 8.0, 12.0, 14.0, 18.0, 17.0, 25.0, 25.0, 38.0, 51.0, 58.0, 82.0, 96.0, 106.0, 74.0, 76.0, 54.0, 46.0, 34.0, 33.0, 26.0, 12.0, 13.0, 9.0, 12.0, 10.0, 10.0, 5.0, 2.0, 5.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.036590576171875, -0.03548240661621094, -0.034374237060546875, -0.03326606750488281, -0.03215789794921875, -0.031049728393554688, -0.029941558837890625, -0.028833389282226562, -0.0277252197265625, -0.026617050170898438, -0.025508880615234375, -0.024400711059570312, -0.02329254150390625, -0.022184371948242188, -0.021076202392578125, -0.019968032836914062, -0.01885986328125, -0.017751693725585938, -0.016643524169921875, -0.015535354614257812, -0.01442718505859375, -0.013319015502929688, -0.012210845947265625, -0.011102676391601562, -0.0099945068359375, -0.008886337280273438, -0.007778167724609375, -0.0066699981689453125, -0.00556182861328125, -0.0044536590576171875, -0.003345489501953125, -0.0022373199462890625, -0.001129150390625, -2.09808349609375e-05, 0.001087188720703125, 0.0021953582763671875, 0.00330352783203125, 0.0044116973876953125, 0.005519866943359375, 0.0066280364990234375, 0.0077362060546875, 0.008844375610351562, 0.009952545166015625, 0.011060714721679688, 0.01216888427734375, 0.013277053833007812, 0.014385223388671875, 0.015493392944335938, 0.0166015625, 0.017709732055664062, 0.018817901611328125, 0.019926071166992188, 0.02103424072265625, 0.022142410278320312, 0.023250579833984375, 0.024358749389648438, 0.0254669189453125, 0.026575088500976562, 0.027683258056640625, 0.028791427612304688, 0.02989959716796875, 0.031007766723632812, 0.032115936279296875, 0.03322410583496094, 0.034332275390625]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 0.0, 1.0, 1.0, 6.0, 4.0, 9.0, 13.0, 15.0, 7.0, 18.0, 22.0, 23.0, 50.0, 45.0, 66.0, 121.0, 164.0, 390.0, 3000.0, 840422.0, 201523.0, 1855.0, 319.0, 141.0, 81.0, 63.0, 46.0, 24.0, 32.0, 20.0, 18.0, 12.0, 12.0, 11.0, 3.0, 6.0, 3.0, 2.0, 2.0, 4.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.630859375, -0.6104583740234375, -0.590057373046875, -0.5696563720703125, -0.54925537109375, -0.5288543701171875, -0.508453369140625, -0.4880523681640625, -0.4676513671875, -0.4472503662109375, -0.426849365234375, -0.4064483642578125, -0.38604736328125, -0.3656463623046875, -0.345245361328125, -0.3248443603515625, -0.304443359375, -0.2840423583984375, -0.263641357421875, -0.2432403564453125, -0.22283935546875, -0.2024383544921875, -0.182037353515625, -0.1616363525390625, -0.1412353515625, -0.1208343505859375, -0.100433349609375, -0.0800323486328125, -0.05963134765625, -0.0392303466796875, -0.018829345703125, 0.0015716552734375, 0.02197265625, 0.0423736572265625, 0.062774658203125, 0.0831756591796875, 0.10357666015625, 0.1239776611328125, 0.144378662109375, 0.1647796630859375, 0.1851806640625, 0.2055816650390625, 0.225982666015625, 0.2463836669921875, 0.26678466796875, 0.2871856689453125, 0.307586669921875, 0.3279876708984375, 0.348388671875, 0.3687896728515625, 0.389190673828125, 0.4095916748046875, 0.42999267578125, 0.4503936767578125, 0.470794677734375, 0.4911956787109375, 0.5115966796875, 0.5319976806640625, 0.552398681640625, 0.5727996826171875, 0.59320068359375, 0.6136016845703125, 0.634002685546875, 0.6544036865234375, 0.6748046875]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 5.0, 25.0, 473.0, 483.0, 29.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.26946908235549927, -0.2646583616733551, -0.2598476707935333, -0.25503695011138916, -0.2502262592315674, -0.24541553854942322, -0.24060481786727905, -0.23579411208629608, -0.2309834063053131, -0.22617270052433014, -0.22136199474334717, -0.216551274061203, -0.21174056828022003, -0.20692986249923706, -0.2021191418170929, -0.19730843603610992, -0.19249773025512695, -0.18768702447414398, -0.182876318693161, -0.17806559801101685, -0.17325489223003387, -0.1684441864490509, -0.16363346576690674, -0.15882275998592377, -0.1540120542049408, -0.14920134842395782, -0.14439064264297485, -0.1395799219608307, -0.13476921617984772, -0.12995851039886475, -0.12514778971672058, -0.12033708393573761, -0.11552637815475464, -0.11071567237377167, -0.1059049591422081, -0.10109424591064453, -0.09628354012966156, -0.09147283434867859, -0.08666212111711502, -0.08185140788555145, -0.07704070210456848, -0.07222999632358551, -0.06741928309202194, -0.06260856986045837, -0.0577978640794754, -0.05298715457320213, -0.048176445066928864, -0.043365735560655594, -0.038555022329092026, -0.033744312822818756, -0.028933603316545486, -0.024122893810272217, -0.019312184303998947, -0.014501474797725677, -0.009690765291452408, -0.004880055785179138, -6.934627890586853e-05, 0.004741363227367401, 0.00955207273364067, 0.01436278223991394, 0.01917349174618721, 0.02398420125246048, 0.02879491075873375, 0.03360562026500702, 0.03841632977128029]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 0.0, 2.0, 5.0, 8.0, 8.0, 10.0, 12.0, 19.0, 16.0, 25.0, 31.0, 24.0, 31.0, 37.0, 45.0, 44.0, 37.0, 34.0, 49.0, 33.0, 40.0, 45.0, 34.0, 41.0, 35.0, 40.0, 42.0, 28.0, 36.0, 23.0, 30.0, 19.0, 23.0, 11.0, 19.0, 18.0, 16.0, 10.0, 9.0, 5.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.018032431602478027, -0.017484823241829872, -0.016937214881181717, -0.01638960652053356, -0.015841998159885406, -0.015294389799237251, -0.014746781438589096, -0.01419917307794094, -0.013651564717292786, -0.01310395635664463, -0.012556347995996475, -0.01200873963534832, -0.011461131274700165, -0.01091352291405201, -0.010365914553403854, -0.0098183061927557, -0.009270697832107544, -0.008723089471459389, -0.008175481110811234, -0.007627872750163078, -0.007080264389514923, -0.006532656028866768, -0.005985047668218613, -0.0054374393075704575, -0.004889830946922302, -0.004342222586274147, -0.003794614225625992, -0.0032470058649778366, -0.0026993975043296814, -0.002151789143681526, -0.001604180783033371, -0.0010565724223852158, -0.0005089640617370605, 3.8644298911094666e-05, 0.0005862526595592499, 0.001133861020207405, 0.0016814693808555603, 0.0022290777415037155, 0.0027766861021518707, 0.003324294462800026, 0.003871902823448181, 0.004419511184096336, 0.004967119544744492, 0.005514727905392647, 0.006062336266040802, 0.006609944626688957, 0.007157552987337112, 0.007705161347985268, 0.008252769708633423, 0.008800378069281578, 0.009347986429929733, 0.009895594790577888, 0.010443203151226044, 0.010990811511874199, 0.011538419872522354, 0.01208602823317051, 0.012633636593818665, 0.01318124495446682, 0.013728853315114975, 0.01427646167576313, 0.014824070036411285, 0.01537167839705944, 0.015919286757707596, 0.01646689511835575, 0.017014503479003906]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 7.0, 2.0, 4.0, 2.0, 4.0, 5.0, 3.0, 4.0, 9.0, 7.0, 9.0, 12.0, 13.0, 15.0, 20.0, 22.0, 18.0, 33.0, 30.0, 32.0, 27.0, 38.0, 26.0, 41.0, 40.0, 44.0, 42.0, 47.0, 39.0, 35.0, 38.0, 29.0, 33.0, 21.0, 27.0, 34.0, 31.0, 22.0, 18.0, 22.0, 17.0, 17.0, 13.0, 5.0, 13.0, 8.0, 8.0, 12.0, 3.0, 1.0, 8.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-42.8125, -41.48291015625, -40.1533203125, -38.82373046875, -37.494140625, -36.16455078125, -34.8349609375, -33.50537109375, -32.17578125, -30.84619140625, -29.5166015625, -28.18701171875, -26.857421875, -25.52783203125, -24.1982421875, -22.86865234375, -21.5390625, -20.20947265625, -18.8798828125, -17.55029296875, -16.220703125, -14.89111328125, -13.5615234375, -12.23193359375, -10.90234375, -9.57275390625, -8.2431640625, -6.91357421875, -5.583984375, -4.25439453125, -2.9248046875, -1.59521484375, -0.265625, 1.06396484375, 2.3935546875, 3.72314453125, 5.052734375, 6.38232421875, 7.7119140625, 9.04150390625, 10.37109375, 11.70068359375, 13.0302734375, 14.35986328125, 15.689453125, 17.01904296875, 18.3486328125, 19.67822265625, 21.0078125, 22.33740234375, 23.6669921875, 24.99658203125, 26.326171875, 27.65576171875, 28.9853515625, 30.31494140625, 31.64453125, 32.97412109375, 34.3037109375, 35.63330078125, 36.962890625, 38.29248046875, 39.6220703125, 40.95166015625, 42.28125]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 6.0, 1.0, 3.0, 7.0, 11.0, 7.0, 8.0, 18.0, 12.0, 19.0, 21.0, 25.0, 35.0, 42.0, 55.0, 83.0, 102.0, 146.0, 210.0, 281.0, 411.0, 739.0, 1426.0, 3572.0, 10996.0, 44952.0, 318503.0, 575125.0, 67589.0, 15234.0, 4687.0, 1767.0, 847.0, 441.0, 302.0, 211.0, 143.0, 111.0, 94.0, 68.0, 47.0, 45.0, 36.0, 24.0, 23.0, 16.0, 15.0, 17.0, 7.0, 7.0, 6.0, 6.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-44.09375, -42.72119140625, -41.3486328125, -39.97607421875, -38.603515625, -37.23095703125, -35.8583984375, -34.48583984375, -33.11328125, -31.74072265625, -30.3681640625, -28.99560546875, -27.623046875, -26.25048828125, -24.8779296875, -23.50537109375, -22.1328125, -20.76025390625, -19.3876953125, -18.01513671875, -16.642578125, -15.27001953125, -13.8974609375, -12.52490234375, -11.15234375, -9.77978515625, -8.4072265625, -7.03466796875, -5.662109375, -4.28955078125, -2.9169921875, -1.54443359375, -0.171875, 1.20068359375, 2.5732421875, 3.94580078125, 5.318359375, 6.69091796875, 8.0634765625, 9.43603515625, 10.80859375, 12.18115234375, 13.5537109375, 14.92626953125, 16.298828125, 17.67138671875, 19.0439453125, 20.41650390625, 21.7890625, 23.16162109375, 24.5341796875, 25.90673828125, 27.279296875, 28.65185546875, 30.0244140625, 31.39697265625, 32.76953125, 34.14208984375, 35.5146484375, 36.88720703125, 38.259765625, 39.63232421875, 41.0048828125, 42.37744140625, 43.75]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 6.0, 9.0, 11.0, 13.0, 16.0, 18.0, 25.0, 33.0, 29.0, 35.0, 41.0, 32.0, 32.0, 41.0, 38.0, 51.0, 58.0, 175.0, 1870.0, 95.0, 40.0, 59.0, 32.0, 34.0, 37.0, 28.0, 32.0, 23.0, 23.0, 28.0, 16.0, 16.0, 7.0, 15.0, 4.0, 7.0, 4.0, 4.0, 7.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-125.0625, -120.9345703125, -116.806640625, -112.6787109375, -108.55078125, -104.4228515625, -100.294921875, -96.1669921875, -92.0390625, -87.9111328125, -83.783203125, -79.6552734375, -75.52734375, -71.3994140625, -67.271484375, -63.1435546875, -59.015625, -54.8876953125, -50.759765625, -46.6318359375, -42.50390625, -38.3759765625, -34.248046875, -30.1201171875, -25.9921875, -21.8642578125, -17.736328125, -13.6083984375, -9.48046875, -5.3525390625, -1.224609375, 2.9033203125, 7.03125, 11.1591796875, 15.287109375, 19.4150390625, 23.54296875, 27.6708984375, 31.798828125, 35.9267578125, 40.0546875, 44.1826171875, 48.310546875, 52.4384765625, 56.56640625, 60.6943359375, 64.822265625, 68.9501953125, 73.078125, 77.2060546875, 81.333984375, 85.4619140625, 89.58984375, 93.7177734375, 97.845703125, 101.9736328125, 106.1015625, 110.2294921875, 114.357421875, 118.4853515625, 122.61328125, 126.7412109375, 130.869140625, 134.9970703125, 139.125]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 10.0, 11.0, 6.0, 9.0, 6.0, 23.0, 21.0, 32.0, 57.0, 41.0, 74.0, 109.0, 120.0, 206.0, 347.0, 1222.0, 9860.0, 3108939.0, 21450.0, 1817.0, 461.0, 248.0, 164.0, 126.0, 92.0, 67.0, 48.0, 43.0, 25.0, 28.0, 8.0, 15.0, 7.0, 7.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-339.0, -328.27734375, -317.5546875, -306.83203125, -296.109375, -285.38671875, -274.6640625, -263.94140625, -253.21875, -242.49609375, -231.7734375, -221.05078125, -210.328125, -199.60546875, -188.8828125, -178.16015625, -167.4375, -156.71484375, -145.9921875, -135.26953125, -124.546875, -113.82421875, -103.1015625, -92.37890625, -81.65625, -70.93359375, -60.2109375, -49.48828125, -38.765625, -28.04296875, -17.3203125, -6.59765625, 4.125, 14.84765625, 25.5703125, 36.29296875, 47.015625, 57.73828125, 68.4609375, 79.18359375, 89.90625, 100.62890625, 111.3515625, 122.07421875, 132.796875, 143.51953125, 154.2421875, 164.96484375, 175.6875, 186.41015625, 197.1328125, 207.85546875, 218.578125, 229.30078125, 240.0234375, 250.74609375, 261.46875, 272.19140625, 282.9140625, 293.63671875, 304.359375, 315.08203125, 325.8046875, 336.52734375, 347.25]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 9.0, 893.0, 112.0, 4.0], "bins": [-2719.709716796875, -2675.62353515625, -2631.537353515625, -2587.451171875, -2543.364990234375, -2499.27880859375, -2455.19287109375, -2411.1064453125, -2367.0205078125, -2322.934326171875, -2278.84814453125, -2234.761962890625, -2190.67578125, -2146.589599609375, -2102.50341796875, -2058.41748046875, -2014.3310546875, -1970.244873046875, -1926.15869140625, -1882.072509765625, -1837.9864501953125, -1793.9002685546875, -1749.8140869140625, -1705.7279052734375, -1661.641845703125, -1617.5556640625, -1573.469482421875, -1529.38330078125, -1485.2972412109375, -1441.2110595703125, -1397.1248779296875, -1353.0386962890625, -1308.9525146484375, -1264.8663330078125, -1220.7801513671875, -1176.694091796875, -1132.60791015625, -1088.521728515625, -1044.435546875, -1000.349365234375, -956.2632446289062, -912.1770629882812, -868.0909423828125, -824.0047607421875, -779.9185791015625, -735.8323974609375, -691.7462768554688, -647.6600952148438, -603.5739135742188, -559.4877319335938, -515.401611328125, -471.3154296875, -427.229248046875, -383.1430969238281, -339.05694580078125, -294.97076416015625, -250.88462829589844, -206.7984619140625, -162.71231079101562, -118.62614440917969, -74.53997802734375, -30.453811645507812, 13.632339477539062, 57.71852111816406, 101.80467224121094]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 7.0, 9.0, 11.0, 10.0, 17.0, 11.0, 14.0, 22.0, 14.0, 32.0, 22.0, 31.0, 36.0, 46.0, 45.0, 39.0, 39.0, 40.0, 51.0, 49.0, 38.0, 31.0, 34.0, 41.0, 38.0, 28.0, 35.0, 40.0, 20.0, 31.0, 16.0, 18.0, 16.0, 11.0, 12.0, 9.0, 8.0, 6.0, 6.0, 7.0, 5.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-338.1504211425781, -327.89068603515625, -317.6309509277344, -307.3712463378906, -297.11151123046875, -286.8517761230469, -276.592041015625, -266.3323059082031, -256.07257080078125, -245.81283569335938, -235.55311584472656, -225.2933807373047, -215.03366088867188, -204.77392578125, -194.51419067382812, -184.25445556640625, -173.9947509765625, -163.73501586914062, -153.4752960205078, -143.21556091308594, -132.95584106445312, -122.69610595703125, -112.43637084960938, -102.17664337158203, -91.91691589355469, -81.65718841552734, -71.3974609375, -61.137725830078125, -50.87799835205078, -40.61827087402344, -30.358539581298828, -20.09880828857422, -9.839080810546875, 0.42064857482910156, 10.680377960205078, 20.940107345581055, 31.19983673095703, 41.459564208984375, 51.719295501708984, 61.979026794433594, 72.23875427246094, 82.49848175048828, 92.75820922851562, 103.0179443359375, 113.27767181396484, 123.53739929199219, 133.79713439941406, 144.05685424804688, 154.31658935546875, 164.57632446289062, 174.83604431152344, 185.0957794189453, 195.35549926757812, 205.615234375, 215.87496948242188, 226.13470458984375, 236.39442443847656, 246.65415954589844, 256.91387939453125, 267.1736145019531, 277.433349609375, 287.69305419921875, 297.9527893066406, 308.2125244140625, 318.4722595214844]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 4.0, 4.0, 5.0, 4.0, 4.0, 3.0, 5.0, 10.0, 10.0, 10.0, 13.0, 24.0, 15.0, 15.0, 26.0, 20.0, 33.0, 27.0, 29.0, 46.0, 42.0, 42.0, 39.0, 34.0, 49.0, 36.0, 43.0, 47.0, 31.0, 28.0, 26.0, 31.0, 34.0, 22.0, 30.0, 23.0, 22.0, 17.0, 17.0, 17.0, 6.0, 14.0, 10.0, 10.0, 5.0, 11.0, 4.0, 5.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-42.71875, -41.34375, -39.96875, -38.59375, -37.21875, -35.84375, -34.46875, -33.09375, -31.71875, -30.34375, -28.96875, -27.59375, -26.21875, -24.84375, -23.46875, -22.09375, -20.71875, -19.34375, -17.96875, -16.59375, -15.21875, -13.84375, -12.46875, -11.09375, -9.71875, -8.34375, -6.96875, -5.59375, -4.21875, -2.84375, -1.46875, -0.09375, 1.28125, 2.65625, 4.03125, 5.40625, 6.78125, 8.15625, 9.53125, 10.90625, 12.28125, 13.65625, 15.03125, 16.40625, 17.78125, 19.15625, 20.53125, 21.90625, 23.28125, 24.65625, 26.03125, 27.40625, 28.78125, 30.15625, 31.53125, 32.90625, 34.28125, 35.65625, 37.03125, 38.40625, 39.78125, 41.15625, 42.53125, 43.90625, 45.28125]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 6.0, 8.0, 0.0, 7.0, 8.0, 6.0, 11.0, 23.0, 18.0, 30.0, 35.0, 48.0, 62.0, 98.0, 147.0, 211.0, 341.0, 454.0, 679.0, 1204.0, 2241.0, 5216.0, 22770.0, 1145606.0, 2953036.0, 48789.0, 6957.0, 2643.0, 1289.0, 757.0, 494.0, 336.0, 230.0, 140.0, 98.0, 76.0, 51.0, 40.0, 27.0, 16.0, 13.0, 17.0, 12.0, 10.0, 7.0, 5.0, 3.0, 4.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-167.875, -162.6484375, -157.421875, -152.1953125, -146.96875, -141.7421875, -136.515625, -131.2890625, -126.0625, -120.8359375, -115.609375, -110.3828125, -105.15625, -99.9296875, -94.703125, -89.4765625, -84.25, -79.0234375, -73.796875, -68.5703125, -63.34375, -58.1171875, -52.890625, -47.6640625, -42.4375, -37.2109375, -31.984375, -26.7578125, -21.53125, -16.3046875, -11.078125, -5.8515625, -0.625, 4.6015625, 9.828125, 15.0546875, 20.28125, 25.5078125, 30.734375, 35.9609375, 41.1875, 46.4140625, 51.640625, 56.8671875, 62.09375, 67.3203125, 72.546875, 77.7734375, 83.0, 88.2265625, 93.453125, 98.6796875, 103.90625, 109.1328125, 114.359375, 119.5859375, 124.8125, 130.0390625, 135.265625, 140.4921875, 145.71875, 150.9453125, 156.171875, 161.3984375, 166.625]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 5.0, 5.0, 3.0, 8.0, 4.0, 5.0, 9.0, 17.0, 23.0, 29.0, 50.0, 78.0, 128.0, 332.0, 795.0, 1190.0, 741.0, 288.0, 136.0, 81.0, 47.0, 31.0, 18.0, 15.0, 11.0, 9.0, 5.0, 6.0, 5.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-103.9375, -100.408203125, -96.87890625, -93.349609375, -89.8203125, -86.291015625, -82.76171875, -79.232421875, -75.703125, -72.173828125, -68.64453125, -65.115234375, -61.5859375, -58.056640625, -54.52734375, -50.998046875, -47.46875, -43.939453125, -40.41015625, -36.880859375, -33.3515625, -29.822265625, -26.29296875, -22.763671875, -19.234375, -15.705078125, -12.17578125, -8.646484375, -5.1171875, -1.587890625, 1.94140625, 5.470703125, 9.0, 12.529296875, 16.05859375, 19.587890625, 23.1171875, 26.646484375, 30.17578125, 33.705078125, 37.234375, 40.763671875, 44.29296875, 47.822265625, 51.3515625, 54.880859375, 58.41015625, 61.939453125, 65.46875, 68.998046875, 72.52734375, 76.056640625, 79.5859375, 83.115234375, 86.64453125, 90.173828125, 93.703125, 97.232421875, 100.76171875, 104.291015625, 107.8203125, 111.349609375, 114.87890625, 118.408203125, 121.9375]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 6.0, 9.0, 7.0, 10.0, 22.0, 39.0, 60.0, 131.0, 361.0, 1340.0, 7482.0, 195536.0, 3966075.0, 19677.0, 2505.0, 604.0, 205.0, 94.0, 37.0, 25.0, 12.0, 6.0, 6.0, 10.0, 6.0, 4.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-539.0, -523.2421875, -507.484375, -491.7265625, -475.96875, -460.2109375, -444.453125, -428.6953125, -412.9375, -397.1796875, -381.421875, -365.6640625, -349.90625, -334.1484375, -318.390625, -302.6328125, -286.875, -271.1171875, -255.359375, -239.6015625, -223.84375, -208.0859375, -192.328125, -176.5703125, -160.8125, -145.0546875, -129.296875, -113.5390625, -97.78125, -82.0234375, -66.265625, -50.5078125, -34.75, -18.9921875, -3.234375, 12.5234375, 28.28125, 44.0390625, 59.796875, 75.5546875, 91.3125, 107.0703125, 122.828125, 138.5859375, 154.34375, 170.1015625, 185.859375, 201.6171875, 217.375, 233.1328125, 248.890625, 264.6484375, 280.40625, 296.1640625, 311.921875, 327.6796875, 343.4375, 359.1953125, 374.953125, 390.7109375, 406.46875, 422.2265625, 437.984375, 453.7421875, 469.5]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 9.0, 19.0, 53.0, 173.0, 363.0, 258.0, 84.0, 29.0, 14.0, 7.0, 6.0, 2.0, 1.0], "bins": [-1721.7830810546875, -1690.8748779296875, -1659.966552734375, -1629.058349609375, -1598.150146484375, -1567.2418212890625, -1536.3336181640625, -1505.4254150390625, -1474.51708984375, -1443.60888671875, -1412.7005615234375, -1381.7923583984375, -1350.8841552734375, -1319.975830078125, -1289.067626953125, -1258.159423828125, -1227.251220703125, -1196.343017578125, -1165.4346923828125, -1134.5264892578125, -1103.6182861328125, -1072.7099609375, -1041.8017578125, -1010.8934936523438, -979.9852294921875, -949.0769653320312, -918.1687622070312, -887.260498046875, -856.3522338867188, -825.4439697265625, -794.5357666015625, -763.6275024414062, -732.7191772460938, -701.8109130859375, -670.9027099609375, -639.9944458007812, -609.086181640625, -578.177978515625, -547.2697143554688, -516.3614501953125, -485.4532165527344, -454.54498291015625, -423.63671875, -392.7284851074219, -361.82025146484375, -330.9119873046875, -300.0037536621094, -269.09552001953125, -238.187255859375, -207.2790069580078, -176.37075805664062, -145.4625244140625, -114.55427551269531, -83.64602661132812, -52.73779296875, -21.829544067382812, 9.078704833984375, 39.9869499206543, 70.89519500732422, 101.80343627929688, 132.71168518066406, 163.61993408203125, 194.52816772460938, 225.43641662597656, 256.34466552734375]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 5.0, 14.0, 8.0, 11.0, 15.0, 15.0, 23.0, 16.0, 19.0, 24.0, 25.0, 38.0, 23.0, 28.0, 38.0, 40.0, 28.0, 47.0, 43.0, 34.0, 32.0, 37.0, 34.0, 35.0, 32.0, 35.0, 28.0, 25.0, 29.0, 33.0, 35.0, 20.0, 23.0, 12.0, 17.0, 10.0, 10.0, 12.0, 6.0, 8.0, 6.0, 2.0, 7.0, 4.0, 2.0, 3.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-197.28427124023438, -191.06707763671875, -184.84988403320312, -178.6326904296875, -172.41549682617188, -166.19830322265625, -159.98110961914062, -153.76393127441406, -147.54673767089844, -141.3295440673828, -135.1123504638672, -128.89515686035156, -122.67797088623047, -116.46077728271484, -110.24358367919922, -104.02639770507812, -97.80919647216797, -91.59200286865234, -85.37480926513672, -79.15762329101562, -72.9404296875, -66.72323608398438, -60.50604248046875, -54.28885269165039, -48.071659088134766, -41.85446548461914, -35.63727569580078, -29.420082092285156, -23.202890396118164, -16.985698699951172, -10.768505096435547, -4.5513153076171875, 1.6658782958984375, 7.883070468902588, 14.100262641906738, 20.317455291748047, 26.53464698791504, 32.75183868408203, 38.969032287597656, 45.186222076416016, 51.40341567993164, 57.620609283447266, 63.837799072265625, 70.05499267578125, 76.27218627929688, 82.4893798828125, 88.70657348632812, 94.92375946044922, 101.14095306396484, 107.35814666748047, 113.5753402709961, 119.79252624511719, 126.00971984863281, 132.22691345214844, 138.44410705566406, 144.6613006591797, 150.8784942626953, 157.09568786621094, 163.31288146972656, 169.5300750732422, 175.7472686767578, 181.96444702148438, 188.181640625, 194.39883422851562, 200.61602783203125]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 1.0, 3.0, 8.0, 9.0, 12.0, 11.0, 9.0, 8.0, 13.0, 16.0, 16.0, 29.0, 22.0, 33.0, 38.0, 44.0, 30.0, 45.0, 38.0, 53.0, 38.0, 42.0, 39.0, 32.0, 43.0, 38.0, 30.0, 38.0, 29.0, 28.0, 27.0, 35.0, 25.0, 17.0, 30.0, 15.0, 14.0, 8.0, 7.0, 5.0, 5.0, 4.0, 3.0, 3.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-49.28125, -47.77783203125, -46.2744140625, -44.77099609375, -43.267578125, -41.76416015625, -40.2607421875, -38.75732421875, -37.25390625, -35.75048828125, -34.2470703125, -32.74365234375, -31.240234375, -29.73681640625, -28.2333984375, -26.72998046875, -25.2265625, -23.72314453125, -22.2197265625, -20.71630859375, -19.212890625, -17.70947265625, -16.2060546875, -14.70263671875, -13.19921875, -11.69580078125, -10.1923828125, -8.68896484375, -7.185546875, -5.68212890625, -4.1787109375, -2.67529296875, -1.171875, 0.33154296875, 1.8349609375, 3.33837890625, 4.841796875, 6.34521484375, 7.8486328125, 9.35205078125, 10.85546875, 12.35888671875, 13.8623046875, 15.36572265625, 16.869140625, 18.37255859375, 19.8759765625, 21.37939453125, 22.8828125, 24.38623046875, 25.8896484375, 27.39306640625, 28.896484375, 30.39990234375, 31.9033203125, 33.40673828125, 34.91015625, 36.41357421875, 37.9169921875, 39.42041015625, 40.923828125, 42.42724609375, 43.9306640625, 45.43408203125, 46.9375]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 5.0, 4.0, 6.0, 6.0, 9.0, 8.0, 18.0, 21.0, 40.0, 71.0, 72.0, 107.0, 148.0, 205.0, 326.0, 416.0, 560.0, 731.0, 1133.0, 1644.0, 2422.0, 3427.0, 4740.0, 7231.0, 10915.0, 16632.0, 25217.0, 40032.0, 64565.0, 113346.0, 210825.0, 226541.0, 123476.0, 70149.0, 42752.0, 26990.0, 17489.0, 11375.0, 7769.0, 5169.0, 3602.0, 2433.0, 1652.0, 1323.0, 836.0, 615.0, 421.0, 338.0, 198.0, 157.0, 118.0, 82.0, 55.0, 60.0, 30.0, 18.0, 17.0, 13.0, 5.0, 4.0, 3.0, 1.0], "bins": [-2.228515625, -2.1611328125, -2.09375, -2.0263671875, -1.958984375, -1.8916015625, -1.82421875, -1.7568359375, -1.689453125, -1.6220703125, -1.5546875, -1.4873046875, -1.419921875, -1.3525390625, -1.28515625, -1.2177734375, -1.150390625, -1.0830078125, -1.015625, -0.9482421875, -0.880859375, -0.8134765625, -0.74609375, -0.6787109375, -0.611328125, -0.5439453125, -0.4765625, -0.4091796875, -0.341796875, -0.2744140625, -0.20703125, -0.1396484375, -0.072265625, -0.0048828125, 0.0625, 0.1298828125, 0.197265625, 0.2646484375, 0.33203125, 0.3994140625, 0.466796875, 0.5341796875, 0.6015625, 0.6689453125, 0.736328125, 0.8037109375, 0.87109375, 0.9384765625, 1.005859375, 1.0732421875, 1.140625, 1.2080078125, 1.275390625, 1.3427734375, 1.41015625, 1.4775390625, 1.544921875, 1.6123046875, 1.6796875, 1.7470703125, 1.814453125, 1.8818359375, 1.94921875, 2.0166015625, 2.083984375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 7.0, 4.0, 1.0, 4.0, 8.0, 14.0, 11.0, 5.0, 12.0, 14.0, 11.0, 24.0, 26.0, 27.0, 23.0, 28.0, 37.0, 31.0, 41.0, 36.0, 33.0, 31.0, 41.0, 34.0, 1065.0, 33.0, 39.0, 27.0, 34.0, 43.0, 17.0, 28.0, 32.0, 26.0, 23.0, 22.0, 22.0, 12.0, 20.0, 13.0, 16.0, 14.0, 6.0, 6.0, 7.0, 6.0, 7.0, 3.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0], "bins": [-28.765625, -27.875732421875, -26.98583984375, -26.095947265625, -25.2060546875, -24.316162109375, -23.42626953125, -22.536376953125, -21.646484375, -20.756591796875, -19.86669921875, -18.976806640625, -18.0869140625, -17.197021484375, -16.30712890625, -15.417236328125, -14.52734375, -13.637451171875, -12.74755859375, -11.857666015625, -10.9677734375, -10.077880859375, -9.18798828125, -8.298095703125, -7.408203125, -6.518310546875, -5.62841796875, -4.738525390625, -3.8486328125, -2.958740234375, -2.06884765625, -1.178955078125, -0.2890625, 0.600830078125, 1.49072265625, 2.380615234375, 3.2705078125, 4.160400390625, 5.05029296875, 5.940185546875, 6.830078125, 7.719970703125, 8.60986328125, 9.499755859375, 10.3896484375, 11.279541015625, 12.16943359375, 13.059326171875, 13.94921875, 14.839111328125, 15.72900390625, 16.618896484375, 17.5087890625, 18.398681640625, 19.28857421875, 20.178466796875, 21.068359375, 21.958251953125, 22.84814453125, 23.738037109375, 24.6279296875, 25.517822265625, 26.40771484375, 27.297607421875, 28.1875]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 10.0, 10.0, 14.0, 30.0, 39.0, 55.0, 90.0, 115.0, 156.0, 264.0, 423.0, 602.0, 894.0, 1366.0, 2080.0, 3247.0, 5150.0, 7970.0, 12578.0, 20785.0, 34027.0, 58410.0, 109027.0, 331333.0, 1225671.0, 121877.0, 63862.0, 37547.0, 21898.0, 13831.0, 8380.0, 5369.0, 3461.0, 2171.0, 1484.0, 979.0, 610.0, 412.0, 265.0, 210.0, 129.0, 94.0, 70.0, 47.0, 25.0, 23.0, 15.0, 11.0, 1.0, 10.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0], "bins": [-2.43359375, -2.35772705078125, -2.2818603515625, -2.20599365234375, -2.130126953125, -2.05426025390625, -1.9783935546875, -1.90252685546875, -1.82666015625, -1.75079345703125, -1.6749267578125, -1.59906005859375, -1.523193359375, -1.44732666015625, -1.3714599609375, -1.29559326171875, -1.2197265625, -1.14385986328125, -1.0679931640625, -0.99212646484375, -0.916259765625, -0.84039306640625, -0.7645263671875, -0.68865966796875, -0.61279296875, -0.53692626953125, -0.4610595703125, -0.38519287109375, -0.309326171875, -0.23345947265625, -0.1575927734375, -0.08172607421875, -0.005859375, 0.07000732421875, 0.1458740234375, 0.22174072265625, 0.297607421875, 0.37347412109375, 0.4493408203125, 0.52520751953125, 0.60107421875, 0.67694091796875, 0.7528076171875, 0.82867431640625, 0.904541015625, 0.98040771484375, 1.0562744140625, 1.13214111328125, 1.2080078125, 1.28387451171875, 1.3597412109375, 1.43560791015625, 1.511474609375, 1.58734130859375, 1.6632080078125, 1.73907470703125, 1.81494140625, 1.89080810546875, 1.9666748046875, 2.04254150390625, 2.118408203125, 2.19427490234375, 2.2701416015625, 2.34600830078125, 2.421875]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 3.0, 5.0, 4.0, 9.0, 7.0, 5.0, 9.0, 13.0, 15.0, 24.0, 26.0, 24.0, 28.0, 39.0, 65.0, 63.0, 82.0, 95.0, 88.0, 93.0, 59.0, 39.0, 28.0, 24.0, 32.0, 24.0, 13.0, 13.0, 16.0, 11.0, 14.0, 6.0, 7.0, 5.0, 6.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0345458984375, -0.03352069854736328, -0.03249549865722656, -0.031470298767089844, -0.030445098876953125, -0.029419898986816406, -0.028394699096679688, -0.02736949920654297, -0.02634429931640625, -0.02531909942626953, -0.024293899536132812, -0.023268699645996094, -0.022243499755859375, -0.021218299865722656, -0.020193099975585938, -0.01916790008544922, -0.0181427001953125, -0.01711750030517578, -0.016092300415039062, -0.015067100524902344, -0.014041900634765625, -0.013016700744628906, -0.011991500854492188, -0.010966300964355469, -0.00994110107421875, -0.008915901184082031, -0.007890701293945312, -0.006865501403808594, -0.005840301513671875, -0.004815101623535156, -0.0037899017333984375, -0.0027647018432617188, -0.001739501953125, -0.0007143020629882812, 0.0003108978271484375, 0.0013360977172851562, 0.002361297607421875, 0.0033864974975585938, 0.0044116973876953125, 0.005436897277832031, 0.00646209716796875, 0.007487297058105469, 0.008512496948242188, 0.009537696838378906, 0.010562896728515625, 0.011588096618652344, 0.012613296508789062, 0.013638496398925781, 0.0146636962890625, 0.01568889617919922, 0.016714096069335938, 0.017739295959472656, 0.018764495849609375, 0.019789695739746094, 0.020814895629882812, 0.02184009552001953, 0.02286529541015625, 0.02389049530029297, 0.024915695190429688, 0.025940895080566406, 0.026966094970703125, 0.027991294860839844, 0.029016494750976562, 0.03004169464111328, 0.03106689453125]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 7.0, 2.0, 6.0, 3.0, 11.0, 10.0, 8.0, 25.0, 18.0, 20.0, 21.0, 30.0, 51.0, 49.0, 55.0, 90.0, 135.0, 287.0, 1248.0, 37981.0, 997298.0, 9844.0, 660.0, 235.0, 112.0, 91.0, 56.0, 39.0, 39.0, 34.0, 24.0, 16.0, 5.0, 10.0, 11.0, 5.0, 6.0, 7.0, 1.0, 2.0, 0.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.5654296875, -0.5467987060546875, -0.528167724609375, -0.5095367431640625, -0.49090576171875, -0.4722747802734375, -0.453643798828125, -0.4350128173828125, -0.4163818359375, -0.3977508544921875, -0.379119873046875, -0.3604888916015625, -0.34185791015625, -0.3232269287109375, -0.304595947265625, -0.2859649658203125, -0.267333984375, -0.2487030029296875, -0.230072021484375, -0.2114410400390625, -0.19281005859375, -0.1741790771484375, -0.155548095703125, -0.1369171142578125, -0.1182861328125, -0.0996551513671875, -0.081024169921875, -0.0623931884765625, -0.04376220703125, -0.0251312255859375, -0.006500244140625, 0.0121307373046875, 0.03076171875, 0.0493927001953125, 0.068023681640625, 0.0866546630859375, 0.10528564453125, 0.1239166259765625, 0.142547607421875, 0.1611785888671875, 0.1798095703125, 0.1984405517578125, 0.217071533203125, 0.2357025146484375, 0.25433349609375, 0.2729644775390625, 0.291595458984375, 0.3102264404296875, 0.328857421875, 0.3474884033203125, 0.366119384765625, 0.3847503662109375, 0.40338134765625, 0.4220123291015625, 0.440643310546875, 0.4592742919921875, 0.4779052734375, 0.4965362548828125, 0.515167236328125, 0.5337982177734375, 0.55242919921875, 0.5710601806640625, 0.589691162109375, 0.6083221435546875, 0.626953125]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 5.0, 4.0, 21.0, 52.0, 90.0, 295.0, 363.0, 111.0, 53.0, 14.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.013796009123325348, -0.01209486834704876, -0.010393726639449596, -0.008692585863173008, -0.006991444621235132, -0.0052903033792972565, -0.003589162603020668, -0.001888020895421505, -0.00018688011914491653, 0.0015142610063776374, 0.0032154021319001913, 0.004916543141007423, 0.006617684382945299, 0.008318825624883175, 0.010019966401159763, 0.011721108108758926, 0.013422248885035515, 0.015123389661312103, 0.01682453043758869, 0.01852567121386528, 0.020226813852787018, 0.021927954629063606, 0.023629095405340195, 0.025330238044261932, 0.02703137695789337, 0.02873251773416996, 0.03043365851044655, 0.032134801149368286, 0.033835940062999725, 0.03553708270192146, 0.0372382253408432, 0.03893936425447464, 0.04064050689339638, 0.042341649532318115, 0.044042788445949554, 0.04574393108487129, 0.04744506999850273, 0.04914621263742447, 0.05084735155105591, 0.052548494189977646, 0.054249636828899384, 0.05595077946782112, 0.05765191838145256, 0.0593530610203743, 0.06105419993400574, 0.06275534629821777, 0.06445648521184921, 0.06615762412548065, 0.06785876303911209, 0.06955990195274353, 0.07126104831695557, 0.072962187230587, 0.07466332614421844, 0.07636447250843048, 0.07806561142206192, 0.07976675033569336, 0.0814678966999054, 0.08316903561353683, 0.08487018197774887, 0.08657132089138031, 0.08827245980501175, 0.08997359871864319, 0.09167474508285522, 0.09337588399648666, 0.0950770229101181]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 8.0, 7.0, 13.0, 12.0, 27.0, 14.0, 20.0, 20.0, 21.0, 30.0, 33.0, 24.0, 30.0, 32.0, 36.0, 37.0, 30.0, 49.0, 45.0, 40.0, 62.0, 43.0, 38.0, 29.0, 38.0, 30.0, 36.0, 34.0, 25.0, 21.0, 14.0, 16.0, 15.0, 27.0, 13.0, 14.0, 5.0, 5.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.017375648021697998, -0.01683177426457405, -0.016287900507450104, -0.015744026750326157, -0.01520015299320221, -0.014656279236078262, -0.014112405478954315, -0.013568531721830368, -0.013024657964706421, -0.012480784207582474, -0.011936910450458527, -0.01139303669333458, -0.010849162936210632, -0.010305289179086685, -0.009761415421962738, -0.009217541664838791, -0.008673667907714844, -0.008129794150590897, -0.0075859203934669495, -0.007042046636343002, -0.006498172879219055, -0.005954299122095108, -0.005410425364971161, -0.004866551607847214, -0.004322677850723267, -0.0037788040935993195, -0.0032349303364753723, -0.002691056579351425, -0.002147182822227478, -0.0016033090651035309, -0.0010594353079795837, -0.0005155615508556366, 2.8312206268310547e-05, 0.0005721859633922577, 0.0011160597205162048, 0.001659933477640152, 0.002203807234764099, 0.0027476809918880463, 0.0032915547490119934, 0.0038354285061359406, 0.004379302263259888, 0.004923176020383835, 0.005467049777507782, 0.006010923534631729, 0.006554797291755676, 0.007098671048879623, 0.0076425448060035706, 0.008186418563127518, 0.008730292320251465, 0.009274166077375412, 0.009818039834499359, 0.010361913591623306, 0.010905787348747253, 0.0114496611058712, 0.011993534862995148, 0.012537408620119095, 0.013081282377243042, 0.01362515613436699, 0.014169029891490936, 0.014712903648614883, 0.01525677740573883, 0.015800651162862778, 0.016344524919986725, 0.016888398677110672, 0.01743227243423462]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 1.0, 3.0, 8.0, 9.0, 12.0, 11.0, 9.0, 8.0, 13.0, 16.0, 16.0, 29.0, 22.0, 33.0, 38.0, 44.0, 30.0, 45.0, 38.0, 53.0, 38.0, 42.0, 39.0, 32.0, 43.0, 38.0, 31.0, 37.0, 29.0, 28.0, 27.0, 35.0, 25.0, 17.0, 30.0, 15.0, 14.0, 8.0, 7.0, 5.0, 5.0, 4.0, 3.0, 3.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-49.28125, -47.77783203125, -46.2744140625, -44.77099609375, -43.267578125, -41.76416015625, -40.2607421875, -38.75732421875, -37.25390625, -35.75048828125, -34.2470703125, -32.74365234375, -31.240234375, -29.73681640625, -28.2333984375, -26.72998046875, -25.2265625, -23.72314453125, -22.2197265625, -20.71630859375, -19.212890625, -17.70947265625, -16.2060546875, -14.70263671875, -13.19921875, -11.69580078125, -10.1923828125, -8.68896484375, -7.185546875, -5.68212890625, -4.1787109375, -2.67529296875, -1.171875, 0.33154296875, 1.8349609375, 3.33837890625, 4.841796875, 6.34521484375, 7.8486328125, 9.35205078125, 10.85546875, 12.35888671875, 13.8623046875, 15.36572265625, 16.869140625, 18.37255859375, 19.8759765625, 21.37939453125, 22.8828125, 24.38623046875, 25.8896484375, 27.39306640625, 28.896484375, 30.39990234375, 31.9033203125, 33.40673828125, 34.91015625, 36.41357421875, 37.9169921875, 39.42041015625, 40.923828125, 42.42724609375, 43.9306640625, 45.43408203125, 46.9375]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 1.0, 6.0, 9.0, 11.0, 17.0, 17.0, 17.0, 23.0, 33.0, 39.0, 42.0, 79.0, 102.0, 139.0, 195.0, 325.0, 501.0, 930.0, 2181.0, 7211.0, 44912.0, 809751.0, 160669.0, 14549.0, 3540.0, 1340.0, 625.0, 375.0, 245.0, 177.0, 112.0, 98.0, 69.0, 40.0, 51.0, 29.0, 19.0, 20.0, 11.0, 10.0, 7.0, 6.0, 5.0, 4.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-87.5625, -84.88671875, -82.2109375, -79.53515625, -76.859375, -74.18359375, -71.5078125, -68.83203125, -66.15625, -63.48046875, -60.8046875, -58.12890625, -55.453125, -52.77734375, -50.1015625, -47.42578125, -44.75, -42.07421875, -39.3984375, -36.72265625, -34.046875, -31.37109375, -28.6953125, -26.01953125, -23.34375, -20.66796875, -17.9921875, -15.31640625, -12.640625, -9.96484375, -7.2890625, -4.61328125, -1.9375, 0.73828125, 3.4140625, 6.08984375, 8.765625, 11.44140625, 14.1171875, 16.79296875, 19.46875, 22.14453125, 24.8203125, 27.49609375, 30.171875, 32.84765625, 35.5234375, 38.19921875, 40.875, 43.55078125, 46.2265625, 48.90234375, 51.578125, 54.25390625, 56.9296875, 59.60546875, 62.28125, 64.95703125, 67.6328125, 70.30859375, 72.984375, 75.66015625, 78.3359375, 81.01171875, 83.6875]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 4.0, 5.0, 5.0, 12.0, 10.0, 11.0, 20.0, 10.0, 22.0, 25.0, 37.0, 36.0, 53.0, 44.0, 57.0, 50.0, 72.0, 176.0, 1933.0, 86.0, 52.0, 45.0, 54.0, 29.0, 34.0, 29.0, 25.0, 28.0, 17.0, 23.0, 6.0, 14.0, 7.0, 7.0, 2.0, 2.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-181.0, -175.560546875, -170.12109375, -164.681640625, -159.2421875, -153.802734375, -148.36328125, -142.923828125, -137.484375, -132.044921875, -126.60546875, -121.166015625, -115.7265625, -110.287109375, -104.84765625, -99.408203125, -93.96875, -88.529296875, -83.08984375, -77.650390625, -72.2109375, -66.771484375, -61.33203125, -55.892578125, -50.453125, -45.013671875, -39.57421875, -34.134765625, -28.6953125, -23.255859375, -17.81640625, -12.376953125, -6.9375, -1.498046875, 3.94140625, 9.380859375, 14.8203125, 20.259765625, 25.69921875, 31.138671875, 36.578125, 42.017578125, 47.45703125, 52.896484375, 58.3359375, 63.775390625, 69.21484375, 74.654296875, 80.09375, 85.533203125, 90.97265625, 96.412109375, 101.8515625, 107.291015625, 112.73046875, 118.169921875, 123.609375, 129.048828125, 134.48828125, 139.927734375, 145.3671875, 150.806640625, 156.24609375, 161.685546875, 167.125]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 2.0, 5.0, 6.0, 16.0, 8.0, 16.0, 25.0, 24.0, 27.0, 35.0, 43.0, 51.0, 104.0, 168.0, 347.0, 1946.0, 3129967.0, 11655.0, 541.0, 209.0, 136.0, 84.0, 72.0, 50.0, 38.0, 22.0, 23.0, 18.0, 13.0, 9.0, 11.0, 13.0, 5.0, 5.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-502.0, -485.640625, -469.28125, -452.921875, -436.5625, -420.203125, -403.84375, -387.484375, -371.125, -354.765625, -338.40625, -322.046875, -305.6875, -289.328125, -272.96875, -256.609375, -240.25, -223.890625, -207.53125, -191.171875, -174.8125, -158.453125, -142.09375, -125.734375, -109.375, -93.015625, -76.65625, -60.296875, -43.9375, -27.578125, -11.21875, 5.140625, 21.5, 37.859375, 54.21875, 70.578125, 86.9375, 103.296875, 119.65625, 136.015625, 152.375, 168.734375, 185.09375, 201.453125, 217.8125, 234.171875, 250.53125, 266.890625, 283.25, 299.609375, 315.96875, 332.328125, 348.6875, 365.046875, 381.40625, 397.765625, 414.125, 430.484375, 446.84375, 463.203125, 479.5625, 495.921875, 512.28125, 528.640625, 545.0]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 110.0, 900.0, 10.0], "bins": [-2062.98291015625, -2029.8673095703125, -1996.7518310546875, -1963.63623046875, -1930.520751953125, -1897.4051513671875, -1864.2896728515625, -1831.174072265625, -1798.05859375, -1764.9429931640625, -1731.8275146484375, -1698.7119140625, -1665.596435546875, -1632.4808349609375, -1599.3653564453125, -1566.249755859375, -1533.1341552734375, -1500.0185546875, -1466.903076171875, -1433.7874755859375, -1400.6719970703125, -1367.556396484375, -1334.44091796875, -1301.3253173828125, -1268.209716796875, -1235.0941162109375, -1201.9786376953125, -1168.863037109375, -1135.74755859375, -1102.6319580078125, -1069.5164794921875, -1036.40087890625, -1003.2854614257812, -970.169921875, -937.0543823242188, -903.9388427734375, -870.8232421875, -837.707763671875, -804.5921630859375, -771.4766235351562, -738.361083984375, -705.2455444335938, -672.1300048828125, -639.0144653320312, -605.89892578125, -572.7833251953125, -539.6677856445312, -506.55224609375, -473.4367370605469, -440.3211975097656, -407.20562744140625, -374.090087890625, -340.97454833984375, -307.8590087890625, -274.74346923828125, -241.62789916992188, -208.51235961914062, -175.39682006835938, -142.28126525878906, -109.16571807861328, -76.0501708984375, -42.93463134765625, -9.819076538085938, 23.296478271484375, 56.412025451660156]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 4.0, 3.0, 6.0, 6.0, 6.0, 10.0, 13.0, 10.0, 14.0, 14.0, 22.0, 21.0, 25.0, 34.0, 37.0, 22.0, 32.0, 36.0, 43.0, 37.0, 40.0, 45.0, 38.0, 44.0, 38.0, 37.0, 39.0, 29.0, 40.0, 34.0, 35.0, 29.0, 22.0, 23.0, 20.0, 15.0, 17.0, 17.0, 12.0, 5.0, 8.0, 4.0, 12.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-423.25286865234375, -410.153076171875, -397.05328369140625, -383.9534912109375, -370.85369873046875, -357.75390625, -344.65411376953125, -331.5543212890625, -318.45452880859375, -305.354736328125, -292.25494384765625, -279.1551513671875, -266.05535888671875, -252.95556640625, -239.85577392578125, -226.7559814453125, -213.65618896484375, -200.556396484375, -187.45660400390625, -174.3568115234375, -161.25701904296875, -148.1572265625, -135.05743408203125, -121.9576416015625, -108.85784912109375, -95.758056640625, -82.65826416015625, -69.5584716796875, -56.45867919921875, -43.35888671875, -30.25909423828125, -17.1593017578125, -4.059539794921875, 9.040252685546875, 22.140045166015625, 35.239837646484375, 48.339630126953125, 61.439422607421875, 74.53921508789062, 87.63900756835938, 100.73880004882812, 113.83859252929688, 126.93838500976562, 140.03817749023438, 153.13796997070312, 166.23776245117188, 179.33755493164062, 192.43734741210938, 205.53713989257812, 218.63693237304688, 231.73672485351562, 244.83651733398438, 257.9363098144531, 271.0361022949219, 284.1358947753906, 297.2356872558594, 310.3354797363281, 323.4352722167969, 336.5350646972656, 349.6348571777344, 362.7346496582031, 375.8344421386719, 388.9342346191406, 402.0340270996094, 415.1338195800781]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 5.0, 1.0, 0.0, 9.0, 11.0, 7.0, 9.0, 12.0, 6.0, 17.0, 11.0, 12.0, 21.0, 24.0, 37.0, 29.0, 33.0, 35.0, 48.0, 45.0, 42.0, 35.0, 32.0, 40.0, 42.0, 33.0, 41.0, 37.0, 35.0, 35.0, 35.0, 18.0, 30.0, 25.0, 31.0, 23.0, 27.0, 16.0, 10.0, 11.0, 7.0, 5.0, 3.0, 5.0, 5.0, 0.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-48.84375, -47.341796875, -45.83984375, -44.337890625, -42.8359375, -41.333984375, -39.83203125, -38.330078125, -36.828125, -35.326171875, -33.82421875, -32.322265625, -30.8203125, -29.318359375, -27.81640625, -26.314453125, -24.8125, -23.310546875, -21.80859375, -20.306640625, -18.8046875, -17.302734375, -15.80078125, -14.298828125, -12.796875, -11.294921875, -9.79296875, -8.291015625, -6.7890625, -5.287109375, -3.78515625, -2.283203125, -0.78125, 0.720703125, 2.22265625, 3.724609375, 5.2265625, 6.728515625, 8.23046875, 9.732421875, 11.234375, 12.736328125, 14.23828125, 15.740234375, 17.2421875, 18.744140625, 20.24609375, 21.748046875, 23.25, 24.751953125, 26.25390625, 27.755859375, 29.2578125, 30.759765625, 32.26171875, 33.763671875, 35.265625, 36.767578125, 38.26953125, 39.771484375, 41.2734375, 42.775390625, 44.27734375, 45.779296875, 47.28125]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 6.0, 4.0, 10.0, 7.0, 23.0, 19.0, 36.0, 44.0, 53.0, 73.0, 134.0, 156.0, 254.0, 339.0, 541.0, 802.0, 1265.0, 2193.0, 4374.0, 9531.0, 35637.0, 707367.0, 3183026.0, 212279.0, 21146.0, 7013.0, 3238.0, 1786.0, 993.0, 634.0, 399.0, 288.0, 193.0, 132.0, 74.0, 58.0, 51.0, 32.0, 20.0, 14.0, 12.0, 12.0, 6.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-150.125, -145.8740234375, -141.623046875, -137.3720703125, -133.12109375, -128.8701171875, -124.619140625, -120.3681640625, -116.1171875, -111.8662109375, -107.615234375, -103.3642578125, -99.11328125, -94.8623046875, -90.611328125, -86.3603515625, -82.109375, -77.8583984375, -73.607421875, -69.3564453125, -65.10546875, -60.8544921875, -56.603515625, -52.3525390625, -48.1015625, -43.8505859375, -39.599609375, -35.3486328125, -31.09765625, -26.8466796875, -22.595703125, -18.3447265625, -14.09375, -9.8427734375, -5.591796875, -1.3408203125, 2.91015625, 7.1611328125, 11.412109375, 15.6630859375, 19.9140625, 24.1650390625, 28.416015625, 32.6669921875, 36.91796875, 41.1689453125, 45.419921875, 49.6708984375, 53.921875, 58.1728515625, 62.423828125, 66.6748046875, 70.92578125, 75.1767578125, 79.427734375, 83.6787109375, 87.9296875, 92.1806640625, 96.431640625, 100.6826171875, 104.93359375, 109.1845703125, 113.435546875, 117.6865234375, 121.9375]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 2.0, 4.0, 2.0, 4.0, 7.0, 6.0, 4.0, 8.0, 9.0, 16.0, 19.0, 19.0, 32.0, 54.0, 64.0, 97.0, 216.0, 420.0, 879.0, 966.0, 607.0, 257.0, 134.0, 76.0, 49.0, 26.0, 25.0, 14.0, 15.0, 11.0, 15.0, 3.0, 5.0, 2.0, 4.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-122.9375, -119.4443359375, -115.951171875, -112.4580078125, -108.96484375, -105.4716796875, -101.978515625, -98.4853515625, -94.9921875, -91.4990234375, -88.005859375, -84.5126953125, -81.01953125, -77.5263671875, -74.033203125, -70.5400390625, -67.046875, -63.5537109375, -60.060546875, -56.5673828125, -53.07421875, -49.5810546875, -46.087890625, -42.5947265625, -39.1015625, -35.6083984375, -32.115234375, -28.6220703125, -25.12890625, -21.6357421875, -18.142578125, -14.6494140625, -11.15625, -7.6630859375, -4.169921875, -0.6767578125, 2.81640625, 6.3095703125, 9.802734375, 13.2958984375, 16.7890625, 20.2822265625, 23.775390625, 27.2685546875, 30.76171875, 34.2548828125, 37.748046875, 41.2412109375, 44.734375, 48.2275390625, 51.720703125, 55.2138671875, 58.70703125, 62.2001953125, 65.693359375, 69.1865234375, 72.6796875, 76.1728515625, 79.666015625, 83.1591796875, 86.65234375, 90.1455078125, 93.638671875, 97.1318359375, 100.625]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 1.0, 4.0, 3.0, 3.0, 10.0, 13.0, 21.0, 21.0, 29.0, 83.0, 132.0, 295.0, 665.0, 2111.0, 8188.0, 53061.0, 3872497.0, 234165.0, 17185.0, 3766.0, 1133.0, 448.0, 176.0, 111.0, 43.0, 34.0, 23.0, 15.0, 9.0, 7.0, 7.0, 3.0, 5.0, 6.0, 3.0, 6.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-303.5, -292.5546875, -281.609375, -270.6640625, -259.71875, -248.7734375, -237.828125, -226.8828125, -215.9375, -204.9921875, -194.046875, -183.1015625, -172.15625, -161.2109375, -150.265625, -139.3203125, -128.375, -117.4296875, -106.484375, -95.5390625, -84.59375, -73.6484375, -62.703125, -51.7578125, -40.8125, -29.8671875, -18.921875, -7.9765625, 2.96875, 13.9140625, 24.859375, 35.8046875, 46.75, 57.6953125, 68.640625, 79.5859375, 90.53125, 101.4765625, 112.421875, 123.3671875, 134.3125, 145.2578125, 156.203125, 167.1484375, 178.09375, 189.0390625, 199.984375, 210.9296875, 221.875, 232.8203125, 243.765625, 254.7109375, 265.65625, 276.6015625, 287.546875, 298.4921875, 309.4375, 320.3828125, 331.328125, 342.2734375, 353.21875, 364.1640625, 375.109375, 386.0546875, 397.0]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 12.0, 42.0, 171.0, 432.0, 244.0, 62.0, 32.0, 8.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2098.664794921875, -2058.842041015625, -2019.0194091796875, -1979.19677734375, -1939.3740234375, -1899.55126953125, -1859.7286376953125, -1819.906005859375, -1780.083251953125, -1740.260498046875, -1700.4378662109375, -1660.615234375, -1620.79248046875, -1580.9697265625, -1541.1470947265625, -1501.324462890625, -1461.501708984375, -1421.678955078125, -1381.8563232421875, -1342.03369140625, -1302.2109375, -1262.38818359375, -1222.5655517578125, -1182.742919921875, -1142.920166015625, -1103.097412109375, -1063.2747802734375, -1023.4520874023438, -983.62939453125, -943.8067016601562, -903.9840087890625, -864.1613159179688, -824.3387451171875, -784.5160522460938, -744.693359375, -704.8706665039062, -665.0479736328125, -625.2252807617188, -585.402587890625, -545.5798950195312, -505.7572021484375, -465.93450927734375, -426.11181640625, -386.28912353515625, -346.4664306640625, -306.64373779296875, -266.821044921875, -226.99835205078125, -187.1756591796875, -147.35296630859375, -107.5302734375, -67.70758056640625, -27.8848876953125, 11.93780517578125, 51.760498046875, 91.58319091796875, 131.4058837890625, 171.22857666015625, 211.05126953125, 250.87396240234375, 290.6966552734375, 330.51934814453125, 370.342041015625, 410.16473388671875, 449.9874267578125]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 6.0, 5.0, 5.0, 12.0, 14.0, 10.0, 19.0, 12.0, 15.0, 15.0, 22.0, 19.0, 29.0, 31.0, 24.0, 29.0, 34.0, 28.0, 37.0, 24.0, 39.0, 43.0, 43.0, 40.0, 49.0, 42.0, 38.0, 30.0, 23.0, 25.0, 30.0, 28.0, 20.0, 23.0, 20.0, 20.0, 20.0, 14.0, 15.0, 11.0, 9.0, 8.0, 11.0, 2.0, 3.0, 4.0, 3.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-241.13265991210938, -233.33627319335938, -225.53988647460938, -217.7434844970703, -209.9470977783203, -202.1507110595703, -194.35430908203125, -186.55792236328125, -178.76153564453125, -170.96514892578125, -163.16876220703125, -155.3723602294922, -147.5759735107422, -139.7795867919922, -131.98318481445312, -124.18679809570312, -116.39041137695312, -108.59402465820312, -100.7976303100586, -93.00123596191406, -85.20484924316406, -77.40846252441406, -69.61206817626953, -61.815677642822266, -54.019287109375, -46.222896575927734, -38.42650604248047, -30.630115509033203, -22.833724975585938, -15.037334442138672, -7.240943908691406, 0.5554466247558594, 8.351837158203125, 16.14822769165039, 23.944618225097656, 31.741008758544922, 39.53739929199219, 47.33378982543945, 55.13018035888672, 62.926570892333984, 70.72296142578125, 78.51934814453125, 86.31574249267578, 94.11213684082031, 101.90852355957031, 109.70491027832031, 117.50130462646484, 125.29769897460938, 133.09408569335938, 140.89047241210938, 148.68685913085938, 156.48326110839844, 164.27964782714844, 172.07603454589844, 179.8724365234375, 187.6688232421875, 195.4652099609375, 203.2615966796875, 211.0579833984375, 218.85438537597656, 226.65077209472656, 234.44715881347656, 242.24356079101562, 250.03994750976562, 257.8363342285156]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 5.0, 7.0, 6.0, 3.0, 10.0, 11.0, 14.0, 21.0, 25.0, 17.0, 34.0, 22.0, 29.0, 39.0, 47.0, 34.0, 40.0, 35.0, 47.0, 53.0, 48.0, 50.0, 51.0, 40.0, 44.0, 39.0, 44.0, 30.0, 23.0, 26.0, 21.0, 23.0, 19.0, 10.0, 8.0, 8.0, 9.0, 2.0, 1.0, 0.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.90625, -55.16748046875, -53.4287109375, -51.68994140625, -49.951171875, -48.21240234375, -46.4736328125, -44.73486328125, -42.99609375, -41.25732421875, -39.5185546875, -37.77978515625, -36.041015625, -34.30224609375, -32.5634765625, -30.82470703125, -29.0859375, -27.34716796875, -25.6083984375, -23.86962890625, -22.130859375, -20.39208984375, -18.6533203125, -16.91455078125, -15.17578125, -13.43701171875, -11.6982421875, -9.95947265625, -8.220703125, -6.48193359375, -4.7431640625, -3.00439453125, -1.265625, 0.47314453125, 2.2119140625, 3.95068359375, 5.689453125, 7.42822265625, 9.1669921875, 10.90576171875, 12.64453125, 14.38330078125, 16.1220703125, 17.86083984375, 19.599609375, 21.33837890625, 23.0771484375, 24.81591796875, 26.5546875, 28.29345703125, 30.0322265625, 31.77099609375, 33.509765625, 35.24853515625, 36.9873046875, 38.72607421875, 40.46484375, 42.20361328125, 43.9423828125, 45.68115234375, 47.419921875, 49.15869140625, 50.8974609375, 52.63623046875, 54.375]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 4.0, 10.0, 11.0, 23.0, 16.0, 36.0, 43.0, 67.0, 110.0, 122.0, 192.0, 285.0, 467.0, 570.0, 806.0, 1172.0, 1794.0, 2637.0, 4010.0, 5900.0, 8961.0, 13862.0, 21106.0, 34053.0, 55921.0, 98944.0, 192478.0, 254435.0, 147231.0, 77120.0, 45509.0, 28007.0, 17709.0, 11597.0, 7676.0, 5041.0, 3422.0, 2262.0, 1501.0, 1089.0, 762.0, 469.0, 332.0, 239.0, 175.0, 116.0, 85.0, 58.0, 44.0, 30.0, 23.0, 11.0, 9.0, 3.0, 3.0, 2.0, 5.0], "bins": [-2.419921875, -2.349365234375, -2.27880859375, -2.208251953125, -2.1376953125, -2.067138671875, -1.99658203125, -1.926025390625, -1.85546875, -1.784912109375, -1.71435546875, -1.643798828125, -1.5732421875, -1.502685546875, -1.43212890625, -1.361572265625, -1.291015625, -1.220458984375, -1.14990234375, -1.079345703125, -1.0087890625, -0.938232421875, -0.86767578125, -0.797119140625, -0.7265625, -0.656005859375, -0.58544921875, -0.514892578125, -0.4443359375, -0.373779296875, -0.30322265625, -0.232666015625, -0.162109375, -0.091552734375, -0.02099609375, 0.049560546875, 0.1201171875, 0.190673828125, 0.26123046875, 0.331787109375, 0.40234375, 0.472900390625, 0.54345703125, 0.614013671875, 0.6845703125, 0.755126953125, 0.82568359375, 0.896240234375, 0.966796875, 1.037353515625, 1.10791015625, 1.178466796875, 1.2490234375, 1.319580078125, 1.39013671875, 1.460693359375, 1.53125, 1.601806640625, 1.67236328125, 1.742919921875, 1.8134765625, 1.884033203125, 1.95458984375, 2.025146484375, 2.095703125]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 7.0, 3.0, 7.0, 5.0, 3.0, 6.0, 8.0, 6.0, 11.0, 14.0, 19.0, 29.0, 24.0, 21.0, 22.0, 34.0, 32.0, 38.0, 37.0, 28.0, 53.0, 43.0, 46.0, 1066.0, 46.0, 52.0, 31.0, 45.0, 44.0, 38.0, 41.0, 21.0, 33.0, 22.0, 13.0, 17.0, 9.0, 14.0, 12.0, 5.0, 4.0, 9.0, 4.0, 8.0, 2.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.3125, -29.2724609375, -28.232421875, -27.1923828125, -26.15234375, -25.1123046875, -24.072265625, -23.0322265625, -21.9921875, -20.9521484375, -19.912109375, -18.8720703125, -17.83203125, -16.7919921875, -15.751953125, -14.7119140625, -13.671875, -12.6318359375, -11.591796875, -10.5517578125, -9.51171875, -8.4716796875, -7.431640625, -6.3916015625, -5.3515625, -4.3115234375, -3.271484375, -2.2314453125, -1.19140625, -0.1513671875, 0.888671875, 1.9287109375, 2.96875, 4.0087890625, 5.048828125, 6.0888671875, 7.12890625, 8.1689453125, 9.208984375, 10.2490234375, 11.2890625, 12.3291015625, 13.369140625, 14.4091796875, 15.44921875, 16.4892578125, 17.529296875, 18.5693359375, 19.609375, 20.6494140625, 21.689453125, 22.7294921875, 23.76953125, 24.8095703125, 25.849609375, 26.8896484375, 27.9296875, 28.9697265625, 30.009765625, 31.0498046875, 32.08984375, 33.1298828125, 34.169921875, 35.2099609375, 36.25]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 7.0, 8.0, 15.0, 17.0, 20.0, 20.0, 39.0, 67.0, 96.0, 161.0, 234.0, 354.0, 519.0, 872.0, 1285.0, 2181.0, 3447.0, 5580.0, 9322.0, 15963.0, 28607.0, 53910.0, 111940.0, 454492.0, 1162338.0, 117721.0, 56335.0, 29961.0, 16694.0, 9747.0, 5699.0, 3511.0, 2170.0, 1349.0, 845.0, 557.0, 344.0, 259.0, 144.0, 111.0, 59.0, 52.0, 33.0, 12.0, 13.0, 11.0, 9.0, 5.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.681640625, -2.59234619140625, -2.5030517578125, -2.41375732421875, -2.324462890625, -2.23516845703125, -2.1458740234375, -2.05657958984375, -1.96728515625, -1.87799072265625, -1.7886962890625, -1.69940185546875, -1.610107421875, -1.52081298828125, -1.4315185546875, -1.34222412109375, -1.2529296875, -1.16363525390625, -1.0743408203125, -0.98504638671875, -0.895751953125, -0.80645751953125, -0.7171630859375, -0.62786865234375, -0.53857421875, -0.44927978515625, -0.3599853515625, -0.27069091796875, -0.181396484375, -0.09210205078125, -0.0028076171875, 0.08648681640625, 0.17578125, 0.26507568359375, 0.3543701171875, 0.44366455078125, 0.532958984375, 0.62225341796875, 0.7115478515625, 0.80084228515625, 0.89013671875, 0.97943115234375, 1.0687255859375, 1.15802001953125, 1.247314453125, 1.33660888671875, 1.4259033203125, 1.51519775390625, 1.6044921875, 1.69378662109375, 1.7830810546875, 1.87237548828125, 1.961669921875, 2.05096435546875, 2.1402587890625, 2.22955322265625, 2.31884765625, 2.40814208984375, 2.4974365234375, 2.58673095703125, 2.676025390625, 2.76531982421875, 2.8546142578125, 2.94390869140625, 3.033203125]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 5.0, 3.0, 9.0, 5.0, 8.0, 13.0, 11.0, 16.0, 19.0, 10.0, 16.0, 24.0, 22.0, 28.0, 42.0, 40.0, 58.0, 87.0, 86.0, 114.0, 59.0, 48.0, 46.0, 21.0, 36.0, 26.0, 23.0, 15.0, 15.0, 15.0, 12.0, 16.0, 7.0, 11.0, 6.0, 6.0, 10.0, 4.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.031280517578125, -0.03035426139831543, -0.02942800521850586, -0.02850174903869629, -0.02757549285888672, -0.02664923667907715, -0.025722980499267578, -0.024796724319458008, -0.023870468139648438, -0.022944211959838867, -0.022017955780029297, -0.021091699600219727, -0.020165443420410156, -0.019239187240600586, -0.018312931060791016, -0.017386674880981445, -0.016460418701171875, -0.015534162521362305, -0.014607906341552734, -0.013681650161743164, -0.012755393981933594, -0.011829137802124023, -0.010902881622314453, -0.009976625442504883, -0.009050369262695312, -0.008124113082885742, -0.007197856903076172, -0.0062716007232666016, -0.005345344543457031, -0.004419088363647461, -0.0034928321838378906, -0.0025665760040283203, -0.00164031982421875, -0.0007140636444091797, 0.00021219253540039062, 0.001138448715209961, 0.0020647048950195312, 0.0029909610748291016, 0.003917217254638672, 0.004843473434448242, 0.0057697296142578125, 0.006695985794067383, 0.007622241973876953, 0.008548498153686523, 0.009474754333496094, 0.010401010513305664, 0.011327266693115234, 0.012253522872924805, 0.013179779052734375, 0.014106035232543945, 0.015032291412353516, 0.015958547592163086, 0.016884803771972656, 0.017811059951782227, 0.018737316131591797, 0.019663572311401367, 0.020589828491210938, 0.021516084671020508, 0.022442340850830078, 0.02336859703063965, 0.02429485321044922, 0.02522110939025879, 0.02614736557006836, 0.02707362174987793, 0.0279998779296875]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 3.0, 7.0, 7.0, 8.0, 9.0, 12.0, 13.0, 19.0, 21.0, 21.0, 34.0, 33.0, 42.0, 64.0, 62.0, 95.0, 205.0, 444.0, 5204.0, 1004720.0, 36043.0, 763.0, 214.0, 151.0, 63.0, 67.0, 42.0, 38.0, 25.0, 25.0, 18.0, 20.0, 11.0, 12.0, 11.0, 7.0, 5.0, 7.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5517578125, -0.5325241088867188, -0.5132904052734375, -0.49405670166015625, -0.474822998046875, -0.45558929443359375, -0.4363555908203125, -0.41712188720703125, -0.39788818359375, -0.37865447998046875, -0.3594207763671875, -0.34018707275390625, -0.320953369140625, -0.30171966552734375, -0.2824859619140625, -0.26325225830078125, -0.2440185546875, -0.22478485107421875, -0.2055511474609375, -0.18631744384765625, -0.167083740234375, -0.14785003662109375, -0.1286163330078125, -0.10938262939453125, -0.09014892578125, -0.07091522216796875, -0.0516815185546875, -0.03244781494140625, -0.013214111328125, 0.00601959228515625, 0.0252532958984375, 0.04448699951171875, 0.063720703125, 0.08295440673828125, 0.1021881103515625, 0.12142181396484375, 0.140655517578125, 0.15988922119140625, 0.1791229248046875, 0.19835662841796875, 0.21759033203125, 0.23682403564453125, 0.2560577392578125, 0.27529144287109375, 0.294525146484375, 0.31375885009765625, 0.3329925537109375, 0.35222625732421875, 0.3714599609375, 0.39069366455078125, 0.4099273681640625, 0.42916107177734375, 0.448394775390625, 0.46762847900390625, 0.4868621826171875, 0.5060958862304688, 0.52532958984375, 0.5445632934570312, 0.5637969970703125, 0.5830307006835938, 0.602264404296875, 0.6214981079101562, 0.6407318115234375, 0.6599655151367188, 0.67919921875]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 15.0, 39.0, 150.0, 477.0, 240.0, 64.0, 14.0, 10.0, 2.0, 3.0], "bins": [-0.1085503026843071, -0.10666616261005402, -0.10478202998638153, -0.10289788991212845, -0.10101374983787537, -0.09912961721420288, -0.0972454771399498, -0.09536133706569672, -0.09347720444202423, -0.09159306436777115, -0.08970893174409866, -0.08782479166984558, -0.0859406515955925, -0.08405651897192001, -0.08217237889766693, -0.08028823882341385, -0.07840409874916077, -0.07651995867490768, -0.0746358260512352, -0.07275168597698212, -0.07086754590272903, -0.06898341327905655, -0.06709927320480347, -0.06521513313055038, -0.0633310005068779, -0.061446864157915115, -0.05956272408366203, -0.05767858773469925, -0.055794451385736465, -0.05391031503677368, -0.0520261749625206, -0.050142038613557816, -0.04825790226459503, -0.04637376591563225, -0.044489625841379166, -0.04260548949241638, -0.0407213531434536, -0.038837216794490814, -0.03695307672023773, -0.03506894037127495, -0.033184800297021866, -0.03130066394805908, -0.02941652573645115, -0.027532387524843216, -0.025648251175880432, -0.0237641129642725, -0.021879974752664566, -0.019995838403701782, -0.018111702054739, -0.016227563843131065, -0.014343427494168282, -0.012459289282560349, -0.01057515200227499, -0.008691014721989632, -0.006806876510381699, -0.00492273923009634, -0.003038601018488407, -0.001154463505372405, 0.000729674007743597, 0.0026138117536902428, 0.004497949033975601, 0.00638208631426096, 0.008266224525868893, 0.010150361806154251, 0.01203449908643961]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 4.0, 6.0, 10.0, 4.0, 11.0, 15.0, 18.0, 14.0, 23.0, 35.0, 30.0, 26.0, 31.0, 37.0, 37.0, 56.0, 36.0, 43.0, 35.0, 36.0, 45.0, 55.0, 44.0, 44.0, 45.0, 38.0, 37.0, 34.0, 25.0, 31.0, 26.0, 11.0, 11.0, 16.0, 10.0, 2.0, 7.0, 2.0, 2.0, 3.0, 3.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.02012455463409424, -0.019553914666175842, -0.018983274698257446, -0.01841263473033905, -0.017841994762420654, -0.01727135479450226, -0.016700714826583862, -0.016130074858665466, -0.01555943489074707, -0.014988794922828674, -0.014418154954910278, -0.013847514986991882, -0.013276875019073486, -0.01270623505115509, -0.012135595083236694, -0.011564955115318298, -0.010994315147399902, -0.010423675179481506, -0.00985303521156311, -0.009282395243644714, -0.008711755275726318, -0.008141115307807922, -0.007570475339889526, -0.00699983537197113, -0.006429195404052734, -0.005858555436134338, -0.005287915468215942, -0.004717275500297546, -0.00414663553237915, -0.0035759955644607544, -0.0030053555965423584, -0.0024347156286239624, -0.0018640756607055664, -0.0012934356927871704, -0.0007227957248687744, -0.00015215575695037842, 0.0004184842109680176, 0.0009891241788864136, 0.0015597641468048096, 0.0021304041147232056, 0.0027010440826416016, 0.0032716840505599976, 0.0038423240184783936, 0.0044129639863967896, 0.0049836039543151855, 0.0055542439222335815, 0.0061248838901519775, 0.0066955238580703735, 0.0072661638259887695, 0.007836803793907166, 0.008407443761825562, 0.008978083729743958, 0.009548723697662354, 0.01011936366558075, 0.010690003633499146, 0.011260643601417542, 0.011831283569335938, 0.012401923537254333, 0.01297256350517273, 0.013543203473091125, 0.014113843441009521, 0.014684483408927917, 0.015255123376846313, 0.01582576334476471, 0.016396403312683105]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 5.0, 7.0, 6.0, 3.0, 10.0, 11.0, 14.0, 21.0, 25.0, 17.0, 34.0, 22.0, 29.0, 39.0, 47.0, 34.0, 40.0, 35.0, 47.0, 53.0, 48.0, 50.0, 51.0, 40.0, 44.0, 39.0, 44.0, 30.0, 23.0, 26.0, 21.0, 23.0, 19.0, 10.0, 8.0, 8.0, 9.0, 2.0, 1.0, 0.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.90625, -55.16748046875, -53.4287109375, -51.68994140625, -49.951171875, -48.21240234375, -46.4736328125, -44.73486328125, -42.99609375, -41.25732421875, -39.5185546875, -37.77978515625, -36.041015625, -34.30224609375, -32.5634765625, -30.82470703125, -29.0859375, -27.34716796875, -25.6083984375, -23.86962890625, -22.130859375, -20.39208984375, -18.6533203125, -16.91455078125, -15.17578125, -13.43701171875, -11.6982421875, -9.95947265625, -8.220703125, -6.48193359375, -4.7431640625, -3.00439453125, -1.265625, 0.47314453125, 2.2119140625, 3.95068359375, 5.689453125, 7.42822265625, 9.1669921875, 10.90576171875, 12.64453125, 14.38330078125, 16.1220703125, 17.86083984375, 19.599609375, 21.33837890625, 23.0771484375, 24.81591796875, 26.5546875, 28.29345703125, 30.0322265625, 31.77099609375, 33.509765625, 35.24853515625, 36.9873046875, 38.72607421875, 40.46484375, 42.20361328125, 43.9423828125, 45.68115234375, 47.419921875, 49.15869140625, 50.8974609375, 52.63623046875, 54.375]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 10.0, 7.0, 13.0, 13.0, 19.0, 31.0, 39.0, 50.0, 107.0, 133.0, 231.0, 341.0, 567.0, 886.0, 1512.0, 2651.0, 5064.0, 10963.0, 30424.0, 145961.0, 664028.0, 135106.0, 28556.0, 10308.0, 4963.0, 2665.0, 1542.0, 842.0, 546.0, 326.0, 223.0, 131.0, 96.0, 62.0, 46.0, 27.0, 19.0, 15.0, 8.0, 12.0, 3.0, 4.0, 7.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-57.5625, -55.73388671875, -53.9052734375, -52.07666015625, -50.248046875, -48.41943359375, -46.5908203125, -44.76220703125, -42.93359375, -41.10498046875, -39.2763671875, -37.44775390625, -35.619140625, -33.79052734375, -31.9619140625, -30.13330078125, -28.3046875, -26.47607421875, -24.6474609375, -22.81884765625, -20.990234375, -19.16162109375, -17.3330078125, -15.50439453125, -13.67578125, -11.84716796875, -10.0185546875, -8.18994140625, -6.361328125, -4.53271484375, -2.7041015625, -0.87548828125, 0.953125, 2.78173828125, 4.6103515625, 6.43896484375, 8.267578125, 10.09619140625, 11.9248046875, 13.75341796875, 15.58203125, 17.41064453125, 19.2392578125, 21.06787109375, 22.896484375, 24.72509765625, 26.5537109375, 28.38232421875, 30.2109375, 32.03955078125, 33.8681640625, 35.69677734375, 37.525390625, 39.35400390625, 41.1826171875, 43.01123046875, 44.83984375, 46.66845703125, 48.4970703125, 50.32568359375, 52.154296875, 53.98291015625, 55.8115234375, 57.64013671875, 59.46875]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 8.0, 5.0, 9.0, 10.0, 11.0, 16.0, 19.0, 19.0, 35.0, 35.0, 49.0, 43.0, 38.0, 48.0, 64.0, 60.0, 1634.0, 470.0, 76.0, 62.0, 42.0, 39.0, 36.0, 38.0, 32.0, 24.0, 29.0, 21.0, 22.0, 9.0, 13.0, 8.0, 5.0, 13.0, 3.0, 4.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-176.875, -171.5078125, -166.140625, -160.7734375, -155.40625, -150.0390625, -144.671875, -139.3046875, -133.9375, -128.5703125, -123.203125, -117.8359375, -112.46875, -107.1015625, -101.734375, -96.3671875, -91.0, -85.6328125, -80.265625, -74.8984375, -69.53125, -64.1640625, -58.796875, -53.4296875, -48.0625, -42.6953125, -37.328125, -31.9609375, -26.59375, -21.2265625, -15.859375, -10.4921875, -5.125, 0.2421875, 5.609375, 10.9765625, 16.34375, 21.7109375, 27.078125, 32.4453125, 37.8125, 43.1796875, 48.546875, 53.9140625, 59.28125, 64.6484375, 70.015625, 75.3828125, 80.75, 86.1171875, 91.484375, 96.8515625, 102.21875, 107.5859375, 112.953125, 118.3203125, 123.6875, 129.0546875, 134.421875, 139.7890625, 145.15625, 150.5234375, 155.890625, 161.2578125, 166.625]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 6.0, 10.0, 6.0, 14.0, 20.0, 9.0, 28.0, 33.0, 44.0, 53.0, 72.0, 92.0, 124.0, 213.0, 301.0, 878.0, 4950.0, 135212.0, 2989291.0, 11711.0, 1409.0, 446.0, 229.0, 140.0, 125.0, 79.0, 62.0, 38.0, 26.0, 20.0, 17.0, 12.0, 10.0, 9.0, 6.0, 6.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-279.0, -270.05078125, -261.1015625, -252.15234375, -243.203125, -234.25390625, -225.3046875, -216.35546875, -207.40625, -198.45703125, -189.5078125, -180.55859375, -171.609375, -162.66015625, -153.7109375, -144.76171875, -135.8125, -126.86328125, -117.9140625, -108.96484375, -100.015625, -91.06640625, -82.1171875, -73.16796875, -64.21875, -55.26953125, -46.3203125, -37.37109375, -28.421875, -19.47265625, -10.5234375, -1.57421875, 7.375, 16.32421875, 25.2734375, 34.22265625, 43.171875, 52.12109375, 61.0703125, 70.01953125, 78.96875, 87.91796875, 96.8671875, 105.81640625, 114.765625, 123.71484375, 132.6640625, 141.61328125, 150.5625, 159.51171875, 168.4609375, 177.41015625, 186.359375, 195.30859375, 204.2578125, 213.20703125, 222.15625, 231.10546875, 240.0546875, 249.00390625, 257.953125, 266.90234375, 275.8515625, 284.80078125, 293.75]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 191.0, 799.0, 24.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2496.6630859375, -2453.805908203125, -2410.94873046875, -2368.091552734375, -2325.234130859375, -2282.376953125, -2239.519775390625, -2196.66259765625, -2153.805419921875, -2110.9482421875, -2068.091064453125, -2025.2337646484375, -1982.3765869140625, -1939.5194091796875, -1896.662109375, -1853.804931640625, -1810.94775390625, -1768.090576171875, -1725.2332763671875, -1682.3760986328125, -1639.5189208984375, -1596.6617431640625, -1553.804443359375, -1510.947265625, -1468.0899658203125, -1425.2327880859375, -1382.37548828125, -1339.518310546875, -1296.6611328125, -1253.803955078125, -1210.9466552734375, -1168.0894775390625, -1125.232177734375, -1082.375, -1039.5177001953125, -996.6605224609375, -953.8033447265625, -910.9461059570312, -868.0888671875, -825.231689453125, -782.37451171875, -739.5172729492188, -696.6600952148438, -653.8028564453125, -610.9456787109375, -568.0884399414062, -525.231201171875, -482.3740234375, -439.5168151855469, -396.65960693359375, -353.8023986816406, -310.9451904296875, -268.08795166015625, -225.2307586669922, -182.37353515625, -139.51632690429688, -96.65911865234375, -53.80190658569336, -10.944694519042969, 31.912521362304688, 74.76972961425781, 117.62693786621094, 160.48416137695312, 203.34136962890625, 246.19857788085938]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 5.0, 5.0, 7.0, 7.0, 12.0, 19.0, 13.0, 12.0, 19.0, 19.0, 22.0, 29.0, 28.0, 20.0, 34.0, 38.0, 49.0, 46.0, 31.0, 54.0, 48.0, 34.0, 49.0, 47.0, 44.0, 28.0, 25.0, 33.0, 38.0, 31.0, 36.0, 22.0, 21.0, 16.0, 12.0, 13.0, 12.0, 8.0, 7.0, 9.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-351.8155212402344, -339.8583984375, -327.9012451171875, -315.9441223144531, -303.98699951171875, -292.0298767089844, -280.07275390625, -268.1156005859375, -256.1584777832031, -244.20135498046875, -232.2442169189453, -220.28707885742188, -208.3299560546875, -196.37283325195312, -184.4156951904297, -172.45855712890625, -160.50143432617188, -148.5443115234375, -136.58717346191406, -124.63004302978516, -112.67291259765625, -100.71578216552734, -88.75865173339844, -76.80152130126953, -64.84439086914062, -52.88726043701172, -40.93013000488281, -28.972999572753906, -17.015869140625, -5.058738708496094, 6.8983917236328125, 18.85552215576172, 30.8126220703125, 42.769752502441406, 54.72688293457031, 66.68401336669922, 78.64114379882812, 90.59827423095703, 102.55540466308594, 114.51253509521484, 126.46966552734375, 138.42678833007812, 150.38392639160156, 162.341064453125, 174.29818725585938, 186.25531005859375, 198.2124481201172, 210.16958618164062, 222.126708984375, 234.08383178710938, 246.0409698486328, 257.99810791015625, 269.9552307128906, 281.912353515625, 293.8695068359375, 305.8266296386719, 317.78375244140625, 329.7408752441406, 341.697998046875, 353.6551513671875, 365.6122741699219, 377.56939697265625, 389.52655029296875, 401.4836730957031, 413.4407958984375]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 6.0, 4.0, 1.0, 6.0, 5.0, 11.0, 11.0, 16.0, 21.0, 19.0, 20.0, 26.0, 31.0, 25.0, 33.0, 38.0, 34.0, 45.0, 36.0, 41.0, 48.0, 46.0, 49.0, 45.0, 45.0, 38.0, 39.0, 49.0, 36.0, 30.0, 25.0, 16.0, 28.0, 22.0, 20.0, 9.0, 5.0, 10.0, 5.0, 0.0, 5.0, 2.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-55.65625, -53.9814453125, -52.306640625, -50.6318359375, -48.95703125, -47.2822265625, -45.607421875, -43.9326171875, -42.2578125, -40.5830078125, -38.908203125, -37.2333984375, -35.55859375, -33.8837890625, -32.208984375, -30.5341796875, -28.859375, -27.1845703125, -25.509765625, -23.8349609375, -22.16015625, -20.4853515625, -18.810546875, -17.1357421875, -15.4609375, -13.7861328125, -12.111328125, -10.4365234375, -8.76171875, -7.0869140625, -5.412109375, -3.7373046875, -2.0625, -0.3876953125, 1.287109375, 2.9619140625, 4.63671875, 6.3115234375, 7.986328125, 9.6611328125, 11.3359375, 13.0107421875, 14.685546875, 16.3603515625, 18.03515625, 19.7099609375, 21.384765625, 23.0595703125, 24.734375, 26.4091796875, 28.083984375, 29.7587890625, 31.43359375, 33.1083984375, 34.783203125, 36.4580078125, 38.1328125, 39.8076171875, 41.482421875, 43.1572265625, 44.83203125, 46.5068359375, 48.181640625, 49.8564453125, 51.53125]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 5.0, 7.0, 11.0, 16.0, 23.0, 21.0, 39.0, 50.0, 69.0, 109.0, 126.0, 165.0, 275.0, 383.0, 531.0, 787.0, 1102.0, 1782.0, 2826.0, 5055.0, 10264.0, 31124.0, 337426.0, 3338372.0, 403824.0, 35804.0, 10817.0, 5112.0, 2852.0, 1743.0, 1086.0, 764.0, 520.0, 360.0, 235.0, 203.0, 120.0, 82.0, 66.0, 40.0, 23.0, 19.0, 12.0, 10.0, 4.0, 11.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-122.1875, -118.4306640625, -114.673828125, -110.9169921875, -107.16015625, -103.4033203125, -99.646484375, -95.8896484375, -92.1328125, -88.3759765625, -84.619140625, -80.8623046875, -77.10546875, -73.3486328125, -69.591796875, -65.8349609375, -62.078125, -58.3212890625, -54.564453125, -50.8076171875, -47.05078125, -43.2939453125, -39.537109375, -35.7802734375, -32.0234375, -28.2666015625, -24.509765625, -20.7529296875, -16.99609375, -13.2392578125, -9.482421875, -5.7255859375, -1.96875, 1.7880859375, 5.544921875, 9.3017578125, 13.05859375, 16.8154296875, 20.572265625, 24.3291015625, 28.0859375, 31.8427734375, 35.599609375, 39.3564453125, 43.11328125, 46.8701171875, 50.626953125, 54.3837890625, 58.140625, 61.8974609375, 65.654296875, 69.4111328125, 73.16796875, 76.9248046875, 80.681640625, 84.4384765625, 88.1953125, 91.9521484375, 95.708984375, 99.4658203125, 103.22265625, 106.9794921875, 110.736328125, 114.4931640625, 118.25]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 1.0, 5.0, 6.0, 4.0, 5.0, 8.0, 8.0, 9.0, 6.0, 10.0, 25.0, 31.0, 41.0, 43.0, 85.0, 139.0, 309.0, 540.0, 969.0, 781.0, 432.0, 259.0, 118.0, 66.0, 30.0, 38.0, 22.0, 17.0, 13.0, 17.0, 8.0, 12.0, 6.0, 5.0, 1.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-93.5625, -90.6171875, -87.671875, -84.7265625, -81.78125, -78.8359375, -75.890625, -72.9453125, -70.0, -67.0546875, -64.109375, -61.1640625, -58.21875, -55.2734375, -52.328125, -49.3828125, -46.4375, -43.4921875, -40.546875, -37.6015625, -34.65625, -31.7109375, -28.765625, -25.8203125, -22.875, -19.9296875, -16.984375, -14.0390625, -11.09375, -8.1484375, -5.203125, -2.2578125, 0.6875, 3.6328125, 6.578125, 9.5234375, 12.46875, 15.4140625, 18.359375, 21.3046875, 24.25, 27.1953125, 30.140625, 33.0859375, 36.03125, 38.9765625, 41.921875, 44.8671875, 47.8125, 50.7578125, 53.703125, 56.6484375, 59.59375, 62.5390625, 65.484375, 68.4296875, 71.375, 74.3203125, 77.265625, 80.2109375, 83.15625, 86.1015625, 89.046875, 91.9921875, 94.9375]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 6.0, 5.0, 12.0, 14.0, 17.0, 18.0, 29.0, 40.0, 58.0, 96.0, 176.0, 336.0, 809.0, 2119.0, 6722.0, 25783.0, 247471.0, 3804286.0, 83789.0, 15370.0, 4408.0, 1487.0, 544.0, 275.0, 155.0, 82.0, 55.0, 28.0, 20.0, 16.0, 17.0, 12.0, 5.0, 8.0, 7.0, 2.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-275.5, -266.9765625, -258.453125, -249.9296875, -241.40625, -232.8828125, -224.359375, -215.8359375, -207.3125, -198.7890625, -190.265625, -181.7421875, -173.21875, -164.6953125, -156.171875, -147.6484375, -139.125, -130.6015625, -122.078125, -113.5546875, -105.03125, -96.5078125, -87.984375, -79.4609375, -70.9375, -62.4140625, -53.890625, -45.3671875, -36.84375, -28.3203125, -19.796875, -11.2734375, -2.75, 5.7734375, 14.296875, 22.8203125, 31.34375, 39.8671875, 48.390625, 56.9140625, 65.4375, 73.9609375, 82.484375, 91.0078125, 99.53125, 108.0546875, 116.578125, 125.1015625, 133.625, 142.1484375, 150.671875, 159.1953125, 167.71875, 176.2421875, 184.765625, 193.2890625, 201.8125, 210.3359375, 218.859375, 227.3828125, 235.90625, 244.4296875, 252.953125, 261.4765625, 270.0]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 9.0, 11.0, 19.0, 44.0, 76.0, 149.0, 284.0, 194.0, 110.0, 58.0, 27.0, 11.0, 11.0, 2.0, 2.0, 1.0, 4.0], "bins": [-1070.8450927734375, -1050.9007568359375, -1030.956298828125, -1011.011962890625, -991.0675659179688, -971.1232299804688, -951.1788330078125, -931.2344970703125, -911.2901000976562, -891.345703125, -871.4013671875, -851.4569702148438, -831.5125732421875, -811.5682373046875, -791.6238403320312, -771.679443359375, -751.735107421875, -731.7907104492188, -711.8463745117188, -691.9019775390625, -671.9575805664062, -652.0132446289062, -632.06884765625, -612.12451171875, -592.1800537109375, -572.2356567382812, -552.2913208007812, -532.346923828125, -512.4025268554688, -492.45819091796875, -472.5137939453125, -452.5694274902344, -432.62506103515625, -412.6806945800781, -392.7362976074219, -372.79193115234375, -352.8475646972656, -332.9031982421875, -312.95880126953125, -293.0144348144531, -273.0700378417969, -253.1256561279297, -233.18128967285156, -213.23690795898438, -193.29254150390625, -173.34815979003906, -153.40377807617188, -133.45941162109375, -113.51502990722656, -93.5706558227539, -73.62628173828125, -53.68190002441406, -33.737525939941406, -13.79315185546875, 6.1512298583984375, 26.095596313476562, 46.03997802734375, 65.9843521118164, 85.92872619628906, 105.87310791015625, 125.8174819946289, 145.76185607910156, 165.70623779296875, 185.65060424804688, 205.59498596191406]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 7.0, 5.0, 4.0, 2.0, 6.0, 4.0, 9.0, 8.0, 13.0, 13.0, 17.0, 23.0, 20.0, 25.0, 18.0, 26.0, 35.0, 26.0, 24.0, 38.0, 46.0, 34.0, 48.0, 39.0, 38.0, 35.0, 39.0, 32.0, 37.0, 44.0, 37.0, 35.0, 29.0, 36.0, 22.0, 17.0, 20.0, 8.0, 14.0, 15.0, 14.0, 12.0, 9.0, 3.0, 10.0, 4.0, 5.0, 5.0, 5.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-234.14645385742188, -227.0242462158203, -219.90203857421875, -212.7798309326172, -205.65762329101562, -198.535400390625, -191.41319274902344, -184.29098510742188, -177.1687774658203, -170.04656982421875, -162.9243621826172, -155.80215454101562, -148.679931640625, -141.5577392578125, -134.43551635742188, -127.31330871582031, -120.19110107421875, -113.06889343261719, -105.94668579101562, -98.82447052001953, -91.70226287841797, -84.5800552368164, -77.45783996582031, -70.33563232421875, -63.21342468261719, -56.091217041015625, -48.9690055847168, -41.84679412841797, -34.724586486816406, -27.602378845214844, -20.480167388916016, -13.357955932617188, -6.235748291015625, 0.8864612579345703, 8.008670806884766, 15.130880355834961, 22.253089904785156, 29.37529754638672, 36.49750900268555, 43.619720458984375, 50.74192810058594, 57.8641357421875, 64.98634338378906, 72.10855865478516, 79.23076629638672, 86.35297393798828, 93.47518920898438, 100.59739685058594, 107.7196044921875, 114.84181213378906, 121.96401977539062, 129.0862274169922, 136.20843505859375, 143.33065795898438, 150.45286560058594, 157.5750732421875, 164.69728088378906, 171.81948852539062, 178.9416961669922, 186.06390380859375, 193.18612670898438, 200.30831909179688, 207.4305419921875, 214.55274963378906, 221.67495727539062]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 3.0, 4.0, 3.0, 4.0, 6.0, 5.0, 8.0, 15.0, 14.0, 12.0, 17.0, 21.0, 17.0, 36.0, 30.0, 31.0, 31.0, 33.0, 36.0, 45.0, 40.0, 50.0, 40.0, 48.0, 38.0, 30.0, 44.0, 39.0, 42.0, 45.0, 35.0, 27.0, 29.0, 23.0, 20.0, 17.0, 19.0, 9.0, 8.0, 5.0, 11.0, 3.0, 4.0, 1.0, 2.0, 2.0, 5.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.46875, -45.82470703125, -44.1806640625, -42.53662109375, -40.892578125, -39.24853515625, -37.6044921875, -35.96044921875, -34.31640625, -32.67236328125, -31.0283203125, -29.38427734375, -27.740234375, -26.09619140625, -24.4521484375, -22.80810546875, -21.1640625, -19.52001953125, -17.8759765625, -16.23193359375, -14.587890625, -12.94384765625, -11.2998046875, -9.65576171875, -8.01171875, -6.36767578125, -4.7236328125, -3.07958984375, -1.435546875, 0.20849609375, 1.8525390625, 3.49658203125, 5.140625, 6.78466796875, 8.4287109375, 10.07275390625, 11.716796875, 13.36083984375, 15.0048828125, 16.64892578125, 18.29296875, 19.93701171875, 21.5810546875, 23.22509765625, 24.869140625, 26.51318359375, 28.1572265625, 29.80126953125, 31.4453125, 33.08935546875, 34.7333984375, 36.37744140625, 38.021484375, 39.66552734375, 41.3095703125, 42.95361328125, 44.59765625, 46.24169921875, 47.8857421875, 49.52978515625, 51.173828125, 52.81787109375, 54.4619140625, 56.10595703125, 57.75]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 5.0, 9.0, 18.0, 36.0, 48.0, 72.0, 104.0, 167.0, 232.0, 340.0, 512.0, 720.0, 1145.0, 1811.0, 2706.0, 4319.0, 6952.0, 11433.0, 19601.0, 33986.0, 63927.0, 132806.0, 293956.0, 242501.0, 105785.0, 53000.0, 28921.0, 16724.0, 10051.0, 5968.0, 3825.0, 2327.0, 1580.0, 1026.0, 636.0, 454.0, 265.0, 190.0, 118.0, 101.0, 64.0, 39.0, 27.0, 23.0, 8.0, 6.0, 2.0, 8.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.998046875, -2.90679931640625, -2.8155517578125, -2.72430419921875, -2.633056640625, -2.54180908203125, -2.4505615234375, -2.35931396484375, -2.26806640625, -2.17681884765625, -2.0855712890625, -1.99432373046875, -1.903076171875, -1.81182861328125, -1.7205810546875, -1.62933349609375, -1.5380859375, -1.44683837890625, -1.3555908203125, -1.26434326171875, -1.173095703125, -1.08184814453125, -0.9906005859375, -0.89935302734375, -0.80810546875, -0.71685791015625, -0.6256103515625, -0.53436279296875, -0.443115234375, -0.35186767578125, -0.2606201171875, -0.16937255859375, -0.078125, 0.01312255859375, 0.1043701171875, 0.19561767578125, 0.286865234375, 0.37811279296875, 0.4693603515625, 0.56060791015625, 0.65185546875, 0.74310302734375, 0.8343505859375, 0.92559814453125, 1.016845703125, 1.10809326171875, 1.1993408203125, 1.29058837890625, 1.3818359375, 1.47308349609375, 1.5643310546875, 1.65557861328125, 1.746826171875, 1.83807373046875, 1.9293212890625, 2.02056884765625, 2.11181640625, 2.20306396484375, 2.2943115234375, 2.38555908203125, 2.476806640625, 2.56805419921875, 2.6593017578125, 2.75054931640625, 2.841796875]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 5.0, 5.0, 2.0, 9.0, 9.0, 13.0, 14.0, 19.0, 14.0, 16.0, 21.0, 21.0, 27.0, 29.0, 36.0, 35.0, 28.0, 36.0, 30.0, 46.0, 48.0, 35.0, 1056.0, 29.0, 42.0, 45.0, 47.0, 29.0, 33.0, 28.0, 32.0, 23.0, 28.0, 14.0, 21.0, 12.0, 15.0, 16.0, 15.0, 7.0, 3.0, 16.0, 6.0, 3.0, 3.0, 3.0, 6.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-34.78125, -33.71728515625, -32.6533203125, -31.58935546875, -30.525390625, -29.46142578125, -28.3974609375, -27.33349609375, -26.26953125, -25.20556640625, -24.1416015625, -23.07763671875, -22.013671875, -20.94970703125, -19.8857421875, -18.82177734375, -17.7578125, -16.69384765625, -15.6298828125, -14.56591796875, -13.501953125, -12.43798828125, -11.3740234375, -10.31005859375, -9.24609375, -8.18212890625, -7.1181640625, -6.05419921875, -4.990234375, -3.92626953125, -2.8623046875, -1.79833984375, -0.734375, 0.32958984375, 1.3935546875, 2.45751953125, 3.521484375, 4.58544921875, 5.6494140625, 6.71337890625, 7.77734375, 8.84130859375, 9.9052734375, 10.96923828125, 12.033203125, 13.09716796875, 14.1611328125, 15.22509765625, 16.2890625, 17.35302734375, 18.4169921875, 19.48095703125, 20.544921875, 21.60888671875, 22.6728515625, 23.73681640625, 24.80078125, 25.86474609375, 26.9287109375, 27.99267578125, 29.056640625, 30.12060546875, 31.1845703125, 32.24853515625, 33.3125]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 9.0, 9.0, 14.0, 25.0, 19.0, 48.0, 69.0, 119.0, 131.0, 251.0, 368.0, 509.0, 863.0, 1291.0, 2069.0, 3255.0, 5114.0, 8301.0, 13603.0, 22026.0, 37482.0, 68435.0, 137980.0, 1341717.0, 229912.0, 96691.0, 51260.0, 29383.0, 17610.0, 10596.0, 6659.0, 4111.0, 2565.0, 1656.0, 1050.0, 637.0, 441.0, 276.0, 202.0, 126.0, 73.0, 59.0, 37.0, 28.0, 18.0, 14.0, 12.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.876953125, -2.786376953125, -2.69580078125, -2.605224609375, -2.5146484375, -2.424072265625, -2.33349609375, -2.242919921875, -2.15234375, -2.061767578125, -1.97119140625, -1.880615234375, -1.7900390625, -1.699462890625, -1.60888671875, -1.518310546875, -1.427734375, -1.337158203125, -1.24658203125, -1.156005859375, -1.0654296875, -0.974853515625, -0.88427734375, -0.793701171875, -0.703125, -0.612548828125, -0.52197265625, -0.431396484375, -0.3408203125, -0.250244140625, -0.15966796875, -0.069091796875, 0.021484375, 0.112060546875, 0.20263671875, 0.293212890625, 0.3837890625, 0.474365234375, 0.56494140625, 0.655517578125, 0.74609375, 0.836669921875, 0.92724609375, 1.017822265625, 1.1083984375, 1.198974609375, 1.28955078125, 1.380126953125, 1.470703125, 1.561279296875, 1.65185546875, 1.742431640625, 1.8330078125, 1.923583984375, 2.01416015625, 2.104736328125, 2.1953125, 2.285888671875, 2.37646484375, 2.467041015625, 2.5576171875, 2.648193359375, 2.73876953125, 2.829345703125, 2.919921875]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 5.0, 6.0, 7.0, 7.0, 5.0, 14.0, 18.0, 26.0, 18.0, 30.0, 31.0, 45.0, 69.0, 90.0, 154.0, 144.0, 73.0, 60.0, 50.0, 36.0, 18.0, 20.0, 21.0, 5.0, 11.0, 9.0, 7.0, 4.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.051971435546875, -0.05039548873901367, -0.048819541931152344, -0.047243595123291016, -0.04566764831542969, -0.04409170150756836, -0.04251575469970703, -0.0409398078918457, -0.039363861083984375, -0.03778791427612305, -0.03621196746826172, -0.03463602066040039, -0.03306007385253906, -0.031484127044677734, -0.029908180236816406, -0.028332233428955078, -0.02675628662109375, -0.025180339813232422, -0.023604393005371094, -0.022028446197509766, -0.020452499389648438, -0.01887655258178711, -0.01730060577392578, -0.015724658966064453, -0.014148712158203125, -0.012572765350341797, -0.010996818542480469, -0.00942087173461914, -0.007844924926757812, -0.006268978118896484, -0.004693031311035156, -0.003117084503173828, -0.0015411376953125, 3.4809112548828125e-05, 0.0016107559204101562, 0.0031867027282714844, 0.0047626495361328125, 0.006338596343994141, 0.007914543151855469, 0.009490489959716797, 0.011066436767578125, 0.012642383575439453, 0.014218330383300781, 0.01579427719116211, 0.017370223999023438, 0.018946170806884766, 0.020522117614746094, 0.022098064422607422, 0.02367401123046875, 0.025249958038330078, 0.026825904846191406, 0.028401851654052734, 0.029977798461914062, 0.03155374526977539, 0.03312969207763672, 0.03470563888549805, 0.036281585693359375, 0.0378575325012207, 0.03943347930908203, 0.04100942611694336, 0.04258537292480469, 0.044161319732666016, 0.045737266540527344, 0.04731321334838867, 0.04888916015625]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 9.0, 7.0, 4.0, 7.0, 12.0, 19.0, 22.0, 35.0, 33.0, 51.0, 106.0, 168.0, 425.0, 6970.0, 1029586.0, 10066.0, 470.0, 191.0, 95.0, 83.0, 44.0, 30.0, 36.0, 23.0, 12.0, 14.0, 9.0, 6.0, 6.0, 4.0, 3.0, 3.0, 2.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.96240234375, -0.9308853149414062, -0.8993682861328125, -0.8678512573242188, -0.836334228515625, -0.8048171997070312, -0.7733001708984375, -0.7417831420898438, -0.71026611328125, -0.6787490844726562, -0.6472320556640625, -0.6157150268554688, -0.584197998046875, -0.5526809692382812, -0.5211639404296875, -0.48964691162109375, -0.4581298828125, -0.42661285400390625, -0.3950958251953125, -0.36357879638671875, -0.332061767578125, -0.30054473876953125, -0.2690277099609375, -0.23751068115234375, -0.20599365234375, -0.17447662353515625, -0.1429595947265625, -0.11144256591796875, -0.079925537109375, -0.04840850830078125, -0.0168914794921875, 0.01462554931640625, 0.046142578125, 0.07765960693359375, 0.1091766357421875, 0.14069366455078125, 0.172210693359375, 0.20372772216796875, 0.2352447509765625, 0.26676177978515625, 0.29827880859375, 0.32979583740234375, 0.3613128662109375, 0.39282989501953125, 0.424346923828125, 0.45586395263671875, 0.4873809814453125, 0.5188980102539062, 0.5504150390625, 0.5819320678710938, 0.6134490966796875, 0.6449661254882812, 0.676483154296875, 0.7080001831054688, 0.7395172119140625, 0.7710342407226562, 0.80255126953125, 0.8340682983398438, 0.8655853271484375, 0.8971023559570312, 0.928619384765625, 0.9601364135742188, 0.9916534423828125, 1.0231704711914062, 1.0546875]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 13.0, 24.0, 55.0, 163.0, 377.0, 239.0, 95.0, 29.0, 6.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.025633031502366066, -0.023612642660737038, -0.02159225568175316, -0.01957186684012413, -0.017551477998495102, -0.015531089156866074, -0.01351070124655962, -0.011490313336253166, -0.009469924494624138, -0.007449536118656397, -0.005429147742688656, -0.003408759366720915, -0.0013883709907531738, 0.0006320178508758545, 0.002652405761182308, 0.004672793671488762, 0.00669318251311779, 0.008713571354746819, 0.010733959265053272, 0.012754347175359726, 0.014774736016988754, 0.016795124858617783, 0.01881551370024681, 0.02083590067923069, 0.02285628952085972, 0.024876678362488747, 0.026897065341472626, 0.028917454183101654, 0.030937843024730682, 0.03295823186635971, 0.03497862070798874, 0.03699900954961777, 0.0390193909406662, 0.04103977978229523, 0.043060168623924255, 0.045080557465553284, 0.04710094630718231, 0.04912133514881134, 0.05114172026515007, 0.0531621091067791, 0.05518249794840813, 0.057202886790037155, 0.059223275631666183, 0.06124366447329521, 0.06326404958963394, 0.06528443843126297, 0.067304827272892, 0.06932521611452103, 0.07134560495615005, 0.07336599379777908, 0.07538638263940811, 0.07740677148103714, 0.07942716032266617, 0.0814475491642952, 0.08346793800592422, 0.08548831939697266, 0.08750870823860168, 0.08952909708023071, 0.09154948592185974, 0.09356987476348877, 0.0955902636051178, 0.09761065244674683, 0.09963104128837585, 0.10165143013000488, 0.10367181897163391]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 3.0, 6.0, 8.0, 14.0, 11.0, 14.0, 13.0, 24.0, 16.0, 20.0, 32.0, 36.0, 32.0, 45.0, 33.0, 27.0, 56.0, 56.0, 47.0, 49.0, 54.0, 51.0, 40.0, 43.0, 42.0, 32.0, 35.0, 21.0, 25.0, 23.0, 18.0, 24.0, 9.0, 10.0, 14.0, 6.0, 12.0, 3.0, 1.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.021982908248901367, -0.02121187001466751, -0.020440833643078804, -0.019669797271490097, -0.01889875903725624, -0.018127720803022385, -0.017356684431433678, -0.01658564805984497, -0.015814609825611115, -0.015043572522699833, -0.014272535219788551, -0.01350149791687727, -0.012730460613965988, -0.011959423311054707, -0.011188386008143425, -0.010417348705232143, -0.009646311402320862, -0.00887527409940958, -0.008104236796498299, -0.007333199493587017, -0.0065621621906757355, -0.005791124887764454, -0.005020087584853172, -0.004249050281941891, -0.003478012979030609, -0.0027069756761193275, -0.001935938373208046, -0.0011649010702967644, -0.0003938637673854828, 0.0003771735355257988, 0.0011482108384370804, 0.001919248141348362, 0.0026902854442596436, 0.003461322747170925, 0.004232360050082207, 0.005003397352993488, 0.00577443465590477, 0.0065454719588160515, 0.007316509261727333, 0.008087546564638615, 0.008858583867549896, 0.009629621170461178, 0.01040065847337246, 0.011171695776283741, 0.011942733079195023, 0.012713770382106304, 0.013484807685017586, 0.014255844987928867, 0.015026882290840149, 0.015797920525074005, 0.016568956896662712, 0.01733999326825142, 0.018111031502485275, 0.01888206973671913, 0.01965310610830784, 0.020424142479896545, 0.0211951807141304, 0.021966218948364258, 0.022737255319952965, 0.023508291691541672, 0.024279329925775528, 0.025050368160009384, 0.02582140453159809, 0.026592440903186798, 0.027363479137420654]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 3.0, 4.0, 3.0, 4.0, 6.0, 5.0, 8.0, 16.0, 13.0, 12.0, 17.0, 21.0, 17.0, 36.0, 30.0, 31.0, 31.0, 33.0, 36.0, 45.0, 40.0, 50.0, 40.0, 48.0, 38.0, 30.0, 44.0, 39.0, 42.0, 45.0, 35.0, 27.0, 29.0, 23.0, 20.0, 17.0, 19.0, 9.0, 8.0, 5.0, 11.0, 3.0, 4.0, 1.0, 2.0, 2.0, 5.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.46875, -45.82470703125, -44.1806640625, -42.53662109375, -40.892578125, -39.24853515625, -37.6044921875, -35.96044921875, -34.31640625, -32.67236328125, -31.0283203125, -29.38427734375, -27.740234375, -26.09619140625, -24.4521484375, -22.80810546875, -21.1640625, -19.52001953125, -17.8759765625, -16.23193359375, -14.587890625, -12.94384765625, -11.2998046875, -9.65576171875, -8.01171875, -6.36767578125, -4.7236328125, -3.07958984375, -1.435546875, 0.20849609375, 1.8525390625, 3.49658203125, 5.140625, 6.78466796875, 8.4287109375, 10.07275390625, 11.716796875, 13.36083984375, 15.0048828125, 16.64892578125, 18.29296875, 19.93701171875, 21.5810546875, 23.22509765625, 24.869140625, 26.51318359375, 28.1572265625, 29.80126953125, 31.4453125, 33.08935546875, 34.7333984375, 36.37744140625, 38.021484375, 39.66552734375, 41.3095703125, 42.95361328125, 44.59765625, 46.24169921875, 47.8857421875, 49.52978515625, 51.173828125, 52.81787109375, 54.4619140625, 56.10595703125, 57.75]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 3.0, 5.0, 3.0, 4.0, 10.0, 4.0, 11.0, 20.0, 15.0, 20.0, 27.0, 43.0, 39.0, 75.0, 85.0, 126.0, 181.0, 243.0, 467.0, 867.0, 2772.0, 19668.0, 748100.0, 261340.0, 10523.0, 1939.0, 729.0, 361.0, 250.0, 165.0, 117.0, 75.0, 62.0, 54.0, 33.0, 26.0, 26.0, 14.0, 13.0, 11.0, 12.0, 5.0, 5.0, 1.0, 2.0, 2.0, 5.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-95.4375, -92.1318359375, -88.826171875, -85.5205078125, -82.21484375, -78.9091796875, -75.603515625, -72.2978515625, -68.9921875, -65.6865234375, -62.380859375, -59.0751953125, -55.76953125, -52.4638671875, -49.158203125, -45.8525390625, -42.546875, -39.2412109375, -35.935546875, -32.6298828125, -29.32421875, -26.0185546875, -22.712890625, -19.4072265625, -16.1015625, -12.7958984375, -9.490234375, -6.1845703125, -2.87890625, 0.4267578125, 3.732421875, 7.0380859375, 10.34375, 13.6494140625, 16.955078125, 20.2607421875, 23.56640625, 26.8720703125, 30.177734375, 33.4833984375, 36.7890625, 40.0947265625, 43.400390625, 46.7060546875, 50.01171875, 53.3173828125, 56.623046875, 59.9287109375, 63.234375, 66.5400390625, 69.845703125, 73.1513671875, 76.45703125, 79.7626953125, 83.068359375, 86.3740234375, 89.6796875, 92.9853515625, 96.291015625, 99.5966796875, 102.90234375, 106.2080078125, 109.513671875, 112.8193359375, 116.125]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 6.0, 6.0, 10.0, 8.0, 11.0, 14.0, 15.0, 22.0, 18.0, 17.0, 28.0, 23.0, 30.0, 29.0, 30.0, 33.0, 32.0, 33.0, 54.0, 161.0, 1868.0, 102.0, 60.0, 44.0, 51.0, 38.0, 42.0, 34.0, 22.0, 23.0, 21.0, 23.0, 23.0, 27.0, 11.0, 11.0, 14.0, 5.0, 8.0, 10.0, 12.0, 7.0, 2.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-123.1875, -119.1416015625, -115.095703125, -111.0498046875, -107.00390625, -102.9580078125, -98.912109375, -94.8662109375, -90.8203125, -86.7744140625, -82.728515625, -78.6826171875, -74.63671875, -70.5908203125, -66.544921875, -62.4990234375, -58.453125, -54.4072265625, -50.361328125, -46.3154296875, -42.26953125, -38.2236328125, -34.177734375, -30.1318359375, -26.0859375, -22.0400390625, -17.994140625, -13.9482421875, -9.90234375, -5.8564453125, -1.810546875, 2.2353515625, 6.28125, 10.3271484375, 14.373046875, 18.4189453125, 22.46484375, 26.5107421875, 30.556640625, 34.6025390625, 38.6484375, 42.6943359375, 46.740234375, 50.7861328125, 54.83203125, 58.8779296875, 62.923828125, 66.9697265625, 71.015625, 75.0615234375, 79.107421875, 83.1533203125, 87.19921875, 91.2451171875, 95.291015625, 99.3369140625, 103.3828125, 107.4287109375, 111.474609375, 115.5205078125, 119.56640625, 123.6123046875, 127.658203125, 131.7041015625, 135.75]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 3.0, 5.0, 6.0, 12.0, 10.0, 7.0, 9.0, 14.0, 18.0, 12.0, 29.0, 27.0, 34.0, 29.0, 42.0, 44.0, 76.0, 111.0, 167.0, 269.0, 581.0, 2467.0, 2909520.0, 229291.0, 1629.0, 487.0, 248.0, 137.0, 100.0, 55.0, 46.0, 38.0, 30.0, 26.0, 15.0, 28.0, 15.0, 15.0, 16.0, 6.0, 9.0, 8.0, 5.0, 3.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-322.0, -312.50390625, -303.0078125, -293.51171875, -284.015625, -274.51953125, -265.0234375, -255.52734375, -246.03125, -236.53515625, -227.0390625, -217.54296875, -208.046875, -198.55078125, -189.0546875, -179.55859375, -170.0625, -160.56640625, -151.0703125, -141.57421875, -132.078125, -122.58203125, -113.0859375, -103.58984375, -94.09375, -84.59765625, -75.1015625, -65.60546875, -56.109375, -46.61328125, -37.1171875, -27.62109375, -18.125, -8.62890625, 0.8671875, 10.36328125, 19.859375, 29.35546875, 38.8515625, 48.34765625, 57.84375, 67.33984375, 76.8359375, 86.33203125, 95.828125, 105.32421875, 114.8203125, 124.31640625, 133.8125, 143.30859375, 152.8046875, 162.30078125, 171.796875, 181.29296875, 190.7890625, 200.28515625, 209.78125, 219.27734375, 228.7734375, 238.26953125, 247.765625, 257.26171875, 266.7578125, 276.25390625, 285.75]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0, 87.0, 384.0, 442.0, 89.0, 10.0, 1.0, 0.0, 0.0, 2.0], "bins": [-645.3421630859375, -634.0117797851562, -622.6814575195312, -611.35107421875, -600.020751953125, -588.6903686523438, -577.3600463867188, -566.0296630859375, -554.6993408203125, -543.3689575195312, -532.0386352539062, -520.708251953125, -509.3779296875, -498.04754638671875, -486.71722412109375, -475.3868408203125, -464.05645751953125, -452.7261047363281, -441.395751953125, -430.0653991699219, -418.73504638671875, -407.4046630859375, -396.0743408203125, -384.74395751953125, -373.41363525390625, -362.0832824707031, -350.7529296875, -339.4225769042969, -328.09222412109375, -316.7618408203125, -305.4315185546875, -294.10113525390625, -282.7707824707031, -271.4404296875, -260.1100769042969, -248.77972412109375, -237.44935607910156, -226.11900329589844, -214.7886505126953, -203.45828247070312, -192.1279296875, -180.79757690429688, -169.46722412109375, -158.13687133789062, -146.80650329589844, -135.4761505126953, -124.14579772949219, -112.81543731689453, -101.4850845336914, -90.15473175048828, -78.82437133789062, -67.4940185546875, -56.16366195678711, -44.83330535888672, -33.502952575683594, -22.172592163085938, -10.842239379882812, 0.4881162643432617, 11.818471908569336, 23.148826599121094, 34.479183197021484, 45.809539794921875, 57.139892578125, 68.47025299072266, 79.80060577392578]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 7.0, 5.0, 5.0, 5.0, 8.0, 15.0, 13.0, 20.0, 19.0, 20.0, 18.0, 36.0, 24.0, 20.0, 24.0, 32.0, 31.0, 40.0, 47.0, 41.0, 45.0, 47.0, 46.0, 50.0, 36.0, 29.0, 33.0, 27.0, 38.0, 28.0, 24.0, 26.0, 22.0, 19.0, 17.0, 14.0, 14.0, 14.0, 11.0, 10.0, 5.0, 4.0, 7.0, 5.0, 3.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-303.28436279296875, -293.1263427734375, -282.96832275390625, -272.8102722167969, -262.6522521972656, -252.49423217773438, -242.33621215820312, -232.1781768798828, -222.0201416015625, -211.86212158203125, -201.70408630371094, -191.5460662841797, -181.38803100585938, -171.23001098632812, -161.07199096679688, -150.91395568847656, -140.7559356689453, -130.59791564941406, -120.43988037109375, -110.2818603515625, -100.12382507324219, -89.96580505371094, -79.80777740478516, -69.64974975585938, -59.491722106933594, -49.33369445800781, -39.17566680908203, -29.017642974853516, -18.859615325927734, -8.701587677001953, 1.4564361572265625, 11.614463806152344, 21.772491455078125, 31.930519104003906, 42.08854675292969, 52.2465705871582, 62.404598236083984, 72.5626220703125, 82.72064971923828, 92.87867736816406, 103.03670501708984, 113.19473266601562, 123.3527603149414, 133.5107879638672, 143.66880798339844, 153.82684326171875, 163.98486328125, 174.14288330078125, 184.30091857910156, 194.4589385986328, 204.61697387695312, 214.77499389648438, 224.9330291748047, 235.09104919433594, 245.24908447265625, 255.4071044921875, 265.56512451171875, 275.72314453125, 285.88116455078125, 296.0392150878906, 306.1972351074219, 316.3552551269531, 326.5132751464844, 336.67132568359375, 346.829345703125]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 3.0, 4.0, 2.0, 3.0, 2.0, 3.0, 8.0, 4.0, 9.0, 9.0, 14.0, 12.0, 19.0, 18.0, 21.0, 32.0, 21.0, 38.0, 31.0, 33.0, 29.0, 41.0, 39.0, 55.0, 52.0, 29.0, 41.0, 40.0, 42.0, 41.0, 42.0, 39.0, 40.0, 33.0, 27.0, 26.0, 22.0, 21.0, 13.0, 14.0, 8.0, 8.0, 5.0, 5.0, 6.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.84375, -45.181640625, -43.51953125, -41.857421875, -40.1953125, -38.533203125, -36.87109375, -35.208984375, -33.546875, -31.884765625, -30.22265625, -28.560546875, -26.8984375, -25.236328125, -23.57421875, -21.912109375, -20.25, -18.587890625, -16.92578125, -15.263671875, -13.6015625, -11.939453125, -10.27734375, -8.615234375, -6.953125, -5.291015625, -3.62890625, -1.966796875, -0.3046875, 1.357421875, 3.01953125, 4.681640625, 6.34375, 8.005859375, 9.66796875, 11.330078125, 12.9921875, 14.654296875, 16.31640625, 17.978515625, 19.640625, 21.302734375, 22.96484375, 24.626953125, 26.2890625, 27.951171875, 29.61328125, 31.275390625, 32.9375, 34.599609375, 36.26171875, 37.923828125, 39.5859375, 41.248046875, 42.91015625, 44.572265625, 46.234375, 47.896484375, 49.55859375, 51.220703125, 52.8828125, 54.544921875, 56.20703125, 57.869140625, 59.53125]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 6.0, 6.0, 12.0, 8.0, 19.0, 11.0, 25.0, 51.0, 43.0, 72.0, 108.0, 151.0, 202.0, 323.0, 446.0, 735.0, 1044.0, 1724.0, 2727.0, 4812.0, 9266.0, 20569.0, 102826.0, 3386183.0, 597189.0, 36271.0, 13351.0, 6370.0, 3658.0, 2133.0, 1317.0, 897.0, 574.0, 355.0, 259.0, 181.0, 122.0, 78.0, 47.0, 36.0, 25.0, 16.0, 16.0, 9.0, 8.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-174.5, -169.001953125, -163.50390625, -158.005859375, -152.5078125, -147.009765625, -141.51171875, -136.013671875, -130.515625, -125.017578125, -119.51953125, -114.021484375, -108.5234375, -103.025390625, -97.52734375, -92.029296875, -86.53125, -81.033203125, -75.53515625, -70.037109375, -64.5390625, -59.041015625, -53.54296875, -48.044921875, -42.546875, -37.048828125, -31.55078125, -26.052734375, -20.5546875, -15.056640625, -9.55859375, -4.060546875, 1.4375, 6.935546875, 12.43359375, 17.931640625, 23.4296875, 28.927734375, 34.42578125, 39.923828125, 45.421875, 50.919921875, 56.41796875, 61.916015625, 67.4140625, 72.912109375, 78.41015625, 83.908203125, 89.40625, 94.904296875, 100.40234375, 105.900390625, 111.3984375, 116.896484375, 122.39453125, 127.892578125, 133.390625, 138.888671875, 144.38671875, 149.884765625, 155.3828125, 160.880859375, 166.37890625, 171.876953125, 177.375]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 7.0, 1.0, 3.0, 2.0, 3.0, 4.0, 8.0, 5.0, 10.0, 10.0, 15.0, 19.0, 14.0, 22.0, 39.0, 46.0, 66.0, 124.0, 254.0, 433.0, 814.0, 991.0, 564.0, 237.0, 135.0, 70.0, 37.0, 33.0, 28.0, 20.0, 16.0, 7.0, 2.0, 5.0, 5.0, 8.0, 7.0, 4.0, 6.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-114.25, -110.9990234375, -107.748046875, -104.4970703125, -101.24609375, -97.9951171875, -94.744140625, -91.4931640625, -88.2421875, -84.9912109375, -81.740234375, -78.4892578125, -75.23828125, -71.9873046875, -68.736328125, -65.4853515625, -62.234375, -58.9833984375, -55.732421875, -52.4814453125, -49.23046875, -45.9794921875, -42.728515625, -39.4775390625, -36.2265625, -32.9755859375, -29.724609375, -26.4736328125, -23.22265625, -19.9716796875, -16.720703125, -13.4697265625, -10.21875, -6.9677734375, -3.716796875, -0.4658203125, 2.78515625, 6.0361328125, 9.287109375, 12.5380859375, 15.7890625, 19.0400390625, 22.291015625, 25.5419921875, 28.79296875, 32.0439453125, 35.294921875, 38.5458984375, 41.796875, 45.0478515625, 48.298828125, 51.5498046875, 54.80078125, 58.0517578125, 61.302734375, 64.5537109375, 67.8046875, 71.0556640625, 74.306640625, 77.5576171875, 80.80859375, 84.0595703125, 87.310546875, 90.5615234375, 93.8125]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 6.0, 7.0, 12.0, 5.0, 11.0, 14.0, 30.0, 37.0, 51.0, 79.0, 107.0, 204.0, 324.0, 595.0, 1127.0, 2268.0, 4636.0, 10643.0, 26272.0, 98264.0, 3153869.0, 797785.0, 62264.0, 19669.0, 8139.0, 3692.0, 1884.0, 969.0, 502.0, 293.0, 179.0, 123.0, 63.0, 47.0, 28.0, 29.0, 15.0, 13.0, 7.0, 8.0, 3.0, 3.0, 5.0, 0.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-178.375, -172.193359375, -166.01171875, -159.830078125, -153.6484375, -147.466796875, -141.28515625, -135.103515625, -128.921875, -122.740234375, -116.55859375, -110.376953125, -104.1953125, -98.013671875, -91.83203125, -85.650390625, -79.46875, -73.287109375, -67.10546875, -60.923828125, -54.7421875, -48.560546875, -42.37890625, -36.197265625, -30.015625, -23.833984375, -17.65234375, -11.470703125, -5.2890625, 0.892578125, 7.07421875, 13.255859375, 19.4375, 25.619140625, 31.80078125, 37.982421875, 44.1640625, 50.345703125, 56.52734375, 62.708984375, 68.890625, 75.072265625, 81.25390625, 87.435546875, 93.6171875, 99.798828125, 105.98046875, 112.162109375, 118.34375, 124.525390625, 130.70703125, 136.888671875, 143.0703125, 149.251953125, 155.43359375, 161.615234375, 167.796875, 173.978515625, 180.16015625, 186.341796875, 192.5234375, 198.705078125, 204.88671875, 211.068359375, 217.25]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 6.0, 3.0, 9.0, 13.0, 21.0, 42.0, 91.0, 170.0, 270.0, 193.0, 103.0, 42.0, 24.0, 13.0, 4.0, 7.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-254.5532684326172, -232.78933715820312, -211.025390625, -189.26145935058594, -167.49752807617188, -145.7335968017578, -123.96965026855469, -102.20571899414062, -80.44178771972656, -58.677852630615234, -36.913917541503906, -15.149978637695312, 6.61395263671875, 28.377883911132812, 50.14183044433594, 71.90576171875, 93.66969299316406, 115.43362426757812, 137.19757080078125, 158.9615020751953, 180.72543334960938, 202.48936462402344, 224.25331115722656, 246.01724243164062, 267.78118896484375, 289.5451354980469, 311.3090515136719, 333.072998046875, 354.8369140625, 376.6008605957031, 398.36480712890625, 420.12872314453125, 441.8927001953125, 463.6566467285156, 485.4205627441406, 507.18450927734375, 528.9484252929688, 550.71240234375, 572.476318359375, 594.240234375, 616.004150390625, 637.76806640625, 659.5320434570312, 681.2959594726562, 703.0598754882812, 724.8238525390625, 746.5877685546875, 768.3516845703125, 790.1156616210938, 811.8795776367188, 833.6435546875, 855.407470703125, 877.17138671875, 898.935302734375, 920.6992797851562, 942.4631958007812, 964.2271728515625, 985.9910888671875, 1007.7550659179688, 1029.51904296875, 1051.282958984375, 1073.046875, 1094.810791015625, 1116.57470703125, 1138.338623046875]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 6.0, 5.0, 8.0, 2.0, 13.0, 10.0, 15.0, 16.0, 12.0, 23.0, 27.0, 19.0, 31.0, 32.0, 40.0, 32.0, 40.0, 34.0, 44.0, 51.0, 52.0, 43.0, 40.0, 33.0, 47.0, 44.0, 37.0, 32.0, 27.0, 28.0, 23.0, 19.0, 21.0, 15.0, 13.0, 13.0, 13.0, 10.0, 8.0, 8.0, 8.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-290.7010192871094, -281.8777770996094, -273.0545349121094, -264.23126220703125, -255.40802001953125, -246.58477783203125, -237.76153564453125, -228.93829345703125, -220.1150360107422, -211.2917938232422, -202.46853637695312, -193.64529418945312, -184.82205200195312, -175.99879455566406, -167.17555236816406, -158.352294921875, -149.529052734375, -140.705810546875, -131.88255310058594, -123.05931091308594, -114.2360610961914, -105.41281127929688, -96.58956909179688, -87.76631927490234, -78.94306945800781, -70.11981964111328, -61.296573638916016, -52.47332763671875, -43.65007781982422, -34.82682800292969, -26.003582000732422, -17.180335998535156, -8.357086181640625, 0.46616172790527344, 9.289409637451172, 18.11265754699707, 26.93590545654297, 35.7591552734375, 44.582401275634766, 53.40564727783203, 62.22889709472656, 71.0521469116211, 79.87539672851562, 88.69863891601562, 97.52188873291016, 106.34513854980469, 115.16838073730469, 123.99163055419922, 132.81488037109375, 141.63812255859375, 150.4613800048828, 159.2846221923828, 168.10787963867188, 176.93112182617188, 185.75436401367188, 194.57760620117188, 203.40086364746094, 212.22410583496094, 221.04736328125, 229.87060546875, 238.69384765625, 247.51710510253906, 256.3403625488281, 265.1636047363281, 273.9868469238281]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 2.0, 2.0, 1.0, 4.0, 2.0, 4.0, 5.0, 11.0, 9.0, 17.0, 15.0, 9.0, 10.0, 20.0, 23.0, 33.0, 28.0, 24.0, 31.0, 30.0, 34.0, 44.0, 47.0, 43.0, 39.0, 41.0, 52.0, 40.0, 47.0, 40.0, 36.0, 37.0, 31.0, 26.0, 23.0, 29.0, 18.0, 23.0, 13.0, 14.0, 9.0, 9.0, 9.0, 10.0, 7.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.0625, -46.3583984375, -44.654296875, -42.9501953125, -41.24609375, -39.5419921875, -37.837890625, -36.1337890625, -34.4296875, -32.7255859375, -31.021484375, -29.3173828125, -27.61328125, -25.9091796875, -24.205078125, -22.5009765625, -20.796875, -19.0927734375, -17.388671875, -15.6845703125, -13.98046875, -12.2763671875, -10.572265625, -8.8681640625, -7.1640625, -5.4599609375, -3.755859375, -2.0517578125, -0.34765625, 1.3564453125, 3.060546875, 4.7646484375, 6.46875, 8.1728515625, 9.876953125, 11.5810546875, 13.28515625, 14.9892578125, 16.693359375, 18.3974609375, 20.1015625, 21.8056640625, 23.509765625, 25.2138671875, 26.91796875, 28.6220703125, 30.326171875, 32.0302734375, 33.734375, 35.4384765625, 37.142578125, 38.8466796875, 40.55078125, 42.2548828125, 43.958984375, 45.6630859375, 47.3671875, 49.0712890625, 50.775390625, 52.4794921875, 54.18359375, 55.8876953125, 57.591796875, 59.2958984375, 61.0]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 5.0, 4.0, 7.0, 11.0, 24.0, 26.0, 39.0, 66.0, 99.0, 151.0, 247.0, 361.0, 503.0, 820.0, 1304.0, 1994.0, 2984.0, 4688.0, 7186.0, 11567.0, 18104.0, 30189.0, 51747.0, 96385.0, 197681.0, 285033.0, 151198.0, 76411.0, 42259.0, 24952.0, 15275.0, 9731.0, 6221.0, 3931.0, 2535.0, 1640.0, 1081.0, 733.0, 464.0, 301.0, 205.0, 123.0, 89.0, 73.0, 41.0, 25.0, 17.0, 17.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.984375, -2.894805908203125, -2.80523681640625, -2.715667724609375, -2.6260986328125, -2.536529541015625, -2.44696044921875, -2.357391357421875, -2.267822265625, -2.178253173828125, -2.08868408203125, -1.999114990234375, -1.9095458984375, -1.819976806640625, -1.73040771484375, -1.640838623046875, -1.55126953125, -1.461700439453125, -1.37213134765625, -1.282562255859375, -1.1929931640625, -1.103424072265625, -1.01385498046875, -0.924285888671875, -0.834716796875, -0.745147705078125, -0.65557861328125, -0.566009521484375, -0.4764404296875, -0.386871337890625, -0.29730224609375, -0.207733154296875, -0.1181640625, -0.028594970703125, 0.06097412109375, 0.150543212890625, 0.2401123046875, 0.329681396484375, 0.41925048828125, 0.508819580078125, 0.598388671875, 0.687957763671875, 0.77752685546875, 0.867095947265625, 0.9566650390625, 1.046234130859375, 1.13580322265625, 1.225372314453125, 1.31494140625, 1.404510498046875, 1.49407958984375, 1.583648681640625, 1.6732177734375, 1.762786865234375, 1.85235595703125, 1.941925048828125, 2.031494140625, 2.121063232421875, 2.21063232421875, 2.300201416015625, 2.3897705078125, 2.479339599609375, 2.56890869140625, 2.658477783203125, 2.748046875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 7.0, 7.0, 5.0, 10.0, 11.0, 13.0, 19.0, 17.0, 15.0, 16.0, 25.0, 30.0, 40.0, 38.0, 41.0, 40.0, 37.0, 49.0, 40.0, 1071.0, 53.0, 49.0, 43.0, 31.0, 38.0, 42.0, 35.0, 25.0, 22.0, 20.0, 26.0, 24.0, 11.0, 14.0, 16.0, 11.0, 11.0, 7.0, 3.0, 5.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-36.09375, -34.91455078125, -33.7353515625, -32.55615234375, -31.376953125, -30.19775390625, -29.0185546875, -27.83935546875, -26.66015625, -25.48095703125, -24.3017578125, -23.12255859375, -21.943359375, -20.76416015625, -19.5849609375, -18.40576171875, -17.2265625, -16.04736328125, -14.8681640625, -13.68896484375, -12.509765625, -11.33056640625, -10.1513671875, -8.97216796875, -7.79296875, -6.61376953125, -5.4345703125, -4.25537109375, -3.076171875, -1.89697265625, -0.7177734375, 0.46142578125, 1.640625, 2.81982421875, 3.9990234375, 5.17822265625, 6.357421875, 7.53662109375, 8.7158203125, 9.89501953125, 11.07421875, 12.25341796875, 13.4326171875, 14.61181640625, 15.791015625, 16.97021484375, 18.1494140625, 19.32861328125, 20.5078125, 21.68701171875, 22.8662109375, 24.04541015625, 25.224609375, 26.40380859375, 27.5830078125, 28.76220703125, 29.94140625, 31.12060546875, 32.2998046875, 33.47900390625, 34.658203125, 35.83740234375, 37.0166015625, 38.19580078125, 39.375]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 8.0, 8.0, 11.0, 14.0, 26.0, 36.0, 33.0, 78.0, 86.0, 134.0, 234.0, 326.0, 487.0, 749.0, 1183.0, 1897.0, 3044.0, 5038.0, 8422.0, 14022.0, 24185.0, 43911.0, 87687.0, 208008.0, 1392112.0, 150488.0, 69009.0, 35491.0, 20252.0, 11699.0, 6990.0, 4213.0, 2629.0, 1631.0, 1024.0, 673.0, 453.0, 273.0, 185.0, 129.0, 80.0, 55.0, 39.0, 31.0, 12.0, 18.0, 10.0, 6.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0], "bins": [-3.236328125, -3.13623046875, -3.0361328125, -2.93603515625, -2.8359375, -2.73583984375, -2.6357421875, -2.53564453125, -2.435546875, -2.33544921875, -2.2353515625, -2.13525390625, -2.03515625, -1.93505859375, -1.8349609375, -1.73486328125, -1.634765625, -1.53466796875, -1.4345703125, -1.33447265625, -1.234375, -1.13427734375, -1.0341796875, -0.93408203125, -0.833984375, -0.73388671875, -0.6337890625, -0.53369140625, -0.43359375, -0.33349609375, -0.2333984375, -0.13330078125, -0.033203125, 0.06689453125, 0.1669921875, 0.26708984375, 0.3671875, 0.46728515625, 0.5673828125, 0.66748046875, 0.767578125, 0.86767578125, 0.9677734375, 1.06787109375, 1.16796875, 1.26806640625, 1.3681640625, 1.46826171875, 1.568359375, 1.66845703125, 1.7685546875, 1.86865234375, 1.96875, 2.06884765625, 2.1689453125, 2.26904296875, 2.369140625, 2.46923828125, 2.5693359375, 2.66943359375, 2.76953125, 2.86962890625, 2.9697265625, 3.06982421875, 3.169921875]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 1.0, 1.0, 3.0, 5.0, 1.0, 3.0, 5.0, 4.0, 9.0, 8.0, 14.0, 14.0, 16.0, 21.0, 19.0, 23.0, 30.0, 30.0, 27.0, 43.0, 40.0, 62.0, 60.0, 66.0, 81.0, 68.0, 47.0, 42.0, 36.0, 34.0, 27.0, 28.0, 24.0, 20.0, 15.0, 14.0, 13.0, 11.0, 8.0, 7.0, 8.0, 4.0, 5.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0298004150390625, -0.028895854949951172, -0.027991294860839844, -0.027086734771728516, -0.026182174682617188, -0.02527761459350586, -0.02437305450439453, -0.023468494415283203, -0.022563934326171875, -0.021659374237060547, -0.02075481414794922, -0.01985025405883789, -0.018945693969726562, -0.018041133880615234, -0.017136573791503906, -0.016232013702392578, -0.01532745361328125, -0.014422893524169922, -0.013518333435058594, -0.012613773345947266, -0.011709213256835938, -0.01080465316772461, -0.009900093078613281, -0.008995532989501953, -0.008090972900390625, -0.007186412811279297, -0.006281852722167969, -0.005377292633056641, -0.0044727325439453125, -0.0035681724548339844, -0.0026636123657226562, -0.0017590522766113281, -0.0008544921875, 5.0067901611328125e-05, 0.0009546279907226562, 0.0018591880798339844, 0.0027637481689453125, 0.0036683082580566406, 0.004572868347167969, 0.005477428436279297, 0.006381988525390625, 0.007286548614501953, 0.008191108703613281, 0.00909566879272461, 0.010000228881835938, 0.010904788970947266, 0.011809349060058594, 0.012713909149169922, 0.01361846923828125, 0.014523029327392578, 0.015427589416503906, 0.016332149505615234, 0.017236709594726562, 0.01814126968383789, 0.01904582977294922, 0.019950389862060547, 0.020854949951171875, 0.021759510040283203, 0.02266407012939453, 0.02356863021850586, 0.024473190307617188, 0.025377750396728516, 0.026282310485839844, 0.027186870574951172, 0.0280914306640625]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 1.0, 11.0, 5.0, 9.0, 12.0, 11.0, 17.0, 23.0, 27.0, 36.0, 42.0, 50.0, 56.0, 84.0, 127.0, 202.0, 446.0, 3554.0, 888943.0, 152289.0, 1577.0, 348.0, 186.0, 116.0, 76.0, 66.0, 41.0, 36.0, 35.0, 19.0, 32.0, 21.0, 15.0, 10.0, 5.0, 8.0, 5.0, 3.0, 4.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.62744140625, -0.608917236328125, -0.59039306640625, -0.571868896484375, -0.5533447265625, -0.534820556640625, -0.51629638671875, -0.497772216796875, -0.479248046875, -0.460723876953125, -0.44219970703125, -0.423675537109375, -0.4051513671875, -0.386627197265625, -0.36810302734375, -0.349578857421875, -0.3310546875, -0.312530517578125, -0.29400634765625, -0.275482177734375, -0.2569580078125, -0.238433837890625, -0.21990966796875, -0.201385498046875, -0.182861328125, -0.164337158203125, -0.14581298828125, -0.127288818359375, -0.1087646484375, -0.090240478515625, -0.07171630859375, -0.053192138671875, -0.03466796875, -0.016143798828125, 0.00238037109375, 0.020904541015625, 0.0394287109375, 0.057952880859375, 0.07647705078125, 0.095001220703125, 0.113525390625, 0.132049560546875, 0.15057373046875, 0.169097900390625, 0.1876220703125, 0.206146240234375, 0.22467041015625, 0.243194580078125, 0.26171875, 0.280242919921875, 0.29876708984375, 0.317291259765625, 0.3358154296875, 0.354339599609375, 0.37286376953125, 0.391387939453125, 0.409912109375, 0.428436279296875, 0.44696044921875, 0.465484619140625, 0.4840087890625, 0.502532958984375, 0.52105712890625, 0.539581298828125, 0.55810546875]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 29.0, 740.0, 237.0, 8.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.031296346336603165, -0.02586252987384796, -0.020428715273737907, -0.014994900673627853, -0.00956108421087265, -0.004127267748117447, 0.0013065449893474579, 0.006740361452102661, 0.012174177914857864, 0.017607994377613068, 0.02304180897772312, 0.028475623577833176, 0.03390944004058838, 0.03934325650334358, 0.04477706924080849, 0.05021088570356369, 0.05564470216631889, 0.0610785186290741, 0.066512331366539, 0.0719461441040039, 0.07737996429204941, 0.08281378448009491, 0.08824759721755981, 0.09368140995502472, 0.09911522269248962, 0.10454903542995453, 0.10998285561800003, 0.11541666835546494, 0.12085048854351044, 0.12628430128097534, 0.13171811401844025, 0.13715192675590515, 0.14258575439453125, 0.14801956713199615, 0.15345337986946106, 0.15888720750808716, 0.16432102024555206, 0.16975483298301697, 0.17518864572048187, 0.18062245845794678, 0.18605628609657288, 0.19149009883403778, 0.19692391157150269, 0.20235773921012878, 0.2077915519475937, 0.2132253646850586, 0.2186591774225235, 0.2240929901599884, 0.2295268028974533, 0.2349606156349182, 0.24039442837238312, 0.24582824110984802, 0.2512620687484741, 0.25669586658477783, 0.26212969422340393, 0.26756352186203003, 0.27299731969833374, 0.27843114733695984, 0.28386494517326355, 0.28929877281188965, 0.29473257064819336, 0.30016639828681946, 0.30560022592544556, 0.31103402376174927, 0.31646785140037537]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 8.0, 12.0, 7.0, 7.0, 15.0, 16.0, 16.0, 23.0, 18.0, 26.0, 27.0, 31.0, 29.0, 34.0, 37.0, 38.0, 31.0, 42.0, 36.0, 40.0, 38.0, 35.0, 45.0, 38.0, 43.0, 29.0, 37.0, 36.0, 32.0, 24.0, 28.0, 25.0, 21.0, 12.0, 16.0, 9.0, 5.0, 4.0, 10.0, 5.0, 4.0, 7.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.016697227954864502, -0.016158541664481163, -0.015619855374097824, -0.015081169083714485, -0.014542482793331146, -0.014003796502947807, -0.013465110212564468, -0.01292642392218113, -0.01238773763179779, -0.011849051341414452, -0.011310365051031113, -0.010771678760647774, -0.010232992470264435, -0.009694306179881096, -0.009155619889497757, -0.008616933599114418, -0.008078247308731079, -0.00753956101834774, -0.007000874727964401, -0.006462188437581062, -0.005923502147197723, -0.0053848158568143845, -0.0048461295664310455, -0.004307443276047707, -0.0037687569856643677, -0.0032300706952810287, -0.00269138440489769, -0.002152698114514351, -0.001614011824131012, -0.001075325533747673, -0.0005366392433643341, 2.0470470190048218e-06, 0.0005407333374023438, 0.0010794196277856827, 0.0016181059181690216, 0.0021567922085523605, 0.0026954784989356995, 0.0032341647893190384, 0.0037728510797023773, 0.004311537370085716, 0.004850223660469055, 0.005388909950852394, 0.005927596241235733, 0.006466282531619072, 0.007004968822002411, 0.00754365511238575, 0.008082341402769089, 0.008621027693152428, 0.009159713983535767, 0.009698400273919106, 0.010237086564302444, 0.010775772854685783, 0.011314459145069122, 0.011853145435452461, 0.0123918317258358, 0.012930518016219139, 0.013469204306602478, 0.014007890596985817, 0.014546576887369156, 0.015085263177752495, 0.015623949468135834, 0.016162635758519173, 0.01670132204890251, 0.01724000833928585, 0.01777869462966919]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 2.0, 2.0, 1.0, 4.0, 2.0, 4.0, 5.0, 11.0, 9.0, 17.0, 15.0, 9.0, 10.0, 20.0, 23.0, 33.0, 28.0, 24.0, 31.0, 30.0, 34.0, 44.0, 47.0, 43.0, 39.0, 41.0, 52.0, 41.0, 46.0, 39.0, 37.0, 37.0, 31.0, 26.0, 23.0, 29.0, 18.0, 23.0, 13.0, 14.0, 9.0, 9.0, 9.0, 10.0, 7.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.0625, -46.3583984375, -44.654296875, -42.9501953125, -41.24609375, -39.5419921875, -37.837890625, -36.1337890625, -34.4296875, -32.7255859375, -31.021484375, -29.3173828125, -27.61328125, -25.9091796875, -24.205078125, -22.5009765625, -20.796875, -19.0927734375, -17.388671875, -15.6845703125, -13.98046875, -12.2763671875, -10.572265625, -8.8681640625, -7.1640625, -5.4599609375, -3.755859375, -2.0517578125, -0.34765625, 1.3564453125, 3.060546875, 4.7646484375, 6.46875, 8.1728515625, 9.876953125, 11.5810546875, 13.28515625, 14.9892578125, 16.693359375, 18.3974609375, 20.1015625, 21.8056640625, 23.509765625, 25.2138671875, 26.91796875, 28.6220703125, 30.326171875, 32.0302734375, 33.734375, 35.4384765625, 37.142578125, 38.8466796875, 40.55078125, 42.2548828125, 43.958984375, 45.6630859375, 47.3671875, 49.0712890625, 50.775390625, 52.4794921875, 54.18359375, 55.8876953125, 57.591796875, 59.2958984375, 61.0]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 5.0, 5.0, 5.0, 5.0, 6.0, 6.0, 4.0, 17.0, 26.0, 27.0, 39.0, 39.0, 35.0, 67.0, 87.0, 149.0, 225.0, 354.0, 529.0, 814.0, 1494.0, 2742.0, 5672.0, 14485.0, 100773.0, 868444.0, 33332.0, 9608.0, 4226.0, 2120.0, 1143.0, 706.0, 453.0, 264.0, 179.0, 118.0, 101.0, 64.0, 43.0, 33.0, 24.0, 26.0, 21.0, 17.0, 13.0, 7.0, 5.0, 3.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-122.375, -118.05078125, -113.7265625, -109.40234375, -105.078125, -100.75390625, -96.4296875, -92.10546875, -87.78125, -83.45703125, -79.1328125, -74.80859375, -70.484375, -66.16015625, -61.8359375, -57.51171875, -53.1875, -48.86328125, -44.5390625, -40.21484375, -35.890625, -31.56640625, -27.2421875, -22.91796875, -18.59375, -14.26953125, -9.9453125, -5.62109375, -1.296875, 3.02734375, 7.3515625, 11.67578125, 16.0, 20.32421875, 24.6484375, 28.97265625, 33.296875, 37.62109375, 41.9453125, 46.26953125, 50.59375, 54.91796875, 59.2421875, 63.56640625, 67.890625, 72.21484375, 76.5390625, 80.86328125, 85.1875, 89.51171875, 93.8359375, 98.16015625, 102.484375, 106.80859375, 111.1328125, 115.45703125, 119.78125, 124.10546875, 128.4296875, 132.75390625, 137.078125, 141.40234375, 145.7265625, 150.05078125, 154.375]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 5.0, 2.0, 7.0, 7.0, 8.0, 9.0, 8.0, 13.0, 11.0, 21.0, 27.0, 27.0, 24.0, 40.0, 39.0, 39.0, 46.0, 34.0, 61.0, 87.0, 1676.0, 375.0, 79.0, 46.0, 45.0, 37.0, 52.0, 37.0, 30.0, 29.0, 25.0, 24.0, 14.0, 12.0, 6.0, 12.0, 14.0, 5.0, 7.0, 4.0, 4.0, 3.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-143.375, -138.736328125, -134.09765625, -129.458984375, -124.8203125, -120.181640625, -115.54296875, -110.904296875, -106.265625, -101.626953125, -96.98828125, -92.349609375, -87.7109375, -83.072265625, -78.43359375, -73.794921875, -69.15625, -64.517578125, -59.87890625, -55.240234375, -50.6015625, -45.962890625, -41.32421875, -36.685546875, -32.046875, -27.408203125, -22.76953125, -18.130859375, -13.4921875, -8.853515625, -4.21484375, 0.423828125, 5.0625, 9.701171875, 14.33984375, 18.978515625, 23.6171875, 28.255859375, 32.89453125, 37.533203125, 42.171875, 46.810546875, 51.44921875, 56.087890625, 60.7265625, 65.365234375, 70.00390625, 74.642578125, 79.28125, 83.919921875, 88.55859375, 93.197265625, 97.8359375, 102.474609375, 107.11328125, 111.751953125, 116.390625, 121.029296875, 125.66796875, 130.306640625, 134.9453125, 139.583984375, 144.22265625, 148.861328125, 153.5]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 7.0, 8.0, 20.0, 11.0, 9.0, 15.0, 19.0, 20.0, 35.0, 39.0, 36.0, 55.0, 72.0, 109.0, 236.0, 724.0, 4993.0, 1836369.0, 1296464.0, 5015.0, 727.0, 246.0, 104.0, 75.0, 54.0, 46.0, 28.0, 31.0, 23.0, 23.0, 15.0, 14.0, 10.0, 11.0, 7.0, 10.0, 6.0, 2.0, 5.0, 1.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-414.25, -401.6953125, -389.140625, -376.5859375, -364.03125, -351.4765625, -338.921875, -326.3671875, -313.8125, -301.2578125, -288.703125, -276.1484375, -263.59375, -251.0390625, -238.484375, -225.9296875, -213.375, -200.8203125, -188.265625, -175.7109375, -163.15625, -150.6015625, -138.046875, -125.4921875, -112.9375, -100.3828125, -87.828125, -75.2734375, -62.71875, -50.1640625, -37.609375, -25.0546875, -12.5, 0.0546875, 12.609375, 25.1640625, 37.71875, 50.2734375, 62.828125, 75.3828125, 87.9375, 100.4921875, 113.046875, 125.6015625, 138.15625, 150.7109375, 163.265625, 175.8203125, 188.375, 200.9296875, 213.484375, 226.0390625, 238.59375, 251.1484375, 263.703125, 276.2578125, 288.8125, 301.3671875, 313.921875, 326.4765625, 339.03125, 351.5859375, 364.140625, 376.6953125, 389.25]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 19.0, 144.0, 529.0, 269.0, 46.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-809.7523193359375, -794.6707153320312, -779.5890502929688, -764.5074462890625, -749.42578125, -734.3441772460938, -719.2625122070312, -704.180908203125, -689.0992431640625, -674.0176391601562, -658.9359741210938, -643.8543701171875, -628.772705078125, -613.6911010742188, -598.6094360351562, -583.52783203125, -568.4461669921875, -553.3645629882812, -538.2828979492188, -523.2012939453125, -508.11962890625, -493.0379943847656, -477.95635986328125, -462.8747253417969, -447.7931213378906, -432.71148681640625, -417.6298522949219, -402.5482177734375, -387.4665832519531, -372.38494873046875, -357.3033142089844, -342.2216796875, -327.1400451660156, -312.05841064453125, -296.9767761230469, -281.8951416015625, -266.8135070800781, -251.73187255859375, -236.65023803710938, -221.568603515625, -206.48696899414062, -191.40533447265625, -176.32369995117188, -161.2420654296875, -146.16043090820312, -131.07879638671875, -115.9971694946289, -100.91553497314453, -85.83390808105469, -70.75227355957031, -55.67063903808594, -40.58900833129883, -25.507373809814453, -10.425743103027344, 4.655891418457031, 19.737525939941406, 34.81916046142578, 49.900794982910156, 64.98242950439453, 80.06405639648438, 95.14569091796875, 110.22732543945312, 125.3089599609375, 140.39059448242188, 155.47222900390625]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 7.0, 6.0, 8.0, 3.0, 12.0, 12.0, 10.0, 9.0, 16.0, 14.0, 30.0, 19.0, 24.0, 38.0, 29.0, 29.0, 44.0, 34.0, 41.0, 36.0, 52.0, 48.0, 36.0, 39.0, 43.0, 37.0, 30.0, 22.0, 37.0, 41.0, 26.0, 27.0, 22.0, 21.0, 20.0, 11.0, 15.0, 15.0, 8.0, 5.0, 6.0, 9.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-351.0616149902344, -339.9876403808594, -328.9136962890625, -317.8397216796875, -306.7657775878906, -295.6918029785156, -284.61785888671875, -273.54388427734375, -262.46990966796875, -251.3959503173828, -240.32199096679688, -229.24801635742188, -218.174072265625, -207.10009765625, -196.02613830566406, -184.95217895507812, -173.87823486328125, -162.8042755126953, -151.73031616210938, -140.65634155273438, -129.5823974609375, -118.50843048095703, -107.43446350097656, -96.36050415039062, -85.28654479980469, -74.21258544921875, -63.13862228393555, -52.064659118652344, -40.990699768066406, -29.91674041748047, -18.8427734375, -7.7688140869140625, 3.30511474609375, 14.37907600402832, 25.45303726196289, 36.527000427246094, 47.60095977783203, 58.67491912841797, 69.74888610839844, 80.82284545898438, 91.89680480957031, 102.97076416015625, 114.04472351074219, 125.11869049072266, 136.19265747070312, 147.2666015625, 158.340576171875, 169.41453552246094, 180.48849487304688, 191.5624542236328, 202.63641357421875, 213.71038818359375, 224.78433227539062, 235.85830688476562, 246.93226623535156, 258.0062255859375, 269.0802001953125, 280.1541748046875, 291.2281188964844, 302.3020935058594, 313.37603759765625, 324.45001220703125, 335.52398681640625, 346.5979309082031, 357.671875]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 5.0, 4.0, 2.0, 7.0, 6.0, 11.0, 11.0, 13.0, 15.0, 15.0, 13.0, 28.0, 26.0, 23.0, 27.0, 43.0, 30.0, 34.0, 41.0, 41.0, 35.0, 46.0, 39.0, 50.0, 51.0, 42.0, 43.0, 35.0, 42.0, 27.0, 30.0, 34.0, 23.0, 15.0, 16.0, 14.0, 17.0, 13.0, 10.0, 9.0, 9.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.15625, -47.42041015625, -45.6845703125, -43.94873046875, -42.212890625, -40.47705078125, -38.7412109375, -37.00537109375, -35.26953125, -33.53369140625, -31.7978515625, -30.06201171875, -28.326171875, -26.59033203125, -24.8544921875, -23.11865234375, -21.3828125, -19.64697265625, -17.9111328125, -16.17529296875, -14.439453125, -12.70361328125, -10.9677734375, -9.23193359375, -7.49609375, -5.76025390625, -4.0244140625, -2.28857421875, -0.552734375, 1.18310546875, 2.9189453125, 4.65478515625, 6.390625, 8.12646484375, 9.8623046875, 11.59814453125, 13.333984375, 15.06982421875, 16.8056640625, 18.54150390625, 20.27734375, 22.01318359375, 23.7490234375, 25.48486328125, 27.220703125, 28.95654296875, 30.6923828125, 32.42822265625, 34.1640625, 35.89990234375, 37.6357421875, 39.37158203125, 41.107421875, 42.84326171875, 44.5791015625, 46.31494140625, 48.05078125, 49.78662109375, 51.5224609375, 53.25830078125, 54.994140625, 56.72998046875, 58.4658203125, 60.20166015625, 61.9375]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 6.0, 5.0, 21.0, 18.0, 24.0, 28.0, 54.0, 77.0, 130.0, 175.0, 313.0, 521.0, 825.0, 1552.0, 2940.0, 6444.0, 16534.0, 93686.0, 3591313.0, 434504.0, 26914.0, 9348.0, 4112.0, 1989.0, 1076.0, 629.0, 360.0, 252.0, 152.0, 94.0, 61.0, 36.0, 30.0, 16.0, 7.0, 5.0, 12.0, 10.0, 4.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-207.75, -201.396484375, -195.04296875, -188.689453125, -182.3359375, -175.982421875, -169.62890625, -163.275390625, -156.921875, -150.568359375, -144.21484375, -137.861328125, -131.5078125, -125.154296875, -118.80078125, -112.447265625, -106.09375, -99.740234375, -93.38671875, -87.033203125, -80.6796875, -74.326171875, -67.97265625, -61.619140625, -55.265625, -48.912109375, -42.55859375, -36.205078125, -29.8515625, -23.498046875, -17.14453125, -10.791015625, -4.4375, 1.916015625, 8.26953125, 14.623046875, 20.9765625, 27.330078125, 33.68359375, 40.037109375, 46.390625, 52.744140625, 59.09765625, 65.451171875, 71.8046875, 78.158203125, 84.51171875, 90.865234375, 97.21875, 103.572265625, 109.92578125, 116.279296875, 122.6328125, 128.986328125, 135.33984375, 141.693359375, 148.046875, 154.400390625, 160.75390625, 167.107421875, 173.4609375, 179.814453125, 186.16796875, 192.521484375, 198.875]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 10.0, 9.0, 9.0, 8.0, 10.0, 19.0, 23.0, 28.0, 63.0, 66.0, 127.0, 301.0, 710.0, 1195.0, 733.0, 362.0, 135.0, 70.0, 44.0, 30.0, 32.0, 19.0, 15.0, 12.0, 6.0, 12.0, 3.0, 9.0, 3.0, 3.0, 2.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-102.4375, -98.7138671875, -94.990234375, -91.2666015625, -87.54296875, -83.8193359375, -80.095703125, -76.3720703125, -72.6484375, -68.9248046875, -65.201171875, -61.4775390625, -57.75390625, -54.0302734375, -50.306640625, -46.5830078125, -42.859375, -39.1357421875, -35.412109375, -31.6884765625, -27.96484375, -24.2412109375, -20.517578125, -16.7939453125, -13.0703125, -9.3466796875, -5.623046875, -1.8994140625, 1.82421875, 5.5478515625, 9.271484375, 12.9951171875, 16.71875, 20.4423828125, 24.166015625, 27.8896484375, 31.61328125, 35.3369140625, 39.060546875, 42.7841796875, 46.5078125, 50.2314453125, 53.955078125, 57.6787109375, 61.40234375, 65.1259765625, 68.849609375, 72.5732421875, 76.296875, 80.0205078125, 83.744140625, 87.4677734375, 91.19140625, 94.9150390625, 98.638671875, 102.3623046875, 106.0859375, 109.8095703125, 113.533203125, 117.2568359375, 120.98046875, 124.7041015625, 128.427734375, 132.1513671875, 135.875]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 2.0, 5.0, 18.0, 11.0, 25.0, 36.0, 55.0, 130.0, 290.0, 737.0, 2092.0, 7046.0, 30313.0, 640711.0, 3450772.0, 48004.0, 9623.0, 2757.0, 949.0, 358.0, 169.0, 73.0, 37.0, 25.0, 17.0, 13.0, 6.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-348.0, -337.80078125, -327.6015625, -317.40234375, -307.203125, -297.00390625, -286.8046875, -276.60546875, -266.40625, -256.20703125, -246.0078125, -235.80859375, -225.609375, -215.41015625, -205.2109375, -195.01171875, -184.8125, -174.61328125, -164.4140625, -154.21484375, -144.015625, -133.81640625, -123.6171875, -113.41796875, -103.21875, -93.01953125, -82.8203125, -72.62109375, -62.421875, -52.22265625, -42.0234375, -31.82421875, -21.625, -11.42578125, -1.2265625, 8.97265625, 19.171875, 29.37109375, 39.5703125, 49.76953125, 59.96875, 70.16796875, 80.3671875, 90.56640625, 100.765625, 110.96484375, 121.1640625, 131.36328125, 141.5625, 151.76171875, 161.9609375, 172.16015625, 182.359375, 192.55859375, 202.7578125, 212.95703125, 223.15625, 233.35546875, 243.5546875, 253.75390625, 263.953125, 274.15234375, 284.3515625, 294.55078125, 304.75]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 24.0, 106.0, 433.0, 350.0, 69.0, 22.0, 3.0, 2.0, 1.0, 1.0], "bins": [-2600.3037109375, -2554.5888671875, -2508.873779296875, -2463.158935546875, -2417.44384765625, -2371.72900390625, -2326.013916015625, -2280.299072265625, -2234.583984375, -2188.869140625, -2143.154052734375, -2097.439208984375, -2051.72412109375, -2006.0091552734375, -1960.294189453125, -1914.5792236328125, -1868.8642578125, -1823.1492919921875, -1777.434326171875, -1731.7193603515625, -1686.00439453125, -1640.2894287109375, -1594.574462890625, -1548.8594970703125, -1503.1446533203125, -1457.4296875, -1411.7147216796875, -1365.999755859375, -1320.2847900390625, -1274.56982421875, -1228.8548583984375, -1183.139892578125, -1137.4249267578125, -1091.7099609375, -1045.9949951171875, -1000.280029296875, -954.5650634765625, -908.85009765625, -863.1351318359375, -817.420166015625, -771.7052001953125, -725.990234375, -680.2752685546875, -634.560302734375, -588.8453369140625, -543.13037109375, -497.4154357910156, -451.7004699707031, -405.9855041503906, -360.2705383300781, -314.5555725097656, -268.84063720703125, -223.1256561279297, -177.4106903076172, -131.69573974609375, -85.98077392578125, -40.26580810546875, 5.449153900146484, 51.16411590576172, 96.87907409667969, 142.5940399169922, 188.3090057373047, 234.02395629882812, 279.7389221191406, 325.4538879394531]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 2.0, 2.0, 4.0, 9.0, 5.0, 12.0, 11.0, 8.0, 13.0, 11.0, 14.0, 18.0, 23.0, 25.0, 34.0, 33.0, 37.0, 30.0, 36.0, 35.0, 27.0, 32.0, 42.0, 42.0, 29.0, 54.0, 43.0, 36.0, 42.0, 29.0, 34.0, 28.0, 30.0, 26.0, 22.0, 25.0, 18.0, 18.0, 12.0, 12.0, 10.0, 11.0, 6.0, 5.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-281.7017822265625, -273.3728332519531, -265.0438537597656, -256.71490478515625, -248.3859405517578, -240.05697631835938, -231.72802734375, -223.39906311035156, -215.07009887695312, -206.7411346435547, -198.41217041015625, -190.08322143554688, -181.75425720214844, -173.42529296875, -165.09634399414062, -156.7673797607422, -148.43841552734375, -140.1094512939453, -131.78048706054688, -123.4515380859375, -115.12257385253906, -106.79360961914062, -98.46465301513672, -90.13569641113281, -81.80673217773438, -73.47776794433594, -65.14881134033203, -56.81985092163086, -48.49089050292969, -40.161930084228516, -31.832969665527344, -23.504009246826172, -15.175018310546875, -6.846057891845703, 1.4829025268554688, 9.81186294555664, 18.140823364257812, 26.469783782958984, 34.798744201660156, 43.12770462036133, 51.4566650390625, 59.78562545776367, 68.11458587646484, 76.44354248046875, 84.77250671386719, 93.10147094726562, 101.43042755126953, 109.75938415527344, 118.08834838867188, 126.41731262207031, 134.74627685546875, 143.07522583007812, 151.40419006347656, 159.733154296875, 168.06210327148438, 176.3910675048828, 184.72003173828125, 193.0489959716797, 201.37796020507812, 209.7069091796875, 218.03587341308594, 226.36483764648438, 234.69378662109375, 243.0227508544922, 251.35171508789062]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 7.0, 5.0, 4.0, 4.0, 8.0, 9.0, 5.0, 16.0, 13.0, 14.0, 12.0, 17.0, 24.0, 20.0, 36.0, 25.0, 34.0, 36.0, 33.0, 34.0, 35.0, 38.0, 40.0, 51.0, 31.0, 43.0, 45.0, 47.0, 26.0, 44.0, 33.0, 24.0, 23.0, 29.0, 25.0, 20.0, 17.0, 13.0, 18.0, 8.0, 6.0, 9.0, 10.0, 3.0, 2.0, 3.0, 6.0, 1.0, 1.0, 5.0, 2.0, 2.0], "bins": [-59.53125, -57.8583984375, -56.185546875, -54.5126953125, -52.83984375, -51.1669921875, -49.494140625, -47.8212890625, -46.1484375, -44.4755859375, -42.802734375, -41.1298828125, -39.45703125, -37.7841796875, -36.111328125, -34.4384765625, -32.765625, -31.0927734375, -29.419921875, -27.7470703125, -26.07421875, -24.4013671875, -22.728515625, -21.0556640625, -19.3828125, -17.7099609375, -16.037109375, -14.3642578125, -12.69140625, -11.0185546875, -9.345703125, -7.6728515625, -6.0, -4.3271484375, -2.654296875, -0.9814453125, 0.69140625, 2.3642578125, 4.037109375, 5.7099609375, 7.3828125, 9.0556640625, 10.728515625, 12.4013671875, 14.07421875, 15.7470703125, 17.419921875, 19.0927734375, 20.765625, 22.4384765625, 24.111328125, 25.7841796875, 27.45703125, 29.1298828125, 30.802734375, 32.4755859375, 34.1484375, 35.8212890625, 37.494140625, 39.1669921875, 40.83984375, 42.5126953125, 44.185546875, 45.8583984375, 47.53125]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 7.0, 16.0, 10.0, 19.0, 30.0, 48.0, 72.0, 107.0, 176.0, 242.0, 351.0, 493.0, 699.0, 1039.0, 1426.0, 2107.0, 3024.0, 4464.0, 6400.0, 9287.0, 13576.0, 19644.0, 29516.0, 44922.0, 72802.0, 128766.0, 232255.0, 193113.0, 103749.0, 60715.0, 38754.0, 25295.0, 17419.0, 11779.0, 8206.0, 5567.0, 3852.0, 2622.0, 1817.0, 1325.0, 900.0, 577.0, 435.0, 313.0, 220.0, 146.0, 93.0, 55.0, 38.0, 24.0, 17.0, 16.0, 10.0, 6.0, 1.0, 4.0, 3.0], "bins": [-2.50390625, -2.42987060546875, -2.3558349609375, -2.28179931640625, -2.207763671875, -2.13372802734375, -2.0596923828125, -1.98565673828125, -1.91162109375, -1.83758544921875, -1.7635498046875, -1.68951416015625, -1.615478515625, -1.54144287109375, -1.4674072265625, -1.39337158203125, -1.3193359375, -1.24530029296875, -1.1712646484375, -1.09722900390625, -1.023193359375, -0.94915771484375, -0.8751220703125, -0.80108642578125, -0.72705078125, -0.65301513671875, -0.5789794921875, -0.50494384765625, -0.430908203125, -0.35687255859375, -0.2828369140625, -0.20880126953125, -0.134765625, -0.06072998046875, 0.0133056640625, 0.08734130859375, 0.161376953125, 0.23541259765625, 0.3094482421875, 0.38348388671875, 0.45751953125, 0.53155517578125, 0.6055908203125, 0.67962646484375, 0.753662109375, 0.82769775390625, 0.9017333984375, 0.97576904296875, 1.0498046875, 1.12384033203125, 1.1978759765625, 1.27191162109375, 1.345947265625, 1.41998291015625, 1.4940185546875, 1.56805419921875, 1.64208984375, 1.71612548828125, 1.7901611328125, 1.86419677734375, 1.938232421875, 2.01226806640625, 2.0863037109375, 2.16033935546875, 2.234375]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 5.0, 4.0, 13.0, 6.0, 8.0, 16.0, 11.0, 15.0, 20.0, 23.0, 33.0, 25.0, 32.0, 38.0, 40.0, 35.0, 49.0, 38.0, 33.0, 49.0, 1064.0, 54.0, 39.0, 46.0, 39.0, 39.0, 34.0, 40.0, 36.0, 25.0, 23.0, 19.0, 16.0, 16.0, 8.0, 8.0, 4.0, 10.0, 9.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.5, -37.27001953125, -36.0400390625, -34.81005859375, -33.580078125, -32.35009765625, -31.1201171875, -29.89013671875, -28.66015625, -27.43017578125, -26.2001953125, -24.97021484375, -23.740234375, -22.51025390625, -21.2802734375, -20.05029296875, -18.8203125, -17.59033203125, -16.3603515625, -15.13037109375, -13.900390625, -12.67041015625, -11.4404296875, -10.21044921875, -8.98046875, -7.75048828125, -6.5205078125, -5.29052734375, -4.060546875, -2.83056640625, -1.6005859375, -0.37060546875, 0.859375, 2.08935546875, 3.3193359375, 4.54931640625, 5.779296875, 7.00927734375, 8.2392578125, 9.46923828125, 10.69921875, 11.92919921875, 13.1591796875, 14.38916015625, 15.619140625, 16.84912109375, 18.0791015625, 19.30908203125, 20.5390625, 21.76904296875, 22.9990234375, 24.22900390625, 25.458984375, 26.68896484375, 27.9189453125, 29.14892578125, 30.37890625, 31.60888671875, 32.8388671875, 34.06884765625, 35.298828125, 36.52880859375, 37.7587890625, 38.98876953125, 40.21875]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 6.0, 5.0, 10.0, 20.0, 32.0, 36.0, 62.0, 81.0, 115.0, 161.0, 316.0, 504.0, 760.0, 1250.0, 2078.0, 3577.0, 6258.0, 11101.0, 20428.0, 39142.0, 79509.0, 186599.0, 1405545.0, 178873.0, 77027.0, 37887.0, 20002.0, 10855.0, 6129.0, 3540.0, 1981.0, 1236.0, 748.0, 475.0, 278.0, 182.0, 93.0, 86.0, 52.0, 29.0, 26.0, 14.0, 10.0, 7.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.3984375, -3.28692626953125, -3.1754150390625, -3.06390380859375, -2.952392578125, -2.84088134765625, -2.7293701171875, -2.61785888671875, -2.50634765625, -2.39483642578125, -2.2833251953125, -2.17181396484375, -2.060302734375, -1.94879150390625, -1.8372802734375, -1.72576904296875, -1.6142578125, -1.50274658203125, -1.3912353515625, -1.27972412109375, -1.168212890625, -1.05670166015625, -0.9451904296875, -0.83367919921875, -0.72216796875, -0.61065673828125, -0.4991455078125, -0.38763427734375, -0.276123046875, -0.16461181640625, -0.0531005859375, 0.05841064453125, 0.169921875, 0.28143310546875, 0.3929443359375, 0.50445556640625, 0.615966796875, 0.72747802734375, 0.8389892578125, 0.95050048828125, 1.06201171875, 1.17352294921875, 1.2850341796875, 1.39654541015625, 1.508056640625, 1.61956787109375, 1.7310791015625, 1.84259033203125, 1.9541015625, 2.06561279296875, 2.1771240234375, 2.28863525390625, 2.400146484375, 2.51165771484375, 2.6231689453125, 2.73468017578125, 2.84619140625, 2.95770263671875, 3.0692138671875, 3.18072509765625, 3.292236328125, 3.40374755859375, 3.5152587890625, 3.62677001953125, 3.73828125]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 4.0, 7.0, 6.0, 16.0, 8.0, 13.0, 11.0, 20.0, 17.0, 21.0, 34.0, 28.0, 41.0, 55.0, 70.0, 77.0, 72.0, 72.0, 74.0, 53.0, 46.0, 56.0, 28.0, 28.0, 24.0, 21.0, 20.0, 11.0, 14.0, 12.0, 15.0, 5.0, 4.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.051513671875, -0.04984903335571289, -0.04818439483642578, -0.04651975631713867, -0.04485511779785156, -0.04319047927856445, -0.041525840759277344, -0.039861202239990234, -0.038196563720703125, -0.036531925201416016, -0.034867286682128906, -0.0332026481628418, -0.03153800964355469, -0.029873371124267578, -0.02820873260498047, -0.02654409408569336, -0.02487945556640625, -0.02321481704711914, -0.02155017852783203, -0.019885540008544922, -0.018220901489257812, -0.016556262969970703, -0.014891624450683594, -0.013226985931396484, -0.011562347412109375, -0.009897708892822266, -0.008233070373535156, -0.006568431854248047, -0.0049037933349609375, -0.003239154815673828, -0.0015745162963867188, 9.012222290039062e-05, 0.0017547607421875, 0.0034193992614746094, 0.005084037780761719, 0.006748676300048828, 0.008413314819335938, 0.010077953338623047, 0.011742591857910156, 0.013407230377197266, 0.015071868896484375, 0.016736507415771484, 0.018401145935058594, 0.020065784454345703, 0.021730422973632812, 0.023395061492919922, 0.02505970001220703, 0.02672433853149414, 0.02838897705078125, 0.03005361557006836, 0.03171825408935547, 0.03338289260864258, 0.03504753112792969, 0.0367121696472168, 0.038376808166503906, 0.040041446685791016, 0.041706085205078125, 0.043370723724365234, 0.045035362243652344, 0.04670000076293945, 0.04836463928222656, 0.05002927780151367, 0.05169391632080078, 0.05335855484008789, 0.055023193359375]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 4.0, 3.0, 5.0, 11.0, 8.0, 11.0, 24.0, 18.0, 22.0, 32.0, 49.0, 41.0, 68.0, 75.0, 121.0, 210.0, 395.0, 1515.0, 469221.0, 574006.0, 1642.0, 403.0, 192.0, 116.0, 77.0, 66.0, 33.0, 33.0, 37.0, 31.0, 19.0, 12.0, 20.0, 4.0, 10.0, 7.0, 5.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.064453125, -1.0322036743164062, -0.9999542236328125, -0.9677047729492188, -0.935455322265625, -0.9032058715820312, -0.8709564208984375, -0.8387069702148438, -0.80645751953125, -0.7742080688476562, -0.7419586181640625, -0.7097091674804688, -0.677459716796875, -0.6452102661132812, -0.6129608154296875, -0.5807113647460938, -0.5484619140625, -0.5162124633789062, -0.4839630126953125, -0.45171356201171875, -0.419464111328125, -0.38721466064453125, -0.3549652099609375, -0.32271575927734375, -0.29046630859375, -0.25821685791015625, -0.2259674072265625, -0.19371795654296875, -0.161468505859375, -0.12921905517578125, -0.0969696044921875, -0.06472015380859375, -0.032470703125, -0.00022125244140625, 0.0320281982421875, 0.06427764892578125, 0.096527099609375, 0.12877655029296875, 0.1610260009765625, 0.19327545166015625, 0.22552490234375, 0.25777435302734375, 0.2900238037109375, 0.32227325439453125, 0.354522705078125, 0.38677215576171875, 0.4190216064453125, 0.45127105712890625, 0.4835205078125, 0.5157699584960938, 0.5480194091796875, 0.5802688598632812, 0.612518310546875, 0.6447677612304688, 0.6770172119140625, 0.7092666625976562, 0.74151611328125, 0.7737655639648438, 0.8060150146484375, 0.8382644653320312, 0.870513916015625, 0.9027633666992188, 0.9350128173828125, 0.9672622680664062, 0.99951171875]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [783.0, 234.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0168991070240736, 0.001999128609895706, 0.020897364243865013, 0.03979559987783432, 0.05869383364915848, 0.07759206742048264, 0.09649030864238739, 0.11538854241371155, 0.1342867761850357, 0.15318500995635986, 0.17208324372768402, 0.19098147749900818, 0.20987972617149353, 0.2287779450416565, 0.24767619371414185, 0.2665744423866272, 0.28547266125679016, 0.3043709099292755, 0.3232691287994385, 0.34216737747192383, 0.3610655963420868, 0.37996384501457214, 0.3988620638847351, 0.41776031255722046, 0.4366585612297058, 0.45555680990219116, 0.4744550287723541, 0.4933532774448395, 0.5122514963150024, 0.5311497449874878, 0.5500479936599731, 0.5689462423324585, 0.5878444314002991, 0.6067426800727844, 0.6256409287452698, 0.6445391178131104, 0.6634373664855957, 0.682335615158081, 0.7012338638305664, 0.7201321125030518, 0.7390303015708923, 0.7579285502433777, 0.776826798915863, 0.7957249879837036, 0.814623236656189, 0.8335214853286743, 0.8524197340011597, 0.871317982673645, 0.8902162313461304, 0.9091144800186157, 0.9280127286911011, 0.9469109177589417, 0.965809166431427, 0.9847074151039124, 1.003605604171753, 1.0225038528442383, 1.0414021015167236, 1.060300350189209, 1.0791985988616943, 1.0980968475341797, 1.116995096206665, 1.1358932256698608, 1.1547914743423462, 1.1736897230148315, 1.192587971687317]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 7.0, 6.0, 12.0, 9.0, 19.0, 15.0, 35.0, 44.0, 40.0, 45.0, 50.0, 65.0, 52.0, 78.0, 65.0, 64.0, 74.0, 55.0, 52.0, 52.0, 26.0, 41.0, 40.0, 12.0, 14.0, 9.0, 7.0, 8.0, 5.0, 6.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.06185096502304077, -0.06038789451122284, -0.058924827724695206, -0.05746176093816757, -0.05599869042634964, -0.05453561991453171, -0.053072553128004074, -0.05160948634147644, -0.05014641582965851, -0.048683345317840576, -0.04722027853131294, -0.04575721174478531, -0.04429414123296738, -0.042831070721149445, -0.04136800393462181, -0.03990493714809418, -0.038441866636276245, -0.03697879612445831, -0.03551572933793068, -0.034052662551403046, -0.032589592039585114, -0.03112652339041233, -0.029663454741239548, -0.028200386092066765, -0.026737317442893982, -0.0252742487937212, -0.023811180144548416, -0.022348111495375633, -0.02088504284620285, -0.019421974197030067, -0.017958905547857285, -0.0164958368986845, -0.015032768249511719, -0.013569699600338936, -0.012106630951166153, -0.01064356230199337, -0.009180493652820587, -0.007717425003647804, -0.006254356354475021, -0.0047912877053022385, -0.0033282190561294556, -0.0018651504069566727, -0.00040208175778388977, 0.0010609868913888931, 0.002524055540561676, 0.003987124189734459, 0.005450192838907242, 0.006913261488080025, 0.008376330137252808, 0.00983939878642559, 0.011302467435598373, 0.012765536084771156, 0.01422860473394394, 0.015691673383116722, 0.017154742032289505, 0.018617810681462288, 0.02008087933063507, 0.021543947979807854, 0.023007016628980637, 0.02447008527815342, 0.025933153927326202, 0.027396222576498985, 0.028859291225671768, 0.03032235987484455, 0.031785428524017334]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 7.0, 5.0, 4.0, 4.0, 8.0, 9.0, 5.0, 16.0, 13.0, 14.0, 12.0, 17.0, 24.0, 20.0, 35.0, 26.0, 34.0, 36.0, 33.0, 34.0, 35.0, 38.0, 39.0, 52.0, 31.0, 43.0, 45.0, 47.0, 26.0, 44.0, 33.0, 24.0, 23.0, 29.0, 25.0, 20.0, 17.0, 13.0, 17.0, 9.0, 6.0, 9.0, 10.0, 3.0, 2.0, 3.0, 6.0, 1.0, 1.0, 5.0, 2.0, 2.0], "bins": [-59.53125, -57.8583984375, -56.185546875, -54.5126953125, -52.83984375, -51.1669921875, -49.494140625, -47.8212890625, -46.1484375, -44.4755859375, -42.802734375, -41.1298828125, -39.45703125, -37.7841796875, -36.111328125, -34.4384765625, -32.765625, -31.0927734375, -29.419921875, -27.7470703125, -26.07421875, -24.4013671875, -22.728515625, -21.0556640625, -19.3828125, -17.7099609375, -16.037109375, -14.3642578125, -12.69140625, -11.0185546875, -9.345703125, -7.6728515625, -6.0, -4.3271484375, -2.654296875, -0.9814453125, 0.69140625, 2.3642578125, 4.037109375, 5.7099609375, 7.3828125, 9.0556640625, 10.728515625, 12.4013671875, 14.07421875, 15.7470703125, 17.419921875, 19.0927734375, 20.765625, 22.4384765625, 24.111328125, 25.7841796875, 27.45703125, 29.1298828125, 30.802734375, 32.4755859375, 34.1484375, 35.8212890625, 37.494140625, 39.1669921875, 40.83984375, 42.5126953125, 44.185546875, 45.8583984375, 47.53125]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 9.0, 6.0, 7.0, 8.0, 14.0, 22.0, 26.0, 33.0, 60.0, 67.0, 97.0, 134.0, 166.0, 260.0, 352.0, 599.0, 929.0, 1611.0, 2786.0, 5835.0, 15601.0, 79698.0, 744580.0, 157661.0, 22269.0, 7298.0, 3452.0, 1836.0, 1033.0, 679.0, 438.0, 272.0, 207.0, 121.0, 115.0, 73.0, 60.0, 29.0, 35.0, 21.0, 14.0, 8.0, 8.0, 8.0, 3.0, 4.0, 3.0, 2.0, 4.0, 1.0, 0.0, 4.0, 2.0], "bins": [-93.75, -90.962890625, -88.17578125, -85.388671875, -82.6015625, -79.814453125, -77.02734375, -74.240234375, -71.453125, -68.666015625, -65.87890625, -63.091796875, -60.3046875, -57.517578125, -54.73046875, -51.943359375, -49.15625, -46.369140625, -43.58203125, -40.794921875, -38.0078125, -35.220703125, -32.43359375, -29.646484375, -26.859375, -24.072265625, -21.28515625, -18.498046875, -15.7109375, -12.923828125, -10.13671875, -7.349609375, -4.5625, -1.775390625, 1.01171875, 3.798828125, 6.5859375, 9.373046875, 12.16015625, 14.947265625, 17.734375, 20.521484375, 23.30859375, 26.095703125, 28.8828125, 31.669921875, 34.45703125, 37.244140625, 40.03125, 42.818359375, 45.60546875, 48.392578125, 51.1796875, 53.966796875, 56.75390625, 59.541015625, 62.328125, 65.115234375, 67.90234375, 70.689453125, 73.4765625, 76.263671875, 79.05078125, 81.837890625, 84.625]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 7.0, 8.0, 3.0, 9.0, 7.0, 17.0, 7.0, 17.0, 18.0, 18.0, 23.0, 25.0, 32.0, 43.0, 42.0, 42.0, 66.0, 53.0, 92.0, 1598.0, 439.0, 89.0, 53.0, 40.0, 41.0, 45.0, 34.0, 35.0, 29.0, 19.0, 19.0, 18.0, 22.0, 8.0, 5.0, 8.0, 11.0, 3.0, 3.0, 1.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-137.125, -132.390625, -127.65625, -122.921875, -118.1875, -113.453125, -108.71875, -103.984375, -99.25, -94.515625, -89.78125, -85.046875, -80.3125, -75.578125, -70.84375, -66.109375, -61.375, -56.640625, -51.90625, -47.171875, -42.4375, -37.703125, -32.96875, -28.234375, -23.5, -18.765625, -14.03125, -9.296875, -4.5625, 0.171875, 4.90625, 9.640625, 14.375, 19.109375, 23.84375, 28.578125, 33.3125, 38.046875, 42.78125, 47.515625, 52.25, 56.984375, 61.71875, 66.453125, 71.1875, 75.921875, 80.65625, 85.390625, 90.125, 94.859375, 99.59375, 104.328125, 109.0625, 113.796875, 118.53125, 123.265625, 128.0, 132.734375, 137.46875, 142.203125, 146.9375, 151.671875, 156.40625, 161.140625, 165.875]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 7.0, 7.0, 8.0, 26.0, 35.0, 59.0, 81.0, 166.0, 353.0, 868.0, 4783.0, 1814568.0, 1318500.0, 4664.0, 846.0, 314.0, 159.0, 89.0, 70.0, 40.0, 25.0, 20.0, 15.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-345.25, -335.09375, -324.9375, -314.78125, -304.625, -294.46875, -284.3125, -274.15625, -264.0, -253.84375, -243.6875, -233.53125, -223.375, -213.21875, -203.0625, -192.90625, -182.75, -172.59375, -162.4375, -152.28125, -142.125, -131.96875, -121.8125, -111.65625, -101.5, -91.34375, -81.1875, -71.03125, -60.875, -50.71875, -40.5625, -30.40625, -20.25, -10.09375, 0.0625, 10.21875, 20.375, 30.53125, 40.6875, 50.84375, 61.0, 71.15625, 81.3125, 91.46875, 101.625, 111.78125, 121.9375, 132.09375, 142.25, 152.40625, 162.5625, 172.71875, 182.875, 193.03125, 203.1875, 213.34375, 223.5, 233.65625, 243.8125, 253.96875, 264.125, 274.28125, 284.4375, 294.59375, 304.75]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 10.0, 540.0, 457.0, 9.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1083.6590576171875, -1052.6412353515625, -1021.6233520507812, -990.6055297851562, -959.5877075195312, -928.56982421875, -897.552001953125, -866.5341796875, -835.516357421875, -804.49853515625, -773.4806518554688, -742.4628295898438, -711.4450073242188, -680.4271240234375, -649.4093017578125, -618.3914794921875, -587.3735961914062, -556.3557739257812, -525.337890625, -494.320068359375, -463.30224609375, -432.2843933105469, -401.26654052734375, -370.24871826171875, -339.2308654785156, -308.2130126953125, -277.1951904296875, -246.17733764648438, -215.1595001220703, -184.14166259765625, -153.12380981445312, -122.10597229003906, -91.08819580078125, -60.07035446166992, -29.052513122558594, 1.96533203125, 32.98316955566406, 64.00100708007812, 95.01885986328125, 126.03669738769531, 157.05453491210938, 188.07237243652344, 219.0902099609375, 250.10806274414062, 281.12591552734375, 312.14373779296875, 343.1615905761719, 374.179443359375, 405.197265625, 436.2151184082031, 467.2329406738281, 498.25079345703125, 529.2686157226562, 560.2864990234375, 591.3043212890625, 622.3221435546875, 653.3399658203125, 684.3577880859375, 715.3756713867188, 746.3934936523438, 777.4113159179688, 808.42919921875, 839.447021484375, 870.46484375, 901.4827270507812]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 1.0, 5.0, 1.0, 2.0, 5.0, 6.0, 8.0, 7.0, 13.0, 15.0, 12.0, 9.0, 23.0, 19.0, 28.0, 32.0, 29.0, 31.0, 46.0, 40.0, 39.0, 34.0, 36.0, 37.0, 52.0, 40.0, 43.0, 36.0, 35.0, 31.0, 29.0, 40.0, 29.0, 28.0, 26.0, 19.0, 20.0, 22.0, 10.0, 6.0, 16.0, 10.0, 11.0, 6.0, 4.0, 5.0, 5.0, 7.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-275.23089599609375, -266.0248107910156, -256.8187255859375, -247.61265563964844, -238.40658569335938, -229.20050048828125, -219.99441528320312, -210.78834533691406, -201.582275390625, -192.37619018554688, -183.1701202392578, -173.9640350341797, -164.75796508789062, -155.5518798828125, -146.34579467773438, -137.1397247314453, -127.93363952636719, -118.7275619506836, -109.521484375, -100.31539916992188, -91.10932922363281, -81.90324401855469, -72.6971664428711, -63.4910888671875, -54.285011291503906, -45.07893371582031, -35.87285614013672, -26.66677474975586, -17.460697174072266, -8.254619598388672, 0.9514617919921875, 10.157539367675781, 19.363616943359375, 28.56969451904297, 37.77577209472656, 46.98185348510742, 56.187931060791016, 65.39401245117188, 74.60009002685547, 83.80616760253906, 93.01224517822266, 102.21832275390625, 111.42440032958984, 120.63047790527344, 129.83656311035156, 139.04263305664062, 148.24871826171875, 157.45480346679688, 166.66087341308594, 175.86695861816406, 185.07302856445312, 194.27911376953125, 203.4851837158203, 212.69126892089844, 221.8973388671875, 231.10342407226562, 240.30950927734375, 249.51559448242188, 258.7216796875, 267.927734375, 277.1338195800781, 286.33990478515625, 295.5459899902344, 304.7520751953125, 313.9581298828125]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 4.0, 7.0, 5.0, 6.0, 7.0, 7.0, 13.0, 9.0, 12.0, 20.0, 13.0, 16.0, 31.0, 30.0, 25.0, 21.0, 34.0, 48.0, 38.0, 29.0, 35.0, 36.0, 55.0, 45.0, 47.0, 45.0, 34.0, 38.0, 37.0, 31.0, 34.0, 21.0, 27.0, 25.0, 21.0, 18.0, 18.0, 9.0, 6.0, 14.0, 8.0, 4.0, 9.0, 5.0, 1.0, 4.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0], "bins": [-59.875, -58.15869140625, -56.4423828125, -54.72607421875, -53.009765625, -51.29345703125, -49.5771484375, -47.86083984375, -46.14453125, -44.42822265625, -42.7119140625, -40.99560546875, -39.279296875, -37.56298828125, -35.8466796875, -34.13037109375, -32.4140625, -30.69775390625, -28.9814453125, -27.26513671875, -25.548828125, -23.83251953125, -22.1162109375, -20.39990234375, -18.68359375, -16.96728515625, -15.2509765625, -13.53466796875, -11.818359375, -10.10205078125, -8.3857421875, -6.66943359375, -4.953125, -3.23681640625, -1.5205078125, 0.19580078125, 1.912109375, 3.62841796875, 5.3447265625, 7.06103515625, 8.77734375, 10.49365234375, 12.2099609375, 13.92626953125, 15.642578125, 17.35888671875, 19.0751953125, 20.79150390625, 22.5078125, 24.22412109375, 25.9404296875, 27.65673828125, 29.373046875, 31.08935546875, 32.8056640625, 34.52197265625, 36.23828125, 37.95458984375, 39.6708984375, 41.38720703125, 43.103515625, 44.81982421875, 46.5361328125, 48.25244140625, 49.96875]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 5.0, 5.0, 11.0, 8.0, 13.0, 10.0, 17.0, 29.0, 41.0, 53.0, 59.0, 101.0, 151.0, 190.0, 308.0, 516.0, 851.0, 1459.0, 2835.0, 5823.0, 14067.0, 54046.0, 1933887.0, 2095884.0, 56474.0, 14596.0, 6007.0, 2893.0, 1476.0, 913.0, 525.0, 323.0, 206.0, 142.0, 110.0, 68.0, 43.0, 29.0, 30.0, 25.0, 12.0, 10.0, 12.0, 5.0, 9.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-198.875, -193.02734375, -187.1796875, -181.33203125, -175.484375, -169.63671875, -163.7890625, -157.94140625, -152.09375, -146.24609375, -140.3984375, -134.55078125, -128.703125, -122.85546875, -117.0078125, -111.16015625, -105.3125, -99.46484375, -93.6171875, -87.76953125, -81.921875, -76.07421875, -70.2265625, -64.37890625, -58.53125, -52.68359375, -46.8359375, -40.98828125, -35.140625, -29.29296875, -23.4453125, -17.59765625, -11.75, -5.90234375, -0.0546875, 5.79296875, 11.640625, 17.48828125, 23.3359375, 29.18359375, 35.03125, 40.87890625, 46.7265625, 52.57421875, 58.421875, 64.26953125, 70.1171875, 75.96484375, 81.8125, 87.66015625, 93.5078125, 99.35546875, 105.203125, 111.05078125, 116.8984375, 122.74609375, 128.59375, 134.44140625, 140.2890625, 146.13671875, 151.984375, 157.83203125, 163.6796875, 169.52734375, 175.375]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 9.0, 5.0, 6.0, 5.0, 6.0, 8.0, 13.0, 23.0, 34.0, 35.0, 47.0, 77.0, 195.0, 558.0, 1369.0, 1042.0, 313.0, 125.0, 65.0, 44.0, 27.0, 15.0, 19.0, 13.0, 4.0, 7.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-141.5, -136.90625, -132.3125, -127.71875, -123.125, -118.53125, -113.9375, -109.34375, -104.75, -100.15625, -95.5625, -90.96875, -86.375, -81.78125, -77.1875, -72.59375, -68.0, -63.40625, -58.8125, -54.21875, -49.625, -45.03125, -40.4375, -35.84375, -31.25, -26.65625, -22.0625, -17.46875, -12.875, -8.28125, -3.6875, 0.90625, 5.5, 10.09375, 14.6875, 19.28125, 23.875, 28.46875, 33.0625, 37.65625, 42.25, 46.84375, 51.4375, 56.03125, 60.625, 65.21875, 69.8125, 74.40625, 79.0, 83.59375, 88.1875, 92.78125, 97.375, 101.96875, 106.5625, 111.15625, 115.75, 120.34375, 124.9375, 129.53125, 134.125, 138.71875, 143.3125, 147.90625, 152.5]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 4.0, 3.0, 5.0, 11.0, 14.0, 12.0, 30.0, 29.0, 60.0, 59.0, 92.0, 160.0, 207.0, 395.0, 549.0, 838.0, 1405.0, 2377.0, 4098.0, 7777.0, 16606.0, 43606.0, 208462.0, 3549955.0, 271672.0, 48817.0, 18196.0, 8287.0, 4175.0, 2378.0, 1505.0, 840.0, 544.0, 387.0, 219.0, 148.0, 98.0, 90.0, 51.0, 32.0, 29.0, 22.0, 10.0, 11.0, 7.0, 7.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-160.75, -155.48828125, -150.2265625, -144.96484375, -139.703125, -134.44140625, -129.1796875, -123.91796875, -118.65625, -113.39453125, -108.1328125, -102.87109375, -97.609375, -92.34765625, -87.0859375, -81.82421875, -76.5625, -71.30078125, -66.0390625, -60.77734375, -55.515625, -50.25390625, -44.9921875, -39.73046875, -34.46875, -29.20703125, -23.9453125, -18.68359375, -13.421875, -8.16015625, -2.8984375, 2.36328125, 7.625, 12.88671875, 18.1484375, 23.41015625, 28.671875, 33.93359375, 39.1953125, 44.45703125, 49.71875, 54.98046875, 60.2421875, 65.50390625, 70.765625, 76.02734375, 81.2890625, 86.55078125, 91.8125, 97.07421875, 102.3359375, 107.59765625, 112.859375, 118.12109375, 123.3828125, 128.64453125, 133.90625, 139.16796875, 144.4296875, 149.69140625, 154.953125, 160.21484375, 165.4765625, 170.73828125, 176.0]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 8.0, 5.0, 19.0, 70.0, 288.0, 455.0, 119.0, 39.0, 11.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-589.4744262695312, -545.1289672851562, -500.783447265625, -456.43798828125, -412.0924987792969, -367.74700927734375, -323.40155029296875, -279.0560607910156, -234.7105712890625, -190.36508178710938, -146.0196075439453, -101.67413330078125, -57.328643798828125, -12.983154296875, 31.3623046875, 75.70779418945312, 120.05328369140625, 164.39877319335938, 208.74424743652344, 253.0897216796875, 297.4352111816406, 341.78070068359375, 386.12615966796875, 430.4716491699219, 474.817138671875, 519.16259765625, 563.5081176757812, 607.8535766601562, 652.1990966796875, 696.5445556640625, 740.8900146484375, 785.2354736328125, 829.5810546875, 873.926513671875, 918.2720336914062, 962.6174926757812, 1006.9630126953125, 1051.3084716796875, 1095.6539306640625, 1139.9993896484375, 1184.344970703125, 1228.6904296875, 1273.035888671875, 1317.38134765625, 1361.7269287109375, 1406.0723876953125, 1450.4178466796875, 1494.7633056640625, 1539.1087646484375, 1583.4542236328125, 1627.7996826171875, 1672.145263671875, 1716.49072265625, 1760.836181640625, 1805.181640625, 1849.527099609375, 1893.87255859375, 1938.218017578125, 1982.5634765625, 2026.908935546875, 2071.25439453125, 2115.60009765625, 2159.9453125, 2204.291015625, 2248.636474609375]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 5.0, 3.0, 9.0, 12.0, 6.0, 8.0, 13.0, 10.0, 12.0, 11.0, 26.0, 30.0, 33.0, 29.0, 44.0, 30.0, 39.0, 29.0, 55.0, 36.0, 32.0, 58.0, 52.0, 50.0, 40.0, 42.0, 35.0, 35.0, 31.0, 31.0, 29.0, 22.0, 19.0, 19.0, 23.0, 13.0, 4.0, 8.0, 8.0, 8.0, 3.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-293.8227233886719, -283.9903259277344, -274.1579284667969, -264.3255310058594, -254.49313354492188, -244.66073608398438, -234.82835388183594, -224.99595642089844, -215.16355895996094, -205.33116149902344, -195.49876403808594, -185.66636657714844, -175.833984375, -166.0015869140625, -156.169189453125, -146.3367919921875, -136.50439453125, -126.6719970703125, -116.839599609375, -107.00720977783203, -97.17481231689453, -87.34241485595703, -77.51002502441406, -67.67762756347656, -57.84523010253906, -48.01283264160156, -38.18043899536133, -28.34804344177246, -18.515647888183594, -8.683250427246094, 1.1491432189941406, 10.981536865234375, 20.81396484375, 30.646360397338867, 40.478755950927734, 50.31114959716797, 60.14354705810547, 69.97594451904297, 79.80833435058594, 89.64073181152344, 99.47312927246094, 109.30552673339844, 119.13792419433594, 128.97032165527344, 138.80270385742188, 148.63510131835938, 158.46749877929688, 168.29989624023438, 178.13229370117188, 187.96469116210938, 197.79708862304688, 207.62948608398438, 217.46188354492188, 227.29428100585938, 237.1266632080078, 246.9590606689453, 256.79144287109375, 266.62384033203125, 276.45623779296875, 286.28863525390625, 296.12103271484375, 305.95343017578125, 315.78582763671875, 325.61822509765625, 335.45062255859375]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 3.0, 8.0, 11.0, 12.0, 5.0, 12.0, 20.0, 8.0, 23.0, 23.0, 22.0, 36.0, 29.0, 37.0, 34.0, 31.0, 46.0, 43.0, 32.0, 37.0, 32.0, 46.0, 44.0, 46.0, 42.0, 54.0, 31.0, 32.0, 31.0, 25.0, 28.0, 23.0, 20.0, 20.0, 7.0, 8.0, 8.0, 11.0, 6.0, 7.0, 2.0, 3.0, 4.0, 2.0, 6.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.75, -51.794921875, -49.83984375, -47.884765625, -45.9296875, -43.974609375, -42.01953125, -40.064453125, -38.109375, -36.154296875, -34.19921875, -32.244140625, -30.2890625, -28.333984375, -26.37890625, -24.423828125, -22.46875, -20.513671875, -18.55859375, -16.603515625, -14.6484375, -12.693359375, -10.73828125, -8.783203125, -6.828125, -4.873046875, -2.91796875, -0.962890625, 0.9921875, 2.947265625, 4.90234375, 6.857421875, 8.8125, 10.767578125, 12.72265625, 14.677734375, 16.6328125, 18.587890625, 20.54296875, 22.498046875, 24.453125, 26.408203125, 28.36328125, 30.318359375, 32.2734375, 34.228515625, 36.18359375, 38.138671875, 40.09375, 42.048828125, 44.00390625, 45.958984375, 47.9140625, 49.869140625, 51.82421875, 53.779296875, 55.734375, 57.689453125, 59.64453125, 61.599609375, 63.5546875, 65.509765625, 67.46484375, 69.419921875, 71.375]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 6.0, 15.0, 14.0, 27.0, 30.0, 49.0, 86.0, 130.0, 175.0, 269.0, 402.0, 583.0, 831.0, 1363.0, 2017.0, 2950.0, 4651.0, 6925.0, 10654.0, 16650.0, 26415.0, 43911.0, 76665.0, 149779.0, 275252.0, 193786.0, 95413.0, 52773.0, 31151.0, 19537.0, 12308.0, 7987.0, 5310.0, 3597.0, 2266.0, 1525.0, 1059.0, 674.0, 423.0, 294.0, 198.0, 141.0, 95.0, 62.0, 36.0, 29.0, 18.0, 16.0, 8.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.751953125, -2.659210205078125, -2.56646728515625, -2.473724365234375, -2.3809814453125, -2.288238525390625, -2.19549560546875, -2.102752685546875, -2.010009765625, -1.917266845703125, -1.82452392578125, -1.731781005859375, -1.6390380859375, -1.546295166015625, -1.45355224609375, -1.360809326171875, -1.26806640625, -1.175323486328125, -1.08258056640625, -0.989837646484375, -0.8970947265625, -0.804351806640625, -0.71160888671875, -0.618865966796875, -0.526123046875, -0.433380126953125, -0.34063720703125, -0.247894287109375, -0.1551513671875, -0.062408447265625, 0.03033447265625, 0.123077392578125, 0.2158203125, 0.308563232421875, 0.40130615234375, 0.494049072265625, 0.5867919921875, 0.679534912109375, 0.77227783203125, 0.865020751953125, 0.957763671875, 1.050506591796875, 1.14324951171875, 1.235992431640625, 1.3287353515625, 1.421478271484375, 1.51422119140625, 1.606964111328125, 1.69970703125, 1.792449951171875, 1.88519287109375, 1.977935791015625, 2.0706787109375, 2.163421630859375, 2.25616455078125, 2.348907470703125, 2.441650390625, 2.534393310546875, 2.62713623046875, 2.719879150390625, 2.8126220703125, 2.905364990234375, 2.99810791015625, 3.090850830078125, 3.18359375]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 4.0, 7.0, 5.0, 2.0, 1.0, 7.0, 8.0, 15.0, 12.0, 11.0, 17.0, 15.0, 22.0, 23.0, 30.0, 13.0, 33.0, 32.0, 37.0, 34.0, 49.0, 42.0, 33.0, 40.0, 1059.0, 39.0, 41.0, 31.0, 40.0, 24.0, 28.0, 34.0, 31.0, 35.0, 29.0, 19.0, 19.0, 20.0, 15.0, 14.0, 10.0, 14.0, 11.0, 10.0, 5.0, 2.0, 3.0, 7.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.21875, -39.0322265625, -37.845703125, -36.6591796875, -35.47265625, -34.2861328125, -33.099609375, -31.9130859375, -30.7265625, -29.5400390625, -28.353515625, -27.1669921875, -25.98046875, -24.7939453125, -23.607421875, -22.4208984375, -21.234375, -20.0478515625, -18.861328125, -17.6748046875, -16.48828125, -15.3017578125, -14.115234375, -12.9287109375, -11.7421875, -10.5556640625, -9.369140625, -8.1826171875, -6.99609375, -5.8095703125, -4.623046875, -3.4365234375, -2.25, -1.0634765625, 0.123046875, 1.3095703125, 2.49609375, 3.6826171875, 4.869140625, 6.0556640625, 7.2421875, 8.4287109375, 9.615234375, 10.8017578125, 11.98828125, 13.1748046875, 14.361328125, 15.5478515625, 16.734375, 17.9208984375, 19.107421875, 20.2939453125, 21.48046875, 22.6669921875, 23.853515625, 25.0400390625, 26.2265625, 27.4130859375, 28.599609375, 29.7861328125, 30.97265625, 32.1591796875, 33.345703125, 34.5322265625, 35.71875]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 9.0, 12.0, 18.0, 19.0, 20.0, 32.0, 58.0, 80.0, 137.0, 158.0, 277.0, 374.0, 669.0, 888.0, 1506.0, 2284.0, 3476.0, 5767.0, 9314.0, 14912.0, 25000.0, 43200.0, 78288.0, 161364.0, 1359048.0, 184738.0, 87565.0, 47237.0, 27286.0, 16231.0, 10025.0, 6244.0, 3892.0, 2502.0, 1592.0, 966.0, 675.0, 444.0, 273.0, 185.0, 122.0, 103.0, 55.0, 24.0, 20.0, 17.0, 11.0, 7.0, 7.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.482421875, -3.3817138671875, -3.281005859375, -3.1802978515625, -3.07958984375, -2.9788818359375, -2.878173828125, -2.7774658203125, -2.6767578125, -2.5760498046875, -2.475341796875, -2.3746337890625, -2.27392578125, -2.1732177734375, -2.072509765625, -1.9718017578125, -1.87109375, -1.7703857421875, -1.669677734375, -1.5689697265625, -1.46826171875, -1.3675537109375, -1.266845703125, -1.1661376953125, -1.0654296875, -0.9647216796875, -0.864013671875, -0.7633056640625, -0.66259765625, -0.5618896484375, -0.461181640625, -0.3604736328125, -0.259765625, -0.1590576171875, -0.058349609375, 0.0423583984375, 0.14306640625, 0.2437744140625, 0.344482421875, 0.4451904296875, 0.5458984375, 0.6466064453125, 0.747314453125, 0.8480224609375, 0.94873046875, 1.0494384765625, 1.150146484375, 1.2508544921875, 1.3515625, 1.4522705078125, 1.552978515625, 1.6536865234375, 1.75439453125, 1.8551025390625, 1.955810546875, 2.0565185546875, 2.1572265625, 2.2579345703125, 2.358642578125, 2.4593505859375, 2.56005859375, 2.6607666015625, 2.761474609375, 2.8621826171875, 2.962890625]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 6.0, 4.0, 2.0, 2.0, 9.0, 7.0, 14.0, 14.0, 11.0, 18.0, 23.0, 38.0, 46.0, 68.0, 70.0, 91.0, 82.0, 78.0, 73.0, 83.0, 64.0, 55.0, 29.0, 20.0, 16.0, 16.0, 17.0, 9.0, 6.0, 3.0, 4.0, 8.0, 4.0, 2.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.03131103515625, -0.030415058135986328, -0.029519081115722656, -0.028623104095458984, -0.027727127075195312, -0.02683115005493164, -0.02593517303466797, -0.025039196014404297, -0.024143218994140625, -0.023247241973876953, -0.02235126495361328, -0.02145528793334961, -0.020559310913085938, -0.019663333892822266, -0.018767356872558594, -0.017871379852294922, -0.01697540283203125, -0.016079425811767578, -0.015183448791503906, -0.014287471771240234, -0.013391494750976562, -0.01249551773071289, -0.011599540710449219, -0.010703563690185547, -0.009807586669921875, -0.008911609649658203, -0.008015632629394531, -0.007119655609130859, -0.0062236785888671875, -0.005327701568603516, -0.004431724548339844, -0.003535747528076172, -0.0026397705078125, -0.0017437934875488281, -0.0008478164672851562, 4.8160552978515625e-05, 0.0009441375732421875, 0.0018401145935058594, 0.0027360916137695312, 0.003632068634033203, 0.004528045654296875, 0.005424022674560547, 0.006319999694824219, 0.007215976715087891, 0.008111953735351562, 0.009007930755615234, 0.009903907775878906, 0.010799884796142578, 0.01169586181640625, 0.012591838836669922, 0.013487815856933594, 0.014383792877197266, 0.015279769897460938, 0.01617574691772461, 0.01707172393798828, 0.017967700958251953, 0.018863677978515625, 0.019759654998779297, 0.02065563201904297, 0.02155160903930664, 0.022447586059570312, 0.023343563079833984, 0.024239540100097656, 0.025135517120361328, 0.026031494140625]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 5.0, 3.0, 6.0, 1.0, 4.0, 6.0, 13.0, 11.0, 8.0, 19.0, 18.0, 31.0, 27.0, 47.0, 48.0, 73.0, 141.0, 230.0, 470.0, 3108.0, 346567.0, 692346.0, 4140.0, 534.0, 226.0, 142.0, 91.0, 38.0, 44.0, 27.0, 29.0, 31.0, 10.0, 16.0, 15.0, 7.0, 5.0, 9.0, 7.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47021484375, -0.4540252685546875, -0.437835693359375, -0.4216461181640625, -0.40545654296875, -0.3892669677734375, -0.373077392578125, -0.3568878173828125, -0.3406982421875, -0.3245086669921875, -0.308319091796875, -0.2921295166015625, -0.27593994140625, -0.2597503662109375, -0.243560791015625, -0.2273712158203125, -0.211181640625, -0.1949920654296875, -0.178802490234375, -0.1626129150390625, -0.14642333984375, -0.1302337646484375, -0.114044189453125, -0.0978546142578125, -0.0816650390625, -0.0654754638671875, -0.049285888671875, -0.0330963134765625, -0.01690673828125, -0.0007171630859375, 0.015472412109375, 0.0316619873046875, 0.0478515625, 0.0640411376953125, 0.080230712890625, 0.0964202880859375, 0.11260986328125, 0.1287994384765625, 0.144989013671875, 0.1611785888671875, 0.1773681640625, 0.1935577392578125, 0.209747314453125, 0.2259368896484375, 0.24212646484375, 0.2583160400390625, 0.274505615234375, 0.2906951904296875, 0.306884765625, 0.3230743408203125, 0.339263916015625, 0.3554534912109375, 0.37164306640625, 0.3878326416015625, 0.404022216796875, 0.4202117919921875, 0.4364013671875, 0.4525909423828125, 0.468780517578125, 0.4849700927734375, 0.50115966796875, 0.5173492431640625, 0.533538818359375, 0.5497283935546875, 0.56591796875]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 21.0, 189.0, 626.0, 154.0, 21.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.017965836450457573, -0.014657502993941307, -0.011349169537425041, -0.0080408351495862, -0.004732501693069935, -0.0014241673052310944, 0.0018841661512851715, 0.005192499607801437, 0.008500833064317703, 0.011809166520833969, 0.015117499977350235, 0.0184258334338665, 0.021734166890382767, 0.025042502209544182, 0.028350835666060448, 0.03165917098522186, 0.03496750444173813, 0.038275837898254395, 0.04158417135477066, 0.044892504811286926, 0.04820083826780319, 0.05150917172431946, 0.054817505180835724, 0.05812583863735199, 0.061434172093868256, 0.06474250555038452, 0.06805083900690079, 0.07135917246341705, 0.07466750591993332, 0.07797583937644958, 0.08128417283296585, 0.08459250628948212, 0.08790083974599838, 0.09120917320251465, 0.09451750665903091, 0.09782584011554718, 0.10113417357206345, 0.10444250702857971, 0.10775084048509598, 0.11105917394161224, 0.11436750739812851, 0.11767584085464478, 0.12098417431116104, 0.12429250776767731, 0.12760084867477417, 0.13090917468070984, 0.1342175155878067, 0.13752584159374237, 0.14083418250083923, 0.1441425234079361, 0.14745084941387177, 0.15075919032096863, 0.1540675163269043, 0.15737585723400116, 0.16068418323993683, 0.1639925241470337, 0.16730085015296936, 0.17060919106006622, 0.1739175170660019, 0.17722585797309875, 0.18053418397903442, 0.1838425248861313, 0.18715085089206696, 0.19045919179916382, 0.1937675178050995]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 9.0, 5.0, 12.0, 9.0, 20.0, 13.0, 14.0, 21.0, 31.0, 29.0, 31.0, 34.0, 28.0, 24.0, 37.0, 46.0, 35.0, 35.0, 39.0, 65.0, 44.0, 50.0, 34.0, 35.0, 29.0, 29.0, 38.0, 24.0, 28.0, 28.0, 30.0, 17.0, 12.0, 14.0, 9.0, 13.0, 12.0, 4.0, 4.0, 6.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01277703046798706, -0.012350988574326038, -0.011924946680665016, -0.011498904787003994, -0.011072862893342972, -0.01064682099968195, -0.010220779106020927, -0.009794737212359905, -0.009368695318698883, -0.008942653425037861, -0.008516611531376839, -0.008090569637715816, -0.007664527744054794, -0.007238485850393772, -0.00681244395673275, -0.006386402063071728, -0.005960360169410706, -0.005534318275749683, -0.005108276382088661, -0.004682234488427639, -0.004256192594766617, -0.0038301507011055946, -0.0034041088074445724, -0.0029780669137835503, -0.002552025020122528, -0.002125983126461506, -0.0016999412328004837, -0.0012738993391394615, -0.0008478574454784393, -0.00042181555181741714, 4.2263418436050415e-06, 0.00043026823550462723, 0.0008563101291656494, 0.0012823520228266716, 0.0017083939164876938, 0.002134435810148716, 0.002560477703809738, 0.0029865195974707603, 0.0034125614911317825, 0.0038386033847928047, 0.004264645278453827, 0.004690687172114849, 0.005116729065775871, 0.0055427709594368935, 0.005968812853097916, 0.006394854746758938, 0.00682089664041996, 0.007246938534080982, 0.007672980427742004, 0.008099022321403027, 0.008525064215064049, 0.008951106108725071, 0.009377148002386093, 0.009803189896047115, 0.010229231789708138, 0.01065527368336916, 0.011081315577030182, 0.011507357470691204, 0.011933399364352226, 0.012359441258013248, 0.01278548315167427, 0.013211525045335293, 0.013637566938996315, 0.014063608832657337, 0.01448965072631836]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 3.0, 8.0, 11.0, 12.0, 5.0, 12.0, 20.0, 8.0, 23.0, 23.0, 22.0, 36.0, 29.0, 37.0, 34.0, 31.0, 46.0, 43.0, 32.0, 37.0, 32.0, 46.0, 44.0, 46.0, 42.0, 54.0, 31.0, 32.0, 31.0, 25.0, 28.0, 23.0, 20.0, 20.0, 7.0, 8.0, 8.0, 11.0, 6.0, 7.0, 2.0, 3.0, 4.0, 2.0, 6.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.75, -51.794921875, -49.83984375, -47.884765625, -45.9296875, -43.974609375, -42.01953125, -40.064453125, -38.109375, -36.154296875, -34.19921875, -32.244140625, -30.2890625, -28.333984375, -26.37890625, -24.423828125, -22.46875, -20.513671875, -18.55859375, -16.603515625, -14.6484375, -12.693359375, -10.73828125, -8.783203125, -6.828125, -4.873046875, -2.91796875, -0.962890625, 0.9921875, 2.947265625, 4.90234375, 6.857421875, 8.8125, 10.767578125, 12.72265625, 14.677734375, 16.6328125, 18.587890625, 20.54296875, 22.498046875, 24.453125, 26.408203125, 28.36328125, 30.318359375, 32.2734375, 34.228515625, 36.18359375, 38.138671875, 40.09375, 42.048828125, 44.00390625, 45.958984375, 47.9140625, 49.869140625, 51.82421875, 53.779296875, 55.734375, 57.689453125, 59.64453125, 61.599609375, 63.5546875, 65.509765625, 67.46484375, 69.419921875, 71.375]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 1.0, 2.0, 10.0, 3.0, 5.0, 8.0, 21.0, 26.0, 28.0, 49.0, 52.0, 85.0, 123.0, 175.0, 272.0, 359.0, 537.0, 731.0, 1104.0, 1638.0, 2467.0, 4163.0, 7046.0, 13662.0, 32159.0, 115560.0, 646710.0, 149360.0, 36961.0, 15003.0, 7656.0, 4308.0, 2697.0, 1784.0, 1174.0, 799.0, 583.0, 360.0, 251.0, 194.0, 110.0, 100.0, 59.0, 43.0, 40.0, 23.0, 22.0, 10.0, 11.0, 7.0, 4.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-93.125, -90.265625, -87.40625, -84.546875, -81.6875, -78.828125, -75.96875, -73.109375, -70.25, -67.390625, -64.53125, -61.671875, -58.8125, -55.953125, -53.09375, -50.234375, -47.375, -44.515625, -41.65625, -38.796875, -35.9375, -33.078125, -30.21875, -27.359375, -24.5, -21.640625, -18.78125, -15.921875, -13.0625, -10.203125, -7.34375, -4.484375, -1.625, 1.234375, 4.09375, 6.953125, 9.8125, 12.671875, 15.53125, 18.390625, 21.25, 24.109375, 26.96875, 29.828125, 32.6875, 35.546875, 38.40625, 41.265625, 44.125, 46.984375, 49.84375, 52.703125, 55.5625, 58.421875, 61.28125, 64.140625, 67.0, 69.859375, 72.71875, 75.578125, 78.4375, 81.296875, 84.15625, 87.015625, 89.875]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 4.0, 8.0, 2.0, 3.0, 6.0, 8.0, 14.0, 18.0, 15.0, 19.0, 24.0, 16.0, 24.0, 27.0, 44.0, 44.0, 48.0, 53.0, 71.0, 130.0, 267.0, 1539.0, 176.0, 98.0, 57.0, 66.0, 27.0, 37.0, 47.0, 29.0, 25.0, 25.0, 13.0, 17.0, 16.0, 6.0, 11.0, 3.0, 6.0, 5.0, 5.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-131.75, -127.08984375, -122.4296875, -117.76953125, -113.109375, -108.44921875, -103.7890625, -99.12890625, -94.46875, -89.80859375, -85.1484375, -80.48828125, -75.828125, -71.16796875, -66.5078125, -61.84765625, -57.1875, -52.52734375, -47.8671875, -43.20703125, -38.546875, -33.88671875, -29.2265625, -24.56640625, -19.90625, -15.24609375, -10.5859375, -5.92578125, -1.265625, 3.39453125, 8.0546875, 12.71484375, 17.375, 22.03515625, 26.6953125, 31.35546875, 36.015625, 40.67578125, 45.3359375, 49.99609375, 54.65625, 59.31640625, 63.9765625, 68.63671875, 73.296875, 77.95703125, 82.6171875, 87.27734375, 91.9375, 96.59765625, 101.2578125, 105.91796875, 110.578125, 115.23828125, 119.8984375, 124.55859375, 129.21875, 133.87890625, 138.5390625, 143.19921875, 147.859375, 152.51953125, 157.1796875, 161.83984375, 166.5]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 5.0, 6.0, 8.0, 8.0, 13.0, 22.0, 26.0, 36.0, 47.0, 71.0, 106.0, 183.0, 355.0, 1018.0, 4544.0, 41387.0, 2997114.0, 91023.0, 7216.0, 1421.0, 458.0, 214.0, 115.0, 81.0, 63.0, 64.0, 37.0, 14.0, 12.0, 11.0, 8.0, 8.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-337.75, -328.26953125, -318.7890625, -309.30859375, -299.828125, -290.34765625, -280.8671875, -271.38671875, -261.90625, -252.42578125, -242.9453125, -233.46484375, -223.984375, -214.50390625, -205.0234375, -195.54296875, -186.0625, -176.58203125, -167.1015625, -157.62109375, -148.140625, -138.66015625, -129.1796875, -119.69921875, -110.21875, -100.73828125, -91.2578125, -81.77734375, -72.296875, -62.81640625, -53.3359375, -43.85546875, -34.375, -24.89453125, -15.4140625, -5.93359375, 3.546875, 13.02734375, 22.5078125, 31.98828125, 41.46875, 50.94921875, 60.4296875, 69.91015625, 79.390625, 88.87109375, 98.3515625, 107.83203125, 117.3125, 126.79296875, 136.2734375, 145.75390625, 155.234375, 164.71484375, 174.1953125, 183.67578125, 193.15625, 202.63671875, 212.1171875, 221.59765625, 231.078125, 240.55859375, 250.0390625, 259.51953125, 269.0]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 18.0, 160.0, 573.0, 236.0, 26.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1370.4422607421875, -1342.791259765625, -1315.140380859375, -1287.4893798828125, -1259.83837890625, -1232.1875, -1204.5364990234375, -1176.885498046875, -1149.234619140625, -1121.5836181640625, -1093.9327392578125, -1066.28173828125, -1038.6307373046875, -1010.9798583984375, -983.328857421875, -955.6779174804688, -928.0269165039062, -900.3759765625, -872.7249755859375, -845.0740356445312, -817.423095703125, -789.7720947265625, -762.1211547851562, -734.47021484375, -706.8192138671875, -679.1682739257812, -651.5172729492188, -623.8663330078125, -596.2153930664062, -568.564453125, -540.9134521484375, -513.2625122070312, -485.611572265625, -457.9606018066406, -430.3096618652344, -402.65869140625, -375.00775146484375, -347.3567810058594, -319.705810546875, -292.05487060546875, -264.4039001464844, -236.75294494628906, -209.10198974609375, -181.45101928710938, -153.80006408691406, -126.14910888671875, -98.49813842773438, -70.84718322753906, -43.19622802734375, -15.545269012451172, 12.105690002441406, 39.75665283203125, 67.40760803222656, 95.05856323242188, 122.70953369140625, 150.36048889160156, 178.01144409179688, 205.6623992919922, 233.3133544921875, 260.9643249511719, 288.61529541015625, 316.2662353515625, 343.9172058105469, 371.56817626953125, 399.2191162109375]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 1.0, 1.0, 6.0, 6.0, 4.0, 17.0, 13.0, 13.0, 11.0, 20.0, 19.0, 29.0, 19.0, 27.0, 32.0, 45.0, 23.0, 47.0, 47.0, 42.0, 40.0, 45.0, 44.0, 42.0, 52.0, 39.0, 29.0, 31.0, 41.0, 22.0, 23.0, 31.0, 23.0, 16.0, 20.0, 17.0, 13.0, 18.0, 5.0, 13.0, 4.0, 7.0, 3.0, 4.0, 2.0, 1.0, 3.0, 3.0], "bins": [-360.70159912109375, -351.1728515625, -341.64410400390625, -332.1153259277344, -322.5865783691406, -313.0578308105469, -303.5290832519531, -294.00030517578125, -284.4715576171875, -274.94281005859375, -265.4140625, -255.8852996826172, -246.35653686523438, -236.82778930664062, -227.29904174804688, -217.77027893066406, -208.2415313720703, -198.71278381347656, -189.18402099609375, -179.6552734375, -170.1265106201172, -160.59776306152344, -151.06900024414062, -141.54025268554688, -132.01150512695312, -122.48274993896484, -112.95399475097656, -103.42524719238281, -93.896484375, -84.36773681640625, -74.83898162841797, -65.31022644042969, -55.781463623046875, -46.252708435058594, -36.72395324707031, -27.195201873779297, -17.666446685791016, -8.137691497802734, 1.3910598754882812, 10.919815063476562, 20.448570251464844, 29.977325439453125, 39.506080627441406, 49.03483200073242, 58.5635871887207, 68.09234619140625, 77.62109375, 87.14984893798828, 96.67860412597656, 106.20735931396484, 115.73611450195312, 125.26486206054688, 134.7936248779297, 144.32237243652344, 153.85113525390625, 163.3798828125, 172.90863037109375, 182.4373779296875, 191.9661407470703, 201.49488830566406, 211.02365112304688, 220.55239868164062, 230.08114624023438, 239.6099090576172, 249.138671875]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 6.0, 7.0, 11.0, 4.0, 11.0, 10.0, 14.0, 15.0, 21.0, 17.0, 35.0, 22.0, 35.0, 34.0, 27.0, 30.0, 43.0, 29.0, 50.0, 39.0, 43.0, 34.0, 39.0, 32.0, 47.0, 46.0, 25.0, 31.0, 29.0, 37.0, 22.0, 23.0, 22.0, 26.0, 14.0, 15.0, 16.0, 12.0, 7.0, 5.0, 3.0, 2.0, 7.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-56.0, -54.134765625, -52.26953125, -50.404296875, -48.5390625, -46.673828125, -44.80859375, -42.943359375, -41.078125, -39.212890625, -37.34765625, -35.482421875, -33.6171875, -31.751953125, -29.88671875, -28.021484375, -26.15625, -24.291015625, -22.42578125, -20.560546875, -18.6953125, -16.830078125, -14.96484375, -13.099609375, -11.234375, -9.369140625, -7.50390625, -5.638671875, -3.7734375, -1.908203125, -0.04296875, 1.822265625, 3.6875, 5.552734375, 7.41796875, 9.283203125, 11.1484375, 13.013671875, 14.87890625, 16.744140625, 18.609375, 20.474609375, 22.33984375, 24.205078125, 26.0703125, 27.935546875, 29.80078125, 31.666015625, 33.53125, 35.396484375, 37.26171875, 39.126953125, 40.9921875, 42.857421875, 44.72265625, 46.587890625, 48.453125, 50.318359375, 52.18359375, 54.048828125, 55.9140625, 57.779296875, 59.64453125, 61.509765625, 63.375]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 2.0, 3.0, 7.0, 2.0, 7.0, 5.0, 7.0, 15.0, 22.0, 25.0, 42.0, 40.0, 39.0, 63.0, 100.0, 135.0, 207.0, 436.0, 987.0, 3107.0, 23365.0, 4125795.0, 33869.0, 3712.0, 1068.0, 439.0, 230.0, 144.0, 111.0, 67.0, 60.0, 34.0, 35.0, 25.0, 15.0, 19.0, 12.0, 8.0, 3.0, 5.0, 7.0, 5.0, 4.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-655.5, -636.53125, -617.5625, -598.59375, -579.625, -560.65625, -541.6875, -522.71875, -503.75, -484.78125, -465.8125, -446.84375, -427.875, -408.90625, -389.9375, -370.96875, -352.0, -333.03125, -314.0625, -295.09375, -276.125, -257.15625, -238.1875, -219.21875, -200.25, -181.28125, -162.3125, -143.34375, -124.375, -105.40625, -86.4375, -67.46875, -48.5, -29.53125, -10.5625, 8.40625, 27.375, 46.34375, 65.3125, 84.28125, 103.25, 122.21875, 141.1875, 160.15625, 179.125, 198.09375, 217.0625, 236.03125, 255.0, 273.96875, 292.9375, 311.90625, 330.875, 349.84375, 368.8125, 387.78125, 406.75, 425.71875, 444.6875, 463.65625, 482.625, 501.59375, 520.5625, 539.53125, 558.5]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 3.0, 6.0, 5.0, 3.0, 9.0, 10.0, 10.0, 14.0, 21.0, 41.0, 50.0, 79.0, 118.0, 220.0, 507.0, 1006.0, 877.0, 412.0, 251.0, 113.0, 92.0, 42.0, 39.0, 23.0, 20.0, 20.0, 20.0, 11.0, 3.0, 11.0, 6.0, 4.0, 3.0, 5.0, 6.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-102.0625, -98.8642578125, -95.666015625, -92.4677734375, -89.26953125, -86.0712890625, -82.873046875, -79.6748046875, -76.4765625, -73.2783203125, -70.080078125, -66.8818359375, -63.68359375, -60.4853515625, -57.287109375, -54.0888671875, -50.890625, -47.6923828125, -44.494140625, -41.2958984375, -38.09765625, -34.8994140625, -31.701171875, -28.5029296875, -25.3046875, -22.1064453125, -18.908203125, -15.7099609375, -12.51171875, -9.3134765625, -6.115234375, -2.9169921875, 0.28125, 3.4794921875, 6.677734375, 9.8759765625, 13.07421875, 16.2724609375, 19.470703125, 22.6689453125, 25.8671875, 29.0654296875, 32.263671875, 35.4619140625, 38.66015625, 41.8583984375, 45.056640625, 48.2548828125, 51.453125, 54.6513671875, 57.849609375, 61.0478515625, 64.24609375, 67.4443359375, 70.642578125, 73.8408203125, 77.0390625, 80.2373046875, 83.435546875, 86.6337890625, 89.83203125, 93.0302734375, 96.228515625, 99.4267578125, 102.625]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 3.0, 4.0, 7.0, 6.0, 8.0, 14.0, 11.0, 22.0, 30.0, 52.0, 113.0, 289.0, 1081.0, 4420.0, 30574.0, 3866165.0, 275071.0, 12984.0, 2451.0, 610.0, 175.0, 71.0, 36.0, 25.0, 19.0, 13.0, 11.0, 7.0, 10.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-492.25, -478.10546875, -463.9609375, -449.81640625, -435.671875, -421.52734375, -407.3828125, -393.23828125, -379.09375, -364.94921875, -350.8046875, -336.66015625, -322.515625, -308.37109375, -294.2265625, -280.08203125, -265.9375, -251.79296875, -237.6484375, -223.50390625, -209.359375, -195.21484375, -181.0703125, -166.92578125, -152.78125, -138.63671875, -124.4921875, -110.34765625, -96.203125, -82.05859375, -67.9140625, -53.76953125, -39.625, -25.48046875, -11.3359375, 2.80859375, 16.953125, 31.09765625, 45.2421875, 59.38671875, 73.53125, 87.67578125, 101.8203125, 115.96484375, 130.109375, 144.25390625, 158.3984375, 172.54296875, 186.6875, 200.83203125, 214.9765625, 229.12109375, 243.265625, 257.41015625, 271.5546875, 285.69921875, 299.84375, 313.98828125, 328.1328125, 342.27734375, 356.421875, 370.56640625, 384.7109375, 398.85546875, 413.0]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 14.0, 70.0, 485.0, 379.0, 60.0, 8.0, 2.0], "bins": [-3549.258056640625, -3489.983642578125, -3430.709228515625, -3371.434814453125, -3312.16015625, -3252.8857421875, -3193.611328125, -3134.3369140625, -3075.0625, -3015.7880859375, -2956.513671875, -2897.2392578125, -2837.964599609375, -2778.690185546875, -2719.415771484375, -2660.141357421875, -2600.866943359375, -2541.592529296875, -2482.318115234375, -2423.043701171875, -2363.76904296875, -2304.49462890625, -2245.22021484375, -2185.94580078125, -2126.67138671875, -2067.39697265625, -2008.1224365234375, -1948.8480224609375, -1889.5736083984375, -1830.299072265625, -1771.024658203125, -1711.750244140625, -1652.4757080078125, -1593.2012939453125, -1533.9267578125, -1474.65234375, -1415.3779296875, -1356.103515625, -1296.8289794921875, -1237.5545654296875, -1178.280029296875, -1119.005615234375, -1059.7310791015625, -1000.4566650390625, -941.1822509765625, -881.9077758789062, -822.63330078125, -763.35888671875, -704.08447265625, -644.8099975585938, -585.5355834960938, -526.2611083984375, -466.9866943359375, -407.71221923828125, -348.4377746582031, -289.163330078125, -229.88890075683594, -170.6144561767578, -111.34000396728516, -52.0655517578125, 7.208892822265625, 66.48335266113281, 125.75779724121094, 185.03224182128906, 244.3066864013672]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 4.0, 3.0, 10.0, 11.0, 11.0, 9.0, 9.0, 20.0, 19.0, 22.0, 23.0, 18.0, 18.0, 34.0, 33.0, 26.0, 40.0, 41.0, 44.0, 44.0, 49.0, 53.0, 41.0, 56.0, 37.0, 40.0, 39.0, 36.0, 43.0, 21.0, 31.0, 17.0, 27.0, 11.0, 4.0, 9.0, 10.0, 4.0, 10.0, 6.0, 4.0, 5.0, 6.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-333.1680908203125, -323.7839660644531, -314.39984130859375, -305.0157470703125, -295.6316223144531, -286.24749755859375, -276.8633728027344, -267.479248046875, -258.09515380859375, -248.71102905273438, -239.32691955566406, -229.9427947998047, -220.55868530273438, -211.174560546875, -201.79043579101562, -192.4063262939453, -183.02220153808594, -173.63807678222656, -164.25396728515625, -154.86984252929688, -145.48573303222656, -136.1016082763672, -126.71749114990234, -117.3333740234375, -107.94925689697266, -98.56513977050781, -89.18102264404297, -79.79690551757812, -70.41278076171875, -61.02866744995117, -51.64454650878906, -42.26042938232422, -32.876312255859375, -23.49219512939453, -14.108076095581055, -4.723957061767578, 4.660160064697266, 14.04427719116211, 23.42839813232422, 32.81251525878906, 42.196632385253906, 51.58074951171875, 60.964866638183594, 70.34898376464844, 79.73310852050781, 89.11721801757812, 98.5013427734375, 107.88545989990234, 117.26957702636719, 126.65369415283203, 136.03781127929688, 145.42193603515625, 154.80604553222656, 164.19017028808594, 173.57427978515625, 182.95840454101562, 192.342529296875, 201.72665405273438, 211.1107635498047, 220.49488830566406, 229.87899780273438, 239.26312255859375, 248.64724731445312, 258.0313720703125, 267.41546630859375]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [5.0, 1.0, 2.0, 4.0, 3.0, 7.0, 9.0, 10.0, 8.0, 12.0, 9.0, 13.0, 22.0, 15.0, 22.0, 28.0, 31.0, 36.0, 35.0, 35.0, 46.0, 47.0, 47.0, 39.0, 34.0, 36.0, 41.0, 31.0, 46.0, 31.0, 36.0, 44.0, 33.0, 34.0, 21.0, 26.0, 23.0, 20.0, 16.0, 13.0, 8.0, 9.0, 3.0, 9.0, 5.0, 5.0, 4.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.9375, -46.01953125, -44.1015625, -42.18359375, -40.265625, -38.34765625, -36.4296875, -34.51171875, -32.59375, -30.67578125, -28.7578125, -26.83984375, -24.921875, -23.00390625, -21.0859375, -19.16796875, -17.25, -15.33203125, -13.4140625, -11.49609375, -9.578125, -7.66015625, -5.7421875, -3.82421875, -1.90625, 0.01171875, 1.9296875, 3.84765625, 5.765625, 7.68359375, 9.6015625, 11.51953125, 13.4375, 15.35546875, 17.2734375, 19.19140625, 21.109375, 23.02734375, 24.9453125, 26.86328125, 28.78125, 30.69921875, 32.6171875, 34.53515625, 36.453125, 38.37109375, 40.2890625, 42.20703125, 44.125, 46.04296875, 47.9609375, 49.87890625, 51.796875, 53.71484375, 55.6328125, 57.55078125, 59.46875, 61.38671875, 63.3046875, 65.22265625, 67.140625, 69.05859375, 70.9765625, 72.89453125, 74.8125]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 7.0, 8.0, 13.0, 13.0, 29.0, 56.0, 94.0, 123.0, 212.0, 402.0, 594.0, 902.0, 1365.0, 2197.0, 3145.0, 4739.0, 7205.0, 11358.0, 18190.0, 29530.0, 50056.0, 89591.0, 179084.0, 290478.0, 157676.0, 81135.0, 45645.0, 27278.0, 17012.0, 10712.0, 6781.0, 4405.0, 2943.0, 2016.0, 1310.0, 825.0, 527.0, 347.0, 208.0, 125.0, 70.0, 52.0, 36.0, 24.0, 17.0, 9.0, 8.0, 4.0, 2.0, 5.0, 1.0, 2.0], "bins": [-3.560546875, -3.46002197265625, -3.3594970703125, -3.25897216796875, -3.158447265625, -3.05792236328125, -2.9573974609375, -2.85687255859375, -2.75634765625, -2.65582275390625, -2.5552978515625, -2.45477294921875, -2.354248046875, -2.25372314453125, -2.1531982421875, -2.05267333984375, -1.9521484375, -1.85162353515625, -1.7510986328125, -1.65057373046875, -1.550048828125, -1.44952392578125, -1.3489990234375, -1.24847412109375, -1.14794921875, -1.04742431640625, -0.9468994140625, -0.84637451171875, -0.745849609375, -0.64532470703125, -0.5447998046875, -0.44427490234375, -0.34375, -0.24322509765625, -0.1427001953125, -0.04217529296875, 0.058349609375, 0.15887451171875, 0.2593994140625, 0.35992431640625, 0.46044921875, 0.56097412109375, 0.6614990234375, 0.76202392578125, 0.862548828125, 0.96307373046875, 1.0635986328125, 1.16412353515625, 1.2646484375, 1.36517333984375, 1.4656982421875, 1.56622314453125, 1.666748046875, 1.76727294921875, 1.8677978515625, 1.96832275390625, 2.06884765625, 2.16937255859375, 2.2698974609375, 2.37042236328125, 2.470947265625, 2.57147216796875, 2.6719970703125, 2.77252197265625, 2.873046875]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 4.0, 2.0, 1.0, 9.0, 4.0, 7.0, 19.0, 11.0, 10.0, 10.0, 17.0, 17.0, 19.0, 21.0, 28.0, 35.0, 39.0, 29.0, 44.0, 44.0, 43.0, 40.0, 31.0, 1065.0, 45.0, 46.0, 37.0, 46.0, 32.0, 31.0, 27.0, 27.0, 29.0, 14.0, 18.0, 16.0, 22.0, 17.0, 17.0, 12.0, 8.0, 5.0, 6.0, 4.0, 6.0, 7.0, 2.0, 5.0, 3.0, 0.0, 3.0, 1.0], "bins": [-40.5, -39.36083984375, -38.2216796875, -37.08251953125, -35.943359375, -34.80419921875, -33.6650390625, -32.52587890625, -31.38671875, -30.24755859375, -29.1083984375, -27.96923828125, -26.830078125, -25.69091796875, -24.5517578125, -23.41259765625, -22.2734375, -21.13427734375, -19.9951171875, -18.85595703125, -17.716796875, -16.57763671875, -15.4384765625, -14.29931640625, -13.16015625, -12.02099609375, -10.8818359375, -9.74267578125, -8.603515625, -7.46435546875, -6.3251953125, -5.18603515625, -4.046875, -2.90771484375, -1.7685546875, -0.62939453125, 0.509765625, 1.64892578125, 2.7880859375, 3.92724609375, 5.06640625, 6.20556640625, 7.3447265625, 8.48388671875, 9.623046875, 10.76220703125, 11.9013671875, 13.04052734375, 14.1796875, 15.31884765625, 16.4580078125, 17.59716796875, 18.736328125, 19.87548828125, 21.0146484375, 22.15380859375, 23.29296875, 24.43212890625, 25.5712890625, 26.71044921875, 27.849609375, 28.98876953125, 30.1279296875, 31.26708984375, 32.40625]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 6.0, 12.0, 13.0, 15.0, 25.0, 43.0, 60.0, 100.0, 136.0, 217.0, 275.0, 433.0, 688.0, 1037.0, 1619.0, 2471.0, 3897.0, 6157.0, 9953.0, 15628.0, 26216.0, 45630.0, 86588.0, 194113.0, 1360933.0, 162146.0, 75532.0, 40878.0, 23481.0, 14344.0, 8877.0, 5410.0, 3571.0, 2331.0, 1481.0, 963.0, 588.0, 387.0, 291.0, 198.0, 137.0, 91.0, 47.0, 33.0, 20.0, 24.0, 8.0, 10.0, 9.0, 3.0, 5.0, 3.0, 2.0], "bins": [-3.376953125, -3.28155517578125, -3.1861572265625, -3.09075927734375, -2.995361328125, -2.89996337890625, -2.8045654296875, -2.70916748046875, -2.61376953125, -2.51837158203125, -2.4229736328125, -2.32757568359375, -2.232177734375, -2.13677978515625, -2.0413818359375, -1.94598388671875, -1.8505859375, -1.75518798828125, -1.6597900390625, -1.56439208984375, -1.468994140625, -1.37359619140625, -1.2781982421875, -1.18280029296875, -1.08740234375, -0.99200439453125, -0.8966064453125, -0.80120849609375, -0.705810546875, -0.61041259765625, -0.5150146484375, -0.41961669921875, -0.32421875, -0.22882080078125, -0.1334228515625, -0.03802490234375, 0.057373046875, 0.15277099609375, 0.2481689453125, 0.34356689453125, 0.43896484375, 0.53436279296875, 0.6297607421875, 0.72515869140625, 0.820556640625, 0.91595458984375, 1.0113525390625, 1.10675048828125, 1.2021484375, 1.29754638671875, 1.3929443359375, 1.48834228515625, 1.583740234375, 1.67913818359375, 1.7745361328125, 1.86993408203125, 1.96533203125, 2.06072998046875, 2.1561279296875, 2.25152587890625, 2.346923828125, 2.44232177734375, 2.5377197265625, 2.63311767578125, 2.728515625]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 0.0, 5.0, 4.0, 5.0, 13.0, 8.0, 19.0, 20.0, 35.0, 34.0, 81.0, 68.0, 102.0, 95.0, 105.0, 92.0, 66.0, 54.0, 61.0, 32.0, 25.0, 17.0, 13.0, 13.0, 6.0, 3.0, 3.0, 8.0, 7.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0484619140625, -0.04712343215942383, -0.045784950256347656, -0.044446468353271484, -0.04310798645019531, -0.04176950454711914, -0.04043102264404297, -0.0390925407409668, -0.037754058837890625, -0.03641557693481445, -0.03507709503173828, -0.03373861312866211, -0.03240013122558594, -0.031061649322509766, -0.029723167419433594, -0.028384685516357422, -0.02704620361328125, -0.025707721710205078, -0.024369239807128906, -0.023030757904052734, -0.021692276000976562, -0.02035379409790039, -0.01901531219482422, -0.017676830291748047, -0.016338348388671875, -0.014999866485595703, -0.013661384582519531, -0.01232290267944336, -0.010984420776367188, -0.009645938873291016, -0.008307456970214844, -0.006968975067138672, -0.0056304931640625, -0.004292011260986328, -0.0029535293579101562, -0.0016150474548339844, -0.0002765655517578125, 0.0010619163513183594, 0.0024003982543945312, 0.003738880157470703, 0.005077362060546875, 0.006415843963623047, 0.007754325866699219, 0.00909280776977539, 0.010431289672851562, 0.011769771575927734, 0.013108253479003906, 0.014446735382080078, 0.01578521728515625, 0.017123699188232422, 0.018462181091308594, 0.019800662994384766, 0.021139144897460938, 0.02247762680053711, 0.02381610870361328, 0.025154590606689453, 0.026493072509765625, 0.027831554412841797, 0.02917003631591797, 0.03050851821899414, 0.03184700012207031, 0.033185482025146484, 0.034523963928222656, 0.03586244583129883, 0.037200927734375]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 6.0, 2.0, 8.0, 7.0, 10.0, 9.0, 10.0, 12.0, 22.0, 29.0, 27.0, 48.0, 86.0, 146.0, 221.0, 495.0, 4037.0, 1016695.0, 24993.0, 905.0, 313.0, 174.0, 95.0, 54.0, 39.0, 28.0, 20.0, 19.0, 12.0, 5.0, 8.0, 4.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.66796875, -0.6438522338867188, -0.6197357177734375, -0.5956192016601562, -0.571502685546875, -0.5473861694335938, -0.5232696533203125, -0.49915313720703125, -0.47503662109375, -0.45092010498046875, -0.4268035888671875, -0.40268707275390625, -0.378570556640625, -0.35445404052734375, -0.3303375244140625, -0.30622100830078125, -0.2821044921875, -0.25798797607421875, -0.2338714599609375, -0.20975494384765625, -0.185638427734375, -0.16152191162109375, -0.1374053955078125, -0.11328887939453125, -0.08917236328125, -0.06505584716796875, -0.0409393310546875, -0.01682281494140625, 0.007293701171875, 0.03141021728515625, 0.0555267333984375, 0.07964324951171875, 0.103759765625, 0.12787628173828125, 0.1519927978515625, 0.17610931396484375, 0.200225830078125, 0.22434234619140625, 0.2484588623046875, 0.27257537841796875, 0.29669189453125, 0.32080841064453125, 0.3449249267578125, 0.36904144287109375, 0.393157958984375, 0.41727447509765625, 0.4413909912109375, 0.46550750732421875, 0.4896240234375, 0.5137405395507812, 0.5378570556640625, 0.5619735717773438, 0.586090087890625, 0.6102066040039062, 0.6343231201171875, 0.6584396362304688, 0.68255615234375, 0.7066726684570312, 0.7307891845703125, 0.7549057006835938, 0.779022216796875, 0.8031387329101562, 0.8272552490234375, 0.8513717651367188, 0.87548828125]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 23.0, 959.0, 36.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11683978885412216, -0.10670732706785202, -0.09657486528158188, -0.08644240349531174, -0.0763099417090416, -0.06617747992277145, -0.05604501813650131, -0.04591255635023117, -0.03578009456396103, -0.025647632777690887, -0.015515170991420746, -0.005382709205150604, 0.004749752581119537, 0.014882214367389679, 0.02501467615365982, 0.03514713793992996, 0.045279599726200104, 0.055412061512470245, 0.06554452329874039, 0.07567698508501053, 0.08580944687128067, 0.09594190865755081, 0.10607437044382095, 0.1162068322300911, 0.12633928656578064, 0.13647174835205078, 0.14660421013832092, 0.15673667192459106, 0.1668691337108612, 0.17700159549713135, 0.1871340572834015, 0.19726651906967163, 0.20739901065826416, 0.2175314724445343, 0.22766393423080444, 0.23779639601707458, 0.24792885780334473, 0.25806131958961487, 0.268193781375885, 0.27832624316215515, 0.2884587049484253, 0.29859116673469543, 0.3087236285209656, 0.3188560903072357, 0.32898855209350586, 0.339121013879776, 0.34925347566604614, 0.3593859374523163, 0.3695183992385864, 0.37965086102485657, 0.3897833228111267, 0.39991578459739685, 0.410048246383667, 0.42018070816993713, 0.4303131699562073, 0.4404456317424774, 0.45057809352874756, 0.4607105553150177, 0.47084301710128784, 0.480975478887558, 0.4911079406738281, 0.5012403726577759, 0.5113728642463684, 0.5215053558349609, 0.5316377878189087]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 6.0, 2.0, 10.0, 6.0, 10.0, 17.0, 24.0, 21.0, 24.0, 27.0, 21.0, 44.0, 48.0, 59.0, 50.0, 57.0, 48.0, 61.0, 50.0, 50.0, 57.0, 41.0, 49.0, 42.0, 45.0, 32.0, 28.0, 16.0, 14.0, 13.0, 12.0, 7.0, 9.0, 6.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.02974987030029297, -0.029008792713284492, -0.028267715126276016, -0.02752663753926754, -0.026785559952259064, -0.026044482365250587, -0.02530340477824211, -0.024562327191233635, -0.02382124960422516, -0.023080172017216682, -0.022339094430208206, -0.02159801684319973, -0.020856939256191254, -0.020115861669182777, -0.0193747840821743, -0.018633706495165825, -0.01789262890815735, -0.017151551321148872, -0.016410473734140396, -0.01566939614713192, -0.014928318560123444, -0.014187240973114967, -0.013446163386106491, -0.012705085799098015, -0.011964008212089539, -0.011222930625081062, -0.010481853038072586, -0.00974077545106411, -0.008999697864055634, -0.008258620277047157, -0.007517542690038681, -0.006776465103030205, -0.0060353875160217285, -0.005294309929013252, -0.004553232342004776, -0.0038121547549962997, -0.0030710771679878235, -0.0023299995809793472, -0.001588921993970871, -0.0008478444069623947, -0.00010676681995391846, 0.0006343107670545578, 0.001375388354063034, 0.0021164659410715103, 0.0028575435280799866, 0.003598621115088463, 0.004339698702096939, 0.005080776289105415, 0.005821853876113892, 0.006562931463122368, 0.007304009050130844, 0.00804508663713932, 0.008786164224147797, 0.009527241811156273, 0.01026831939816475, 0.011009396985173225, 0.011750474572181702, 0.012491552159190178, 0.013232629746198654, 0.01397370733320713, 0.014714784920215607, 0.015455862507224083, 0.01619694009423256, 0.016938017681241035, 0.01767909526824951]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [5.0, 1.0, 2.0, 4.0, 3.0, 7.0, 9.0, 10.0, 8.0, 12.0, 9.0, 13.0, 22.0, 15.0, 22.0, 28.0, 31.0, 36.0, 35.0, 35.0, 46.0, 47.0, 47.0, 39.0, 34.0, 36.0, 41.0, 31.0, 46.0, 31.0, 36.0, 44.0, 33.0, 34.0, 21.0, 26.0, 23.0, 20.0, 16.0, 13.0, 8.0, 9.0, 3.0, 9.0, 5.0, 5.0, 4.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.9375, -46.01953125, -44.1015625, -42.18359375, -40.265625, -38.34765625, -36.4296875, -34.51171875, -32.59375, -30.67578125, -28.7578125, -26.83984375, -24.921875, -23.00390625, -21.0859375, -19.16796875, -17.25, -15.33203125, -13.4140625, -11.49609375, -9.578125, -7.66015625, -5.7421875, -3.82421875, -1.90625, 0.01171875, 1.9296875, 3.84765625, 5.765625, 7.68359375, 9.6015625, 11.51953125, 13.4375, 15.35546875, 17.2734375, 19.19140625, 21.109375, 23.02734375, 24.9453125, 26.86328125, 28.78125, 30.69921875, 32.6171875, 34.53515625, 36.453125, 38.37109375, 40.2890625, 42.20703125, 44.125, 46.04296875, 47.9609375, 49.87890625, 51.796875, 53.71484375, 55.6328125, 57.55078125, 59.46875, 61.38671875, 63.3046875, 65.22265625, 67.140625, 69.05859375, 70.9765625, 72.89453125, 74.8125]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 7.0, 7.0, 9.0, 13.0, 20.0, 40.0, 74.0, 75.0, 122.0, 218.0, 289.0, 368.0, 490.0, 680.0, 958.0, 1440.0, 1994.0, 3207.0, 5513.0, 11746.0, 31317.0, 143836.0, 643832.0, 143686.0, 31603.0, 11569.0, 5488.0, 3124.0, 2025.0, 1383.0, 996.0, 735.0, 485.0, 358.0, 285.0, 194.0, 134.0, 95.0, 55.0, 34.0, 22.0, 19.0, 8.0, 5.0, 1.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-107.375, -103.8544921875, -100.333984375, -96.8134765625, -93.29296875, -89.7724609375, -86.251953125, -82.7314453125, -79.2109375, -75.6904296875, -72.169921875, -68.6494140625, -65.12890625, -61.6083984375, -58.087890625, -54.5673828125, -51.046875, -47.5263671875, -44.005859375, -40.4853515625, -36.96484375, -33.4443359375, -29.923828125, -26.4033203125, -22.8828125, -19.3623046875, -15.841796875, -12.3212890625, -8.80078125, -5.2802734375, -1.759765625, 1.7607421875, 5.28125, 8.8017578125, 12.322265625, 15.8427734375, 19.36328125, 22.8837890625, 26.404296875, 29.9248046875, 33.4453125, 36.9658203125, 40.486328125, 44.0068359375, 47.52734375, 51.0478515625, 54.568359375, 58.0888671875, 61.609375, 65.1298828125, 68.650390625, 72.1708984375, 75.69140625, 79.2119140625, 82.732421875, 86.2529296875, 89.7734375, 93.2939453125, 96.814453125, 100.3349609375, 103.85546875, 107.3759765625, 110.896484375, 114.4169921875, 117.9375]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 7.0, 9.0, 8.0, 7.0, 8.0, 12.0, 18.0, 27.0, 34.0, 37.0, 35.0, 47.0, 45.0, 63.0, 97.0, 211.0, 1586.0, 292.0, 94.0, 60.0, 51.0, 54.0, 42.0, 42.0, 33.0, 29.0, 16.0, 26.0, 16.0, 15.0, 10.0, 7.0, 4.0, 5.0, 1.0, 0.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-120.4375, -115.3408203125, -110.244140625, -105.1474609375, -100.05078125, -94.9541015625, -89.857421875, -84.7607421875, -79.6640625, -74.5673828125, -69.470703125, -64.3740234375, -59.27734375, -54.1806640625, -49.083984375, -43.9873046875, -38.890625, -33.7939453125, -28.697265625, -23.6005859375, -18.50390625, -13.4072265625, -8.310546875, -3.2138671875, 1.8828125, 6.9794921875, 12.076171875, 17.1728515625, 22.26953125, 27.3662109375, 32.462890625, 37.5595703125, 42.65625, 47.7529296875, 52.849609375, 57.9462890625, 63.04296875, 68.1396484375, 73.236328125, 78.3330078125, 83.4296875, 88.5263671875, 93.623046875, 98.7197265625, 103.81640625, 108.9130859375, 114.009765625, 119.1064453125, 124.203125, 129.2998046875, 134.396484375, 139.4931640625, 144.58984375, 149.6865234375, 154.783203125, 159.8798828125, 164.9765625, 170.0732421875, 175.169921875, 180.2666015625, 185.36328125, 190.4599609375, 195.556640625, 200.6533203125, 205.75]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 5.0, 9.0, 12.0, 13.0, 14.0, 11.0, 25.0, 28.0, 39.0, 54.0, 73.0, 107.0, 245.0, 601.0, 2771.0, 2930809.0, 207960.0, 1912.0, 481.0, 221.0, 106.0, 63.0, 36.0, 25.0, 20.0, 15.0, 8.0, 12.0, 12.0, 7.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-702.5, -682.9375, -663.375, -643.8125, -624.25, -604.6875, -585.125, -565.5625, -546.0, -526.4375, -506.875, -487.3125, -467.75, -448.1875, -428.625, -409.0625, -389.5, -369.9375, -350.375, -330.8125, -311.25, -291.6875, -272.125, -252.5625, -233.0, -213.4375, -193.875, -174.3125, -154.75, -135.1875, -115.625, -96.0625, -76.5, -56.9375, -37.375, -17.8125, 1.75, 21.3125, 40.875, 60.4375, 80.0, 99.5625, 119.125, 138.6875, 158.25, 177.8125, 197.375, 216.9375, 236.5, 256.0625, 275.625, 295.1875, 314.75, 334.3125, 353.875, 373.4375, 393.0, 412.5625, 432.125, 451.6875, 471.25, 490.8125, 510.375, 529.9375, 549.5]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 100.0, 780.0, 130.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1219.6351318359375, -1160.1058349609375, -1100.576416015625, -1041.047119140625, -981.5177001953125, -921.9884033203125, -862.4590454101562, -802.9296875, -743.4003295898438, -683.8709716796875, -624.3416137695312, -564.812255859375, -505.2829284667969, -445.7535705566406, -386.2242431640625, -326.69488525390625, -267.16552734375, -207.63616943359375, -148.10682678222656, -88.57748413085938, -29.048126220703125, 30.481231689453125, 90.01055908203125, 149.5399169921875, 209.06927490234375, 268.5986328125, 328.12799072265625, 387.6573181152344, 447.1866760253906, 506.7160339355469, 566.245361328125, 625.7747192382812, 685.30419921875, 744.8335571289062, 804.3629150390625, 863.8922119140625, 923.421630859375, 982.950927734375, 1042.480224609375, 1102.0096435546875, 1161.5390625, 1221.068359375, 1280.5977783203125, 1340.1270751953125, 1399.656494140625, 1459.185791015625, 1518.715087890625, 1578.2445068359375, 1637.7738037109375, 1697.3031005859375, 1756.83251953125, 1816.36181640625, 1875.8912353515625, 1935.4205322265625, 1994.949951171875, 2054.479248046875, 2114.008544921875, 2173.537841796875, 2233.067138671875, 2292.5966796875, 2352.1259765625, 2411.6552734375, 2471.1845703125, 2530.7138671875, 2590.243408203125]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 5.0, 4.0, 5.0, 8.0, 11.0, 10.0, 13.0, 20.0, 15.0, 10.0, 15.0, 31.0, 30.0, 30.0, 27.0, 26.0, 40.0, 25.0, 38.0, 39.0, 31.0, 43.0, 31.0, 40.0, 36.0, 35.0, 31.0, 28.0, 27.0, 26.0, 35.0, 28.0, 31.0, 30.0, 15.0, 24.0, 17.0, 11.0, 10.0, 14.0, 16.0, 10.0, 5.0, 7.0, 3.0, 10.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-298.99188232421875, -288.9653625488281, -278.9388122558594, -268.91229248046875, -258.8857727050781, -248.85923767089844, -238.83270263671875, -228.80618286132812, -218.7796630859375, -208.7531280517578, -198.7266082763672, -188.7000732421875, -178.67355346679688, -168.6470184326172, -158.6204833984375, -148.59396362304688, -138.5674285888672, -128.5408935546875, -118.51437377929688, -108.48783874511719, -98.46131896972656, -88.43478393554688, -78.40825653076172, -68.38172912597656, -58.355201721191406, -48.32867431640625, -38.302146911621094, -28.275615692138672, -18.249088287353516, -8.22256088256836, 1.8039703369140625, 11.830497741699219, 21.857025146484375, 31.88355255126953, 41.91007995605469, 51.93661117553711, 61.963138580322266, 71.98966979980469, 82.01619720458984, 92.042724609375, 102.06925201416016, 112.09577941894531, 122.12230682373047, 132.14883422851562, 142.1753692626953, 152.20188903808594, 162.22842407226562, 172.25494384765625, 182.28147888183594, 192.30801391601562, 202.33453369140625, 212.36106872558594, 222.38758850097656, 232.41412353515625, 242.44064331054688, 252.46717834472656, 262.49371337890625, 272.5202331542969, 282.5467834472656, 292.57330322265625, 302.5998229980469, 312.6263427734375, 322.65289306640625, 332.6794128417969, 342.7059326171875]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 3.0, 5.0, 5.0, 8.0, 11.0, 14.0, 13.0, 12.0, 15.0, 19.0, 17.0, 22.0, 32.0, 35.0, 29.0, 33.0, 39.0, 45.0, 40.0, 45.0, 37.0, 51.0, 36.0, 38.0, 37.0, 35.0, 34.0, 31.0, 32.0, 41.0, 32.0, 34.0, 26.0, 22.0, 13.0, 12.0, 11.0, 11.0, 11.0, 7.0, 6.0, 7.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.78125, -54.80224609375, -52.8232421875, -50.84423828125, -48.865234375, -46.88623046875, -44.9072265625, -42.92822265625, -40.94921875, -38.97021484375, -36.9912109375, -35.01220703125, -33.033203125, -31.05419921875, -29.0751953125, -27.09619140625, -25.1171875, -23.13818359375, -21.1591796875, -19.18017578125, -17.201171875, -15.22216796875, -13.2431640625, -11.26416015625, -9.28515625, -7.30615234375, -5.3271484375, -3.34814453125, -1.369140625, 0.60986328125, 2.5888671875, 4.56787109375, 6.546875, 8.52587890625, 10.5048828125, 12.48388671875, 14.462890625, 16.44189453125, 18.4208984375, 20.39990234375, 22.37890625, 24.35791015625, 26.3369140625, 28.31591796875, 30.294921875, 32.27392578125, 34.2529296875, 36.23193359375, 38.2109375, 40.18994140625, 42.1689453125, 44.14794921875, 46.126953125, 48.10595703125, 50.0849609375, 52.06396484375, 54.04296875, 56.02197265625, 58.0009765625, 59.97998046875, 61.958984375, 63.93798828125, 65.9169921875, 67.89599609375, 69.875]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 6.0, 8.0, 7.0, 15.0, 26.0, 32.0, 42.0, 57.0, 85.0, 134.0, 182.0, 299.0, 477.0, 706.0, 1153.0, 1800.0, 3000.0, 5388.0, 11085.0, 34905.0, 281830.0, 2552320.0, 1152385.0, 111424.0, 18389.0, 7945.0, 4131.0, 2401.0, 1443.0, 867.0, 575.0, 359.0, 237.0, 188.0, 122.0, 69.0, 50.0, 36.0, 39.0, 23.0, 8.0, 12.0, 5.0, 5.0, 5.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-116.25, -112.34765625, -108.4453125, -104.54296875, -100.640625, -96.73828125, -92.8359375, -88.93359375, -85.03125, -81.12890625, -77.2265625, -73.32421875, -69.421875, -65.51953125, -61.6171875, -57.71484375, -53.8125, -49.91015625, -46.0078125, -42.10546875, -38.203125, -34.30078125, -30.3984375, -26.49609375, -22.59375, -18.69140625, -14.7890625, -10.88671875, -6.984375, -3.08203125, 0.8203125, 4.72265625, 8.625, 12.52734375, 16.4296875, 20.33203125, 24.234375, 28.13671875, 32.0390625, 35.94140625, 39.84375, 43.74609375, 47.6484375, 51.55078125, 55.453125, 59.35546875, 63.2578125, 67.16015625, 71.0625, 74.96484375, 78.8671875, 82.76953125, 86.671875, 90.57421875, 94.4765625, 98.37890625, 102.28125, 106.18359375, 110.0859375, 113.98828125, 117.890625, 121.79296875, 125.6953125, 129.59765625, 133.5]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 4.0, 3.0, 4.0, 10.0, 8.0, 8.0, 15.0, 23.0, 20.0, 38.0, 48.0, 71.0, 115.0, 184.0, 306.0, 577.0, 967.0, 693.0, 343.0, 220.0, 126.0, 86.0, 52.0, 40.0, 34.0, 20.0, 14.0, 10.0, 7.0, 8.0, 3.0, 7.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0], "bins": [-161.5, -157.4296875, -153.359375, -149.2890625, -145.21875, -141.1484375, -137.078125, -133.0078125, -128.9375, -124.8671875, -120.796875, -116.7265625, -112.65625, -108.5859375, -104.515625, -100.4453125, -96.375, -92.3046875, -88.234375, -84.1640625, -80.09375, -76.0234375, -71.953125, -67.8828125, -63.8125, -59.7421875, -55.671875, -51.6015625, -47.53125, -43.4609375, -39.390625, -35.3203125, -31.25, -27.1796875, -23.109375, -19.0390625, -14.96875, -10.8984375, -6.828125, -2.7578125, 1.3125, 5.3828125, 9.453125, 13.5234375, 17.59375, 21.6640625, 25.734375, 29.8046875, 33.875, 37.9453125, 42.015625, 46.0859375, 50.15625, 54.2265625, 58.296875, 62.3671875, 66.4375, 70.5078125, 74.578125, 78.6484375, 82.71875, 86.7890625, 90.859375, 94.9296875, 99.0]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 4.0, 5.0, 7.0, 16.0, 21.0, 45.0, 61.0, 89.0, 187.0, 346.0, 606.0, 1244.0, 2561.0, 6430.0, 19006.0, 84009.0, 2247900.0, 1724948.0, 77682.0, 17998.0, 6133.0, 2492.0, 1177.0, 571.0, 301.0, 171.0, 104.0, 70.0, 35.0, 25.0, 13.0, 11.0, 10.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-204.625, -198.01953125, -191.4140625, -184.80859375, -178.203125, -171.59765625, -164.9921875, -158.38671875, -151.78125, -145.17578125, -138.5703125, -131.96484375, -125.359375, -118.75390625, -112.1484375, -105.54296875, -98.9375, -92.33203125, -85.7265625, -79.12109375, -72.515625, -65.91015625, -59.3046875, -52.69921875, -46.09375, -39.48828125, -32.8828125, -26.27734375, -19.671875, -13.06640625, -6.4609375, 0.14453125, 6.75, 13.35546875, 19.9609375, 26.56640625, 33.171875, 39.77734375, 46.3828125, 52.98828125, 59.59375, 66.19921875, 72.8046875, 79.41015625, 86.015625, 92.62109375, 99.2265625, 105.83203125, 112.4375, 119.04296875, 125.6484375, 132.25390625, 138.859375, 145.46484375, 152.0703125, 158.67578125, 165.28125, 171.88671875, 178.4921875, 185.09765625, 191.703125, 198.30859375, 204.9140625, 211.51953125, 218.125]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 10.0, 1002.0, 7.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12957.9404296875, -12645.447265625, -12332.955078125, -12020.462890625, -11707.9697265625, -11395.4765625, -11082.984375, -10770.4921875, -10457.9990234375, -10145.505859375, -9833.013671875, -9520.521484375, -9208.0283203125, -8895.53515625, -8583.04296875, -8270.55078125, -7958.0576171875, -7645.56494140625, -7333.072265625, -7020.57958984375, -6708.0869140625, -6395.59423828125, -6083.1015625, -5770.60888671875, -5458.1162109375, -5145.62353515625, -4833.130859375, -4520.63818359375, -4208.1455078125, -3895.65283203125, -3583.16015625, -3270.66748046875, -2958.17578125, -2645.68310546875, -2333.1904296875, -2020.69775390625, -1708.205078125, -1395.71240234375, -1083.2197265625, -770.72705078125, -458.234375, -145.74169921875, 166.7509765625, 479.24365234375, 791.736328125, 1104.22900390625, 1416.7216796875, 1729.21435546875, 2041.70703125, 2354.19970703125, 2666.6923828125, 2979.18505859375, 3291.677734375, 3604.17041015625, 3916.6630859375, 4229.15576171875, 4541.6484375, 4854.14111328125, 5166.6337890625, 5479.12646484375, 5791.619140625, 6104.11181640625, 6416.6044921875, 6729.09716796875, 7041.58984375]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 7.0, 5.0, 6.0, 17.0, 15.0, 26.0, 37.0, 33.0, 39.0, 56.0, 44.0, 60.0, 95.0, 79.0, 83.0, 66.0, 64.0, 84.0, 52.0, 37.0, 35.0, 23.0, 14.0, 14.0, 10.0, 6.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-380.5922546386719, -361.2588195800781, -341.9253845214844, -322.5919494628906, -303.258544921875, -283.92510986328125, -264.5916748046875, -245.25823974609375, -225.9248046875, -206.59136962890625, -187.2579345703125, -167.9245147705078, -148.59107971191406, -129.2576446533203, -109.9242172241211, -90.59078979492188, -71.25735473632812, -51.92392349243164, -32.590492248535156, -13.257061004638672, 6.0763702392578125, 25.409805297851562, 44.74323272705078, 64.07666015625, 83.41009521484375, 102.7435302734375, 122.07695770263672, 141.41038513183594, 160.7438201904297, 180.07725524902344, 199.41067504882812, 218.74411010742188, 238.07757568359375, 257.4110107421875, 276.74444580078125, 296.077880859375, 315.41131591796875, 334.7447509765625, 354.0781555175781, 373.4115905761719, 392.7450256347656, 412.0784606933594, 431.4118957519531, 450.7453308105469, 470.0787353515625, 489.41217041015625, 508.74560546875, 528.0790405273438, 547.4124755859375, 566.7459106445312, 586.079345703125, 605.4127807617188, 624.7462158203125, 644.0796508789062, 663.4130859375, 682.7464599609375, 702.0799560546875, 721.4133911132812, 740.746826171875, 760.0802612304688, 779.4136962890625, 798.7471313476562, 818.08056640625, 837.4139404296875, 856.7473754882812]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 7.0, 6.0, 5.0, 7.0, 8.0, 11.0, 15.0, 12.0, 21.0, 17.0, 12.0, 17.0, 21.0, 18.0, 30.0, 27.0, 36.0, 46.0, 40.0, 41.0, 38.0, 47.0, 53.0, 34.0, 35.0, 42.0, 34.0, 27.0, 31.0, 33.0, 35.0, 36.0, 16.0, 24.0, 25.0, 17.0, 15.0, 13.0, 10.0, 7.0, 9.0, 11.0, 4.0, 2.0, 4.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-52.03125, -50.47216796875, -48.9130859375, -47.35400390625, -45.794921875, -44.23583984375, -42.6767578125, -41.11767578125, -39.55859375, -37.99951171875, -36.4404296875, -34.88134765625, -33.322265625, -31.76318359375, -30.2041015625, -28.64501953125, -27.0859375, -25.52685546875, -23.9677734375, -22.40869140625, -20.849609375, -19.29052734375, -17.7314453125, -16.17236328125, -14.61328125, -13.05419921875, -11.4951171875, -9.93603515625, -8.376953125, -6.81787109375, -5.2587890625, -3.69970703125, -2.140625, -0.58154296875, 0.9775390625, 2.53662109375, 4.095703125, 5.65478515625, 7.2138671875, 8.77294921875, 10.33203125, 11.89111328125, 13.4501953125, 15.00927734375, 16.568359375, 18.12744140625, 19.6865234375, 21.24560546875, 22.8046875, 24.36376953125, 25.9228515625, 27.48193359375, 29.041015625, 30.60009765625, 32.1591796875, 33.71826171875, 35.27734375, 36.83642578125, 38.3955078125, 39.95458984375, 41.513671875, 43.07275390625, 44.6318359375, 46.19091796875, 47.75]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 5.0, 6.0, 8.0, 19.0, 25.0, 30.0, 44.0, 66.0, 90.0, 132.0, 211.0, 293.0, 411.0, 544.0, 866.0, 1242.0, 1762.0, 2463.0, 3702.0, 5270.0, 7696.0, 11196.0, 16680.0, 24847.0, 38563.0, 61524.0, 106650.0, 196743.0, 232005.0, 128270.0, 73957.0, 44960.0, 28686.0, 18925.0, 12767.0, 8736.0, 5889.0, 4032.0, 2805.0, 1981.0, 1393.0, 966.0, 616.0, 468.0, 323.0, 206.0, 149.0, 122.0, 77.0, 47.0, 34.0, 26.0, 13.0, 9.0, 7.0, 5.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-2.068359375, -1.999786376953125, -1.93121337890625, -1.862640380859375, -1.7940673828125, -1.725494384765625, -1.65692138671875, -1.588348388671875, -1.519775390625, -1.451202392578125, -1.38262939453125, -1.314056396484375, -1.2454833984375, -1.176910400390625, -1.10833740234375, -1.039764404296875, -0.97119140625, -0.902618408203125, -0.83404541015625, -0.765472412109375, -0.6968994140625, -0.628326416015625, -0.55975341796875, -0.491180419921875, -0.422607421875, -0.354034423828125, -0.28546142578125, -0.216888427734375, -0.1483154296875, -0.079742431640625, -0.01116943359375, 0.057403564453125, 0.1259765625, 0.194549560546875, 0.26312255859375, 0.331695556640625, 0.4002685546875, 0.468841552734375, 0.53741455078125, 0.605987548828125, 0.674560546875, 0.743133544921875, 0.81170654296875, 0.880279541015625, 0.9488525390625, 1.017425537109375, 1.08599853515625, 1.154571533203125, 1.22314453125, 1.291717529296875, 1.36029052734375, 1.428863525390625, 1.4974365234375, 1.566009521484375, 1.63458251953125, 1.703155517578125, 1.771728515625, 1.840301513671875, 1.90887451171875, 1.977447509765625, 2.0460205078125, 2.114593505859375, 2.18316650390625, 2.251739501953125, 2.3203125]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 6.0, 3.0, 2.0, 7.0, 11.0, 7.0, 5.0, 11.0, 15.0, 12.0, 19.0, 14.0, 22.0, 26.0, 34.0, 23.0, 26.0, 28.0, 43.0, 34.0, 34.0, 52.0, 35.0, 1067.0, 34.0, 42.0, 44.0, 31.0, 44.0, 34.0, 22.0, 36.0, 28.0, 33.0, 21.0, 9.0, 19.0, 16.0, 16.0, 10.0, 10.0, 3.0, 11.0, 5.0, 6.0, 8.0, 2.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-29.875, -28.88037109375, -27.8857421875, -26.89111328125, -25.896484375, -24.90185546875, -23.9072265625, -22.91259765625, -21.91796875, -20.92333984375, -19.9287109375, -18.93408203125, -17.939453125, -16.94482421875, -15.9501953125, -14.95556640625, -13.9609375, -12.96630859375, -11.9716796875, -10.97705078125, -9.982421875, -8.98779296875, -7.9931640625, -6.99853515625, -6.00390625, -5.00927734375, -4.0146484375, -3.02001953125, -2.025390625, -1.03076171875, -0.0361328125, 0.95849609375, 1.953125, 2.94775390625, 3.9423828125, 4.93701171875, 5.931640625, 6.92626953125, 7.9208984375, 8.91552734375, 9.91015625, 10.90478515625, 11.8994140625, 12.89404296875, 13.888671875, 14.88330078125, 15.8779296875, 16.87255859375, 17.8671875, 18.86181640625, 19.8564453125, 20.85107421875, 21.845703125, 22.84033203125, 23.8349609375, 24.82958984375, 25.82421875, 26.81884765625, 27.8134765625, 28.80810546875, 29.802734375, 30.79736328125, 31.7919921875, 32.78662109375, 33.78125]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 5.0, 5.0, 7.0, 13.0, 9.0, 23.0, 31.0, 36.0, 72.0, 103.0, 131.0, 204.0, 313.0, 431.0, 634.0, 903.0, 1428.0, 2187.0, 3226.0, 4908.0, 7818.0, 12157.0, 19365.0, 32705.0, 57562.0, 111168.0, 409113.0, 1164553.0, 117420.0, 59977.0, 34475.0, 20411.0, 12573.0, 7989.0, 5005.0, 3394.0, 2197.0, 1478.0, 973.0, 644.0, 482.0, 293.0, 217.0, 154.0, 111.0, 72.0, 45.0, 33.0, 29.0, 17.0, 13.0, 17.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0], "bins": [-2.458984375, -2.37713623046875, -2.2952880859375, -2.21343994140625, -2.131591796875, -2.04974365234375, -1.9678955078125, -1.88604736328125, -1.80419921875, -1.72235107421875, -1.6405029296875, -1.55865478515625, -1.476806640625, -1.39495849609375, -1.3131103515625, -1.23126220703125, -1.1494140625, -1.06756591796875, -0.9857177734375, -0.90386962890625, -0.822021484375, -0.74017333984375, -0.6583251953125, -0.57647705078125, -0.49462890625, -0.41278076171875, -0.3309326171875, -0.24908447265625, -0.167236328125, -0.08538818359375, -0.0035400390625, 0.07830810546875, 0.16015625, 0.24200439453125, 0.3238525390625, 0.40570068359375, 0.487548828125, 0.56939697265625, 0.6512451171875, 0.73309326171875, 0.81494140625, 0.89678955078125, 0.9786376953125, 1.06048583984375, 1.142333984375, 1.22418212890625, 1.3060302734375, 1.38787841796875, 1.4697265625, 1.55157470703125, 1.6334228515625, 1.71527099609375, 1.797119140625, 1.87896728515625, 1.9608154296875, 2.04266357421875, 2.12451171875, 2.20635986328125, 2.2882080078125, 2.37005615234375, 2.451904296875, 2.53375244140625, 2.6156005859375, 2.69744873046875, 2.779296875]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 9.0, 0.0, 6.0, 4.0, 9.0, 7.0, 5.0, 5.0, 6.0, 10.0, 11.0, 20.0, 14.0, 23.0, 26.0, 22.0, 28.0, 29.0, 55.0, 52.0, 66.0, 80.0, 71.0, 78.0, 52.0, 35.0, 38.0, 35.0, 30.0, 23.0, 22.0, 16.0, 21.0, 15.0, 9.0, 20.0, 11.0, 8.0, 6.0, 5.0, 6.0, 5.0, 9.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.025421142578125, -0.024588823318481445, -0.02375650405883789, -0.022924184799194336, -0.02209186553955078, -0.021259546279907227, -0.020427227020263672, -0.019594907760620117, -0.018762588500976562, -0.017930269241333008, -0.017097949981689453, -0.0162656307220459, -0.015433311462402344, -0.014600992202758789, -0.013768672943115234, -0.01293635368347168, -0.012104034423828125, -0.01127171516418457, -0.010439395904541016, -0.009607076644897461, -0.008774757385253906, -0.007942438125610352, -0.007110118865966797, -0.006277799606323242, -0.0054454803466796875, -0.004613161087036133, -0.003780841827392578, -0.0029485225677490234, -0.0021162033081054688, -0.001283884048461914, -0.0004515647888183594, 0.0003807544708251953, 0.00121307373046875, 0.0020453929901123047, 0.0028777122497558594, 0.003710031509399414, 0.004542350769042969, 0.0053746700286865234, 0.006206989288330078, 0.007039308547973633, 0.007871627807617188, 0.008703947067260742, 0.009536266326904297, 0.010368585586547852, 0.011200904846191406, 0.012033224105834961, 0.012865543365478516, 0.01369786262512207, 0.014530181884765625, 0.01536250114440918, 0.016194820404052734, 0.01702713966369629, 0.017859458923339844, 0.0186917781829834, 0.019524097442626953, 0.020356416702270508, 0.021188735961914062, 0.022021055221557617, 0.022853374481201172, 0.023685693740844727, 0.02451801300048828, 0.025350332260131836, 0.02618265151977539, 0.027014970779418945, 0.0278472900390625]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 6.0, 5.0, 5.0, 15.0, 7.0, 14.0, 11.0, 15.0, 15.0, 31.0, 24.0, 30.0, 35.0, 35.0, 43.0, 72.0, 85.0, 114.0, 183.0, 303.0, 697.0, 9274.0, 950254.0, 84015.0, 1932.0, 450.0, 275.0, 127.0, 96.0, 80.0, 58.0, 41.0, 43.0, 29.0, 23.0, 14.0, 14.0, 8.0, 13.0, 12.0, 18.0, 17.0, 5.0, 8.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.496826171875, -0.4816551208496094, -0.46648406982421875, -0.4513130187988281, -0.4361419677734375, -0.4209709167480469, -0.40579986572265625, -0.3906288146972656, -0.375457763671875, -0.3602867126464844, -0.34511566162109375, -0.3299446105957031, -0.3147735595703125, -0.2996025085449219, -0.28443145751953125, -0.2692604064941406, -0.25408935546875, -0.23891830444335938, -0.22374725341796875, -0.20857620239257812, -0.1934051513671875, -0.17823410034179688, -0.16306304931640625, -0.14789199829101562, -0.132720947265625, -0.11754989624023438, -0.10237884521484375, -0.08720779418945312, -0.0720367431640625, -0.056865692138671875, -0.04169464111328125, -0.026523590087890625, -0.0113525390625, 0.003818511962890625, 0.01898956298828125, 0.034160614013671875, 0.0493316650390625, 0.06450271606445312, 0.07967376708984375, 0.09484481811523438, 0.110015869140625, 0.12518692016601562, 0.14035797119140625, 0.15552902221679688, 0.1707000732421875, 0.18587112426757812, 0.20104217529296875, 0.21621322631835938, 0.23138427734375, 0.24655532836914062, 0.26172637939453125, 0.2768974304199219, 0.2920684814453125, 0.3072395324707031, 0.32241058349609375, 0.3375816345214844, 0.352752685546875, 0.3679237365722656, 0.38309478759765625, 0.3982658386230469, 0.4134368896484375, 0.4286079406738281, 0.44377899169921875, 0.4589500427246094, 0.47412109375]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 21.0, 353.0, 625.0, 19.0], "bins": [-0.3406594395637512, -0.3351737856864929, -0.3296881318092346, -0.3242024779319763, -0.318716824054718, -0.3132311701774597, -0.3077455163002014, -0.3022598624229431, -0.2967742085456848, -0.2912885546684265, -0.2858029007911682, -0.2803172469139099, -0.2748315930366516, -0.2693459391593933, -0.263860285282135, -0.2583746314048767, -0.2528889775276184, -0.2474033236503601, -0.2419176697731018, -0.2364320158958435, -0.2309463620185852, -0.2254607081413269, -0.2199750542640686, -0.2144894003868103, -0.2090037763118744, -0.2035181224346161, -0.1980324685573578, -0.1925468146800995, -0.1870611608028412, -0.18157550692558289, -0.17608985304832458, -0.17060419917106628, -0.16511856019496918, -0.15963290631771088, -0.15414725244045258, -0.14866159856319427, -0.14317594468593597, -0.13769029080867767, -0.13220465183258057, -0.12671899795532227, -0.12123333662748337, -0.11574768275022507, -0.11026202887296677, -0.10477638244628906, -0.09929072856903076, -0.09380507469177246, -0.08831942081451416, -0.08283376693725586, -0.07734811305999756, -0.07186245918273926, -0.06637680530548096, -0.060891155153512955, -0.055405501276254654, -0.04991984739899635, -0.04443419724702835, -0.03894854336977005, -0.03346288949251175, -0.02797723561525345, -0.022491583600640297, -0.017005931586027145, -0.011520277708768845, -0.006034623831510544, -0.0005489736795425415, 0.004936680197715759, 0.01042233593761921]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 3.0, 4.0, 3.0, 5.0, 9.0, 18.0, 20.0, 20.0, 29.0, 23.0, 32.0, 35.0, 49.0, 52.0, 53.0, 42.0, 47.0, 55.0, 54.0, 51.0, 54.0, 48.0, 40.0, 38.0, 32.0, 35.0, 23.0, 29.0, 20.0, 17.0, 19.0, 9.0, 6.0, 7.0, 7.0, 9.0, 6.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01752525568008423, -0.01690787822008133, -0.01629050076007843, -0.01567312330007553, -0.015055745840072632, -0.014438368380069733, -0.013820990920066833, -0.013203613460063934, -0.012586236000061035, -0.011968858540058136, -0.011351481080055237, -0.010734103620052338, -0.010116726160049438, -0.00949934870004654, -0.00888197124004364, -0.008264593780040741, -0.007647216320037842, -0.007029838860034943, -0.0064124614000320435, -0.005795083940029144, -0.005177706480026245, -0.004560329020023346, -0.003942951560020447, -0.0033255741000175476, -0.0027081966400146484, -0.0020908191800117493, -0.00147344172000885, -0.0008560642600059509, -0.00023868680000305176, 0.0003786906599998474, 0.0009960681200027466, 0.0016134455800056458, 0.002230823040008545, 0.002848200500011444, 0.0034655779600143433, 0.004082955420017242, 0.004700332880020142, 0.005317710340023041, 0.00593508780002594, 0.006552465260028839, 0.007169842720031738, 0.0077872201800346375, 0.008404597640037537, 0.009021975100040436, 0.009639352560043335, 0.010256730020046234, 0.010874107480049133, 0.011491484940052032, 0.012108862400054932, 0.01272623986005783, 0.01334361732006073, 0.01396099478006363, 0.014578372240066528, 0.015195749700069427, 0.015813127160072327, 0.016430504620075226, 0.017047882080078125, 0.017665259540081024, 0.018282637000083923, 0.018900014460086823, 0.01951739192008972, 0.02013476938009262, 0.02075214684009552, 0.02136952430009842, 0.02198690176010132]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 7.0, 6.0, 5.0, 7.0, 8.0, 11.0, 15.0, 12.0, 21.0, 17.0, 12.0, 17.0, 21.0, 18.0, 30.0, 27.0, 36.0, 46.0, 40.0, 41.0, 38.0, 47.0, 53.0, 34.0, 35.0, 42.0, 34.0, 27.0, 31.0, 33.0, 35.0, 36.0, 16.0, 24.0, 25.0, 17.0, 15.0, 13.0, 10.0, 7.0, 9.0, 11.0, 4.0, 2.0, 4.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-52.03125, -50.47216796875, -48.9130859375, -47.35400390625, -45.794921875, -44.23583984375, -42.6767578125, -41.11767578125, -39.55859375, -37.99951171875, -36.4404296875, -34.88134765625, -33.322265625, -31.76318359375, -30.2041015625, -28.64501953125, -27.0859375, -25.52685546875, -23.9677734375, -22.40869140625, -20.849609375, -19.29052734375, -17.7314453125, -16.17236328125, -14.61328125, -13.05419921875, -11.4951171875, -9.93603515625, -8.376953125, -6.81787109375, -5.2587890625, -3.69970703125, -2.140625, -0.58154296875, 0.9775390625, 2.53662109375, 4.095703125, 5.65478515625, 7.2138671875, 8.77294921875, 10.33203125, 11.89111328125, 13.4501953125, 15.00927734375, 16.568359375, 18.12744140625, 19.6865234375, 21.24560546875, 22.8046875, 24.36376953125, 25.9228515625, 27.48193359375, 29.041015625, 30.60009765625, 32.1591796875, 33.71826171875, 35.27734375, 36.83642578125, 38.3955078125, 39.95458984375, 41.513671875, 43.07275390625, 44.6318359375, 46.19091796875, 47.75]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 5.0, 4.0, 5.0, 11.0, 16.0, 23.0, 23.0, 21.0, 52.0, 72.0, 98.0, 138.0, 160.0, 244.0, 354.0, 555.0, 742.0, 1135.0, 1787.0, 2874.0, 4908.0, 10247.0, 26682.0, 109938.0, 648071.0, 176433.0, 36262.0, 12728.0, 5837.0, 3244.0, 1932.0, 1233.0, 845.0, 558.0, 371.0, 278.0, 172.0, 133.0, 99.0, 65.0, 57.0, 43.0, 39.0, 13.0, 15.0, 15.0, 6.0, 2.0, 8.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-115.4375, -111.787109375, -108.13671875, -104.486328125, -100.8359375, -97.185546875, -93.53515625, -89.884765625, -86.234375, -82.583984375, -78.93359375, -75.283203125, -71.6328125, -67.982421875, -64.33203125, -60.681640625, -57.03125, -53.380859375, -49.73046875, -46.080078125, -42.4296875, -38.779296875, -35.12890625, -31.478515625, -27.828125, -24.177734375, -20.52734375, -16.876953125, -13.2265625, -9.576171875, -5.92578125, -2.275390625, 1.375, 5.025390625, 8.67578125, 12.326171875, 15.9765625, 19.626953125, 23.27734375, 26.927734375, 30.578125, 34.228515625, 37.87890625, 41.529296875, 45.1796875, 48.830078125, 52.48046875, 56.130859375, 59.78125, 63.431640625, 67.08203125, 70.732421875, 74.3828125, 78.033203125, 81.68359375, 85.333984375, 88.984375, 92.634765625, 96.28515625, 99.935546875, 103.5859375, 107.236328125, 110.88671875, 114.537109375, 118.1875]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 4.0, 2.0, 5.0, 1.0, 7.0, 9.0, 9.0, 10.0, 8.0, 13.0, 21.0, 20.0, 16.0, 19.0, 32.0, 28.0, 34.0, 47.0, 47.0, 59.0, 88.0, 180.0, 1634.0, 222.0, 108.0, 64.0, 49.0, 53.0, 40.0, 34.0, 35.0, 36.0, 19.0, 17.0, 19.0, 23.0, 13.0, 6.0, 5.0, 4.0, 0.0, 4.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-114.3125, -110.802734375, -107.29296875, -103.783203125, -100.2734375, -96.763671875, -93.25390625, -89.744140625, -86.234375, -82.724609375, -79.21484375, -75.705078125, -72.1953125, -68.685546875, -65.17578125, -61.666015625, -58.15625, -54.646484375, -51.13671875, -47.626953125, -44.1171875, -40.607421875, -37.09765625, -33.587890625, -30.078125, -26.568359375, -23.05859375, -19.548828125, -16.0390625, -12.529296875, -9.01953125, -5.509765625, -2.0, 1.509765625, 5.01953125, 8.529296875, 12.0390625, 15.548828125, 19.05859375, 22.568359375, 26.078125, 29.587890625, 33.09765625, 36.607421875, 40.1171875, 43.626953125, 47.13671875, 50.646484375, 54.15625, 57.666015625, 61.17578125, 64.685546875, 68.1953125, 71.705078125, 75.21484375, 78.724609375, 82.234375, 85.744140625, 89.25390625, 92.763671875, 96.2734375, 99.783203125, 103.29296875, 106.802734375, 110.3125]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 3.0, 4.0, 7.0, 5.0, 12.0, 20.0, 28.0, 41.0, 67.0, 88.0, 140.0, 256.0, 430.0, 1385.0, 21251.0, 3110447.0, 9551.0, 981.0, 366.0, 209.0, 132.0, 78.0, 61.0, 44.0, 28.0, 20.0, 9.0, 9.0, 11.0, 6.0, 3.0, 3.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-465.25, -451.32421875, -437.3984375, -423.47265625, -409.546875, -395.62109375, -381.6953125, -367.76953125, -353.84375, -339.91796875, -325.9921875, -312.06640625, -298.140625, -284.21484375, -270.2890625, -256.36328125, -242.4375, -228.51171875, -214.5859375, -200.66015625, -186.734375, -172.80859375, -158.8828125, -144.95703125, -131.03125, -117.10546875, -103.1796875, -89.25390625, -75.328125, -61.40234375, -47.4765625, -33.55078125, -19.625, -5.69921875, 8.2265625, 22.15234375, 36.078125, 50.00390625, 63.9296875, 77.85546875, 91.78125, 105.70703125, 119.6328125, 133.55859375, 147.484375, 161.41015625, 175.3359375, 189.26171875, 203.1875, 217.11328125, 231.0390625, 244.96484375, 258.890625, 272.81640625, 286.7421875, 300.66796875, 314.59375, 328.51953125, 342.4453125, 356.37109375, 370.296875, 384.22265625, 398.1484375, 412.07421875, 426.0]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 10.0, 23.0, 37.0, 47.0, 102.0, 179.0, 202.0, 135.0, 107.0, 76.0, 41.0, 21.0, 12.0, 8.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-538.4881591796875, -527.806396484375, -517.1246948242188, -506.4429626464844, -495.76123046875, -485.0794982910156, -474.39776611328125, -463.7160339355469, -453.0343017578125, -442.3525695800781, -431.67083740234375, -420.9891052246094, -410.307373046875, -399.6256408691406, -388.94390869140625, -378.2621765136719, -367.5804443359375, -356.8987121582031, -346.21697998046875, -335.5352478027344, -324.853515625, -314.1717834472656, -303.49005126953125, -292.8083190917969, -282.1265869140625, -271.4448547363281, -260.76312255859375, -250.08139038085938, -239.399658203125, -228.71792602539062, -218.03619384765625, -207.35446166992188, -196.67274475097656, -185.9910125732422, -175.3092803955078, -164.62754821777344, -153.94581604003906, -143.2640838623047, -132.5823516845703, -121.90061950683594, -111.21888732910156, -100.53715515136719, -89.85542297363281, -79.17369079589844, -68.49195861816406, -57.81022644042969, -47.12849426269531, -36.44676208496094, -25.765029907226562, -15.083297729492188, -4.4015655517578125, 6.2801666259765625, 16.961898803710938, 27.643630981445312, 38.32536315917969, 49.00709533691406, 59.68882751464844, 70.37055969238281, 81.05229187011719, 91.73402404785156, 102.41575622558594, 113.09748840332031, 123.77922058105469, 134.46095275878906, 145.14268493652344]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 6.0, 1.0, 5.0, 10.0, 9.0, 11.0, 3.0, 10.0, 15.0, 14.0, 19.0, 19.0, 17.0, 28.0, 22.0, 32.0, 33.0, 34.0, 40.0, 43.0, 41.0, 46.0, 55.0, 53.0, 57.0, 40.0, 46.0, 36.0, 27.0, 37.0, 26.0, 30.0, 29.0, 24.0, 13.0, 15.0, 13.0, 11.0, 1.0, 8.0, 5.0, 3.0, 3.0, 5.0, 7.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-306.19561767578125, -295.8919677734375, -285.58831787109375, -275.28466796875, -264.98101806640625, -254.67735290527344, -244.3737030029297, -234.07003784179688, -223.76638793945312, -213.46273803710938, -203.15908813476562, -192.85543823242188, -182.55177307128906, -172.2481231689453, -161.94447326660156, -151.64080810546875, -141.33717346191406, -131.0335235595703, -120.72986602783203, -110.42621612548828, -100.12255859375, -89.81890869140625, -79.5152587890625, -69.21160125732422, -58.90795135498047, -48.60429763793945, -38.30064392089844, -27.996994018554688, -17.693340301513672, -7.389686584472656, 2.9139633178710938, 13.217620849609375, 23.521270751953125, 33.82492446899414, 44.128578186035156, 54.432228088378906, 64.73588562011719, 75.03953552246094, 85.34318542480469, 95.64684295654297, 105.95049285888672, 116.25414276123047, 126.55780029296875, 136.8614501953125, 147.16510009765625, 157.46875, 167.77239990234375, 178.07606506347656, 188.3797149658203, 198.68336486816406, 208.9870147705078, 219.29067993164062, 229.59432983398438, 239.89797973632812, 250.20162963867188, 260.5052795410156, 270.8089294433594, 281.1125793457031, 291.4162292480469, 301.7198791503906, 312.0235290527344, 322.32720947265625, 332.630859375, 342.93450927734375, 353.2381591796875]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 8.0, 9.0, 9.0, 6.0, 14.0, 15.0, 18.0, 19.0, 24.0, 25.0, 26.0, 22.0, 31.0, 28.0, 39.0, 40.0, 43.0, 40.0, 54.0, 51.0, 45.0, 51.0, 45.0, 33.0, 40.0, 33.0, 28.0, 38.0, 21.0, 26.0, 21.0, 14.0, 27.0, 9.0, 14.0, 10.0, 6.0, 7.0, 3.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-58.3125, -56.513671875, -54.71484375, -52.916015625, -51.1171875, -49.318359375, -47.51953125, -45.720703125, -43.921875, -42.123046875, -40.32421875, -38.525390625, -36.7265625, -34.927734375, -33.12890625, -31.330078125, -29.53125, -27.732421875, -25.93359375, -24.134765625, -22.3359375, -20.537109375, -18.73828125, -16.939453125, -15.140625, -13.341796875, -11.54296875, -9.744140625, -7.9453125, -6.146484375, -4.34765625, -2.548828125, -0.75, 1.048828125, 2.84765625, 4.646484375, 6.4453125, 8.244140625, 10.04296875, 11.841796875, 13.640625, 15.439453125, 17.23828125, 19.037109375, 20.8359375, 22.634765625, 24.43359375, 26.232421875, 28.03125, 29.830078125, 31.62890625, 33.427734375, 35.2265625, 37.025390625, 38.82421875, 40.623046875, 42.421875, 44.220703125, 46.01953125, 47.818359375, 49.6171875, 51.416015625, 53.21484375, 55.013671875, 56.8125]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 5.0, 12.0, 11.0, 12.0, 18.0, 26.0, 41.0, 41.0, 56.0, 86.0, 116.0, 178.0, 250.0, 347.0, 476.0, 682.0, 1079.0, 1929.0, 3853.0, 8318.0, 23855.0, 253047.0, 3044260.0, 784909.0, 48079.0, 11341.0, 4739.0, 2347.0, 1438.0, 868.0, 560.0, 377.0, 264.0, 172.0, 133.0, 100.0, 74.0, 54.0, 34.0, 25.0, 14.0, 22.0, 7.0, 5.0, 9.0, 6.0, 4.0, 1.0, 0.0, 2.0, 4.0, 0.0, 3.0, 2.0], "bins": [-148.875, -144.3203125, -139.765625, -135.2109375, -130.65625, -126.1015625, -121.546875, -116.9921875, -112.4375, -107.8828125, -103.328125, -98.7734375, -94.21875, -89.6640625, -85.109375, -80.5546875, -76.0, -71.4453125, -66.890625, -62.3359375, -57.78125, -53.2265625, -48.671875, -44.1171875, -39.5625, -35.0078125, -30.453125, -25.8984375, -21.34375, -16.7890625, -12.234375, -7.6796875, -3.125, 1.4296875, 5.984375, 10.5390625, 15.09375, 19.6484375, 24.203125, 28.7578125, 33.3125, 37.8671875, 42.421875, 46.9765625, 51.53125, 56.0859375, 60.640625, 65.1953125, 69.75, 74.3046875, 78.859375, 83.4140625, 87.96875, 92.5234375, 97.078125, 101.6328125, 106.1875, 110.7421875, 115.296875, 119.8515625, 124.40625, 128.9609375, 133.515625, 138.0703125, 142.625]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 3.0, 5.0, 6.0, 10.0, 16.0, 23.0, 50.0, 74.0, 128.0, 216.0, 471.0, 1121.0, 1025.0, 454.0, 206.0, 106.0, 68.0, 34.0, 24.0, 14.0, 8.0, 4.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-101.375, -96.03125, -90.6875, -85.34375, -80.0, -74.65625, -69.3125, -63.96875, -58.625, -53.28125, -47.9375, -42.59375, -37.25, -31.90625, -26.5625, -21.21875, -15.875, -10.53125, -5.1875, 0.15625, 5.5, 10.84375, 16.1875, 21.53125, 26.875, 32.21875, 37.5625, 42.90625, 48.25, 53.59375, 58.9375, 64.28125, 69.625, 74.96875, 80.3125, 85.65625, 91.0, 96.34375, 101.6875, 107.03125, 112.375, 117.71875, 123.0625, 128.40625, 133.75, 139.09375, 144.4375, 149.78125, 155.125, 160.46875, 165.8125, 171.15625, 176.5, 181.84375, 187.1875, 192.53125, 197.875, 203.21875, 208.5625, 213.90625, 219.25, 224.59375, 229.9375, 235.28125, 240.625]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 2.0, 5.0, 10.0, 13.0, 29.0, 44.0, 96.0, 172.0, 471.0, 1515.0, 10387.0, 437298.0, 3716701.0, 23743.0, 2604.0, 653.0, 281.0, 129.0, 68.0, 34.0, 14.0, 10.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-558.0, -545.0703125, -532.140625, -519.2109375, -506.28125, -493.3515625, -480.421875, -467.4921875, -454.5625, -441.6328125, -428.703125, -415.7734375, -402.84375, -389.9140625, -376.984375, -364.0546875, -351.125, -338.1953125, -325.265625, -312.3359375, -299.40625, -286.4765625, -273.546875, -260.6171875, -247.6875, -234.7578125, -221.828125, -208.8984375, -195.96875, -183.0390625, -170.109375, -157.1796875, -144.25, -131.3203125, -118.390625, -105.4609375, -92.53125, -79.6015625, -66.671875, -53.7421875, -40.8125, -27.8828125, -14.953125, -2.0234375, 10.90625, 23.8359375, 36.765625, 49.6953125, 62.625, 75.5546875, 88.484375, 101.4140625, 114.34375, 127.2734375, 140.203125, 153.1328125, 166.0625, 178.9921875, 191.921875, 204.8515625, 217.78125, 230.7109375, 243.640625, 256.5703125, 269.5]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 17.0, 110.0, 550.0, 276.0, 51.0, 9.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1232.1685791015625, -1166.4124755859375, -1100.6563720703125, -1034.9002685546875, -969.1441650390625, -903.3880615234375, -837.6320190429688, -771.8759155273438, -706.1198120117188, -640.3637084960938, -574.6076049804688, -508.8515319824219, -443.0954284667969, -377.3393249511719, -311.583251953125, -245.8271484375, -180.071044921875, -114.31494903564453, -48.55885314941406, 17.197235107421875, 82.95333862304688, 148.70944213867188, 214.46551513671875, 280.22161865234375, 345.97772216796875, 411.73382568359375, 477.48992919921875, 543.2459716796875, 609.0020751953125, 674.7581787109375, 740.5142822265625, 806.2703857421875, 872.0263671875, 937.782470703125, 1003.53857421875, 1069.294677734375, 1135.05078125, 1200.806884765625, 1266.56298828125, 1332.319091796875, 1398.0751953125, 1463.831298828125, 1529.58740234375, 1595.343505859375, 1661.099609375, 1726.855712890625, 1792.61181640625, 1858.367919921875, 1924.1239013671875, 1989.8800048828125, 2055.635986328125, 2121.39208984375, 2187.148193359375, 2252.904296875, 2318.660400390625, 2384.41650390625, 2450.172607421875, 2515.9287109375, 2581.684814453125, 2647.44091796875, 2713.197021484375, 2778.953125, 2844.709228515625, 2910.46533203125, 2976.221435546875]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 5.0, 11.0, 8.0, 10.0, 15.0, 17.0, 15.0, 18.0, 19.0, 26.0, 28.0, 37.0, 39.0, 47.0, 27.0, 46.0, 46.0, 40.0, 33.0, 59.0, 39.0, 39.0, 31.0, 44.0, 40.0, 42.0, 28.0, 26.0, 25.0, 26.0, 20.0, 14.0, 14.0, 17.0, 5.0, 11.0, 7.0, 8.0, 9.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-365.26678466796875, -354.63714599609375, -344.0074768066406, -333.3778381347656, -322.7481994628906, -312.1185302734375, -301.4888916015625, -290.8592529296875, -280.2295837402344, -269.5999450683594, -258.97027587890625, -248.34063720703125, -237.7109832763672, -227.08132934570312, -216.45169067382812, -205.82203674316406, -195.19239807128906, -184.562744140625, -173.93310546875, -163.30345153808594, -152.67379760742188, -142.04415893554688, -131.4145050048828, -120.78485107421875, -110.15520477294922, -99.52555847167969, -88.89590454101562, -78.2662582397461, -67.63661193847656, -57.0069580078125, -46.37731170654297, -35.747657775878906, -25.118011474609375, -14.488362312316895, -3.858713150024414, 6.77093505859375, 17.400585174560547, 28.030235290527344, 38.659881591796875, 49.28953552246094, 59.91918182373047, 70.548828125, 81.17848205566406, 91.8081283569336, 102.43777465820312, 113.06742858886719, 123.69707489013672, 134.32672119140625, 144.9563751220703, 155.58602905273438, 166.21566772460938, 176.84532165527344, 187.4749755859375, 198.1046142578125, 208.73426818847656, 219.36392211914062, 229.99356079101562, 240.6232147216797, 251.2528533935547, 261.88250732421875, 272.51214599609375, 283.1418151855469, 293.7714538574219, 304.401123046875, 315.03076171875]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 7.0, 4.0, 2.0, 2.0, 5.0, 9.0, 11.0, 6.0, 16.0, 12.0, 21.0, 18.0, 30.0, 27.0, 30.0, 29.0, 28.0, 40.0, 36.0, 47.0, 52.0, 59.0, 42.0, 42.0, 57.0, 40.0, 44.0, 34.0, 30.0, 32.0, 36.0, 20.0, 19.0, 22.0, 25.0, 10.0, 14.0, 9.0, 9.0, 9.0, 9.0, 8.0, 4.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-59.0, -57.33203125, -55.6640625, -53.99609375, -52.328125, -50.66015625, -48.9921875, -47.32421875, -45.65625, -43.98828125, -42.3203125, -40.65234375, -38.984375, -37.31640625, -35.6484375, -33.98046875, -32.3125, -30.64453125, -28.9765625, -27.30859375, -25.640625, -23.97265625, -22.3046875, -20.63671875, -18.96875, -17.30078125, -15.6328125, -13.96484375, -12.296875, -10.62890625, -8.9609375, -7.29296875, -5.625, -3.95703125, -2.2890625, -0.62109375, 1.046875, 2.71484375, 4.3828125, 6.05078125, 7.71875, 9.38671875, 11.0546875, 12.72265625, 14.390625, 16.05859375, 17.7265625, 19.39453125, 21.0625, 22.73046875, 24.3984375, 26.06640625, 27.734375, 29.40234375, 31.0703125, 32.73828125, 34.40625, 36.07421875, 37.7421875, 39.41015625, 41.078125, 42.74609375, 44.4140625, 46.08203125, 47.75]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 13.0, 12.0, 24.0, 23.0, 36.0, 68.0, 112.0, 146.0, 271.0, 369.0, 578.0, 949.0, 1406.0, 2128.0, 3338.0, 5235.0, 8336.0, 13376.0, 22186.0, 36850.0, 64465.0, 128127.0, 291493.0, 231528.0, 101641.0, 54013.0, 31252.0, 18745.0, 11534.0, 7453.0, 4646.0, 2913.0, 1875.0, 1250.0, 752.0, 498.0, 346.0, 186.0, 128.0, 84.0, 63.0, 44.0, 33.0, 8.0, 8.0, 7.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-2.830078125, -2.7464599609375, -2.662841796875, -2.5792236328125, -2.49560546875, -2.4119873046875, -2.328369140625, -2.2447509765625, -2.1611328125, -2.0775146484375, -1.993896484375, -1.9102783203125, -1.82666015625, -1.7430419921875, -1.659423828125, -1.5758056640625, -1.4921875, -1.4085693359375, -1.324951171875, -1.2413330078125, -1.15771484375, -1.0740966796875, -0.990478515625, -0.9068603515625, -0.8232421875, -0.7396240234375, -0.656005859375, -0.5723876953125, -0.48876953125, -0.4051513671875, -0.321533203125, -0.2379150390625, -0.154296875, -0.0706787109375, 0.012939453125, 0.0965576171875, 0.18017578125, 0.2637939453125, 0.347412109375, 0.4310302734375, 0.5146484375, 0.5982666015625, 0.681884765625, 0.7655029296875, 0.84912109375, 0.9327392578125, 1.016357421875, 1.0999755859375, 1.18359375, 1.2672119140625, 1.350830078125, 1.4344482421875, 1.51806640625, 1.6016845703125, 1.685302734375, 1.7689208984375, 1.8525390625, 1.9361572265625, 2.019775390625, 2.1033935546875, 2.18701171875, 2.2706298828125, 2.354248046875, 2.4378662109375, 2.521484375]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 6.0, 3.0, 3.0, 7.0, 9.0, 6.0, 10.0, 14.0, 17.0, 28.0, 20.0, 23.0, 23.0, 36.0, 48.0, 27.0, 51.0, 36.0, 40.0, 32.0, 46.0, 1073.0, 45.0, 42.0, 47.0, 33.0, 30.0, 40.0, 26.0, 32.0, 29.0, 23.0, 23.0, 23.0, 11.0, 14.0, 4.0, 12.0, 7.0, 7.0, 7.0, 3.0, 6.0, 6.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-28.984375, -28.005615234375, -27.02685546875, -26.048095703125, -25.0693359375, -24.090576171875, -23.11181640625, -22.133056640625, -21.154296875, -20.175537109375, -19.19677734375, -18.218017578125, -17.2392578125, -16.260498046875, -15.28173828125, -14.302978515625, -13.32421875, -12.345458984375, -11.36669921875, -10.387939453125, -9.4091796875, -8.430419921875, -7.45166015625, -6.472900390625, -5.494140625, -4.515380859375, -3.53662109375, -2.557861328125, -1.5791015625, -0.600341796875, 0.37841796875, 1.357177734375, 2.3359375, 3.314697265625, 4.29345703125, 5.272216796875, 6.2509765625, 7.229736328125, 8.20849609375, 9.187255859375, 10.166015625, 11.144775390625, 12.12353515625, 13.102294921875, 14.0810546875, 15.059814453125, 16.03857421875, 17.017333984375, 17.99609375, 18.974853515625, 19.95361328125, 20.932373046875, 21.9111328125, 22.889892578125, 23.86865234375, 24.847412109375, 25.826171875, 26.804931640625, 27.78369140625, 28.762451171875, 29.7412109375, 30.719970703125, 31.69873046875, 32.677490234375, 33.65625]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 7.0, 6.0, 8.0, 12.0, 15.0, 34.0, 38.0, 61.0, 97.0, 136.0, 220.0, 320.0, 495.0, 729.0, 1080.0, 1748.0, 2697.0, 4377.0, 7022.0, 11741.0, 20179.0, 35614.0, 66501.0, 137076.0, 1366018.0, 225977.0, 97327.0, 49852.0, 27493.0, 15809.0, 9123.0, 5646.0, 3476.0, 2186.0, 1327.0, 857.0, 597.0, 434.0, 262.0, 154.0, 111.0, 82.0, 53.0, 43.0, 28.0, 26.0, 23.0, 7.0, 4.0, 3.0, 6.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.498046875, -2.4168701171875, -2.335693359375, -2.2545166015625, -2.17333984375, -2.0921630859375, -2.010986328125, -1.9298095703125, -1.8486328125, -1.7674560546875, -1.686279296875, -1.6051025390625, -1.52392578125, -1.4427490234375, -1.361572265625, -1.2803955078125, -1.19921875, -1.1180419921875, -1.036865234375, -0.9556884765625, -0.87451171875, -0.7933349609375, -0.712158203125, -0.6309814453125, -0.5498046875, -0.4686279296875, -0.387451171875, -0.3062744140625, -0.22509765625, -0.1439208984375, -0.062744140625, 0.0184326171875, 0.099609375, 0.1807861328125, 0.261962890625, 0.3431396484375, 0.42431640625, 0.5054931640625, 0.586669921875, 0.6678466796875, 0.7490234375, 0.8302001953125, 0.911376953125, 0.9925537109375, 1.07373046875, 1.1549072265625, 1.236083984375, 1.3172607421875, 1.3984375, 1.4796142578125, 1.560791015625, 1.6419677734375, 1.72314453125, 1.8043212890625, 1.885498046875, 1.9666748046875, 2.0478515625, 2.1290283203125, 2.210205078125, 2.2913818359375, 2.37255859375, 2.4537353515625, 2.534912109375, 2.6160888671875, 2.697265625]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 3.0, 6.0, 6.0, 0.0, 7.0, 4.0, 6.0, 2.0, 10.0, 10.0, 12.0, 16.0, 22.0, 28.0, 26.0, 49.0, 57.0, 87.0, 85.0, 110.0, 86.0, 78.0, 70.0, 40.0, 34.0, 30.0, 18.0, 13.0, 11.0, 12.0, 7.0, 6.0, 8.0, 10.0, 7.0, 5.0, 3.0, 4.0, 5.0, 3.0, 3.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0217437744140625, -0.021120548248291016, -0.02049732208251953, -0.019874095916748047, -0.019250869750976562, -0.018627643585205078, -0.018004417419433594, -0.01738119125366211, -0.016757965087890625, -0.01613473892211914, -0.015511512756347656, -0.014888286590576172, -0.014265060424804688, -0.013641834259033203, -0.013018608093261719, -0.012395381927490234, -0.01177215576171875, -0.011148929595947266, -0.010525703430175781, -0.009902477264404297, -0.009279251098632812, -0.008656024932861328, -0.008032798767089844, -0.007409572601318359, -0.006786346435546875, -0.006163120269775391, -0.005539894104003906, -0.004916667938232422, -0.0042934417724609375, -0.003670215606689453, -0.0030469894409179688, -0.0024237632751464844, -0.001800537109375, -0.0011773109436035156, -0.0005540847778320312, 6.914138793945312e-05, 0.0006923675537109375, 0.0013155937194824219, 0.0019388198852539062, 0.0025620460510253906, 0.003185272216796875, 0.0038084983825683594, 0.004431724548339844, 0.005054950714111328, 0.0056781768798828125, 0.006301403045654297, 0.006924629211425781, 0.007547855377197266, 0.00817108154296875, 0.008794307708740234, 0.009417533874511719, 0.010040760040283203, 0.010663986206054688, 0.011287212371826172, 0.011910438537597656, 0.01253366470336914, 0.013156890869140625, 0.01378011703491211, 0.014403343200683594, 0.015026569366455078, 0.015649795532226562, 0.016273021697998047, 0.01689624786376953, 0.017519474029541016, 0.0181427001953125]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 4.0, 4.0, 8.0, 9.0, 6.0, 8.0, 11.0, 11.0, 15.0, 23.0, 20.0, 32.0, 36.0, 40.0, 61.0, 83.0, 146.0, 208.0, 452.0, 2119.0, 117930.0, 919986.0, 5765.0, 651.0, 313.0, 179.0, 113.0, 69.0, 60.0, 41.0, 38.0, 17.0, 15.0, 15.0, 6.0, 12.0, 13.0, 10.0, 8.0, 7.0, 3.0, 6.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.323974609375, -0.3132362365722656, -0.30249786376953125, -0.2917594909667969, -0.2810211181640625, -0.2702827453613281, -0.25954437255859375, -0.24880599975585938, -0.238067626953125, -0.22732925415039062, -0.21659088134765625, -0.20585250854492188, -0.1951141357421875, -0.18437576293945312, -0.17363739013671875, -0.16289901733398438, -0.15216064453125, -0.14142227172851562, -0.13068389892578125, -0.11994552612304688, -0.1092071533203125, -0.09846878051757812, -0.08773040771484375, -0.07699203491210938, -0.066253662109375, -0.055515289306640625, -0.04477691650390625, -0.034038543701171875, -0.0233001708984375, -0.012561798095703125, -0.00182342529296875, 0.008914947509765625, 0.0196533203125, 0.030391693115234375, 0.04113006591796875, 0.051868438720703125, 0.0626068115234375, 0.07334518432617188, 0.08408355712890625, 0.09482192993164062, 0.105560302734375, 0.11629867553710938, 0.12703704833984375, 0.13777542114257812, 0.1485137939453125, 0.15925216674804688, 0.16999053955078125, 0.18072891235351562, 0.19146728515625, 0.20220565795898438, 0.21294403076171875, 0.22368240356445312, 0.2344207763671875, 0.24515914916992188, 0.25589752197265625, 0.2666358947753906, 0.277374267578125, 0.2881126403808594, 0.29885101318359375, 0.3095893859863281, 0.3203277587890625, 0.3310661315917969, 0.34180450439453125, 0.3525428771972656, 0.36328125]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 12.0, 4.0, 20.0, 15.0, 30.0, 60.0, 94.0, 139.0, 177.0, 164.0, 106.0, 60.0, 53.0, 25.0, 18.0, 6.0, 8.0, 7.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.014822851866483688, -0.014396080747246742, -0.01396931055933237, -0.013542540371418, -0.013115769252181053, -0.012688998132944107, -0.012262227945029736, -0.011835457757115364, -0.011408686637878418, -0.010981915518641472, -0.0105551453307271, -0.010128375142812729, -0.009701604023575783, -0.009274832904338837, -0.008848062716424465, -0.008421292528510094, -0.007994521409273148, -0.007567750755697489, -0.00714098010212183, -0.006714209448546171, -0.006287438794970512, -0.005860668141394854, -0.005433897487819195, -0.005007126834243536, -0.004580356180667877, -0.004153585527092218, -0.0037268148735165596, -0.003300044219940901, -0.002873273566365242, -0.002446502912789583, -0.0020197322592139244, -0.0015929616056382656, -0.0011661909520626068, -0.000739420298486948, -0.0003126496449112892, 0.00011412100866436958, 0.0005408916622400284, 0.0009676623158156872, 0.001394432969391346, 0.0018212036229670048, 0.0022479742765426636, 0.0026747449301183224, 0.003101515583693981, 0.00352828623726964, 0.003955056890845299, 0.0043818275444209576, 0.004808598197996616, 0.005235368851572275, 0.005662139505147934, 0.006088910158723593, 0.0065156808122992516, 0.00694245146587491, 0.007369222119450569, 0.007795992773026228, 0.008222763426601887, 0.008649533614516258, 0.009076304733753204, 0.00950307585299015, 0.009929846040904522, 0.010356616228818893, 0.01078338734805584, 0.011210158467292786, 0.011636928655207157, 0.012063698843121529, 0.012490469962358475]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [4.0, 4.0, 2.0, 1.0, 6.0, 9.0, 9.0, 9.0, 9.0, 14.0, 19.0, 24.0, 16.0, 24.0, 28.0, 27.0, 33.0, 42.0, 43.0, 31.0, 41.0, 51.0, 45.0, 50.0, 44.0, 47.0, 38.0, 38.0, 37.0, 36.0, 34.0, 31.0, 25.0, 20.0, 22.0, 17.0, 21.0, 13.0, 9.0, 14.0, 9.0, 5.0, 7.0, 5.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007675349712371826, -0.007352359592914581, -0.007029369473457336, -0.0067063793540000916, -0.006383389234542847, -0.006060399115085602, -0.005737408995628357, -0.005414418876171112, -0.005091428756713867, -0.004768438637256622, -0.0044454485177993774, -0.004122458398342133, -0.0037994682788848877, -0.003476478159427643, -0.003153488039970398, -0.002830497920513153, -0.002507507801055908, -0.0021845176815986633, -0.0018615275621414185, -0.0015385374426841736, -0.0012155473232269287, -0.0008925572037696838, -0.000569567084312439, -0.0002465769648551941, 7.641315460205078e-05, 0.00039940327405929565, 0.0007223933935165405, 0.0010453835129737854, 0.0013683736324310303, 0.0016913637518882751, 0.00201435387134552, 0.002337343990802765, 0.0026603341102600098, 0.0029833242297172546, 0.0033063143491744995, 0.0036293044686317444, 0.003952294588088989, 0.004275284707546234, 0.004598274827003479, 0.004921264946460724, 0.005244255065917969, 0.005567245185375214, 0.0058902353048324585, 0.006213225424289703, 0.006536215543746948, 0.006859205663204193, 0.007182195782661438, 0.007505185902118683, 0.007828176021575928, 0.008151166141033173, 0.008474156260490417, 0.008797146379947662, 0.009120136499404907, 0.009443126618862152, 0.009766116738319397, 0.010089106857776642, 0.010412096977233887, 0.010735087096691132, 0.011058077216148376, 0.011381067335605621, 0.011704057455062866, 0.012027047574520111, 0.012350037693977356, 0.0126730278134346, 0.012996017932891846]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 7.0, 4.0, 2.0, 2.0, 5.0, 9.0, 11.0, 6.0, 16.0, 12.0, 21.0, 18.0, 30.0, 27.0, 30.0, 29.0, 28.0, 40.0, 36.0, 47.0, 52.0, 59.0, 42.0, 42.0, 57.0, 40.0, 44.0, 34.0, 30.0, 32.0, 36.0, 20.0, 19.0, 22.0, 25.0, 10.0, 14.0, 9.0, 9.0, 9.0, 9.0, 8.0, 4.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-59.0, -57.33203125, -55.6640625, -53.99609375, -52.328125, -50.66015625, -48.9921875, -47.32421875, -45.65625, -43.98828125, -42.3203125, -40.65234375, -38.984375, -37.31640625, -35.6484375, -33.98046875, -32.3125, -30.64453125, -28.9765625, -27.30859375, -25.640625, -23.97265625, -22.3046875, -20.63671875, -18.96875, -17.30078125, -15.6328125, -13.96484375, -12.296875, -10.62890625, -8.9609375, -7.29296875, -5.625, -3.95703125, -2.2890625, -0.62109375, 1.046875, 2.71484375, 4.3828125, 6.05078125, 7.71875, 9.38671875, 11.0546875, 12.72265625, 14.390625, 16.05859375, 17.7265625, 19.39453125, 21.0625, 22.73046875, 24.3984375, 26.06640625, 27.734375, 29.40234375, 31.0703125, 32.73828125, 34.40625, 36.07421875, 37.7421875, 39.41015625, 41.078125, 42.74609375, 44.4140625, 46.08203125, 47.75]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 9.0, 6.0, 14.0, 22.0, 17.0, 43.0, 60.0, 86.0, 153.0, 240.0, 331.0, 531.0, 839.0, 1420.0, 2498.0, 4814.0, 10013.0, 27214.0, 104054.0, 602539.0, 219482.0, 45095.0, 14924.0, 6264.0, 3202.0, 1824.0, 1055.0, 630.0, 402.0, 269.0, 167.0, 110.0, 82.0, 50.0, 28.0, 24.0, 10.0, 9.0, 8.0, 7.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-92.5, -89.8349609375, -87.169921875, -84.5048828125, -81.83984375, -79.1748046875, -76.509765625, -73.8447265625, -71.1796875, -68.5146484375, -65.849609375, -63.1845703125, -60.51953125, -57.8544921875, -55.189453125, -52.5244140625, -49.859375, -47.1943359375, -44.529296875, -41.8642578125, -39.19921875, -36.5341796875, -33.869140625, -31.2041015625, -28.5390625, -25.8740234375, -23.208984375, -20.5439453125, -17.87890625, -15.2138671875, -12.548828125, -9.8837890625, -7.21875, -4.5537109375, -1.888671875, 0.7763671875, 3.44140625, 6.1064453125, 8.771484375, 11.4365234375, 14.1015625, 16.7666015625, 19.431640625, 22.0966796875, 24.76171875, 27.4267578125, 30.091796875, 32.7568359375, 35.421875, 38.0869140625, 40.751953125, 43.4169921875, 46.08203125, 48.7470703125, 51.412109375, 54.0771484375, 56.7421875, 59.4072265625, 62.072265625, 64.7373046875, 67.40234375, 70.0673828125, 72.732421875, 75.3974609375, 78.0625]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 5.0, 2.0, 7.0, 14.0, 14.0, 25.0, 20.0, 19.0, 29.0, 32.0, 33.0, 43.0, 52.0, 49.0, 86.0, 163.0, 1583.0, 356.0, 117.0, 74.0, 55.0, 45.0, 40.0, 30.0, 21.0, 27.0, 18.0, 11.0, 17.0, 12.0, 13.0, 7.0, 5.0, 4.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-122.4375, -118.5869140625, -114.736328125, -110.8857421875, -107.03515625, -103.1845703125, -99.333984375, -95.4833984375, -91.6328125, -87.7822265625, -83.931640625, -80.0810546875, -76.23046875, -72.3798828125, -68.529296875, -64.6787109375, -60.828125, -56.9775390625, -53.126953125, -49.2763671875, -45.42578125, -41.5751953125, -37.724609375, -33.8740234375, -30.0234375, -26.1728515625, -22.322265625, -18.4716796875, -14.62109375, -10.7705078125, -6.919921875, -3.0693359375, 0.78125, 4.6318359375, 8.482421875, 12.3330078125, 16.18359375, 20.0341796875, 23.884765625, 27.7353515625, 31.5859375, 35.4365234375, 39.287109375, 43.1376953125, 46.98828125, 50.8388671875, 54.689453125, 58.5400390625, 62.390625, 66.2412109375, 70.091796875, 73.9423828125, 77.79296875, 81.6435546875, 85.494140625, 89.3447265625, 93.1953125, 97.0458984375, 100.896484375, 104.7470703125, 108.59765625, 112.4482421875, 116.298828125, 120.1494140625, 124.0]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 11.0, 4.0, 7.0, 11.0, 15.0, 25.0, 24.0, 22.0, 50.0, 68.0, 109.0, 183.0, 358.0, 993.0, 9459.0, 3114014.0, 18042.0, 1274.0, 437.0, 196.0, 129.0, 66.0, 44.0, 45.0, 27.0, 19.0, 25.0, 12.0, 10.0, 6.0, 2.0, 4.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-360.5, -349.43359375, -338.3671875, -327.30078125, -316.234375, -305.16796875, -294.1015625, -283.03515625, -271.96875, -260.90234375, -249.8359375, -238.76953125, -227.703125, -216.63671875, -205.5703125, -194.50390625, -183.4375, -172.37109375, -161.3046875, -150.23828125, -139.171875, -128.10546875, -117.0390625, -105.97265625, -94.90625, -83.83984375, -72.7734375, -61.70703125, -50.640625, -39.57421875, -28.5078125, -17.44140625, -6.375, 4.69140625, 15.7578125, 26.82421875, 37.890625, 48.95703125, 60.0234375, 71.08984375, 82.15625, 93.22265625, 104.2890625, 115.35546875, 126.421875, 137.48828125, 148.5546875, 159.62109375, 170.6875, 181.75390625, 192.8203125, 203.88671875, 214.953125, 226.01953125, 237.0859375, 248.15234375, 259.21875, 270.28515625, 281.3515625, 292.41796875, 303.484375, 314.55078125, 325.6171875, 336.68359375, 347.75]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 32.0, 367.0, 536.0, 70.0, 7.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-130.91610717773438, -105.24034118652344, -79.56456756591797, -53.8887939453125, -28.213027954101562, -2.537261962890625, 23.138519287109375, 48.81428527832031, 74.49005126953125, 100.16581726074219, 125.84159088134766, 151.51736450195312, 177.19313049316406, 202.868896484375, 228.544677734375, 254.22044372558594, 279.8962097167969, 305.5719909667969, 331.24774169921875, 356.92352294921875, 382.59930419921875, 408.2750549316406, 433.9508361816406, 459.6265869140625, 485.3023681640625, 510.9781494140625, 536.6539306640625, 562.3297119140625, 588.0054321289062, 613.6812133789062, 639.3569946289062, 665.0327758789062, 690.70849609375, 716.38427734375, 742.06005859375, 767.73583984375, 793.4115600585938, 819.0873413085938, 844.7631225585938, 870.4389038085938, 896.1146240234375, 921.7904052734375, 947.4661865234375, 973.1419677734375, 998.8176879882812, 1024.493408203125, 1050.169189453125, 1075.844970703125, 1101.520751953125, 1127.196533203125, 1152.872314453125, 1178.548095703125, 1204.223876953125, 1229.899658203125, 1255.575439453125, 1281.2510986328125, 1306.927001953125, 1332.602783203125, 1358.278564453125, 1383.954345703125, 1409.630126953125, 1435.305908203125, 1460.981689453125, 1486.6573486328125, 1512.3331298828125]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 8.0, 4.0, 4.0, 8.0, 6.0, 14.0, 10.0, 12.0, 14.0, 28.0, 22.0, 23.0, 29.0, 30.0, 34.0, 28.0, 33.0, 44.0, 43.0, 33.0, 38.0, 43.0, 33.0, 32.0, 46.0, 46.0, 40.0, 25.0, 36.0, 32.0, 30.0, 21.0, 21.0, 31.0, 18.0, 12.0, 16.0, 13.0, 4.0, 14.0, 4.0, 3.0, 8.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-214.01531982421875, -207.11715698242188, -200.21900939941406, -193.32086181640625, -186.42269897460938, -179.5245361328125, -172.6263885498047, -165.72824096679688, -158.830078125, -151.93191528320312, -145.0337677001953, -138.1356201171875, -131.23745727539062, -124.33930206298828, -117.44114685058594, -110.5429916381836, -103.64483642578125, -96.7466812133789, -89.84852600097656, -82.95037078857422, -76.05221557617188, -69.15406036376953, -62.25590515136719, -55.357749938964844, -48.4595947265625, -41.561439514160156, -34.66328430175781, -27.76512908935547, -20.866973876953125, -13.968818664550781, -7.0706634521484375, -0.17250823974609375, 6.7256317138671875, 13.623786926269531, 20.521942138671875, 27.42009735107422, 34.31825256347656, 41.216407775878906, 48.11456298828125, 55.012718200683594, 61.91087341308594, 68.80902862548828, 75.70718383789062, 82.60533905029297, 89.50349426269531, 96.40164947509766, 103.2998046875, 110.19795989990234, 117.09611511230469, 123.99427032470703, 130.89242553710938, 137.79058837890625, 144.68873596191406, 151.58688354492188, 158.48504638671875, 165.38320922851562, 172.28135681152344, 179.17950439453125, 186.07766723632812, 192.975830078125, 199.8739776611328, 206.77212524414062, 213.6702880859375, 220.56845092773438, 227.4665985107422]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 4.0, 4.0, 8.0, 10.0, 11.0, 13.0, 20.0, 18.0, 23.0, 29.0, 31.0, 38.0, 33.0, 40.0, 36.0, 38.0, 47.0, 44.0, 54.0, 50.0, 48.0, 57.0, 40.0, 34.0, 39.0, 29.0, 33.0, 20.0, 25.0, 21.0, 31.0, 12.0, 16.0, 9.0, 12.0, 4.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-59.375, -57.5078125, -55.640625, -53.7734375, -51.90625, -50.0390625, -48.171875, -46.3046875, -44.4375, -42.5703125, -40.703125, -38.8359375, -36.96875, -35.1015625, -33.234375, -31.3671875, -29.5, -27.6328125, -25.765625, -23.8984375, -22.03125, -20.1640625, -18.296875, -16.4296875, -14.5625, -12.6953125, -10.828125, -8.9609375, -7.09375, -5.2265625, -3.359375, -1.4921875, 0.375, 2.2421875, 4.109375, 5.9765625, 7.84375, 9.7109375, 11.578125, 13.4453125, 15.3125, 17.1796875, 19.046875, 20.9140625, 22.78125, 24.6484375, 26.515625, 28.3828125, 30.25, 32.1171875, 33.984375, 35.8515625, 37.71875, 39.5859375, 41.453125, 43.3203125, 45.1875, 47.0546875, 48.921875, 50.7890625, 52.65625, 54.5234375, 56.390625, 58.2578125, 60.125]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 5.0, 1.0, 5.0, 7.0, 11.0, 10.0, 15.0, 19.0, 19.0, 46.0, 52.0, 81.0, 126.0, 149.0, 239.0, 374.0, 761.0, 1483.0, 3446.0, 10033.0, 39092.0, 1751273.0, 2322910.0, 46051.0, 10882.0, 3794.0, 1508.0, 731.0, 392.0, 240.0, 148.0, 95.0, 76.0, 54.0, 58.0, 27.0, 19.0, 24.0, 9.0, 11.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-300.5, -291.12109375, -281.7421875, -272.36328125, -262.984375, -253.60546875, -244.2265625, -234.84765625, -225.46875, -216.08984375, -206.7109375, -197.33203125, -187.953125, -178.57421875, -169.1953125, -159.81640625, -150.4375, -141.05859375, -131.6796875, -122.30078125, -112.921875, -103.54296875, -94.1640625, -84.78515625, -75.40625, -66.02734375, -56.6484375, -47.26953125, -37.890625, -28.51171875, -19.1328125, -9.75390625, -0.375, 9.00390625, 18.3828125, 27.76171875, 37.140625, 46.51953125, 55.8984375, 65.27734375, 74.65625, 84.03515625, 93.4140625, 102.79296875, 112.171875, 121.55078125, 130.9296875, 140.30859375, 149.6875, 159.06640625, 168.4453125, 177.82421875, 187.203125, 196.58203125, 205.9609375, 215.33984375, 224.71875, 234.09765625, 243.4765625, 252.85546875, 262.234375, 271.61328125, 280.9921875, 290.37109375, 299.75]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 4.0, 8.0, 14.0, 14.0, 16.0, 18.0, 37.0, 48.0, 72.0, 101.0, 147.0, 230.0, 413.0, 723.0, 940.0, 477.0, 272.0, 164.0, 110.0, 72.0, 45.0, 34.0, 22.0, 21.0, 15.0, 12.0, 10.0, 9.0, 6.0, 7.0, 4.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-174.625, -169.669921875, -164.71484375, -159.759765625, -154.8046875, -149.849609375, -144.89453125, -139.939453125, -134.984375, -130.029296875, -125.07421875, -120.119140625, -115.1640625, -110.208984375, -105.25390625, -100.298828125, -95.34375, -90.388671875, -85.43359375, -80.478515625, -75.5234375, -70.568359375, -65.61328125, -60.658203125, -55.703125, -50.748046875, -45.79296875, -40.837890625, -35.8828125, -30.927734375, -25.97265625, -21.017578125, -16.0625, -11.107421875, -6.15234375, -1.197265625, 3.7578125, 8.712890625, 13.66796875, 18.623046875, 23.578125, 28.533203125, 33.48828125, 38.443359375, 43.3984375, 48.353515625, 53.30859375, 58.263671875, 63.21875, 68.173828125, 73.12890625, 78.083984375, 83.0390625, 87.994140625, 92.94921875, 97.904296875, 102.859375, 107.814453125, 112.76953125, 117.724609375, 122.6796875, 127.634765625, 132.58984375, 137.544921875, 142.5]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 4.0, 3.0, 2.0, 12.0, 6.0, 16.0, 21.0, 26.0, 30.0, 41.0, 79.0, 86.0, 129.0, 178.0, 306.0, 428.0, 640.0, 958.0, 1589.0, 2536.0, 4349.0, 7745.0, 14676.0, 30259.0, 73729.0, 236167.0, 2034237.0, 1464963.0, 197486.0, 65020.0, 27341.0, 13124.0, 7242.0, 4007.0, 2476.0, 1529.0, 969.0, 576.0, 428.0, 270.0, 168.0, 130.0, 80.0, 66.0, 57.0, 35.0, 19.0, 20.0, 8.0, 8.0, 6.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-94.4375, -91.384765625, -88.33203125, -85.279296875, -82.2265625, -79.173828125, -76.12109375, -73.068359375, -70.015625, -66.962890625, -63.91015625, -60.857421875, -57.8046875, -54.751953125, -51.69921875, -48.646484375, -45.59375, -42.541015625, -39.48828125, -36.435546875, -33.3828125, -30.330078125, -27.27734375, -24.224609375, -21.171875, -18.119140625, -15.06640625, -12.013671875, -8.9609375, -5.908203125, -2.85546875, 0.197265625, 3.25, 6.302734375, 9.35546875, 12.408203125, 15.4609375, 18.513671875, 21.56640625, 24.619140625, 27.671875, 30.724609375, 33.77734375, 36.830078125, 39.8828125, 42.935546875, 45.98828125, 49.041015625, 52.09375, 55.146484375, 58.19921875, 61.251953125, 64.3046875, 67.357421875, 70.41015625, 73.462890625, 76.515625, 79.568359375, 82.62109375, 85.673828125, 88.7265625, 91.779296875, 94.83203125, 97.884765625, 100.9375]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 3.0, 5.0, 16.0, 4.0, 15.0, 20.0, 19.0, 31.0, 46.0, 80.0, 113.0, 148.0, 158.0, 102.0, 74.0, 54.0, 35.0, 24.0, 13.0, 15.0, 8.0, 5.0, 4.0, 8.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0], "bins": [-1648.35986328125, -1612.5533447265625, -1576.746826171875, -1540.9403076171875, -1505.1337890625, -1469.3272705078125, -1433.520751953125, -1397.714111328125, -1361.90771484375, -1326.1011962890625, -1290.294677734375, -1254.4881591796875, -1218.681640625, -1182.8751220703125, -1147.068603515625, -1111.261962890625, -1075.4554443359375, -1039.64892578125, -1003.8424072265625, -968.035888671875, -932.2293701171875, -896.4228515625, -860.6162719726562, -824.8097534179688, -789.0032348632812, -753.1967163085938, -717.3901977539062, -681.5836791992188, -645.777099609375, -609.9705810546875, -574.1640625, -538.3575439453125, -502.55108642578125, -466.74456787109375, -430.93804931640625, -395.1315002441406, -359.3249816894531, -323.5184631347656, -287.7119140625, -251.9053955078125, -216.098876953125, -180.2923583984375, -144.48582458496094, -108.6792984008789, -72.87277221679688, -37.066253662109375, -1.2597198486328125, 34.54681396484375, 70.35333251953125, 106.15985870361328, 141.9663848876953, 177.77291870117188, 213.57943725585938, 249.38595581054688, 285.1925048828125, 320.9990234375, 356.8055419921875, 392.612060546875, 428.4185791015625, 464.2251281738281, 500.0316467285156, 535.838134765625, 571.6447143554688, 607.4512329101562, 643.2577514648438]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 6.0, 2.0, 0.0, 7.0, 5.0, 8.0, 10.0, 13.0, 16.0, 16.0, 18.0, 26.0, 18.0, 35.0, 25.0, 19.0, 40.0, 41.0, 31.0, 48.0, 64.0, 40.0, 39.0, 41.0, 32.0, 42.0, 50.0, 35.0, 41.0, 28.0, 38.0, 24.0, 27.0, 26.0, 16.0, 14.0, 15.0, 15.0, 9.0, 7.0, 6.0, 3.0, 6.0, 2.0, 4.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-533.291259765625, -515.253662109375, -497.2160339355469, -479.1784362792969, -461.14080810546875, -443.10321044921875, -425.06561279296875, -407.02801513671875, -388.9903869628906, -370.9527893066406, -352.9151611328125, -334.8775634765625, -316.8399658203125, -298.8023376464844, -280.7647399902344, -262.72711181640625, -244.68951416015625, -226.6519012451172, -208.61428833007812, -190.57669067382812, -172.53907775878906, -154.50146484375, -136.4638671875, -118.42625427246094, -100.38864135742188, -82.35102844238281, -64.31342315673828, -46.275814056396484, -28.238204956054688, -10.200592041015625, 7.837013244628906, 25.874618530273438, 43.91229248046875, 61.94990158081055, 79.98751068115234, 98.02511596679688, 116.06272888183594, 134.100341796875, 152.137939453125, 170.17555236816406, 188.21316528320312, 206.2507781982422, 224.28839111328125, 242.32598876953125, 260.36358642578125, 278.4012145996094, 296.4388122558594, 314.4764404296875, 332.5140380859375, 350.5516357421875, 368.5892639160156, 386.6268615722656, 404.66448974609375, 422.70208740234375, 440.73968505859375, 458.77728271484375, 476.8149108886719, 494.8525085449219, 512.89013671875, 530.927734375, 548.96533203125, 567.0029296875, 585.0405883789062, 603.0781860351562, 621.1157836914062]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 3.0, 5.0, 9.0, 9.0, 14.0, 16.0, 13.0, 19.0, 15.0, 23.0, 26.0, 22.0, 29.0, 31.0, 37.0, 37.0, 41.0, 50.0, 60.0, 41.0, 50.0, 33.0, 50.0, 41.0, 38.0, 38.0, 36.0, 29.0, 27.0, 34.0, 20.0, 18.0, 19.0, 11.0, 15.0, 7.0, 11.0, 7.0, 6.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-920.5, -890.90625, -861.3125, -831.71875, -802.125, -772.53125, -742.9375, -713.34375, -683.75, -654.15625, -624.5625, -594.96875, -565.375, -535.78125, -506.1875, -476.59375, -447.0, -417.40625, -387.8125, -358.21875, -328.625, -299.03125, -269.4375, -239.84375, -210.25, -180.65625, -151.0625, -121.46875, -91.875, -62.28125, -32.6875, -3.09375, 26.5, 56.09375, 85.6875, 115.28125, 144.875, 174.46875, 204.0625, 233.65625, 263.25, 292.84375, 322.4375, 352.03125, 381.625, 411.21875, 440.8125, 470.40625, 500.0, 529.59375, 559.1875, 588.78125, 618.375, 647.96875, 677.5625, 707.15625, 736.75, 766.34375, 795.9375, 825.53125, 855.125, 884.71875, 914.3125, 943.90625, 973.5]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 5.0, 8.0, 2.0, 9.0, 12.0, 19.0, 19.0, 43.0, 56.0, 69.0, 97.0, 164.0, 256.0, 367.0, 505.0, 818.0, 1246.0, 1950.0, 2927.0, 4547.0, 7066.0, 11052.0, 17783.0, 28347.0, 46726.0, 82804.0, 175213.0, 322555.0, 153438.0, 75195.0, 42968.0, 26551.0, 16423.0, 10434.0, 6612.0, 4255.0, 2684.0, 1835.0, 1145.0, 770.0, 556.0, 331.0, 207.0, 153.0, 114.0, 84.0, 38.0, 34.0, 29.0, 16.0, 15.0, 4.0, 5.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-50.625, -48.9609375, -47.296875, -45.6328125, -43.96875, -42.3046875, -40.640625, -38.9765625, -37.3125, -35.6484375, -33.984375, -32.3203125, -30.65625, -28.9921875, -27.328125, -25.6640625, -24.0, -22.3359375, -20.671875, -19.0078125, -17.34375, -15.6796875, -14.015625, -12.3515625, -10.6875, -9.0234375, -7.359375, -5.6953125, -4.03125, -2.3671875, -0.703125, 0.9609375, 2.625, 4.2890625, 5.953125, 7.6171875, 9.28125, 10.9453125, 12.609375, 14.2734375, 15.9375, 17.6015625, 19.265625, 20.9296875, 22.59375, 24.2578125, 25.921875, 27.5859375, 29.25, 30.9140625, 32.578125, 34.2421875, 35.90625, 37.5703125, 39.234375, 40.8984375, 42.5625, 44.2265625, 45.890625, 47.5546875, 49.21875, 50.8828125, 52.546875, 54.2109375, 55.875]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 5.0, 7.0, 7.0, 6.0, 9.0, 4.0, 6.0, 15.0, 10.0, 13.0, 20.0, 11.0, 26.0, 23.0, 23.0, 22.0, 28.0, 30.0, 30.0, 34.0, 29.0, 32.0, 23.0, 42.0, 31.0, 1069.0, 42.0, 38.0, 30.0, 23.0, 36.0, 35.0, 32.0, 28.0, 20.0, 20.0, 16.0, 23.0, 18.0, 17.0, 10.0, 14.0, 11.0, 14.0, 8.0, 10.0, 8.0, 10.0, 6.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-512.0, -496.5078125, -481.015625, -465.5234375, -450.03125, -434.5390625, -419.046875, -403.5546875, -388.0625, -372.5703125, -357.078125, -341.5859375, -326.09375, -310.6015625, -295.109375, -279.6171875, -264.125, -248.6328125, -233.140625, -217.6484375, -202.15625, -186.6640625, -171.171875, -155.6796875, -140.1875, -124.6953125, -109.203125, -93.7109375, -78.21875, -62.7265625, -47.234375, -31.7421875, -16.25, -0.7578125, 14.734375, 30.2265625, 45.71875, 61.2109375, 76.703125, 92.1953125, 107.6875, 123.1796875, 138.671875, 154.1640625, 169.65625, 185.1484375, 200.640625, 216.1328125, 231.625, 247.1171875, 262.609375, 278.1015625, 293.59375, 309.0859375, 324.578125, 340.0703125, 355.5625, 371.0546875, 386.546875, 402.0390625, 417.53125, 433.0234375, 448.515625, 464.0078125, 479.5]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 4.0, 6.0, 4.0, 13.0, 16.0, 19.0, 30.0, 40.0, 71.0, 115.0, 128.0, 202.0, 311.0, 418.0, 662.0, 915.0, 1363.0, 2153.0, 3124.0, 4673.0, 6814.0, 10133.0, 15228.0, 23142.0, 36628.0, 60467.0, 109757.0, 955601.0, 593071.0, 107422.0, 59821.0, 35889.0, 22916.0, 15148.0, 10041.0, 6748.0, 4500.0, 3091.0, 2093.0, 1361.0, 976.0, 629.0, 439.0, 340.0, 193.0, 139.0, 99.0, 67.0, 45.0, 28.0, 24.0, 12.0, 9.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-38.15625, -36.9248046875, -35.693359375, -34.4619140625, -33.23046875, -31.9990234375, -30.767578125, -29.5361328125, -28.3046875, -27.0732421875, -25.841796875, -24.6103515625, -23.37890625, -22.1474609375, -20.916015625, -19.6845703125, -18.453125, -17.2216796875, -15.990234375, -14.7587890625, -13.52734375, -12.2958984375, -11.064453125, -9.8330078125, -8.6015625, -7.3701171875, -6.138671875, -4.9072265625, -3.67578125, -2.4443359375, -1.212890625, 0.0185546875, 1.25, 2.4814453125, 3.712890625, 4.9443359375, 6.17578125, 7.4072265625, 8.638671875, 9.8701171875, 11.1015625, 12.3330078125, 13.564453125, 14.7958984375, 16.02734375, 17.2587890625, 18.490234375, 19.7216796875, 20.953125, 22.1845703125, 23.416015625, 24.6474609375, 25.87890625, 27.1103515625, 28.341796875, 29.5732421875, 30.8046875, 32.0361328125, 33.267578125, 34.4990234375, 35.73046875, 36.9619140625, 38.193359375, 39.4248046875, 40.65625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 10.0, 13.0, 13.0, 9.0, 6.0, 18.0, 24.0, 35.0, 28.0, 51.0, 53.0, 62.0, 93.0, 115.0, 122.0, 63.0, 55.0, 48.0, 43.0, 34.0, 26.0, 11.0, 15.0, 15.0, 5.0, 9.0, 4.0, 3.0, 3.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.74609375, -0.7225189208984375, -0.698944091796875, -0.6753692626953125, -0.65179443359375, -0.6282196044921875, -0.604644775390625, -0.5810699462890625, -0.5574951171875, -0.5339202880859375, -0.510345458984375, -0.4867706298828125, -0.46319580078125, -0.4396209716796875, -0.416046142578125, -0.3924713134765625, -0.368896484375, -0.3453216552734375, -0.321746826171875, -0.2981719970703125, -0.27459716796875, -0.2510223388671875, -0.227447509765625, -0.2038726806640625, -0.1802978515625, -0.1567230224609375, -0.133148193359375, -0.1095733642578125, -0.08599853515625, -0.0624237060546875, -0.038848876953125, -0.0152740478515625, 0.00830078125, 0.0318756103515625, 0.055450439453125, 0.0790252685546875, 0.10260009765625, 0.1261749267578125, 0.149749755859375, 0.1733245849609375, 0.1968994140625, 0.2204742431640625, 0.244049072265625, 0.2676239013671875, 0.29119873046875, 0.3147735595703125, 0.338348388671875, 0.3619232177734375, 0.385498046875, 0.4090728759765625, 0.432647705078125, 0.4562225341796875, 0.47979736328125, 0.5033721923828125, 0.526947021484375, 0.5505218505859375, 0.5740966796875, 0.5976715087890625, 0.621246337890625, 0.6448211669921875, 0.66839599609375, 0.6919708251953125, 0.715545654296875, 0.7391204833984375, 0.7626953125]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 7.0, 7.0, 10.0, 10.0, 14.0, 13.0, 38.0, 48.0, 106.0, 149.0, 233.0, 446.0, 795.0, 1572.0, 3228.0, 7210.0, 17192.0, 47626.0, 179364.0, 595573.0, 130789.0, 38184.0, 14056.0, 6134.0, 2693.0, 1320.0, 687.0, 381.0, 235.0, 144.0, 98.0, 68.0, 46.0, 23.0, 19.0, 7.0, 5.0, 4.0, 4.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.978515625, -3.855712890625, -3.73291015625, -3.610107421875, -3.4873046875, -3.364501953125, -3.24169921875, -3.118896484375, -2.99609375, -2.873291015625, -2.75048828125, -2.627685546875, -2.5048828125, -2.382080078125, -2.25927734375, -2.136474609375, -2.013671875, -1.890869140625, -1.76806640625, -1.645263671875, -1.5224609375, -1.399658203125, -1.27685546875, -1.154052734375, -1.03125, -0.908447265625, -0.78564453125, -0.662841796875, -0.5400390625, -0.417236328125, -0.29443359375, -0.171630859375, -0.048828125, 0.073974609375, 0.19677734375, 0.319580078125, 0.4423828125, 0.565185546875, 0.68798828125, 0.810791015625, 0.93359375, 1.056396484375, 1.17919921875, 1.302001953125, 1.4248046875, 1.547607421875, 1.67041015625, 1.793212890625, 1.916015625, 2.038818359375, 2.16162109375, 2.284423828125, 2.4072265625, 2.530029296875, 2.65283203125, 2.775634765625, 2.8984375, 3.021240234375, 3.14404296875, 3.266845703125, 3.3896484375, 3.512451171875, 3.63525390625, 3.758056640625, 3.880859375]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 2.0, 3.0, 7.0, 4.0, 3.0, 11.0, 7.0, 9.0, 20.0, 11.0, 28.0, 24.0, 30.0, 54.0, 57.0, 86.0, 105.0, 122.0, 107.0, 104.0, 41.0, 48.0, 29.0, 24.0, 21.0, 7.0, 17.0, 7.0, 9.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8118162751197815, -0.789677083492279, -0.7675378322601318, -0.7453986406326294, -0.7232593894004822, -0.7011201977729797, -0.6789809465408325, -0.6568417549133301, -0.6347025036811829, -0.6125633120536804, -0.5904240608215332, -0.5682848691940308, -0.5461456179618835, -0.5240064263343811, -0.5018671751022339, -0.47972798347473145, -0.4575887620449066, -0.4354495406150818, -0.41331031918525696, -0.39117109775543213, -0.3690318763256073, -0.34689265489578247, -0.32475346326828003, -0.3026142120361328, -0.28047502040863037, -0.25833579897880554, -0.2361965775489807, -0.21405735611915588, -0.19191813468933105, -0.16977891325950623, -0.1476397067308426, -0.12550048530101776, -0.10336124897003174, -0.08122202754020691, -0.05908280983567238, -0.03694359213113785, -0.014804370701313019, 0.00733485072851181, 0.029474064707756042, 0.05161328613758087, 0.0737525075674057, 0.09589172899723053, 0.11803095042705536, 0.140170156955719, 0.16230937838554382, 0.18444859981536865, 0.20658782124519348, 0.2287270426750183, 0.25086626410484314, 0.27300548553466797, 0.2951447069644928, 0.3172839283943176, 0.33942314982414246, 0.3615623712539673, 0.3837015628814697, 0.40584081411361694, 0.4279800057411194, 0.4501192271709442, 0.47225844860076904, 0.49439767003059387, 0.5165368914604187, 0.5386760830879211, 0.5608153343200684, 0.5829545259475708, 0.605093777179718]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 7.0, 3.0, 9.0, 5.0, 15.0, 16.0, 22.0, 7.0, 29.0, 19.0, 33.0, 33.0, 28.0, 27.0, 43.0, 42.0, 43.0, 38.0, 43.0, 29.0, 43.0, 34.0, 46.0, 52.0, 39.0, 28.0, 33.0, 26.0, 26.0, 25.0, 35.0, 24.0, 13.0, 16.0, 16.0, 16.0, 15.0, 10.0, 7.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0], "bins": [-0.4518786072731018, -0.438330739736557, -0.4247828423976898, -0.411234974861145, -0.3976871073246002, -0.3841392397880554, -0.37059134244918823, -0.35704347491264343, -0.34349560737609863, -0.32994773983955383, -0.31639984250068665, -0.30285197496414185, -0.28930410742759705, -0.27575623989105225, -0.26220834255218506, -0.24866047501564026, -0.23511257767677307, -0.22156469523906708, -0.20801682770252228, -0.19446894526481628, -0.18092107772827148, -0.1673731952905655, -0.1538253128528595, -0.1402774453163147, -0.1267295628786087, -0.1131816878914833, -0.09963381290435791, -0.08608593046665192, -0.07253805547952652, -0.05899018049240112, -0.04544229805469513, -0.03189442306756973, -0.018346548080444336, -0.00479867123067379, 0.008749205619096756, 0.02229708433151245, 0.03584495931863785, 0.049392834305763245, 0.06294071674346924, 0.07648859173059464, 0.09003646671772003, 0.10358434170484543, 0.11713221669197083, 0.13068009912967682, 0.1442279815673828, 0.1577758491039276, 0.1713237315416336, 0.1848716139793396, 0.1984194815158844, 0.2119673639535904, 0.2255152314901352, 0.2390631139278412, 0.252610981464386, 0.2661588788032532, 0.279706746339798, 0.2932546138763428, 0.30680251121520996, 0.32035037875175476, 0.33389827609062195, 0.34744614362716675, 0.36099401116371155, 0.37454187870025635, 0.38808977603912354, 0.40163764357566833, 0.41518551111221313]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 3.0, 6.0, 8.0, 9.0, 14.0, 16.0, 13.0, 19.0, 16.0, 23.0, 25.0, 23.0, 29.0, 30.0, 38.0, 38.0, 39.0, 53.0, 56.0, 43.0, 49.0, 32.0, 52.0, 41.0, 37.0, 39.0, 34.0, 30.0, 27.0, 34.0, 19.0, 19.0, 18.0, 14.0, 13.0, 6.0, 12.0, 6.0, 7.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-919.0, -889.4375, -859.875, -830.3125, -800.75, -771.1875, -741.625, -712.0625, -682.5, -652.9375, -623.375, -593.8125, -564.25, -534.6875, -505.125, -475.5625, -446.0, -416.4375, -386.875, -357.3125, -327.75, -298.1875, -268.625, -239.0625, -209.5, -179.9375, -150.375, -120.8125, -91.25, -61.6875, -32.125, -2.5625, 27.0, 56.5625, 86.125, 115.6875, 145.25, 174.8125, 204.375, 233.9375, 263.5, 293.0625, 322.625, 352.1875, 381.75, 411.3125, 440.875, 470.4375, 500.0, 529.5625, 559.125, 588.6875, 618.25, 647.8125, 677.375, 706.9375, 736.5, 766.0625, 795.625, 825.1875, 854.75, 884.3125, 913.875, 943.4375, 973.0]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 2.0, 2.0, 5.0, 4.0, 12.0, 16.0, 20.0, 24.0, 45.0, 46.0, 54.0, 100.0, 159.0, 214.0, 288.0, 409.0, 669.0, 1048.0, 1888.0, 3913.0, 9219.0, 26162.0, 89134.0, 470477.0, 337968.0, 69707.0, 21220.0, 7798.0, 3489.0, 1649.0, 928.0, 564.0, 395.0, 275.0, 181.0, 146.0, 96.0, 66.0, 40.0, 30.0, 27.0, 18.0, 17.0, 8.0, 6.0, 9.0, 3.0, 5.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-170.125, -164.79296875, -159.4609375, -154.12890625, -148.796875, -143.46484375, -138.1328125, -132.80078125, -127.46875, -122.13671875, -116.8046875, -111.47265625, -106.140625, -100.80859375, -95.4765625, -90.14453125, -84.8125, -79.48046875, -74.1484375, -68.81640625, -63.484375, -58.15234375, -52.8203125, -47.48828125, -42.15625, -36.82421875, -31.4921875, -26.16015625, -20.828125, -15.49609375, -10.1640625, -4.83203125, 0.5, 5.83203125, 11.1640625, 16.49609375, 21.828125, 27.16015625, 32.4921875, 37.82421875, 43.15625, 48.48828125, 53.8203125, 59.15234375, 64.484375, 69.81640625, 75.1484375, 80.48046875, 85.8125, 91.14453125, 96.4765625, 101.80859375, 107.140625, 112.47265625, 117.8046875, 123.13671875, 128.46875, 133.80078125, 139.1328125, 144.46484375, 149.796875, 155.12890625, 160.4609375, 165.79296875, 171.125]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 1.0, 5.0, 6.0, 9.0, 12.0, 12.0, 20.0, 12.0, 21.0, 31.0, 31.0, 28.0, 40.0, 50.0, 40.0, 46.0, 40.0, 49.0, 2091.0, 72.0, 52.0, 52.0, 52.0, 42.0, 40.0, 45.0, 25.0, 23.0, 21.0, 14.0, 15.0, 12.0, 11.0, 9.0, 4.0, 1.0, 10.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1075.0, -1039.875, -1004.75, -969.625, -934.5, -899.375, -864.25, -829.125, -794.0, -758.875, -723.75, -688.625, -653.5, -618.375, -583.25, -548.125, -513.0, -477.875, -442.75, -407.625, -372.5, -337.375, -302.25, -267.125, -232.0, -196.875, -161.75, -126.625, -91.5, -56.375, -21.25, 13.875, 49.0, 84.125, 119.25, 154.375, 189.5, 224.625, 259.75, 294.875, 330.0, 365.125, 400.25, 435.375, 470.5, 505.625, 540.75, 575.875, 611.0, 646.125, 681.25, 716.375, 751.5, 786.625, 821.75, 856.875, 892.0, 927.125, 962.25, 997.375, 1032.5, 1067.625, 1102.75, 1137.875, 1173.0]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 7.0, 11.0, 13.0, 21.0, 26.0, 38.0, 46.0, 59.0, 92.0, 115.0, 157.0, 220.0, 325.0, 582.0, 1162.0, 3019.0, 12271.0, 88575.0, 2855293.0, 157423.0, 18857.0, 4012.0, 1414.0, 662.0, 419.0, 224.0, 173.0, 150.0, 91.0, 59.0, 40.0, 40.0, 30.0, 28.0, 15.0, 9.0, 8.0, 7.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-224.25, -217.375, -210.5, -203.625, -196.75, -189.875, -183.0, -176.125, -169.25, -162.375, -155.5, -148.625, -141.75, -134.875, -128.0, -121.125, -114.25, -107.375, -100.5, -93.625, -86.75, -79.875, -73.0, -66.125, -59.25, -52.375, -45.5, -38.625, -31.75, -24.875, -18.0, -11.125, -4.25, 2.625, 9.5, 16.375, 23.25, 30.125, 37.0, 43.875, 50.75, 57.625, 64.5, 71.375, 78.25, 85.125, 92.0, 98.875, 105.75, 112.625, 119.5, 126.375, 133.25, 140.125, 147.0, 153.875, 160.75, 167.625, 174.5, 181.375, 188.25, 195.125, 202.0, 208.875, 215.75]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 2.0, 3.0, 2.0, 7.0, 7.0, 20.0, 28.0, 51.0, 83.0, 167.0, 248.0, 179.0, 81.0, 41.0, 29.0, 15.0, 13.0, 9.0, 8.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2271.555908203125, -2210.9716796875, -2150.3876953125, -2089.803466796875, -2029.21923828125, -1968.6351318359375, -1908.051025390625, -1847.466796875, -1786.8826904296875, -1726.298583984375, -1665.71435546875, -1605.1302490234375, -1544.546142578125, -1483.9619140625, -1423.3778076171875, -1362.793701171875, -1302.20947265625, -1241.6253662109375, -1181.0411376953125, -1120.45703125, -1059.872802734375, -999.2886962890625, -938.70458984375, -878.1204223632812, -817.5362548828125, -756.9520874023438, -696.367919921875, -635.7838134765625, -575.1996459960938, -514.615478515625, -454.0313415527344, -393.44720458984375, -332.8631591796875, -272.27899169921875, -211.69485473632812, -151.11070251464844, -90.52655029296875, -29.9423828125, 30.641754150390625, 91.22589111328125, 151.81005859375, 212.3942108154297, 272.9783630371094, 333.5625, 394.14666748046875, 454.7308349609375, 515.31494140625, 575.8991088867188, 636.4832763671875, 697.0674438476562, 757.651611328125, 818.2357177734375, 878.8198852539062, 939.404052734375, 999.9881591796875, 1060.572265625, 1121.156494140625, 1181.7406005859375, 1242.3248291015625, 1302.908935546875, 1363.4931640625, 1424.0772705078125, 1484.661376953125, 1545.24560546875, 1605.8297119140625]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 5.0, 0.0, 4.0, 1.0, 7.0, 7.0, 10.0, 6.0, 9.0, 12.0, 25.0, 23.0, 20.0, 20.0, 33.0, 30.0, 43.0, 33.0, 39.0, 37.0, 50.0, 40.0, 52.0, 40.0, 50.0, 43.0, 43.0, 47.0, 31.0, 44.0, 29.0, 39.0, 25.0, 25.0, 19.0, 13.0, 18.0, 3.0, 7.0, 5.0, 4.0, 3.0, 9.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1486.2545166015625, -1440.933349609375, -1395.6123046875, -1350.2911376953125, -1304.969970703125, -1259.6488037109375, -1214.32763671875, -1169.006591796875, -1123.6854248046875, -1078.3642578125, -1033.043212890625, -987.7220458984375, -942.40087890625, -897.0797119140625, -851.7586059570312, -806.4375, -761.1163330078125, -715.795166015625, -670.4740600585938, -625.1529541015625, -579.831787109375, -534.5106201171875, -489.18951416015625, -443.8683776855469, -398.5472412109375, -353.2261047363281, -307.90496826171875, -262.5838317871094, -217.2626953125, -171.94155883789062, -126.62042236328125, -81.29928588867188, -35.9781494140625, 9.342987060546875, 54.66412353515625, 99.98526000976562, 145.306396484375, 190.62753295898438, 235.94866943359375, 281.2698059082031, 326.5909423828125, 371.9120788574219, 417.23321533203125, 462.5543518066406, 507.87548828125, 553.1966552734375, 598.5177612304688, 643.8388671875, 689.1600341796875, 734.481201171875, 779.8023071289062, 825.1234130859375, 870.444580078125, 915.7657470703125, 961.0868530273438, 1006.407958984375, 1051.7291259765625, 1097.05029296875, 1142.371337890625, 1187.6925048828125, 1233.013671875, 1278.3348388671875, 1323.656005859375, 1368.97705078125, 1414.2982177734375]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 4.0, 5.0, 2.0, 9.0, 6.0, 15.0, 11.0, 12.0, 16.0, 14.0, 23.0, 19.0, 18.0, 40.0, 37.0, 46.0, 92.0, 171.0, 281.0, 410.0, 609.0, 2672.0, 1042215.0, 659.0, 409.0, 262.0, 150.0, 81.0, 49.0, 26.0, 35.0, 31.0, 20.0, 21.0, 19.0, 13.0, 11.0, 7.0, 13.0, 10.0, 3.0, 7.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-677.0581665039062, -649.98095703125, -622.9037475585938, -595.8265380859375, -568.749267578125, -541.672119140625, -514.5948486328125, -487.51763916015625, -460.4404296875, -433.36322021484375, -406.2860107421875, -379.2087707519531, -352.1315612792969, -325.0543518066406, -297.97711181640625, -270.89990234375, -243.82269287109375, -216.7454833984375, -189.6682586669922, -162.59103393554688, -135.51382446289062, -108.43661499023438, -81.35939025878906, -54.28216552734375, -27.2049560546875, -0.12773895263671875, 26.949478149414062, 54.026695251464844, 81.10391235351562, 108.18112182617188, 135.2583465576172, 162.3355712890625, 189.412841796875, 216.49005126953125, 243.56727600097656, 270.6445007324219, 297.7217102050781, 324.7989196777344, 351.87615966796875, 378.953369140625, 406.03057861328125, 433.1077880859375, 460.18499755859375, 487.2622375488281, 514.3394775390625, 541.4166259765625, 568.493896484375, 595.5711059570312, 622.6483154296875, 649.7255249023438, 676.802734375, 703.8799438476562, 730.9571533203125, 758.034423828125, 785.1116333007812, 812.1888427734375, 839.2660522460938, 866.34326171875, 893.4204711914062, 920.4976806640625, 947.574951171875, 974.652099609375, 1001.7293701171875, 1028.806640625, 1055.8837890625]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 5.0, 1.0, 7.0, 10.0, 6.0, 10.0, 12.0, 15.0, 17.0, 34.0, 114.0, 257.0, 3928.0, 51458124.0, 397.0, 119.0, 50.0, 18.0, 10.0, 5.0, 8.0, 2.0, 5.0, 1.0, 1.0, 1.0, 6.0, 2.0, 4.0, 2.0, 2.0, 2.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2840.538330078125, -2665.204345703125, -2489.870361328125, -2314.5361328125, -2139.2021484375, -1963.8682861328125, -1788.5341796875, -1613.2001953125, -1437.8662109375, -1262.5322265625, -1087.1982421875, -911.8641357421875, -736.5301513671875, -561.1961669921875, -385.862060546875, -210.528076171875, -35.194091796875, 140.13992309570312, 315.47393798828125, 490.8079833984375, 666.1419677734375, 841.4759521484375, 1016.81005859375, 1192.14404296875, 1367.47802734375, 1542.81201171875, 1718.14599609375, 1893.4801025390625, 2068.81396484375, 2244.14794921875, 2419.482177734375, 2594.816162109375, 2770.150390625, 2945.484375, 3120.818359375, 3296.15234375, 3471.486328125, 3646.8203125, 3822.154541015625, 3997.488525390625, 4172.822265625, 4348.15625, 4523.490234375, 4698.82421875, 4874.158203125, 5049.4921875, 5224.826171875, 5400.16015625, 5575.49462890625, 5750.82861328125, 5926.16259765625, 6101.49658203125, 6276.83056640625, 6452.16455078125, 6627.4990234375, 6802.8330078125, 6978.1669921875, 7153.5009765625, 7328.8349609375, 7504.1689453125, 7679.5029296875, 7854.8369140625, 8030.1708984375, 8205.5048828125, 8380.8388671875]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [3.0, 4.0, 8.0, 6.0, 7.0, 18.0, 21.0, 27.0, 48.0, 57.0, 80.0, 143.0, 195.0, 283.0, 460.0, 626.0, 1066.0, 1528.0, 2296.0, 3545.0, 5335.0, 8315.0, 13133.0, 20142.0, 32477.0, 51256.0, 82950.0, 136849.0, 242663.0, 481360.0, 3977069.0, 565175.0, 270697.0, 150370.0, 90540.0, 55660.0, 35234.0, 22054.0, 14131.0, 9000.0, 5720.0, 3761.0, 2417.0, 1566.0, 1042.0, 703.0, 440.0, 311.0, 216.0, 135.0, 89.0, 56.0, 60.0, 38.0, 19.0, 10.0, 8.0, 9.0, 7.0, 8.0, 3.0, 3.0, 3.0, 1.0], "bins": [-16.921875, -16.36865234375, -15.8154296875, -15.26220703125, -14.708984375, -14.15576171875, -13.6025390625, -13.04931640625, -12.49609375, -11.94287109375, -11.3896484375, -10.83642578125, -10.283203125, -9.72998046875, -9.1767578125, -8.62353515625, -8.0703125, -7.51708984375, -6.9638671875, -6.41064453125, -5.857421875, -5.30419921875, -4.7509765625, -4.19775390625, -3.64453125, -3.09130859375, -2.5380859375, -1.98486328125, -1.431640625, -0.87841796875, -0.3251953125, 0.22802734375, 0.78125, 1.33447265625, 1.8876953125, 2.44091796875, 2.994140625, 3.54736328125, 4.1005859375, 4.65380859375, 5.20703125, 5.76025390625, 6.3134765625, 6.86669921875, 7.419921875, 7.97314453125, 8.5263671875, 9.07958984375, 9.6328125, 10.18603515625, 10.7392578125, 11.29248046875, 11.845703125, 12.39892578125, 12.9521484375, 13.50537109375, 14.05859375, 14.61181640625, 15.1650390625, 15.71826171875, 16.271484375, 16.82470703125, 17.3779296875, 17.93115234375, 18.484375]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 5.0, 6.0, 5.0, 8.0, 9.0, 7.0, 13.0, 9.0, 13.0, 18.0, 17.0, 18.0, 23.0, 31.0, 22.0, 26.0, 26.0, 28.0, 44.0, 28.0, 43.0, 32.0, 20.0, 56.0, 992.0, 63.0, 27.0, 25.0, 40.0, 37.0, 31.0, 30.0, 28.0, 28.0, 28.0, 16.0, 24.0, 23.0, 23.0, 14.0, 18.0, 9.0, 13.0, 14.0, 10.0, 4.0, 5.0, 3.0, 5.0, 3.0, 4.0, 3.0, 3.0, 2.0, 3.0], "bins": [-197.375, -191.486328125, -185.59765625, -179.708984375, -173.8203125, -167.931640625, -162.04296875, -156.154296875, -150.265625, -144.376953125, -138.48828125, -132.599609375, -126.7109375, -120.822265625, -114.93359375, -109.044921875, -103.15625, -97.267578125, -91.37890625, -85.490234375, -79.6015625, -73.712890625, -67.82421875, -61.935546875, -56.046875, -50.158203125, -44.26953125, -38.380859375, -32.4921875, -26.603515625, -20.71484375, -14.826171875, -8.9375, -3.048828125, 2.83984375, 8.728515625, 14.6171875, 20.505859375, 26.39453125, 32.283203125, 38.171875, 44.060546875, 49.94921875, 55.837890625, 61.7265625, 67.615234375, 73.50390625, 79.392578125, 85.28125, 91.169921875, 97.05859375, 102.947265625, 108.8359375, 114.724609375, 120.61328125, 126.501953125, 132.390625, 138.279296875, 144.16796875, 150.056640625, 155.9453125, 161.833984375, 167.72265625, 173.611328125, 179.5]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 6.0, 7.0, 8.0, 2.0, 4.0, 14.0, 20.0, 28.0, 50.0, 65.0, 103.0, 137.0, 224.0, 299.0, 456.0, 662.0, 1068.0, 1499.0, 2421.0, 3575.0, 5848.0, 9072.0, 14449.0, 23755.0, 38481.0, 65017.0, 111636.0, 196973.0, 364471.0, 1335967.0, 3193523.0, 404565.0, 215218.0, 120961.0, 70607.0, 41811.0, 25411.0, 15579.0, 9803.0, 6163.0, 3931.0, 2568.0, 1663.0, 1079.0, 699.0, 540.0, 316.0, 222.0, 138.0, 106.0, 80.0, 57.0, 34.0, 18.0, 16.0, 6.0, 4.0, 8.0, 3.0, 1.0, 2.0], "bins": [-19.921875, -19.319580078125, -18.71728515625, -18.114990234375, -17.5126953125, -16.910400390625, -16.30810546875, -15.705810546875, -15.103515625, -14.501220703125, -13.89892578125, -13.296630859375, -12.6943359375, -12.092041015625, -11.48974609375, -10.887451171875, -10.28515625, -9.682861328125, -9.08056640625, -8.478271484375, -7.8759765625, -7.273681640625, -6.67138671875, -6.069091796875, -5.466796875, -4.864501953125, -4.26220703125, -3.659912109375, -3.0576171875, -2.455322265625, -1.85302734375, -1.250732421875, -0.6484375, -0.046142578125, 0.55615234375, 1.158447265625, 1.7607421875, 2.363037109375, 2.96533203125, 3.567626953125, 4.169921875, 4.772216796875, 5.37451171875, 5.976806640625, 6.5791015625, 7.181396484375, 7.78369140625, 8.385986328125, 8.98828125, 9.590576171875, 10.19287109375, 10.795166015625, 11.3974609375, 11.999755859375, 12.60205078125, 13.204345703125, 13.806640625, 14.408935546875, 15.01123046875, 15.613525390625, 16.2158203125, 16.818115234375, 17.42041015625, 18.022705078125, 18.625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 3.0, 6.0, 6.0, 4.0, 12.0, 17.0, 10.0, 15.0, 15.0, 20.0, 27.0, 26.0, 31.0, 51.0, 36.0, 38.0, 39.0, 32.0, 48.0, 55.0, 932.0, 148.0, 35.0, 41.0, 28.0, 38.0, 36.0, 36.0, 26.0, 32.0, 21.0, 25.0, 24.0, 18.0, 20.0, 16.0, 8.0, 12.0, 6.0, 6.0, 5.0, 6.0, 4.0, 6.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-202.625, -196.630859375, -190.63671875, -184.642578125, -178.6484375, -172.654296875, -166.66015625, -160.666015625, -154.671875, -148.677734375, -142.68359375, -136.689453125, -130.6953125, -124.701171875, -118.70703125, -112.712890625, -106.71875, -100.724609375, -94.73046875, -88.736328125, -82.7421875, -76.748046875, -70.75390625, -64.759765625, -58.765625, -52.771484375, -46.77734375, -40.783203125, -34.7890625, -28.794921875, -22.80078125, -16.806640625, -10.8125, -4.818359375, 1.17578125, 7.169921875, 13.1640625, 19.158203125, 25.15234375, 31.146484375, 37.140625, 43.134765625, 49.12890625, 55.123046875, 61.1171875, 67.111328125, 73.10546875, 79.099609375, 85.09375, 91.087890625, 97.08203125, 103.076171875, 109.0703125, 115.064453125, 121.05859375, 127.052734375, 133.046875, 139.041015625, 145.03515625, 151.029296875, 157.0234375, 163.017578125, 169.01171875, 175.005859375, 181.0]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 8.0, 15.0, 7.0, 11.0, 15.0, 33.0, 36.0, 45.0, 71.0, 92.0, 149.0, 211.0, 306.0, 481.0, 697.0, 1043.0, 1591.0, 2437.0, 3927.0, 6513.0, 11403.0, 21355.0, 46481.0, 133703.0, 5779824.0, 170346.0, 54326.0, 24412.0, 12613.0, 7295.0, 4218.0, 2657.0, 1712.0, 1082.0, 733.0, 483.0, 304.0, 227.0, 189.0, 103.0, 84.0, 51.0, 46.0, 29.0, 16.0, 11.0, 11.0, 14.0, 6.0, 4.0, 5.0, 1.0, 0.0, 2.0], "bins": [-65.125, -63.2421875, -61.359375, -59.4765625, -57.59375, -55.7109375, -53.828125, -51.9453125, -50.0625, -48.1796875, -46.296875, -44.4140625, -42.53125, -40.6484375, -38.765625, -36.8828125, -35.0, -33.1171875, -31.234375, -29.3515625, -27.46875, -25.5859375, -23.703125, -21.8203125, -19.9375, -18.0546875, -16.171875, -14.2890625, -12.40625, -10.5234375, -8.640625, -6.7578125, -4.875, -2.9921875, -1.109375, 0.7734375, 2.65625, 4.5390625, 6.421875, 8.3046875, 10.1875, 12.0703125, 13.953125, 15.8359375, 17.71875, 19.6015625, 21.484375, 23.3671875, 25.25, 27.1328125, 29.015625, 30.8984375, 32.78125, 34.6640625, 36.546875, 38.4296875, 40.3125, 42.1953125, 44.078125, 45.9609375, 47.84375, 49.7265625, 51.609375, 53.4921875, 55.375]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 1.0, 2.0, 2.0, 5.0, 6.0, 10.0, 14.0, 15.0, 11.0, 14.0, 24.0, 15.0, 20.0, 34.0, 31.0, 28.0, 34.0, 48.0, 53.0, 52.0, 46.0, 223.0, 883.0, 39.0, 52.0, 54.0, 31.0, 36.0, 32.0, 27.0, 24.0, 25.0, 23.0, 22.0, 18.0, 16.0, 10.0, 11.0, 5.0, 9.0, 4.0, 8.0, 5.0, 0.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-190.25, -184.515625, -178.78125, -173.046875, -167.3125, -161.578125, -155.84375, -150.109375, -144.375, -138.640625, -132.90625, -127.171875, -121.4375, -115.703125, -109.96875, -104.234375, -98.5, -92.765625, -87.03125, -81.296875, -75.5625, -69.828125, -64.09375, -58.359375, -52.625, -46.890625, -41.15625, -35.421875, -29.6875, -23.953125, -18.21875, -12.484375, -6.75, -1.015625, 4.71875, 10.453125, 16.1875, 21.921875, 27.65625, 33.390625, 39.125, 44.859375, 50.59375, 56.328125, 62.0625, 67.796875, 73.53125, 79.265625, 85.0, 90.734375, 96.46875, 102.203125, 107.9375, 113.671875, 119.40625, 125.140625, 130.875, 136.609375, 142.34375, 148.078125, 153.8125, 159.546875, 165.28125, 171.015625, 176.75]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 13.0, 22.0, 32.0, 41.0, 91.0, 228.0, 321.0, 115.0, 67.0, 25.0, 14.0, 14.0, 8.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1283.35791015625, -1257.22802734375, -1231.0980224609375, -1204.9681396484375, -1178.8382568359375, -1152.708251953125, -1126.578369140625, -1100.448486328125, -1074.318603515625, -1048.188720703125, -1022.0587768554688, -995.9288330078125, -969.7989501953125, -943.6690063476562, -917.5390625, -891.4091796875, -865.2791748046875, -839.1492309570312, -813.0193481445312, -786.889404296875, -760.759521484375, -734.6295776367188, -708.4996337890625, -682.3697509765625, -656.2398071289062, -630.10986328125, -603.97998046875, -577.8500366210938, -551.7200927734375, -525.5902099609375, -499.46026611328125, -473.3303527832031, -447.2004699707031, -421.070556640625, -394.94061279296875, -368.8106994628906, -342.6807861328125, -316.5508728027344, -290.42095947265625, -264.291015625, -238.16110229492188, -212.03118896484375, -185.90126037597656, -159.77133178710938, -133.64141845703125, -107.51150512695312, -81.38157653808594, -55.25164794921875, -29.121734619140625, -2.9918136596679688, 23.138107299804688, 49.268028259277344, 75.39794921875, 101.52786254882812, 127.65779113769531, 153.7877197265625, 179.91763305664062, 206.04754638671875, 232.17747497558594, 258.3074035644531, 284.43731689453125, 310.5672302246094, 336.6971435546875, 362.82708740234375, 388.9570007324219]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 3.0, 5.0, 7.0, 10.0, 11.0, 14.0, 7.0, 10.0, 15.0, 15.0, 19.0, 24.0, 19.0, 29.0, 22.0, 25.0, 21.0, 35.0, 39.0, 29.0, 37.0, 43.0, 29.0, 36.0, 46.0, 43.0, 30.0, 39.0, 28.0, 33.0, 35.0, 26.0, 35.0, 27.0, 19.0, 16.0, 27.0, 17.0, 12.0, 10.0, 19.0, 5.0, 9.0, 10.0, 6.0, 4.0, 4.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0], "bins": [-618.5052490234375, -600.7103271484375, -582.9153442382812, -565.1204223632812, -547.325439453125, -529.530517578125, -511.7355651855469, -493.94061279296875, -476.1456604003906, -458.3507080078125, -440.5557556152344, -422.76080322265625, -404.96588134765625, -387.1708984375, -369.3759765625, -351.5810241699219, -333.78607177734375, -315.9911193847656, -298.1961669921875, -280.4012145996094, -262.60626220703125, -244.8113250732422, -227.01638793945312, -209.221435546875, -191.42648315429688, -173.63153076171875, -155.83657836914062, -138.04164123535156, -120.24668884277344, -102.45173645019531, -84.65679168701172, -66.86184692382812, -49.06689453125, -31.27194595336914, -13.476997375488281, 4.317951202392578, 22.112899780273438, 39.90785217285156, 57.702796936035156, 75.49774169921875, 93.29269409179688, 111.087646484375, 128.88259887695312, 146.6775360107422, 164.4724884033203, 182.26744079589844, 200.0623779296875, 217.85733032226562, 235.65228271484375, 253.44723510742188, 271.2421875, 289.0371398925781, 306.83209228515625, 324.62701416015625, 342.4219665527344, 360.2169189453125, 378.0118713378906, 395.80682373046875, 413.6017761230469, 431.396728515625, 449.191650390625, 466.98663330078125, 484.78155517578125, 502.5765075683594, 520.3714599609375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 4.0, 7.0, 13.0, 23.0, 18.0, 38.0, 49.0, 86.0, 112.0, 173.0, 259.0, 447.0, 747.0, 1313.0, 2447.0, 5351.0, 15053.0, 90864.0, 4022037.0, 35354.0, 10331.0, 4351.0, 2215.0, 1200.0, 641.0, 406.0, 267.0, 168.0, 92.0, 68.0, 36.0, 44.0, 21.0, 12.0, 7.0, 9.0, 8.0, 5.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.20703125, -5.05059814453125, -4.8941650390625, -4.73773193359375, -4.581298828125, -4.42486572265625, -4.2684326171875, -4.11199951171875, -3.95556640625, -3.79913330078125, -3.6427001953125, -3.48626708984375, -3.329833984375, -3.17340087890625, -3.0169677734375, -2.86053466796875, -2.7041015625, -2.54766845703125, -2.3912353515625, -2.23480224609375, -2.078369140625, -1.92193603515625, -1.7655029296875, -1.60906982421875, -1.45263671875, -1.29620361328125, -1.1397705078125, -0.98333740234375, -0.826904296875, -0.67047119140625, -0.5140380859375, -0.35760498046875, -0.201171875, -0.04473876953125, 0.1116943359375, 0.26812744140625, 0.424560546875, 0.58099365234375, 0.7374267578125, 0.89385986328125, 1.05029296875, 1.20672607421875, 1.3631591796875, 1.51959228515625, 1.676025390625, 1.83245849609375, 1.9888916015625, 2.14532470703125, 2.3017578125, 2.45819091796875, 2.6146240234375, 2.77105712890625, 2.927490234375, 3.08392333984375, 3.2403564453125, 3.39678955078125, 3.55322265625, 3.70965576171875, 3.8660888671875, 4.02252197265625, 4.178955078125, 4.33538818359375, 4.4918212890625, 4.64825439453125, 4.8046875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 4.0, 3.0, 7.0, 8.0, 10.0, 14.0, 16.0, 11.0, 16.0, 737.0, 64.0, 20.0, 12.0, 13.0, 8.0, 7.0, 9.0, 5.0, 4.0, 4.0, 2.0, 2.0, 6.0, 2.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9755859375, -1.91558837890625, -1.8555908203125, -1.79559326171875, -1.735595703125, -1.67559814453125, -1.6156005859375, -1.55560302734375, -1.49560546875, -1.43560791015625, -1.3756103515625, -1.31561279296875, -1.255615234375, -1.19561767578125, -1.1356201171875, -1.07562255859375, -1.015625, -0.95562744140625, -0.8956298828125, -0.83563232421875, -0.775634765625, -0.71563720703125, -0.6556396484375, -0.59564208984375, -0.53564453125, -0.47564697265625, -0.4156494140625, -0.35565185546875, -0.295654296875, -0.23565673828125, -0.1756591796875, -0.11566162109375, -0.0556640625, 0.00433349609375, 0.0643310546875, 0.12432861328125, 0.184326171875, 0.24432373046875, 0.3043212890625, 0.36431884765625, 0.42431640625, 0.48431396484375, 0.5443115234375, 0.60430908203125, 0.664306640625, 0.72430419921875, 0.7843017578125, 0.84429931640625, 0.904296875, 0.96429443359375, 1.0242919921875, 1.08428955078125, 1.144287109375, 1.20428466796875, 1.2642822265625, 1.32427978515625, 1.38427734375, 1.44427490234375, 1.5042724609375, 1.56427001953125, 1.624267578125, 1.68426513671875, 1.7442626953125, 1.80426025390625, 1.8642578125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 3.0, 5.0, 6.0, 8.0, 24.0, 32.0, 40.0, 55.0, 83.0, 146.0, 270.0, 482.0, 919.0, 1944.0, 4633.0, 14370.0, 72121.0, 3445410.0, 592524.0, 44071.0, 10435.0, 3589.0, 1471.0, 700.0, 354.0, 211.0, 118.0, 89.0, 70.0, 29.0, 24.0, 13.0, 16.0, 5.0, 4.0, 5.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0859375, -4.93115234375, -4.7763671875, -4.62158203125, -4.466796875, -4.31201171875, -4.1572265625, -4.00244140625, -3.84765625, -3.69287109375, -3.5380859375, -3.38330078125, -3.228515625, -3.07373046875, -2.9189453125, -2.76416015625, -2.609375, -2.45458984375, -2.2998046875, -2.14501953125, -1.990234375, -1.83544921875, -1.6806640625, -1.52587890625, -1.37109375, -1.21630859375, -1.0615234375, -0.90673828125, -0.751953125, -0.59716796875, -0.4423828125, -0.28759765625, -0.1328125, 0.02197265625, 0.1767578125, 0.33154296875, 0.486328125, 0.64111328125, 0.7958984375, 0.95068359375, 1.10546875, 1.26025390625, 1.4150390625, 1.56982421875, 1.724609375, 1.87939453125, 2.0341796875, 2.18896484375, 2.34375, 2.49853515625, 2.6533203125, 2.80810546875, 2.962890625, 3.11767578125, 3.2724609375, 3.42724609375, 3.58203125, 3.73681640625, 3.8916015625, 4.04638671875, 4.201171875, 4.35595703125, 4.5107421875, 4.66552734375, 4.8203125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 3.0, 6.0, 3.0, 9.0, 7.0, 17.0, 19.0, 38.0, 68.0, 91.0, 155.0, 524.0, 2295.0, 425.0, 138.0, 99.0, 52.0, 43.0, 33.0, 16.0, 11.0, 6.0, 7.0, 6.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.564453125, -2.474273681640625, -2.38409423828125, -2.293914794921875, -2.2037353515625, -2.113555908203125, -2.02337646484375, -1.933197021484375, -1.843017578125, -1.752838134765625, -1.66265869140625, -1.572479248046875, -1.4822998046875, -1.392120361328125, -1.30194091796875, -1.211761474609375, -1.12158203125, -1.031402587890625, -0.94122314453125, -0.851043701171875, -0.7608642578125, -0.670684814453125, -0.58050537109375, -0.490325927734375, -0.400146484375, -0.309967041015625, -0.21978759765625, -0.129608154296875, -0.0394287109375, 0.050750732421875, 0.14093017578125, 0.231109619140625, 0.3212890625, 0.411468505859375, 0.50164794921875, 0.591827392578125, 0.6820068359375, 0.772186279296875, 0.86236572265625, 0.952545166015625, 1.042724609375, 1.132904052734375, 1.22308349609375, 1.313262939453125, 1.4034423828125, 1.493621826171875, 1.58380126953125, 1.673980712890625, 1.76416015625, 1.854339599609375, 1.94451904296875, 2.034698486328125, 2.1248779296875, 2.215057373046875, 2.30523681640625, 2.395416259765625, 2.485595703125, 2.575775146484375, 2.66595458984375, 2.756134033203125, 2.8463134765625, 2.936492919921875, 3.02667236328125, 3.116851806640625, 3.20703125]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 5.0, 19.0, 86.0, 509.0, 324.0, 40.0, 20.0, 4.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.623452186584473, -4.802863597869873, -3.9822750091552734, -3.161686420440674, -2.341097831726074, -1.5205092430114746, -0.699920654296875, 0.12066793441772461, 0.9412565231323242, 1.7618451118469238, 2.5824337005615234, 3.403022289276123, 4.223610877990723, 5.044199466705322, 5.864788055419922, 6.6853766441345215, 7.505965232849121, 8.326553344726562, 9.14714241027832, 9.967731475830078, 10.78831958770752, 11.608907699584961, 12.429496765136719, 13.250085830688477, 14.070673942565918, 14.89126205444336, 15.711851119995117, 16.532440185546875, 17.35302734375, 18.173616409301758, 18.994205474853516, 19.814794540405273, 20.63538360595703, 21.45597267150879, 22.276561737060547, 23.097148895263672, 23.91773796081543, 24.738327026367188, 25.558914184570312, 26.37950325012207, 27.200092315673828, 28.020681381225586, 28.841270446777344, 29.66185760498047, 30.482446670532227, 31.303035736083984, 32.12362289428711, 32.9442138671875, 33.764801025390625, 34.58538818359375, 35.40597915649414, 36.226566314697266, 37.047157287597656, 37.86774444580078, 38.688331604003906, 39.5089225769043, 40.32950973510742, 41.15009689331055, 41.97068786621094, 42.79127502441406, 43.61186218261719, 44.43245315551758, 45.2530403137207, 46.073631286621094, 46.89421844482422]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 2.0, 6.0, 6.0, 13.0, 15.0, 18.0, 19.0, 20.0, 17.0, 44.0, 33.0, 47.0, 50.0, 61.0, 48.0, 50.0, 57.0, 54.0, 67.0, 60.0, 38.0, 41.0, 42.0, 35.0, 32.0, 23.0, 22.0, 16.0, 19.0, 8.0, 10.0, 7.0, 6.0, 6.0, 5.0, 5.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-8.067513465881348, -7.841927528381348, -7.616341590881348, -7.390755653381348, -7.165169715881348, -6.939583778381348, -6.713997840881348, -6.4884114265441895, -6.2628254890441895, -6.0372395515441895, -5.8116536140441895, -5.5860676765441895, -5.3604817390441895, -5.134895324707031, -4.909309387207031, -4.683723449707031, -4.458137512207031, -4.232551574707031, -4.006965637207031, -3.7813796997070312, -3.555793523788452, -3.330207586288452, -3.104621648788452, -2.879035472869873, -2.6534500122070312, -2.4278640747070312, -2.2022781372070312, -1.9766920804977417, -1.7511060237884521, -1.5255200862884521, -1.2999341487884521, -1.0743480920791626, -0.848762035369873, -0.6231760382652283, -0.3975900709629059, -0.1720041036605835, 0.05358189344406128, 0.27916789054870605, 0.504753828048706, 0.7303398847579956, 0.9559258222579956, 1.1815117597579956, 1.4070978164672852, 1.6326837539672852, 1.8582696914672852, 2.083855628967285, 2.309441566467285, 2.5350277423858643, 2.7606136798858643, 2.9861996173858643, 3.2117855548858643, 3.4373717308044434, 3.6629576683044434, 3.8885436058044434, 4.114129543304443, 4.339715480804443, 4.565301418304443, 4.790887355804443, 5.016473293304443, 5.242059230804443, 5.467645168304443, 5.693231582641602, 5.918817520141602, 6.144403457641602, 6.369989395141602]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 6.0, 5.0, 9.0, 16.0, 23.0, 20.0, 24.0, 49.0, 63.0, 97.0, 116.0, 161.0, 216.0, 295.0, 437.0, 578.0, 874.0, 1166.0, 1713.0, 2659.0, 4148.0, 7248.0, 13939.0, 33604.0, 898371.0, 44303.0, 16228.0, 8269.0, 4658.0, 2892.0, 1901.0, 1298.0, 914.0, 603.0, 481.0, 339.0, 214.0, 172.0, 125.0, 74.0, 67.0, 54.0, 31.0, 30.0, 15.0, 17.0, 13.0, 7.0, 6.0, 6.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.3125, -9.017822265625, -8.72314453125, -8.428466796875, -8.1337890625, -7.839111328125, -7.54443359375, -7.249755859375, -6.955078125, -6.660400390625, -6.36572265625, -6.071044921875, -5.7763671875, -5.481689453125, -5.18701171875, -4.892333984375, -4.59765625, -4.302978515625, -4.00830078125, -3.713623046875, -3.4189453125, -3.124267578125, -2.82958984375, -2.534912109375, -2.240234375, -1.945556640625, -1.65087890625, -1.356201171875, -1.0615234375, -0.766845703125, -0.47216796875, -0.177490234375, 0.1171875, 0.411865234375, 0.70654296875, 1.001220703125, 1.2958984375, 1.590576171875, 1.88525390625, 2.179931640625, 2.474609375, 2.769287109375, 3.06396484375, 3.358642578125, 3.6533203125, 3.947998046875, 4.24267578125, 4.537353515625, 4.83203125, 5.126708984375, 5.42138671875, 5.716064453125, 6.0107421875, 6.305419921875, 6.60009765625, 6.894775390625, 7.189453125, 7.484130859375, 7.77880859375, 8.073486328125, 8.3681640625, 8.662841796875, 8.95751953125, 9.252197265625, 9.546875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 7.0, 5.0, 11.0, 12.0, 15.0, 13.0, 18.0, 203.0, 586.0, 31.0, 12.0, 11.0, 12.0, 11.0, 6.0, 7.0, 2.0, 4.0, 6.0, 1.0, 4.0, 2.0, 4.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.958984375, -1.8983001708984375, -1.837615966796875, -1.7769317626953125, -1.71624755859375, -1.6555633544921875, -1.594879150390625, -1.5341949462890625, -1.4735107421875, -1.4128265380859375, -1.352142333984375, -1.2914581298828125, -1.23077392578125, -1.1700897216796875, -1.109405517578125, -1.0487213134765625, -0.988037109375, -0.9273529052734375, -0.866668701171875, -0.8059844970703125, -0.74530029296875, -0.6846160888671875, -0.623931884765625, -0.5632476806640625, -0.5025634765625, -0.4418792724609375, -0.381195068359375, -0.3205108642578125, -0.25982666015625, -0.1991424560546875, -0.138458251953125, -0.0777740478515625, -0.01708984375, 0.0435943603515625, 0.104278564453125, 0.1649627685546875, 0.22564697265625, 0.2863311767578125, 0.347015380859375, 0.4076995849609375, 0.4683837890625, 0.5290679931640625, 0.589752197265625, 0.6504364013671875, 0.71112060546875, 0.7718048095703125, 0.832489013671875, 0.8931732177734375, 0.953857421875, 1.0145416259765625, 1.075225830078125, 1.1359100341796875, 1.19659423828125, 1.2572784423828125, 1.317962646484375, 1.3786468505859375, 1.4393310546875, 1.5000152587890625, 1.560699462890625, 1.6213836669921875, 1.68206787109375, 1.7427520751953125, 1.803436279296875, 1.8641204833984375, 1.9248046875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 8.0, 1.0, 7.0, 12.0, 14.0, 14.0, 17.0, 26.0, 30.0, 36.0, 48.0, 69.0, 117.0, 130.0, 191.0, 276.0, 391.0, 679.0, 1058.0, 1911.0, 3649.0, 8167.0, 19293.0, 52577.0, 182946.0, 576778.0, 129541.0, 40815.0, 15401.0, 6666.0, 3143.0, 1759.0, 902.0, 555.0, 387.0, 242.0, 181.0, 121.0, 101.0, 72.0, 56.0, 45.0, 39.0, 21.0, 20.0, 10.0, 7.0, 14.0, 5.0, 9.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.1484375, -4.98944091796875, -4.8304443359375, -4.67144775390625, -4.512451171875, -4.35345458984375, -4.1944580078125, -4.03546142578125, -3.87646484375, -3.71746826171875, -3.5584716796875, -3.39947509765625, -3.240478515625, -3.08148193359375, -2.9224853515625, -2.76348876953125, -2.6044921875, -2.44549560546875, -2.2864990234375, -2.12750244140625, -1.968505859375, -1.80950927734375, -1.6505126953125, -1.49151611328125, -1.33251953125, -1.17352294921875, -1.0145263671875, -0.85552978515625, -0.696533203125, -0.53753662109375, -0.3785400390625, -0.21954345703125, -0.060546875, 0.09844970703125, 0.2574462890625, 0.41644287109375, 0.575439453125, 0.73443603515625, 0.8934326171875, 1.05242919921875, 1.21142578125, 1.37042236328125, 1.5294189453125, 1.68841552734375, 1.847412109375, 2.00640869140625, 2.1654052734375, 2.32440185546875, 2.4833984375, 2.64239501953125, 2.8013916015625, 2.96038818359375, 3.119384765625, 3.27838134765625, 3.4373779296875, 3.59637451171875, 3.75537109375, 3.91436767578125, 4.0733642578125, 4.23236083984375, 4.391357421875, 4.55035400390625, 4.7093505859375, 4.86834716796875, 5.02734375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 2.0, 3.0, 1.0, 1.0, 4.0, 4.0, 7.0, 6.0, 10.0, 21.0, 18.0, 17.0, 13.0, 29.0, 24.0, 26.0, 25.0, 33.0, 36.0, 44.0, 48.0, 45.0, 35.0, 52.0, 38.0, 43.0, 37.0, 42.0, 34.0, 17.0, 34.0, 36.0, 27.0, 32.0, 18.0, 24.0, 11.0, 24.0, 15.0, 16.0, 4.0, 12.0, 6.0, 7.0, 8.0, 6.0, 2.0, 4.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.0625, -5.86993408203125, -5.6773681640625, -5.48480224609375, -5.292236328125, -5.09967041015625, -4.9071044921875, -4.71453857421875, -4.52197265625, -4.32940673828125, -4.1368408203125, -3.94427490234375, -3.751708984375, -3.55914306640625, -3.3665771484375, -3.17401123046875, -2.9814453125, -2.78887939453125, -2.5963134765625, -2.40374755859375, -2.211181640625, -2.01861572265625, -1.8260498046875, -1.63348388671875, -1.44091796875, -1.24835205078125, -1.0557861328125, -0.86322021484375, -0.670654296875, -0.47808837890625, -0.2855224609375, -0.09295654296875, 0.099609375, 0.29217529296875, 0.4847412109375, 0.67730712890625, 0.869873046875, 1.06243896484375, 1.2550048828125, 1.44757080078125, 1.64013671875, 1.83270263671875, 2.0252685546875, 2.21783447265625, 2.410400390625, 2.60296630859375, 2.7955322265625, 2.98809814453125, 3.1806640625, 3.37322998046875, 3.5657958984375, 3.75836181640625, 3.950927734375, 4.14349365234375, 4.3360595703125, 4.52862548828125, 4.72119140625, 4.91375732421875, 5.1063232421875, 5.29888916015625, 5.491455078125, 5.68402099609375, 5.8765869140625, 6.06915283203125, 6.26171875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 6.0, 1.0, 3.0, 6.0, 9.0, 11.0, 10.0, 14.0, 19.0, 28.0, 34.0, 54.0, 93.0, 125.0, 212.0, 382.0, 716.0, 1774.0, 5618.0, 35293.0, 947843.0, 46226.0, 6311.0, 1919.0, 797.0, 421.0, 217.0, 130.0, 70.0, 63.0, 32.0, 33.0, 24.0, 18.0, 11.0, 4.0, 4.0, 7.0, 4.0, 4.0, 4.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-7.65625, -7.3970947265625, -7.137939453125, -6.8787841796875, -6.61962890625, -6.3604736328125, -6.101318359375, -5.8421630859375, -5.5830078125, -5.3238525390625, -5.064697265625, -4.8055419921875, -4.54638671875, -4.2872314453125, -4.028076171875, -3.7689208984375, -3.509765625, -3.2506103515625, -2.991455078125, -2.7322998046875, -2.47314453125, -2.2139892578125, -1.954833984375, -1.6956787109375, -1.4365234375, -1.1773681640625, -0.918212890625, -0.6590576171875, -0.39990234375, -0.1407470703125, 0.118408203125, 0.3775634765625, 0.63671875, 0.8958740234375, 1.155029296875, 1.4141845703125, 1.67333984375, 1.9324951171875, 2.191650390625, 2.4508056640625, 2.7099609375, 2.9691162109375, 3.228271484375, 3.4874267578125, 3.74658203125, 4.0057373046875, 4.264892578125, 4.5240478515625, 4.783203125, 5.0423583984375, 5.301513671875, 5.5606689453125, 5.81982421875, 6.0789794921875, 6.338134765625, 6.5972900390625, 6.8564453125, 7.1156005859375, 7.374755859375, 7.6339111328125, 7.89306640625, 8.1522216796875, 8.411376953125, 8.6705322265625, 8.9296875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 6.0, 4.0, 9.0, 9.0, 15.0, 27.0, 43.0, 81.0, 130.0, 195.0, 169.0, 109.0, 76.0, 46.0, 25.0, 18.0, 9.0, 11.0, 7.0, 2.0, 2.0, 1.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004100799560546875, -0.00039636343717575073, -0.00038264691829681396, -0.0003689303994178772, -0.00035521388053894043, -0.00034149736166000366, -0.0003277808427810669, -0.0003140643239021301, -0.00030034780502319336, -0.0002866312861442566, -0.0002729147672653198, -0.00025919824838638306, -0.0002454817295074463, -0.00023176521062850952, -0.00021804869174957275, -0.00020433217287063599, -0.00019061565399169922, -0.00017689913511276245, -0.00016318261623382568, -0.00014946609735488892, -0.00013574957847595215, -0.00012203305959701538, -0.00010831654071807861, -9.460002183914185e-05, -8.088350296020508e-05, -6.716698408126831e-05, -5.345046520233154e-05, -3.9733946323394775e-05, -2.6017427444458008e-05, -1.230090856552124e-05, 1.4156103134155273e-06, 1.5132129192352295e-05, 2.8848648071289062e-05, 4.256516695022583e-05, 5.62816858291626e-05, 6.999820470809937e-05, 8.371472358703613e-05, 9.74312424659729e-05, 0.00011114776134490967, 0.00012486428022384644, 0.0001385807991027832, 0.00015229731798171997, 0.00016601383686065674, 0.0001797303557395935, 0.00019344687461853027, 0.00020716339349746704, 0.0002208799123764038, 0.00023459643125534058, 0.00024831295013427734, 0.0002620294690132141, 0.0002757459878921509, 0.00028946250677108765, 0.0003031790256500244, 0.0003168955445289612, 0.00033061206340789795, 0.0003443285822868347, 0.0003580451011657715, 0.00037176162004470825, 0.000385478138923645, 0.0003991946578025818, 0.00041291117668151855, 0.0004266276955604553, 0.0004403442144393921, 0.00045406073331832886, 0.0004677772521972656]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 5.0, 5.0, 10.0, 12.0, 20.0, 30.0, 39.0, 70.0, 97.0, 178.0, 331.0, 640.0, 1388.0, 3716.0, 14002.0, 101135.0, 824901.0, 83465.0, 12291.0, 3478.0, 1344.0, 615.0, 319.0, 176.0, 95.0, 46.0, 57.0, 29.0, 22.0, 8.0, 8.0, 5.0, 7.0, 0.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.40625, -5.24468994140625, -5.0831298828125, -4.92156982421875, -4.760009765625, -4.59844970703125, -4.4368896484375, -4.27532958984375, -4.11376953125, -3.95220947265625, -3.7906494140625, -3.62908935546875, -3.467529296875, -3.30596923828125, -3.1444091796875, -2.98284912109375, -2.8212890625, -2.65972900390625, -2.4981689453125, -2.33660888671875, -2.175048828125, -2.01348876953125, -1.8519287109375, -1.69036865234375, -1.52880859375, -1.36724853515625, -1.2056884765625, -1.04412841796875, -0.882568359375, -0.72100830078125, -0.5594482421875, -0.39788818359375, -0.236328125, -0.07476806640625, 0.0867919921875, 0.24835205078125, 0.409912109375, 0.57147216796875, 0.7330322265625, 0.89459228515625, 1.05615234375, 1.21771240234375, 1.3792724609375, 1.54083251953125, 1.702392578125, 1.86395263671875, 2.0255126953125, 2.18707275390625, 2.3486328125, 2.51019287109375, 2.6717529296875, 2.83331298828125, 2.994873046875, 3.15643310546875, 3.3179931640625, 3.47955322265625, 3.64111328125, 3.80267333984375, 3.9642333984375, 4.12579345703125, 4.287353515625, 4.44891357421875, 4.6104736328125, 4.77203369140625, 4.93359375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 5.0, 3.0, 6.0, 7.0, 11.0, 15.0, 19.0, 26.0, 38.0, 60.0, 80.0, 131.0, 125.0, 112.0, 95.0, 86.0, 50.0, 39.0, 28.0, 28.0, 16.0, 8.0, 4.0, 4.0, 3.0, 6.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.18359375, -4.9989013671875, -4.814208984375, -4.6295166015625, -4.44482421875, -4.2601318359375, -4.075439453125, -3.8907470703125, -3.7060546875, -3.5213623046875, -3.336669921875, -3.1519775390625, -2.96728515625, -2.7825927734375, -2.597900390625, -2.4132080078125, -2.228515625, -2.0438232421875, -1.859130859375, -1.6744384765625, -1.48974609375, -1.3050537109375, -1.120361328125, -0.9356689453125, -0.7509765625, -0.5662841796875, -0.381591796875, -0.1968994140625, -0.01220703125, 0.1724853515625, 0.357177734375, 0.5418701171875, 0.7265625, 0.9112548828125, 1.095947265625, 1.2806396484375, 1.46533203125, 1.6500244140625, 1.834716796875, 2.0194091796875, 2.2041015625, 2.3887939453125, 2.573486328125, 2.7581787109375, 2.94287109375, 3.1275634765625, 3.312255859375, 3.4969482421875, 3.681640625, 3.8663330078125, 4.051025390625, 4.2357177734375, 4.42041015625, 4.6051025390625, 4.789794921875, 4.9744873046875, 5.1591796875, 5.3438720703125, 5.528564453125, 5.7132568359375, 5.89794921875, 6.0826416015625, 6.267333984375, 6.4520263671875, 6.63671875]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 10.0, 6.0, 12.0, 34.0, 71.0, 204.0, 436.0, 134.0, 41.0, 24.0, 13.0, 4.0, 5.0, 3.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.56300735473633, -57.570335388183594, -54.577659606933594, -51.58498764038086, -48.59231185913086, -45.599639892578125, -42.606964111328125, -39.61429214477539, -36.621620178222656, -33.62894821166992, -30.636272430419922, -27.643600463867188, -24.650924682617188, -21.658252716064453, -18.665578842163086, -15.672904968261719, -12.680229187011719, -9.687555313110352, -6.694881916046143, -3.7022085189819336, -0.7095346450805664, 2.283139228820801, 5.275812149047852, 8.268486022949219, 11.261159896850586, 14.253833770751953, 17.24650764465332, 20.239181518554688, 23.231853485107422, 26.224529266357422, 29.217201232910156, 32.209877014160156, 35.202552795410156, 38.19522476196289, 41.18790054321289, 44.180572509765625, 47.173248291015625, 50.16592025756836, 53.158592224121094, 56.151268005371094, 59.143943786621094, 62.13661575317383, 65.12928771972656, 68.12196350097656, 71.11463928222656, 74.10731506347656, 77.09998321533203, 80.09265899658203, 83.0853271484375, 86.0780029296875, 89.07067108154297, 92.06334686279297, 95.05602264404297, 98.04869842529297, 101.04136657714844, 104.03404235839844, 107.02671813964844, 110.01939392089844, 113.0120620727539, 116.0047378540039, 118.9974136352539, 121.9900894165039, 124.98275756835938, 127.97543334960938, 130.96810913085938]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 4.0, 3.0, 5.0, 10.0, 4.0, 19.0, 26.0, 32.0, 54.0, 88.0, 92.0, 142.0, 154.0, 105.0, 68.0, 40.0, 45.0, 22.0, 17.0, 11.0, 12.0, 8.0, 11.0, 4.0, 6.0, 3.0, 2.0, 4.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0], "bins": [-151.12779235839844, -147.177734375, -143.2276611328125, -139.27760314941406, -135.32754516601562, -131.3774871826172, -127.42742156982422, -123.47735595703125, -119.52729797363281, -115.57723999023438, -111.6271743774414, -107.67710876464844, -103.72705078125, -99.77699279785156, -95.8269271850586, -91.87686157226562, -87.92680358886719, -83.97674560546875, -80.02667999267578, -76.07661437988281, -72.12655639648438, -68.17649841308594, -64.22643280029297, -60.276371002197266, -56.32630920410156, -52.37624740600586, -48.426185607910156, -44.47612380981445, -40.52606201171875, -36.57600021362305, -32.625938415527344, -28.67587661743164, -24.725807189941406, -20.775745391845703, -16.82568359375, -12.875621795654297, -8.925559997558594, -4.975498199462891, -1.0254364013671875, 2.9246253967285156, 6.874687194824219, 10.824748992919922, 14.774810791015625, 18.724872589111328, 22.67493438720703, 26.624996185302734, 30.575057983398438, 34.52511978149414, 38.475181579589844, 42.42524337768555, 46.37530517578125, 50.32536697387695, 54.275428771972656, 58.22549057006836, 62.17555236816406, 66.1256103515625, 70.07567596435547, 74.02574157714844, 77.97579956054688, 81.92585754394531, 85.87592315673828, 89.82598876953125, 93.77604675292969, 97.72610473632812, 101.6761703491211]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 3.0, 1.0, 3.0, 3.0, 8.0, 12.0, 17.0, 20.0, 46.0, 101.0, 176.0, 401.0, 893.0, 2181.0, 5922.0, 21134.0, 226562.0, 3877422.0, 43006.0, 10256.0, 3572.0, 1411.0, 580.0, 265.0, 127.0, 69.0, 33.0, 21.0, 15.0, 9.0, 5.0, 3.0, 5.0, 1.0, 1.0, 6.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.890625, -20.220947265625, -19.55126953125, -18.881591796875, -18.2119140625, -17.542236328125, -16.87255859375, -16.202880859375, -15.533203125, -14.863525390625, -14.19384765625, -13.524169921875, -12.8544921875, -12.184814453125, -11.51513671875, -10.845458984375, -10.17578125, -9.506103515625, -8.83642578125, -8.166748046875, -7.4970703125, -6.827392578125, -6.15771484375, -5.488037109375, -4.818359375, -4.148681640625, -3.47900390625, -2.809326171875, -2.1396484375, -1.469970703125, -0.80029296875, -0.130615234375, 0.5390625, 1.208740234375, 1.87841796875, 2.548095703125, 3.2177734375, 3.887451171875, 4.55712890625, 5.226806640625, 5.896484375, 6.566162109375, 7.23583984375, 7.905517578125, 8.5751953125, 9.244873046875, 9.91455078125, 10.584228515625, 11.25390625, 11.923583984375, 12.59326171875, 13.262939453125, 13.9326171875, 14.602294921875, 15.27197265625, 15.941650390625, 16.611328125, 17.281005859375, 17.95068359375, 18.620361328125, 19.2900390625, 19.959716796875, 20.62939453125, 21.299072265625, 21.96875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 4.0, 1.0, 3.0, 3.0, 4.0, 3.0, 3.0, 3.0, 6.0, 9.0, 9.0, 14.0, 10.0, 16.0, 32.0, 102.0, 235.0, 273.0, 123.0, 45.0, 25.0, 14.0, 12.0, 10.0, 4.0, 7.0, 7.0, 4.0, 2.0, 2.0, 7.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2978515625, -1.257598876953125, -1.21734619140625, -1.177093505859375, -1.1368408203125, -1.096588134765625, -1.05633544921875, -1.016082763671875, -0.975830078125, -0.935577392578125, -0.89532470703125, -0.855072021484375, -0.8148193359375, -0.774566650390625, -0.73431396484375, -0.694061279296875, -0.65380859375, -0.613555908203125, -0.57330322265625, -0.533050537109375, -0.4927978515625, -0.452545166015625, -0.41229248046875, -0.372039794921875, -0.331787109375, -0.291534423828125, -0.25128173828125, -0.211029052734375, -0.1707763671875, -0.130523681640625, -0.09027099609375, -0.050018310546875, -0.009765625, 0.030487060546875, 0.07073974609375, 0.110992431640625, 0.1512451171875, 0.191497802734375, 0.23175048828125, 0.272003173828125, 0.312255859375, 0.352508544921875, 0.39276123046875, 0.433013916015625, 0.4732666015625, 0.513519287109375, 0.55377197265625, 0.594024658203125, 0.63427734375, 0.674530029296875, 0.71478271484375, 0.755035400390625, 0.7952880859375, 0.835540771484375, 0.87579345703125, 0.916046142578125, 0.956298828125, 0.996551513671875, 1.03680419921875, 1.077056884765625, 1.1173095703125, 1.157562255859375, 1.19781494140625, 1.238067626953125, 1.2783203125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 6.0, 3.0, 8.0, 12.0, 16.0, 8.0, 23.0, 28.0, 25.0, 41.0, 53.0, 65.0, 120.0, 152.0, 276.0, 332.0, 680.0, 1299.0, 2747.0, 6543.0, 18569.0, 80022.0, 2763557.0, 1224908.0, 67828.0, 16186.0, 5770.0, 2391.0, 1084.0, 573.0, 342.0, 198.0, 121.0, 81.0, 54.0, 44.0, 30.0, 32.0, 19.0, 10.0, 6.0, 7.0, 6.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0], "bins": [-8.921875, -8.67376708984375, -8.4256591796875, -8.17755126953125, -7.929443359375, -7.68133544921875, -7.4332275390625, -7.18511962890625, -6.93701171875, -6.68890380859375, -6.4407958984375, -6.19268798828125, -5.944580078125, -5.69647216796875, -5.4483642578125, -5.20025634765625, -4.9521484375, -4.70404052734375, -4.4559326171875, -4.20782470703125, -3.959716796875, -3.71160888671875, -3.4635009765625, -3.21539306640625, -2.96728515625, -2.71917724609375, -2.4710693359375, -2.22296142578125, -1.974853515625, -1.72674560546875, -1.4786376953125, -1.23052978515625, -0.982421875, -0.73431396484375, -0.4862060546875, -0.23809814453125, 0.010009765625, 0.25811767578125, 0.5062255859375, 0.75433349609375, 1.00244140625, 1.25054931640625, 1.4986572265625, 1.74676513671875, 1.994873046875, 2.24298095703125, 2.4910888671875, 2.73919677734375, 2.9873046875, 3.23541259765625, 3.4835205078125, 3.73162841796875, 3.979736328125, 4.22784423828125, 4.4759521484375, 4.72406005859375, 4.97216796875, 5.22027587890625, 5.4683837890625, 5.71649169921875, 5.964599609375, 6.21270751953125, 6.4608154296875, 6.70892333984375, 6.95703125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 6.0, 9.0, 1.0, 5.0, 16.0, 6.0, 10.0, 16.0, 18.0, 17.0, 26.0, 35.0, 64.0, 80.0, 116.0, 168.0, 279.0, 761.0, 1554.0, 286.0, 190.0, 120.0, 63.0, 59.0, 46.0, 19.0, 24.0, 17.0, 17.0, 4.0, 7.0, 8.0, 3.0, 5.0, 4.0, 2.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.5986328125, -1.5544281005859375, -1.510223388671875, -1.4660186767578125, -1.42181396484375, -1.3776092529296875, -1.333404541015625, -1.2891998291015625, -1.2449951171875, -1.2007904052734375, -1.156585693359375, -1.1123809814453125, -1.06817626953125, -1.0239715576171875, -0.979766845703125, -0.9355621337890625, -0.891357421875, -0.8471527099609375, -0.802947998046875, -0.7587432861328125, -0.71453857421875, -0.6703338623046875, -0.626129150390625, -0.5819244384765625, -0.5377197265625, -0.4935150146484375, -0.449310302734375, -0.4051055908203125, -0.36090087890625, -0.3166961669921875, -0.272491455078125, -0.2282867431640625, -0.18408203125, -0.1398773193359375, -0.095672607421875, -0.0514678955078125, -0.00726318359375, 0.0369415283203125, 0.081146240234375, 0.1253509521484375, 0.1695556640625, 0.2137603759765625, 0.257965087890625, 0.3021697998046875, 0.34637451171875, 0.3905792236328125, 0.434783935546875, 0.4789886474609375, 0.523193359375, 0.5673980712890625, 0.611602783203125, 0.6558074951171875, 0.70001220703125, 0.7442169189453125, 0.788421630859375, 0.8326263427734375, 0.8768310546875, 0.9210357666015625, 0.965240478515625, 1.0094451904296875, 1.05364990234375, 1.0978546142578125, 1.142059326171875, 1.1862640380859375, 1.23046875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 3.0, 10.0, 24.0, 105.0, 572.0, 252.0, 30.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-58.69364547729492, -57.62516784667969, -56.55668640136719, -55.48820877075195, -54.41973114013672, -53.35124969482422, -52.282772064208984, -51.21429443359375, -50.14581298828125, -49.077335357666016, -48.008853912353516, -46.94037628173828, -45.87189865112305, -44.80341720581055, -43.73493957519531, -42.66646194458008, -41.597984313964844, -40.52950668334961, -39.46102523803711, -38.392547607421875, -37.32406997680664, -36.25558853149414, -35.187110900878906, -34.11863327026367, -33.05015182495117, -31.981672286987305, -30.91319465637207, -29.844715118408203, -28.776235580444336, -27.70775604248047, -26.639278411865234, -25.570798873901367, -24.5023193359375, -23.433839797973633, -22.3653621673584, -21.29688262939453, -20.228403091430664, -19.159923553466797, -18.091445922851562, -17.022966384887695, -15.954487800598145, -14.886009216308594, -13.817529678344727, -12.749051094055176, -11.680572509765625, -10.612092971801758, -9.543614387512207, -8.475135803222656, -7.406656265258789, -6.33817720413208, -5.269698143005371, -4.20121955871582, -3.1327404975891113, -2.0642614364624023, -0.9957828521728516, 0.07269620895385742, 1.1411752700805664, 2.2096543312072754, 3.2781331539154053, 4.346611976623535, 5.415091037750244, 6.483570098876953, 7.552048683166504, 8.620527267456055, 9.689006805419922]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 5.0, 2.0, 6.0, 12.0, 8.0, 12.0, 21.0, 25.0, 18.0, 40.0, 49.0, 61.0, 51.0, 49.0, 59.0, 58.0, 61.0, 71.0, 75.0, 48.0, 35.0, 44.0, 40.0, 31.0, 24.0, 25.0, 8.0, 10.0, 12.0, 9.0, 2.0, 9.0, 7.0, 5.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.984344482421875, -8.689896583557129, -8.395448684692383, -8.101000785827637, -7.806553363800049, -7.512105464935303, -7.217658042907715, -6.923210144042969, -6.628762245178223, -6.334314346313477, -6.0398664474487305, -5.745419025421143, -5.4509711265563965, -5.15652322769165, -4.8620758056640625, -4.567627906799316, -4.27318000793457, -3.978732109069824, -3.6842844486236572, -3.3898367881774902, -3.095388889312744, -2.800940990447998, -2.506493330001831, -2.212045669555664, -1.917597770690918, -1.6231499910354614, -1.3287022113800049, -1.0342544317245483, -0.7398066520690918, -0.44535887241363525, -0.1509110927581787, 0.14353656768798828, 0.43798351287841797, 0.7324312925338745, 1.026879072189331, 1.3213268518447876, 1.6157746315002441, 1.9102224111557007, 2.2046701908111572, 2.499117851257324, 2.7935657501220703, 3.0880136489868164, 3.3824613094329834, 3.6769089698791504, 3.9713568687438965, 4.265804767608643, 4.5602521896362305, 4.854700088500977, 5.149147987365723, 5.443595886230469, 5.738043785095215, 6.032491207122803, 6.326939105987549, 6.621387004852295, 6.915834426879883, 7.210282325744629, 7.504730224609375, 7.799178123474121, 8.093626022338867, 8.388073921203613, 8.68252182006836, 8.976968765258789, 9.271416664123535, 9.565864562988281, 9.860312461853027]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 1.0, 1.0, 4.0, 11.0, 12.0, 12.0, 16.0, 34.0, 40.0, 55.0, 76.0, 128.0, 170.0, 268.0, 408.0, 636.0, 1022.0, 1667.0, 3015.0, 5416.0, 10843.0, 27529.0, 201325.0, 712029.0, 52015.0, 15177.0, 7156.0, 3874.0, 2145.0, 1282.0, 744.0, 487.0, 297.0, 197.0, 137.0, 88.0, 57.0, 55.0, 36.0, 35.0, 15.0, 11.0, 4.0, 8.0, 3.0, 4.0, 6.0, 3.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.3828125, -8.1142578125, -7.845703125, -7.5771484375, -7.30859375, -7.0400390625, -6.771484375, -6.5029296875, -6.234375, -5.9658203125, -5.697265625, -5.4287109375, -5.16015625, -4.8916015625, -4.623046875, -4.3544921875, -4.0859375, -3.8173828125, -3.548828125, -3.2802734375, -3.01171875, -2.7431640625, -2.474609375, -2.2060546875, -1.9375, -1.6689453125, -1.400390625, -1.1318359375, -0.86328125, -0.5947265625, -0.326171875, -0.0576171875, 0.2109375, 0.4794921875, 0.748046875, 1.0166015625, 1.28515625, 1.5537109375, 1.822265625, 2.0908203125, 2.359375, 2.6279296875, 2.896484375, 3.1650390625, 3.43359375, 3.7021484375, 3.970703125, 4.2392578125, 4.5078125, 4.7763671875, 5.044921875, 5.3134765625, 5.58203125, 5.8505859375, 6.119140625, 6.3876953125, 6.65625, 6.9248046875, 7.193359375, 7.4619140625, 7.73046875, 7.9990234375, 8.267578125, 8.5361328125, 8.8046875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 4.0, 6.0, 4.0, 6.0, 5.0, 10.0, 17.0, 24.0, 65.0, 142.0, 200.0, 220.0, 131.0, 61.0, 20.0, 23.0, 12.0, 8.0, 6.0, 5.0, 4.0, 5.0, 4.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.490234375, -1.4452056884765625, -1.400177001953125, -1.3551483154296875, -1.31011962890625, -1.2650909423828125, -1.220062255859375, -1.1750335693359375, -1.1300048828125, -1.0849761962890625, -1.039947509765625, -0.9949188232421875, -0.94989013671875, -0.9048614501953125, -0.859832763671875, -0.8148040771484375, -0.769775390625, -0.7247467041015625, -0.679718017578125, -0.6346893310546875, -0.58966064453125, -0.5446319580078125, -0.499603271484375, -0.4545745849609375, -0.4095458984375, -0.3645172119140625, -0.319488525390625, -0.2744598388671875, -0.22943115234375, -0.1844024658203125, -0.139373779296875, -0.0943450927734375, -0.04931640625, -0.0042877197265625, 0.040740966796875, 0.0857696533203125, 0.13079833984375, 0.1758270263671875, 0.220855712890625, 0.2658843994140625, 0.3109130859375, 0.3559417724609375, 0.400970458984375, 0.4459991455078125, 0.49102783203125, 0.5360565185546875, 0.581085205078125, 0.6261138916015625, 0.671142578125, 0.7161712646484375, 0.761199951171875, 0.8062286376953125, 0.85125732421875, 0.8962860107421875, 0.941314697265625, 0.9863433837890625, 1.0313720703125, 1.0764007568359375, 1.121429443359375, 1.1664581298828125, 1.21148681640625, 1.2565155029296875, 1.301544189453125, 1.3465728759765625, 1.3916015625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 5.0, 2.0, 5.0, 2.0, 21.0, 24.0, 34.0, 41.0, 42.0, 80.0, 110.0, 137.0, 210.0, 329.0, 481.0, 807.0, 1575.0, 3215.0, 7442.0, 18988.0, 54022.0, 190890.0, 564733.0, 135318.0, 42161.0, 15201.0, 6302.0, 2699.0, 1390.0, 769.0, 499.0, 294.0, 190.0, 164.0, 115.0, 68.0, 54.0, 44.0, 35.0, 24.0, 10.0, 9.0, 8.0, 2.0, 3.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.06640625, -3.9122314453125, -3.758056640625, -3.6038818359375, -3.44970703125, -3.2955322265625, -3.141357421875, -2.9871826171875, -2.8330078125, -2.6788330078125, -2.524658203125, -2.3704833984375, -2.21630859375, -2.0621337890625, -1.907958984375, -1.7537841796875, -1.599609375, -1.4454345703125, -1.291259765625, -1.1370849609375, -0.98291015625, -0.8287353515625, -0.674560546875, -0.5203857421875, -0.3662109375, -0.2120361328125, -0.057861328125, 0.0963134765625, 0.25048828125, 0.4046630859375, 0.558837890625, 0.7130126953125, 0.8671875, 1.0213623046875, 1.175537109375, 1.3297119140625, 1.48388671875, 1.6380615234375, 1.792236328125, 1.9464111328125, 2.1005859375, 2.2547607421875, 2.408935546875, 2.5631103515625, 2.71728515625, 2.8714599609375, 3.025634765625, 3.1798095703125, 3.333984375, 3.4881591796875, 3.642333984375, 3.7965087890625, 3.95068359375, 4.1048583984375, 4.259033203125, 4.4132080078125, 4.5673828125, 4.7215576171875, 4.875732421875, 5.0299072265625, 5.18408203125, 5.3382568359375, 5.492431640625, 5.6466064453125, 5.80078125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 5.0, 7.0, 7.0, 11.0, 11.0, 15.0, 12.0, 17.0, 17.0, 25.0, 35.0, 29.0, 32.0, 35.0, 35.0, 32.0, 41.0, 53.0, 46.0, 47.0, 46.0, 42.0, 42.0, 32.0, 41.0, 35.0, 31.0, 37.0, 29.0, 23.0, 27.0, 21.0, 16.0, 11.0, 12.0, 15.0, 8.0, 8.0, 7.0, 3.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.32421875, -3.19866943359375, -3.0731201171875, -2.94757080078125, -2.822021484375, -2.69647216796875, -2.5709228515625, -2.44537353515625, -2.31982421875, -2.19427490234375, -2.0687255859375, -1.94317626953125, -1.817626953125, -1.69207763671875, -1.5665283203125, -1.44097900390625, -1.3154296875, -1.18988037109375, -1.0643310546875, -0.93878173828125, -0.813232421875, -0.68768310546875, -0.5621337890625, -0.43658447265625, -0.31103515625, -0.18548583984375, -0.0599365234375, 0.06561279296875, 0.191162109375, 0.31671142578125, 0.4422607421875, 0.56781005859375, 0.693359375, 0.81890869140625, 0.9444580078125, 1.07000732421875, 1.195556640625, 1.32110595703125, 1.4466552734375, 1.57220458984375, 1.69775390625, 1.82330322265625, 1.9488525390625, 2.07440185546875, 2.199951171875, 2.32550048828125, 2.4510498046875, 2.57659912109375, 2.7021484375, 2.82769775390625, 2.9532470703125, 3.07879638671875, 3.204345703125, 3.32989501953125, 3.4554443359375, 3.58099365234375, 3.70654296875, 3.83209228515625, 3.9576416015625, 4.08319091796875, 4.208740234375, 4.33428955078125, 4.4598388671875, 4.58538818359375, 4.7109375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 4.0, 5.0, 6.0, 9.0, 19.0, 35.0, 55.0, 113.0, 260.0, 681.0, 2126.0, 16088.0, 966060.0, 58019.0, 3506.0, 897.0, 347.0, 163.0, 54.0, 37.0, 22.0, 15.0, 10.0, 6.0, 8.0, 5.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.609375, -11.2308349609375, -10.852294921875, -10.4737548828125, -10.09521484375, -9.7166748046875, -9.338134765625, -8.9595947265625, -8.5810546875, -8.2025146484375, -7.823974609375, -7.4454345703125, -7.06689453125, -6.6883544921875, -6.309814453125, -5.9312744140625, -5.552734375, -5.1741943359375, -4.795654296875, -4.4171142578125, -4.03857421875, -3.6600341796875, -3.281494140625, -2.9029541015625, -2.5244140625, -2.1458740234375, -1.767333984375, -1.3887939453125, -1.01025390625, -0.6317138671875, -0.253173828125, 0.1253662109375, 0.50390625, 0.8824462890625, 1.260986328125, 1.6395263671875, 2.01806640625, 2.3966064453125, 2.775146484375, 3.1536865234375, 3.5322265625, 3.9107666015625, 4.289306640625, 4.6678466796875, 5.04638671875, 5.4249267578125, 5.803466796875, 6.1820068359375, 6.560546875, 6.9390869140625, 7.317626953125, 7.6961669921875, 8.07470703125, 8.4532470703125, 8.831787109375, 9.2103271484375, 9.5888671875, 9.9674072265625, 10.345947265625, 10.7244873046875, 11.10302734375, 11.4815673828125, 11.860107421875, 12.2386474609375, 12.6171875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 11.0, 12.0, 30.0, 117.0, 315.0, 374.0, 95.0, 34.0, 14.0, 5.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00025653839111328125, -0.00022448599338531494, -0.00019243359565734863, -0.00016038119792938232, -0.00012832880020141602, -9.627640247344971e-05, -6.42240047454834e-05, -3.217160701751709e-05, -1.1920928955078125e-07, 3.193318843841553e-05, 6.398558616638184e-05, 9.603798389434814e-05, 0.00012809038162231445, 0.00016014277935028076, 0.00019219517707824707, 0.00022424757480621338, 0.0002562999725341797, 0.000288352370262146, 0.0003204047679901123, 0.0003524571657180786, 0.0003845095634460449, 0.00041656196117401123, 0.00044861435890197754, 0.00048066675662994385, 0.0005127191543579102, 0.0005447715520858765, 0.0005768239498138428, 0.0006088763475418091, 0.0006409287452697754, 0.0006729811429977417, 0.000705033540725708, 0.0007370859384536743, 0.0007691383361816406, 0.0008011907339096069, 0.0008332431316375732, 0.0008652955293655396, 0.0008973479270935059, 0.0009294003248214722, 0.0009614527225494385, 0.0009935051202774048, 0.001025557518005371, 0.0010576099157333374, 0.0010896623134613037, 0.00112171471118927, 0.0011537671089172363, 0.0011858195066452026, 0.001217871904373169, 0.0012499243021011353, 0.0012819766998291016, 0.0013140290975570679, 0.0013460814952850342, 0.0013781338930130005, 0.0014101862907409668, 0.001442238688468933, 0.0014742910861968994, 0.0015063434839248657, 0.001538395881652832, 0.0015704482793807983, 0.0016025006771087646, 0.001634553074836731, 0.0016666054725646973, 0.0016986578702926636, 0.0017307102680206299, 0.0017627626657485962, 0.0017948150634765625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 5.0, 1.0, 3.0, 3.0, 8.0, 15.0, 13.0, 15.0, 19.0, 37.0, 54.0, 72.0, 96.0, 135.0, 224.0, 367.0, 630.0, 1144.0, 2362.0, 6138.0, 17645.0, 73682.0, 602433.0, 282609.0, 41430.0, 11308.0, 4089.0, 1849.0, 883.0, 481.0, 287.0, 158.0, 122.0, 65.0, 61.0, 33.0, 25.0, 14.0, 10.0, 10.0, 6.0, 4.0, 7.0, 4.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.14453125, -4.02880859375, -3.9130859375, -3.79736328125, -3.681640625, -3.56591796875, -3.4501953125, -3.33447265625, -3.21875, -3.10302734375, -2.9873046875, -2.87158203125, -2.755859375, -2.64013671875, -2.5244140625, -2.40869140625, -2.29296875, -2.17724609375, -2.0615234375, -1.94580078125, -1.830078125, -1.71435546875, -1.5986328125, -1.48291015625, -1.3671875, -1.25146484375, -1.1357421875, -1.02001953125, -0.904296875, -0.78857421875, -0.6728515625, -0.55712890625, -0.44140625, -0.32568359375, -0.2099609375, -0.09423828125, 0.021484375, 0.13720703125, 0.2529296875, 0.36865234375, 0.484375, 0.60009765625, 0.7158203125, 0.83154296875, 0.947265625, 1.06298828125, 1.1787109375, 1.29443359375, 1.41015625, 1.52587890625, 1.6416015625, 1.75732421875, 1.873046875, 1.98876953125, 2.1044921875, 2.22021484375, 2.3359375, 2.45166015625, 2.5673828125, 2.68310546875, 2.798828125, 2.91455078125, 3.0302734375, 3.14599609375, 3.26171875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 6.0, 4.0, 9.0, 7.0, 4.0, 13.0, 14.0, 14.0, 16.0, 19.0, 23.0, 40.0, 52.0, 47.0, 77.0, 80.0, 101.0, 101.0, 92.0, 58.0, 49.0, 42.0, 28.0, 22.0, 20.0, 16.0, 12.0, 12.0, 8.0, 5.0, 1.0, 2.0, 4.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.3984375, -3.30511474609375, -3.2117919921875, -3.11846923828125, -3.025146484375, -2.93182373046875, -2.8385009765625, -2.74517822265625, -2.65185546875, -2.55853271484375, -2.4652099609375, -2.37188720703125, -2.278564453125, -2.18524169921875, -2.0919189453125, -1.99859619140625, -1.9052734375, -1.81195068359375, -1.7186279296875, -1.62530517578125, -1.531982421875, -1.43865966796875, -1.3453369140625, -1.25201416015625, -1.15869140625, -1.06536865234375, -0.9720458984375, -0.87872314453125, -0.785400390625, -0.69207763671875, -0.5987548828125, -0.50543212890625, -0.412109375, -0.31878662109375, -0.2254638671875, -0.13214111328125, -0.038818359375, 0.05450439453125, 0.1478271484375, 0.24114990234375, 0.33447265625, 0.42779541015625, 0.5211181640625, 0.61444091796875, 0.707763671875, 0.80108642578125, 0.8944091796875, 0.98773193359375, 1.0810546875, 1.17437744140625, 1.2677001953125, 1.36102294921875, 1.454345703125, 1.54766845703125, 1.6409912109375, 1.73431396484375, 1.82763671875, 1.92095947265625, 2.0142822265625, 2.10760498046875, 2.200927734375, 2.29425048828125, 2.3875732421875, 2.48089599609375, 2.57421875]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 17.0, 48.0, 179.0, 532.0, 170.0, 35.0, 12.0, 8.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.53518676757812, -72.88227844238281, -70.22936248779297, -67.57645416259766, -64.92354583740234, -62.2706298828125, -59.61772155761719, -56.96480941772461, -54.31189727783203, -51.65898513793945, -49.00607681274414, -46.35316467285156, -43.700252532958984, -41.047340393066406, -38.394432067871094, -35.741519927978516, -33.0886116027832, -30.435701370239258, -27.78278923034668, -25.129878997802734, -22.476966857910156, -19.82405662536621, -17.171146392822266, -14.518234252929688, -11.865324020385742, -9.21241283416748, -6.559502124786377, -3.9065914154052734, -1.2536802291870117, 1.39923095703125, 4.052141189575195, 6.705053329467773, 9.357963562011719, 12.01087474822998, 14.663785934448242, 17.316696166992188, 19.969608306884766, 22.62251853942871, 25.275428771972656, 27.928340911865234, 30.58125114440918, 33.234161376953125, 35.8870735168457, 38.53998565673828, 41.192893981933594, 43.84580612182617, 46.49871826171875, 49.15162658691406, 51.80453872680664, 54.45745086669922, 57.11035919189453, 59.76327133178711, 62.41618347167969, 65.069091796875, 67.72200012207031, 70.37491607666016, 73.02782440185547, 75.68073272705078, 78.33364868164062, 80.98655700683594, 83.63946533203125, 86.2923812866211, 88.9452896118164, 91.59820556640625, 94.25111389160156]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 6.0, 5.0, 3.0, 9.0, 5.0, 9.0, 10.0, 12.0, 18.0, 31.0, 51.0, 33.0, 66.0, 76.0, 90.0, 97.0, 88.0, 77.0, 68.0, 60.0, 50.0, 36.0, 25.0, 17.0, 14.0, 9.0, 7.0, 6.0, 2.0, 7.0, 3.0, 2.0, 3.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.034263610839844, -38.54399490356445, -37.0537223815918, -35.563453674316406, -34.073184967041016, -32.582916259765625, -31.09264373779297, -29.602375030517578, -28.112104415893555, -26.62183380126953, -25.13156509399414, -23.641294479370117, -22.151023864746094, -20.660755157470703, -19.17048454284668, -17.680213928222656, -16.189945220947266, -14.699675559997559, -13.209405899047852, -11.719135284423828, -10.228865623474121, -8.738595962524414, -7.248325347900391, -5.758055686950684, -4.267786026000977, -2.7775161266326904, -1.2872462272644043, 0.20302391052246094, 1.693293571472168, 3.183563232421875, 4.673833847045898, 6.1641035079956055, 7.654369354248047, 9.144639015197754, 10.634908676147461, 12.125179290771484, 13.615448951721191, 15.105718612670898, 16.595989227294922, 18.086257934570312, 19.576528549194336, 21.06679916381836, 22.55706787109375, 24.047338485717773, 25.537609100341797, 27.027877807617188, 28.51814842224121, 30.008419036865234, 31.498687744140625, 32.988956451416016, 34.47922897338867, 35.96949768066406, 37.45976638793945, 38.950035095214844, 40.4403076171875, 41.93057632446289, 43.42084503173828, 44.91111373901367, 46.40138626098633, 47.89165496826172, 49.38192367553711, 50.8721923828125, 52.362464904785156, 53.85273361206055, 55.3430061340332]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 10.0, 5.0, 7.0, 11.0, 16.0, 23.0, 29.0, 35.0, 60.0, 105.0, 160.0, 278.0, 481.0, 896.0, 1906.0, 5511.0, 35758.0, 4095855.0, 42290.0, 6231.0, 2151.0, 914.0, 555.0, 338.0, 183.0, 127.0, 83.0, 68.0, 48.0, 38.0, 26.0, 21.0, 22.0, 11.0, 6.0, 6.0, 4.0, 5.0, 1.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-35.1875, -34.13818359375, -33.0888671875, -32.03955078125, -30.990234375, -29.94091796875, -28.8916015625, -27.84228515625, -26.79296875, -25.74365234375, -24.6943359375, -23.64501953125, -22.595703125, -21.54638671875, -20.4970703125, -19.44775390625, -18.3984375, -17.34912109375, -16.2998046875, -15.25048828125, -14.201171875, -13.15185546875, -12.1025390625, -11.05322265625, -10.00390625, -8.95458984375, -7.9052734375, -6.85595703125, -5.806640625, -4.75732421875, -3.7080078125, -2.65869140625, -1.609375, -0.56005859375, 0.4892578125, 1.53857421875, 2.587890625, 3.63720703125, 4.6865234375, 5.73583984375, 6.78515625, 7.83447265625, 8.8837890625, 9.93310546875, 10.982421875, 12.03173828125, 13.0810546875, 14.13037109375, 15.1796875, 16.22900390625, 17.2783203125, 18.32763671875, 19.376953125, 20.42626953125, 21.4755859375, 22.52490234375, 23.57421875, 24.62353515625, 25.6728515625, 26.72216796875, 27.771484375, 28.82080078125, 29.8701171875, 30.91943359375, 31.96875]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 3.0, 2.0, 5.0, 7.0, 9.0, 9.0, 18.0, 35.0, 75.0, 142.0, 211.0, 213.0, 133.0, 61.0, 22.0, 19.0, 10.0, 11.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.6298828125, -1.58184814453125, -1.5338134765625, -1.48577880859375, -1.437744140625, -1.38970947265625, -1.3416748046875, -1.29364013671875, -1.24560546875, -1.19757080078125, -1.1495361328125, -1.10150146484375, -1.053466796875, -1.00543212890625, -0.9573974609375, -0.90936279296875, -0.861328125, -0.81329345703125, -0.7652587890625, -0.71722412109375, -0.669189453125, -0.62115478515625, -0.5731201171875, -0.52508544921875, -0.47705078125, -0.42901611328125, -0.3809814453125, -0.33294677734375, -0.284912109375, -0.23687744140625, -0.1888427734375, -0.14080810546875, -0.0927734375, -0.04473876953125, 0.0032958984375, 0.05133056640625, 0.099365234375, 0.14739990234375, 0.1954345703125, 0.24346923828125, 0.29150390625, 0.33953857421875, 0.3875732421875, 0.43560791015625, 0.483642578125, 0.53167724609375, 0.5797119140625, 0.62774658203125, 0.67578125, 0.72381591796875, 0.7718505859375, 0.81988525390625, 0.867919921875, 0.91595458984375, 0.9639892578125, 1.01202392578125, 1.06005859375, 1.10809326171875, 1.1561279296875, 1.20416259765625, 1.252197265625, 1.30023193359375, 1.3482666015625, 1.39630126953125, 1.4443359375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 5.0, 7.0, 7.0, 8.0, 9.0, 14.0, 10.0, 22.0, 36.0, 46.0, 102.0, 382.0, 2656.0, 74236.0, 4104023.0, 11173.0, 1050.0, 252.0, 87.0, 53.0, 27.0, 19.0, 18.0, 10.0, 6.0, 4.0, 3.0, 6.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.9375, -41.6845703125, -40.431640625, -39.1787109375, -37.92578125, -36.6728515625, -35.419921875, -34.1669921875, -32.9140625, -31.6611328125, -30.408203125, -29.1552734375, -27.90234375, -26.6494140625, -25.396484375, -24.1435546875, -22.890625, -21.6376953125, -20.384765625, -19.1318359375, -17.87890625, -16.6259765625, -15.373046875, -14.1201171875, -12.8671875, -11.6142578125, -10.361328125, -9.1083984375, -7.85546875, -6.6025390625, -5.349609375, -4.0966796875, -2.84375, -1.5908203125, -0.337890625, 0.9150390625, 2.16796875, 3.4208984375, 4.673828125, 5.9267578125, 7.1796875, 8.4326171875, 9.685546875, 10.9384765625, 12.19140625, 13.4443359375, 14.697265625, 15.9501953125, 17.203125, 18.4560546875, 19.708984375, 20.9619140625, 22.21484375, 23.4677734375, 24.720703125, 25.9736328125, 27.2265625, 28.4794921875, 29.732421875, 30.9853515625, 32.23828125, 33.4912109375, 34.744140625, 35.9970703125, 37.25]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 3.0, 3.0, 5.0, 7.0, 4.0, 10.0, 11.0, 22.0, 31.0, 36.0, 70.0, 101.0, 193.0, 636.0, 2240.0, 311.0, 129.0, 68.0, 48.0, 38.0, 20.0, 21.0, 11.0, 11.0, 13.0, 9.0, 4.0, 3.0, 7.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.966796875, -1.901824951171875, -1.83685302734375, -1.771881103515625, -1.7069091796875, -1.641937255859375, -1.57696533203125, -1.511993408203125, -1.447021484375, -1.382049560546875, -1.31707763671875, -1.252105712890625, -1.1871337890625, -1.122161865234375, -1.05718994140625, -0.992218017578125, -0.92724609375, -0.862274169921875, -0.79730224609375, -0.732330322265625, -0.6673583984375, -0.602386474609375, -0.53741455078125, -0.472442626953125, -0.407470703125, -0.342498779296875, -0.27752685546875, -0.212554931640625, -0.1475830078125, -0.082611083984375, -0.01763916015625, 0.047332763671875, 0.1123046875, 0.177276611328125, 0.24224853515625, 0.307220458984375, 0.3721923828125, 0.437164306640625, 0.50213623046875, 0.567108154296875, 0.632080078125, 0.697052001953125, 0.76202392578125, 0.826995849609375, 0.8919677734375, 0.956939697265625, 1.02191162109375, 1.086883544921875, 1.15185546875, 1.216827392578125, 1.28179931640625, 1.346771240234375, 1.4117431640625, 1.476715087890625, 1.54168701171875, 1.606658935546875, 1.671630859375, 1.736602783203125, 1.80157470703125, 1.866546630859375, 1.9315185546875, 1.996490478515625, 2.06146240234375, 2.126434326171875, 2.19140625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 9.0, 39.0, 212.0, 482.0, 178.0, 42.0, 23.0, 11.0, 8.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.168739318847656, -14.386367797851562, -13.603996276855469, -12.821623802185059, -12.039252281188965, -11.256880760192871, -10.474508285522461, -9.692136764526367, -8.909765243530273, -8.12739372253418, -7.345021724700928, -6.562649726867676, -5.780278205871582, -4.997906684875488, -4.215534687042236, -3.4331626892089844, -2.6507911682128906, -1.8684194087982178, -1.086047649383545, -0.30367588996887207, 0.4786958694458008, 1.2610676288604736, 2.0434393882751465, 2.8258113861083984, 3.608182907104492, 4.390554428100586, 5.172926425933838, 5.95529842376709, 6.737669944763184, 7.520041465759277, 8.302413940429688, 9.084785461425781, 9.867156982421875, 10.649528503417969, 11.431900024414062, 12.214272499084473, 12.996644020080566, 13.77901554107666, 14.56138801574707, 15.343759536743164, 16.126131057739258, 16.90850257873535, 17.690874099731445, 18.47324562072754, 19.255619049072266, 20.03799057006836, 20.820362091064453, 21.602733612060547, 22.38510513305664, 23.167476654052734, 23.949848175048828, 24.732219696044922, 25.514591217041016, 26.296964645385742, 27.079336166381836, 27.86170768737793, 28.644079208374023, 29.426450729370117, 30.20882225036621, 30.991193771362305, 31.77356719970703, 32.555938720703125, 33.33831024169922, 34.12068176269531, 34.903053283691406]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 5.0, 6.0, 9.0, 13.0, 16.0, 21.0, 26.0, 34.0, 45.0, 54.0, 47.0, 66.0, 64.0, 62.0, 68.0, 63.0, 71.0, 67.0, 54.0, 38.0, 39.0, 28.0, 22.0, 24.0, 15.0, 13.0, 6.0, 6.0, 5.0, 2.0, 2.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.673911094665527, -9.397655487060547, -9.121399879455566, -8.845144271850586, -8.568888664245605, -8.292633056640625, -8.016376495361328, -7.740121364593506, -7.463865280151367, -7.187609672546387, -6.911354064941406, -6.635098457336426, -6.358842372894287, -6.082586765289307, -5.806331157684326, -5.530075550079346, -5.253819942474365, -4.977564334869385, -4.701308727264404, -4.425052642822266, -4.148797035217285, -3.8725414276123047, -3.596285820007324, -3.3200302124023438, -3.043774366378784, -2.7675187587738037, -2.491262912750244, -2.2150073051452637, -1.9387515783309937, -1.6624958515167236, -1.3862402439117432, -1.1099845170974731, -0.8337287902832031, -0.5574730634689331, -0.28121739625930786, -0.004961729049682617, 0.2712939977645874, 0.5475497245788574, 0.8238053321838379, 1.100061058998108, 1.376316785812378, 1.652572512626648, 1.928828239440918, 2.2050838470458984, 2.481339454650879, 2.7575953006744385, 3.033850908279419, 3.3101067543029785, 3.586362361907959, 3.8626179695129395, 4.13887357711792, 4.415129661560059, 4.691385269165039, 4.9676408767700195, 5.243896484375, 5.5201520919799805, 5.796407699584961, 6.072663307189941, 6.348918914794922, 6.625174522399902, 6.901430606842041, 7.1776862144470215, 7.453941822052002, 7.730197429656982, 8.006453514099121]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 3.0, 1.0, 11.0, 2.0, 13.0, 8.0, 31.0, 34.0, 38.0, 76.0, 94.0, 134.0, 204.0, 311.0, 574.0, 992.0, 2197.0, 6035.0, 28802.0, 677788.0, 303611.0, 19024.0, 4487.0, 1814.0, 906.0, 479.0, 291.0, 201.0, 114.0, 90.0, 57.0, 31.0, 21.0, 23.0, 9.0, 19.0, 6.0, 9.0, 4.0, 9.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.734375, -13.3037109375, -12.873046875, -12.4423828125, -12.01171875, -11.5810546875, -11.150390625, -10.7197265625, -10.2890625, -9.8583984375, -9.427734375, -8.9970703125, -8.56640625, -8.1357421875, -7.705078125, -7.2744140625, -6.84375, -6.4130859375, -5.982421875, -5.5517578125, -5.12109375, -4.6904296875, -4.259765625, -3.8291015625, -3.3984375, -2.9677734375, -2.537109375, -2.1064453125, -1.67578125, -1.2451171875, -0.814453125, -0.3837890625, 0.046875, 0.4775390625, 0.908203125, 1.3388671875, 1.76953125, 2.2001953125, 2.630859375, 3.0615234375, 3.4921875, 3.9228515625, 4.353515625, 4.7841796875, 5.21484375, 5.6455078125, 6.076171875, 6.5068359375, 6.9375, 7.3681640625, 7.798828125, 8.2294921875, 8.66015625, 9.0908203125, 9.521484375, 9.9521484375, 10.3828125, 10.8134765625, 11.244140625, 11.6748046875, 12.10546875, 12.5361328125, 12.966796875, 13.3974609375, 13.828125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 4.0, 5.0, 7.0, 20.0, 36.0, 71.0, 134.0, 219.0, 205.0, 147.0, 65.0, 35.0, 14.0, 13.0, 11.0, 4.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.7490234375, -1.70050048828125, -1.6519775390625, -1.60345458984375, -1.554931640625, -1.50640869140625, -1.4578857421875, -1.40936279296875, -1.36083984375, -1.31231689453125, -1.2637939453125, -1.21527099609375, -1.166748046875, -1.11822509765625, -1.0697021484375, -1.02117919921875, -0.97265625, -0.92413330078125, -0.8756103515625, -0.82708740234375, -0.778564453125, -0.73004150390625, -0.6815185546875, -0.63299560546875, -0.58447265625, -0.53594970703125, -0.4874267578125, -0.43890380859375, -0.390380859375, -0.34185791015625, -0.2933349609375, -0.24481201171875, -0.1962890625, -0.14776611328125, -0.0992431640625, -0.05072021484375, -0.002197265625, 0.04632568359375, 0.0948486328125, 0.14337158203125, 0.19189453125, 0.24041748046875, 0.2889404296875, 0.33746337890625, 0.385986328125, 0.43450927734375, 0.4830322265625, 0.53155517578125, 0.580078125, 0.62860107421875, 0.6771240234375, 0.72564697265625, 0.774169921875, 0.82269287109375, 0.8712158203125, 0.91973876953125, 0.96826171875, 1.01678466796875, 1.0653076171875, 1.11383056640625, 1.162353515625, 1.21087646484375, 1.2593994140625, 1.30792236328125, 1.3564453125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 8.0, 6.0, 9.0, 9.0, 22.0, 20.0, 45.0, 46.0, 52.0, 62.0, 89.0, 128.0, 207.0, 298.0, 495.0, 727.0, 1391.0, 2627.0, 5362.0, 12276.0, 31556.0, 102804.0, 429029.0, 332958.0, 80488.0, 26250.0, 10671.0, 4841.0, 2481.0, 1274.0, 720.0, 480.0, 304.0, 216.0, 165.0, 103.0, 87.0, 59.0, 46.0, 34.0, 23.0, 26.0, 22.0, 12.0, 5.0, 10.0, 5.0, 4.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-6.26171875, -6.0714111328125, -5.881103515625, -5.6907958984375, -5.50048828125, -5.3101806640625, -5.119873046875, -4.9295654296875, -4.7392578125, -4.5489501953125, -4.358642578125, -4.1683349609375, -3.97802734375, -3.7877197265625, -3.597412109375, -3.4071044921875, -3.216796875, -3.0264892578125, -2.836181640625, -2.6458740234375, -2.45556640625, -2.2652587890625, -2.074951171875, -1.8846435546875, -1.6943359375, -1.5040283203125, -1.313720703125, -1.1234130859375, -0.93310546875, -0.7427978515625, -0.552490234375, -0.3621826171875, -0.171875, 0.0184326171875, 0.208740234375, 0.3990478515625, 0.58935546875, 0.7796630859375, 0.969970703125, 1.1602783203125, 1.3505859375, 1.5408935546875, 1.731201171875, 1.9215087890625, 2.11181640625, 2.3021240234375, 2.492431640625, 2.6827392578125, 2.873046875, 3.0633544921875, 3.253662109375, 3.4439697265625, 3.63427734375, 3.8245849609375, 4.014892578125, 4.2052001953125, 4.3955078125, 4.5858154296875, 4.776123046875, 4.9664306640625, 5.15673828125, 5.3470458984375, 5.537353515625, 5.7276611328125, 5.91796875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 3.0, 5.0, 1.0, 4.0, 5.0, 6.0, 4.0, 11.0, 15.0, 17.0, 14.0, 26.0, 17.0, 28.0, 29.0, 29.0, 48.0, 34.0, 55.0, 44.0, 43.0, 50.0, 45.0, 37.0, 41.0, 47.0, 32.0, 42.0, 46.0, 32.0, 23.0, 13.0, 20.0, 16.0, 19.0, 14.0, 13.0, 11.0, 12.0, 11.0, 6.0, 5.0, 4.0, 6.0, 4.0, 3.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.52734375, -3.40673828125, -3.2861328125, -3.16552734375, -3.044921875, -2.92431640625, -2.8037109375, -2.68310546875, -2.5625, -2.44189453125, -2.3212890625, -2.20068359375, -2.080078125, -1.95947265625, -1.8388671875, -1.71826171875, -1.59765625, -1.47705078125, -1.3564453125, -1.23583984375, -1.115234375, -0.99462890625, -0.8740234375, -0.75341796875, -0.6328125, -0.51220703125, -0.3916015625, -0.27099609375, -0.150390625, -0.02978515625, 0.0908203125, 0.21142578125, 0.33203125, 0.45263671875, 0.5732421875, 0.69384765625, 0.814453125, 0.93505859375, 1.0556640625, 1.17626953125, 1.296875, 1.41748046875, 1.5380859375, 1.65869140625, 1.779296875, 1.89990234375, 2.0205078125, 2.14111328125, 2.26171875, 2.38232421875, 2.5029296875, 2.62353515625, 2.744140625, 2.86474609375, 2.9853515625, 3.10595703125, 3.2265625, 3.34716796875, 3.4677734375, 3.58837890625, 3.708984375, 3.82958984375, 3.9501953125, 4.07080078125, 4.19140625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 5.0, 5.0, 13.0, 9.0, 37.0, 51.0, 86.0, 185.0, 473.0, 1196.0, 5666.0, 84571.0, 899954.0, 50232.0, 4283.0, 1052.0, 376.0, 172.0, 77.0, 38.0, 23.0, 16.0, 9.0, 11.0, 4.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.234375, -8.9405517578125, -8.646728515625, -8.3529052734375, -8.05908203125, -7.7652587890625, -7.471435546875, -7.1776123046875, -6.8837890625, -6.5899658203125, -6.296142578125, -6.0023193359375, -5.70849609375, -5.4146728515625, -5.120849609375, -4.8270263671875, -4.533203125, -4.2393798828125, -3.945556640625, -3.6517333984375, -3.35791015625, -3.0640869140625, -2.770263671875, -2.4764404296875, -2.1826171875, -1.8887939453125, -1.594970703125, -1.3011474609375, -1.00732421875, -0.7135009765625, -0.419677734375, -0.1258544921875, 0.16796875, 0.4617919921875, 0.755615234375, 1.0494384765625, 1.34326171875, 1.6370849609375, 1.930908203125, 2.2247314453125, 2.5185546875, 2.8123779296875, 3.106201171875, 3.4000244140625, 3.69384765625, 3.9876708984375, 4.281494140625, 4.5753173828125, 4.869140625, 5.1629638671875, 5.456787109375, 5.7506103515625, 6.04443359375, 6.3382568359375, 6.632080078125, 6.9259033203125, 7.2197265625, 7.5135498046875, 7.807373046875, 8.1011962890625, 8.39501953125, 8.6888427734375, 8.982666015625, 9.2764892578125, 9.5703125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 4.0, 2.0, 1.0, 5.0, 5.0, 3.0, 11.0, 11.0, 11.0, 8.0, 20.0, 18.0, 23.0, 43.0, 33.0, 46.0, 68.0, 79.0, 82.0, 102.0, 74.0, 66.0, 73.0, 48.0, 31.0, 33.0, 17.0, 22.0, 11.0, 10.0, 7.0, 4.0, 5.0, 5.0, 5.0, 1.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.0003845691680908203, -0.00037327781319618225, -0.0003619864583015442, -0.00035069510340690613, -0.00033940374851226807, -0.00032811239361763, -0.00031682103872299194, -0.0003055296838283539, -0.0002942383289337158, -0.00028294697403907776, -0.0002716556191444397, -0.00026036426424980164, -0.0002490729093551636, -0.0002377815544605255, -0.00022649019956588745, -0.0002151988446712494, -0.00020390748977661133, -0.00019261613488197327, -0.0001813247799873352, -0.00017003342509269714, -0.00015874207019805908, -0.00014745071530342102, -0.00013615936040878296, -0.0001248680055141449, -0.00011357665061950684, -0.00010228529572486877, -9.099394083023071e-05, -7.970258593559265e-05, -6.841123104095459e-05, -5.711987614631653e-05, -4.582852125167847e-05, -3.4537166357040405e-05, -2.3245811462402344e-05, -1.1954456567764282e-05, -6.631016731262207e-07, 1.062825322151184e-05, 2.1919608116149902e-05, 3.3210963010787964e-05, 4.4502317905426025e-05, 5.579367280006409e-05, 6.708502769470215e-05, 7.837638258934021e-05, 8.966773748397827e-05, 0.00010095909237861633, 0.0001122504472732544, 0.00012354180216789246, 0.00013483315706253052, 0.00014612451195716858, 0.00015741586685180664, 0.0001687072217464447, 0.00017999857664108276, 0.00019128993153572083, 0.0002025812864303589, 0.00021387264132499695, 0.000225163996219635, 0.00023645535111427307, 0.00024774670600891113, 0.0002590380609035492, 0.00027032941579818726, 0.0002816207706928253, 0.0002929121255874634, 0.00030420348048210144, 0.0003154948353767395, 0.00032678619027137756, 0.0003380775451660156]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 1.0, 3.0, 3.0, 6.0, 2.0, 2.0, 10.0, 6.0, 17.0, 27.0, 31.0, 58.0, 124.0, 194.0, 370.0, 900.0, 2708.0, 12795.0, 172346.0, 796059.0, 53370.0, 6498.0, 1728.0, 646.0, 292.0, 134.0, 98.0, 44.0, 29.0, 19.0, 6.0, 10.0, 5.0, 2.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.58203125, -7.34735107421875, -7.1126708984375, -6.87799072265625, -6.643310546875, -6.40863037109375, -6.1739501953125, -5.93927001953125, -5.70458984375, -5.46990966796875, -5.2352294921875, -5.00054931640625, -4.765869140625, -4.53118896484375, -4.2965087890625, -4.06182861328125, -3.8271484375, -3.59246826171875, -3.3577880859375, -3.12310791015625, -2.888427734375, -2.65374755859375, -2.4190673828125, -2.18438720703125, -1.94970703125, -1.71502685546875, -1.4803466796875, -1.24566650390625, -1.010986328125, -0.77630615234375, -0.5416259765625, -0.30694580078125, -0.072265625, 0.16241455078125, 0.3970947265625, 0.63177490234375, 0.866455078125, 1.10113525390625, 1.3358154296875, 1.57049560546875, 1.80517578125, 2.03985595703125, 2.2745361328125, 2.50921630859375, 2.743896484375, 2.97857666015625, 3.2132568359375, 3.44793701171875, 3.6826171875, 3.91729736328125, 4.1519775390625, 4.38665771484375, 4.621337890625, 4.85601806640625, 5.0906982421875, 5.32537841796875, 5.56005859375, 5.79473876953125, 6.0294189453125, 6.26409912109375, 6.498779296875, 6.73345947265625, 6.9681396484375, 7.20281982421875, 7.4375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 6.0, 5.0, 9.0, 19.0, 9.0, 16.0, 31.0, 40.0, 46.0, 65.0, 66.0, 92.0, 102.0, 116.0, 88.0, 82.0, 44.0, 34.0, 33.0, 33.0, 20.0, 12.0, 14.0, 8.0, 8.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.111328125, -3.0366363525390625, -2.961944580078125, -2.8872528076171875, -2.81256103515625, -2.7378692626953125, -2.663177490234375, -2.5884857177734375, -2.5137939453125, -2.4391021728515625, -2.364410400390625, -2.2897186279296875, -2.21502685546875, -2.1403350830078125, -2.065643310546875, -1.9909515380859375, -1.916259765625, -1.8415679931640625, -1.766876220703125, -1.6921844482421875, -1.61749267578125, -1.5428009033203125, -1.468109130859375, -1.3934173583984375, -1.3187255859375, -1.2440338134765625, -1.169342041015625, -1.0946502685546875, -1.01995849609375, -0.9452667236328125, -0.870574951171875, -0.7958831787109375, -0.72119140625, -0.6464996337890625, -0.571807861328125, -0.4971160888671875, -0.42242431640625, -0.3477325439453125, -0.273040771484375, -0.1983489990234375, -0.1236572265625, -0.0489654541015625, 0.025726318359375, 0.1004180908203125, 0.17510986328125, 0.2498016357421875, 0.324493408203125, 0.3991851806640625, 0.473876953125, 0.5485687255859375, 0.623260498046875, 0.6979522705078125, 0.77264404296875, 0.8473358154296875, 0.922027587890625, 0.9967193603515625, 1.0714111328125, 1.1461029052734375, 1.220794677734375, 1.2954864501953125, 1.37017822265625, 1.4448699951171875, 1.519561767578125, 1.5942535400390625, 1.6689453125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 8.0, 14.0, 17.0, 55.0, 133.0, 402.0, 271.0, 66.0, 24.0, 8.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.47560119628906, -77.24583435058594, -74.01606750488281, -70.78630065917969, -67.5565414428711, -64.32677459716797, -61.097007751464844, -57.86724090576172, -54.63747787475586, -51.407711029052734, -48.177947998046875, -44.94818115234375, -41.718414306640625, -38.488651275634766, -35.25888442993164, -32.02912139892578, -28.799354553222656, -25.569589614868164, -22.339824676513672, -19.110057830810547, -15.880292892456055, -12.650527954101562, -9.420761108398438, -6.190996170043945, -2.961231231689453, 0.26853418350219727, 3.4982995986938477, 6.728065490722656, 9.957830429077148, 13.18759536743164, 16.417362213134766, 19.647127151489258, 22.87689208984375, 26.106657028198242, 29.336421966552734, 32.56618881225586, 35.79595184326172, 39.025718688964844, 42.25548553466797, 45.485252380371094, 48.71501541137695, 51.94478225708008, 55.17454528808594, 58.40431213378906, 61.63407897949219, 64.86384582519531, 68.09361267089844, 71.32337188720703, 74.55313873291016, 77.78290557861328, 81.0126724243164, 84.242431640625, 87.47219848632812, 90.70196533203125, 93.93173217773438, 97.1614990234375, 100.39126586914062, 103.62103271484375, 106.85079956054688, 110.08056640625, 113.3103256225586, 116.54009246826172, 119.76985931396484, 122.99962615966797, 126.22938537597656]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 6.0, 3.0, 10.0, 15.0, 24.0, 27.0, 24.0, 43.0, 77.0, 78.0, 76.0, 77.0, 99.0, 95.0, 57.0, 83.0, 55.0, 33.0, 41.0, 26.0, 15.0, 19.0, 9.0, 4.0, 1.0, 6.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-69.1520004272461, -67.35523223876953, -65.55845642089844, -63.761688232421875, -61.96491622924805, -60.16814422607422, -58.371376037597656, -56.57460403442383, -54.77783203125, -52.98106002807617, -51.18429183959961, -49.38751983642578, -47.59074783325195, -45.793975830078125, -43.99720764160156, -42.200435638427734, -40.40366744995117, -38.606895446777344, -36.81012725830078, -35.01335525512695, -33.216583251953125, -31.41981315612793, -29.623043060302734, -27.826271057128906, -26.02950096130371, -24.232730865478516, -22.435958862304688, -20.639188766479492, -18.842418670654297, -17.04564666748047, -15.248876571655273, -13.452105522155762, -11.655330657958984, -9.858559608459473, -8.061788558959961, -6.265018463134766, -4.468247413635254, -2.671476364135742, -0.8747062683105469, 0.9220647811889648, 2.7188358306884766, 4.515606880187988, 6.312377452850342, 8.109148025512695, 9.905919075012207, 11.702690124511719, 13.499460220336914, 15.296231269836426, 17.093002319335938, 18.889772415161133, 20.68654441833496, 22.483314514160156, 24.280086517333984, 26.07685661315918, 27.873626708984375, 29.670398712158203, 31.4671688079834, 33.263938903808594, 35.06071090698242, 36.85748291015625, 38.65425109863281, 40.45102310180664, 42.24779510498047, 44.04456329345703, 45.84133529663086]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 4.0, 4.0, 12.0, 14.0, 37.0, 94.0, 229.0, 809.0, 12281.0, 4175435.0, 4556.0, 532.0, 174.0, 57.0, 21.0, 10.0, 7.0, 4.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-128.0, -124.6640625, -121.328125, -117.9921875, -114.65625, -111.3203125, -107.984375, -104.6484375, -101.3125, -97.9765625, -94.640625, -91.3046875, -87.96875, -84.6328125, -81.296875, -77.9609375, -74.625, -71.2890625, -67.953125, -64.6171875, -61.28125, -57.9453125, -54.609375, -51.2734375, -47.9375, -44.6015625, -41.265625, -37.9296875, -34.59375, -31.2578125, -27.921875, -24.5859375, -21.25, -17.9140625, -14.578125, -11.2421875, -7.90625, -4.5703125, -1.234375, 2.1015625, 5.4375, 8.7734375, 12.109375, 15.4453125, 18.78125, 22.1171875, 25.453125, 28.7890625, 32.125, 35.4609375, 38.796875, 42.1328125, 45.46875, 48.8046875, 52.140625, 55.4765625, 58.8125, 62.1484375, 65.484375, 68.8203125, 72.15625, 75.4921875, 78.828125, 82.1640625, 85.5]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 3.0, 8.0, 15.0, 18.0, 60.0, 100.0, 145.0, 159.0, 170.0, 137.0, 80.0, 46.0, 24.0, 14.0, 10.0, 4.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.603515625, -2.534942626953125, -2.46636962890625, -2.397796630859375, -2.3292236328125, -2.260650634765625, -2.19207763671875, -2.123504638671875, -2.054931640625, -1.986358642578125, -1.91778564453125, -1.849212646484375, -1.7806396484375, -1.712066650390625, -1.64349365234375, -1.574920654296875, -1.50634765625, -1.437774658203125, -1.36920166015625, -1.300628662109375, -1.2320556640625, -1.163482666015625, -1.09490966796875, -1.026336669921875, -0.957763671875, -0.889190673828125, -0.82061767578125, -0.752044677734375, -0.6834716796875, -0.614898681640625, -0.54632568359375, -0.477752685546875, -0.4091796875, -0.340606689453125, -0.27203369140625, -0.203460693359375, -0.1348876953125, -0.066314697265625, 0.00225830078125, 0.070831298828125, 0.139404296875, 0.207977294921875, 0.27655029296875, 0.345123291015625, 0.4136962890625, 0.482269287109375, 0.55084228515625, 0.619415283203125, 0.68798828125, 0.756561279296875, 0.82513427734375, 0.893707275390625, 0.9622802734375, 1.030853271484375, 1.09942626953125, 1.167999267578125, 1.236572265625, 1.305145263671875, 1.37371826171875, 1.442291259765625, 1.5108642578125, 1.579437255859375, 1.64801025390625, 1.716583251953125, 1.78515625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 13.0, 11.0, 19.0, 30.0, 35.0, 52.0, 88.0, 165.0, 620.0, 8336.0, 4134805.0, 48166.0, 1357.0, 297.0, 117.0, 58.0, 51.0, 25.0, 16.0, 16.0, 5.0, 5.0, 5.0, 0.0, 1.0, 3.0], "bins": [-78.25, -76.642578125, -75.03515625, -73.427734375, -71.8203125, -70.212890625, -68.60546875, -66.998046875, -65.390625, -63.783203125, -62.17578125, -60.568359375, -58.9609375, -57.353515625, -55.74609375, -54.138671875, -52.53125, -50.923828125, -49.31640625, -47.708984375, -46.1015625, -44.494140625, -42.88671875, -41.279296875, -39.671875, -38.064453125, -36.45703125, -34.849609375, -33.2421875, -31.634765625, -30.02734375, -28.419921875, -26.8125, -25.205078125, -23.59765625, -21.990234375, -20.3828125, -18.775390625, -17.16796875, -15.560546875, -13.953125, -12.345703125, -10.73828125, -9.130859375, -7.5234375, -5.916015625, -4.30859375, -2.701171875, -1.09375, 0.513671875, 2.12109375, 3.728515625, 5.3359375, 6.943359375, 8.55078125, 10.158203125, 11.765625, 13.373046875, 14.98046875, 16.587890625, 18.1953125, 19.802734375, 21.41015625, 23.017578125, 24.625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 4.0, 4.0, 5.0, 7.0, 20.0, 46.0, 92.0, 231.0, 2328.0, 989.0, 188.0, 64.0, 49.0, 21.0, 10.0, 9.0, 8.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5546875, -5.40423583984375, -5.2537841796875, -5.10333251953125, -4.952880859375, -4.80242919921875, -4.6519775390625, -4.50152587890625, -4.35107421875, -4.20062255859375, -4.0501708984375, -3.89971923828125, -3.749267578125, -3.59881591796875, -3.4483642578125, -3.29791259765625, -3.1474609375, -2.99700927734375, -2.8465576171875, -2.69610595703125, -2.545654296875, -2.39520263671875, -2.2447509765625, -2.09429931640625, -1.94384765625, -1.79339599609375, -1.6429443359375, -1.49249267578125, -1.342041015625, -1.19158935546875, -1.0411376953125, -0.89068603515625, -0.740234375, -0.58978271484375, -0.4393310546875, -0.28887939453125, -0.138427734375, 0.01202392578125, 0.1624755859375, 0.31292724609375, 0.46337890625, 0.61383056640625, 0.7642822265625, 0.91473388671875, 1.065185546875, 1.21563720703125, 1.3660888671875, 1.51654052734375, 1.6669921875, 1.81744384765625, 1.9678955078125, 2.11834716796875, 2.268798828125, 2.41925048828125, 2.5697021484375, 2.72015380859375, 2.87060546875, 3.02105712890625, 3.1715087890625, 3.32196044921875, 3.472412109375, 3.62286376953125, 3.7733154296875, 3.92376708984375, 4.07421875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 4.0, 13.0, 28.0, 81.0, 195.0, 329.0, 211.0, 74.0, 37.0, 19.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.809279441833496, -13.914764404296875, -13.02025032043457, -12.12573528289795, -11.231220245361328, -10.336705207824707, -9.442190170288086, -8.547676086425781, -7.65316104888916, -6.758646011352539, -5.864131450653076, -4.969616889953613, -4.075101852416992, -3.180586814880371, -2.286072254180908, -1.3915576934814453, -0.4970426559448242, 0.3974721431732178, 1.2919869422912598, 2.1865017414093018, 3.0810165405273438, 3.975531578063965, 4.870046138763428, 5.764560699462891, 6.659075736999512, 7.553590774536133, 8.448104858398438, 9.342619895935059, 10.23713493347168, 11.1316499710083, 12.026165008544922, 12.920679092407227, 13.815193176269531, 14.709708213806152, 15.604223251342773, 16.498737335205078, 17.393253326416016, 18.28776741027832, 19.182281494140625, 20.076797485351562, 20.971311569213867, 21.865825653076172, 22.76034164428711, 23.654855728149414, 24.54936981201172, 25.443885803222656, 26.33839988708496, 27.232913970947266, 28.127429962158203, 29.021944046020508, 29.916460037231445, 30.81097412109375, 31.705490112304688, 32.600006103515625, 33.4945182800293, 34.389034271240234, 35.283546447753906, 36.178062438964844, 37.072574615478516, 37.96709060668945, 38.86160659790039, 39.75611877441406, 40.650634765625, 41.54515075683594, 42.439666748046875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 3.0, 6.0, 4.0, 2.0, 10.0, 14.0, 15.0, 12.0, 25.0, 31.0, 31.0, 35.0, 33.0, 36.0, 45.0, 44.0, 53.0, 60.0, 57.0, 60.0, 51.0, 48.0, 50.0, 35.0, 35.0, 40.0, 30.0, 27.0, 26.0, 16.0, 19.0, 14.0, 8.0, 8.0, 7.0, 7.0, 0.0, 1.0, 1.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.732166290283203, -8.455063819885254, -8.177961349487305, -7.900857925415039, -7.62375545501709, -7.346652984619141, -7.069550037384033, -6.792447090148926, -6.515344619750977, -6.238242149353027, -5.96113920211792, -5.6840362548828125, -5.406933784484863, -5.129831314086914, -4.852728366851807, -4.575625419616699, -4.29852294921875, -4.021420478820801, -3.7443175315856934, -3.467214822769165, -3.1901121139526367, -2.9130094051361084, -2.63590669631958, -2.3588039875030518, -2.0817012786865234, -1.8045985698699951, -1.5274958610534668, -1.2503931522369385, -0.9732904434204102, -0.6961877346038818, -0.4190850257873535, -0.1419823169708252, 0.13511943817138672, 0.41222214698791504, 0.6893248558044434, 0.9664275646209717, 1.2435302734375, 1.5206329822540283, 1.7977356910705566, 2.074838399887085, 2.3519411087036133, 2.6290438175201416, 2.90614652633667, 3.1832492351531982, 3.4603519439697266, 3.737454652786255, 4.014557361602783, 4.291660308837891, 4.56876277923584, 4.845865249633789, 5.1229681968688965, 5.400071144104004, 5.677173614501953, 5.954276084899902, 6.23137903213501, 6.508481979370117, 6.785584449768066, 7.062686920166016, 7.339789867401123, 7.6168928146362305, 7.89399528503418, 8.171097755432129, 8.448200225830078, 8.725303649902344, 9.002406120300293]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 4.0, 7.0, 12.0, 22.0, 30.0, 44.0, 61.0, 72.0, 121.0, 226.0, 341.0, 559.0, 1061.0, 2366.0, 7742.0, 71425.0, 816845.0, 131543.0, 10382.0, 2820.0, 1264.0, 608.0, 386.0, 215.0, 123.0, 87.0, 72.0, 30.0, 18.0, 18.0, 11.0, 11.0, 7.0, 6.0, 3.0, 4.0, 4.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.09375, -15.5999755859375, -15.106201171875, -14.6124267578125, -14.11865234375, -13.6248779296875, -13.131103515625, -12.6373291015625, -12.1435546875, -11.6497802734375, -11.156005859375, -10.6622314453125, -10.16845703125, -9.6746826171875, -9.180908203125, -8.6871337890625, -8.193359375, -7.6995849609375, -7.205810546875, -6.7120361328125, -6.21826171875, -5.7244873046875, -5.230712890625, -4.7369384765625, -4.2431640625, -3.7493896484375, -3.255615234375, -2.7618408203125, -2.26806640625, -1.7742919921875, -1.280517578125, -0.7867431640625, -0.29296875, 0.2008056640625, 0.694580078125, 1.1883544921875, 1.68212890625, 2.1759033203125, 2.669677734375, 3.1634521484375, 3.6572265625, 4.1510009765625, 4.644775390625, 5.1385498046875, 5.63232421875, 6.1260986328125, 6.619873046875, 7.1136474609375, 7.607421875, 8.1011962890625, 8.594970703125, 9.0887451171875, 9.58251953125, 10.0762939453125, 10.570068359375, 11.0638427734375, 11.5576171875, 12.0513916015625, 12.545166015625, 13.0389404296875, 13.53271484375, 14.0264892578125, 14.520263671875, 15.0140380859375, 15.5078125]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 11.0, 9.0, 20.0, 50.0, 81.0, 121.0, 174.0, 173.0, 140.0, 95.0, 65.0, 32.0, 12.0, 5.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.609375, -2.5428009033203125, -2.476226806640625, -2.4096527099609375, -2.34307861328125, -2.2765045166015625, -2.209930419921875, -2.1433563232421875, -2.0767822265625, -2.0102081298828125, -1.943634033203125, -1.8770599365234375, -1.81048583984375, -1.7439117431640625, -1.677337646484375, -1.6107635498046875, -1.544189453125, -1.4776153564453125, -1.411041259765625, -1.3444671630859375, -1.27789306640625, -1.2113189697265625, -1.144744873046875, -1.0781707763671875, -1.0115966796875, -0.9450225830078125, -0.878448486328125, -0.8118743896484375, -0.74530029296875, -0.6787261962890625, -0.612152099609375, -0.5455780029296875, -0.47900390625, -0.4124298095703125, -0.345855712890625, -0.2792816162109375, -0.21270751953125, -0.1461334228515625, -0.079559326171875, -0.0129852294921875, 0.0535888671875, 0.1201629638671875, 0.186737060546875, 0.2533111572265625, 0.31988525390625, 0.3864593505859375, 0.453033447265625, 0.5196075439453125, 0.586181640625, 0.6527557373046875, 0.719329833984375, 0.7859039306640625, 0.85247802734375, 0.9190521240234375, 0.985626220703125, 1.0522003173828125, 1.1187744140625, 1.1853485107421875, 1.251922607421875, 1.3184967041015625, 1.38507080078125, 1.4516448974609375, 1.518218994140625, 1.5847930908203125, 1.6513671875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 5.0, 5.0, 8.0, 11.0, 13.0, 23.0, 24.0, 44.0, 76.0, 107.0, 184.0, 328.0, 592.0, 1200.0, 2883.0, 9130.0, 46434.0, 437124.0, 482911.0, 51853.0, 9900.0, 3029.0, 1247.0, 607.0, 311.0, 170.0, 124.0, 71.0, 47.0, 28.0, 25.0, 10.0, 14.0, 7.0, 4.0, 5.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-12.2890625, -11.9571533203125, -11.625244140625, -11.2933349609375, -10.96142578125, -10.6295166015625, -10.297607421875, -9.9656982421875, -9.6337890625, -9.3018798828125, -8.969970703125, -8.6380615234375, -8.30615234375, -7.9742431640625, -7.642333984375, -7.3104248046875, -6.978515625, -6.6466064453125, -6.314697265625, -5.9827880859375, -5.65087890625, -5.3189697265625, -4.987060546875, -4.6551513671875, -4.3232421875, -3.9913330078125, -3.659423828125, -3.3275146484375, -2.99560546875, -2.6636962890625, -2.331787109375, -1.9998779296875, -1.66796875, -1.3360595703125, -1.004150390625, -0.6722412109375, -0.34033203125, -0.0084228515625, 0.323486328125, 0.6553955078125, 0.9873046875, 1.3192138671875, 1.651123046875, 1.9830322265625, 2.31494140625, 2.6468505859375, 2.978759765625, 3.3106689453125, 3.642578125, 3.9744873046875, 4.306396484375, 4.6383056640625, 4.97021484375, 5.3021240234375, 5.634033203125, 5.9659423828125, 6.2978515625, 6.6297607421875, 6.961669921875, 7.2935791015625, 7.62548828125, 7.9573974609375, 8.289306640625, 8.6212158203125, 8.953125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 3.0, 4.0, 11.0, 10.0, 11.0, 13.0, 17.0, 38.0, 36.0, 52.0, 65.0, 74.0, 87.0, 111.0, 104.0, 71.0, 66.0, 59.0, 49.0, 30.0, 33.0, 19.0, 17.0, 11.0, 4.0, 2.0, 1.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.796875, -9.54278564453125, -9.2886962890625, -9.03460693359375, -8.780517578125, -8.52642822265625, -8.2723388671875, -8.01824951171875, -7.76416015625, -7.51007080078125, -7.2559814453125, -7.00189208984375, -6.747802734375, -6.49371337890625, -6.2396240234375, -5.98553466796875, -5.7314453125, -5.47735595703125, -5.2232666015625, -4.96917724609375, -4.715087890625, -4.46099853515625, -4.2069091796875, -3.95281982421875, -3.69873046875, -3.44464111328125, -3.1905517578125, -2.93646240234375, -2.682373046875, -2.42828369140625, -2.1741943359375, -1.92010498046875, -1.666015625, -1.41192626953125, -1.1578369140625, -0.90374755859375, -0.649658203125, -0.39556884765625, -0.1414794921875, 0.11260986328125, 0.36669921875, 0.62078857421875, 0.8748779296875, 1.12896728515625, 1.383056640625, 1.63714599609375, 1.8912353515625, 2.14532470703125, 2.3994140625, 2.65350341796875, 2.9075927734375, 3.16168212890625, 3.415771484375, 3.66986083984375, 3.9239501953125, 4.17803955078125, 4.43212890625, 4.68621826171875, 4.9403076171875, 5.19439697265625, 5.448486328125, 5.70257568359375, 5.9566650390625, 6.21075439453125, 6.46484375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 7.0, 9.0, 12.0, 23.0, 71.0, 143.0, 360.0, 2425.0, 895620.0, 147810.0, 1542.0, 307.0, 121.0, 63.0, 18.0, 11.0, 8.0, 2.0, 3.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.40625, -38.3935546875, -37.380859375, -36.3681640625, -35.35546875, -34.3427734375, -33.330078125, -32.3173828125, -31.3046875, -30.2919921875, -29.279296875, -28.2666015625, -27.25390625, -26.2412109375, -25.228515625, -24.2158203125, -23.203125, -22.1904296875, -21.177734375, -20.1650390625, -19.15234375, -18.1396484375, -17.126953125, -16.1142578125, -15.1015625, -14.0888671875, -13.076171875, -12.0634765625, -11.05078125, -10.0380859375, -9.025390625, -8.0126953125, -7.0, -5.9873046875, -4.974609375, -3.9619140625, -2.94921875, -1.9365234375, -0.923828125, 0.0888671875, 1.1015625, 2.1142578125, 3.126953125, 4.1396484375, 5.15234375, 6.1650390625, 7.177734375, 8.1904296875, 9.203125, 10.2158203125, 11.228515625, 12.2412109375, 13.25390625, 14.2666015625, 15.279296875, 16.2919921875, 17.3046875, 18.3173828125, 19.330078125, 20.3427734375, 21.35546875, 22.3681640625, 23.380859375, 24.3935546875, 25.40625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 7.0, 15.0, 16.0, 22.0, 41.0, 50.0, 71.0, 112.0, 143.0, 126.0, 137.0, 73.0, 58.0, 33.0, 24.0, 13.0, 15.0, 4.0, 7.0, 4.0, 6.0, 2.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005950927734375, -0.0005752593278884888, -0.0005554258823394775, -0.0005355924367904663, -0.0005157589912414551, -0.0004959255456924438, -0.0004760921001434326, -0.0004562586545944214, -0.00043642520904541016, -0.0004165917634963989, -0.0003967583179473877, -0.00037692487239837646, -0.00035709142684936523, -0.000337257981300354, -0.0003174245357513428, -0.00029759109020233154, -0.0002777576446533203, -0.0002579241991043091, -0.00023809075355529785, -0.00021825730800628662, -0.0001984238624572754, -0.00017859041690826416, -0.00015875697135925293, -0.0001389235258102417, -0.00011909008026123047, -9.925663471221924e-05, -7.942318916320801e-05, -5.958974361419678e-05, -3.975629806518555e-05, -1.9922852516174316e-05, -8.940696716308594e-08, 1.9744038581848145e-05, 3.9577484130859375e-05, 5.9410929679870605e-05, 7.924437522888184e-05, 9.907782077789307e-05, 0.0001189112663269043, 0.00013874471187591553, 0.00015857815742492676, 0.000178411602973938, 0.00019824504852294922, 0.00021807849407196045, 0.00023791193962097168, 0.0002577453851699829, 0.00027757883071899414, 0.00029741227626800537, 0.0003172457218170166, 0.00033707916736602783, 0.00035691261291503906, 0.0003767460584640503, 0.0003965795040130615, 0.00041641294956207275, 0.000436246395111084, 0.0004560798406600952, 0.00047591328620910645, 0.0004957467317581177, 0.0005155801773071289, 0.0005354136228561401, 0.0005552470684051514, 0.0005750805139541626, 0.0005949139595031738, 0.0006147474050521851, 0.0006345808506011963, 0.0006544142961502075, 0.0006742477416992188]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 4.0, 2.0, 7.0, 8.0, 19.0, 13.0, 26.0, 64.0, 136.0, 375.0, 1233.0, 6186.0, 286368.0, 743000.0, 8834.0, 1542.0, 420.0, 167.0, 64.0, 40.0, 16.0, 13.0, 9.0, 7.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.5234375, -14.0240478515625, -13.524658203125, -13.0252685546875, -12.52587890625, -12.0264892578125, -11.527099609375, -11.0277099609375, -10.5283203125, -10.0289306640625, -9.529541015625, -9.0301513671875, -8.53076171875, -8.0313720703125, -7.531982421875, -7.0325927734375, -6.533203125, -6.0338134765625, -5.534423828125, -5.0350341796875, -4.53564453125, -4.0362548828125, -3.536865234375, -3.0374755859375, -2.5380859375, -2.0386962890625, -1.539306640625, -1.0399169921875, -0.54052734375, -0.0411376953125, 0.458251953125, 0.9576416015625, 1.45703125, 1.9564208984375, 2.455810546875, 2.9552001953125, 3.45458984375, 3.9539794921875, 4.453369140625, 4.9527587890625, 5.4521484375, 5.9515380859375, 6.450927734375, 6.9503173828125, 7.44970703125, 7.9490966796875, 8.448486328125, 8.9478759765625, 9.447265625, 9.9466552734375, 10.446044921875, 10.9454345703125, 11.44482421875, 11.9442138671875, 12.443603515625, 12.9429931640625, 13.4423828125, 13.9417724609375, 14.441162109375, 14.9405517578125, 15.43994140625, 15.9393310546875, 16.438720703125, 16.9381103515625, 17.4375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 4.0, 18.0, 23.0, 53.0, 57.0, 101.0, 161.0, 132.0, 166.0, 103.0, 68.0, 50.0, 22.0, 11.0, 10.0, 5.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.3671875, -4.243743896484375, -4.12030029296875, -3.996856689453125, -3.8734130859375, -3.749969482421875, -3.62652587890625, -3.503082275390625, -3.379638671875, -3.256195068359375, -3.13275146484375, -3.009307861328125, -2.8858642578125, -2.762420654296875, -2.63897705078125, -2.515533447265625, -2.39208984375, -2.268646240234375, -2.14520263671875, -2.021759033203125, -1.8983154296875, -1.774871826171875, -1.65142822265625, -1.527984619140625, -1.404541015625, -1.281097412109375, -1.15765380859375, -1.034210205078125, -0.9107666015625, -0.787322998046875, -0.66387939453125, -0.540435791015625, -0.4169921875, -0.293548583984375, -0.17010498046875, -0.046661376953125, 0.0767822265625, 0.200225830078125, 0.32366943359375, 0.447113037109375, 0.570556640625, 0.694000244140625, 0.81744384765625, 0.940887451171875, 1.0643310546875, 1.187774658203125, 1.31121826171875, 1.434661865234375, 1.55810546875, 1.681549072265625, 1.80499267578125, 1.928436279296875, 2.0518798828125, 2.175323486328125, 2.29876708984375, 2.422210693359375, 2.545654296875, 2.669097900390625, 2.79254150390625, 2.915985107421875, 3.0394287109375, 3.162872314453125, 3.28631591796875, 3.409759521484375, 3.533203125]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 14.0, 54.0, 263.0, 501.0, 139.0, 21.0, 7.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-129.68284606933594, -125.55628967285156, -121.42972564697266, -117.30316162109375, -113.17660522460938, -109.050048828125, -104.9234848022461, -100.79692077636719, -96.67036437988281, -92.54380798339844, -88.41724395751953, -84.29067993164062, -80.16412353515625, -76.03756713867188, -71.91100311279297, -67.78443908691406, -63.65788269042969, -59.53132247924805, -55.404762268066406, -51.278202056884766, -47.151641845703125, -43.025081634521484, -38.898521423339844, -34.7719612121582, -30.645401000976562, -26.518840789794922, -22.39228057861328, -18.26572036743164, -14.13916015625, -10.01259994506836, -5.886039733886719, -1.7594795227050781, 2.367095947265625, 6.493656158447266, 10.620216369628906, 14.746776580810547, 18.873336791992188, 22.999897003173828, 27.12645721435547, 31.25301742553711, 35.37957763671875, 39.50613784790039, 43.63269805908203, 47.75925827026367, 51.88581848144531, 56.01237869262695, 60.138938903808594, 64.2655029296875, 68.39205932617188, 72.51861572265625, 76.64517974853516, 80.77174377441406, 84.89830017089844, 89.02485656738281, 93.15142059326172, 97.27798461914062, 101.404541015625, 105.53109741210938, 109.65766143798828, 113.78422546386719, 117.91078186035156, 122.03733825683594, 126.16390228271484, 130.29046630859375, 134.41702270507812]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 0.0, 3.0, 8.0, 2.0, 7.0, 11.0, 6.0, 14.0, 20.0, 25.0, 27.0, 31.0, 28.0, 33.0, 54.0, 57.0, 49.0, 56.0, 60.0, 72.0, 51.0, 60.0, 53.0, 36.0, 44.0, 42.0, 20.0, 38.0, 22.0, 20.0, 14.0, 12.0, 8.0, 5.0, 5.0, 2.0, 7.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-41.000144958496094, -39.90468215942383, -38.80922317504883, -37.71376037597656, -36.61830139160156, -35.5228385925293, -34.42737579345703, -33.33191680908203, -32.236454010009766, -31.140993118286133, -30.0455322265625, -28.950069427490234, -27.8546085357666, -26.75914764404297, -25.663684844970703, -24.56822395324707, -23.472763061523438, -22.377302169799805, -21.281841278076172, -20.186378479003906, -19.090917587280273, -17.99545669555664, -16.899993896484375, -15.804533004760742, -14.70907211303711, -13.613611221313477, -12.518149375915527, -11.422687530517578, -10.327226638793945, -9.231765747070312, -8.136303901672363, -7.040842533111572, -5.945381164550781, -4.84991979598999, -3.754458427429199, -2.658997058868408, -1.5635356903076172, -0.46807432174682617, 0.6273870468139648, 1.7228484153747559, 2.818309783935547, 3.913771152496338, 5.009232521057129, 6.10469388961792, 7.200155258178711, 8.295616149902344, 9.391077995300293, 10.486539840698242, 11.582000732421875, 12.677461624145508, 13.772923469543457, 14.868385314941406, 15.963846206665039, 17.059307098388672, 18.154769897460938, 19.25023078918457, 20.345691680908203, 21.441152572631836, 22.53661346435547, 23.632076263427734, 24.727537155151367, 25.822998046875, 26.918460845947266, 28.0139217376709, 29.10938262939453]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 5.0, 7.0, 9.0, 15.0, 16.0, 30.0, 46.0, 82.0, 121.0, 250.0, 573.0, 1742.0, 8735.0, 186588.0, 3968147.0, 22925.0, 3267.0, 946.0, 401.0, 168.0, 83.0, 54.0, 26.0, 21.0, 11.0, 5.0, 3.0, 3.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.796875, -30.98583984375, -30.1748046875, -29.36376953125, -28.552734375, -27.74169921875, -26.9306640625, -26.11962890625, -25.30859375, -24.49755859375, -23.6865234375, -22.87548828125, -22.064453125, -21.25341796875, -20.4423828125, -19.63134765625, -18.8203125, -18.00927734375, -17.1982421875, -16.38720703125, -15.576171875, -14.76513671875, -13.9541015625, -13.14306640625, -12.33203125, -11.52099609375, -10.7099609375, -9.89892578125, -9.087890625, -8.27685546875, -7.4658203125, -6.65478515625, -5.84375, -5.03271484375, -4.2216796875, -3.41064453125, -2.599609375, -1.78857421875, -0.9775390625, -0.16650390625, 0.64453125, 1.45556640625, 2.2666015625, 3.07763671875, 3.888671875, 4.69970703125, 5.5107421875, 6.32177734375, 7.1328125, 7.94384765625, 8.7548828125, 9.56591796875, 10.376953125, 11.18798828125, 11.9990234375, 12.81005859375, 13.62109375, 14.43212890625, 15.2431640625, 16.05419921875, 16.865234375, 17.67626953125, 18.4873046875, 19.29833984375, 20.109375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 6.0, 7.0, 5.0, 12.0, 15.0, 31.0, 35.0, 38.0, 77.0, 93.0, 111.0, 130.0, 122.0, 95.0, 78.0, 44.0, 29.0, 41.0, 12.0, 10.0, 5.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.181640625, -2.123504638671875, -2.06536865234375, -2.007232666015625, -1.9490966796875, -1.890960693359375, -1.83282470703125, -1.774688720703125, -1.716552734375, -1.658416748046875, -1.60028076171875, -1.542144775390625, -1.4840087890625, -1.425872802734375, -1.36773681640625, -1.309600830078125, -1.25146484375, -1.193328857421875, -1.13519287109375, -1.077056884765625, -1.0189208984375, -0.960784912109375, -0.90264892578125, -0.844512939453125, -0.786376953125, -0.728240966796875, -0.67010498046875, -0.611968994140625, -0.5538330078125, -0.495697021484375, -0.43756103515625, -0.379425048828125, -0.3212890625, -0.263153076171875, -0.20501708984375, -0.146881103515625, -0.0887451171875, -0.030609130859375, 0.02752685546875, 0.085662841796875, 0.143798828125, 0.201934814453125, 0.26007080078125, 0.318206787109375, 0.3763427734375, 0.434478759765625, 0.49261474609375, 0.550750732421875, 0.60888671875, 0.667022705078125, 0.72515869140625, 0.783294677734375, 0.8414306640625, 0.899566650390625, 0.95770263671875, 1.015838623046875, 1.073974609375, 1.132110595703125, 1.19024658203125, 1.248382568359375, 1.3065185546875, 1.364654541015625, 1.42279052734375, 1.480926513671875, 1.5390625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 13.0, 15.0, 38.0, 43.0, 55.0, 71.0, 152.0, 502.0, 9135.0, 4137523.0, 45178.0, 1084.0, 208.0, 109.0, 60.0, 51.0, 16.0, 15.0, 7.0, 7.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-63.21875, -61.834228515625, -60.44970703125, -59.065185546875, -57.6806640625, -56.296142578125, -54.91162109375, -53.527099609375, -52.142578125, -50.758056640625, -49.37353515625, -47.989013671875, -46.6044921875, -45.219970703125, -43.83544921875, -42.450927734375, -41.06640625, -39.681884765625, -38.29736328125, -36.912841796875, -35.5283203125, -34.143798828125, -32.75927734375, -31.374755859375, -29.990234375, -28.605712890625, -27.22119140625, -25.836669921875, -24.4521484375, -23.067626953125, -21.68310546875, -20.298583984375, -18.9140625, -17.529541015625, -16.14501953125, -14.760498046875, -13.3759765625, -11.991455078125, -10.60693359375, -9.222412109375, -7.837890625, -6.453369140625, -5.06884765625, -3.684326171875, -2.2998046875, -0.915283203125, 0.46923828125, 1.853759765625, 3.23828125, 4.622802734375, 6.00732421875, 7.391845703125, 8.7763671875, 10.160888671875, 11.54541015625, 12.929931640625, 14.314453125, 15.698974609375, 17.08349609375, 18.468017578125, 19.8525390625, 21.237060546875, 22.62158203125, 24.006103515625, 25.390625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 7.0, 9.0, 6.0, 14.0, 21.0, 43.0, 88.0, 197.0, 927.0, 2279.0, 241.0, 95.0, 53.0, 32.0, 26.0, 16.0, 14.0, 5.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5078125, -5.3828125, -5.2578125, -5.1328125, -5.0078125, -4.8828125, -4.7578125, -4.6328125, -4.5078125, -4.3828125, -4.2578125, -4.1328125, -4.0078125, -3.8828125, -3.7578125, -3.6328125, -3.5078125, -3.3828125, -3.2578125, -3.1328125, -3.0078125, -2.8828125, -2.7578125, -2.6328125, -2.5078125, -2.3828125, -2.2578125, -2.1328125, -2.0078125, -1.8828125, -1.7578125, -1.6328125, -1.5078125, -1.3828125, -1.2578125, -1.1328125, -1.0078125, -0.8828125, -0.7578125, -0.6328125, -0.5078125, -0.3828125, -0.2578125, -0.1328125, -0.0078125, 0.1171875, 0.2421875, 0.3671875, 0.4921875, 0.6171875, 0.7421875, 0.8671875, 0.9921875, 1.1171875, 1.2421875, 1.3671875, 1.4921875, 1.6171875, 1.7421875, 1.8671875, 1.9921875, 2.1171875, 2.2421875, 2.3671875, 2.4921875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 7.0, 27.0, 83.0, 195.0, 339.0, 223.0, 83.0, 15.0, 14.0, 8.0, 8.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-30.32158851623535, -29.387624740600586, -28.45366096496582, -27.519697189331055, -26.585731506347656, -25.65176773071289, -24.717803955078125, -23.78384017944336, -22.849876403808594, -21.915912628173828, -20.981948852539062, -20.047985076904297, -19.11402130126953, -18.180057525634766, -17.246091842651367, -16.3121280670166, -15.378164291381836, -14.44420051574707, -13.510236740112305, -12.576272010803223, -11.642308235168457, -10.708344459533691, -9.77437973022461, -8.840415954589844, -7.906452178955078, -6.9724884033203125, -6.038524150848389, -5.104559898376465, -4.170596122741699, -3.2366323471069336, -2.3026680946350098, -1.368703842163086, -0.4347419738769531, 0.4992220401763916, 1.4331860542297363, 2.367150068283081, 3.301114082336426, 4.235077857971191, 5.169042110443115, 6.103006362915039, 7.036970138549805, 7.97093391418457, 8.904897689819336, 9.838862419128418, 10.772826194763184, 11.70678997039795, 12.640754699707031, 13.574718475341797, 14.508682250976562, 15.442646026611328, 16.376609802246094, 17.31057357788086, 18.244537353515625, 19.17850112915039, 20.11246681213379, 21.046430587768555, 21.98039436340332, 22.914358139038086, 23.84832191467285, 24.782285690307617, 25.716251373291016, 26.65021514892578, 27.584178924560547, 28.518142700195312, 29.452106475830078]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 7.0, 4.0, 9.0, 11.0, 15.0, 15.0, 24.0, 25.0, 40.0, 38.0, 42.0, 41.0, 57.0, 44.0, 46.0, 47.0, 68.0, 64.0, 48.0, 42.0, 44.0, 42.0, 43.0, 40.0, 28.0, 23.0, 18.0, 15.0, 10.0, 11.0, 11.0, 7.0, 10.0, 3.0, 1.0, 3.0, 4.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.262730121612549, -7.011105060577393, -6.759479522705078, -6.507854461669922, -6.256229400634766, -6.004603862762451, -5.752978801727295, -5.5013532638549805, -5.249728202819824, -4.998103141784668, -4.7464776039123535, -4.494852542877197, -4.243227005004883, -3.9916019439697266, -3.7399768829345703, -3.488351583480835, -3.2367262840270996, -2.9851009845733643, -2.733475685119629, -2.4818506240844727, -2.2302253246307373, -1.978600025177002, -1.7269748449325562, -1.4753496646881104, -1.223724365234375, -0.9720991253852844, -0.7204738855361938, -0.46884864568710327, -0.2172234058380127, 0.034401893615722656, 0.28602707386016846, 0.5376522541046143, 0.7892780303955078, 1.0409033298492432, 1.292528510093689, 1.5441536903381348, 1.7957789897918701, 2.0474042892456055, 2.2990293502807617, 2.550654649734497, 2.8022799491882324, 3.0539052486419678, 3.305530548095703, 3.5571556091308594, 3.8087809085845947, 4.06040620803833, 4.312031269073486, 4.563656806945801, 4.815281867980957, 5.066906929016113, 5.318532466888428, 5.570157527923584, 5.821783065795898, 6.073408126831055, 6.325033187866211, 6.576658248901367, 6.828283786773682, 7.079908847808838, 7.331534385681152, 7.583159446716309, 7.834784507751465, 8.086410522460938, 8.338035583496094, 8.58966064453125, 8.841285705566406]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 6.0, 10.0, 10.0, 15.0, 21.0, 22.0, 40.0, 53.0, 79.0, 94.0, 143.0, 219.0, 356.0, 574.0, 916.0, 1722.0, 3433.0, 8558.0, 27305.0, 113200.0, 448038.0, 333315.0, 77300.0, 19884.0, 6676.0, 2811.0, 1424.0, 828.0, 502.0, 327.0, 212.0, 136.0, 100.0, 71.0, 45.0, 34.0, 15.0, 16.0, 12.0, 9.0, 7.0, 8.0, 5.0, 1.0, 2.0, 0.0, 3.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.44140625, -7.21502685546875, -6.9886474609375, -6.76226806640625, -6.535888671875, -6.30950927734375, -6.0831298828125, -5.85675048828125, -5.63037109375, -5.40399169921875, -5.1776123046875, -4.95123291015625, -4.724853515625, -4.49847412109375, -4.2720947265625, -4.04571533203125, -3.8193359375, -3.59295654296875, -3.3665771484375, -3.14019775390625, -2.913818359375, -2.68743896484375, -2.4610595703125, -2.23468017578125, -2.00830078125, -1.78192138671875, -1.5555419921875, -1.32916259765625, -1.102783203125, -0.87640380859375, -0.6500244140625, -0.42364501953125, -0.197265625, 0.02911376953125, 0.2554931640625, 0.48187255859375, 0.708251953125, 0.93463134765625, 1.1610107421875, 1.38739013671875, 1.61376953125, 1.84014892578125, 2.0665283203125, 2.29290771484375, 2.519287109375, 2.74566650390625, 2.9720458984375, 3.19842529296875, 3.4248046875, 3.65118408203125, 3.8775634765625, 4.10394287109375, 4.330322265625, 4.55670166015625, 4.7830810546875, 5.00946044921875, 5.23583984375, 5.46221923828125, 5.6885986328125, 5.91497802734375, 6.141357421875, 6.36773681640625, 6.5941162109375, 6.82049560546875, 7.046875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 10.0, 8.0, 13.0, 18.0, 20.0, 36.0, 50.0, 61.0, 78.0, 92.0, 99.0, 108.0, 85.0, 85.0, 76.0, 52.0, 39.0, 21.0, 17.0, 12.0, 4.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.9599609375, -1.9084320068359375, -1.856903076171875, -1.8053741455078125, -1.75384521484375, -1.7023162841796875, -1.650787353515625, -1.5992584228515625, -1.5477294921875, -1.4962005615234375, -1.444671630859375, -1.3931427001953125, -1.34161376953125, -1.2900848388671875, -1.238555908203125, -1.1870269775390625, -1.135498046875, -1.0839691162109375, -1.032440185546875, -0.9809112548828125, -0.92938232421875, -0.8778533935546875, -0.826324462890625, -0.7747955322265625, -0.7232666015625, -0.6717376708984375, -0.620208740234375, -0.5686798095703125, -0.51715087890625, -0.4656219482421875, -0.414093017578125, -0.3625640869140625, -0.31103515625, -0.2595062255859375, -0.207977294921875, -0.1564483642578125, -0.10491943359375, -0.0533905029296875, -0.001861572265625, 0.0496673583984375, 0.1011962890625, 0.1527252197265625, 0.204254150390625, 0.2557830810546875, 0.30731201171875, 0.3588409423828125, 0.410369873046875, 0.4618988037109375, 0.513427734375, 0.5649566650390625, 0.616485595703125, 0.6680145263671875, 0.71954345703125, 0.7710723876953125, 0.822601318359375, 0.8741302490234375, 0.9256591796875, 0.9771881103515625, 1.028717041015625, 1.0802459716796875, 1.13177490234375, 1.1833038330078125, 1.234832763671875, 1.2863616943359375, 1.337890625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 7.0, 5.0, 9.0, 13.0, 9.0, 7.0, 24.0, 33.0, 32.0, 62.0, 82.0, 168.0, 290.0, 606.0, 1420.0, 3610.0, 11220.0, 41958.0, 196880.0, 564454.0, 173837.0, 37837.0, 10103.0, 3357.0, 1209.0, 610.0, 275.0, 172.0, 96.0, 52.0, 38.0, 24.0, 16.0, 19.0, 13.0, 5.0, 5.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.6484375, -7.40533447265625, -7.1622314453125, -6.91912841796875, -6.676025390625, -6.43292236328125, -6.1898193359375, -5.94671630859375, -5.70361328125, -5.46051025390625, -5.2174072265625, -4.97430419921875, -4.731201171875, -4.48809814453125, -4.2449951171875, -4.00189208984375, -3.7587890625, -3.51568603515625, -3.2725830078125, -3.02947998046875, -2.786376953125, -2.54327392578125, -2.3001708984375, -2.05706787109375, -1.81396484375, -1.57086181640625, -1.3277587890625, -1.08465576171875, -0.841552734375, -0.59844970703125, -0.3553466796875, -0.11224365234375, 0.130859375, 0.37396240234375, 0.6170654296875, 0.86016845703125, 1.103271484375, 1.34637451171875, 1.5894775390625, 1.83258056640625, 2.07568359375, 2.31878662109375, 2.5618896484375, 2.80499267578125, 3.048095703125, 3.29119873046875, 3.5343017578125, 3.77740478515625, 4.0205078125, 4.26361083984375, 4.5067138671875, 4.74981689453125, 4.992919921875, 5.23602294921875, 5.4791259765625, 5.72222900390625, 5.96533203125, 6.20843505859375, 6.4515380859375, 6.69464111328125, 6.937744140625, 7.18084716796875, 7.4239501953125, 7.66705322265625, 7.91015625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 2.0, 7.0, 12.0, 8.0, 9.0, 13.0, 14.0, 19.0, 24.0, 20.0, 34.0, 30.0, 33.0, 29.0, 38.0, 32.0, 51.0, 56.0, 58.0, 45.0, 48.0, 50.0, 46.0, 34.0, 41.0, 34.0, 30.0, 30.0, 23.0, 25.0, 21.0, 15.0, 12.0, 9.0, 9.0, 11.0, 7.0, 3.0, 6.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.47265625, -4.31494140625, -4.1572265625, -3.99951171875, -3.841796875, -3.68408203125, -3.5263671875, -3.36865234375, -3.2109375, -3.05322265625, -2.8955078125, -2.73779296875, -2.580078125, -2.42236328125, -2.2646484375, -2.10693359375, -1.94921875, -1.79150390625, -1.6337890625, -1.47607421875, -1.318359375, -1.16064453125, -1.0029296875, -0.84521484375, -0.6875, -0.52978515625, -0.3720703125, -0.21435546875, -0.056640625, 0.10107421875, 0.2587890625, 0.41650390625, 0.57421875, 0.73193359375, 0.8896484375, 1.04736328125, 1.205078125, 1.36279296875, 1.5205078125, 1.67822265625, 1.8359375, 1.99365234375, 2.1513671875, 2.30908203125, 2.466796875, 2.62451171875, 2.7822265625, 2.93994140625, 3.09765625, 3.25537109375, 3.4130859375, 3.57080078125, 3.728515625, 3.88623046875, 4.0439453125, 4.20166015625, 4.359375, 4.51708984375, 4.6748046875, 4.83251953125, 4.990234375, 5.14794921875, 5.3056640625, 5.46337890625, 5.62109375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 2.0, 10.0, 13.0, 11.0, 16.0, 23.0, 33.0, 59.0, 92.0, 144.0, 314.0, 672.0, 1650.0, 4928.0, 19156.0, 129569.0, 743733.0, 121786.0, 18328.0, 4851.0, 1687.0, 699.0, 311.0, 165.0, 92.0, 53.0, 32.0, 27.0, 32.0, 15.0, 12.0, 14.0, 13.0, 8.0, 2.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0], "bins": [-5.7578125, -5.61199951171875, -5.4661865234375, -5.32037353515625, -5.174560546875, -5.02874755859375, -4.8829345703125, -4.73712158203125, -4.59130859375, -4.44549560546875, -4.2996826171875, -4.15386962890625, -4.008056640625, -3.86224365234375, -3.7164306640625, -3.57061767578125, -3.4248046875, -3.27899169921875, -3.1331787109375, -2.98736572265625, -2.841552734375, -2.69573974609375, -2.5499267578125, -2.40411376953125, -2.25830078125, -2.11248779296875, -1.9666748046875, -1.82086181640625, -1.675048828125, -1.52923583984375, -1.3834228515625, -1.23760986328125, -1.091796875, -0.94598388671875, -0.8001708984375, -0.65435791015625, -0.508544921875, -0.36273193359375, -0.2169189453125, -0.07110595703125, 0.07470703125, 0.22052001953125, 0.3663330078125, 0.51214599609375, 0.657958984375, 0.80377197265625, 0.9495849609375, 1.09539794921875, 1.2412109375, 1.38702392578125, 1.5328369140625, 1.67864990234375, 1.824462890625, 1.97027587890625, 2.1160888671875, 2.26190185546875, 2.40771484375, 2.55352783203125, 2.6993408203125, 2.84515380859375, 2.990966796875, 3.13677978515625, 3.2825927734375, 3.42840576171875, 3.57421875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 2.0, 1.0, 3.0, 7.0, 5.0, 8.0, 6.0, 20.0, 19.0, 28.0, 35.0, 52.0, 69.0, 94.0, 111.0, 115.0, 128.0, 81.0, 58.0, 40.0, 22.0, 17.0, 19.0, 17.0, 7.0, 9.0, 7.0, 4.0, 8.0, 3.0, 2.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0004911422729492188, -0.00047593191266059875, -0.00046072155237197876, -0.00044551119208335876, -0.00043030083179473877, -0.0004150904715061188, -0.0003998801112174988, -0.0003846697509288788, -0.0003694593906402588, -0.0003542490303516388, -0.0003390386700630188, -0.0003238283097743988, -0.0003086179494857788, -0.0002934075891971588, -0.0002781972289085388, -0.0002629868686199188, -0.00024777650833129883, -0.00023256614804267883, -0.00021735578775405884, -0.00020214542746543884, -0.00018693506717681885, -0.00017172470688819885, -0.00015651434659957886, -0.00014130398631095886, -0.00012609362602233887, -0.00011088326573371887, -9.567290544509888e-05, -8.046254515647888e-05, -6.525218486785889e-05, -5.004182457923889e-05, -3.4831464290618896e-05, -1.96211040019989e-05, -4.410743713378906e-06, 1.0799616575241089e-05, 2.6009976863861084e-05, 4.122033715248108e-05, 5.6430697441101074e-05, 7.164105772972107e-05, 8.685141801834106e-05, 0.00010206177830696106, 0.00011727213859558105, 0.00013248249888420105, 0.00014769285917282104, 0.00016290321946144104, 0.00017811357975006104, 0.00019332394003868103, 0.00020853430032730103, 0.00022374466061592102, 0.00023895502090454102, 0.000254165381193161, 0.000269375741481781, 0.000284586101770401, 0.000299796462059021, 0.000315006822347641, 0.000330217182636261, 0.000345427542924881, 0.000360637903213501, 0.00037584826350212097, 0.00039105862379074097, 0.00040626898407936096, 0.00042147934436798096, 0.00043668970465660095, 0.00045190006494522095, 0.00046711042523384094, 0.00048232078552246094]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 0.0, 0.0, 4.0, 3.0, 3.0, 4.0, 10.0, 18.0, 24.0, 25.0, 59.0, 106.0, 224.0, 740.0, 2540.0, 17552.0, 544005.0, 463939.0, 15690.0, 2479.0, 663.0, 236.0, 104.0, 51.0, 25.0, 21.0, 6.0, 3.0, 7.0, 3.0, 4.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.5703125, -7.30908203125, -7.0478515625, -6.78662109375, -6.525390625, -6.26416015625, -6.0029296875, -5.74169921875, -5.48046875, -5.21923828125, -4.9580078125, -4.69677734375, -4.435546875, -4.17431640625, -3.9130859375, -3.65185546875, -3.390625, -3.12939453125, -2.8681640625, -2.60693359375, -2.345703125, -2.08447265625, -1.8232421875, -1.56201171875, -1.30078125, -1.03955078125, -0.7783203125, -0.51708984375, -0.255859375, 0.00537109375, 0.2666015625, 0.52783203125, 0.7890625, 1.05029296875, 1.3115234375, 1.57275390625, 1.833984375, 2.09521484375, 2.3564453125, 2.61767578125, 2.87890625, 3.14013671875, 3.4013671875, 3.66259765625, 3.923828125, 4.18505859375, 4.4462890625, 4.70751953125, 4.96875, 5.22998046875, 5.4912109375, 5.75244140625, 6.013671875, 6.27490234375, 6.5361328125, 6.79736328125, 7.05859375, 7.31982421875, 7.5810546875, 7.84228515625, 8.103515625, 8.36474609375, 8.6259765625, 8.88720703125, 9.1484375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 9.0, 4.0, 5.0, 8.0, 11.0, 9.0, 9.0, 13.0, 28.0, 44.0, 49.0, 49.0, 78.0, 92.0, 98.0, 88.0, 98.0, 64.0, 53.0, 59.0, 29.0, 24.0, 24.0, 19.0, 10.0, 8.0, 4.0, 5.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.51953125, -2.441131591796875, -2.36273193359375, -2.284332275390625, -2.2059326171875, -2.127532958984375, -2.04913330078125, -1.970733642578125, -1.892333984375, -1.813934326171875, -1.73553466796875, -1.657135009765625, -1.5787353515625, -1.500335693359375, -1.42193603515625, -1.343536376953125, -1.26513671875, -1.186737060546875, -1.10833740234375, -1.029937744140625, -0.9515380859375, -0.873138427734375, -0.79473876953125, -0.716339111328125, -0.637939453125, -0.559539794921875, -0.48114013671875, -0.402740478515625, -0.3243408203125, -0.245941162109375, -0.16754150390625, -0.089141845703125, -0.0107421875, 0.067657470703125, 0.14605712890625, 0.224456787109375, 0.3028564453125, 0.381256103515625, 0.45965576171875, 0.538055419921875, 0.616455078125, 0.694854736328125, 0.77325439453125, 0.851654052734375, 0.9300537109375, 1.008453369140625, 1.08685302734375, 1.165252685546875, 1.24365234375, 1.322052001953125, 1.40045166015625, 1.478851318359375, 1.5572509765625, 1.635650634765625, 1.71405029296875, 1.792449951171875, 1.870849609375, 1.949249267578125, 2.02764892578125, 2.106048583984375, 2.1844482421875, 2.262847900390625, 2.34124755859375, 2.419647216796875, 2.498046875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 3.0, 22.0, 95.0, 320.0, 408.0, 110.0, 34.0, 9.0, 6.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-197.99044799804688, -194.19415283203125, -190.3978729248047, -186.60157775878906, -182.8052978515625, -179.00900268554688, -175.21270751953125, -171.4164276123047, -167.62013244628906, -163.82383728027344, -160.02755737304688, -156.23126220703125, -152.43496704101562, -148.63868713378906, -144.84239196777344, -141.04611206054688, -137.24981689453125, -133.45352172851562, -129.65724182128906, -125.86094665527344, -122.06465911865234, -118.26837158203125, -114.47207641601562, -110.67578887939453, -106.87950134277344, -103.08321380615234, -99.28692626953125, -95.49063110351562, -91.69434356689453, -87.89805603027344, -84.10176086425781, -80.30547332763672, -76.50918579101562, -72.71289825439453, -68.91661071777344, -65.12031555175781, -61.32402801513672, -57.527740478515625, -53.731449127197266, -49.935157775878906, -46.13887023925781, -42.34258270263672, -38.54629135131836, -34.75, -30.953712463378906, -27.15742301940918, -23.361133575439453, -19.564844131469727, -15.7685546875, -11.972265243530273, -8.175975799560547, -4.37968635559082, -0.5833969116210938, 3.212892532348633, 7.009181976318359, 10.805471420288086, 14.601760864257812, 18.39805030822754, 22.194339752197266, 25.990629196166992, 29.78691864013672, 33.58320617675781, 37.37949752807617, 41.17578887939453, 44.972076416015625]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 5.0, 3.0, 8.0, 8.0, 15.0, 10.0, 14.0, 16.0, 25.0, 20.0, 41.0, 41.0, 37.0, 53.0, 60.0, 62.0, 72.0, 66.0, 64.0, 49.0, 49.0, 40.0, 45.0, 36.0, 35.0, 22.0, 25.0, 27.0, 15.0, 19.0, 10.0, 6.0, 6.0, 2.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.848594665527344, -40.72073745727539, -39.59288024902344, -38.46501922607422, -37.337162017822266, -36.20930480957031, -35.08144760131836, -33.953590393066406, -32.82573318481445, -31.6978759765625, -30.570016860961914, -29.44215965270996, -28.314302444458008, -27.186443328857422, -26.05858612060547, -24.930728912353516, -23.80286979675293, -22.675012588500977, -21.54715347290039, -20.419296264648438, -19.291439056396484, -18.16358184814453, -17.035722732543945, -15.907865524291992, -14.780007362365723, -13.652149200439453, -12.5242919921875, -11.39643383026123, -10.268575668334961, -9.140718460083008, -8.012860298156738, -6.885002613067627, -5.757146835327148, -4.629289150238037, -3.5014312267303467, -2.3735733032226562, -1.245715618133545, -0.1178579330444336, 1.010000228881836, 2.1378579139709473, 3.2657155990600586, 4.39357328414917, 5.521430969238281, 6.649289131164551, 7.777146816253662, 8.905004501342773, 10.032862663269043, 11.160720825195312, 12.288578033447266, 13.416436195373535, 14.544293403625488, 15.672151565551758, 16.80000877380371, 17.927867889404297, 19.05572509765625, 20.183582305908203, 21.311439514160156, 22.43929672241211, 23.567155838012695, 24.69501304626465, 25.8228702545166, 26.950729370117188, 28.07858657836914, 29.206443786621094, 30.33430290222168]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 7.0, 3.0, 3.0, 9.0, 3.0, 1.0, 5.0, 13.0, 20.0, 24.0, 36.0, 46.0, 62.0, 106.0, 178.0, 285.0, 541.0, 1237.0, 3208.0, 11984.0, 92960.0, 3981419.0, 84787.0, 11658.0, 3227.0, 1210.0, 558.0, 300.0, 144.0, 107.0, 53.0, 40.0, 18.0, 12.0, 4.0, 7.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.6875, -14.295654296875, -13.90380859375, -13.511962890625, -13.1201171875, -12.728271484375, -12.33642578125, -11.944580078125, -11.552734375, -11.160888671875, -10.76904296875, -10.377197265625, -9.9853515625, -9.593505859375, -9.20166015625, -8.809814453125, -8.41796875, -8.026123046875, -7.63427734375, -7.242431640625, -6.8505859375, -6.458740234375, -6.06689453125, -5.675048828125, -5.283203125, -4.891357421875, -4.49951171875, -4.107666015625, -3.7158203125, -3.323974609375, -2.93212890625, -2.540283203125, -2.1484375, -1.756591796875, -1.36474609375, -0.972900390625, -0.5810546875, -0.189208984375, 0.20263671875, 0.594482421875, 0.986328125, 1.378173828125, 1.77001953125, 2.161865234375, 2.5537109375, 2.945556640625, 3.33740234375, 3.729248046875, 4.12109375, 4.512939453125, 4.90478515625, 5.296630859375, 5.6884765625, 6.080322265625, 6.47216796875, 6.864013671875, 7.255859375, 7.647705078125, 8.03955078125, 8.431396484375, 8.8232421875, 9.215087890625, 9.60693359375, 9.998779296875, 10.390625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 5.0, 10.0, 7.0, 18.0, 24.0, 26.0, 36.0, 47.0, 56.0, 80.0, 78.0, 93.0, 82.0, 74.0, 72.0, 74.0, 61.0, 40.0, 26.0, 25.0, 21.0, 14.0, 12.0, 6.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.7958984375, -1.744903564453125, -1.69390869140625, -1.642913818359375, -1.5919189453125, -1.540924072265625, -1.48992919921875, -1.438934326171875, -1.387939453125, -1.336944580078125, -1.28594970703125, -1.234954833984375, -1.1839599609375, -1.132965087890625, -1.08197021484375, -1.030975341796875, -0.97998046875, -0.928985595703125, -0.87799072265625, -0.826995849609375, -0.7760009765625, -0.725006103515625, -0.67401123046875, -0.623016357421875, -0.572021484375, -0.521026611328125, -0.47003173828125, -0.419036865234375, -0.3680419921875, -0.317047119140625, -0.26605224609375, -0.215057373046875, -0.1640625, -0.113067626953125, -0.06207275390625, -0.011077880859375, 0.0399169921875, 0.090911865234375, 0.14190673828125, 0.192901611328125, 0.243896484375, 0.294891357421875, 0.34588623046875, 0.396881103515625, 0.4478759765625, 0.498870849609375, 0.54986572265625, 0.600860595703125, 0.65185546875, 0.702850341796875, 0.75384521484375, 0.804840087890625, 0.8558349609375, 0.906829833984375, 0.95782470703125, 1.008819580078125, 1.059814453125, 1.110809326171875, 1.16180419921875, 1.212799072265625, 1.2637939453125, 1.314788818359375, 1.36578369140625, 1.416778564453125, 1.4677734375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 3.0, 3.0, 3.0, 12.0, 15.0, 50.0, 109.0, 321.0, 1198.0, 7297.0, 163519.0, 3995718.0, 22357.0, 2690.0, 632.0, 199.0, 72.0, 39.0, 13.0, 8.0, 7.0, 7.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.65625, -19.02685546875, -18.3974609375, -17.76806640625, -17.138671875, -16.50927734375, -15.8798828125, -15.25048828125, -14.62109375, -13.99169921875, -13.3623046875, -12.73291015625, -12.103515625, -11.47412109375, -10.8447265625, -10.21533203125, -9.5859375, -8.95654296875, -8.3271484375, -7.69775390625, -7.068359375, -6.43896484375, -5.8095703125, -5.18017578125, -4.55078125, -3.92138671875, -3.2919921875, -2.66259765625, -2.033203125, -1.40380859375, -0.7744140625, -0.14501953125, 0.484375, 1.11376953125, 1.7431640625, 2.37255859375, 3.001953125, 3.63134765625, 4.2607421875, 4.89013671875, 5.51953125, 6.14892578125, 6.7783203125, 7.40771484375, 8.037109375, 8.66650390625, 9.2958984375, 9.92529296875, 10.5546875, 11.18408203125, 11.8134765625, 12.44287109375, 13.072265625, 13.70166015625, 14.3310546875, 14.96044921875, 15.58984375, 16.21923828125, 16.8486328125, 17.47802734375, 18.107421875, 18.73681640625, 19.3662109375, 19.99560546875, 20.625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 7.0, 7.0, 0.0, 6.0, 3.0, 7.0, 8.0, 14.0, 25.0, 33.0, 72.0, 115.0, 241.0, 1148.0, 1809.0, 230.0, 127.0, 68.0, 53.0, 25.0, 23.0, 15.0, 4.0, 16.0, 6.0, 8.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.189453125, -2.12109375, -2.052734375, -1.984375, -1.916015625, -1.84765625, -1.779296875, -1.7109375, -1.642578125, -1.57421875, -1.505859375, -1.4375, -1.369140625, -1.30078125, -1.232421875, -1.1640625, -1.095703125, -1.02734375, -0.958984375, -0.890625, -0.822265625, -0.75390625, -0.685546875, -0.6171875, -0.548828125, -0.48046875, -0.412109375, -0.34375, -0.275390625, -0.20703125, -0.138671875, -0.0703125, -0.001953125, 0.06640625, 0.134765625, 0.203125, 0.271484375, 0.33984375, 0.408203125, 0.4765625, 0.544921875, 0.61328125, 0.681640625, 0.75, 0.818359375, 0.88671875, 0.955078125, 1.0234375, 1.091796875, 1.16015625, 1.228515625, 1.296875, 1.365234375, 1.43359375, 1.501953125, 1.5703125, 1.638671875, 1.70703125, 1.775390625, 1.84375, 1.912109375, 1.98046875, 2.048828125, 2.1171875, 2.185546875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 8.0, 9.0, 21.0, 74.0, 153.0, 254.0, 251.0, 131.0, 49.0, 36.0, 7.0, 5.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.15121841430664, -15.548493385314941, -14.945768356323242, -14.343043327331543, -13.740318298339844, -13.137594223022461, -12.534869194030762, -11.932144165039062, -11.329419136047363, -10.726694107055664, -10.123969078063965, -9.521244049072266, -8.918519973754883, -8.315793991088867, -7.713069915771484, -7.110344886779785, -6.507619857788086, -5.904894828796387, -5.3021697998046875, -4.6994452476501465, -4.096720218658447, -3.493995189666748, -2.891270399093628, -2.288545608520508, -1.6858205795288086, -1.083095669746399, -0.48037075996398926, 0.12235414981842041, 0.7250790596008301, 1.3278040885925293, 1.9305288791656494, 2.5332536697387695, 3.135976791381836, 3.738701820373535, 4.341426849365234, 4.944151401519775, 5.546876430511475, 6.149601459503174, 6.752326011657715, 7.355051040649414, 7.957776069641113, 8.560501098632812, 9.163226127624512, 9.765951156616211, 10.368675231933594, 10.97140121459961, 11.574125289916992, 12.176850318908691, 12.77957534790039, 13.38230037689209, 13.985025405883789, 14.587750434875488, 15.190475463867188, 15.79319953918457, 16.395925521850586, 16.99864959716797, 17.601375579833984, 18.204099655151367, 18.806825637817383, 19.409549713134766, 20.01227569580078, 20.614999771118164, 21.21772575378418, 21.820449829101562, 22.423173904418945]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 1.0, 8.0, 3.0, 3.0, 5.0, 7.0, 8.0, 9.0, 15.0, 12.0, 16.0, 19.0, 32.0, 25.0, 41.0, 37.0, 34.0, 45.0, 36.0, 42.0, 34.0, 48.0, 45.0, 45.0, 43.0, 43.0, 41.0, 32.0, 36.0, 37.0, 34.0, 33.0, 28.0, 18.0, 7.0, 14.0, 13.0, 13.0, 8.0, 12.0, 5.0, 5.0, 6.0, 2.0, 1.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.3957624435424805, -5.2276787757873535, -5.059594631195068, -4.891510963439941, -4.723426818847656, -4.555343151092529, -4.387259483337402, -4.219175338745117, -4.05109167098999, -3.883007764816284, -3.714923858642578, -3.546840190887451, -3.378756284713745, -3.210672378540039, -3.042588472366333, -2.874504566192627, -2.706420660018921, -2.538336753845215, -2.370252847671509, -2.2021689414978027, -2.034085273742676, -1.8660013675689697, -1.6979174613952637, -1.5298336744308472, -1.3617497682571411, -1.193665862083435, -1.0255820751190186, -0.8574981689453125, -0.6894143223762512, -0.5213304758071899, -0.3532465696334839, -0.18516278266906738, -0.017078876495361328, 0.15100498497486115, 0.3190888464450836, 0.4871727228164673, 0.6552565693855286, 0.8233404159545898, 0.9914243221282959, 1.1595081090927124, 1.3275920152664185, 1.4956759214401245, 1.663759708404541, 1.831843614578247, 1.9999275207519531, 2.16801118850708, 2.3360953330993652, 2.504179000854492, 2.6722629070281982, 2.8403468132019043, 3.0084307193756104, 3.1765146255493164, 3.3445982933044434, 3.5126821994781494, 3.6807661056518555, 3.8488497734069824, 4.016933917999268, 4.1850175857543945, 4.35310173034668, 4.521185398101807, 4.689269542694092, 4.857353210449219, 5.025437355041504, 5.193521022796631, 5.361604690551758]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 4.0, 5.0, 5.0, 6.0, 14.0, 16.0, 22.0, 27.0, 50.0, 47.0, 112.0, 156.0, 256.0, 367.0, 711.0, 1304.0, 2538.0, 5743.0, 15781.0, 52762.0, 204456.0, 482830.0, 202494.0, 51789.0, 15592.0, 5712.0, 2514.0, 1345.0, 732.0, 421.0, 255.0, 178.0, 107.0, 70.0, 40.0, 39.0, 11.0, 10.0, 10.0, 9.0, 6.0, 6.0, 0.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.2109375, -5.99298095703125, -5.7750244140625, -5.55706787109375, -5.339111328125, -5.12115478515625, -4.9031982421875, -4.68524169921875, -4.46728515625, -4.24932861328125, -4.0313720703125, -3.81341552734375, -3.595458984375, -3.37750244140625, -3.1595458984375, -2.94158935546875, -2.7236328125, -2.50567626953125, -2.2877197265625, -2.06976318359375, -1.851806640625, -1.63385009765625, -1.4158935546875, -1.19793701171875, -0.97998046875, -0.76202392578125, -0.5440673828125, -0.32611083984375, -0.108154296875, 0.10980224609375, 0.3277587890625, 0.54571533203125, 0.763671875, 0.98162841796875, 1.1995849609375, 1.41754150390625, 1.635498046875, 1.85345458984375, 2.0714111328125, 2.28936767578125, 2.50732421875, 2.72528076171875, 2.9432373046875, 3.16119384765625, 3.379150390625, 3.59710693359375, 3.8150634765625, 4.03302001953125, 4.2509765625, 4.46893310546875, 4.6868896484375, 4.90484619140625, 5.122802734375, 5.34075927734375, 5.5587158203125, 5.77667236328125, 5.99462890625, 6.21258544921875, 6.4305419921875, 6.64849853515625, 6.866455078125, 7.08441162109375, 7.3023681640625, 7.52032470703125, 7.73828125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 5.0, 6.0, 9.0, 11.0, 9.0, 18.0, 24.0, 40.0, 56.0, 65.0, 76.0, 65.0, 92.0, 98.0, 67.0, 80.0, 64.0, 53.0, 40.0, 36.0, 26.0, 20.0, 8.0, 12.0, 10.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.787109375, -1.7348785400390625, -1.682647705078125, -1.6304168701171875, -1.57818603515625, -1.5259552001953125, -1.473724365234375, -1.4214935302734375, -1.3692626953125, -1.3170318603515625, -1.264801025390625, -1.2125701904296875, -1.16033935546875, -1.1081085205078125, -1.055877685546875, -1.0036468505859375, -0.951416015625, -0.8991851806640625, -0.846954345703125, -0.7947235107421875, -0.74249267578125, -0.6902618408203125, -0.638031005859375, -0.5858001708984375, -0.5335693359375, -0.4813385009765625, -0.429107666015625, -0.3768768310546875, -0.32464599609375, -0.2724151611328125, -0.220184326171875, -0.1679534912109375, -0.11572265625, -0.0634918212890625, -0.011260986328125, 0.0409698486328125, 0.09320068359375, 0.1454315185546875, 0.197662353515625, 0.2498931884765625, 0.3021240234375, 0.3543548583984375, 0.406585693359375, 0.4588165283203125, 0.51104736328125, 0.5632781982421875, 0.615509033203125, 0.6677398681640625, 0.719970703125, 0.7722015380859375, 0.824432373046875, 0.8766632080078125, 0.92889404296875, 0.9811248779296875, 1.033355712890625, 1.0855865478515625, 1.1378173828125, 1.1900482177734375, 1.242279052734375, 1.2945098876953125, 1.34674072265625, 1.3989715576171875, 1.451202392578125, 1.5034332275390625, 1.5556640625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 5.0, 8.0, 5.0, 4.0, 12.0, 14.0, 13.0, 24.0, 36.0, 64.0, 89.0, 132.0, 210.0, 448.0, 854.0, 1996.0, 5836.0, 19905.0, 79347.0, 363311.0, 439919.0, 100809.0, 24251.0, 6876.0, 2281.0, 939.0, 472.0, 266.0, 142.0, 71.0, 65.0, 39.0, 23.0, 25.0, 18.0, 10.0, 4.0, 13.0, 5.0, 4.0, 3.0, 3.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.2578125, -8.02239990234375, -7.7869873046875, -7.55157470703125, -7.316162109375, -7.08074951171875, -6.8453369140625, -6.60992431640625, -6.37451171875, -6.13909912109375, -5.9036865234375, -5.66827392578125, -5.432861328125, -5.19744873046875, -4.9620361328125, -4.72662353515625, -4.4912109375, -4.25579833984375, -4.0203857421875, -3.78497314453125, -3.549560546875, -3.31414794921875, -3.0787353515625, -2.84332275390625, -2.60791015625, -2.37249755859375, -2.1370849609375, -1.90167236328125, -1.666259765625, -1.43084716796875, -1.1954345703125, -0.96002197265625, -0.724609375, -0.48919677734375, -0.2537841796875, -0.01837158203125, 0.217041015625, 0.45245361328125, 0.6878662109375, 0.92327880859375, 1.15869140625, 1.39410400390625, 1.6295166015625, 1.86492919921875, 2.100341796875, 2.33575439453125, 2.5711669921875, 2.80657958984375, 3.0419921875, 3.27740478515625, 3.5128173828125, 3.74822998046875, 3.983642578125, 4.21905517578125, 4.4544677734375, 4.68988037109375, 4.92529296875, 5.16070556640625, 5.3961181640625, 5.63153076171875, 5.866943359375, 6.10235595703125, 6.3377685546875, 6.57318115234375, 6.80859375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 7.0, 4.0, 7.0, 7.0, 9.0, 15.0, 17.0, 16.0, 22.0, 32.0, 21.0, 37.0, 31.0, 37.0, 28.0, 42.0, 40.0, 48.0, 46.0, 36.0, 52.0, 49.0, 41.0, 49.0, 28.0, 29.0, 34.0, 39.0, 30.0, 21.0, 28.0, 15.0, 13.0, 17.0, 14.0, 7.0, 5.0, 6.0, 4.0, 6.0, 4.0, 4.0, 3.0, 5.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.125, -4.970947265625, -4.81689453125, -4.662841796875, -4.5087890625, -4.354736328125, -4.20068359375, -4.046630859375, -3.892578125, -3.738525390625, -3.58447265625, -3.430419921875, -3.2763671875, -3.122314453125, -2.96826171875, -2.814208984375, -2.66015625, -2.506103515625, -2.35205078125, -2.197998046875, -2.0439453125, -1.889892578125, -1.73583984375, -1.581787109375, -1.427734375, -1.273681640625, -1.11962890625, -0.965576171875, -0.8115234375, -0.657470703125, -0.50341796875, -0.349365234375, -0.1953125, -0.041259765625, 0.11279296875, 0.266845703125, 0.4208984375, 0.574951171875, 0.72900390625, 0.883056640625, 1.037109375, 1.191162109375, 1.34521484375, 1.499267578125, 1.6533203125, 1.807373046875, 1.96142578125, 2.115478515625, 2.26953125, 2.423583984375, 2.57763671875, 2.731689453125, 2.8857421875, 3.039794921875, 3.19384765625, 3.347900390625, 3.501953125, 3.656005859375, 3.81005859375, 3.964111328125, 4.1181640625, 4.272216796875, 4.42626953125, 4.580322265625, 4.734375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 1.0, 2.0, 2.0, 4.0, 4.0, 6.0, 8.0, 12.0, 18.0, 22.0, 40.0, 67.0, 121.0, 215.0, 423.0, 856.0, 2189.0, 5817.0, 21999.0, 154106.0, 721656.0, 114426.0, 18033.0, 5016.0, 1865.0, 767.0, 395.0, 205.0, 113.0, 63.0, 30.0, 23.0, 13.0, 12.0, 6.0, 11.0, 4.0, 3.0, 2.0, 1.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.634765625, -3.502288818359375, -3.36981201171875, -3.237335205078125, -3.1048583984375, -2.972381591796875, -2.83990478515625, -2.707427978515625, -2.574951171875, -2.442474365234375, -2.30999755859375, -2.177520751953125, -2.0450439453125, -1.912567138671875, -1.78009033203125, -1.647613525390625, -1.51513671875, -1.382659912109375, -1.25018310546875, -1.117706298828125, -0.9852294921875, -0.852752685546875, -0.72027587890625, -0.587799072265625, -0.455322265625, -0.322845458984375, -0.19036865234375, -0.057891845703125, 0.0745849609375, 0.207061767578125, 0.33953857421875, 0.472015380859375, 0.6044921875, 0.736968994140625, 0.86944580078125, 1.001922607421875, 1.1343994140625, 1.266876220703125, 1.39935302734375, 1.531829833984375, 1.664306640625, 1.796783447265625, 1.92926025390625, 2.061737060546875, 2.1942138671875, 2.326690673828125, 2.45916748046875, 2.591644287109375, 2.72412109375, 2.856597900390625, 2.98907470703125, 3.121551513671875, 3.2540283203125, 3.386505126953125, 3.51898193359375, 3.651458740234375, 3.783935546875, 3.916412353515625, 4.04888916015625, 4.181365966796875, 4.3138427734375, 4.446319580078125, 4.57879638671875, 4.711273193359375, 4.84375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 3.0, 7.0, 9.0, 22.0, 20.0, 44.0, 63.0, 176.0, 250.0, 170.0, 95.0, 54.0, 28.0, 22.0, 13.0, 9.0, 5.0, 2.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008573532104492188, -0.0008252710103988647, -0.0007931888103485107, -0.0007611066102981567, -0.0007290244102478027, -0.0006969422101974487, -0.0006648600101470947, -0.0006327778100967407, -0.0006006956100463867, -0.0005686134099960327, -0.0005365312099456787, -0.0005044490098953247, -0.0004723668098449707, -0.0004402846097946167, -0.0004082024097442627, -0.0003761202096939087, -0.0003440380096435547, -0.0003119558095932007, -0.0002798736095428467, -0.0002477914094924927, -0.00021570920944213867, -0.00018362700939178467, -0.00015154480934143066, -0.00011946260929107666, -8.738040924072266e-05, -5.529820919036865e-05, -2.321600914001465e-05, 8.866190910339355e-06, 4.094839096069336e-05, 7.303059101104736e-05, 0.00010511279106140137, 0.00013719499111175537, 0.00016927719116210938, 0.00020135939121246338, 0.00023344159126281738, 0.0002655237913131714, 0.0002976059913635254, 0.0003296881914138794, 0.0003617703914642334, 0.0003938525915145874, 0.0004259347915649414, 0.0004580169916152954, 0.0004900991916656494, 0.0005221813917160034, 0.0005542635917663574, 0.0005863457918167114, 0.0006184279918670654, 0.0006505101919174194, 0.0006825923919677734, 0.0007146745920181274, 0.0007467567920684814, 0.0007788389921188354, 0.0008109211921691895, 0.0008430033922195435, 0.0008750855922698975, 0.0009071677923202515, 0.0009392499923706055, 0.0009713321924209595, 0.0010034143924713135, 0.0010354965925216675, 0.0010675787925720215, 0.0010996609926223755, 0.0011317431926727295, 0.0011638253927230835, 0.0011959075927734375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 4.0, 0.0, 2.0, 4.0, 8.0, 6.0, 9.0, 12.0, 21.0, 36.0, 49.0, 92.0, 216.0, 581.0, 2335.0, 14412.0, 358721.0, 646734.0, 21029.0, 3027.0, 749.0, 244.0, 104.0, 64.0, 31.0, 26.0, 8.0, 11.0, 7.0, 4.0, 4.0, 3.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.34375, -7.099609375, -6.85546875, -6.611328125, -6.3671875, -6.123046875, -5.87890625, -5.634765625, -5.390625, -5.146484375, -4.90234375, -4.658203125, -4.4140625, -4.169921875, -3.92578125, -3.681640625, -3.4375, -3.193359375, -2.94921875, -2.705078125, -2.4609375, -2.216796875, -1.97265625, -1.728515625, -1.484375, -1.240234375, -0.99609375, -0.751953125, -0.5078125, -0.263671875, -0.01953125, 0.224609375, 0.46875, 0.712890625, 0.95703125, 1.201171875, 1.4453125, 1.689453125, 1.93359375, 2.177734375, 2.421875, 2.666015625, 2.91015625, 3.154296875, 3.3984375, 3.642578125, 3.88671875, 4.130859375, 4.375, 4.619140625, 4.86328125, 5.107421875, 5.3515625, 5.595703125, 5.83984375, 6.083984375, 6.328125, 6.572265625, 6.81640625, 7.060546875, 7.3046875, 7.548828125, 7.79296875, 8.037109375, 8.28125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 3.0, 5.0, 1.0, 8.0, 7.0, 12.0, 14.0, 16.0, 22.0, 35.0, 31.0, 42.0, 59.0, 73.0, 99.0, 117.0, 86.0, 73.0, 83.0, 53.0, 38.0, 27.0, 23.0, 18.0, 16.0, 8.0, 6.0, 11.0, 3.0, 5.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3515625, -2.274566650390625, -2.19757080078125, -2.120574951171875, -2.0435791015625, -1.966583251953125, -1.88958740234375, -1.812591552734375, -1.735595703125, -1.658599853515625, -1.58160400390625, -1.504608154296875, -1.4276123046875, -1.350616455078125, -1.27362060546875, -1.196624755859375, -1.11962890625, -1.042633056640625, -0.96563720703125, -0.888641357421875, -0.8116455078125, -0.734649658203125, -0.65765380859375, -0.580657958984375, -0.503662109375, -0.426666259765625, -0.34967041015625, -0.272674560546875, -0.1956787109375, -0.118682861328125, -0.04168701171875, 0.035308837890625, 0.1123046875, 0.189300537109375, 0.26629638671875, 0.343292236328125, 0.4202880859375, 0.497283935546875, 0.57427978515625, 0.651275634765625, 0.728271484375, 0.805267333984375, 0.88226318359375, 0.959259033203125, 1.0362548828125, 1.113250732421875, 1.19024658203125, 1.267242431640625, 1.34423828125, 1.421234130859375, 1.49822998046875, 1.575225830078125, 1.6522216796875, 1.729217529296875, 1.80621337890625, 1.883209228515625, 1.960205078125, 2.037200927734375, 2.11419677734375, 2.191192626953125, 2.2681884765625, 2.345184326171875, 2.42218017578125, 2.499176025390625, 2.576171875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 10.0, 7.0, 7.0, 25.0, 34.0, 76.0, 94.0, 164.0, 212.0, 153.0, 82.0, 50.0, 38.0, 19.0, 16.0, 5.0, 8.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.842506408691406, -44.15380859375, -42.465110778808594, -40.77641296386719, -39.08771514892578, -37.399017333984375, -35.7103157043457, -34.0216178894043, -32.33292007446289, -30.644222259521484, -28.955524444580078, -27.26682472229004, -25.578126907348633, -23.889429092407227, -22.200729370117188, -20.51203155517578, -18.823333740234375, -17.13463592529297, -15.445937156677246, -13.757238388061523, -12.068540573120117, -10.379842758178711, -8.691143989562988, -7.002445220947266, -5.313747406005859, -3.625049114227295, -1.9363508224487305, -0.24765253067016602, 1.4410457611083984, 3.1297435760498047, 4.818442344665527, 6.50714111328125, 8.195842742919922, 9.884540557861328, 11.57323932647705, 13.261938095092773, 14.95063591003418, 16.639333724975586, 18.328033447265625, 20.01673126220703, 21.705429077148438, 23.394126892089844, 25.08282470703125, 26.77152442932129, 28.460222244262695, 30.1489200592041, 31.83761978149414, 33.52631759643555, 35.21501541137695, 36.90371322631836, 38.592411041259766, 40.28110885620117, 41.969810485839844, 43.65850830078125, 45.347206115722656, 47.03590393066406, 48.72460174560547, 50.413299560546875, 52.10199737548828, 53.79069519042969, 55.479393005371094, 57.1680908203125, 58.85679244995117, 60.54549026489258, 62.234188079833984]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 3.0, 5.0, 3.0, 10.0, 9.0, 13.0, 20.0, 19.0, 28.0, 44.0, 33.0, 40.0, 48.0, 49.0, 67.0, 50.0, 66.0, 51.0, 61.0, 49.0, 72.0, 43.0, 38.0, 39.0, 30.0, 29.0, 20.0, 18.0, 15.0, 9.0, 7.0, 5.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.17283630371094, -41.99806594848633, -40.823299407958984, -39.648529052734375, -38.473758697509766, -37.29899215698242, -36.12422180175781, -34.94945526123047, -33.77468490600586, -32.59991455078125, -31.425146102905273, -30.250377655029297, -29.07560920715332, -27.900840759277344, -26.726070404052734, -25.551301956176758, -24.37653160095215, -23.201763153076172, -22.026992797851562, -20.852224349975586, -19.67745590209961, -18.502685546875, -17.327917098999023, -16.153148651123047, -14.978379249572754, -13.803609848022461, -12.628841400146484, -11.454071998596191, -10.279302597045898, -9.104534149169922, -7.929764747619629, -6.754996299743652, -5.580226898193359, -4.405457973480225, -3.2306888103485107, -2.055919647216797, -0.8811507225036621, 0.29361820220947266, 1.4683876037597656, 2.643156051635742, 3.817925453186035, 4.99269437789917, 6.167463302612305, 7.342232704162598, 8.51700210571289, 9.691770553588867, 10.86653995513916, 12.041308403015137, 13.21607780456543, 14.390847206115723, 15.5656156539917, 16.740385055541992, 17.91515350341797, 19.089923858642578, 20.264692306518555, 21.43946075439453, 22.61423110961914, 23.788999557495117, 24.963769912719727, 26.138538360595703, 27.31330680847168, 28.488075256347656, 29.662845611572266, 30.837614059448242, 32.01238250732422]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 5.0, 6.0, 4.0, 6.0, 7.0, 6.0, 7.0, 16.0, 33.0, 37.0, 48.0, 60.0, 99.0, 130.0, 258.0, 364.0, 619.0, 1194.0, 2657.0, 7277.0, 28026.0, 281387.0, 3777946.0, 71993.0, 14067.0, 4364.0, 1728.0, 837.0, 447.0, 253.0, 147.0, 91.0, 63.0, 37.0, 21.0, 16.0, 9.0, 6.0, 2.0, 6.0, 4.0, 1.0, 4.0, 1.0, 0.0, 3.0, 2.0], "bins": [-14.0390625, -13.681396484375, -13.32373046875, -12.966064453125, -12.6083984375, -12.250732421875, -11.89306640625, -11.535400390625, -11.177734375, -10.820068359375, -10.46240234375, -10.104736328125, -9.7470703125, -9.389404296875, -9.03173828125, -8.674072265625, -8.31640625, -7.958740234375, -7.60107421875, -7.243408203125, -6.8857421875, -6.528076171875, -6.17041015625, -5.812744140625, -5.455078125, -5.097412109375, -4.73974609375, -4.382080078125, -4.0244140625, -3.666748046875, -3.30908203125, -2.951416015625, -2.59375, -2.236083984375, -1.87841796875, -1.520751953125, -1.1630859375, -0.805419921875, -0.44775390625, -0.090087890625, 0.267578125, 0.625244140625, 0.98291015625, 1.340576171875, 1.6982421875, 2.055908203125, 2.41357421875, 2.771240234375, 3.12890625, 3.486572265625, 3.84423828125, 4.201904296875, 4.5595703125, 4.917236328125, 5.27490234375, 5.632568359375, 5.990234375, 6.347900390625, 6.70556640625, 7.063232421875, 7.4208984375, 7.778564453125, 8.13623046875, 8.493896484375, 8.8515625]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 10.0, 7.0, 8.0, 7.0, 15.0, 18.0, 31.0, 35.0, 50.0, 61.0, 60.0, 86.0, 90.0, 78.0, 85.0, 80.0, 57.0, 63.0, 37.0, 34.0, 28.0, 22.0, 13.0, 10.0, 5.0, 3.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.9765625, -1.91888427734375, -1.8612060546875, -1.80352783203125, -1.745849609375, -1.68817138671875, -1.6304931640625, -1.57281494140625, -1.51513671875, -1.45745849609375, -1.3997802734375, -1.34210205078125, -1.284423828125, -1.22674560546875, -1.1690673828125, -1.11138916015625, -1.0537109375, -0.99603271484375, -0.9383544921875, -0.88067626953125, -0.822998046875, -0.76531982421875, -0.7076416015625, -0.64996337890625, -0.59228515625, -0.53460693359375, -0.4769287109375, -0.41925048828125, -0.361572265625, -0.30389404296875, -0.2462158203125, -0.18853759765625, -0.130859375, -0.07318115234375, -0.0155029296875, 0.04217529296875, 0.099853515625, 0.15753173828125, 0.2152099609375, 0.27288818359375, 0.33056640625, 0.38824462890625, 0.4459228515625, 0.50360107421875, 0.561279296875, 0.61895751953125, 0.6766357421875, 0.73431396484375, 0.7919921875, 0.84967041015625, 0.9073486328125, 0.96502685546875, 1.022705078125, 1.08038330078125, 1.1380615234375, 1.19573974609375, 1.25341796875, 1.31109619140625, 1.3687744140625, 1.42645263671875, 1.484130859375, 1.54180908203125, 1.5994873046875, 1.65716552734375, 1.71484375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 15.0, 29.0, 44.0, 93.0, 141.0, 472.0, 5681.0, 4121343.0, 64722.0, 1303.0, 265.0, 85.0, 47.0, 20.0, 9.0, 7.0, 3.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.8125, -66.3623046875, -64.912109375, -63.4619140625, -62.01171875, -60.5615234375, -59.111328125, -57.6611328125, -56.2109375, -54.7607421875, -53.310546875, -51.8603515625, -50.41015625, -48.9599609375, -47.509765625, -46.0595703125, -44.609375, -43.1591796875, -41.708984375, -40.2587890625, -38.80859375, -37.3583984375, -35.908203125, -34.4580078125, -33.0078125, -31.5576171875, -30.107421875, -28.6572265625, -27.20703125, -25.7568359375, -24.306640625, -22.8564453125, -21.40625, -19.9560546875, -18.505859375, -17.0556640625, -15.60546875, -14.1552734375, -12.705078125, -11.2548828125, -9.8046875, -8.3544921875, -6.904296875, -5.4541015625, -4.00390625, -2.5537109375, -1.103515625, 0.3466796875, 1.796875, 3.2470703125, 4.697265625, 6.1474609375, 7.59765625, 9.0478515625, 10.498046875, 11.9482421875, 13.3984375, 14.8486328125, 16.298828125, 17.7490234375, 19.19921875, 20.6494140625, 22.099609375, 23.5498046875, 25.0]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 2.0, 8.0, 9.0, 6.0, 18.0, 18.0, 45.0, 81.0, 201.0, 723.0, 2380.0, 349.0, 100.0, 55.0, 31.0, 19.0, 13.0, 3.0, 5.0, 4.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.7890625, -7.6168212890625, -7.444580078125, -7.2723388671875, -7.10009765625, -6.9278564453125, -6.755615234375, -6.5833740234375, -6.4111328125, -6.2388916015625, -6.066650390625, -5.8944091796875, -5.72216796875, -5.5499267578125, -5.377685546875, -5.2054443359375, -5.033203125, -4.8609619140625, -4.688720703125, -4.5164794921875, -4.34423828125, -4.1719970703125, -3.999755859375, -3.8275146484375, -3.6552734375, -3.4830322265625, -3.310791015625, -3.1385498046875, -2.96630859375, -2.7940673828125, -2.621826171875, -2.4495849609375, -2.27734375, -2.1051025390625, -1.932861328125, -1.7606201171875, -1.58837890625, -1.4161376953125, -1.243896484375, -1.0716552734375, -0.8994140625, -0.7271728515625, -0.554931640625, -0.3826904296875, -0.21044921875, -0.0382080078125, 0.134033203125, 0.3062744140625, 0.478515625, 0.6507568359375, 0.822998046875, 0.9952392578125, 1.16748046875, 1.3397216796875, 1.511962890625, 1.6842041015625, 1.8564453125, 2.0286865234375, 2.200927734375, 2.3731689453125, 2.54541015625, 2.7176513671875, 2.889892578125, 3.0621337890625, 3.234375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 8.0, 9.0, 22.0, 59.0, 204.0, 355.0, 223.0, 88.0, 22.0, 6.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-56.79380416870117, -55.32221984863281, -53.85063552856445, -52.37905502319336, -50.907470703125, -49.43588638305664, -47.96430206298828, -46.49272155761719, -45.02113723754883, -43.54955291748047, -42.07796859741211, -40.606388092041016, -39.134803771972656, -37.6632194519043, -36.19163513183594, -34.720054626464844, -33.24846649169922, -31.77688217163086, -30.305299758911133, -28.833715438842773, -27.362133026123047, -25.890548706054688, -24.418964385986328, -22.9473819732666, -21.475799560546875, -20.004215240478516, -18.53263282775879, -17.06104850769043, -15.589466094970703, -14.117881774902344, -12.6462984085083, -11.174715042114258, -9.703132629394531, -8.231549263000488, -6.759965896606445, -5.288382053375244, -3.816798686981201, -2.345215320587158, -0.873631477355957, 0.5979518890380859, 2.069535255432129, 3.541118621826172, 5.012701988220215, 6.484285831451416, 7.955869197845459, 9.427452087402344, 10.899036407470703, 12.370619773864746, 13.842203140258789, 15.313786506652832, 16.785369873046875, 18.256954193115234, 19.72853660583496, 21.20012092590332, 22.671703338623047, 24.143287658691406, 25.614871978759766, 27.086456298828125, 28.55803871154785, 30.02962303161621, 31.501205444335938, 32.9727897644043, 34.444374084472656, 35.91595458984375, 37.38753890991211]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 6.0, 5.0, 8.0, 7.0, 14.0, 20.0, 20.0, 25.0, 24.0, 38.0, 31.0, 45.0, 44.0, 57.0, 55.0, 66.0, 73.0, 68.0, 62.0, 52.0, 45.0, 46.0, 31.0, 36.0, 24.0, 19.0, 24.0, 16.0, 10.0, 7.0, 7.0, 5.0, 4.0, 1.0, 3.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.519977569580078, -14.105334281921387, -13.690690994262695, -13.27604866027832, -12.861405372619629, -12.446762084960938, -12.032118797302246, -11.617475509643555, -11.20283317565918, -10.788189888000488, -10.373546600341797, -9.958904266357422, -9.54426097869873, -9.129617691040039, -8.714974403381348, -8.300331115722656, -7.885687828063965, -7.471044540405273, -7.05640172958374, -6.641758441925049, -6.227115631103516, -5.812472343444824, -5.397829055786133, -4.983185768127441, -4.568542957305908, -4.153899669647217, -3.7392568588256836, -3.324613571166992, -2.90997052192688, -2.4953274726867676, -2.080684185028076, -1.6660411357879639, -1.251399040222168, -0.8367559313774109, -0.4221128225326538, -0.007469654083251953, 0.40717339515686035, 0.8218164443969727, 1.236459732055664, 1.6511027812957764, 2.0657458305358887, 2.480388879776001, 2.8950319290161133, 3.3096752166748047, 3.724318265914917, 4.138961315155029, 4.553604602813721, 4.968247413635254, 5.382890701293945, 5.797533988952637, 6.21217679977417, 6.626820087432861, 7.0414628982543945, 7.456106185913086, 7.870749473571777, 8.285392761230469, 8.700035095214844, 9.114678382873535, 9.529321670532227, 9.943964004516602, 10.358607292175293, 10.773250579833984, 11.187893867492676, 11.602537155151367, 12.017180442810059]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 8.0, 10.0, 6.0, 16.0, 18.0, 34.0, 43.0, 62.0, 99.0, 146.0, 244.0, 363.0, 568.0, 905.0, 1751.0, 3577.0, 9822.0, 35497.0, 167777.0, 557105.0, 207384.0, 43046.0, 11319.0, 4129.0, 1900.0, 1019.0, 592.0, 384.0, 269.0, 165.0, 97.0, 64.0, 44.0, 31.0, 25.0, 12.0, 9.0, 8.0, 5.0, 6.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.21875, -8.9356689453125, -8.652587890625, -8.3695068359375, -8.08642578125, -7.8033447265625, -7.520263671875, -7.2371826171875, -6.9541015625, -6.6710205078125, -6.387939453125, -6.1048583984375, -5.82177734375, -5.5386962890625, -5.255615234375, -4.9725341796875, -4.689453125, -4.4063720703125, -4.123291015625, -3.8402099609375, -3.55712890625, -3.2740478515625, -2.990966796875, -2.7078857421875, -2.4248046875, -2.1417236328125, -1.858642578125, -1.5755615234375, -1.29248046875, -1.0093994140625, -0.726318359375, -0.4432373046875, -0.16015625, 0.1229248046875, 0.406005859375, 0.6890869140625, 0.97216796875, 1.2552490234375, 1.538330078125, 1.8214111328125, 2.1044921875, 2.3875732421875, 2.670654296875, 2.9537353515625, 3.23681640625, 3.5198974609375, 3.802978515625, 4.0860595703125, 4.369140625, 4.6522216796875, 4.935302734375, 5.2183837890625, 5.50146484375, 5.7845458984375, 6.067626953125, 6.3507080078125, 6.6337890625, 6.9168701171875, 7.199951171875, 7.4830322265625, 7.76611328125, 8.0491943359375, 8.332275390625, 8.6153564453125, 8.8984375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 7.0, 11.0, 11.0, 26.0, 33.0, 42.0, 53.0, 79.0, 85.0, 85.0, 95.0, 105.0, 85.0, 84.0, 48.0, 46.0, 36.0, 31.0, 11.0, 6.0, 7.0, 2.0, 1.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.228515625, -2.162017822265625, -2.09552001953125, -2.029022216796875, -1.9625244140625, -1.896026611328125, -1.82952880859375, -1.763031005859375, -1.696533203125, -1.630035400390625, -1.56353759765625, -1.497039794921875, -1.4305419921875, -1.364044189453125, -1.29754638671875, -1.231048583984375, -1.16455078125, -1.098052978515625, -1.03155517578125, -0.965057373046875, -0.8985595703125, -0.832061767578125, -0.76556396484375, -0.699066162109375, -0.632568359375, -0.566070556640625, -0.49957275390625, -0.433074951171875, -0.3665771484375, -0.300079345703125, -0.23358154296875, -0.167083740234375, -0.1005859375, -0.034088134765625, 0.03240966796875, 0.098907470703125, 0.1654052734375, 0.231903076171875, 0.29840087890625, 0.364898681640625, 0.431396484375, 0.497894287109375, 0.56439208984375, 0.630889892578125, 0.6973876953125, 0.763885498046875, 0.83038330078125, 0.896881103515625, 0.96337890625, 1.029876708984375, 1.09637451171875, 1.162872314453125, 1.2293701171875, 1.295867919921875, 1.36236572265625, 1.428863525390625, 1.495361328125, 1.561859130859375, 1.62835693359375, 1.694854736328125, 1.7613525390625, 1.827850341796875, 1.89434814453125, 1.960845947265625, 2.02734375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 1.0, 4.0, 3.0, 6.0, 9.0, 11.0, 6.0, 13.0, 14.0, 18.0, 36.0, 42.0, 45.0, 54.0, 88.0, 184.0, 358.0, 829.0, 2221.0, 5789.0, 17917.0, 64939.0, 278442.0, 490337.0, 136774.0, 34475.0, 10207.0, 3304.0, 1247.0, 535.0, 218.0, 127.0, 85.0, 61.0, 42.0, 27.0, 17.0, 14.0, 9.0, 8.0, 4.0, 7.0, 6.0, 4.0, 4.0, 4.0, 2.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-6.90234375, -6.6815185546875, -6.460693359375, -6.2398681640625, -6.01904296875, -5.7982177734375, -5.577392578125, -5.3565673828125, -5.1357421875, -4.9149169921875, -4.694091796875, -4.4732666015625, -4.25244140625, -4.0316162109375, -3.810791015625, -3.5899658203125, -3.369140625, -3.1483154296875, -2.927490234375, -2.7066650390625, -2.48583984375, -2.2650146484375, -2.044189453125, -1.8233642578125, -1.6025390625, -1.3817138671875, -1.160888671875, -0.9400634765625, -0.71923828125, -0.4984130859375, -0.277587890625, -0.0567626953125, 0.1640625, 0.3848876953125, 0.605712890625, 0.8265380859375, 1.04736328125, 1.2681884765625, 1.489013671875, 1.7098388671875, 1.9306640625, 2.1514892578125, 2.372314453125, 2.5931396484375, 2.81396484375, 3.0347900390625, 3.255615234375, 3.4764404296875, 3.697265625, 3.9180908203125, 4.138916015625, 4.3597412109375, 4.58056640625, 4.8013916015625, 5.022216796875, 5.2430419921875, 5.4638671875, 5.6846923828125, 5.905517578125, 6.1263427734375, 6.34716796875, 6.5679931640625, 6.788818359375, 7.0096435546875, 7.23046875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0, 6.0, 4.0, 6.0, 4.0, 6.0, 13.0, 15.0, 12.0, 16.0, 22.0, 15.0, 21.0, 31.0, 24.0, 36.0, 27.0, 36.0, 45.0, 46.0, 50.0, 37.0, 43.0, 41.0, 45.0, 44.0, 32.0, 35.0, 33.0, 24.0, 36.0, 24.0, 21.0, 23.0, 21.0, 24.0, 17.0, 8.0, 9.0, 8.0, 8.0, 7.0, 4.0, 6.0, 4.0, 6.0, 5.0, 3.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0], "bins": [-4.81640625, -4.6702880859375, -4.524169921875, -4.3780517578125, -4.23193359375, -4.0858154296875, -3.939697265625, -3.7935791015625, -3.6474609375, -3.5013427734375, -3.355224609375, -3.2091064453125, -3.06298828125, -2.9168701171875, -2.770751953125, -2.6246337890625, -2.478515625, -2.3323974609375, -2.186279296875, -2.0401611328125, -1.89404296875, -1.7479248046875, -1.601806640625, -1.4556884765625, -1.3095703125, -1.1634521484375, -1.017333984375, -0.8712158203125, -0.72509765625, -0.5789794921875, -0.432861328125, -0.2867431640625, -0.140625, 0.0054931640625, 0.151611328125, 0.2977294921875, 0.44384765625, 0.5899658203125, 0.736083984375, 0.8822021484375, 1.0283203125, 1.1744384765625, 1.320556640625, 1.4666748046875, 1.61279296875, 1.7589111328125, 1.905029296875, 2.0511474609375, 2.197265625, 2.3433837890625, 2.489501953125, 2.6356201171875, 2.78173828125, 2.9278564453125, 3.073974609375, 3.2200927734375, 3.3662109375, 3.5123291015625, 3.658447265625, 3.8045654296875, 3.95068359375, 4.0968017578125, 4.242919921875, 4.3890380859375, 4.53515625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 9.0, 4.0, 1.0, 6.0, 8.0, 8.0, 16.0, 13.0, 31.0, 71.0, 124.0, 313.0, 680.0, 1901.0, 7084.0, 60144.0, 886713.0, 79874.0, 7956.0, 2194.0, 771.0, 310.0, 141.0, 67.0, 42.0, 21.0, 16.0, 7.0, 7.0, 6.0, 5.0, 4.0, 0.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.2734375, -7.0428466796875, -6.812255859375, -6.5816650390625, -6.35107421875, -6.1204833984375, -5.889892578125, -5.6593017578125, -5.4287109375, -5.1981201171875, -4.967529296875, -4.7369384765625, -4.50634765625, -4.2757568359375, -4.045166015625, -3.8145751953125, -3.583984375, -3.3533935546875, -3.122802734375, -2.8922119140625, -2.66162109375, -2.4310302734375, -2.200439453125, -1.9698486328125, -1.7392578125, -1.5086669921875, -1.278076171875, -1.0474853515625, -0.81689453125, -0.5863037109375, -0.355712890625, -0.1251220703125, 0.10546875, 0.3360595703125, 0.566650390625, 0.7972412109375, 1.02783203125, 1.2584228515625, 1.489013671875, 1.7196044921875, 1.9501953125, 2.1807861328125, 2.411376953125, 2.6419677734375, 2.87255859375, 3.1031494140625, 3.333740234375, 3.5643310546875, 3.794921875, 4.0255126953125, 4.256103515625, 4.4866943359375, 4.71728515625, 4.9478759765625, 5.178466796875, 5.4090576171875, 5.6396484375, 5.8702392578125, 6.100830078125, 6.3314208984375, 6.56201171875, 6.7926025390625, 7.023193359375, 7.2537841796875, 7.484375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 1.0, 2.0, 4.0, 4.0, 9.0, 13.0, 19.0, 30.0, 43.0, 72.0, 102.0, 116.0, 129.0, 118.0, 88.0, 74.0, 50.0, 33.0, 23.0, 20.0, 9.0, 14.0, 9.0, 6.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005321502685546875, -0.0005148202180862427, -0.0004974901676177979, -0.00048016011714935303, -0.0004628300666809082, -0.0004455000162124634, -0.00042816996574401855, -0.00041083991527557373, -0.0003935098648071289, -0.0003761798143386841, -0.00035884976387023926, -0.00034151971340179443, -0.0003241896629333496, -0.0003068596124649048, -0.00028952956199645996, -0.00027219951152801514, -0.0002548694610595703, -0.0002375394105911255, -0.00022020936012268066, -0.00020287930965423584, -0.00018554925918579102, -0.0001682192087173462, -0.00015088915824890137, -0.00013355910778045654, -0.00011622905731201172, -9.88990068435669e-05, -8.156895637512207e-05, -6.423890590667725e-05, -4.690885543823242e-05, -2.9578804969787598e-05, -1.2248754501342773e-05, 5.081295967102051e-06, 2.2411346435546875e-05, 3.97413969039917e-05, 5.7071447372436523e-05, 7.440149784088135e-05, 9.173154830932617e-05, 0.000109061598777771, 0.00012639164924621582, 0.00014372169971466064, 0.00016105175018310547, 0.0001783818006515503, 0.00019571185111999512, 0.00021304190158843994, 0.00023037195205688477, 0.0002477020025253296, 0.0002650320529937744, 0.00028236210346221924, 0.00029969215393066406, 0.0003170222043991089, 0.0003343522548675537, 0.00035168230533599854, 0.00036901235580444336, 0.0003863424062728882, 0.000403672456741333, 0.00042100250720977783, 0.00043833255767822266, 0.0004556626081466675, 0.0004729926586151123, 0.0004903227090835571, 0.000507652759552002, 0.0005249828100204468, 0.0005423128604888916, 0.0005596429109573364, 0.0005769729614257812]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 9.0, 5.0, 23.0, 27.0, 40.0, 84.0, 182.0, 443.0, 1587.0, 8607.0, 309516.0, 713308.0, 11816.0, 1904.0, 567.0, 196.0, 103.0, 48.0, 33.0, 17.0, 13.0, 4.0, 5.0, 6.0, 1.0, 2.0, 9.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.2109375, -8.8829345703125, -8.554931640625, -8.2269287109375, -7.89892578125, -7.5709228515625, -7.242919921875, -6.9149169921875, -6.5869140625, -6.2589111328125, -5.930908203125, -5.6029052734375, -5.27490234375, -4.9468994140625, -4.618896484375, -4.2908935546875, -3.962890625, -3.6348876953125, -3.306884765625, -2.9788818359375, -2.65087890625, -2.3228759765625, -1.994873046875, -1.6668701171875, -1.3388671875, -1.0108642578125, -0.682861328125, -0.3548583984375, -0.02685546875, 0.3011474609375, 0.629150390625, 0.9571533203125, 1.28515625, 1.6131591796875, 1.941162109375, 2.2691650390625, 2.59716796875, 2.9251708984375, 3.253173828125, 3.5811767578125, 3.9091796875, 4.2371826171875, 4.565185546875, 4.8931884765625, 5.22119140625, 5.5491943359375, 5.877197265625, 6.2052001953125, 6.533203125, 6.8612060546875, 7.189208984375, 7.5172119140625, 7.84521484375, 8.1732177734375, 8.501220703125, 8.8292236328125, 9.1572265625, 9.4852294921875, 9.813232421875, 10.1412353515625, 10.46923828125, 10.7972412109375, 11.125244140625, 11.4532470703125, 11.78125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 5.0, 11.0, 12.0, 31.0, 42.0, 90.0, 200.0, 229.0, 171.0, 90.0, 45.0, 24.0, 12.0, 12.0, 11.0, 8.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.61328125, -3.43609619140625, -3.2589111328125, -3.08172607421875, -2.904541015625, -2.72735595703125, -2.5501708984375, -2.37298583984375, -2.19580078125, -2.01861572265625, -1.8414306640625, -1.66424560546875, -1.487060546875, -1.30987548828125, -1.1326904296875, -0.95550537109375, -0.7783203125, -0.60113525390625, -0.4239501953125, -0.24676513671875, -0.069580078125, 0.10760498046875, 0.2847900390625, 0.46197509765625, 0.63916015625, 0.81634521484375, 0.9935302734375, 1.17071533203125, 1.347900390625, 1.52508544921875, 1.7022705078125, 1.87945556640625, 2.056640625, 2.23382568359375, 2.4110107421875, 2.58819580078125, 2.765380859375, 2.94256591796875, 3.1197509765625, 3.29693603515625, 3.47412109375, 3.65130615234375, 3.8284912109375, 4.00567626953125, 4.182861328125, 4.36004638671875, 4.5372314453125, 4.71441650390625, 4.8916015625, 5.06878662109375, 5.2459716796875, 5.42315673828125, 5.600341796875, 5.77752685546875, 5.9547119140625, 6.13189697265625, 6.30908203125, 6.48626708984375, 6.6634521484375, 6.84063720703125, 7.017822265625, 7.19500732421875, 7.3721923828125, 7.54937744140625, 7.7265625]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 5.0, 5.0, 10.0, 10.0, 19.0, 34.0, 59.0, 111.0, 175.0, 200.0, 160.0, 106.0, 49.0, 31.0, 17.0, 8.0, 5.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.546142578125, -57.65206527709961, -55.75798797607422, -53.863914489746094, -51.9698371887207, -50.07575988769531, -48.18168258666992, -46.28760528564453, -44.393531799316406, -42.499454498291016, -40.605377197265625, -38.7113037109375, -36.81722640991211, -34.92314910888672, -33.02907180786133, -31.134994506835938, -29.240917205810547, -27.346839904785156, -25.4527645111084, -23.558687210083008, -21.66461181640625, -19.77053451538086, -17.87645721435547, -15.982380867004395, -14.08830451965332, -12.194228172302246, -10.300151824951172, -8.406074523925781, -6.511998176574707, -4.617921829223633, -2.723844528198242, -0.829768180847168, 1.0643081665039062, 2.9583847522735596, 4.852461338043213, 6.746538162231445, 8.64061450958252, 10.534690856933594, 12.428768157958984, 14.322844505310059, 16.216920852661133, 18.110998153686523, 20.00507354736328, 21.899150848388672, 23.793228149414062, 25.68730354309082, 27.58138084411621, 29.47545623779297, 31.36953353881836, 33.26361083984375, 35.15768814086914, 37.05176544189453, 38.945838928222656, 40.83991622924805, 42.73399353027344, 44.62807083129883, 46.52214813232422, 48.41622543334961, 50.310302734375, 52.204376220703125, 54.098453521728516, 55.992530822753906, 57.8866081237793, 59.78068542480469, 61.67475891113281]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 4.0, 1.0, 4.0, 11.0, 12.0, 9.0, 13.0, 20.0, 19.0, 25.0, 35.0, 28.0, 34.0, 54.0, 47.0, 51.0, 53.0, 60.0, 64.0, 56.0, 53.0, 47.0, 45.0, 44.0, 35.0, 31.0, 36.0, 26.0, 14.0, 13.0, 18.0, 15.0, 9.0, 6.0, 6.0, 5.0, 2.0, 0.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-31.852067947387695, -30.700029373168945, -29.547992706298828, -28.395954132080078, -27.243915557861328, -26.09187889099121, -24.93984031677246, -23.787803649902344, -22.635765075683594, -21.483726501464844, -20.331689834594727, -19.179651260375977, -18.02761459350586, -16.87557601928711, -15.72353744506836, -14.571499824523926, -13.419462203979492, -12.267424583435059, -11.115386962890625, -9.963348388671875, -8.811310768127441, -7.659273147583008, -6.507235050201416, -5.355196952819824, -4.203159332275391, -3.051121473312378, -1.8990836143493652, -0.7470457553863525, 0.40499210357666016, 1.5570297241210938, 2.7090678215026855, 3.8611059188842773, 5.013145446777344, 6.165183067321777, 7.317221164703369, 8.469259262084961, 9.621296882629395, 10.773334503173828, 11.925373077392578, 13.077410697937012, 14.229448318481445, 15.381485939025879, 16.533523559570312, 17.685562133789062, 18.837600708007812, 19.98963737487793, 21.14167594909668, 22.293712615966797, 23.445751190185547, 24.597789764404297, 25.749826431274414, 26.901865005493164, 28.05390167236328, 29.20594024658203, 30.35797882080078, 31.51001739501953, 32.66205596923828, 33.81409454345703, 34.96613311767578, 36.118167877197266, 37.270206451416016, 38.422245025634766, 39.574283599853516, 40.726322174072266, 41.87835693359375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 9.0, 9.0, 6.0, 11.0, 19.0, 18.0, 33.0, 49.0, 53.0, 87.0, 143.0, 254.0, 484.0, 801.0, 1899.0, 6020.0, 26776.0, 2463611.0, 1657960.0, 26357.0, 5933.0, 1936.0, 841.0, 361.0, 258.0, 121.0, 88.0, 48.0, 29.0, 22.0, 14.0, 4.0, 9.0, 8.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.265625, -11.8939208984375, -11.522216796875, -11.1505126953125, -10.77880859375, -10.4071044921875, -10.035400390625, -9.6636962890625, -9.2919921875, -8.9202880859375, -8.548583984375, -8.1768798828125, -7.80517578125, -7.4334716796875, -7.061767578125, -6.6900634765625, -6.318359375, -5.9466552734375, -5.574951171875, -5.2032470703125, -4.83154296875, -4.4598388671875, -4.088134765625, -3.7164306640625, -3.3447265625, -2.9730224609375, -2.601318359375, -2.2296142578125, -1.85791015625, -1.4862060546875, -1.114501953125, -0.7427978515625, -0.37109375, 0.0006103515625, 0.372314453125, 0.7440185546875, 1.11572265625, 1.4874267578125, 1.859130859375, 2.2308349609375, 2.6025390625, 2.9742431640625, 3.345947265625, 3.7176513671875, 4.08935546875, 4.4610595703125, 4.832763671875, 5.2044677734375, 5.576171875, 5.9478759765625, 6.319580078125, 6.6912841796875, 7.06298828125, 7.4346923828125, 7.806396484375, 8.1781005859375, 8.5498046875, 8.9215087890625, 9.293212890625, 9.6649169921875, 10.03662109375, 10.4083251953125, 10.780029296875, 11.1517333984375, 11.5234375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 8.0, 15.0, 27.0, 34.0, 33.0, 60.0, 71.0, 73.0, 85.0, 121.0, 103.0, 93.0, 66.0, 71.0, 36.0, 36.0, 26.0, 9.0, 10.0, 5.0, 2.0, 4.0, 3.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.59375, -2.516510009765625, -2.43927001953125, -2.362030029296875, -2.2847900390625, -2.207550048828125, -2.13031005859375, -2.053070068359375, -1.975830078125, -1.898590087890625, -1.82135009765625, -1.744110107421875, -1.6668701171875, -1.589630126953125, -1.51239013671875, -1.435150146484375, -1.35791015625, -1.280670166015625, -1.20343017578125, -1.126190185546875, -1.0489501953125, -0.971710205078125, -0.89447021484375, -0.817230224609375, -0.739990234375, -0.662750244140625, -0.58551025390625, -0.508270263671875, -0.4310302734375, -0.353790283203125, -0.27655029296875, -0.199310302734375, -0.1220703125, -0.044830322265625, 0.03240966796875, 0.109649658203125, 0.1868896484375, 0.264129638671875, 0.34136962890625, 0.418609619140625, 0.495849609375, 0.573089599609375, 0.65032958984375, 0.727569580078125, 0.8048095703125, 0.882049560546875, 0.95928955078125, 1.036529541015625, 1.11376953125, 1.191009521484375, 1.26824951171875, 1.345489501953125, 1.4227294921875, 1.499969482421875, 1.57720947265625, 1.654449462890625, 1.731689453125, 1.808929443359375, 1.88616943359375, 1.963409423828125, 2.0406494140625, 2.117889404296875, 2.19512939453125, 2.272369384765625, 2.349609375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 5.0, 6.0, 12.0, 20.0, 31.0, 37.0, 60.0, 80.0, 210.0, 741.0, 5721.0, 150389.0, 4017096.0, 17554.0, 1702.0, 336.0, 110.0, 58.0, 42.0, 23.0, 16.0, 12.0, 11.0, 6.0, 4.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.625, -20.953857421875, -20.28271484375, -19.611572265625, -18.9404296875, -18.269287109375, -17.59814453125, -16.927001953125, -16.255859375, -15.584716796875, -14.91357421875, -14.242431640625, -13.5712890625, -12.900146484375, -12.22900390625, -11.557861328125, -10.88671875, -10.215576171875, -9.54443359375, -8.873291015625, -8.2021484375, -7.531005859375, -6.85986328125, -6.188720703125, -5.517578125, -4.846435546875, -4.17529296875, -3.504150390625, -2.8330078125, -2.161865234375, -1.49072265625, -0.819580078125, -0.1484375, 0.522705078125, 1.19384765625, 1.864990234375, 2.5361328125, 3.207275390625, 3.87841796875, 4.549560546875, 5.220703125, 5.891845703125, 6.56298828125, 7.234130859375, 7.9052734375, 8.576416015625, 9.24755859375, 9.918701171875, 10.58984375, 11.260986328125, 11.93212890625, 12.603271484375, 13.2744140625, 13.945556640625, 14.61669921875, 15.287841796875, 15.958984375, 16.630126953125, 17.30126953125, 17.972412109375, 18.6435546875, 19.314697265625, 19.98583984375, 20.656982421875, 21.328125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 7.0, 7.0, 10.0, 7.0, 17.0, 30.0, 70.0, 168.0, 848.0, 2594.0, 186.0, 62.0, 31.0, 17.0, 14.0, 9.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.5859375, -7.421295166015625, -7.25665283203125, -7.092010498046875, -6.9273681640625, -6.762725830078125, -6.59808349609375, -6.433441162109375, -6.268798828125, -6.104156494140625, -5.93951416015625, -5.774871826171875, -5.6102294921875, -5.445587158203125, -5.28094482421875, -5.116302490234375, -4.95166015625, -4.787017822265625, -4.62237548828125, -4.457733154296875, -4.2930908203125, -4.128448486328125, -3.96380615234375, -3.799163818359375, -3.634521484375, -3.469879150390625, -3.30523681640625, -3.140594482421875, -2.9759521484375, -2.811309814453125, -2.64666748046875, -2.482025146484375, -2.3173828125, -2.152740478515625, -1.98809814453125, -1.823455810546875, -1.6588134765625, -1.494171142578125, -1.32952880859375, -1.164886474609375, -1.000244140625, -0.835601806640625, -0.67095947265625, -0.506317138671875, -0.3416748046875, -0.177032470703125, -0.01239013671875, 0.152252197265625, 0.31689453125, 0.481536865234375, 0.64617919921875, 0.810821533203125, 0.9754638671875, 1.140106201171875, 1.30474853515625, 1.469390869140625, 1.634033203125, 1.798675537109375, 1.96331787109375, 2.127960205078125, 2.2926025390625, 2.457244873046875, 2.62188720703125, 2.786529541015625, 2.951171875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 13.0, 15.0, 66.0, 171.0, 371.0, 221.0, 96.0, 29.0, 10.0, 10.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.182174682617188, -18.104724884033203, -17.02727699279785, -15.949827194213867, -14.8723783493042, -13.794929504394531, -12.717479705810547, -11.640030860900879, -10.562582015991211, -9.485133171081543, -8.407684326171875, -7.330234527587891, -6.252785682678223, -5.175336837768555, -4.0978875160217285, -3.0204381942749023, -1.9429893493652344, -0.8655402660369873, 0.21190881729125977, 1.2893579006195068, 2.366806983947754, 3.444255828857422, 4.521705150604248, 5.599154472351074, 6.676603317260742, 7.75405216217041, 8.831501007080078, 9.908950805664062, 10.98639965057373, 12.063848495483398, 13.141298294067383, 14.21874713897705, 15.296192169189453, 16.373641967773438, 17.45108985900879, 18.528539657592773, 19.605987548828125, 20.68343734741211, 21.760887145996094, 22.838336944580078, 23.91578483581543, 24.993234634399414, 26.070682525634766, 27.14813232421875, 28.225582122802734, 29.303030014038086, 30.38047981262207, 31.457927703857422, 32.535377502441406, 33.61282730102539, 34.690277099609375, 35.767723083496094, 36.84517288208008, 37.92262268066406, 39.00007247924805, 40.07752227783203, 41.15496826171875, 42.232418060302734, 43.30986785888672, 44.38731384277344, 45.46476364135742, 46.542213439941406, 47.61966323852539, 48.697113037109375, 49.77456283569336]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 4.0, 7.0, 5.0, 7.0, 5.0, 14.0, 10.0, 8.0, 11.0, 19.0, 17.0, 17.0, 18.0, 29.0, 18.0, 25.0, 32.0, 30.0, 41.0, 35.0, 43.0, 44.0, 42.0, 38.0, 42.0, 49.0, 30.0, 31.0, 42.0, 34.0, 23.0, 26.0, 16.0, 26.0, 21.0, 26.0, 15.0, 11.0, 10.0, 12.0, 14.0, 11.0, 8.0, 9.0, 4.0, 6.0, 4.0, 3.0, 3.0, 2.0, 1.0, 5.0, 1.0, 0.0, 2.0, 2.0], "bins": [-6.807323932647705, -6.588171482086182, -6.369019031524658, -6.149866104125977, -5.930713653564453, -5.71156120300293, -5.492408752441406, -5.273256301879883, -5.054103851318359, -4.834951400756836, -4.6157989501953125, -4.396646499633789, -4.177493572235107, -3.958341121673584, -3.7391886711120605, -3.520036220550537, -3.3008832931518555, -3.081730842590332, -2.8625781536102295, -2.643425703048706, -2.4242730140686035, -2.20512056350708, -1.9859681129455566, -1.7668155431747437, -1.5476629734039307, -1.3285104036331177, -1.1093578338623047, -0.8902053833007812, -0.6710528135299683, -0.4519002437591553, -0.23274779319763184, -0.013595223426818848, 0.20555782318115234, 0.42471036314964294, 0.6438629031181335, 0.8630154132843018, 1.0821679830551147, 1.3013205528259277, 1.5204730033874512, 1.7396255731582642, 1.9587781429290771, 2.1779305934906006, 2.397083282470703, 2.6162357330322266, 2.83538818359375, 3.0545408725738525, 3.273693323135376, 3.4928460121154785, 3.711998462677002, 3.9311509132385254, 4.150303363800049, 4.3694562911987305, 4.588608741760254, 4.807761192321777, 5.026913642883301, 5.246066093444824, 5.465218544006348, 5.684370994567871, 5.9035234451293945, 6.122675895690918, 6.3418288230896, 6.560981273651123, 6.7801337242126465, 6.99928617477417, 7.218439102172852]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 5.0, 9.0, 15.0, 10.0, 21.0, 21.0, 24.0, 50.0, 70.0, 87.0, 144.0, 204.0, 222.0, 412.0, 623.0, 942.0, 1732.0, 3327.0, 7465.0, 20194.0, 64971.0, 234721.0, 472827.0, 166232.0, 46149.0, 15280.0, 5889.0, 2758.0, 1491.0, 884.0, 546.0, 355.0, 273.0, 170.0, 115.0, 82.0, 63.0, 51.0, 37.0, 22.0, 17.0, 14.0, 12.0, 7.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-7.19140625, -6.95458984375, -6.7177734375, -6.48095703125, -6.244140625, -6.00732421875, -5.7705078125, -5.53369140625, -5.296875, -5.06005859375, -4.8232421875, -4.58642578125, -4.349609375, -4.11279296875, -3.8759765625, -3.63916015625, -3.40234375, -3.16552734375, -2.9287109375, -2.69189453125, -2.455078125, -2.21826171875, -1.9814453125, -1.74462890625, -1.5078125, -1.27099609375, -1.0341796875, -0.79736328125, -0.560546875, -0.32373046875, -0.0869140625, 0.14990234375, 0.38671875, 0.62353515625, 0.8603515625, 1.09716796875, 1.333984375, 1.57080078125, 1.8076171875, 2.04443359375, 2.28125, 2.51806640625, 2.7548828125, 2.99169921875, 3.228515625, 3.46533203125, 3.7021484375, 3.93896484375, 4.17578125, 4.41259765625, 4.6494140625, 4.88623046875, 5.123046875, 5.35986328125, 5.5966796875, 5.83349609375, 6.0703125, 6.30712890625, 6.5439453125, 6.78076171875, 7.017578125, 7.25439453125, 7.4912109375, 7.72802734375, 7.96484375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 14.0, 13.0, 32.0, 37.0, 42.0, 63.0, 87.0, 91.0, 113.0, 100.0, 100.0, 86.0, 63.0, 49.0, 37.0, 26.0, 14.0, 9.0, 5.0, 1.0, 8.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.64453125, -2.5616455078125, -2.478759765625, -2.3958740234375, -2.31298828125, -2.2301025390625, -2.147216796875, -2.0643310546875, -1.9814453125, -1.8985595703125, -1.815673828125, -1.7327880859375, -1.64990234375, -1.5670166015625, -1.484130859375, -1.4012451171875, -1.318359375, -1.2354736328125, -1.152587890625, -1.0697021484375, -0.98681640625, -0.9039306640625, -0.821044921875, -0.7381591796875, -0.6552734375, -0.5723876953125, -0.489501953125, -0.4066162109375, -0.32373046875, -0.2408447265625, -0.157958984375, -0.0750732421875, 0.0078125, 0.0906982421875, 0.173583984375, 0.2564697265625, 0.33935546875, 0.4222412109375, 0.505126953125, 0.5880126953125, 0.6708984375, 0.7537841796875, 0.836669921875, 0.9195556640625, 1.00244140625, 1.0853271484375, 1.168212890625, 1.2510986328125, 1.333984375, 1.4168701171875, 1.499755859375, 1.5826416015625, 1.66552734375, 1.7484130859375, 1.831298828125, 1.9141845703125, 1.9970703125, 2.0799560546875, 2.162841796875, 2.2457275390625, 2.32861328125, 2.4114990234375, 2.494384765625, 2.5772705078125, 2.66015625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 1.0, 4.0, 6.0, 6.0, 6.0, 7.0, 18.0, 12.0, 24.0, 28.0, 41.0, 57.0, 78.0, 157.0, 305.0, 649.0, 1650.0, 4633.0, 14728.0, 56839.0, 250105.0, 524594.0, 145214.0, 34437.0, 9646.0, 3070.0, 1151.0, 488.0, 238.0, 113.0, 87.0, 33.0, 24.0, 21.0, 21.0, 17.0, 5.0, 9.0, 11.0, 7.0, 4.0, 4.0, 0.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.1875, -6.950439453125, -6.71337890625, -6.476318359375, -6.2392578125, -6.002197265625, -5.76513671875, -5.528076171875, -5.291015625, -5.053955078125, -4.81689453125, -4.579833984375, -4.3427734375, -4.105712890625, -3.86865234375, -3.631591796875, -3.39453125, -3.157470703125, -2.92041015625, -2.683349609375, -2.4462890625, -2.209228515625, -1.97216796875, -1.735107421875, -1.498046875, -1.260986328125, -1.02392578125, -0.786865234375, -0.5498046875, -0.312744140625, -0.07568359375, 0.161376953125, 0.3984375, 0.635498046875, 0.87255859375, 1.109619140625, 1.3466796875, 1.583740234375, 1.82080078125, 2.057861328125, 2.294921875, 2.531982421875, 2.76904296875, 3.006103515625, 3.2431640625, 3.480224609375, 3.71728515625, 3.954345703125, 4.19140625, 4.428466796875, 4.66552734375, 4.902587890625, 5.1396484375, 5.376708984375, 5.61376953125, 5.850830078125, 6.087890625, 6.324951171875, 6.56201171875, 6.799072265625, 7.0361328125, 7.273193359375, 7.51025390625, 7.747314453125, 7.984375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 4.0, 13.0, 8.0, 10.0, 14.0, 9.0, 11.0, 22.0, 22.0, 23.0, 29.0, 27.0, 27.0, 28.0, 43.0, 37.0, 37.0, 32.0, 45.0, 42.0, 41.0, 45.0, 32.0, 39.0, 44.0, 39.0, 27.0, 21.0, 24.0, 22.0, 27.0, 21.0, 23.0, 25.0, 14.0, 5.0, 13.0, 9.0, 9.0, 5.0, 10.0, 7.0, 4.0, 4.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.21484375, -5.0567626953125, -4.898681640625, -4.7406005859375, -4.58251953125, -4.4244384765625, -4.266357421875, -4.1082763671875, -3.9501953125, -3.7921142578125, -3.634033203125, -3.4759521484375, -3.31787109375, -3.1597900390625, -3.001708984375, -2.8436279296875, -2.685546875, -2.5274658203125, -2.369384765625, -2.2113037109375, -2.05322265625, -1.8951416015625, -1.737060546875, -1.5789794921875, -1.4208984375, -1.2628173828125, -1.104736328125, -0.9466552734375, -0.78857421875, -0.6304931640625, -0.472412109375, -0.3143310546875, -0.15625, 0.0018310546875, 0.159912109375, 0.3179931640625, 0.47607421875, 0.6341552734375, 0.792236328125, 0.9503173828125, 1.1083984375, 1.2664794921875, 1.424560546875, 1.5826416015625, 1.74072265625, 1.8988037109375, 2.056884765625, 2.2149658203125, 2.373046875, 2.5311279296875, 2.689208984375, 2.8472900390625, 3.00537109375, 3.1634521484375, 3.321533203125, 3.4796142578125, 3.6376953125, 3.7957763671875, 3.953857421875, 4.1119384765625, 4.27001953125, 4.4281005859375, 4.586181640625, 4.7442626953125, 4.90234375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 3.0, 4.0, 5.0, 8.0, 6.0, 7.0, 10.0, 24.0, 19.0, 34.0, 45.0, 91.0, 162.0, 296.0, 614.0, 1337.0, 3231.0, 9579.0, 48739.0, 639140.0, 307368.0, 26496.0, 6717.0, 2449.0, 1139.0, 454.0, 252.0, 117.0, 76.0, 36.0, 31.0, 16.0, 11.0, 10.0, 13.0, 6.0, 3.0, 2.0, 6.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.56640625, -5.3916015625, -5.216796875, -5.0419921875, -4.8671875, -4.6923828125, -4.517578125, -4.3427734375, -4.16796875, -3.9931640625, -3.818359375, -3.6435546875, -3.46875, -3.2939453125, -3.119140625, -2.9443359375, -2.76953125, -2.5947265625, -2.419921875, -2.2451171875, -2.0703125, -1.8955078125, -1.720703125, -1.5458984375, -1.37109375, -1.1962890625, -1.021484375, -0.8466796875, -0.671875, -0.4970703125, -0.322265625, -0.1474609375, 0.02734375, 0.2021484375, 0.376953125, 0.5517578125, 0.7265625, 0.9013671875, 1.076171875, 1.2509765625, 1.42578125, 1.6005859375, 1.775390625, 1.9501953125, 2.125, 2.2998046875, 2.474609375, 2.6494140625, 2.82421875, 2.9990234375, 3.173828125, 3.3486328125, 3.5234375, 3.6982421875, 3.873046875, 4.0478515625, 4.22265625, 4.3974609375, 4.572265625, 4.7470703125, 4.921875, 5.0966796875, 5.271484375, 5.4462890625, 5.62109375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 5.0, 3.0, 13.0, 12.0, 20.0, 31.0, 58.0, 72.0, 133.0, 173.0, 175.0, 106.0, 77.0, 44.0, 23.0, 14.0, 9.0, 9.0, 3.0, 5.0, 4.0, 6.0, 1.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005078315734863281, -0.00048207491636276245, -0.0004563182592391968, -0.0004305616021156311, -0.00040480494499206543, -0.00037904828786849976, -0.0003532916307449341, -0.0003275349736213684, -0.00030177831649780273, -0.00027602165937423706, -0.0002502650022506714, -0.0002245083451271057, -0.00019875168800354004, -0.00017299503087997437, -0.0001472383737564087, -0.00012148171663284302, -9.572505950927734e-05, -6.996840238571167e-05, -4.4211745262145996e-05, -1.8455088138580322e-05, 7.3015689849853516e-06, 3.3058226108551025e-05, 5.88148832321167e-05, 8.457154035568237e-05, 0.00011032819747924805, 0.00013608485460281372, 0.0001618415117263794, 0.00018759816884994507, 0.00021335482597351074, 0.00023911148309707642, 0.0002648681402206421, 0.00029062479734420776, 0.00031638145446777344, 0.0003421381115913391, 0.0003678947687149048, 0.00039365142583847046, 0.00041940808296203613, 0.0004451647400856018, 0.0004709213972091675, 0.0004966780543327332, 0.0005224347114562988, 0.0005481913685798645, 0.0005739480257034302, 0.0005997046828269958, 0.0006254613399505615, 0.0006512179970741272, 0.0006769746541976929, 0.0007027313113212585, 0.0007284879684448242, 0.0007542446255683899, 0.0007800012826919556, 0.0008057579398155212, 0.0008315145969390869, 0.0008572712540626526, 0.0008830279111862183, 0.0009087845683097839, 0.0009345412254333496, 0.0009602978825569153, 0.000986054539680481, 0.0010118111968040466, 0.0010375678539276123, 0.001063324511051178, 0.0010890811681747437, 0.0011148378252983093, 0.001140594482421875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 11.0, 6.0, 12.0, 16.0, 29.0, 62.0, 143.0, 409.0, 1559.0, 8687.0, 520446.0, 506274.0, 8678.0, 1476.0, 450.0, 138.0, 68.0, 29.0, 13.0, 15.0, 7.0, 8.0, 4.0, 3.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.578125, -13.200927734375, -12.82373046875, -12.446533203125, -12.0693359375, -11.692138671875, -11.31494140625, -10.937744140625, -10.560546875, -10.183349609375, -9.80615234375, -9.428955078125, -9.0517578125, -8.674560546875, -8.29736328125, -7.920166015625, -7.54296875, -7.165771484375, -6.78857421875, -6.411376953125, -6.0341796875, -5.656982421875, -5.27978515625, -4.902587890625, -4.525390625, -4.148193359375, -3.77099609375, -3.393798828125, -3.0166015625, -2.639404296875, -2.26220703125, -1.885009765625, -1.5078125, -1.130615234375, -0.75341796875, -0.376220703125, 0.0009765625, 0.378173828125, 0.75537109375, 1.132568359375, 1.509765625, 1.886962890625, 2.26416015625, 2.641357421875, 3.0185546875, 3.395751953125, 3.77294921875, 4.150146484375, 4.52734375, 4.904541015625, 5.28173828125, 5.658935546875, 6.0361328125, 6.413330078125, 6.79052734375, 7.167724609375, 7.544921875, 7.922119140625, 8.29931640625, 8.676513671875, 9.0537109375, 9.430908203125, 9.80810546875, 10.185302734375, 10.5625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 3.0, 9.0, 3.0, 5.0, 10.0, 19.0, 27.0, 50.0, 89.0, 117.0, 143.0, 148.0, 100.0, 99.0, 56.0, 44.0, 24.0, 12.0, 8.0, 9.0, 3.0, 7.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8828125, -4.7479248046875, -4.613037109375, -4.4781494140625, -4.34326171875, -4.2083740234375, -4.073486328125, -3.9385986328125, -3.8037109375, -3.6688232421875, -3.533935546875, -3.3990478515625, -3.26416015625, -3.1292724609375, -2.994384765625, -2.8594970703125, -2.724609375, -2.5897216796875, -2.454833984375, -2.3199462890625, -2.18505859375, -2.0501708984375, -1.915283203125, -1.7803955078125, -1.6455078125, -1.5106201171875, -1.375732421875, -1.2408447265625, -1.10595703125, -0.9710693359375, -0.836181640625, -0.7012939453125, -0.56640625, -0.4315185546875, -0.296630859375, -0.1617431640625, -0.02685546875, 0.1080322265625, 0.242919921875, 0.3778076171875, 0.5126953125, 0.6475830078125, 0.782470703125, 0.9173583984375, 1.05224609375, 1.1871337890625, 1.322021484375, 1.4569091796875, 1.591796875, 1.7266845703125, 1.861572265625, 1.9964599609375, 2.13134765625, 2.2662353515625, 2.401123046875, 2.5360107421875, 2.6708984375, 2.8057861328125, 2.940673828125, 3.0755615234375, 3.21044921875, 3.3453369140625, 3.480224609375, 3.6151123046875, 3.75]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 7.0, 24.0, 48.0, 114.0, 262.0, 301.0, 163.0, 47.0, 18.0, 8.0, 2.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-128.00192260742188, -124.81848907470703, -121.63505554199219, -118.45162200927734, -115.2681884765625, -112.08475494384766, -108.90132141113281, -105.71788787841797, -102.53445434570312, -99.35102081298828, -96.16758728027344, -92.9841537475586, -89.80072021484375, -86.6172866821289, -83.43385314941406, -80.25041961669922, -77.06698608398438, -73.88355255126953, -70.70011901855469, -67.51668548583984, -64.333251953125, -61.149818420410156, -57.96638488769531, -54.78295135498047, -51.599525451660156, -48.41609191894531, -45.23265838623047, -42.049224853515625, -38.86579132080078, -35.68235778808594, -32.498924255371094, -29.315492630004883, -26.132057189941406, -22.948623657226562, -19.76519012451172, -16.581756591796875, -13.398324012756348, -10.214890480041504, -7.031457901000977, -3.848024368286133, -0.6645908355712891, 2.5188424587249756, 5.70227575302124, 8.885708808898926, 12.06914234161377, 15.252575874328613, 18.43600845336914, 21.619441986083984, 24.802875518798828, 27.986309051513672, 31.169742584228516, 34.35317611694336, 37.5366096496582, 40.72004318237305, 43.903472900390625, 47.08690643310547, 50.27033996582031, 53.453773498535156, 56.63720703125, 59.820640563964844, 63.00407409667969, 66.18750762939453, 69.37094116210938, 72.55437469482422, 75.73780822753906]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 1.0, 4.0, 4.0, 5.0, 10.0, 8.0, 15.0, 16.0, 17.0, 17.0, 31.0, 29.0, 28.0, 35.0, 32.0, 39.0, 49.0, 47.0, 58.0, 50.0, 54.0, 42.0, 50.0, 56.0, 38.0, 46.0, 42.0, 22.0, 28.0, 27.0, 21.0, 20.0, 17.0, 10.0, 10.0, 14.0, 4.0, 6.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-41.9231071472168, -40.73573684692383, -39.54836654663086, -38.360992431640625, -37.173622131347656, -35.98625183105469, -34.79888153076172, -33.61151123046875, -32.42414093017578, -31.236770629882812, -30.04939842224121, -28.862028121948242, -27.67465591430664, -26.487285614013672, -25.299915313720703, -24.112545013427734, -22.9251708984375, -21.73780059814453, -20.55042839050293, -19.36305809020996, -18.17568588256836, -16.98831558227539, -15.800945281982422, -14.613574028015137, -13.426202774047852, -12.238831520080566, -11.051460266113281, -9.864089965820312, -8.676718711853027, -7.489347457885742, -6.301976680755615, -5.114605903625488, -3.9272384643554688, -2.7398674488067627, -1.5524964332580566, -0.3651254177093506, 0.8222455978393555, 2.0096168518066406, 3.1969876289367676, 4.3843584060668945, 5.57172966003418, 6.759100914001465, 7.946471691131592, 9.133842468261719, 10.321213722229004, 11.508584976196289, 12.695955276489258, 13.883326530456543, 15.070697784423828, 16.258068084716797, 17.4454402923584, 18.632810592651367, 19.82018280029297, 21.007553100585938, 22.194923400878906, 23.382293701171875, 24.569665908813477, 25.757036209106445, 26.944408416748047, 28.131778717041016, 29.319149017333984, 30.506521224975586, 31.693891525268555, 32.881263732910156, 34.068634033203125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 7.0, 3.0, 8.0, 14.0, 10.0, 18.0, 23.0, 21.0, 37.0, 50.0, 85.0, 128.0, 211.0, 345.0, 627.0, 1256.0, 3140.0, 12197.0, 118068.0, 3993501.0, 52600.0, 7629.0, 2246.0, 937.0, 481.0, 272.0, 118.0, 93.0, 54.0, 26.0, 23.0, 18.0, 9.0, 8.0, 4.0, 3.0, 5.0, 2.0, 4.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.9609375, -13.4854736328125, -13.010009765625, -12.5345458984375, -12.05908203125, -11.5836181640625, -11.108154296875, -10.6326904296875, -10.1572265625, -9.6817626953125, -9.206298828125, -8.7308349609375, -8.25537109375, -7.7799072265625, -7.304443359375, -6.8289794921875, -6.353515625, -5.8780517578125, -5.402587890625, -4.9271240234375, -4.45166015625, -3.9761962890625, -3.500732421875, -3.0252685546875, -2.5498046875, -2.0743408203125, -1.598876953125, -1.1234130859375, -0.64794921875, -0.1724853515625, 0.302978515625, 0.7784423828125, 1.25390625, 1.7293701171875, 2.204833984375, 2.6802978515625, 3.15576171875, 3.6312255859375, 4.106689453125, 4.5821533203125, 5.0576171875, 5.5330810546875, 6.008544921875, 6.4840087890625, 6.95947265625, 7.4349365234375, 7.910400390625, 8.3858642578125, 8.861328125, 9.3367919921875, 9.812255859375, 10.2877197265625, 10.76318359375, 11.2386474609375, 11.714111328125, 12.1895751953125, 12.6650390625, 13.1405029296875, 13.615966796875, 14.0914306640625, 14.56689453125, 15.0423583984375, 15.517822265625, 15.9932861328125, 16.46875]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 8.0, 9.0, 15.0, 19.0, 29.0, 34.0, 47.0, 54.0, 76.0, 77.0, 80.0, 95.0, 106.0, 77.0, 74.0, 63.0, 29.0, 40.0, 13.0, 18.0, 11.0, 9.0, 1.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.669921875, -2.584136962890625, -2.49835205078125, -2.412567138671875, -2.3267822265625, -2.240997314453125, -2.15521240234375, -2.069427490234375, -1.983642578125, -1.897857666015625, -1.81207275390625, -1.726287841796875, -1.6405029296875, -1.554718017578125, -1.46893310546875, -1.383148193359375, -1.29736328125, -1.211578369140625, -1.12579345703125, -1.040008544921875, -0.9542236328125, -0.868438720703125, -0.78265380859375, -0.696868896484375, -0.611083984375, -0.525299072265625, -0.43951416015625, -0.353729248046875, -0.2679443359375, -0.182159423828125, -0.09637451171875, -0.010589599609375, 0.0751953125, 0.160980224609375, 0.24676513671875, 0.332550048828125, 0.4183349609375, 0.504119873046875, 0.58990478515625, 0.675689697265625, 0.761474609375, 0.847259521484375, 0.93304443359375, 1.018829345703125, 1.1046142578125, 1.190399169921875, 1.27618408203125, 1.361968994140625, 1.44775390625, 1.533538818359375, 1.61932373046875, 1.705108642578125, 1.7908935546875, 1.876678466796875, 1.96246337890625, 2.048248291015625, 2.134033203125, 2.219818115234375, 2.30560302734375, 2.391387939453125, 2.4771728515625, 2.562957763671875, 2.64874267578125, 2.734527587890625, 2.8203125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 5.0, 3.0, 2.0, 7.0, 9.0, 5.0, 14.0, 22.0, 42.0, 106.0, 361.0, 1450.0, 9794.0, 174039.0, 3973804.0, 30144.0, 3417.0, 717.0, 198.0, 73.0, 28.0, 15.0, 9.0, 8.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.09375, -17.453125, -16.8125, -16.171875, -15.53125, -14.890625, -14.25, -13.609375, -12.96875, -12.328125, -11.6875, -11.046875, -10.40625, -9.765625, -9.125, -8.484375, -7.84375, -7.203125, -6.5625, -5.921875, -5.28125, -4.640625, -4.0, -3.359375, -2.71875, -2.078125, -1.4375, -0.796875, -0.15625, 0.484375, 1.125, 1.765625, 2.40625, 3.046875, 3.6875, 4.328125, 4.96875, 5.609375, 6.25, 6.890625, 7.53125, 8.171875, 8.8125, 9.453125, 10.09375, 10.734375, 11.375, 12.015625, 12.65625, 13.296875, 13.9375, 14.578125, 15.21875, 15.859375, 16.5, 17.140625, 17.78125, 18.421875, 19.0625, 19.703125, 20.34375, 20.984375, 21.625, 22.265625, 22.90625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 1.0, 3.0, 2.0, 4.0, 3.0, 6.0, 5.0, 11.0, 6.0, 10.0, 16.0, 23.0, 31.0, 33.0, 45.0, 84.0, 185.0, 499.0, 2390.0, 342.0, 143.0, 86.0, 45.0, 28.0, 15.0, 11.0, 15.0, 11.0, 8.0, 5.0, 2.0, 5.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2734375, -3.15362548828125, -3.0338134765625, -2.91400146484375, -2.794189453125, -2.67437744140625, -2.5545654296875, -2.43475341796875, -2.31494140625, -2.19512939453125, -2.0753173828125, -1.95550537109375, -1.835693359375, -1.71588134765625, -1.5960693359375, -1.47625732421875, -1.3564453125, -1.23663330078125, -1.1168212890625, -0.99700927734375, -0.877197265625, -0.75738525390625, -0.6375732421875, -0.51776123046875, -0.39794921875, -0.27813720703125, -0.1583251953125, -0.03851318359375, 0.081298828125, 0.20111083984375, 0.3209228515625, 0.44073486328125, 0.560546875, 0.68035888671875, 0.8001708984375, 0.91998291015625, 1.039794921875, 1.15960693359375, 1.2794189453125, 1.39923095703125, 1.51904296875, 1.63885498046875, 1.7586669921875, 1.87847900390625, 1.998291015625, 2.11810302734375, 2.2379150390625, 2.35772705078125, 2.4775390625, 2.59735107421875, 2.7171630859375, 2.83697509765625, 2.956787109375, 3.07659912109375, 3.1964111328125, 3.31622314453125, 3.43603515625, 3.55584716796875, 3.6756591796875, 3.79547119140625, 3.915283203125, 4.03509521484375, 4.1549072265625, 4.27471923828125, 4.39453125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 17.0, 41.0, 135.0, 419.0, 298.0, 72.0, 22.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-91.73446655273438, -89.85538482666016, -87.97630310058594, -86.09722137451172, -84.2181396484375, -82.33906555175781, -80.4599838256836, -78.58090209960938, -76.70182037353516, -74.82273864746094, -72.94365692138672, -71.0645751953125, -69.18549346923828, -67.30641174316406, -65.42733764648438, -63.548255920410156, -61.66917419433594, -59.79009246826172, -57.9110107421875, -56.03193283081055, -54.15285110473633, -52.27376937866211, -50.39468765258789, -48.51560974121094, -46.63652420043945, -44.757442474365234, -42.878360748291016, -40.99928283691406, -39.120201110839844, -37.241119384765625, -35.362037658691406, -33.48295593261719, -31.603878021240234, -29.724796295166016, -27.84571647644043, -25.96663475036621, -24.087554931640625, -22.208473205566406, -20.329391479492188, -18.4503116607666, -16.571231842041016, -14.692151069641113, -12.813070297241211, -10.933988571166992, -9.054908752441406, -7.1758270263671875, -5.296746253967285, -3.417665481567383, -1.538583755493164, 0.34049713611602783, 2.2195780277252197, 4.098659038543701, 5.9777398109436035, 7.856821060180664, 9.735901832580566, 11.614982604980469, 13.494063377380371, 15.373144149780273, 17.252225875854492, 19.131305694580078, 21.010387420654297, 22.889469146728516, 24.7685489654541, 26.647628784179688, 28.526710510253906]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0, 2.0, 7.0, 6.0, 11.0, 13.0, 14.0, 17.0, 26.0, 30.0, 38.0, 31.0, 48.0, 58.0, 52.0, 51.0, 51.0, 54.0, 61.0, 44.0, 55.0, 56.0, 54.0, 46.0, 41.0, 33.0, 18.0, 23.0, 12.0, 16.0, 7.0, 13.0, 7.0, 6.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.47601318359375, -16.03172492980957, -15.587434768676758, -15.143145561218262, -14.698856353759766, -14.254568099975586, -13.810277938842773, -13.365989685058594, -12.921700477600098, -12.477411270141602, -12.033122062683105, -11.58883285522461, -11.144543647766113, -10.700254440307617, -10.255966186523438, -9.811676979064941, -9.367387771606445, -8.92309856414795, -8.478809356689453, -8.034520149230957, -7.590231418609619, -7.145942211151123, -6.701653003692627, -6.257364273071289, -5.813074111938477, -5.3687849044799805, -4.924495697021484, -4.480206489562988, -4.03591775894165, -3.5916285514831543, -3.147339344024658, -2.703050374984741, -2.258761405944824, -1.8144723176956177, -1.3701832294464111, -0.925894021987915, -0.4816049337387085, -0.03731584548950195, 0.40697336196899414, 0.8512623310089111, 1.2955515384674072, 1.7398406267166138, 2.1841297149658203, 2.6284189224243164, 3.0727081298828125, 3.5169970989227295, 3.9612863063812256, 4.405575275421143, 4.849864482879639, 5.294153690338135, 5.738442897796631, 6.182731628417969, 6.627020835876465, 7.071310043334961, 7.515599250793457, 7.959888458251953, 8.40417766571045, 8.848466873168945, 9.292756080627441, 9.737045288085938, 10.181334495544434, 10.62562370300293, 11.06991195678711, 11.514201164245605, 11.958490371704102]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 6.0, 3.0, 5.0, 8.0, 9.0, 12.0, 18.0, 27.0, 52.0, 87.0, 110.0, 224.0, 396.0, 855.0, 1956.0, 5471.0, 21819.0, 153572.0, 735174.0, 104412.0, 16468.0, 4490.0, 1764.0, 740.0, 397.0, 170.0, 105.0, 73.0, 43.0, 30.0, 25.0, 11.0, 10.0, 7.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.484375, -13.041015625, -12.59765625, -12.154296875, -11.7109375, -11.267578125, -10.82421875, -10.380859375, -9.9375, -9.494140625, -9.05078125, -8.607421875, -8.1640625, -7.720703125, -7.27734375, -6.833984375, -6.390625, -5.947265625, -5.50390625, -5.060546875, -4.6171875, -4.173828125, -3.73046875, -3.287109375, -2.84375, -2.400390625, -1.95703125, -1.513671875, -1.0703125, -0.626953125, -0.18359375, 0.259765625, 0.703125, 1.146484375, 1.58984375, 2.033203125, 2.4765625, 2.919921875, 3.36328125, 3.806640625, 4.25, 4.693359375, 5.13671875, 5.580078125, 6.0234375, 6.466796875, 6.91015625, 7.353515625, 7.796875, 8.240234375, 8.68359375, 9.126953125, 9.5703125, 10.013671875, 10.45703125, 10.900390625, 11.34375, 11.787109375, 12.23046875, 12.673828125, 13.1171875, 13.560546875, 14.00390625, 14.447265625, 14.890625]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 2.0, 5.0, 9.0, 16.0, 14.0, 28.0, 25.0, 52.0, 53.0, 71.0, 107.0, 81.0, 103.0, 80.0, 93.0, 72.0, 46.0, 42.0, 43.0, 17.0, 13.0, 11.0, 7.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2578125, -3.16534423828125, -3.0728759765625, -2.98040771484375, -2.887939453125, -2.79547119140625, -2.7030029296875, -2.61053466796875, -2.51806640625, -2.42559814453125, -2.3331298828125, -2.24066162109375, -2.148193359375, -2.05572509765625, -1.9632568359375, -1.87078857421875, -1.7783203125, -1.68585205078125, -1.5933837890625, -1.50091552734375, -1.408447265625, -1.31597900390625, -1.2235107421875, -1.13104248046875, -1.03857421875, -0.94610595703125, -0.8536376953125, -0.76116943359375, -0.668701171875, -0.57623291015625, -0.4837646484375, -0.39129638671875, -0.298828125, -0.20635986328125, -0.1138916015625, -0.02142333984375, 0.071044921875, 0.16351318359375, 0.2559814453125, 0.34844970703125, 0.44091796875, 0.53338623046875, 0.6258544921875, 0.71832275390625, 0.810791015625, 0.90325927734375, 0.9957275390625, 1.08819580078125, 1.1806640625, 1.27313232421875, 1.3656005859375, 1.45806884765625, 1.550537109375, 1.64300537109375, 1.7354736328125, 1.82794189453125, 1.92041015625, 2.01287841796875, 2.1053466796875, 2.19781494140625, 2.290283203125, 2.38275146484375, 2.4752197265625, 2.56768798828125, 2.66015625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 6.0, 3.0, 15.0, 12.0, 21.0, 30.0, 42.0, 73.0, 156.0, 339.0, 1066.0, 4265.0, 32456.0, 658733.0, 327604.0, 19314.0, 3024.0, 789.0, 264.0, 141.0, 66.0, 46.0, 25.0, 15.0, 23.0, 8.0, 8.0, 3.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.734375, -16.2406005859375, -15.746826171875, -15.2530517578125, -14.75927734375, -14.2655029296875, -13.771728515625, -13.2779541015625, -12.7841796875, -12.2904052734375, -11.796630859375, -11.3028564453125, -10.80908203125, -10.3153076171875, -9.821533203125, -9.3277587890625, -8.833984375, -8.3402099609375, -7.846435546875, -7.3526611328125, -6.85888671875, -6.3651123046875, -5.871337890625, -5.3775634765625, -4.8837890625, -4.3900146484375, -3.896240234375, -3.4024658203125, -2.90869140625, -2.4149169921875, -1.921142578125, -1.4273681640625, -0.93359375, -0.4398193359375, 0.053955078125, 0.5477294921875, 1.04150390625, 1.5352783203125, 2.029052734375, 2.5228271484375, 3.0166015625, 3.5103759765625, 4.004150390625, 4.4979248046875, 4.99169921875, 5.4854736328125, 5.979248046875, 6.4730224609375, 6.966796875, 7.4605712890625, 7.954345703125, 8.4481201171875, 8.94189453125, 9.4356689453125, 9.929443359375, 10.4232177734375, 10.9169921875, 11.4107666015625, 11.904541015625, 12.3983154296875, 12.89208984375, 13.3858642578125, 13.879638671875, 14.3734130859375, 14.8671875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 6.0, 0.0, 5.0, 0.0, 1.0, 2.0, 3.0, 5.0, 7.0, 8.0, 11.0, 14.0, 21.0, 25.0, 31.0, 23.0, 44.0, 42.0, 41.0, 43.0, 45.0, 50.0, 49.0, 54.0, 59.0, 54.0, 44.0, 57.0, 39.0, 28.0, 39.0, 29.0, 22.0, 22.0, 20.0, 24.0, 9.0, 12.0, 7.0, 3.0, 3.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.33203125, -7.099365234375, -6.86669921875, -6.634033203125, -6.4013671875, -6.168701171875, -5.93603515625, -5.703369140625, -5.470703125, -5.238037109375, -5.00537109375, -4.772705078125, -4.5400390625, -4.307373046875, -4.07470703125, -3.842041015625, -3.609375, -3.376708984375, -3.14404296875, -2.911376953125, -2.6787109375, -2.446044921875, -2.21337890625, -1.980712890625, -1.748046875, -1.515380859375, -1.28271484375, -1.050048828125, -0.8173828125, -0.584716796875, -0.35205078125, -0.119384765625, 0.11328125, 0.345947265625, 0.57861328125, 0.811279296875, 1.0439453125, 1.276611328125, 1.50927734375, 1.741943359375, 1.974609375, 2.207275390625, 2.43994140625, 2.672607421875, 2.9052734375, 3.137939453125, 3.37060546875, 3.603271484375, 3.8359375, 4.068603515625, 4.30126953125, 4.533935546875, 4.7666015625, 4.999267578125, 5.23193359375, 5.464599609375, 5.697265625, 5.929931640625, 6.16259765625, 6.395263671875, 6.6279296875, 6.860595703125, 7.09326171875, 7.325927734375, 7.55859375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 0.0, 2.0, 11.0, 6.0, 12.0, 26.0, 21.0, 66.0, 128.0, 327.0, 815.0, 2533.0, 9401.0, 70036.0, 913557.0, 41361.0, 7099.0, 1966.0, 671.0, 260.0, 124.0, 50.0, 30.0, 19.0, 14.0, 4.0, 7.0, 3.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.0078125, -8.6790771484375, -8.350341796875, -8.0216064453125, -7.69287109375, -7.3641357421875, -7.035400390625, -6.7066650390625, -6.3779296875, -6.0491943359375, -5.720458984375, -5.3917236328125, -5.06298828125, -4.7342529296875, -4.405517578125, -4.0767822265625, -3.748046875, -3.4193115234375, -3.090576171875, -2.7618408203125, -2.43310546875, -2.1043701171875, -1.775634765625, -1.4468994140625, -1.1181640625, -0.7894287109375, -0.460693359375, -0.1319580078125, 0.19677734375, 0.5255126953125, 0.854248046875, 1.1829833984375, 1.51171875, 1.8404541015625, 2.169189453125, 2.4979248046875, 2.82666015625, 3.1553955078125, 3.484130859375, 3.8128662109375, 4.1416015625, 4.4703369140625, 4.799072265625, 5.1278076171875, 5.45654296875, 5.7852783203125, 6.114013671875, 6.4427490234375, 6.771484375, 7.1002197265625, 7.428955078125, 7.7576904296875, 8.08642578125, 8.4151611328125, 8.743896484375, 9.0726318359375, 9.4013671875, 9.7301025390625, 10.058837890625, 10.3875732421875, 10.71630859375, 11.0450439453125, 11.373779296875, 11.7025146484375, 12.03125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 5.0, 6.0, 2.0, 4.0, 6.0, 13.0, 21.0, 49.0, 85.0, 297.0, 320.0, 96.0, 44.0, 22.0, 13.0, 8.0, 10.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0019140243530273438, -0.001857861876487732, -0.0018016993999481201, -0.0017455369234085083, -0.0016893744468688965, -0.0016332119703292847, -0.0015770494937896729, -0.001520887017250061, -0.0014647245407104492, -0.0014085620641708374, -0.0013523995876312256, -0.0012962371110916138, -0.001240074634552002, -0.0011839121580123901, -0.0011277496814727783, -0.0010715872049331665, -0.0010154247283935547, -0.0009592622518539429, -0.0009030997753143311, -0.0008469372987747192, -0.0007907748222351074, -0.0007346123456954956, -0.0006784498691558838, -0.000622287392616272, -0.0005661249160766602, -0.0005099624395370483, -0.0004537999629974365, -0.0003976374864578247, -0.0003414750099182129, -0.0002853125333786011, -0.00022915005683898926, -0.00017298758029937744, -0.00011682510375976562, -6.066262722015381e-05, -4.500150680541992e-06, 5.1662325859069824e-05, 0.00010782480239868164, 0.00016398727893829346, 0.00022014975547790527, 0.0002763122320175171, 0.0003324747085571289, 0.0003886371850967407, 0.00044479966163635254, 0.0005009621381759644, 0.0005571246147155762, 0.000613287091255188, 0.0006694495677947998, 0.0007256120443344116, 0.0007817745208740234, 0.0008379369974136353, 0.0008940994739532471, 0.0009502619504928589, 0.0010064244270324707, 0.0010625869035720825, 0.0011187493801116943, 0.0011749118566513062, 0.001231074333190918, 0.0012872368097305298, 0.0013433992862701416, 0.0013995617628097534, 0.0014557242393493652, 0.001511886715888977, 0.0015680491924285889, 0.0016242116689682007, 0.0016803741455078125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 2.0, 6.0, 5.0, 10.0, 5.0, 8.0, 15.0, 14.0, 16.0, 25.0, 51.0, 108.0, 241.0, 788.0, 3620.0, 33955.0, 970836.0, 33952.0, 3607.0, 793.0, 249.0, 98.0, 55.0, 27.0, 19.0, 12.0, 9.0, 9.0, 5.0, 4.0, 6.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 4.0], "bins": [-21.15625, -20.658447265625, -20.16064453125, -19.662841796875, -19.1650390625, -18.667236328125, -18.16943359375, -17.671630859375, -17.173828125, -16.676025390625, -16.17822265625, -15.680419921875, -15.1826171875, -14.684814453125, -14.18701171875, -13.689208984375, -13.19140625, -12.693603515625, -12.19580078125, -11.697998046875, -11.2001953125, -10.702392578125, -10.20458984375, -9.706787109375, -9.208984375, -8.711181640625, -8.21337890625, -7.715576171875, -7.2177734375, -6.719970703125, -6.22216796875, -5.724365234375, -5.2265625, -4.728759765625, -4.23095703125, -3.733154296875, -3.2353515625, -2.737548828125, -2.23974609375, -1.741943359375, -1.244140625, -0.746337890625, -0.24853515625, 0.249267578125, 0.7470703125, 1.244873046875, 1.74267578125, 2.240478515625, 2.73828125, 3.236083984375, 3.73388671875, 4.231689453125, 4.7294921875, 5.227294921875, 5.72509765625, 6.222900390625, 6.720703125, 7.218505859375, 7.71630859375, 8.214111328125, 8.7119140625, 9.209716796875, 9.70751953125, 10.205322265625, 10.703125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 7.0, 3.0, 5.0, 8.0, 6.0, 5.0, 8.0, 2.0, 9.0, 19.0, 10.0, 14.0, 29.0, 49.0, 94.0, 179.0, 202.0, 119.0, 63.0, 32.0, 32.0, 17.0, 17.0, 12.0, 11.0, 8.0, 6.0, 7.0, 8.0, 4.0, 6.0, 5.0, 0.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.7578125, -5.611175537109375, -5.46453857421875, -5.317901611328125, -5.1712646484375, -5.024627685546875, -4.87799072265625, -4.731353759765625, -4.584716796875, -4.438079833984375, -4.29144287109375, -4.144805908203125, -3.9981689453125, -3.851531982421875, -3.70489501953125, -3.558258056640625, -3.41162109375, -3.264984130859375, -3.11834716796875, -2.971710205078125, -2.8250732421875, -2.678436279296875, -2.53179931640625, -2.385162353515625, -2.238525390625, -2.091888427734375, -1.94525146484375, -1.798614501953125, -1.6519775390625, -1.505340576171875, -1.35870361328125, -1.212066650390625, -1.0654296875, -0.918792724609375, -0.77215576171875, -0.625518798828125, -0.4788818359375, -0.332244873046875, -0.18560791015625, -0.038970947265625, 0.107666015625, 0.254302978515625, 0.40093994140625, 0.547576904296875, 0.6942138671875, 0.840850830078125, 0.98748779296875, 1.134124755859375, 1.28076171875, 1.427398681640625, 1.57403564453125, 1.720672607421875, 1.8673095703125, 2.013946533203125, 2.16058349609375, 2.307220458984375, 2.453857421875, 2.600494384765625, 2.74713134765625, 2.893768310546875, 3.0404052734375, 3.187042236328125, 3.33367919921875, 3.480316162109375, 3.626953125]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 10.0, 35.0, 87.0, 280.0, 398.0, 137.0, 42.0, 7.0, 8.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-120.37384033203125, -115.61735534667969, -110.86087036132812, -106.10438537597656, -101.347900390625, -96.59141540527344, -91.83493041992188, -87.07844543457031, -82.32196044921875, -77.56547546386719, -72.80899047851562, -68.05250549316406, -63.2960205078125, -58.53953552246094, -53.78305435180664, -49.02656936645508, -44.27008819580078, -39.51360321044922, -34.757118225097656, -30.000635147094727, -25.244150161743164, -20.4876651763916, -15.731182098388672, -10.97469711303711, -6.218212127685547, -1.4617276191711426, 3.2947568893432617, 8.051240921020508, 12.80772590637207, 17.564210891723633, 22.320693969726562, 27.077178955078125, 31.833663940429688, 36.59014892578125, 41.34663391113281, 46.103118896484375, 50.85960388183594, 55.6160888671875, 60.3725700378418, 65.12905883789062, 69.88554382324219, 74.64202880859375, 79.39851379394531, 84.15499877929688, 88.91148376464844, 93.66796875, 98.42445373535156, 103.18093872070312, 107.93741607666016, 112.69390106201172, 117.45038604736328, 122.20687103271484, 126.9633560180664, 131.71983337402344, 136.476318359375, 141.23280334472656, 145.98928833007812, 150.7457733154297, 155.50225830078125, 160.2587432861328, 165.01522827148438, 169.77171325683594, 174.5281982421875, 179.28468322753906, 184.04116821289062]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 5.0, 10.0, 4.0, 11.0, 7.0, 5.0, 14.0, 26.0, 16.0, 20.0, 18.0, 21.0, 24.0, 26.0, 32.0, 23.0, 43.0, 39.0, 44.0, 36.0, 37.0, 46.0, 46.0, 36.0, 39.0, 36.0, 37.0, 34.0, 30.0, 30.0, 26.0, 28.0, 30.0, 23.0, 24.0, 18.0, 9.0, 13.0, 4.0, 9.0, 9.0, 4.0, 6.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-35.40213394165039, -34.38330078125, -33.364463806152344, -32.34563064575195, -31.32679557800293, -30.307960510253906, -29.289127349853516, -28.270292282104492, -27.25145721435547, -26.232622146606445, -25.213787078857422, -24.19495391845703, -23.176118850708008, -22.157283782958984, -21.138450622558594, -20.11961555480957, -19.100780487060547, -18.081945419311523, -17.0631103515625, -16.04427719116211, -15.025442123413086, -14.006607055664062, -12.987772941589355, -11.968938827514648, -10.950103759765625, -9.931268692016602, -8.912434577941895, -7.893599987030029, -6.874765396118164, -5.855930805206299, -4.837096214294434, -3.8182616233825684, -2.799427032470703, -1.780592441558838, -0.7617578506469727, 0.2570767402648926, 1.2759113311767578, 2.294745922088623, 3.3135805130004883, 4.3324151039123535, 5.351249694824219, 6.370084285736084, 7.388918876647949, 8.407752990722656, 9.42658805847168, 10.445423126220703, 11.46425724029541, 12.483091354370117, 13.50192642211914, 14.520761489868164, 15.539595603942871, 16.558429718017578, 17.5772647857666, 18.596099853515625, 19.614933013916016, 20.63376808166504, 21.652603149414062, 22.671438217163086, 23.69027328491211, 24.7091064453125, 25.727941513061523, 26.746776580810547, 27.765609741210938, 28.78444480895996, 29.803279876708984]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 4.0, 4.0, 3.0, 6.0, 10.0, 8.0, 8.0, 18.0, 16.0, 21.0, 37.0, 60.0, 83.0, 103.0, 172.0, 321.0, 508.0, 1048.0, 2580.0, 7753.0, 40825.0, 3956410.0, 161446.0, 15644.0, 4143.0, 1505.0, 687.0, 328.0, 183.0, 114.0, 82.0, 47.0, 40.0, 17.0, 21.0, 9.0, 7.0, 4.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.4609375, -13.0946044921875, -12.728271484375, -12.3619384765625, -11.99560546875, -11.6292724609375, -11.262939453125, -10.8966064453125, -10.5302734375, -10.1639404296875, -9.797607421875, -9.4312744140625, -9.06494140625, -8.6986083984375, -8.332275390625, -7.9659423828125, -7.599609375, -7.2332763671875, -6.866943359375, -6.5006103515625, -6.13427734375, -5.7679443359375, -5.401611328125, -5.0352783203125, -4.6689453125, -4.3026123046875, -3.936279296875, -3.5699462890625, -3.20361328125, -2.8372802734375, -2.470947265625, -2.1046142578125, -1.73828125, -1.3719482421875, -1.005615234375, -0.6392822265625, -0.27294921875, 0.0933837890625, 0.459716796875, 0.8260498046875, 1.1923828125, 1.5587158203125, 1.925048828125, 2.2913818359375, 2.65771484375, 3.0240478515625, 3.390380859375, 3.7567138671875, 4.123046875, 4.4893798828125, 4.855712890625, 5.2220458984375, 5.58837890625, 5.9547119140625, 6.321044921875, 6.6873779296875, 7.0537109375, 7.4200439453125, 7.786376953125, 8.1527099609375, 8.51904296875, 8.8853759765625, 9.251708984375, 9.6180419921875, 9.984375]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 7.0, 12.0, 9.0, 20.0, 18.0, 28.0, 44.0, 51.0, 64.0, 76.0, 83.0, 109.0, 104.0, 90.0, 64.0, 59.0, 39.0, 42.0, 33.0, 13.0, 13.0, 6.0, 5.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.55859375, -3.461181640625, -3.36376953125, -3.266357421875, -3.1689453125, -3.071533203125, -2.97412109375, -2.876708984375, -2.779296875, -2.681884765625, -2.58447265625, -2.487060546875, -2.3896484375, -2.292236328125, -2.19482421875, -2.097412109375, -2.0, -1.902587890625, -1.80517578125, -1.707763671875, -1.6103515625, -1.512939453125, -1.41552734375, -1.318115234375, -1.220703125, -1.123291015625, -1.02587890625, -0.928466796875, -0.8310546875, -0.733642578125, -0.63623046875, -0.538818359375, -0.44140625, -0.343994140625, -0.24658203125, -0.149169921875, -0.0517578125, 0.045654296875, 0.14306640625, 0.240478515625, 0.337890625, 0.435302734375, 0.53271484375, 0.630126953125, 0.7275390625, 0.824951171875, 0.92236328125, 1.019775390625, 1.1171875, 1.214599609375, 1.31201171875, 1.409423828125, 1.5068359375, 1.604248046875, 1.70166015625, 1.799072265625, 1.896484375, 1.993896484375, 2.09130859375, 2.188720703125, 2.2861328125, 2.383544921875, 2.48095703125, 2.578369140625, 2.67578125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 8.0, 8.0, 29.0, 57.0, 87.0, 218.0, 474.0, 2187.0, 26235.0, 4127368.0, 34222.0, 2360.0, 578.0, 248.0, 108.0, 43.0, 27.0, 12.0, 8.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.390625, -13.520263671875, -12.64990234375, -11.779541015625, -10.9091796875, -10.038818359375, -9.16845703125, -8.298095703125, -7.427734375, -6.557373046875, -5.68701171875, -4.816650390625, -3.9462890625, -3.075927734375, -2.20556640625, -1.335205078125, -0.46484375, 0.405517578125, 1.27587890625, 2.146240234375, 3.0166015625, 3.886962890625, 4.75732421875, 5.627685546875, 6.498046875, 7.368408203125, 8.23876953125, 9.109130859375, 9.9794921875, 10.849853515625, 11.72021484375, 12.590576171875, 13.4609375, 14.331298828125, 15.20166015625, 16.072021484375, 16.9423828125, 17.812744140625, 18.68310546875, 19.553466796875, 20.423828125, 21.294189453125, 22.16455078125, 23.034912109375, 23.9052734375, 24.775634765625, 25.64599609375, 26.516357421875, 27.38671875, 28.257080078125, 29.12744140625, 29.997802734375, 30.8681640625, 31.738525390625, 32.60888671875, 33.479248046875, 34.349609375, 35.219970703125, 36.09033203125, 36.960693359375, 37.8310546875, 38.701416015625, 39.57177734375, 40.442138671875, 41.3125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 1.0, 1.0, 3.0, 1.0, 8.0, 19.0, 26.0, 53.0, 70.0, 178.0, 2621.0, 787.0, 147.0, 53.0, 41.0, 19.0, 10.0, 18.0, 7.0, 4.0, 4.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.197265625, -3.044525146484375, -2.89178466796875, -2.739044189453125, -2.5863037109375, -2.433563232421875, -2.28082275390625, -2.128082275390625, -1.975341796875, -1.822601318359375, -1.66986083984375, -1.517120361328125, -1.3643798828125, -1.211639404296875, -1.05889892578125, -0.906158447265625, -0.75341796875, -0.600677490234375, -0.44793701171875, -0.295196533203125, -0.1424560546875, 0.010284423828125, 0.16302490234375, 0.315765380859375, 0.468505859375, 0.621246337890625, 0.77398681640625, 0.926727294921875, 1.0794677734375, 1.232208251953125, 1.38494873046875, 1.537689208984375, 1.6904296875, 1.843170166015625, 1.99591064453125, 2.148651123046875, 2.3013916015625, 2.454132080078125, 2.60687255859375, 2.759613037109375, 2.912353515625, 3.065093994140625, 3.21783447265625, 3.370574951171875, 3.5233154296875, 3.676055908203125, 3.82879638671875, 3.981536865234375, 4.13427734375, 4.287017822265625, 4.43975830078125, 4.592498779296875, 4.7452392578125, 4.897979736328125, 5.05072021484375, 5.203460693359375, 5.356201171875, 5.508941650390625, 5.66168212890625, 5.814422607421875, 5.9671630859375, 6.119903564453125, 6.27264404296875, 6.425384521484375, 6.578125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 14.0, 20.0, 68.0, 216.0, 367.0, 212.0, 68.0, 18.0, 8.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-40.676841735839844, -39.50069808959961, -38.324554443359375, -37.14841079711914, -35.972267150878906, -34.79612350463867, -33.61997985839844, -32.4438362121582, -31.26769256591797, -30.091548919677734, -28.9154052734375, -27.739261627197266, -26.56311798095703, -25.386974334716797, -24.210830688476562, -23.034687042236328, -21.858545303344727, -20.682401657104492, -19.506258010864258, -18.330114364624023, -17.15397071838379, -15.977827072143555, -14.801684379577637, -13.625540733337402, -12.449397087097168, -11.273253440856934, -10.0971097946167, -8.920967102050781, -7.744822978973389, -6.568679332733154, -5.392536163330078, -4.216392517089844, -3.0402488708496094, -1.8641053438186646, -0.6879618167877197, 0.48818159103393555, 1.66432523727417, 2.8404688835144043, 4.0166120529174805, 5.192755699157715, 6.368899345397949, 7.545042991638184, 8.721186637878418, 9.897329330444336, 11.07347297668457, 12.249616622924805, 13.425760269165039, 14.601903915405273, 15.778047561645508, 16.954191207885742, 18.130334854125977, 19.30647850036621, 20.482622146606445, 21.65876579284668, 22.83490753173828, 24.011051177978516, 25.18719482421875, 26.363338470458984, 27.53948211669922, 28.715625762939453, 29.891769409179688, 31.067913055419922, 32.244056701660156, 33.42020034790039, 34.596343994140625]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 7.0, 10.0, 12.0, 22.0, 36.0, 38.0, 63.0, 56.0, 72.0, 67.0, 69.0, 69.0, 67.0, 73.0, 77.0, 60.0, 48.0, 40.0, 35.0, 26.0, 21.0, 17.0, 6.0, 6.0, 4.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.466180801391602, -15.019157409667969, -14.572134971618652, -14.12511157989502, -13.678088188171387, -13.23106575012207, -12.784042358398438, -12.337018966674805, -11.889995574951172, -11.442972183227539, -10.995949745178223, -10.54892635345459, -10.101902961730957, -9.65488052368164, -9.207857131958008, -8.760833740234375, -8.313811302185059, -7.866788387298584, -7.419764995574951, -6.972742080688477, -6.525718688964844, -6.078695774078369, -5.6316728591918945, -5.184649467468262, -4.737626552581787, -4.2906036376953125, -3.8435802459716797, -3.396557331085205, -2.9495341777801514, -2.5025110244750977, -2.055488109588623, -1.6084649562835693, -1.1614418029785156, -0.7144187092781067, -0.26739561557769775, 0.1796274185180664, 0.6266505718231201, 1.0736737251281738, 1.5206966400146484, 1.9677197933197021, 2.414742946624756, 2.8617660999298096, 3.3087892532348633, 3.755812168121338, 4.2028350830078125, 4.649858474731445, 5.09688138961792, 5.5439043045043945, 5.990927696228027, 6.437950611114502, 6.884974002838135, 7.331996917724609, 7.779020309448242, 8.226043701171875, 8.673066139221191, 9.120089530944824, 9.56711196899414, 10.014135360717773, 10.46115779876709, 10.908181190490723, 11.355204582214355, 11.802227020263672, 12.249250411987305, 12.696273803710938, 13.14329719543457]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 7.0, 6.0, 8.0, 27.0, 27.0, 61.0, 122.0, 227.0, 626.0, 2146.0, 12086.0, 163174.0, 803892.0, 57792.0, 6196.0, 1379.0, 422.0, 173.0, 85.0, 41.0, 22.0, 14.0, 7.0, 5.0, 7.0, 0.0, 5.0, 1.0, 2.0, 2.0, 1.0], "bins": [-25.234375, -24.6776123046875, -24.120849609375, -23.5640869140625, -23.00732421875, -22.4505615234375, -21.893798828125, -21.3370361328125, -20.7802734375, -20.2235107421875, -19.666748046875, -19.1099853515625, -18.55322265625, -17.9964599609375, -17.439697265625, -16.8829345703125, -16.326171875, -15.7694091796875, -15.212646484375, -14.6558837890625, -14.09912109375, -13.5423583984375, -12.985595703125, -12.4288330078125, -11.8720703125, -11.3153076171875, -10.758544921875, -10.2017822265625, -9.64501953125, -9.0882568359375, -8.531494140625, -7.9747314453125, -7.41796875, -6.8612060546875, -6.304443359375, -5.7476806640625, -5.19091796875, -4.6341552734375, -4.077392578125, -3.5206298828125, -2.9638671875, -2.4071044921875, -1.850341796875, -1.2935791015625, -0.73681640625, -0.1800537109375, 0.376708984375, 0.9334716796875, 1.490234375, 2.0469970703125, 2.603759765625, 3.1605224609375, 3.71728515625, 4.2740478515625, 4.830810546875, 5.3875732421875, 5.9443359375, 6.5010986328125, 7.057861328125, 7.6146240234375, 8.17138671875, 8.7281494140625, 9.284912109375, 9.8416748046875, 10.3984375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 8.0, 5.0, 12.0, 15.0, 12.0, 20.0, 42.0, 54.0, 45.0, 75.0, 86.0, 127.0, 89.0, 99.0, 81.0, 58.0, 45.0, 49.0, 29.0, 19.0, 13.0, 3.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.892578125, -3.7900390625, -3.6875, -3.5849609375, -3.482421875, -3.3798828125, -3.27734375, -3.1748046875, -3.072265625, -2.9697265625, -2.8671875, -2.7646484375, -2.662109375, -2.5595703125, -2.45703125, -2.3544921875, -2.251953125, -2.1494140625, -2.046875, -1.9443359375, -1.841796875, -1.7392578125, -1.63671875, -1.5341796875, -1.431640625, -1.3291015625, -1.2265625, -1.1240234375, -1.021484375, -0.9189453125, -0.81640625, -0.7138671875, -0.611328125, -0.5087890625, -0.40625, -0.3037109375, -0.201171875, -0.0986328125, 0.00390625, 0.1064453125, 0.208984375, 0.3115234375, 0.4140625, 0.5166015625, 0.619140625, 0.7216796875, 0.82421875, 0.9267578125, 1.029296875, 1.1318359375, 1.234375, 1.3369140625, 1.439453125, 1.5419921875, 1.64453125, 1.7470703125, 1.849609375, 1.9521484375, 2.0546875, 2.1572265625, 2.259765625, 2.3623046875, 2.46484375, 2.5673828125, 2.669921875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 1.0, 5.0, 7.0, 6.0, 10.0, 5.0, 13.0, 12.0, 14.0, 19.0, 43.0, 48.0, 67.0, 113.0, 162.0, 368.0, 899.0, 2362.0, 8130.0, 34669.0, 192337.0, 653471.0, 122644.0, 23739.0, 6092.0, 1866.0, 654.0, 300.0, 149.0, 105.0, 61.0, 37.0, 32.0, 24.0, 17.0, 19.0, 9.0, 7.0, 8.0, 6.0, 5.0, 4.0, 1.0, 5.0, 2.0, 1.0, 1.0, 4.0, 2.0, 0.0, 2.0], "bins": [-9.421875, -9.1478271484375, -8.873779296875, -8.5997314453125, -8.32568359375, -8.0516357421875, -7.777587890625, -7.5035400390625, -7.2294921875, -6.9554443359375, -6.681396484375, -6.4073486328125, -6.13330078125, -5.8592529296875, -5.585205078125, -5.3111572265625, -5.037109375, -4.7630615234375, -4.489013671875, -4.2149658203125, -3.94091796875, -3.6668701171875, -3.392822265625, -3.1187744140625, -2.8447265625, -2.5706787109375, -2.296630859375, -2.0225830078125, -1.74853515625, -1.4744873046875, -1.200439453125, -0.9263916015625, -0.65234375, -0.3782958984375, -0.104248046875, 0.1697998046875, 0.44384765625, 0.7178955078125, 0.991943359375, 1.2659912109375, 1.5400390625, 1.8140869140625, 2.088134765625, 2.3621826171875, 2.63623046875, 2.9102783203125, 3.184326171875, 3.4583740234375, 3.732421875, 4.0064697265625, 4.280517578125, 4.5545654296875, 4.82861328125, 5.1026611328125, 5.376708984375, 5.6507568359375, 5.9248046875, 6.1988525390625, 6.472900390625, 6.7469482421875, 7.02099609375, 7.2950439453125, 7.569091796875, 7.8431396484375, 8.1171875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 1.0, 6.0, 5.0, 11.0, 8.0, 11.0, 15.0, 13.0, 14.0, 21.0, 28.0, 27.0, 32.0, 28.0, 29.0, 43.0, 39.0, 53.0, 48.0, 41.0, 45.0, 48.0, 54.0, 35.0, 47.0, 36.0, 35.0, 41.0, 33.0, 26.0, 22.0, 20.0, 21.0, 16.0, 7.0, 9.0, 7.0, 8.0, 4.0, 1.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-7.0234375, -6.81524658203125, -6.6070556640625, -6.39886474609375, -6.190673828125, -5.98248291015625, -5.7742919921875, -5.56610107421875, -5.35791015625, -5.14971923828125, -4.9415283203125, -4.73333740234375, -4.525146484375, -4.31695556640625, -4.1087646484375, -3.90057373046875, -3.6923828125, -3.48419189453125, -3.2760009765625, -3.06781005859375, -2.859619140625, -2.65142822265625, -2.4432373046875, -2.23504638671875, -2.02685546875, -1.81866455078125, -1.6104736328125, -1.40228271484375, -1.194091796875, -0.98590087890625, -0.7777099609375, -0.56951904296875, -0.361328125, -0.15313720703125, 0.0550537109375, 0.26324462890625, 0.471435546875, 0.67962646484375, 0.8878173828125, 1.09600830078125, 1.30419921875, 1.51239013671875, 1.7205810546875, 1.92877197265625, 2.136962890625, 2.34515380859375, 2.5533447265625, 2.76153564453125, 2.9697265625, 3.17791748046875, 3.3861083984375, 3.59429931640625, 3.802490234375, 4.01068115234375, 4.2188720703125, 4.42706298828125, 4.63525390625, 4.84344482421875, 5.0516357421875, 5.25982666015625, 5.468017578125, 5.67620849609375, 5.8843994140625, 6.09259033203125, 6.30078125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 2.0, 2.0, 8.0, 5.0, 8.0, 12.0, 24.0, 27.0, 54.0, 74.0, 145.0, 301.0, 571.0, 1408.0, 3967.0, 17839.0, 290536.0, 694103.0, 30586.0, 5602.0, 1789.0, 720.0, 351.0, 160.0, 94.0, 60.0, 42.0, 18.0, 15.0, 9.0, 3.0, 6.0, 2.0, 5.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.12890625, -4.95867919921875, -4.7884521484375, -4.61822509765625, -4.447998046875, -4.27777099609375, -4.1075439453125, -3.93731689453125, -3.76708984375, -3.59686279296875, -3.4266357421875, -3.25640869140625, -3.086181640625, -2.91595458984375, -2.7457275390625, -2.57550048828125, -2.4052734375, -2.23504638671875, -2.0648193359375, -1.89459228515625, -1.724365234375, -1.55413818359375, -1.3839111328125, -1.21368408203125, -1.04345703125, -0.87322998046875, -0.7030029296875, -0.53277587890625, -0.362548828125, -0.19232177734375, -0.0220947265625, 0.14813232421875, 0.318359375, 0.48858642578125, 0.6588134765625, 0.82904052734375, 0.999267578125, 1.16949462890625, 1.3397216796875, 1.50994873046875, 1.68017578125, 1.85040283203125, 2.0206298828125, 2.19085693359375, 2.361083984375, 2.53131103515625, 2.7015380859375, 2.87176513671875, 3.0419921875, 3.21221923828125, 3.3824462890625, 3.55267333984375, 3.722900390625, 3.89312744140625, 4.0633544921875, 4.23358154296875, 4.40380859375, 4.57403564453125, 4.7442626953125, 4.91448974609375, 5.084716796875, 5.25494384765625, 5.4251708984375, 5.59539794921875, 5.765625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 8.0, 10.0, 8.0, 13.0, 19.0, 36.0, 82.0, 179.0, 246.0, 173.0, 91.0, 63.0, 22.0, 19.0, 18.0, 8.0, 3.0, 3.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011386871337890625, -0.001109100878238678, -0.0010795146226882935, -0.001049928367137909, -0.0010203421115875244, -0.00099075585603714, -0.0009611696004867554, -0.0009315833449363708, -0.0009019970893859863, -0.0008724108338356018, -0.0008428245782852173, -0.0008132383227348328, -0.0007836520671844482, -0.0007540658116340637, -0.0007244795560836792, -0.0006948933005332947, -0.0006653070449829102, -0.0006357207894325256, -0.0006061345338821411, -0.0005765482783317566, -0.0005469620227813721, -0.0005173757672309875, -0.00048778951168060303, -0.0004582032561302185, -0.000428617000579834, -0.00039903074502944946, -0.00036944448947906494, -0.0003398582339286804, -0.0003102719783782959, -0.0002806857228279114, -0.00025109946727752686, -0.00022151321172714233, -0.0001919269561767578, -0.0001623407006263733, -0.00013275444507598877, -0.00010316818952560425, -7.358193397521973e-05, -4.3995678424835205e-05, -1.4409422874450684e-05, 1.5176832675933838e-05, 4.476308822631836e-05, 7.434934377670288e-05, 0.0001039355993270874, 0.00013352185487747192, 0.00016310811042785645, 0.00019269436597824097, 0.0002222806215286255, 0.00025186687707901, 0.00028145313262939453, 0.00031103938817977905, 0.0003406256437301636, 0.0003702118992805481, 0.0003997981548309326, 0.00042938441038131714, 0.00045897066593170166, 0.0004885569214820862, 0.0005181431770324707, 0.0005477294325828552, 0.0005773156881332397, 0.0006069019436836243, 0.0006364881992340088, 0.0006660744547843933, 0.0006956607103347778, 0.0007252469658851624, 0.0007548332214355469]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 4.0, 3.0, 7.0, 3.0, 6.0, 10.0, 23.0, 28.0, 74.0, 133.0, 420.0, 1830.0, 11559.0, 616497.0, 405777.0, 9797.0, 1685.0, 412.0, 136.0, 61.0, 28.0, 20.0, 11.0, 6.0, 9.0, 2.0, 3.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.390625, -9.1295166015625, -8.868408203125, -8.6072998046875, -8.34619140625, -8.0850830078125, -7.823974609375, -7.5628662109375, -7.3017578125, -7.0406494140625, -6.779541015625, -6.5184326171875, -6.25732421875, -5.9962158203125, -5.735107421875, -5.4739990234375, -5.212890625, -4.9517822265625, -4.690673828125, -4.4295654296875, -4.16845703125, -3.9073486328125, -3.646240234375, -3.3851318359375, -3.1240234375, -2.8629150390625, -2.601806640625, -2.3406982421875, -2.07958984375, -1.8184814453125, -1.557373046875, -1.2962646484375, -1.03515625, -0.7740478515625, -0.512939453125, -0.2518310546875, 0.00927734375, 0.2703857421875, 0.531494140625, 0.7926025390625, 1.0537109375, 1.3148193359375, 1.575927734375, 1.8370361328125, 2.09814453125, 2.3592529296875, 2.620361328125, 2.8814697265625, 3.142578125, 3.4036865234375, 3.664794921875, 3.9259033203125, 4.18701171875, 4.4481201171875, 4.709228515625, 4.9703369140625, 5.2314453125, 5.4925537109375, 5.753662109375, 6.0147705078125, 6.27587890625, 6.5369873046875, 6.798095703125, 7.0592041015625, 7.3203125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 5.0, 4.0, 2.0, 5.0, 9.0, 9.0, 11.0, 18.0, 28.0, 43.0, 54.0, 72.0, 110.0, 151.0, 153.0, 102.0, 62.0, 44.0, 24.0, 16.0, 16.0, 7.0, 12.0, 7.0, 3.0, 7.0, 5.0, 2.0, 2.0, 1.0, 6.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.423828125, -3.3310546875, -3.23828125, -3.1455078125, -3.052734375, -2.9599609375, -2.8671875, -2.7744140625, -2.681640625, -2.5888671875, -2.49609375, -2.4033203125, -2.310546875, -2.2177734375, -2.125, -2.0322265625, -1.939453125, -1.8466796875, -1.75390625, -1.6611328125, -1.568359375, -1.4755859375, -1.3828125, -1.2900390625, -1.197265625, -1.1044921875, -1.01171875, -0.9189453125, -0.826171875, -0.7333984375, -0.640625, -0.5478515625, -0.455078125, -0.3623046875, -0.26953125, -0.1767578125, -0.083984375, 0.0087890625, 0.1015625, 0.1943359375, 0.287109375, 0.3798828125, 0.47265625, 0.5654296875, 0.658203125, 0.7509765625, 0.84375, 0.9365234375, 1.029296875, 1.1220703125, 1.21484375, 1.3076171875, 1.400390625, 1.4931640625, 1.5859375, 1.6787109375, 1.771484375, 1.8642578125, 1.95703125, 2.0498046875, 2.142578125, 2.2353515625, 2.328125, 2.4208984375, 2.513671875]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 10.0, 21.0, 54.0, 303.0, 420.0, 160.0, 35.0, 10.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.89505004882812, -83.34735870361328, -78.79966735839844, -74.2519760131836, -69.70428466796875, -65.1565933227539, -60.60890579223633, -56.061214447021484, -51.51352310180664, -46.9658317565918, -42.41814041137695, -37.870452880859375, -33.32276153564453, -28.775068283081055, -24.227378845214844, -19.6796875, -15.131996154785156, -10.584304809570312, -6.036614418029785, -1.4889240264892578, 3.058767318725586, 7.60645866394043, 12.15414810180664, 16.701839447021484, 21.249530792236328, 25.797222137451172, 30.344913482666016, 34.892601013183594, 39.44029235839844, 43.98798370361328, 48.535675048828125, 53.08336639404297, 57.63105773925781, 62.178749084472656, 66.7264404296875, 71.27413177490234, 75.82182312011719, 80.36951446533203, 84.91720581054688, 89.46488952636719, 94.01258850097656, 98.5602798461914, 103.10797119140625, 107.6556625366211, 112.20335388183594, 116.75104522705078, 121.29873657226562, 125.84642028808594, 130.39410400390625, 134.94178771972656, 139.48948669433594, 144.03717041015625, 148.58486938476562, 153.13255310058594, 157.6802520751953, 162.22793579101562, 166.775634765625, 171.3233184814453, 175.8710174560547, 180.418701171875, 184.96640014648438, 189.5140838623047, 194.06178283691406, 198.60946655273438, 203.15716552734375]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 0.0, 5.0, 5.0, 5.0, 10.0, 12.0, 9.0, 11.0, 13.0, 15.0, 25.0, 16.0, 28.0, 21.0, 32.0, 27.0, 25.0, 27.0, 30.0, 31.0, 48.0, 30.0, 29.0, 42.0, 42.0, 43.0, 42.0, 44.0, 22.0, 28.0, 36.0, 33.0, 24.0, 34.0, 19.0, 15.0, 12.0, 20.0, 17.0, 14.0, 12.0, 12.0, 10.0, 5.0, 5.0, 3.0, 2.0, 2.0, 3.0, 2.0, 5.0, 1.0, 2.0, 0.0, 2.0], "bins": [-27.235368728637695, -26.405624389648438, -25.57588005065918, -24.746135711669922, -23.916391372680664, -23.086647033691406, -22.25690460205078, -21.42715835571289, -20.597415924072266, -19.767671585083008, -18.93792724609375, -18.108182907104492, -17.278438568115234, -16.448694229125977, -15.618950843811035, -14.789206504821777, -13.959461212158203, -13.129716873168945, -12.299972534179688, -11.47022819519043, -10.640483856201172, -9.810739517211914, -8.980996131896973, -8.151251792907715, -7.321507453918457, -6.491763114929199, -5.662018775939941, -4.832274913787842, -4.002530574798584, -3.172786235809326, -2.3430423736572266, -1.5132980346679688, -0.6835556030273438, 0.1461886167526245, 0.9759328365325928, 1.8056769371032715, 2.6354212760925293, 3.465165615081787, 4.294909477233887, 5.1246538162231445, 5.954398155212402, 6.78414249420166, 7.613886833190918, 8.44363021850586, 9.273374557495117, 10.103118896484375, 10.932863235473633, 11.76260757446289, 12.592351913452148, 13.422096252441406, 14.251840591430664, 15.081584930419922, 15.91132926940918, 16.741073608398438, 17.570816040039062, 18.400562286376953, 19.230304718017578, 20.060049057006836, 20.889793395996094, 21.71953773498535, 22.54928207397461, 23.379026412963867, 24.208770751953125, 25.03851318359375, 25.86825942993164]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 0.0, 1.0, 3.0, 5.0, 6.0, 4.0, 7.0, 4.0, 11.0, 14.0, 12.0, 20.0, 26.0, 26.0, 63.0, 91.0, 145.0, 241.0, 517.0, 1214.0, 2974.0, 11253.0, 89062.0, 4032797.0, 45015.0, 7166.0, 2010.0, 799.0, 377.0, 178.0, 100.0, 50.0, 32.0, 25.0, 12.0, 12.0, 5.0, 4.0, 3.0, 4.0, 1.0, 3.0], "bins": [-28.671875, -28.039794921875, -27.40771484375, -26.775634765625, -26.1435546875, -25.511474609375, -24.87939453125, -24.247314453125, -23.615234375, -22.983154296875, -22.35107421875, -21.718994140625, -21.0869140625, -20.454833984375, -19.82275390625, -19.190673828125, -18.55859375, -17.926513671875, -17.29443359375, -16.662353515625, -16.0302734375, -15.398193359375, -14.76611328125, -14.134033203125, -13.501953125, -12.869873046875, -12.23779296875, -11.605712890625, -10.9736328125, -10.341552734375, -9.70947265625, -9.077392578125, -8.4453125, -7.813232421875, -7.18115234375, -6.549072265625, -5.9169921875, -5.284912109375, -4.65283203125, -4.020751953125, -3.388671875, -2.756591796875, -2.12451171875, -1.492431640625, -0.8603515625, -0.228271484375, 0.40380859375, 1.035888671875, 1.66796875, 2.300048828125, 2.93212890625, 3.564208984375, 4.1962890625, 4.828369140625, 5.46044921875, 6.092529296875, 6.724609375, 7.356689453125, 7.98876953125, 8.620849609375, 9.2529296875, 9.885009765625, 10.51708984375, 11.149169921875, 11.78125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 8.0, 10.0, 15.0, 20.0, 28.0, 31.0, 43.0, 52.0, 55.0, 89.0, 97.0, 82.0, 99.0, 84.0, 61.0, 53.0, 52.0, 37.0, 24.0, 22.0, 18.0, 2.0, 4.0, 5.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.96875, -3.86541748046875, -3.7620849609375, -3.65875244140625, -3.555419921875, -3.45208740234375, -3.3487548828125, -3.24542236328125, -3.14208984375, -3.03875732421875, -2.9354248046875, -2.83209228515625, -2.728759765625, -2.62542724609375, -2.5220947265625, -2.41876220703125, -2.3154296875, -2.21209716796875, -2.1087646484375, -2.00543212890625, -1.902099609375, -1.79876708984375, -1.6954345703125, -1.59210205078125, -1.48876953125, -1.38543701171875, -1.2821044921875, -1.17877197265625, -1.075439453125, -0.97210693359375, -0.8687744140625, -0.76544189453125, -0.662109375, -0.55877685546875, -0.4554443359375, -0.35211181640625, -0.248779296875, -0.14544677734375, -0.0421142578125, 0.06121826171875, 0.16455078125, 0.26788330078125, 0.3712158203125, 0.47454833984375, 0.577880859375, 0.68121337890625, 0.7845458984375, 0.88787841796875, 0.9912109375, 1.09454345703125, 1.1978759765625, 1.30120849609375, 1.404541015625, 1.50787353515625, 1.6112060546875, 1.71453857421875, 1.81787109375, 1.92120361328125, 2.0245361328125, 2.12786865234375, 2.231201171875, 2.33453369140625, 2.4378662109375, 2.54119873046875, 2.64453125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 8.0, 12.0, 21.0, 29.0, 57.0, 69.0, 153.0, 327.0, 715.0, 2190.0, 9447.0, 109451.0, 4033713.0, 31145.0, 4708.0, 1271.0, 501.0, 223.0, 113.0, 59.0, 28.0, 18.0, 6.0, 5.0, 4.0, 3.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.4375, -23.6806640625, -22.923828125, -22.1669921875, -21.41015625, -20.6533203125, -19.896484375, -19.1396484375, -18.3828125, -17.6259765625, -16.869140625, -16.1123046875, -15.35546875, -14.5986328125, -13.841796875, -13.0849609375, -12.328125, -11.5712890625, -10.814453125, -10.0576171875, -9.30078125, -8.5439453125, -7.787109375, -7.0302734375, -6.2734375, -5.5166015625, -4.759765625, -4.0029296875, -3.24609375, -2.4892578125, -1.732421875, -0.9755859375, -0.21875, 0.5380859375, 1.294921875, 2.0517578125, 2.80859375, 3.5654296875, 4.322265625, 5.0791015625, 5.8359375, 6.5927734375, 7.349609375, 8.1064453125, 8.86328125, 9.6201171875, 10.376953125, 11.1337890625, 11.890625, 12.6474609375, 13.404296875, 14.1611328125, 14.91796875, 15.6748046875, 16.431640625, 17.1884765625, 17.9453125, 18.7021484375, 19.458984375, 20.2158203125, 20.97265625, 21.7294921875, 22.486328125, 23.2431640625, 24.0]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 6.0, 3.0, 4.0, 4.0, 9.0, 20.0, 31.0, 35.0, 72.0, 212.0, 3307.0, 207.0, 75.0, 30.0, 21.0, 16.0, 5.0, 6.0, 5.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.515625, -10.2789306640625, -10.042236328125, -9.8055419921875, -9.56884765625, -9.3321533203125, -9.095458984375, -8.8587646484375, -8.6220703125, -8.3853759765625, -8.148681640625, -7.9119873046875, -7.67529296875, -7.4385986328125, -7.201904296875, -6.9652099609375, -6.728515625, -6.4918212890625, -6.255126953125, -6.0184326171875, -5.78173828125, -5.5450439453125, -5.308349609375, -5.0716552734375, -4.8349609375, -4.5982666015625, -4.361572265625, -4.1248779296875, -3.88818359375, -3.6514892578125, -3.414794921875, -3.1781005859375, -2.94140625, -2.7047119140625, -2.468017578125, -2.2313232421875, -1.99462890625, -1.7579345703125, -1.521240234375, -1.2845458984375, -1.0478515625, -0.8111572265625, -0.574462890625, -0.3377685546875, -0.10107421875, 0.1356201171875, 0.372314453125, 0.6090087890625, 0.845703125, 1.0823974609375, 1.319091796875, 1.5557861328125, 1.79248046875, 2.0291748046875, 2.265869140625, 2.5025634765625, 2.7392578125, 2.9759521484375, 3.212646484375, 3.4493408203125, 3.68603515625, 3.9227294921875, 4.159423828125, 4.3961181640625, 4.6328125]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 5.0, 6.0, 12.0, 64.0, 480.0, 404.0, 30.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0], "bins": [-185.8597869873047, -182.5428009033203, -179.22579956054688, -175.9088134765625, -172.59182739257812, -169.27484130859375, -165.95785522460938, -162.64085388183594, -159.32386779785156, -156.0068817138672, -152.68988037109375, -149.37289428710938, -146.055908203125, -142.73892211914062, -139.42193603515625, -136.1049346923828, -132.78794860839844, -129.47096252441406, -126.15396881103516, -122.83697509765625, -119.51998901367188, -116.2030029296875, -112.8860092163086, -109.56901550292969, -106.25202941894531, -102.93504333496094, -99.61804962158203, -96.30105590820312, -92.98406982421875, -89.66708374023438, -86.35009002685547, -83.03309631347656, -79.71610260009766, -76.39910888671875, -73.08212280273438, -69.76513671875, -66.4481430053711, -63.13115310668945, -59.81416320800781, -56.49717330932617, -53.18018341064453, -49.86319351196289, -46.54620361328125, -43.22921371459961, -39.91222381591797, -36.59523391723633, -33.27824401855469, -29.961254119873047, -26.644264221191406, -23.327274322509766, -20.010284423828125, -16.693294525146484, -13.376304626464844, -10.059314727783203, -6.7423248291015625, -3.425334930419922, -0.10834503173828125, 3.2086448669433594, 6.525634765625, 9.84262466430664, 13.159614562988281, 16.476604461669922, 19.793594360351562, 23.110584259033203, 26.427574157714844]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 5.0, 12.0, 7.0, 23.0, 27.0, 27.0, 38.0, 38.0, 41.0, 44.0, 57.0, 56.0, 74.0, 71.0, 69.0, 61.0, 67.0, 48.0, 43.0, 40.0, 34.0, 29.0, 21.0, 17.0, 12.0, 10.0, 9.0, 7.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.015426635742188, -22.394935607910156, -21.774442672729492, -21.15395164489746, -20.53346061706543, -19.912967681884766, -19.292476654052734, -18.671985626220703, -18.051494598388672, -17.43100357055664, -16.810510635375977, -16.190019607543945, -15.569528579711914, -14.949036598205566, -14.328544616699219, -13.708053588867188, -13.087560653686523, -12.467068672180176, -11.846577644348145, -11.226085662841797, -10.605594635009766, -9.985102653503418, -9.36461067199707, -8.744119644165039, -8.123627662658691, -7.503136157989502, -6.8826446533203125, -6.262152671813965, -5.641661167144775, -5.021169662475586, -4.400677680969238, -3.780186176300049, -3.1596946716308594, -2.53920316696167, -1.9187114238739014, -1.2982197999954224, -0.6777281761169434, -0.057236671447753906, 0.5632550716400146, 1.1837468147277832, 1.8042383193969727, 2.424729824066162, 3.0452215671539307, 3.665713310241699, 4.286204814910889, 4.906696319580078, 5.527188301086426, 6.147679805755615, 6.768171310424805, 7.388662815093994, 8.009154319763184, 8.629646301269531, 9.250137329101562, 9.87062931060791, 10.491121292114258, 11.111612319946289, 11.732104301452637, 12.352596282958984, 12.973087310791016, 13.593579292297363, 14.214071273803711, 14.834562301635742, 15.45505428314209, 16.075546264648438, 16.69603729248047]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 2.0, 2.0, 5.0, 6.0, 7.0, 8.0, 13.0, 19.0, 23.0, 36.0, 42.0, 104.0, 188.0, 346.0, 805.0, 2047.0, 7094.0, 34707.0, 274404.0, 632498.0, 77545.0, 13220.0, 3246.0, 1108.0, 489.0, 265.0, 129.0, 66.0, 41.0, 29.0, 14.0, 12.0, 13.0, 8.0, 8.0, 5.0, 0.0, 4.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.5625, -10.0869140625, -9.611328125, -9.1357421875, -8.66015625, -8.1845703125, -7.708984375, -7.2333984375, -6.7578125, -6.2822265625, -5.806640625, -5.3310546875, -4.85546875, -4.3798828125, -3.904296875, -3.4287109375, -2.953125, -2.4775390625, -2.001953125, -1.5263671875, -1.05078125, -0.5751953125, -0.099609375, 0.3759765625, 0.8515625, 1.3271484375, 1.802734375, 2.2783203125, 2.75390625, 3.2294921875, 3.705078125, 4.1806640625, 4.65625, 5.1318359375, 5.607421875, 6.0830078125, 6.55859375, 7.0341796875, 7.509765625, 7.9853515625, 8.4609375, 8.9365234375, 9.412109375, 9.8876953125, 10.36328125, 10.8388671875, 11.314453125, 11.7900390625, 12.265625, 12.7412109375, 13.216796875, 13.6923828125, 14.16796875, 14.6435546875, 15.119140625, 15.5947265625, 16.0703125, 16.5458984375, 17.021484375, 17.4970703125, 17.97265625, 18.4482421875, 18.923828125, 19.3994140625, 19.875]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 7.0, 10.0, 16.0, 22.0, 25.0, 26.0, 57.0, 63.0, 65.0, 98.0, 97.0, 87.0, 84.0, 76.0, 67.0, 62.0, 47.0, 33.0, 21.0, 15.0, 9.0, 4.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.7734375, -4.654571533203125, -4.53570556640625, -4.416839599609375, -4.2979736328125, -4.179107666015625, -4.06024169921875, -3.941375732421875, -3.822509765625, -3.703643798828125, -3.58477783203125, -3.465911865234375, -3.3470458984375, -3.228179931640625, -3.10931396484375, -2.990447998046875, -2.87158203125, -2.752716064453125, -2.63385009765625, -2.514984130859375, -2.3961181640625, -2.277252197265625, -2.15838623046875, -2.039520263671875, -1.920654296875, -1.801788330078125, -1.68292236328125, -1.564056396484375, -1.4451904296875, -1.326324462890625, -1.20745849609375, -1.088592529296875, -0.9697265625, -0.850860595703125, -0.73199462890625, -0.613128662109375, -0.4942626953125, -0.375396728515625, -0.25653076171875, -0.137664794921875, -0.018798828125, 0.100067138671875, 0.21893310546875, 0.337799072265625, 0.4566650390625, 0.575531005859375, 0.69439697265625, 0.813262939453125, 0.93212890625, 1.050994873046875, 1.16986083984375, 1.288726806640625, 1.4075927734375, 1.526458740234375, 1.64532470703125, 1.764190673828125, 1.883056640625, 2.001922607421875, 2.12078857421875, 2.239654541015625, 2.3585205078125, 2.477386474609375, 2.59625244140625, 2.715118408203125, 2.833984375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 6.0, 1.0, 4.0, 11.0, 11.0, 19.0, 23.0, 40.0, 48.0, 59.0, 116.0, 237.0, 454.0, 1114.0, 3070.0, 10665.0, 52985.0, 407417.0, 493500.0, 61319.0, 11892.0, 3362.0, 1162.0, 485.0, 220.0, 121.0, 61.0, 43.0, 23.0, 23.0, 19.0, 11.0, 6.0, 12.0, 3.0, 4.0, 6.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-12.1875, -11.80712890625, -11.4267578125, -11.04638671875, -10.666015625, -10.28564453125, -9.9052734375, -9.52490234375, -9.14453125, -8.76416015625, -8.3837890625, -8.00341796875, -7.623046875, -7.24267578125, -6.8623046875, -6.48193359375, -6.1015625, -5.72119140625, -5.3408203125, -4.96044921875, -4.580078125, -4.19970703125, -3.8193359375, -3.43896484375, -3.05859375, -2.67822265625, -2.2978515625, -1.91748046875, -1.537109375, -1.15673828125, -0.7763671875, -0.39599609375, -0.015625, 0.36474609375, 0.7451171875, 1.12548828125, 1.505859375, 1.88623046875, 2.2666015625, 2.64697265625, 3.02734375, 3.40771484375, 3.7880859375, 4.16845703125, 4.548828125, 4.92919921875, 5.3095703125, 5.68994140625, 6.0703125, 6.45068359375, 6.8310546875, 7.21142578125, 7.591796875, 7.97216796875, 8.3525390625, 8.73291015625, 9.11328125, 9.49365234375, 9.8740234375, 10.25439453125, 10.634765625, 11.01513671875, 11.3955078125, 11.77587890625, 12.15625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 9.0, 9.0, 6.0, 8.0, 20.0, 12.0, 22.0, 28.0, 36.0, 31.0, 32.0, 52.0, 49.0, 55.0, 39.0, 59.0, 64.0, 61.0, 53.0, 45.0, 51.0, 44.0, 41.0, 37.0, 32.0, 21.0, 27.0, 16.0, 10.0, 9.0, 7.0, 2.0, 4.0, 5.0, 2.0, 0.0, 0.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.9375, -11.582763671875, -11.22802734375, -10.873291015625, -10.5185546875, -10.163818359375, -9.80908203125, -9.454345703125, -9.099609375, -8.744873046875, -8.39013671875, -8.035400390625, -7.6806640625, -7.325927734375, -6.97119140625, -6.616455078125, -6.26171875, -5.906982421875, -5.55224609375, -5.197509765625, -4.8427734375, -4.488037109375, -4.13330078125, -3.778564453125, -3.423828125, -3.069091796875, -2.71435546875, -2.359619140625, -2.0048828125, -1.650146484375, -1.29541015625, -0.940673828125, -0.5859375, -0.231201171875, 0.12353515625, 0.478271484375, 0.8330078125, 1.187744140625, 1.54248046875, 1.897216796875, 2.251953125, 2.606689453125, 2.96142578125, 3.316162109375, 3.6708984375, 4.025634765625, 4.38037109375, 4.735107421875, 5.08984375, 5.444580078125, 5.79931640625, 6.154052734375, 6.5087890625, 6.863525390625, 7.21826171875, 7.572998046875, 7.927734375, 8.282470703125, 8.63720703125, 8.991943359375, 9.3466796875, 9.701416015625, 10.05615234375, 10.410888671875, 10.765625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 7.0, 10.0, 25.0, 33.0, 65.0, 186.0, 632.0, 2868.0, 18881.0, 987956.0, 32790.0, 3855.0, 836.0, 240.0, 69.0, 42.0, 22.0, 17.0, 5.0, 5.0, 2.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.8125, -17.116455078125, -16.42041015625, -15.724365234375, -15.0283203125, -14.332275390625, -13.63623046875, -12.940185546875, -12.244140625, -11.548095703125, -10.85205078125, -10.156005859375, -9.4599609375, -8.763916015625, -8.06787109375, -7.371826171875, -6.67578125, -5.979736328125, -5.28369140625, -4.587646484375, -3.8916015625, -3.195556640625, -2.49951171875, -1.803466796875, -1.107421875, -0.411376953125, 0.28466796875, 0.980712890625, 1.6767578125, 2.372802734375, 3.06884765625, 3.764892578125, 4.4609375, 5.156982421875, 5.85302734375, 6.549072265625, 7.2451171875, 7.941162109375, 8.63720703125, 9.333251953125, 10.029296875, 10.725341796875, 11.42138671875, 12.117431640625, 12.8134765625, 13.509521484375, 14.20556640625, 14.901611328125, 15.59765625, 16.293701171875, 16.98974609375, 17.685791015625, 18.3818359375, 19.077880859375, 19.77392578125, 20.469970703125, 21.166015625, 21.862060546875, 22.55810546875, 23.254150390625, 23.9501953125, 24.646240234375, 25.34228515625, 26.038330078125, 26.734375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 4.0, 5.0, 3.0, 9.0, 19.0, 35.0, 66.0, 163.0, 294.0, 219.0, 85.0, 54.0, 20.0, 10.0, 8.0, 4.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010986328125, -0.0010479092597961426, -0.0009971857070922852, -0.0009464621543884277, -0.0008957386016845703, -0.0008450150489807129, -0.0007942914962768555, -0.000743567943572998, -0.0006928443908691406, -0.0006421208381652832, -0.0005913972854614258, -0.0005406737327575684, -0.0004899501800537109, -0.0004392266273498535, -0.0003885030746459961, -0.00033777952194213867, -0.00028705596923828125, -0.00023633241653442383, -0.0001856088638305664, -0.00013488531112670898, -8.416175842285156e-05, -3.343820571899414e-05, 1.728534698486328e-05, 6.80088996887207e-05, 0.00011873245239257812, 0.00016945600509643555, 0.00022017955780029297, 0.0002709031105041504, 0.0003216266632080078, 0.00037235021591186523, 0.00042307376861572266, 0.0004737973213195801, 0.0005245208740234375, 0.0005752444267272949, 0.0006259679794311523, 0.0006766915321350098, 0.0007274150848388672, 0.0007781386375427246, 0.000828862190246582, 0.0008795857429504395, 0.0009303092956542969, 0.0009810328483581543, 0.0010317564010620117, 0.0010824799537658691, 0.0011332035064697266, 0.001183927059173584, 0.0012346506118774414, 0.0012853741645812988, 0.0013360977172851562, 0.0013868212699890137, 0.001437544822692871, 0.0014882683753967285, 0.001538991928100586, 0.0015897154808044434, 0.0016404390335083008, 0.0016911625862121582, 0.0017418861389160156, 0.001792609691619873, 0.0018433332443237305, 0.0018940567970275879, 0.0019447803497314453, 0.0019955039024353027, 0.00204622745513916, 0.0020969510078430176, 0.002147674560546875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 4.0, 7.0, 5.0, 11.0, 12.0, 31.0, 37.0, 80.0, 186.0, 573.0, 1969.0, 9263.0, 914322.0, 114280.0, 5675.0, 1393.0, 403.0, 169.0, 64.0, 18.0, 13.0, 7.0, 10.0, 4.0, 1.0, 3.0, 2.0, 2.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-33.71875, -32.872802734375, -32.02685546875, -31.180908203125, -30.3349609375, -29.489013671875, -28.64306640625, -27.797119140625, -26.951171875, -26.105224609375, -25.25927734375, -24.413330078125, -23.5673828125, -22.721435546875, -21.87548828125, -21.029541015625, -20.18359375, -19.337646484375, -18.49169921875, -17.645751953125, -16.7998046875, -15.953857421875, -15.10791015625, -14.261962890625, -13.416015625, -12.570068359375, -11.72412109375, -10.878173828125, -10.0322265625, -9.186279296875, -8.34033203125, -7.494384765625, -6.6484375, -5.802490234375, -4.95654296875, -4.110595703125, -3.2646484375, -2.418701171875, -1.57275390625, -0.726806640625, 0.119140625, 0.965087890625, 1.81103515625, 2.656982421875, 3.5029296875, 4.348876953125, 5.19482421875, 6.040771484375, 6.88671875, 7.732666015625, 8.57861328125, 9.424560546875, 10.2705078125, 11.116455078125, 11.96240234375, 12.808349609375, 13.654296875, 14.500244140625, 15.34619140625, 16.192138671875, 17.0380859375, 17.884033203125, 18.72998046875, 19.575927734375, 20.421875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 5.0, 2.0, 3.0, 2.0, 7.0, 6.0, 9.0, 13.0, 20.0, 24.0, 48.0, 106.0, 207.0, 248.0, 115.0, 63.0, 35.0, 24.0, 11.0, 13.0, 8.0, 7.0, 2.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-13.4765625, -13.140869140625, -12.80517578125, -12.469482421875, -12.1337890625, -11.798095703125, -11.46240234375, -11.126708984375, -10.791015625, -10.455322265625, -10.11962890625, -9.783935546875, -9.4482421875, -9.112548828125, -8.77685546875, -8.441162109375, -8.10546875, -7.769775390625, -7.43408203125, -7.098388671875, -6.7626953125, -6.427001953125, -6.09130859375, -5.755615234375, -5.419921875, -5.084228515625, -4.74853515625, -4.412841796875, -4.0771484375, -3.741455078125, -3.40576171875, -3.070068359375, -2.734375, -2.398681640625, -2.06298828125, -1.727294921875, -1.3916015625, -1.055908203125, -0.72021484375, -0.384521484375, -0.048828125, 0.286865234375, 0.62255859375, 0.958251953125, 1.2939453125, 1.629638671875, 1.96533203125, 2.301025390625, 2.63671875, 2.972412109375, 3.30810546875, 3.643798828125, 3.9794921875, 4.315185546875, 4.65087890625, 4.986572265625, 5.322265625, 5.657958984375, 5.99365234375, 6.329345703125, 6.6650390625, 7.000732421875, 7.33642578125, 7.672119140625, 8.0078125]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 7.0, 36.0, 138.0, 495.0, 268.0, 46.0, 17.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-435.25030517578125, -425.3087158203125, -415.3671569824219, -405.4255676269531, -395.4840087890625, -385.54241943359375, -375.6008605957031, -365.6592712402344, -355.71771240234375, -345.776123046875, -335.8345642089844, -325.8929748535156, -315.951416015625, -306.00982666015625, -296.0682678222656, -286.1266784667969, -276.18511962890625, -266.2435302734375, -256.3019714355469, -246.3603973388672, -236.4188232421875, -226.4772491455078, -216.53567504882812, -206.59408569335938, -196.65249633789062, -186.71092224121094, -176.76934814453125, -166.82777404785156, -156.88619995117188, -146.9446258544922, -137.0030517578125, -127.06147003173828, -117.11990356445312, -107.17832946777344, -97.23675537109375, -87.29518127441406, -77.35360717773438, -67.41203308105469, -57.47045135498047, -47.52887725830078, -37.587303161621094, -27.645729064941406, -17.704153060913086, -7.762577056884766, 2.178997039794922, 12.12057113647461, 22.062149047851562, 32.00372314453125, 41.94529724121094, 51.886871337890625, 61.82844543457031, 71.77001953125, 81.71159362792969, 91.65316772460938, 101.5947494506836, 111.53632354736328, 121.47789764404297, 131.4194793701172, 141.36105346679688, 151.30262756347656, 161.24420166015625, 171.18577575683594, 181.12734985351562, 191.0689239501953, 201.010498046875]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 8.0, 1.0, 4.0, 2.0, 6.0, 5.0, 13.0, 10.0, 4.0, 11.0, 4.0, 17.0, 11.0, 18.0, 20.0, 19.0, 22.0, 20.0, 37.0, 32.0, 35.0, 46.0, 39.0, 39.0, 45.0, 39.0, 31.0, 37.0, 43.0, 48.0, 28.0, 29.0, 27.0, 31.0, 29.0, 25.0, 20.0, 23.0, 24.0, 15.0, 17.0, 17.0, 12.0, 10.0, 8.0, 10.0, 6.0, 2.0, 7.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 4.0], "bins": [-54.1911506652832, -52.606178283691406, -51.021209716796875, -49.436241149902344, -47.85126876831055, -46.26629638671875, -44.68132781982422, -43.09635925292969, -41.51138687133789, -39.926414489746094, -38.34144592285156, -36.75647735595703, -35.171504974365234, -33.58653259277344, -32.001564025878906, -30.416593551635742, -28.831623077392578, -27.246652603149414, -25.66168212890625, -24.076711654663086, -22.491741180419922, -20.906770706176758, -19.321800231933594, -17.73682975769043, -16.151859283447266, -14.566888809204102, -12.981918334960938, -11.396947860717773, -9.81197738647461, -8.227006912231445, -6.642036437988281, -5.057065963745117, -3.4720916748046875, -1.8871212005615234, -0.3021507263183594, 1.2828197479248047, 2.8677902221679688, 4.452760696411133, 6.037731170654297, 7.622701644897461, 9.207672119140625, 10.792642593383789, 12.377613067626953, 13.962583541870117, 15.547554016113281, 17.132524490356445, 18.71749496459961, 20.302465438842773, 21.887435913085938, 23.4724063873291, 25.057376861572266, 26.64234733581543, 28.227317810058594, 29.812288284301758, 31.397258758544922, 32.98223114013672, 34.56719970703125, 36.15216827392578, 37.73714065551758, 39.322113037109375, 40.907081604003906, 42.49205017089844, 44.077022552490234, 45.66199493408203, 47.24696350097656]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 6.0, 9.0, 3.0, 4.0, 4.0, 6.0, 9.0, 9.0, 18.0, 15.0, 30.0, 47.0, 56.0, 65.0, 108.0, 219.0, 380.0, 852.0, 2086.0, 5809.0, 20517.0, 141498.0, 3950805.0, 53861.0, 11755.0, 3549.0, 1366.0, 585.0, 271.0, 142.0, 79.0, 45.0, 30.0, 17.0, 11.0, 7.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-29.546875, -28.8797607421875, -28.212646484375, -27.5455322265625, -26.87841796875, -26.2113037109375, -25.544189453125, -24.8770751953125, -24.2099609375, -23.5428466796875, -22.875732421875, -22.2086181640625, -21.54150390625, -20.8743896484375, -20.207275390625, -19.5401611328125, -18.873046875, -18.2059326171875, -17.538818359375, -16.8717041015625, -16.20458984375, -15.5374755859375, -14.870361328125, -14.2032470703125, -13.5361328125, -12.8690185546875, -12.201904296875, -11.5347900390625, -10.86767578125, -10.2005615234375, -9.533447265625, -8.8663330078125, -8.19921875, -7.5321044921875, -6.864990234375, -6.1978759765625, -5.53076171875, -4.8636474609375, -4.196533203125, -3.5294189453125, -2.8623046875, -2.1951904296875, -1.528076171875, -0.8609619140625, -0.19384765625, 0.4732666015625, 1.140380859375, 1.8074951171875, 2.474609375, 3.1417236328125, 3.808837890625, 4.4759521484375, 5.14306640625, 5.8101806640625, 6.477294921875, 7.1444091796875, 7.8115234375, 8.4786376953125, 9.145751953125, 9.8128662109375, 10.47998046875, 11.1470947265625, 11.814208984375, 12.4813232421875, 13.1484375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 1.0, 3.0, 13.0, 5.0, 10.0, 19.0, 20.0, 32.0, 27.0, 52.0, 52.0, 71.0, 56.0, 76.0, 86.0, 57.0, 73.0, 53.0, 64.0, 51.0, 47.0, 37.0, 24.0, 26.0, 12.0, 9.0, 13.0, 7.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-4.94140625, -4.820159912109375, -4.69891357421875, -4.577667236328125, -4.4564208984375, -4.335174560546875, -4.21392822265625, -4.092681884765625, -3.971435546875, -3.850189208984375, -3.72894287109375, -3.607696533203125, -3.4864501953125, -3.365203857421875, -3.24395751953125, -3.122711181640625, -3.00146484375, -2.880218505859375, -2.75897216796875, -2.637725830078125, -2.5164794921875, -2.395233154296875, -2.27398681640625, -2.152740478515625, -2.031494140625, -1.910247802734375, -1.78900146484375, -1.667755126953125, -1.5465087890625, -1.425262451171875, -1.30401611328125, -1.182769775390625, -1.0615234375, -0.940277099609375, -0.81903076171875, -0.697784423828125, -0.5765380859375, -0.455291748046875, -0.33404541015625, -0.212799072265625, -0.091552734375, 0.029693603515625, 0.15093994140625, 0.272186279296875, 0.3934326171875, 0.514678955078125, 0.63592529296875, 0.757171630859375, 0.87841796875, 0.999664306640625, 1.12091064453125, 1.242156982421875, 1.3634033203125, 1.484649658203125, 1.60589599609375, 1.727142333984375, 1.848388671875, 1.969635009765625, 2.09088134765625, 2.212127685546875, 2.3333740234375, 2.454620361328125, 2.57586669921875, 2.697113037109375, 2.818359375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 5.0, 6.0, 4.0, 7.0, 16.0, 29.0, 49.0, 97.0, 220.0, 468.0, 1165.0, 3035.0, 10823.0, 68125.0, 3946228.0, 140782.0, 16412.0, 4205.0, 1522.0, 621.0, 214.0, 110.0, 65.0, 32.0, 21.0, 7.0, 4.0, 4.0, 5.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.96875, -18.256591796875, -17.54443359375, -16.832275390625, -16.1201171875, -15.407958984375, -14.69580078125, -13.983642578125, -13.271484375, -12.559326171875, -11.84716796875, -11.135009765625, -10.4228515625, -9.710693359375, -8.99853515625, -8.286376953125, -7.57421875, -6.862060546875, -6.14990234375, -5.437744140625, -4.7255859375, -4.013427734375, -3.30126953125, -2.589111328125, -1.876953125, -1.164794921875, -0.45263671875, 0.259521484375, 0.9716796875, 1.683837890625, 2.39599609375, 3.108154296875, 3.8203125, 4.532470703125, 5.24462890625, 5.956787109375, 6.6689453125, 7.381103515625, 8.09326171875, 8.805419921875, 9.517578125, 10.229736328125, 10.94189453125, 11.654052734375, 12.3662109375, 13.078369140625, 13.79052734375, 14.502685546875, 15.21484375, 15.927001953125, 16.63916015625, 17.351318359375, 18.0634765625, 18.775634765625, 19.48779296875, 20.199951171875, 20.912109375, 21.624267578125, 22.33642578125, 23.048583984375, 23.7607421875, 24.472900390625, 25.18505859375, 25.897216796875, 26.609375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 4.0, 0.0, 2.0, 3.0, 3.0, 3.0, 1.0, 4.0, 3.0, 1.0, 5.0, 10.0, 9.0, 7.0, 18.0, 23.0, 22.0, 33.0, 42.0, 74.0, 106.0, 308.0, 2794.0, 250.0, 102.0, 72.0, 56.0, 36.0, 19.0, 12.0, 14.0, 9.0, 10.0, 3.0, 5.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.359375, -5.15673828125, -4.9541015625, -4.75146484375, -4.548828125, -4.34619140625, -4.1435546875, -3.94091796875, -3.73828125, -3.53564453125, -3.3330078125, -3.13037109375, -2.927734375, -2.72509765625, -2.5224609375, -2.31982421875, -2.1171875, -1.91455078125, -1.7119140625, -1.50927734375, -1.306640625, -1.10400390625, -0.9013671875, -0.69873046875, -0.49609375, -0.29345703125, -0.0908203125, 0.11181640625, 0.314453125, 0.51708984375, 0.7197265625, 0.92236328125, 1.125, 1.32763671875, 1.5302734375, 1.73291015625, 1.935546875, 2.13818359375, 2.3408203125, 2.54345703125, 2.74609375, 2.94873046875, 3.1513671875, 3.35400390625, 3.556640625, 3.75927734375, 3.9619140625, 4.16455078125, 4.3671875, 4.56982421875, 4.7724609375, 4.97509765625, 5.177734375, 5.38037109375, 5.5830078125, 5.78564453125, 5.98828125, 6.19091796875, 6.3935546875, 6.59619140625, 6.798828125, 7.00146484375, 7.2041015625, 7.40673828125, 7.609375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 4.0, 5.0, 7.0, 8.0, 56.0, 173.0, 346.0, 265.0, 94.0, 25.0, 16.0, 4.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-113.9105224609375, -111.41545867919922, -108.9203872680664, -106.42532348632812, -103.93025207519531, -101.43518829345703, -98.94011688232422, -96.44505310058594, -93.94998168945312, -91.45491790771484, -88.95984649658203, -86.46478271484375, -83.96971130371094, -81.47464752197266, -78.97957611083984, -76.48451232910156, -73.98944854736328, -71.494384765625, -68.99931335449219, -66.5042495727539, -64.0091781616211, -61.51411437988281, -59.019046783447266, -56.52397918701172, -54.02891159057617, -51.533843994140625, -49.03877639770508, -46.54370880126953, -44.04864501953125, -41.55357360839844, -39.058509826660156, -36.56344223022461, -34.06836700439453, -31.573299407958984, -29.078231811523438, -26.583166122436523, -24.088098526000977, -21.59303092956543, -19.097965240478516, -16.60289764404297, -14.107830047607422, -11.612762451171875, -9.117695808410645, -6.622628688812256, -4.127561569213867, -1.6324939727783203, 0.8625726699829102, 3.3576393127441406, 5.8527069091796875, 8.347774505615234, 10.842841148376465, 13.337907791137695, 15.832975387573242, 18.32804298400879, 20.823108673095703, 23.31817626953125, 25.813243865966797, 28.308311462402344, 30.80337905883789, 33.29844665527344, 35.79351043701172, 38.28858184814453, 40.78364562988281, 43.27871322631836, 45.773780822753906]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 4.0, 4.0, 5.0, 4.0, 10.0, 13.0, 10.0, 21.0, 25.0, 24.0, 28.0, 31.0, 39.0, 31.0, 39.0, 44.0, 52.0, 42.0, 47.0, 51.0, 52.0, 43.0, 61.0, 46.0, 44.0, 34.0, 33.0, 28.0, 25.0, 15.0, 17.0, 25.0, 11.0, 15.0, 6.0, 5.0, 13.0, 0.0, 3.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.497329711914062, -18.81647491455078, -18.1356201171875, -17.45476531982422, -16.773910522460938, -16.093055725097656, -15.412200927734375, -14.731346130371094, -14.050491333007812, -13.369636535644531, -12.68878173828125, -12.007926940917969, -11.327072143554688, -10.646217346191406, -9.965362548828125, -9.284507751464844, -8.603652954101562, -7.922798156738281, -7.241943359375, -6.561088562011719, -5.8802337646484375, -5.199378967285156, -4.518524169921875, -3.8376693725585938, -3.1568145751953125, -2.4759597778320312, -1.79510498046875, -1.1142501831054688, -0.4333953857421875, 0.24745941162109375, 0.928314208984375, 1.6091690063476562, 2.2900238037109375, 2.9708786010742188, 3.6517333984375, 4.332588195800781, 5.0134429931640625, 5.694297790527344, 6.375152587890625, 7.056007385253906, 7.7368621826171875, 8.417716979980469, 9.09857177734375, 9.779426574707031, 10.460281372070312, 11.141136169433594, 11.821990966796875, 12.502845764160156, 13.183700561523438, 13.864555358886719, 14.54541015625, 15.226264953613281, 15.907119750976562, 16.587974548339844, 17.268829345703125, 17.949684143066406, 18.630538940429688, 19.31139373779297, 19.99224853515625, 20.67310333251953, 21.353958129882812, 22.034812927246094, 22.715667724609375, 23.396522521972656, 24.077377319335938]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 4.0, 4.0, 10.0, 5.0, 9.0, 12.0, 22.0, 26.0, 51.0, 101.0, 201.0, 405.0, 996.0, 3258.0, 13270.0, 70392.0, 510564.0, 382089.0, 52490.0, 10307.0, 2733.0, 855.0, 364.0, 165.0, 87.0, 46.0, 28.0, 18.0, 16.0, 7.0, 10.0, 4.0, 4.0, 6.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.796875, -21.23681640625, -20.6767578125, -20.11669921875, -19.556640625, -18.99658203125, -18.4365234375, -17.87646484375, -17.31640625, -16.75634765625, -16.1962890625, -15.63623046875, -15.076171875, -14.51611328125, -13.9560546875, -13.39599609375, -12.8359375, -12.27587890625, -11.7158203125, -11.15576171875, -10.595703125, -10.03564453125, -9.4755859375, -8.91552734375, -8.35546875, -7.79541015625, -7.2353515625, -6.67529296875, -6.115234375, -5.55517578125, -4.9951171875, -4.43505859375, -3.875, -3.31494140625, -2.7548828125, -2.19482421875, -1.634765625, -1.07470703125, -0.5146484375, 0.04541015625, 0.60546875, 1.16552734375, 1.7255859375, 2.28564453125, 2.845703125, 3.40576171875, 3.9658203125, 4.52587890625, 5.0859375, 5.64599609375, 6.2060546875, 6.76611328125, 7.326171875, 7.88623046875, 8.4462890625, 9.00634765625, 9.56640625, 10.12646484375, 10.6865234375, 11.24658203125, 11.806640625, 12.36669921875, 12.9267578125, 13.48681640625, 14.046875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 3.0, 5.0, 9.0, 10.0, 12.0, 12.0, 29.0, 29.0, 39.0, 55.0, 45.0, 60.0, 66.0, 74.0, 78.0, 75.0, 62.0, 61.0, 56.0, 43.0, 54.0, 36.0, 29.0, 14.0, 14.0, 14.0, 8.0, 6.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-5.296875, -5.16632080078125, -5.0357666015625, -4.90521240234375, -4.774658203125, -4.64410400390625, -4.5135498046875, -4.38299560546875, -4.25244140625, -4.12188720703125, -3.9913330078125, -3.86077880859375, -3.730224609375, -3.59967041015625, -3.4691162109375, -3.33856201171875, -3.2080078125, -3.07745361328125, -2.9468994140625, -2.81634521484375, -2.685791015625, -2.55523681640625, -2.4246826171875, -2.29412841796875, -2.16357421875, -2.03302001953125, -1.9024658203125, -1.77191162109375, -1.641357421875, -1.51080322265625, -1.3802490234375, -1.24969482421875, -1.119140625, -0.98858642578125, -0.8580322265625, -0.72747802734375, -0.596923828125, -0.46636962890625, -0.3358154296875, -0.20526123046875, -0.07470703125, 0.05584716796875, 0.1864013671875, 0.31695556640625, 0.447509765625, 0.57806396484375, 0.7086181640625, 0.83917236328125, 0.9697265625, 1.10028076171875, 1.2308349609375, 1.36138916015625, 1.491943359375, 1.62249755859375, 1.7530517578125, 1.88360595703125, 2.01416015625, 2.14471435546875, 2.2752685546875, 2.40582275390625, 2.536376953125, 2.66693115234375, 2.7974853515625, 2.92803955078125, 3.05859375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 5.0, 7.0, 11.0, 7.0, 21.0, 37.0, 42.0, 75.0, 106.0, 245.0, 452.0, 1074.0, 3029.0, 9591.0, 40350.0, 257145.0, 606541.0, 101339.0, 19858.0, 5293.0, 1793.0, 756.0, 343.0, 159.0, 101.0, 71.0, 35.0, 20.0, 7.0, 8.0, 10.0, 8.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.234375, -11.7685546875, -11.302734375, -10.8369140625, -10.37109375, -9.9052734375, -9.439453125, -8.9736328125, -8.5078125, -8.0419921875, -7.576171875, -7.1103515625, -6.64453125, -6.1787109375, -5.712890625, -5.2470703125, -4.78125, -4.3154296875, -3.849609375, -3.3837890625, -2.91796875, -2.4521484375, -1.986328125, -1.5205078125, -1.0546875, -0.5888671875, -0.123046875, 0.3427734375, 0.80859375, 1.2744140625, 1.740234375, 2.2060546875, 2.671875, 3.1376953125, 3.603515625, 4.0693359375, 4.53515625, 5.0009765625, 5.466796875, 5.9326171875, 6.3984375, 6.8642578125, 7.330078125, 7.7958984375, 8.26171875, 8.7275390625, 9.193359375, 9.6591796875, 10.125, 10.5908203125, 11.056640625, 11.5224609375, 11.98828125, 12.4541015625, 12.919921875, 13.3857421875, 13.8515625, 14.3173828125, 14.783203125, 15.2490234375, 15.71484375, 16.1806640625, 16.646484375, 17.1123046875, 17.578125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 5.0, 8.0, 7.0, 12.0, 10.0, 9.0, 18.0, 14.0, 22.0, 31.0, 29.0, 34.0, 41.0, 54.0, 42.0, 51.0, 65.0, 51.0, 58.0, 51.0, 49.0, 47.0, 48.0, 41.0, 37.0, 42.0, 28.0, 20.0, 17.0, 12.0, 10.0, 6.0, 5.0, 6.0, 4.0, 7.0, 5.0, 2.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.84375, -13.3642578125, -12.884765625, -12.4052734375, -11.92578125, -11.4462890625, -10.966796875, -10.4873046875, -10.0078125, -9.5283203125, -9.048828125, -8.5693359375, -8.08984375, -7.6103515625, -7.130859375, -6.6513671875, -6.171875, -5.6923828125, -5.212890625, -4.7333984375, -4.25390625, -3.7744140625, -3.294921875, -2.8154296875, -2.3359375, -1.8564453125, -1.376953125, -0.8974609375, -0.41796875, 0.0615234375, 0.541015625, 1.0205078125, 1.5, 1.9794921875, 2.458984375, 2.9384765625, 3.41796875, 3.8974609375, 4.376953125, 4.8564453125, 5.3359375, 5.8154296875, 6.294921875, 6.7744140625, 7.25390625, 7.7333984375, 8.212890625, 8.6923828125, 9.171875, 9.6513671875, 10.130859375, 10.6103515625, 11.08984375, 11.5693359375, 12.048828125, 12.5283203125, 13.0078125, 13.4873046875, 13.966796875, 14.4462890625, 14.92578125, 15.4052734375, 15.884765625, 16.3642578125, 16.84375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 7.0, 2.0, 5.0, 9.0, 13.0, 20.0, 32.0, 49.0, 105.0, 221.0, 424.0, 1061.0, 3175.0, 12692.0, 113763.0, 788997.0, 110569.0, 12447.0, 3026.0, 1073.0, 436.0, 193.0, 100.0, 54.0, 23.0, 17.0, 17.0, 8.0, 7.0, 4.0, 2.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.5078125, -6.2794189453125, -6.051025390625, -5.8226318359375, -5.59423828125, -5.3658447265625, -5.137451171875, -4.9090576171875, -4.6806640625, -4.4522705078125, -4.223876953125, -3.9954833984375, -3.76708984375, -3.5386962890625, -3.310302734375, -3.0819091796875, -2.853515625, -2.6251220703125, -2.396728515625, -2.1683349609375, -1.93994140625, -1.7115478515625, -1.483154296875, -1.2547607421875, -1.0263671875, -0.7979736328125, -0.569580078125, -0.3411865234375, -0.11279296875, 0.1156005859375, 0.343994140625, 0.5723876953125, 0.80078125, 1.0291748046875, 1.257568359375, 1.4859619140625, 1.71435546875, 1.9427490234375, 2.171142578125, 2.3995361328125, 2.6279296875, 2.8563232421875, 3.084716796875, 3.3131103515625, 3.54150390625, 3.7698974609375, 3.998291015625, 4.2266845703125, 4.455078125, 4.6834716796875, 4.911865234375, 5.1402587890625, 5.36865234375, 5.5970458984375, 5.825439453125, 6.0538330078125, 6.2822265625, 6.5106201171875, 6.739013671875, 6.9674072265625, 7.19580078125, 7.4241943359375, 7.652587890625, 7.8809814453125, 8.109375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 2.0, 4.0, 8.0, 8.0, 7.0, 11.0, 20.0, 28.0, 56.0, 57.0, 102.0, 137.0, 142.0, 119.0, 100.0, 63.0, 43.0, 27.0, 20.0, 15.0, 11.0, 4.0, 7.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00119781494140625, -0.001165740191936493, -0.0011336654424667358, -0.0011015906929969788, -0.0010695159435272217, -0.0010374411940574646, -0.0010053664445877075, -0.0009732916951179504, -0.0009412169456481934, -0.0009091421961784363, -0.0008770674467086792, -0.0008449926972389221, -0.000812917947769165, -0.000780843198299408, -0.0007487684488296509, -0.0007166936993598938, -0.0006846189498901367, -0.0006525442004203796, -0.0006204694509506226, -0.0005883947014808655, -0.0005563199520111084, -0.0005242452025413513, -0.0004921704530715942, -0.00046009570360183716, -0.0004280209541320801, -0.000395946204662323, -0.0003638714551925659, -0.00033179670572280884, -0.00029972195625305176, -0.0002676472067832947, -0.0002355724573135376, -0.00020349770784378052, -0.00017142295837402344, -0.00013934820890426636, -0.00010727345943450928, -7.51987099647522e-05, -4.312396049499512e-05, -1.1049211025238037e-05, 2.1025538444519043e-05, 5.310028791427612e-05, 8.51750373840332e-05, 0.00011724978685379028, 0.00014932453632354736, 0.00018139928579330444, 0.00021347403526306152, 0.0002455487847328186, 0.0002776235342025757, 0.00030969828367233276, 0.00034177303314208984, 0.0003738477826118469, 0.000405922532081604, 0.0004379972815513611, 0.00047007203102111816, 0.0005021467804908752, 0.0005342215299606323, 0.0005662962794303894, 0.0005983710289001465, 0.0006304457783699036, 0.0006625205278396606, 0.0006945952773094177, 0.0007266700267791748, 0.0007587447762489319, 0.000790819525718689, 0.000822894275188446, 0.0008549690246582031]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 6.0, 12.0, 14.0, 19.0, 44.0, 69.0, 103.0, 257.0, 638.0, 1715.0, 6497.0, 34186.0, 482171.0, 479314.0, 34357.0, 6291.0, 1713.0, 612.0, 270.0, 94.0, 59.0, 40.0, 23.0, 12.0, 8.0, 8.0, 8.0, 4.0, 5.0, 4.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.01171875, -6.76129150390625, -6.5108642578125, -6.26043701171875, -6.010009765625, -5.75958251953125, -5.5091552734375, -5.25872802734375, -5.00830078125, -4.75787353515625, -4.5074462890625, -4.25701904296875, -4.006591796875, -3.75616455078125, -3.5057373046875, -3.25531005859375, -3.0048828125, -2.75445556640625, -2.5040283203125, -2.25360107421875, -2.003173828125, -1.75274658203125, -1.5023193359375, -1.25189208984375, -1.00146484375, -0.75103759765625, -0.5006103515625, -0.25018310546875, 0.000244140625, 0.25067138671875, 0.5010986328125, 0.75152587890625, 1.001953125, 1.25238037109375, 1.5028076171875, 1.75323486328125, 2.003662109375, 2.25408935546875, 2.5045166015625, 2.75494384765625, 3.00537109375, 3.25579833984375, 3.5062255859375, 3.75665283203125, 4.007080078125, 4.25750732421875, 4.5079345703125, 4.75836181640625, 5.0087890625, 5.25921630859375, 5.5096435546875, 5.76007080078125, 6.010498046875, 6.26092529296875, 6.5113525390625, 6.76177978515625, 7.01220703125, 7.26263427734375, 7.5130615234375, 7.76348876953125, 8.013916015625, 8.26434326171875, 8.5147705078125, 8.76519775390625, 9.015625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 4.0, 7.0, 6.0, 11.0, 12.0, 25.0, 24.0, 39.0, 71.0, 91.0, 120.0, 116.0, 134.0, 98.0, 63.0, 41.0, 30.0, 29.0, 19.0, 16.0, 7.0, 11.0, 8.0, 7.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.671875, -6.46783447265625, -6.2637939453125, -6.05975341796875, -5.855712890625, -5.65167236328125, -5.4476318359375, -5.24359130859375, -5.03955078125, -4.83551025390625, -4.6314697265625, -4.42742919921875, -4.223388671875, -4.01934814453125, -3.8153076171875, -3.61126708984375, -3.4072265625, -3.20318603515625, -2.9991455078125, -2.79510498046875, -2.591064453125, -2.38702392578125, -2.1829833984375, -1.97894287109375, -1.77490234375, -1.57086181640625, -1.3668212890625, -1.16278076171875, -0.958740234375, -0.75469970703125, -0.5506591796875, -0.34661865234375, -0.142578125, 0.06146240234375, 0.2655029296875, 0.46954345703125, 0.673583984375, 0.87762451171875, 1.0816650390625, 1.28570556640625, 1.48974609375, 1.69378662109375, 1.8978271484375, 2.10186767578125, 2.305908203125, 2.50994873046875, 2.7139892578125, 2.91802978515625, 3.1220703125, 3.32611083984375, 3.5301513671875, 3.73419189453125, 3.938232421875, 4.14227294921875, 4.3463134765625, 4.55035400390625, 4.75439453125, 4.95843505859375, 5.1624755859375, 5.36651611328125, 5.570556640625, 5.77459716796875, 5.9786376953125, 6.18267822265625, 6.38671875]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 5.0, 5.0, 15.0, 34.0, 55.0, 137.0, 220.0, 223.0, 142.0, 80.0, 38.0, 28.0, 11.0, 1.0, 4.0, 2.0, 0.0, 0.0, 5.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.68299102783203, -89.24522399902344, -84.80745697021484, -80.36968994140625, -75.93192291259766, -71.49415588378906, -67.05638885498047, -62.618621826171875, -58.18085479736328, -53.74308776855469, -49.305320739746094, -44.8675537109375, -40.429786682128906, -35.99201965332031, -31.55425262451172, -27.116485595703125, -22.67871856689453, -18.240951538085938, -13.803184509277344, -9.36541748046875, -4.927650451660156, -0.4898834228515625, 3.9478836059570312, 8.385650634765625, 12.823417663574219, 17.261184692382812, 21.698951721191406, 26.13671875, 30.574485778808594, 35.01225280761719, 39.45001983642578, 43.887786865234375, 48.32554626464844, 52.76331329345703, 57.201080322265625, 61.63884735107422, 66.07661437988281, 70.5143814086914, 74.9521484375, 79.3899154663086, 83.82768249511719, 88.26544952392578, 92.70321655273438, 97.14098358154297, 101.57875061035156, 106.01651763916016, 110.45428466796875, 114.89205169677734, 119.32981872558594, 123.76758575439453, 128.20535278320312, 132.64312744140625, 137.0808868408203, 141.51864624023438, 145.9564208984375, 150.39419555664062, 154.8319549560547, 159.26971435546875, 163.70748901367188, 168.145263671875, 172.58302307128906, 177.02078247070312, 181.45855712890625, 185.89633178710938, 190.33409118652344]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 8.0, 10.0, 11.0, 9.0, 17.0, 13.0, 19.0, 22.0, 18.0, 33.0, 31.0, 33.0, 36.0, 33.0, 52.0, 45.0, 58.0, 43.0, 52.0, 47.0, 58.0, 41.0, 37.0, 39.0, 36.0, 36.0, 19.0, 37.0, 30.0, 21.0, 10.0, 14.0, 10.0, 10.0, 3.0, 7.0, 3.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.352294921875, -83.84137725830078, -81.33045196533203, -78.81953430175781, -76.3086166381836, -73.79769897460938, -71.28677368164062, -68.7758560180664, -66.26493835449219, -63.7540168762207, -61.243099212646484, -58.732177734375, -56.22126007080078, -53.7103385925293, -51.19941711425781, -48.688499450683594, -46.17757797241211, -43.666656494140625, -41.155738830566406, -38.64481735229492, -36.1338996887207, -33.62297821044922, -31.112058639526367, -28.601139068603516, -26.090219497680664, -23.579299926757812, -21.06838035583496, -18.55746078491211, -16.046539306640625, -13.53562068939209, -11.024700164794922, -8.51378059387207, -6.002861022949219, -3.491941213607788, -0.9810214042663574, 1.5298986434936523, 4.040818214416504, 6.5517377853393555, 9.062658309936523, 11.573577880859375, 14.084497451782227, 16.595417022705078, 19.10633659362793, 21.61725616455078, 24.128177642822266, 26.639095306396484, 29.15001678466797, 31.66093635559082, 34.17185592651367, 36.682777404785156, 39.193695068359375, 41.70461654663086, 44.21553421020508, 46.72645568847656, 49.23737335205078, 51.748294830322266, 54.25921630859375, 56.770137786865234, 59.28105545043945, 61.79197692871094, 64.30289459228516, 66.81381225585938, 69.32473754882812, 71.83565521240234, 74.34657287597656]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 14.0, 22.0, 63.0, 150.0, 407.0, 1295.0, 7746.0, 4166541.0, 15292.0, 1912.0, 523.0, 189.0, 77.0, 33.0, 13.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-56.4375, -55.252685546875, -54.06787109375, -52.883056640625, -51.6982421875, -50.513427734375, -49.32861328125, -48.143798828125, -46.958984375, -45.774169921875, -44.58935546875, -43.404541015625, -42.2197265625, -41.034912109375, -39.85009765625, -38.665283203125, -37.48046875, -36.295654296875, -35.11083984375, -33.926025390625, -32.7412109375, -31.556396484375, -30.37158203125, -29.186767578125, -28.001953125, -26.817138671875, -25.63232421875, -24.447509765625, -23.2626953125, -22.077880859375, -20.89306640625, -19.708251953125, -18.5234375, -17.338623046875, -16.15380859375, -14.968994140625, -13.7841796875, -12.599365234375, -11.41455078125, -10.229736328125, -9.044921875, -7.860107421875, -6.67529296875, -5.490478515625, -4.3056640625, -3.120849609375, -1.93603515625, -0.751220703125, 0.43359375, 1.618408203125, 2.80322265625, 3.988037109375, 5.1728515625, 6.357666015625, 7.54248046875, 8.727294921875, 9.912109375, 11.096923828125, 12.28173828125, 13.466552734375, 14.6513671875, 15.836181640625, 17.02099609375, 18.205810546875, 19.390625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 7.0, 4.0, 5.0, 10.0, 9.0, 14.0, 27.0, 26.0, 35.0, 38.0, 53.0, 48.0, 59.0, 67.0, 69.0, 69.0, 75.0, 60.0, 58.0, 55.0, 53.0, 39.0, 28.0, 25.0, 24.0, 18.0, 15.0, 6.0, 6.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.03515625, -5.878173828125, -5.72119140625, -5.564208984375, -5.4072265625, -5.250244140625, -5.09326171875, -4.936279296875, -4.779296875, -4.622314453125, -4.46533203125, -4.308349609375, -4.1513671875, -3.994384765625, -3.83740234375, -3.680419921875, -3.5234375, -3.366455078125, -3.20947265625, -3.052490234375, -2.8955078125, -2.738525390625, -2.58154296875, -2.424560546875, -2.267578125, -2.110595703125, -1.95361328125, -1.796630859375, -1.6396484375, -1.482666015625, -1.32568359375, -1.168701171875, -1.01171875, -0.854736328125, -0.69775390625, -0.540771484375, -0.3837890625, -0.226806640625, -0.06982421875, 0.087158203125, 0.244140625, 0.401123046875, 0.55810546875, 0.715087890625, 0.8720703125, 1.029052734375, 1.18603515625, 1.343017578125, 1.5, 1.656982421875, 1.81396484375, 1.970947265625, 2.1279296875, 2.284912109375, 2.44189453125, 2.598876953125, 2.755859375, 2.912841796875, 3.06982421875, 3.226806640625, 3.3837890625, 3.540771484375, 3.69775390625, 3.854736328125, 4.01171875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 9.0, 9.0, 11.0, 17.0, 21.0, 33.0, 57.0, 64.0, 113.0, 135.0, 248.0, 356.0, 586.0, 1014.0, 1908.0, 4247.0, 13521.0, 4083685.0, 70529.0, 10332.0, 3483.0, 1601.0, 873.0, 512.0, 322.0, 195.0, 137.0, 88.0, 62.0, 36.0, 19.0, 21.0, 16.0, 7.0, 5.0, 6.0, 6.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.921875, -17.279541015625, -16.63720703125, -15.994873046875, -15.3525390625, -14.710205078125, -14.06787109375, -13.425537109375, -12.783203125, -12.140869140625, -11.49853515625, -10.856201171875, -10.2138671875, -9.571533203125, -8.92919921875, -8.286865234375, -7.64453125, -7.002197265625, -6.35986328125, -5.717529296875, -5.0751953125, -4.432861328125, -3.79052734375, -3.148193359375, -2.505859375, -1.863525390625, -1.22119140625, -0.578857421875, 0.0634765625, 0.705810546875, 1.34814453125, 1.990478515625, 2.6328125, 3.275146484375, 3.91748046875, 4.559814453125, 5.2021484375, 5.844482421875, 6.48681640625, 7.129150390625, 7.771484375, 8.413818359375, 9.05615234375, 9.698486328125, 10.3408203125, 10.983154296875, 11.62548828125, 12.267822265625, 12.91015625, 13.552490234375, 14.19482421875, 14.837158203125, 15.4794921875, 16.121826171875, 16.76416015625, 17.406494140625, 18.048828125, 18.691162109375, 19.33349609375, 19.975830078125, 20.6181640625, 21.260498046875, 21.90283203125, 22.545166015625, 23.1875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 3.0, 6.0, 6.0, 10.0, 13.0, 36.0, 3902.0, 43.0, 12.0, 9.0, 13.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.62109375, -5.482177734375, -5.34326171875, -5.204345703125, -5.0654296875, -4.926513671875, -4.78759765625, -4.648681640625, -4.509765625, -4.370849609375, -4.23193359375, -4.093017578125, -3.9541015625, -3.815185546875, -3.67626953125, -3.537353515625, -3.3984375, -3.259521484375, -3.12060546875, -2.981689453125, -2.8427734375, -2.703857421875, -2.56494140625, -2.426025390625, -2.287109375, -2.148193359375, -2.00927734375, -1.870361328125, -1.7314453125, -1.592529296875, -1.45361328125, -1.314697265625, -1.17578125, -1.036865234375, -0.89794921875, -0.759033203125, -0.6201171875, -0.481201171875, -0.34228515625, -0.203369140625, -0.064453125, 0.074462890625, 0.21337890625, 0.352294921875, 0.4912109375, 0.630126953125, 0.76904296875, 0.907958984375, 1.046875, 1.185791015625, 1.32470703125, 1.463623046875, 1.6025390625, 1.741455078125, 1.88037109375, 2.019287109375, 2.158203125, 2.297119140625, 2.43603515625, 2.574951171875, 2.7138671875, 2.852783203125, 2.99169921875, 3.130615234375, 3.26953125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 5.0, 16.0, 22.0, 49.0, 64.0, 151.0, 204.0, 202.0, 130.0, 85.0, 33.0, 26.0, 6.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-24.159090042114258, -23.636138916015625, -23.113189697265625, -22.590240478515625, -22.067289352416992, -21.54433822631836, -21.02138900756836, -20.49843978881836, -19.975488662719727, -19.452537536621094, -18.929588317871094, -18.406639099121094, -17.88368797302246, -17.360736846923828, -16.837787628173828, -16.314838409423828, -15.791887283325195, -15.268937110900879, -14.745986938476562, -14.223036766052246, -13.70008659362793, -13.177136421203613, -12.654186248779297, -12.13123607635498, -11.608285903930664, -11.085335731506348, -10.562385559082031, -10.039435386657715, -9.516485214233398, -8.993535041809082, -8.470584869384766, -7.947634696960449, -7.424686431884766, -6.901736259460449, -6.378786087036133, -5.855835914611816, -5.3328857421875, -4.809935569763184, -4.286985397338867, -3.764035224914551, -3.2410850524902344, -2.718134880065918, -2.1951847076416016, -1.6722345352172852, -1.1492843627929688, -0.6263341903686523, -0.10338401794433594, 0.41956615447998047, 0.9425163269042969, 1.4654664993286133, 1.9884166717529297, 2.511366844177246, 3.0343170166015625, 3.557267189025879, 4.080217361450195, 4.603167533874512, 5.126117706298828, 5.6490678787231445, 6.172018051147461, 6.694968223571777, 7.217918395996094, 7.74086856842041, 8.263818740844727, 8.786768913269043, 9.30971908569336]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 6.0, 12.0, 11.0, 11.0, 9.0, 9.0, 19.0, 12.0, 25.0, 24.0, 19.0, 27.0, 27.0, 33.0, 36.0, 31.0, 33.0, 30.0, 38.0, 42.0, 43.0, 57.0, 43.0, 35.0, 56.0, 35.0, 37.0, 30.0, 36.0, 28.0, 20.0, 23.0, 22.0, 9.0, 11.0, 16.0, 7.0, 9.0, 8.0, 12.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.569635391235352, -6.362862586975098, -6.1560893058776855, -5.949316024780273, -5.7425432205200195, -5.535770416259766, -5.3289971351623535, -5.122223854064941, -4.9154510498046875, -4.708678245544434, -4.5019049644470215, -4.295131683349609, -4.0883588790893555, -3.8815858364105225, -3.6748127937316895, -3.4680397510528564, -3.2612667083740234, -3.0544936656951904, -2.8477206230163574, -2.6409475803375244, -2.4341745376586914, -2.2274014949798584, -2.0206284523010254, -1.8138554096221924, -1.6070823669433594, -1.4003093242645264, -1.1935362815856934, -0.9867632389068604, -0.7799901962280273, -0.5732171535491943, -0.36644411087036133, -0.15967106819152832, 0.04710197448730469, 0.2538750171661377, 0.4606480598449707, 0.6674211025238037, 0.8741941452026367, 1.0809671878814697, 1.2877402305603027, 1.4945132732391357, 1.7012863159179688, 1.9080593585968018, 2.1148324012756348, 2.3216054439544678, 2.528378486633301, 2.735151529312134, 2.941924571990967, 3.1486976146698, 3.355470657348633, 3.562243700027466, 3.769016742706299, 3.975789785385132, 4.182562828063965, 4.389335632324219, 4.596108913421631, 4.802882194519043, 5.009654998779297, 5.216427803039551, 5.423201084136963, 5.629974365234375, 5.836747169494629, 6.043519973754883, 6.250293254852295, 6.457066535949707, 6.663839340209961]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 3.0, 5.0, 2.0, 9.0, 8.0, 16.0, 25.0, 38.0, 47.0, 86.0, 163.0, 264.0, 605.0, 1381.0, 3545.0, 11045.0, 37656.0, 148890.0, 544466.0, 224919.0, 52310.0, 14933.0, 4808.0, 1807.0, 737.0, 378.0, 147.0, 103.0, 53.0, 27.0, 28.0, 9.0, 9.0, 12.0, 5.0, 2.0, 5.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-15.265625, -14.848876953125, -14.43212890625, -14.015380859375, -13.5986328125, -13.181884765625, -12.76513671875, -12.348388671875, -11.931640625, -11.514892578125, -11.09814453125, -10.681396484375, -10.2646484375, -9.847900390625, -9.43115234375, -9.014404296875, -8.59765625, -8.180908203125, -7.76416015625, -7.347412109375, -6.9306640625, -6.513916015625, -6.09716796875, -5.680419921875, -5.263671875, -4.846923828125, -4.43017578125, -4.013427734375, -3.5966796875, -3.179931640625, -2.76318359375, -2.346435546875, -1.9296875, -1.512939453125, -1.09619140625, -0.679443359375, -0.2626953125, 0.154052734375, 0.57080078125, 0.987548828125, 1.404296875, 1.821044921875, 2.23779296875, 2.654541015625, 3.0712890625, 3.488037109375, 3.90478515625, 4.321533203125, 4.73828125, 5.155029296875, 5.57177734375, 5.988525390625, 6.4052734375, 6.822021484375, 7.23876953125, 7.655517578125, 8.072265625, 8.489013671875, 8.90576171875, 9.322509765625, 9.7392578125, 10.156005859375, 10.57275390625, 10.989501953125, 11.40625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 6.0, 8.0, 6.0, 5.0, 18.0, 13.0, 26.0, 25.0, 30.0, 45.0, 40.0, 57.0, 57.0, 60.0, 82.0, 60.0, 69.0, 65.0, 59.0, 54.0, 40.0, 46.0, 29.0, 25.0, 20.0, 19.0, 14.0, 9.0, 9.0, 5.0, 5.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.046875, -5.8857421875, -5.724609375, -5.5634765625, -5.40234375, -5.2412109375, -5.080078125, -4.9189453125, -4.7578125, -4.5966796875, -4.435546875, -4.2744140625, -4.11328125, -3.9521484375, -3.791015625, -3.6298828125, -3.46875, -3.3076171875, -3.146484375, -2.9853515625, -2.82421875, -2.6630859375, -2.501953125, -2.3408203125, -2.1796875, -2.0185546875, -1.857421875, -1.6962890625, -1.53515625, -1.3740234375, -1.212890625, -1.0517578125, -0.890625, -0.7294921875, -0.568359375, -0.4072265625, -0.24609375, -0.0849609375, 0.076171875, 0.2373046875, 0.3984375, 0.5595703125, 0.720703125, 0.8818359375, 1.04296875, 1.2041015625, 1.365234375, 1.5263671875, 1.6875, 1.8486328125, 2.009765625, 2.1708984375, 2.33203125, 2.4931640625, 2.654296875, 2.8154296875, 2.9765625, 3.1376953125, 3.298828125, 3.4599609375, 3.62109375, 3.7822265625, 3.943359375, 4.1044921875, 4.265625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 4.0, 4.0, 18.0, 11.0, 22.0, 26.0, 22.0, 41.0, 51.0, 81.0, 142.0, 232.0, 358.0, 766.0, 1620.0, 3622.0, 8962.0, 24052.0, 77622.0, 339822.0, 446252.0, 97534.0, 28687.0, 10571.0, 4238.0, 1819.0, 867.0, 401.0, 231.0, 151.0, 97.0, 81.0, 41.0, 25.0, 21.0, 20.0, 13.0, 4.0, 6.0, 5.0, 1.0, 2.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.7890625, -10.4049072265625, -10.020751953125, -9.6365966796875, -9.25244140625, -8.8682861328125, -8.484130859375, -8.0999755859375, -7.7158203125, -7.3316650390625, -6.947509765625, -6.5633544921875, -6.17919921875, -5.7950439453125, -5.410888671875, -5.0267333984375, -4.642578125, -4.2584228515625, -3.874267578125, -3.4901123046875, -3.10595703125, -2.7218017578125, -2.337646484375, -1.9534912109375, -1.5693359375, -1.1851806640625, -0.801025390625, -0.4168701171875, -0.03271484375, 0.3514404296875, 0.735595703125, 1.1197509765625, 1.50390625, 1.8880615234375, 2.272216796875, 2.6563720703125, 3.04052734375, 3.4246826171875, 3.808837890625, 4.1929931640625, 4.5771484375, 4.9613037109375, 5.345458984375, 5.7296142578125, 6.11376953125, 6.4979248046875, 6.882080078125, 7.2662353515625, 7.650390625, 8.0345458984375, 8.418701171875, 8.8028564453125, 9.18701171875, 9.5711669921875, 9.955322265625, 10.3394775390625, 10.7236328125, 11.1077880859375, 11.491943359375, 11.8760986328125, 12.26025390625, 12.6444091796875, 13.028564453125, 13.4127197265625, 13.796875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 5.0, 8.0, 14.0, 8.0, 24.0, 19.0, 24.0, 33.0, 36.0, 50.0, 60.0, 70.0, 63.0, 74.0, 65.0, 64.0, 70.0, 62.0, 45.0, 45.0, 44.0, 29.0, 22.0, 18.0, 17.0, 11.0, 9.0, 4.0, 8.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.4375, -32.563232421875, -31.68896484375, -30.814697265625, -29.9404296875, -29.066162109375, -28.19189453125, -27.317626953125, -26.443359375, -25.569091796875, -24.69482421875, -23.820556640625, -22.9462890625, -22.072021484375, -21.19775390625, -20.323486328125, -19.44921875, -18.574951171875, -17.70068359375, -16.826416015625, -15.9521484375, -15.077880859375, -14.20361328125, -13.329345703125, -12.455078125, -11.580810546875, -10.70654296875, -9.832275390625, -8.9580078125, -8.083740234375, -7.20947265625, -6.335205078125, -5.4609375, -4.586669921875, -3.71240234375, -2.838134765625, -1.9638671875, -1.089599609375, -0.21533203125, 0.658935546875, 1.533203125, 2.407470703125, 3.28173828125, 4.156005859375, 5.0302734375, 5.904541015625, 6.77880859375, 7.653076171875, 8.52734375, 9.401611328125, 10.27587890625, 11.150146484375, 12.0244140625, 12.898681640625, 13.77294921875, 14.647216796875, 15.521484375, 16.395751953125, 17.27001953125, 18.144287109375, 19.0185546875, 19.892822265625, 20.76708984375, 21.641357421875, 22.515625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 8.0, 10.0, 24.0, 33.0, 75.0, 145.0, 362.0, 1612.0, 43935.0, 997223.0, 4120.0, 594.0, 215.0, 109.0, 39.0, 33.0, 12.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-44.65625, -43.4228515625, -42.189453125, -40.9560546875, -39.72265625, -38.4892578125, -37.255859375, -36.0224609375, -34.7890625, -33.5556640625, -32.322265625, -31.0888671875, -29.85546875, -28.6220703125, -27.388671875, -26.1552734375, -24.921875, -23.6884765625, -22.455078125, -21.2216796875, -19.98828125, -18.7548828125, -17.521484375, -16.2880859375, -15.0546875, -13.8212890625, -12.587890625, -11.3544921875, -10.12109375, -8.8876953125, -7.654296875, -6.4208984375, -5.1875, -3.9541015625, -2.720703125, -1.4873046875, -0.25390625, 0.9794921875, 2.212890625, 3.4462890625, 4.6796875, 5.9130859375, 7.146484375, 8.3798828125, 9.61328125, 10.8466796875, 12.080078125, 13.3134765625, 14.546875, 15.7802734375, 17.013671875, 18.2470703125, 19.48046875, 20.7138671875, 21.947265625, 23.1806640625, 24.4140625, 25.6474609375, 26.880859375, 28.1142578125, 29.34765625, 30.5810546875, 31.814453125, 33.0478515625, 34.28125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 5.0, 4.0, 3.0, 12.0, 17.0, 20.0, 38.0, 74.0, 105.0, 155.0, 181.0, 146.0, 82.0, 69.0, 31.0, 30.0, 12.0, 7.0, 5.0, 2.0, 3.0, 0.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001255035400390625, -0.0012123733758926392, -0.0011697113513946533, -0.0011270493268966675, -0.0010843873023986816, -0.0010417252779006958, -0.00099906325340271, -0.0009564012289047241, -0.0009137392044067383, -0.0008710771799087524, -0.0008284151554107666, -0.0007857531309127808, -0.0007430911064147949, -0.0007004290819168091, -0.0006577670574188232, -0.0006151050329208374, -0.0005724430084228516, -0.0005297809839248657, -0.0004871189594268799, -0.00044445693492889404, -0.0004017949104309082, -0.00035913288593292236, -0.0003164708614349365, -0.0002738088369369507, -0.00023114681243896484, -0.000188484787940979, -0.00014582276344299316, -0.00010316073894500732, -6.0498714447021484e-05, -1.7836689949035645e-05, 2.4825334548950195e-05, 6.748735904693604e-05, 0.00011014938354492188, 0.00015281140804290771, 0.00019547343254089355, 0.0002381354570388794, 0.00028079748153686523, 0.0003234595060348511, 0.0003661215305328369, 0.00040878355503082275, 0.0004514455795288086, 0.0004941076040267944, 0.0005367696285247803, 0.0005794316530227661, 0.000622093677520752, 0.0006647557020187378, 0.0007074177265167236, 0.0007500797510147095, 0.0007927417755126953, 0.0008354038000106812, 0.000878065824508667, 0.0009207278490066528, 0.0009633898735046387, 0.0010060518980026245, 0.0010487139225006104, 0.0010913759469985962, 0.001134037971496582, 0.0011766999959945679, 0.0012193620204925537, 0.0012620240449905396, 0.0013046860694885254, 0.0013473480939865112, 0.001390010118484497, 0.001432672142982483, 0.0014753341674804688]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 4.0, 6.0, 12.0, 23.0, 30.0, 71.0, 128.0, 285.0, 658.0, 1895.0, 7112.0, 109791.0, 898789.0, 24060.0, 3676.0, 1198.0, 401.0, 191.0, 98.0, 57.0, 30.0, 14.0, 6.0, 5.0, 6.0, 1.0, 4.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.71875, -11.2891845703125, -10.859619140625, -10.4300537109375, -10.00048828125, -9.5709228515625, -9.141357421875, -8.7117919921875, -8.2822265625, -7.8526611328125, -7.423095703125, -6.9935302734375, -6.56396484375, -6.1343994140625, -5.704833984375, -5.2752685546875, -4.845703125, -4.4161376953125, -3.986572265625, -3.5570068359375, -3.12744140625, -2.6978759765625, -2.268310546875, -1.8387451171875, -1.4091796875, -0.9796142578125, -0.550048828125, -0.1204833984375, 0.30908203125, 0.7386474609375, 1.168212890625, 1.5977783203125, 2.02734375, 2.4569091796875, 2.886474609375, 3.3160400390625, 3.74560546875, 4.1751708984375, 4.604736328125, 5.0343017578125, 5.4638671875, 5.8934326171875, 6.322998046875, 6.7525634765625, 7.18212890625, 7.6116943359375, 8.041259765625, 8.4708251953125, 8.900390625, 9.3299560546875, 9.759521484375, 10.1890869140625, 10.61865234375, 11.0482177734375, 11.477783203125, 11.9073486328125, 12.3369140625, 12.7664794921875, 13.196044921875, 13.6256103515625, 14.05517578125, 14.4847412109375, 14.914306640625, 15.3438720703125, 15.7734375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 3.0, 3.0, 1.0, 3.0, 7.0, 0.0, 9.0, 22.0, 30.0, 73.0, 131.0, 322.0, 203.0, 94.0, 49.0, 26.0, 12.0, 7.0, 4.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.375, -15.823486328125, -15.27197265625, -14.720458984375, -14.1689453125, -13.617431640625, -13.06591796875, -12.514404296875, -11.962890625, -11.411376953125, -10.85986328125, -10.308349609375, -9.7568359375, -9.205322265625, -8.65380859375, -8.102294921875, -7.55078125, -6.999267578125, -6.44775390625, -5.896240234375, -5.3447265625, -4.793212890625, -4.24169921875, -3.690185546875, -3.138671875, -2.587158203125, -2.03564453125, -1.484130859375, -0.9326171875, -0.381103515625, 0.17041015625, 0.721923828125, 1.2734375, 1.824951171875, 2.37646484375, 2.927978515625, 3.4794921875, 4.031005859375, 4.58251953125, 5.134033203125, 5.685546875, 6.237060546875, 6.78857421875, 7.340087890625, 7.8916015625, 8.443115234375, 8.99462890625, 9.546142578125, 10.09765625, 10.649169921875, 11.20068359375, 11.752197265625, 12.3037109375, 12.855224609375, 13.40673828125, 13.958251953125, 14.509765625, 15.061279296875, 15.61279296875, 16.164306640625, 16.7158203125, 17.267333984375, 17.81884765625, 18.370361328125, 18.921875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 13.0, 21.0, 35.0, 68.0, 102.0, 157.0, 245.0, 158.0, 99.0, 55.0, 19.0, 19.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-95.37255859375, -89.57077026367188, -83.76897430419922, -77.96717834472656, -72.16539001464844, -66.36360168457031, -60.561805725097656, -54.760013580322266, -48.958221435546875, -43.156429290771484, -37.354637145996094, -31.552845001220703, -25.751052856445312, -19.949260711669922, -14.147468566894531, -8.34567642211914, -2.54388427734375, 3.2579078674316406, 9.059700012207031, 14.861492156982422, 20.663284301757812, 26.465076446533203, 32.266868591308594, 38.068660736083984, 43.870452880859375, 49.672245025634766, 55.474037170410156, 61.27582931518555, 67.07762145996094, 72.87940979003906, 78.68120574951172, 84.48300170898438, 90.2847900390625, 96.08657836914062, 101.88837432861328, 107.69017028808594, 113.49195861816406, 119.29374694824219, 125.09554290771484, 130.8973388671875, 136.69912719726562, 142.50091552734375, 148.30270385742188, 154.10450744628906, 159.9062957763672, 165.7080841064453, 171.5098876953125, 177.31167602539062, 183.11346435546875, 188.91525268554688, 194.717041015625, 200.5188446044922, 206.3206329345703, 212.12242126464844, 217.92422485351562, 223.72601318359375, 229.52780151367188, 235.32958984375, 241.13137817382812, 246.9331817626953, 252.73497009277344, 258.5367736816406, 264.33856201171875, 270.1403503417969, 275.942138671875]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 2.0, 6.0, 9.0, 16.0, 14.0, 18.0, 26.0, 28.0, 33.0, 41.0, 35.0, 44.0, 34.0, 37.0, 53.0, 52.0, 65.0, 57.0, 51.0, 54.0, 46.0, 45.0, 28.0, 31.0, 32.0, 28.0, 22.0, 20.0, 11.0, 15.0, 17.0, 7.0, 8.0, 1.0, 6.0, 2.0, 5.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.41399383544922, -75.10453033447266, -71.79507446289062, -68.48561096191406, -65.1761474609375, -61.86669158935547, -58.557228088378906, -55.24776840209961, -51.93830871582031, -48.628849029541016, -45.31938934326172, -42.009925842285156, -38.70046615600586, -35.39100646972656, -32.08154296875, -28.772083282470703, -25.462623596191406, -22.15316390991211, -18.84370231628418, -15.534241676330566, -12.224781036376953, -8.915321350097656, -5.605859756469727, -2.296398162841797, 1.0130615234375, 4.322522163391113, 7.631982803344727, 10.94144344329834, 14.250904083251953, 17.56036376953125, 20.86982536315918, 24.17928695678711, 27.488754272460938, 30.798213958740234, 34.10767364501953, 37.417137145996094, 40.72659683227539, 44.03605651855469, 47.34552001953125, 50.65497970581055, 53.964439392089844, 57.27389907836914, 60.58335876464844, 63.892822265625, 67.20228576660156, 70.5117416381836, 73.82120513916016, 77.13066101074219, 80.44012451171875, 83.74958801269531, 87.05904388427734, 90.3685073852539, 93.67796325683594, 96.9874267578125, 100.29689025878906, 103.60635375976562, 106.91580963134766, 110.22527313232422, 113.53472900390625, 116.84419250488281, 120.15365600585938, 123.4631118774414, 126.77257537841797, 130.08203125, 133.39149475097656]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 1.0, 6.0, 3.0, 6.0, 7.0, 15.0, 8.0, 18.0, 20.0, 52.0, 51.0, 81.0, 168.0, 285.0, 544.0, 1032.0, 2795.0, 13388.0, 4158380.0, 12482.0, 2736.0, 985.0, 447.0, 299.0, 184.0, 96.0, 65.0, 35.0, 33.0, 18.0, 12.0, 13.0, 7.0, 6.0, 2.0, 7.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.625, -25.829833984375, -25.03466796875, -24.239501953125, -23.4443359375, -22.649169921875, -21.85400390625, -21.058837890625, -20.263671875, -19.468505859375, -18.67333984375, -17.878173828125, -17.0830078125, -16.287841796875, -15.49267578125, -14.697509765625, -13.90234375, -13.107177734375, -12.31201171875, -11.516845703125, -10.7216796875, -9.926513671875, -9.13134765625, -8.336181640625, -7.541015625, -6.745849609375, -5.95068359375, -5.155517578125, -4.3603515625, -3.565185546875, -2.77001953125, -1.974853515625, -1.1796875, -0.384521484375, 0.41064453125, 1.205810546875, 2.0009765625, 2.796142578125, 3.59130859375, 4.386474609375, 5.181640625, 5.976806640625, 6.77197265625, 7.567138671875, 8.3623046875, 9.157470703125, 9.95263671875, 10.747802734375, 11.54296875, 12.338134765625, 13.13330078125, 13.928466796875, 14.7236328125, 15.518798828125, 16.31396484375, 17.109130859375, 17.904296875, 18.699462890625, 19.49462890625, 20.289794921875, 21.0849609375, 21.880126953125, 22.67529296875, 23.470458984375, 24.265625]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 3.0, 7.0, 9.0, 6.0, 13.0, 12.0, 10.0, 17.0, 23.0, 33.0, 32.0, 35.0, 49.0, 49.0, 63.0, 67.0, 72.0, 65.0, 52.0, 71.0, 54.0, 49.0, 39.0, 37.0, 22.0, 29.0, 21.0, 14.0, 13.0, 10.0, 4.0, 7.0, 7.0, 7.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-5.84375, -5.6768798828125, -5.510009765625, -5.3431396484375, -5.17626953125, -5.0093994140625, -4.842529296875, -4.6756591796875, -4.5087890625, -4.3419189453125, -4.175048828125, -4.0081787109375, -3.84130859375, -3.6744384765625, -3.507568359375, -3.3406982421875, -3.173828125, -3.0069580078125, -2.840087890625, -2.6732177734375, -2.50634765625, -2.3394775390625, -2.172607421875, -2.0057373046875, -1.8388671875, -1.6719970703125, -1.505126953125, -1.3382568359375, -1.17138671875, -1.0045166015625, -0.837646484375, -0.6707763671875, -0.50390625, -0.3370361328125, -0.170166015625, -0.0032958984375, 0.16357421875, 0.3304443359375, 0.497314453125, 0.6641845703125, 0.8310546875, 0.9979248046875, 1.164794921875, 1.3316650390625, 1.49853515625, 1.6654052734375, 1.832275390625, 1.9991455078125, 2.166015625, 2.3328857421875, 2.499755859375, 2.6666259765625, 2.83349609375, 3.0003662109375, 3.167236328125, 3.3341064453125, 3.5009765625, 3.6678466796875, 3.834716796875, 4.0015869140625, 4.16845703125, 4.3353271484375, 4.502197265625, 4.6690673828125, 4.8359375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 5.0, 2.0, 5.0, 12.0, 12.0, 9.0, 12.0, 23.0, 36.0, 47.0, 86.0, 86.0, 129.0, 230.0, 363.0, 569.0, 1041.0, 1923.0, 4433.0, 15875.0, 4120293.0, 36099.0, 7071.0, 2617.0, 1319.0, 734.0, 412.0, 295.0, 159.0, 102.0, 91.0, 45.0, 32.0, 37.0, 20.0, 12.0, 7.0, 7.0, 12.0, 13.0, 3.0, 1.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-24.234375, -23.418701171875, -22.60302734375, -21.787353515625, -20.9716796875, -20.156005859375, -19.34033203125, -18.524658203125, -17.708984375, -16.893310546875, -16.07763671875, -15.261962890625, -14.4462890625, -13.630615234375, -12.81494140625, -11.999267578125, -11.18359375, -10.367919921875, -9.55224609375, -8.736572265625, -7.9208984375, -7.105224609375, -6.28955078125, -5.473876953125, -4.658203125, -3.842529296875, -3.02685546875, -2.211181640625, -1.3955078125, -0.579833984375, 0.23583984375, 1.051513671875, 1.8671875, 2.682861328125, 3.49853515625, 4.314208984375, 5.1298828125, 5.945556640625, 6.76123046875, 7.576904296875, 8.392578125, 9.208251953125, 10.02392578125, 10.839599609375, 11.6552734375, 12.470947265625, 13.28662109375, 14.102294921875, 14.91796875, 15.733642578125, 16.54931640625, 17.364990234375, 18.1806640625, 18.996337890625, 19.81201171875, 20.627685546875, 21.443359375, 22.259033203125, 23.07470703125, 23.890380859375, 24.7060546875, 25.521728515625, 26.33740234375, 27.153076171875, 27.96875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 9.0, 13.0, 17.0, 203.0, 3760.0, 21.0, 13.0, 14.0, 6.0, 1.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.9453125, -6.72174072265625, -6.4981689453125, -6.27459716796875, -6.051025390625, -5.82745361328125, -5.6038818359375, -5.38031005859375, -5.15673828125, -4.93316650390625, -4.7095947265625, -4.48602294921875, -4.262451171875, -4.03887939453125, -3.8153076171875, -3.59173583984375, -3.3681640625, -3.14459228515625, -2.9210205078125, -2.69744873046875, -2.473876953125, -2.25030517578125, -2.0267333984375, -1.80316162109375, -1.57958984375, -1.35601806640625, -1.1324462890625, -0.90887451171875, -0.685302734375, -0.46173095703125, -0.2381591796875, -0.01458740234375, 0.208984375, 0.43255615234375, 0.6561279296875, 0.87969970703125, 1.103271484375, 1.32684326171875, 1.5504150390625, 1.77398681640625, 1.99755859375, 2.22113037109375, 2.4447021484375, 2.66827392578125, 2.891845703125, 3.11541748046875, 3.3389892578125, 3.56256103515625, 3.7861328125, 4.00970458984375, 4.2332763671875, 4.45684814453125, 4.680419921875, 4.90399169921875, 5.1275634765625, 5.35113525390625, 5.57470703125, 5.79827880859375, 6.0218505859375, 6.24542236328125, 6.468994140625, 6.69256591796875, 6.9161376953125, 7.13970947265625, 7.36328125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 6.0, 10.0, 20.0, 62.0, 115.0, 243.0, 243.0, 133.0, 84.0, 39.0, 23.0, 13.0, 6.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.189288139343262, -13.073980331420898, -11.958673477172852, -10.843366622924805, -9.728058815002441, -8.612751007080078, -7.497444152832031, -6.382136821746826, -5.266829490661621, -4.151522159576416, -3.036214828491211, -1.9209074974060059, -0.8056001663208008, 0.3097071647644043, 1.4250144958496094, 2.5403218269348145, 3.6556291580200195, 4.770936489105225, 5.88624382019043, 7.001551151275635, 8.11685848236084, 9.232166290283203, 10.34747314453125, 11.462779998779297, 12.57808780670166, 13.693395614624023, 14.80870246887207, 15.924009323120117, 17.039318084716797, 18.154624938964844, 19.26993179321289, 20.385238647460938, 21.50054931640625, 22.615856170654297, 23.731163024902344, 24.846471786499023, 25.96177864074707, 27.077085494995117, 28.192394256591797, 29.307701110839844, 30.42300796508789, 31.538314819335938, 32.653621673583984, 33.76892852783203, 34.884239196777344, 35.99954605102539, 37.11485290527344, 38.230159759521484, 39.34546661376953, 40.46077346801758, 41.576080322265625, 42.69138717651367, 43.80669403076172, 44.92200469970703, 46.03731155395508, 47.152618408203125, 48.26792526245117, 49.38323211669922, 50.498538970947266, 51.61384582519531, 52.729156494140625, 53.84446334838867, 54.95977020263672, 56.075077056884766, 57.19038391113281]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 7.0, 8.0, 5.0, 8.0, 7.0, 13.0, 10.0, 7.0, 14.0, 13.0, 16.0, 13.0, 23.0, 19.0, 27.0, 23.0, 37.0, 41.0, 33.0, 39.0, 28.0, 25.0, 37.0, 42.0, 35.0, 35.0, 35.0, 39.0, 37.0, 29.0, 38.0, 37.0, 26.0, 30.0, 24.0, 26.0, 21.0, 12.0, 12.0, 11.0, 16.0, 3.0, 13.0, 7.0, 6.0, 7.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-9.801961898803711, -9.484550476074219, -9.167140007019043, -8.849729537963867, -8.532318115234375, -8.214906692504883, -7.897496223449707, -7.580085277557373, -7.262674331665039, -6.945263385772705, -6.627852439880371, -6.310441493988037, -5.993030548095703, -5.675619602203369, -5.358208656311035, -5.040797710418701, -4.723386764526367, -4.405975818634033, -4.088564872741699, -3.7711539268493652, -3.4537429809570312, -3.1363320350646973, -2.8189210891723633, -2.5015101432800293, -2.1840991973876953, -1.8666882514953613, -1.5492773056030273, -1.2318663597106934, -0.9144554138183594, -0.5970444679260254, -0.2796335220336914, 0.03777742385864258, 0.35518741607666016, 0.6725983619689941, 0.9900093078613281, 1.307420253753662, 1.624831199645996, 1.94224214553833, 2.259653091430664, 2.577064037322998, 2.894474983215332, 3.211885929107666, 3.529296875, 3.846707820892334, 4.164118766784668, 4.481529712677002, 4.798940658569336, 5.11635160446167, 5.433762550354004, 5.751173496246338, 6.068584442138672, 6.385995388031006, 6.70340633392334, 7.020817279815674, 7.338228225708008, 7.655639171600342, 7.973050117492676, 8.290460586547852, 8.607872009277344, 8.925283432006836, 9.242693901062012, 9.560104370117188, 9.87751579284668, 10.194927215576172, 10.512337684631348]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 7.0, 10.0, 16.0, 19.0, 28.0, 49.0, 100.0, 108.0, 160.0, 265.0, 491.0, 843.0, 1532.0, 2935.0, 6039.0, 13601.0, 34496.0, 101125.0, 353538.0, 365539.0, 105056.0, 35456.0, 14105.0, 6291.0, 2978.0, 1588.0, 854.0, 514.0, 309.0, 184.0, 92.0, 91.0, 41.0, 27.0, 30.0, 12.0, 9.0, 12.0, 4.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.109375, -9.7725830078125, -9.435791015625, -9.0989990234375, -8.76220703125, -8.4254150390625, -8.088623046875, -7.7518310546875, -7.4150390625, -7.0782470703125, -6.741455078125, -6.4046630859375, -6.06787109375, -5.7310791015625, -5.394287109375, -5.0574951171875, -4.720703125, -4.3839111328125, -4.047119140625, -3.7103271484375, -3.37353515625, -3.0367431640625, -2.699951171875, -2.3631591796875, -2.0263671875, -1.6895751953125, -1.352783203125, -1.0159912109375, -0.67919921875, -0.3424072265625, -0.005615234375, 0.3311767578125, 0.66796875, 1.0047607421875, 1.341552734375, 1.6783447265625, 2.01513671875, 2.3519287109375, 2.688720703125, 3.0255126953125, 3.3623046875, 3.6990966796875, 4.035888671875, 4.3726806640625, 4.70947265625, 5.0462646484375, 5.383056640625, 5.7198486328125, 6.056640625, 6.3934326171875, 6.730224609375, 7.0670166015625, 7.40380859375, 7.7406005859375, 8.077392578125, 8.4141845703125, 8.7509765625, 9.0877685546875, 9.424560546875, 9.7613525390625, 10.09814453125, 10.4349365234375, 10.771728515625, 11.1085205078125, 11.4453125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 6.0, 8.0, 9.0, 8.0, 12.0, 11.0, 15.0, 26.0, 21.0, 24.0, 44.0, 41.0, 41.0, 53.0, 37.0, 63.0, 58.0, 63.0, 60.0, 73.0, 52.0, 45.0, 40.0, 31.0, 39.0, 23.0, 22.0, 23.0, 16.0, 4.0, 6.0, 9.0, 5.0, 6.0, 4.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.703125, -5.53594970703125, -5.3687744140625, -5.20159912109375, -5.034423828125, -4.86724853515625, -4.7000732421875, -4.53289794921875, -4.36572265625, -4.19854736328125, -4.0313720703125, -3.86419677734375, -3.697021484375, -3.52984619140625, -3.3626708984375, -3.19549560546875, -3.0283203125, -2.86114501953125, -2.6939697265625, -2.52679443359375, -2.359619140625, -2.19244384765625, -2.0252685546875, -1.85809326171875, -1.69091796875, -1.52374267578125, -1.3565673828125, -1.18939208984375, -1.022216796875, -0.85504150390625, -0.6878662109375, -0.52069091796875, -0.353515625, -0.18634033203125, -0.0191650390625, 0.14801025390625, 0.315185546875, 0.48236083984375, 0.6495361328125, 0.81671142578125, 0.98388671875, 1.15106201171875, 1.3182373046875, 1.48541259765625, 1.652587890625, 1.81976318359375, 1.9869384765625, 2.15411376953125, 2.3212890625, 2.48846435546875, 2.6556396484375, 2.82281494140625, 2.989990234375, 3.15716552734375, 3.3243408203125, 3.49151611328125, 3.65869140625, 3.82586669921875, 3.9930419921875, 4.16021728515625, 4.327392578125, 4.49456787109375, 4.6617431640625, 4.82891845703125, 4.99609375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 7.0, 2.0, 8.0, 3.0, 11.0, 11.0, 9.0, 17.0, 25.0, 30.0, 51.0, 85.0, 108.0, 180.0, 253.0, 457.0, 762.0, 1438.0, 2606.0, 5443.0, 13380.0, 39346.0, 174861.0, 623320.0, 131816.0, 32641.0, 11262.0, 5095.0, 2303.0, 1212.0, 684.0, 407.0, 264.0, 150.0, 105.0, 72.0, 46.0, 33.0, 21.0, 9.0, 10.0, 6.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-15.4453125, -14.9537353515625, -14.462158203125, -13.9705810546875, -13.47900390625, -12.9874267578125, -12.495849609375, -12.0042724609375, -11.5126953125, -11.0211181640625, -10.529541015625, -10.0379638671875, -9.54638671875, -9.0548095703125, -8.563232421875, -8.0716552734375, -7.580078125, -7.0885009765625, -6.596923828125, -6.1053466796875, -5.61376953125, -5.1221923828125, -4.630615234375, -4.1390380859375, -3.6474609375, -3.1558837890625, -2.664306640625, -2.1727294921875, -1.68115234375, -1.1895751953125, -0.697998046875, -0.2064208984375, 0.28515625, 0.7767333984375, 1.268310546875, 1.7598876953125, 2.25146484375, 2.7430419921875, 3.234619140625, 3.7261962890625, 4.2177734375, 4.7093505859375, 5.200927734375, 5.6925048828125, 6.18408203125, 6.6756591796875, 7.167236328125, 7.6588134765625, 8.150390625, 8.6419677734375, 9.133544921875, 9.6251220703125, 10.11669921875, 10.6082763671875, 11.099853515625, 11.5914306640625, 12.0830078125, 12.5745849609375, 13.066162109375, 13.5577392578125, 14.04931640625, 14.5408935546875, 15.032470703125, 15.5240478515625, 16.015625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 5.0, 1.0, 2.0, 5.0, 3.0, 1.0, 5.0, 8.0, 5.0, 9.0, 21.0, 16.0, 22.0, 25.0, 34.0, 40.0, 49.0, 52.0, 47.0, 47.0, 74.0, 72.0, 71.0, 59.0, 50.0, 55.0, 40.0, 42.0, 34.0, 23.0, 26.0, 18.0, 13.0, 9.0, 12.0, 7.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.9375, -26.025634765625, -25.11376953125, -24.201904296875, -23.2900390625, -22.378173828125, -21.46630859375, -20.554443359375, -19.642578125, -18.730712890625, -17.81884765625, -16.906982421875, -15.9951171875, -15.083251953125, -14.17138671875, -13.259521484375, -12.34765625, -11.435791015625, -10.52392578125, -9.612060546875, -8.7001953125, -7.788330078125, -6.87646484375, -5.964599609375, -5.052734375, -4.140869140625, -3.22900390625, -2.317138671875, -1.4052734375, -0.493408203125, 0.41845703125, 1.330322265625, 2.2421875, 3.154052734375, 4.06591796875, 4.977783203125, 5.8896484375, 6.801513671875, 7.71337890625, 8.625244140625, 9.537109375, 10.448974609375, 11.36083984375, 12.272705078125, 13.1845703125, 14.096435546875, 15.00830078125, 15.920166015625, 16.83203125, 17.743896484375, 18.65576171875, 19.567626953125, 20.4794921875, 21.391357421875, 22.30322265625, 23.215087890625, 24.126953125, 25.038818359375, 25.95068359375, 26.862548828125, 27.7744140625, 28.686279296875, 29.59814453125, 30.510009765625, 31.421875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 7.0, 4.0, 22.0, 18.0, 26.0, 47.0, 90.0, 176.0, 324.0, 705.0, 1906.0, 7021.0, 50293.0, 861035.0, 111485.0, 10985.0, 2625.0, 938.0, 401.0, 180.0, 116.0, 64.0, 36.0, 21.0, 13.0, 9.0, 3.0, 7.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.1796875, -13.7012939453125, -13.222900390625, -12.7445068359375, -12.26611328125, -11.7877197265625, -11.309326171875, -10.8309326171875, -10.3525390625, -9.8741455078125, -9.395751953125, -8.9173583984375, -8.43896484375, -7.9605712890625, -7.482177734375, -7.0037841796875, -6.525390625, -6.0469970703125, -5.568603515625, -5.0902099609375, -4.61181640625, -4.1334228515625, -3.655029296875, -3.1766357421875, -2.6982421875, -2.2198486328125, -1.741455078125, -1.2630615234375, -0.78466796875, -0.3062744140625, 0.172119140625, 0.6505126953125, 1.12890625, 1.6072998046875, 2.085693359375, 2.5640869140625, 3.04248046875, 3.5208740234375, 3.999267578125, 4.4776611328125, 4.9560546875, 5.4344482421875, 5.912841796875, 6.3912353515625, 6.86962890625, 7.3480224609375, 7.826416015625, 8.3048095703125, 8.783203125, 9.2615966796875, 9.739990234375, 10.2183837890625, 10.69677734375, 11.1751708984375, 11.653564453125, 12.1319580078125, 12.6103515625, 13.0887451171875, 13.567138671875, 14.0455322265625, 14.52392578125, 15.0023193359375, 15.480712890625, 15.9591064453125, 16.4375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 7.0, 10.0, 11.0, 7.0, 15.0, 17.0, 21.0, 25.0, 35.0, 58.0, 78.0, 117.0, 151.0, 123.0, 93.0, 58.0, 54.0, 30.0, 19.0, 15.0, 10.0, 12.0, 6.0, 8.0, 4.0, 2.0, 5.0, 2.0, 1.0, 2.0, 5.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0013456344604492188, -0.0013079643249511719, -0.001270294189453125, -0.0012326240539550781, -0.0011949539184570312, -0.0011572837829589844, -0.0011196136474609375, -0.0010819435119628906, -0.0010442733764648438, -0.0010066032409667969, -0.00096893310546875, -0.0009312629699707031, -0.0008935928344726562, -0.0008559226989746094, -0.0008182525634765625, -0.0007805824279785156, -0.0007429122924804688, -0.0007052421569824219, -0.000667572021484375, -0.0006299018859863281, -0.0005922317504882812, -0.0005545616149902344, -0.0005168914794921875, -0.0004792213439941406, -0.00044155120849609375, -0.0004038810729980469, -0.0003662109375, -0.0003285408020019531, -0.00029087066650390625, -0.0002532005310058594, -0.0002155303955078125, -0.00017786026000976562, -0.00014019012451171875, -0.00010251998901367188, -6.4849853515625e-05, -2.7179718017578125e-05, 1.049041748046875e-05, 4.8160552978515625e-05, 8.58306884765625e-05, 0.00012350082397460938, 0.00016117095947265625, 0.00019884109497070312, 0.00023651123046875, 0.0002741813659667969, 0.00031185150146484375, 0.0003495216369628906, 0.0003871917724609375, 0.0004248619079589844, 0.00046253204345703125, 0.0005002021789550781, 0.000537872314453125, 0.0005755424499511719, 0.0006132125854492188, 0.0006508827209472656, 0.0006885528564453125, 0.0007262229919433594, 0.0007638931274414062, 0.0008015632629394531, 0.0008392333984375, 0.0008769035339355469, 0.0009145736694335938, 0.0009522438049316406, 0.0009899139404296875, 0.0010275840759277344, 0.0010652542114257812]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 4.0, 4.0, 5.0, 11.0, 35.0, 42.0, 81.0, 267.0, 769.0, 3816.0, 48522.0, 958708.0, 32211.0, 2986.0, 698.0, 218.0, 87.0, 47.0, 26.0, 12.0, 9.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.125, -32.28515625, -31.4453125, -30.60546875, -29.765625, -28.92578125, -28.0859375, -27.24609375, -26.40625, -25.56640625, -24.7265625, -23.88671875, -23.046875, -22.20703125, -21.3671875, -20.52734375, -19.6875, -18.84765625, -18.0078125, -17.16796875, -16.328125, -15.48828125, -14.6484375, -13.80859375, -12.96875, -12.12890625, -11.2890625, -10.44921875, -9.609375, -8.76953125, -7.9296875, -7.08984375, -6.25, -5.41015625, -4.5703125, -3.73046875, -2.890625, -2.05078125, -1.2109375, -0.37109375, 0.46875, 1.30859375, 2.1484375, 2.98828125, 3.828125, 4.66796875, 5.5078125, 6.34765625, 7.1875, 8.02734375, 8.8671875, 9.70703125, 10.546875, 11.38671875, 12.2265625, 13.06640625, 13.90625, 14.74609375, 15.5859375, 16.42578125, 17.265625, 18.10546875, 18.9453125, 19.78515625, 20.625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 5.0, 3.0, 5.0, 7.0, 8.0, 10.0, 13.0, 21.0, 25.0, 33.0, 44.0, 66.0, 114.0, 131.0, 141.0, 113.0, 88.0, 58.0, 33.0, 20.0, 17.0, 10.0, 10.0, 7.0, 8.0, 4.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.0546875, -9.6995849609375, -9.344482421875, -8.9893798828125, -8.63427734375, -8.2791748046875, -7.924072265625, -7.5689697265625, -7.2138671875, -6.8587646484375, -6.503662109375, -6.1485595703125, -5.79345703125, -5.4383544921875, -5.083251953125, -4.7281494140625, -4.373046875, -4.0179443359375, -3.662841796875, -3.3077392578125, -2.95263671875, -2.5975341796875, -2.242431640625, -1.8873291015625, -1.5322265625, -1.1771240234375, -0.822021484375, -0.4669189453125, -0.11181640625, 0.2432861328125, 0.598388671875, 0.9534912109375, 1.30859375, 1.6636962890625, 2.018798828125, 2.3739013671875, 2.72900390625, 3.0841064453125, 3.439208984375, 3.7943115234375, 4.1494140625, 4.5045166015625, 4.859619140625, 5.2147216796875, 5.56982421875, 5.9249267578125, 6.280029296875, 6.6351318359375, 6.990234375, 7.3453369140625, 7.700439453125, 8.0555419921875, 8.41064453125, 8.7657470703125, 9.120849609375, 9.4759521484375, 9.8310546875, 10.1861572265625, 10.541259765625, 10.8963623046875, 11.25146484375, 11.6065673828125, 11.961669921875, 12.3167724609375, 12.671875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 6.0, 9.0, 19.0, 38.0, 91.0, 213.0, 323.0, 184.0, 77.0, 30.0, 16.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-159.25106811523438, -149.0913848876953, -138.9317169189453, -128.77203369140625, -118.61235809326172, -108.45268249511719, -98.29299926757812, -88.1333236694336, -77.97364807128906, -67.81397247314453, -57.654293060302734, -47.49461364746094, -37.334938049316406, -27.175262451171875, -17.015583038330078, -6.855903625488281, 3.30377197265625, 13.463449478149414, 23.623126983642578, 33.782806396484375, 43.942481994628906, 54.10215759277344, 64.2618408203125, 74.42151641845703, 84.58119201660156, 94.7408676147461, 104.90054321289062, 115.06022644042969, 125.21990203857422, 135.37957763671875, 145.5392608642578, 155.69894409179688, 165.858642578125, 176.01832580566406, 186.17799377441406, 196.33767700195312, 206.49734497070312, 216.6570281982422, 226.81671142578125, 236.97637939453125, 247.1360626220703, 257.2957458496094, 267.4554138183594, 277.6150817871094, 287.7747802734375, 297.9344482421875, 308.0941162109375, 318.2538146972656, 328.4134826660156, 338.5731506347656, 348.73284912109375, 358.89251708984375, 369.05218505859375, 379.21185302734375, 389.3715515136719, 399.5312194824219, 409.69091796875, 419.8505859375, 430.0102844238281, 440.1699523925781, 450.3296203613281, 460.48931884765625, 470.64898681640625, 480.80865478515625, 490.96832275390625]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0, 6.0, 9.0, 5.0, 5.0, 9.0, 8.0, 12.0, 12.0, 11.0, 17.0, 19.0, 24.0, 26.0, 31.0, 41.0, 44.0, 48.0, 46.0, 51.0, 60.0, 57.0, 51.0, 46.0, 47.0, 42.0, 52.0, 26.0, 33.0, 22.0, 23.0, 25.0, 21.0, 14.0, 19.0, 7.0, 5.0, 7.0, 10.0, 5.0, 0.0, 6.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-126.72867584228516, -123.26766967773438, -119.8066635131836, -116.34565734863281, -112.88465118408203, -109.42364501953125, -105.96263885498047, -102.50163269042969, -99.0406265258789, -95.57962036132812, -92.11861419677734, -88.65760803222656, -85.19660186767578, -81.735595703125, -78.27458953857422, -74.81358337402344, -71.35256958007812, -67.89156341552734, -64.43055725097656, -60.96955108642578, -57.508544921875, -54.04753875732422, -50.58653259277344, -47.125526428222656, -43.664520263671875, -40.203514099121094, -36.74250793457031, -33.28150177001953, -29.82049560546875, -26.359487533569336, -22.898481369018555, -19.437475204467773, -15.976470947265625, -12.515464782714844, -9.054458618164062, -5.593451499938965, -2.1324453353881836, 1.328561782836914, 4.789567947387695, 8.250574111938477, 11.711580276489258, 15.172586441040039, 18.63359260559082, 22.094600677490234, 25.555606842041016, 29.016613006591797, 32.47761917114258, 35.93862533569336, 39.39963150024414, 42.86063766479492, 46.3216438293457, 49.782649993896484, 53.243656158447266, 56.70466613769531, 60.165672302246094, 63.626678466796875, 67.08768463134766, 70.54869079589844, 74.00969696044922, 77.470703125, 80.93170928955078, 84.39271545410156, 87.85372161865234, 91.31472778320312, 94.7757339477539]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 6.0, 2.0, 5.0, 9.0, 8.0, 14.0, 15.0, 13.0, 35.0, 40.0, 53.0, 85.0, 114.0, 170.0, 302.0, 521.0, 1129.0, 12230.0, 4176369.0, 1612.0, 557.0, 342.0, 203.0, 119.0, 85.0, 68.0, 35.0, 52.0, 33.0, 6.0, 17.0, 8.0, 6.0, 9.0, 3.0, 3.0, 2.0, 0.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-54.09375, -52.4609375, -50.828125, -49.1953125, -47.5625, -45.9296875, -44.296875, -42.6640625, -41.03125, -39.3984375, -37.765625, -36.1328125, -34.5, -32.8671875, -31.234375, -29.6015625, -27.96875, -26.3359375, -24.703125, -23.0703125, -21.4375, -19.8046875, -18.171875, -16.5390625, -14.90625, -13.2734375, -11.640625, -10.0078125, -8.375, -6.7421875, -5.109375, -3.4765625, -1.84375, -0.2109375, 1.421875, 3.0546875, 4.6875, 6.3203125, 7.953125, 9.5859375, 11.21875, 12.8515625, 14.484375, 16.1171875, 17.75, 19.3828125, 21.015625, 22.6484375, 24.28125, 25.9140625, 27.546875, 29.1796875, 30.8125, 32.4453125, 34.078125, 35.7109375, 37.34375, 38.9765625, 40.609375, 42.2421875, 43.875, 45.5078125, 47.140625, 48.7734375, 50.40625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 9.0, 5.0, 9.0, 13.0, 19.0, 14.0, 10.0, 22.0, 25.0, 27.0, 33.0, 33.0, 39.0, 41.0, 73.0, 52.0, 67.0, 66.0, 56.0, 51.0, 52.0, 51.0, 35.0, 32.0, 33.0, 25.0, 21.0, 17.0, 12.0, 8.0, 9.0, 10.0, 4.0, 6.0, 7.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-6.07421875, -5.89483642578125, -5.7154541015625, -5.53607177734375, -5.356689453125, -5.17730712890625, -4.9979248046875, -4.81854248046875, -4.63916015625, -4.45977783203125, -4.2803955078125, -4.10101318359375, -3.921630859375, -3.74224853515625, -3.5628662109375, -3.38348388671875, -3.2041015625, -3.02471923828125, -2.8453369140625, -2.66595458984375, -2.486572265625, -2.30718994140625, -2.1278076171875, -1.94842529296875, -1.76904296875, -1.58966064453125, -1.4102783203125, -1.23089599609375, -1.051513671875, -0.87213134765625, -0.6927490234375, -0.51336669921875, -0.333984375, -0.15460205078125, 0.0247802734375, 0.20416259765625, 0.383544921875, 0.56292724609375, 0.7423095703125, 0.92169189453125, 1.10107421875, 1.28045654296875, 1.4598388671875, 1.63922119140625, 1.818603515625, 1.99798583984375, 2.1773681640625, 2.35675048828125, 2.5361328125, 2.71551513671875, 2.8948974609375, 3.07427978515625, 3.253662109375, 3.43304443359375, 3.6124267578125, 3.79180908203125, 3.97119140625, 4.15057373046875, 4.3299560546875, 4.50933837890625, 4.688720703125, 4.86810302734375, 5.0474853515625, 5.22686767578125, 5.40625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 5.0, 8.0, 6.0, 5.0, 14.0, 30.0, 38.0, 46.0, 71.0, 95.0, 130.0, 194.0, 288.0, 417.0, 670.0, 1195.0, 2714.0, 8967.0, 4160672.0, 11893.0, 3272.0, 1437.0, 689.0, 425.0, 304.0, 213.0, 140.0, 106.0, 56.0, 59.0, 34.0, 24.0, 13.0, 21.0, 6.0, 7.0, 4.0, 7.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.71875, -32.6162109375, -31.513671875, -30.4111328125, -29.30859375, -28.2060546875, -27.103515625, -26.0009765625, -24.8984375, -23.7958984375, -22.693359375, -21.5908203125, -20.48828125, -19.3857421875, -18.283203125, -17.1806640625, -16.078125, -14.9755859375, -13.873046875, -12.7705078125, -11.66796875, -10.5654296875, -9.462890625, -8.3603515625, -7.2578125, -6.1552734375, -5.052734375, -3.9501953125, -2.84765625, -1.7451171875, -0.642578125, 0.4599609375, 1.5625, 2.6650390625, 3.767578125, 4.8701171875, 5.97265625, 7.0751953125, 8.177734375, 9.2802734375, 10.3828125, 11.4853515625, 12.587890625, 13.6904296875, 14.79296875, 15.8955078125, 16.998046875, 18.1005859375, 19.203125, 20.3056640625, 21.408203125, 22.5107421875, 23.61328125, 24.7158203125, 25.818359375, 26.9208984375, 28.0234375, 29.1259765625, 30.228515625, 31.3310546875, 32.43359375, 33.5361328125, 34.638671875, 35.7412109375, 36.84375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 7.0, 9.0, 3900.0, 135.0, 8.0, 4.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.03125, -9.73583984375, -9.4404296875, -9.14501953125, -8.849609375, -8.55419921875, -8.2587890625, -7.96337890625, -7.66796875, -7.37255859375, -7.0771484375, -6.78173828125, -6.486328125, -6.19091796875, -5.8955078125, -5.60009765625, -5.3046875, -5.00927734375, -4.7138671875, -4.41845703125, -4.123046875, -3.82763671875, -3.5322265625, -3.23681640625, -2.94140625, -2.64599609375, -2.3505859375, -2.05517578125, -1.759765625, -1.46435546875, -1.1689453125, -0.87353515625, -0.578125, -0.28271484375, 0.0126953125, 0.30810546875, 0.603515625, 0.89892578125, 1.1943359375, 1.48974609375, 1.78515625, 2.08056640625, 2.3759765625, 2.67138671875, 2.966796875, 3.26220703125, 3.5576171875, 3.85302734375, 4.1484375, 4.44384765625, 4.7392578125, 5.03466796875, 5.330078125, 5.62548828125, 5.9208984375, 6.21630859375, 6.51171875, 6.80712890625, 7.1025390625, 7.39794921875, 7.693359375, 7.98876953125, 8.2841796875, 8.57958984375, 8.875]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 5.0, 12.0, 25.0, 44.0, 95.0, 175.0, 193.0, 185.0, 119.0, 49.0, 41.0, 22.0, 14.0, 10.0, 6.0, 6.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.10572624206543, -29.258777618408203, -28.41183090209961, -27.564882278442383, -26.717933654785156, -25.870986938476562, -25.024038314819336, -24.17708969116211, -23.330141067504883, -22.483192443847656, -21.636245727539062, -20.789297103881836, -19.94234848022461, -19.095401763916016, -18.24845314025879, -17.401504516601562, -16.55455780029297, -15.707610130310059, -14.860661506652832, -14.013713836669922, -13.166765213012695, -12.319817543029785, -11.472869873046875, -10.625921249389648, -9.778972625732422, -8.932024955749512, -8.085076332092285, -7.238128662109375, -6.391180038452148, -5.544232368469238, -4.69728422164917, -3.8503360748291016, -3.003387451171875, -2.1564393043518066, -1.3094912767410278, -0.462543249130249, 0.38440489768981934, 1.2313528060913086, 2.078300952911377, 2.9252490997314453, 3.7721972465515137, 4.619145393371582, 5.46609354019165, 6.313041687011719, 7.159989356994629, 8.006937026977539, 8.853885650634766, 9.700834274291992, 10.547781944274902, 11.394729614257812, 12.241678237915039, 13.08862590789795, 13.935574531555176, 14.782522201538086, 15.629470825195312, 16.476417541503906, 17.323366165161133, 18.17031478881836, 19.017261505126953, 19.86421012878418, 20.711158752441406, 21.55810546875, 22.405054092407227, 23.252002716064453, 24.09895133972168]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 3.0, 2.0, 6.0, 2.0, 6.0, 4.0, 2.0, 10.0, 7.0, 11.0, 16.0, 23.0, 11.0, 23.0, 16.0, 23.0, 20.0, 21.0, 23.0, 37.0, 34.0, 33.0, 45.0, 49.0, 50.0, 54.0, 38.0, 43.0, 34.0, 37.0, 37.0, 32.0, 28.0, 28.0, 27.0, 29.0, 12.0, 12.0, 20.0, 14.0, 13.0, 18.0, 14.0, 6.0, 9.0, 5.0, 6.0, 6.0, 3.0, 2.0, 4.0, 3.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.614145278930664, -8.327057838439941, -8.039969444274902, -7.7528815269470215, -7.465793609619141, -7.178706169128418, -6.891618251800537, -6.604530334472656, -6.317442417144775, -6.0303544998168945, -5.743266582489014, -5.456178665161133, -5.16909122467041, -4.882002830505371, -4.594915390014648, -4.307827472686768, -4.020739555358887, -3.733651638031006, -3.446563720703125, -3.1594760417938232, -2.8723881244659424, -2.5853002071380615, -2.2982125282287598, -2.011124610900879, -1.724036693572998, -1.4369487762451172, -1.1498609781265259, -0.8627731204032898, -0.5756852626800537, -0.28859734535217285, -0.001509547233581543, 0.28557825088500977, 0.5726652145385742, 0.8597530722618103, 1.1468409299850464, 1.4339287281036377, 1.7210166454315186, 2.0081045627593994, 2.295192241668701, 2.582280158996582, 2.869368076324463, 3.1564559936523438, 3.4435439109802246, 3.7306315898895264, 4.017719268798828, 4.304807662963867, 4.59189510345459, 4.878983020782471, 5.166070938110352, 5.453158855438232, 5.740246772766113, 6.027334690093994, 6.314422607421875, 6.601510047912598, 6.8885979652404785, 7.175685882568359, 7.46277379989624, 7.749861717224121, 8.036949157714844, 8.324037551879883, 8.611124992370605, 8.898213386535645, 9.185300827026367, 9.472389221191406, 9.759476661682129]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 3.0, 7.0, 10.0, 10.0, 16.0, 20.0, 27.0, 47.0, 62.0, 83.0, 119.0, 163.0, 239.0, 353.0, 573.0, 912.0, 1502.0, 2685.0, 5011.0, 10477.0, 24110.0, 68738.0, 258485.0, 473082.0, 129758.0, 40042.0, 15781.0, 7192.0, 3743.0, 2051.0, 1148.0, 708.0, 451.0, 288.0, 190.0, 144.0, 99.0, 62.0, 59.0, 32.0, 11.0, 17.0, 12.0, 16.0, 5.0, 5.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-10.65625, -10.3153076171875, -9.974365234375, -9.6334228515625, -9.29248046875, -8.9515380859375, -8.610595703125, -8.2696533203125, -7.9287109375, -7.5877685546875, -7.246826171875, -6.9058837890625, -6.56494140625, -6.2239990234375, -5.883056640625, -5.5421142578125, -5.201171875, -4.8602294921875, -4.519287109375, -4.1783447265625, -3.83740234375, -3.4964599609375, -3.155517578125, -2.8145751953125, -2.4736328125, -2.1326904296875, -1.791748046875, -1.4508056640625, -1.10986328125, -0.7689208984375, -0.427978515625, -0.0870361328125, 0.25390625, 0.5948486328125, 0.935791015625, 1.2767333984375, 1.61767578125, 1.9586181640625, 2.299560546875, 2.6405029296875, 2.9814453125, 3.3223876953125, 3.663330078125, 4.0042724609375, 4.34521484375, 4.6861572265625, 5.027099609375, 5.3680419921875, 5.708984375, 6.0499267578125, 6.390869140625, 6.7318115234375, 7.07275390625, 7.4136962890625, 7.754638671875, 8.0955810546875, 8.4365234375, 8.7774658203125, 9.118408203125, 9.4593505859375, 9.80029296875, 10.1412353515625, 10.482177734375, 10.8231201171875, 11.1640625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 4.0, 1.0, 8.0, 8.0, 14.0, 7.0, 12.0, 18.0, 20.0, 19.0, 28.0, 32.0, 34.0, 34.0, 42.0, 57.0, 58.0, 60.0, 65.0, 61.0, 61.0, 41.0, 54.0, 40.0, 36.0, 28.0, 40.0, 24.0, 22.0, 13.0, 10.0, 13.0, 8.0, 8.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.05078125, -5.85919189453125, -5.6676025390625, -5.47601318359375, -5.284423828125, -5.09283447265625, -4.9012451171875, -4.70965576171875, -4.51806640625, -4.32647705078125, -4.1348876953125, -3.94329833984375, -3.751708984375, -3.56011962890625, -3.3685302734375, -3.17694091796875, -2.9853515625, -2.79376220703125, -2.6021728515625, -2.41058349609375, -2.218994140625, -2.02740478515625, -1.8358154296875, -1.64422607421875, -1.45263671875, -1.26104736328125, -1.0694580078125, -0.87786865234375, -0.686279296875, -0.49468994140625, -0.3031005859375, -0.11151123046875, 0.080078125, 0.27166748046875, 0.4632568359375, 0.65484619140625, 0.846435546875, 1.03802490234375, 1.2296142578125, 1.42120361328125, 1.61279296875, 1.80438232421875, 1.9959716796875, 2.18756103515625, 2.379150390625, 2.57073974609375, 2.7623291015625, 2.95391845703125, 3.1455078125, 3.33709716796875, 3.5286865234375, 3.72027587890625, 3.911865234375, 4.10345458984375, 4.2950439453125, 4.48663330078125, 4.67822265625, 4.86981201171875, 5.0614013671875, 5.25299072265625, 5.444580078125, 5.63616943359375, 5.8277587890625, 6.01934814453125, 6.2109375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 2.0, 7.0, 7.0, 9.0, 17.0, 20.0, 24.0, 39.0, 68.0, 94.0, 137.0, 279.0, 402.0, 846.0, 1849.0, 5303.0, 21717.0, 177450.0, 745055.0, 76000.0, 12529.0, 3562.0, 1501.0, 653.0, 383.0, 214.0, 127.0, 92.0, 45.0, 38.0, 31.0, 11.0, 14.0, 7.0, 6.0, 6.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.140625, -18.41357421875, -17.6865234375, -16.95947265625, -16.232421875, -15.50537109375, -14.7783203125, -14.05126953125, -13.32421875, -12.59716796875, -11.8701171875, -11.14306640625, -10.416015625, -9.68896484375, -8.9619140625, -8.23486328125, -7.5078125, -6.78076171875, -6.0537109375, -5.32666015625, -4.599609375, -3.87255859375, -3.1455078125, -2.41845703125, -1.69140625, -0.96435546875, -0.2373046875, 0.48974609375, 1.216796875, 1.94384765625, 2.6708984375, 3.39794921875, 4.125, 4.85205078125, 5.5791015625, 6.30615234375, 7.033203125, 7.76025390625, 8.4873046875, 9.21435546875, 9.94140625, 10.66845703125, 11.3955078125, 12.12255859375, 12.849609375, 13.57666015625, 14.3037109375, 15.03076171875, 15.7578125, 16.48486328125, 17.2119140625, 17.93896484375, 18.666015625, 19.39306640625, 20.1201171875, 20.84716796875, 21.57421875, 22.30126953125, 23.0283203125, 23.75537109375, 24.482421875, 25.20947265625, 25.9365234375, 26.66357421875, 27.390625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 8.0, 6.0, 15.0, 9.0, 24.0, 19.0, 27.0, 39.0, 53.0, 55.0, 67.0, 58.0, 79.0, 82.0, 66.0, 75.0, 78.0, 54.0, 54.0, 32.0, 29.0, 22.0, 21.0, 8.0, 11.0, 2.0, 2.0, 4.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.28125, -31.96630859375, -30.6513671875, -29.33642578125, -28.021484375, -26.70654296875, -25.3916015625, -24.07666015625, -22.76171875, -21.44677734375, -20.1318359375, -18.81689453125, -17.501953125, -16.18701171875, -14.8720703125, -13.55712890625, -12.2421875, -10.92724609375, -9.6123046875, -8.29736328125, -6.982421875, -5.66748046875, -4.3525390625, -3.03759765625, -1.72265625, -0.40771484375, 0.9072265625, 2.22216796875, 3.537109375, 4.85205078125, 6.1669921875, 7.48193359375, 8.796875, 10.11181640625, 11.4267578125, 12.74169921875, 14.056640625, 15.37158203125, 16.6865234375, 18.00146484375, 19.31640625, 20.63134765625, 21.9462890625, 23.26123046875, 24.576171875, 25.89111328125, 27.2060546875, 28.52099609375, 29.8359375, 31.15087890625, 32.4658203125, 33.78076171875, 35.095703125, 36.41064453125, 37.7255859375, 39.04052734375, 40.35546875, 41.67041015625, 42.9853515625, 44.30029296875, 45.615234375, 46.93017578125, 48.2451171875, 49.56005859375, 50.875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 8.0, 4.0, 4.0, 10.0, 9.0, 8.0, 16.0, 32.0, 39.0, 61.0, 139.0, 281.0, 742.0, 2480.0, 12879.0, 793356.0, 226944.0, 8552.0, 1842.0, 621.0, 266.0, 106.0, 66.0, 22.0, 18.0, 13.0, 9.0, 12.0, 4.0, 6.0, 2.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.296875, -16.737060546875, -16.17724609375, -15.617431640625, -15.0576171875, -14.497802734375, -13.93798828125, -13.378173828125, -12.818359375, -12.258544921875, -11.69873046875, -11.138916015625, -10.5791015625, -10.019287109375, -9.45947265625, -8.899658203125, -8.33984375, -7.780029296875, -7.22021484375, -6.660400390625, -6.1005859375, -5.540771484375, -4.98095703125, -4.421142578125, -3.861328125, -3.301513671875, -2.74169921875, -2.181884765625, -1.6220703125, -1.062255859375, -0.50244140625, 0.057373046875, 0.6171875, 1.177001953125, 1.73681640625, 2.296630859375, 2.8564453125, 3.416259765625, 3.97607421875, 4.535888671875, 5.095703125, 5.655517578125, 6.21533203125, 6.775146484375, 7.3349609375, 7.894775390625, 8.45458984375, 9.014404296875, 9.57421875, 10.134033203125, 10.69384765625, 11.253662109375, 11.8134765625, 12.373291015625, 12.93310546875, 13.492919921875, 14.052734375, 14.612548828125, 15.17236328125, 15.732177734375, 16.2919921875, 16.851806640625, 17.41162109375, 17.971435546875, 18.53125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 2.0, 2.0, 2.0, 7.0, 11.0, 12.0, 18.0, 33.0, 51.0, 82.0, 156.0, 196.0, 148.0, 106.0, 65.0, 39.0, 21.0, 15.0, 12.0, 5.0, 7.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011911392211914062, -0.0011429041624069214, -0.0010946691036224365, -0.0010464340448379517, -0.0009981989860534668, -0.0009499639272689819, -0.0009017288684844971, -0.0008534938097000122, -0.0008052587509155273, -0.0007570236921310425, -0.0007087886333465576, -0.0006605535745620728, -0.0006123185157775879, -0.000564083456993103, -0.0005158483982086182, -0.0004676133394241333, -0.00041937828063964844, -0.0003711432218551636, -0.0003229081630706787, -0.00027467310428619385, -0.00022643804550170898, -0.00017820298671722412, -0.00012996792793273926, -8.17328691482544e-05, -3.349781036376953e-05, 1.4737248420715332e-05, 6.29723072052002e-05, 0.00011120736598968506, 0.00015944242477416992, 0.00020767748355865479, 0.00025591254234313965, 0.0003041476011276245, 0.0003523826599121094, 0.00040061771869659424, 0.0004488527774810791, 0.000497087836265564, 0.0005453228950500488, 0.0005935579538345337, 0.0006417930126190186, 0.0006900280714035034, 0.0007382631301879883, 0.0007864981889724731, 0.000834733247756958, 0.0008829683065414429, 0.0009312033653259277, 0.0009794384241104126, 0.0010276734828948975, 0.0010759085416793823, 0.0011241436004638672, 0.001172378659248352, 0.001220613718032837, 0.0012688487768173218, 0.0013170838356018066, 0.0013653188943862915, 0.0014135539531707764, 0.0014617890119552612, 0.001510024070739746, 0.001558259129524231, 0.0016064941883087158, 0.0016547292470932007, 0.0017029643058776855, 0.0017511993646621704, 0.0017994344234466553, 0.0018476694822311401, 0.001895904541015625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 5.0, 11.0, 8.0, 12.0, 22.0, 29.0, 60.0, 93.0, 139.0, 330.0, 557.0, 1240.0, 2993.0, 11014.0, 117823.0, 867760.0, 36121.0, 6388.0, 2040.0, 879.0, 430.0, 248.0, 130.0, 100.0, 49.0, 20.0, 17.0, 15.0, 9.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-14.3671875, -13.971435546875, -13.57568359375, -13.179931640625, -12.7841796875, -12.388427734375, -11.99267578125, -11.596923828125, -11.201171875, -10.805419921875, -10.40966796875, -10.013916015625, -9.6181640625, -9.222412109375, -8.82666015625, -8.430908203125, -8.03515625, -7.639404296875, -7.24365234375, -6.847900390625, -6.4521484375, -6.056396484375, -5.66064453125, -5.264892578125, -4.869140625, -4.473388671875, -4.07763671875, -3.681884765625, -3.2861328125, -2.890380859375, -2.49462890625, -2.098876953125, -1.703125, -1.307373046875, -0.91162109375, -0.515869140625, -0.1201171875, 0.275634765625, 0.67138671875, 1.067138671875, 1.462890625, 1.858642578125, 2.25439453125, 2.650146484375, 3.0458984375, 3.441650390625, 3.83740234375, 4.233154296875, 4.62890625, 5.024658203125, 5.42041015625, 5.816162109375, 6.2119140625, 6.607666015625, 7.00341796875, 7.399169921875, 7.794921875, 8.190673828125, 8.58642578125, 8.982177734375, 9.3779296875, 9.773681640625, 10.16943359375, 10.565185546875, 10.9609375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 10.0, 13.0, 29.0, 44.0, 82.0, 200.0, 244.0, 170.0, 83.0, 39.0, 24.0, 12.0, 12.0, 8.0, 7.0, 1.0, 4.0, 1.0, 3.0, 2.0, 6.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.875, -19.297607421875, -18.72021484375, -18.142822265625, -17.5654296875, -16.988037109375, -16.41064453125, -15.833251953125, -15.255859375, -14.678466796875, -14.10107421875, -13.523681640625, -12.9462890625, -12.368896484375, -11.79150390625, -11.214111328125, -10.63671875, -10.059326171875, -9.48193359375, -8.904541015625, -8.3271484375, -7.749755859375, -7.17236328125, -6.594970703125, -6.017578125, -5.440185546875, -4.86279296875, -4.285400390625, -3.7080078125, -3.130615234375, -2.55322265625, -1.975830078125, -1.3984375, -0.821044921875, -0.24365234375, 0.333740234375, 0.9111328125, 1.488525390625, 2.06591796875, 2.643310546875, 3.220703125, 3.798095703125, 4.37548828125, 4.952880859375, 5.5302734375, 6.107666015625, 6.68505859375, 7.262451171875, 7.83984375, 8.417236328125, 8.99462890625, 9.572021484375, 10.1494140625, 10.726806640625, 11.30419921875, 11.881591796875, 12.458984375, 13.036376953125, 13.61376953125, 14.191162109375, 14.7685546875, 15.345947265625, 15.92333984375, 16.500732421875, 17.078125]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 19.0, 28.0, 66.0, 191.0, 315.0, 251.0, 94.0, 27.0, 10.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-535.55419921875, -525.1531372070312, -514.7521362304688, -504.3511047363281, -493.9500732421875, -483.5490417480469, -473.14801025390625, -462.7469482421875, -452.345947265625, -441.9449157714844, -431.54388427734375, -421.1428527832031, -410.7418212890625, -400.3407897949219, -389.93975830078125, -379.5386962890625, -369.1376647949219, -358.73663330078125, -348.3356018066406, -337.9345703125, -327.5335388183594, -317.13250732421875, -306.7314758300781, -296.3304443359375, -285.92938232421875, -275.5283508300781, -265.1273193359375, -254.72628784179688, -244.32525634765625, -233.92422485351562, -223.52317810058594, -213.1221466064453, -202.7211456298828, -192.3201141357422, -181.91908264160156, -171.51805114746094, -161.11700439453125, -150.71597290039062, -140.31494140625, -129.91390991210938, -119.51287841796875, -109.11184692382812, -98.7108154296875, -88.30977630615234, -77.90874481201172, -67.5077133178711, -57.1066780090332, -46.70564270019531, -36.30461120605469, -25.90357780456543, -15.502544403076172, -5.101511001586914, 5.299522399902344, 15.700553894042969, 26.10158920288086, 36.50262451171875, 46.903656005859375, 57.3046875, 67.70571899414062, 78.10675811767578, 88.5077896118164, 98.90882110595703, 109.30986022949219, 119.71089172363281, 130.11192321777344]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 9.0, 12.0, 7.0, 11.0, 15.0, 8.0, 18.0, 22.0, 19.0, 31.0, 36.0, 35.0, 48.0, 44.0, 49.0, 35.0, 53.0, 57.0, 50.0, 53.0, 51.0, 32.0, 33.0, 31.0, 32.0, 32.0, 25.0, 30.0, 20.0, 20.0, 15.0, 10.0, 15.0, 8.0, 8.0, 7.0, 2.0, 5.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0], "bins": [-145.06704711914062, -141.10931396484375, -137.1515655517578, -133.19381713867188, -129.236083984375, -125.2783432006836, -121.32060241699219, -117.36286163330078, -113.40512084960938, -109.44738006591797, -105.48963928222656, -101.53189849853516, -97.57415771484375, -93.61641693115234, -89.65867614746094, -85.70093536376953, -81.74319458007812, -77.78545379638672, -73.82771301269531, -69.8699722290039, -65.9122314453125, -61.954490661621094, -57.99674987792969, -54.03900909423828, -50.081268310546875, -46.12352752685547, -42.16578674316406, -38.208045959472656, -34.25030517578125, -30.292564392089844, -26.334823608398438, -22.37708282470703, -18.419342041015625, -14.461601257324219, -10.503860473632812, -6.546119689941406, -2.58837890625, 1.3693618774414062, 5.3271026611328125, 9.284843444824219, 13.242584228515625, 17.20032501220703, 21.158065795898438, 25.115806579589844, 29.07354736328125, 33.031288146972656, 36.98902893066406, 40.94676971435547, 44.904510498046875, 48.86225128173828, 52.81999206542969, 56.777732849121094, 60.7354736328125, 64.6932144165039, 68.65095520019531, 72.60869598388672, 76.56643676757812, 80.52417755126953, 84.48191833496094, 88.43965911865234, 92.39739990234375, 96.35514068603516, 100.31288146972656, 104.27062225341797, 108.22836303710938]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 1.0, 3.0, 6.0, 5.0, 3.0, 9.0, 6.0, 10.0, 19.0, 22.0, 36.0, 46.0, 67.0, 82.0, 146.0, 202.0, 285.0, 578.0, 955.0, 2162.0, 7352.0, 4142711.0, 31714.0, 4291.0, 1529.0, 730.0, 444.0, 248.0, 178.0, 116.0, 88.0, 57.0, 52.0, 36.0, 27.0, 18.0, 10.0, 11.0, 5.0, 5.0, 4.0, 3.0, 1.0, 7.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0], "bins": [-32.03125, -31.05517578125, -30.0791015625, -29.10302734375, -28.126953125, -27.15087890625, -26.1748046875, -25.19873046875, -24.22265625, -23.24658203125, -22.2705078125, -21.29443359375, -20.318359375, -19.34228515625, -18.3662109375, -17.39013671875, -16.4140625, -15.43798828125, -14.4619140625, -13.48583984375, -12.509765625, -11.53369140625, -10.5576171875, -9.58154296875, -8.60546875, -7.62939453125, -6.6533203125, -5.67724609375, -4.701171875, -3.72509765625, -2.7490234375, -1.77294921875, -0.796875, 0.17919921875, 1.1552734375, 2.13134765625, 3.107421875, 4.08349609375, 5.0595703125, 6.03564453125, 7.01171875, 7.98779296875, 8.9638671875, 9.93994140625, 10.916015625, 11.89208984375, 12.8681640625, 13.84423828125, 14.8203125, 15.79638671875, 16.7724609375, 17.74853515625, 18.724609375, 19.70068359375, 20.6767578125, 21.65283203125, 22.62890625, 23.60498046875, 24.5810546875, 25.55712890625, 26.533203125, 27.50927734375, 28.4853515625, 29.46142578125, 30.4375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 2.0, 8.0, 13.0, 20.0, 31.0, 46.0, 64.0, 71.0, 90.0, 100.0, 101.0, 96.0, 84.0, 73.0, 57.0, 35.0, 37.0, 24.0, 24.0, 11.0, 6.0, 3.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.8125, -11.4989013671875, -11.185302734375, -10.8717041015625, -10.55810546875, -10.2445068359375, -9.930908203125, -9.6173095703125, -9.3037109375, -8.9901123046875, -8.676513671875, -8.3629150390625, -8.04931640625, -7.7357177734375, -7.422119140625, -7.1085205078125, -6.794921875, -6.4813232421875, -6.167724609375, -5.8541259765625, -5.54052734375, -5.2269287109375, -4.913330078125, -4.5997314453125, -4.2861328125, -3.9725341796875, -3.658935546875, -3.3453369140625, -3.03173828125, -2.7181396484375, -2.404541015625, -2.0909423828125, -1.77734375, -1.4637451171875, -1.150146484375, -0.8365478515625, -0.52294921875, -0.2093505859375, 0.104248046875, 0.4178466796875, 0.7314453125, 1.0450439453125, 1.358642578125, 1.6722412109375, 1.98583984375, 2.2994384765625, 2.613037109375, 2.9266357421875, 3.240234375, 3.5538330078125, 3.867431640625, 4.1810302734375, 4.49462890625, 4.8082275390625, 5.121826171875, 5.4354248046875, 5.7490234375, 6.0626220703125, 6.376220703125, 6.6898193359375, 7.00341796875, 7.3170166015625, 7.630615234375, 7.9442138671875, 8.2578125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 1.0, 5.0, 7.0, 8.0, 13.0, 12.0, 25.0, 16.0, 34.0, 40.0, 75.0, 112.0, 185.0, 339.0, 610.0, 1148.0, 2565.0, 7334.0, 42144.0, 4115960.0, 15444.0, 4438.0, 1756.0, 829.0, 458.0, 270.0, 163.0, 109.0, 47.0, 41.0, 26.0, 15.0, 18.0, 15.0, 11.0, 11.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.34375, -33.3115234375, -32.279296875, -31.2470703125, -30.21484375, -29.1826171875, -28.150390625, -27.1181640625, -26.0859375, -25.0537109375, -24.021484375, -22.9892578125, -21.95703125, -20.9248046875, -19.892578125, -18.8603515625, -17.828125, -16.7958984375, -15.763671875, -14.7314453125, -13.69921875, -12.6669921875, -11.634765625, -10.6025390625, -9.5703125, -8.5380859375, -7.505859375, -6.4736328125, -5.44140625, -4.4091796875, -3.376953125, -2.3447265625, -1.3125, -0.2802734375, 0.751953125, 1.7841796875, 2.81640625, 3.8486328125, 4.880859375, 5.9130859375, 6.9453125, 7.9775390625, 9.009765625, 10.0419921875, 11.07421875, 12.1064453125, 13.138671875, 14.1708984375, 15.203125, 16.2353515625, 17.267578125, 18.2998046875, 19.33203125, 20.3642578125, 21.396484375, 22.4287109375, 23.4609375, 24.4931640625, 25.525390625, 26.5576171875, 27.58984375, 28.6220703125, 29.654296875, 30.6865234375, 31.71875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 3.0, 3.0, 6.0, 7.0, 8.0, 14.0, 29.0, 3827.0, 109.0, 33.0, 17.0, 5.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.6875, -17.242431640625, -16.79736328125, -16.352294921875, -15.9072265625, -15.462158203125, -15.01708984375, -14.572021484375, -14.126953125, -13.681884765625, -13.23681640625, -12.791748046875, -12.3466796875, -11.901611328125, -11.45654296875, -11.011474609375, -10.56640625, -10.121337890625, -9.67626953125, -9.231201171875, -8.7861328125, -8.341064453125, -7.89599609375, -7.450927734375, -7.005859375, -6.560791015625, -6.11572265625, -5.670654296875, -5.2255859375, -4.780517578125, -4.33544921875, -3.890380859375, -3.4453125, -3.000244140625, -2.55517578125, -2.110107421875, -1.6650390625, -1.219970703125, -0.77490234375, -0.329833984375, 0.115234375, 0.560302734375, 1.00537109375, 1.450439453125, 1.8955078125, 2.340576171875, 2.78564453125, 3.230712890625, 3.67578125, 4.120849609375, 4.56591796875, 5.010986328125, 5.4560546875, 5.901123046875, 6.34619140625, 6.791259765625, 7.236328125, 7.681396484375, 8.12646484375, 8.571533203125, 9.0166015625, 9.461669921875, 9.90673828125, 10.351806640625, 10.796875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 8.0, 17.0, 46.0, 94.0, 185.0, 245.0, 182.0, 115.0, 50.0, 27.0, 16.0, 6.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.75697326660156, -56.887794494628906, -55.018611907958984, -53.14943313598633, -51.28025436401367, -49.41107177734375, -47.541893005371094, -45.67271423339844, -43.80353546142578, -41.934356689453125, -40.0651741027832, -38.19599533081055, -36.32681655883789, -34.45763397216797, -32.58845520019531, -30.719276428222656, -28.850093841552734, -26.980913162231445, -25.11173439025879, -23.2425537109375, -21.373374938964844, -19.504194259643555, -17.635013580322266, -15.765833854675293, -13.89665412902832, -12.027474403381348, -10.158294677734375, -8.289113998413086, -6.419934272766113, -4.550754547119141, -2.6815738677978516, -0.8123941421508789, 1.0567893981933594, 2.925969362258911, 4.795149326324463, 6.664329528808594, 8.533509254455566, 10.402688980102539, 12.271869659423828, 14.1410493850708, 16.010229110717773, 17.879409790039062, 19.74858856201172, 21.617769241333008, 23.486949920654297, 25.356128692626953, 27.225309371948242, 29.09449005126953, 30.963668823242188, 32.832847595214844, 34.702030181884766, 36.57120895385742, 38.44038772583008, 40.3095703125, 42.178749084472656, 44.04792785644531, 45.91710662841797, 47.786285400390625, 49.65546798706055, 51.5246467590332, 53.39382553100586, 55.26300811767578, 57.13218688964844, 59.001365661621094, 60.870548248291016]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 13.0, 6.0, 17.0, 12.0, 17.0, 15.0, 24.0, 43.0, 37.0, 42.0, 47.0, 63.0, 62.0, 72.0, 61.0, 67.0, 61.0, 55.0, 71.0, 43.0, 34.0, 30.0, 35.0, 20.0, 20.0, 12.0, 12.0, 5.0, 4.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.450119018554688, -28.517234802246094, -27.5843505859375, -26.65146827697754, -25.718584060668945, -24.78569984436035, -23.85281753540039, -22.919933319091797, -21.987049102783203, -21.05416488647461, -20.121280670166016, -19.188398361206055, -18.25551414489746, -17.322629928588867, -16.389747619628906, -15.456863403320312, -14.523979187011719, -13.591094970703125, -12.658211708068848, -11.72532844543457, -10.792444229125977, -9.859560012817383, -8.926676750183105, -7.99379301071167, -7.060909271240234, -6.128025531768799, -5.195141792297363, -4.262258052825928, -3.329374313354492, -2.3964905738830566, -1.463606834411621, -0.5307230949401855, 0.40216064453125, 1.3350443840026855, 2.267928123474121, 3.2008118629455566, 4.133695602416992, 5.066579341888428, 5.999463081359863, 6.932346820831299, 7.865230560302734, 8.798114776611328, 9.730998039245605, 10.663881301879883, 11.596765518188477, 12.52964973449707, 13.462532997131348, 14.395416259765625, 15.328300476074219, 16.261184692382812, 17.194068908691406, 18.126951217651367, 19.05983543395996, 19.992719650268555, 20.925601959228516, 21.85848617553711, 22.791370391845703, 23.724254608154297, 24.65713882446289, 25.59002113342285, 26.522905349731445, 27.45578956604004, 28.388671875, 29.321556091308594, 30.254440307617188]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 7.0, 5.0, 10.0, 10.0, 22.0, 22.0, 31.0, 33.0, 51.0, 91.0, 164.0, 220.0, 404.0, 720.0, 1489.0, 3144.0, 7374.0, 19606.0, 59142.0, 218194.0, 489482.0, 171957.0, 48169.0, 16157.0, 6340.0, 2851.0, 1275.0, 636.0, 364.0, 190.0, 116.0, 84.0, 57.0, 37.0, 29.0, 19.0, 12.0, 15.0, 9.0, 5.0, 4.0, 5.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-16.21875, -15.7607421875, -15.302734375, -14.8447265625, -14.38671875, -13.9287109375, -13.470703125, -13.0126953125, -12.5546875, -12.0966796875, -11.638671875, -11.1806640625, -10.72265625, -10.2646484375, -9.806640625, -9.3486328125, -8.890625, -8.4326171875, -7.974609375, -7.5166015625, -7.05859375, -6.6005859375, -6.142578125, -5.6845703125, -5.2265625, -4.7685546875, -4.310546875, -3.8525390625, -3.39453125, -2.9365234375, -2.478515625, -2.0205078125, -1.5625, -1.1044921875, -0.646484375, -0.1884765625, 0.26953125, 0.7275390625, 1.185546875, 1.6435546875, 2.1015625, 2.5595703125, 3.017578125, 3.4755859375, 3.93359375, 4.3916015625, 4.849609375, 5.3076171875, 5.765625, 6.2236328125, 6.681640625, 7.1396484375, 7.59765625, 8.0556640625, 8.513671875, 8.9716796875, 9.4296875, 9.8876953125, 10.345703125, 10.8037109375, 11.26171875, 11.7197265625, 12.177734375, 12.6357421875, 13.09375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 6.0, 14.0, 12.0, 19.0, 19.0, 44.0, 39.0, 66.0, 74.0, 86.0, 87.0, 89.0, 82.0, 80.0, 67.0, 56.0, 46.0, 34.0, 27.0, 30.0, 14.0, 6.0, 9.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.9296875, -9.62451171875, -9.3193359375, -9.01416015625, -8.708984375, -8.40380859375, -8.0986328125, -7.79345703125, -7.48828125, -7.18310546875, -6.8779296875, -6.57275390625, -6.267578125, -5.96240234375, -5.6572265625, -5.35205078125, -5.046875, -4.74169921875, -4.4365234375, -4.13134765625, -3.826171875, -3.52099609375, -3.2158203125, -2.91064453125, -2.60546875, -2.30029296875, -1.9951171875, -1.68994140625, -1.384765625, -1.07958984375, -0.7744140625, -0.46923828125, -0.1640625, 0.14111328125, 0.4462890625, 0.75146484375, 1.056640625, 1.36181640625, 1.6669921875, 1.97216796875, 2.27734375, 2.58251953125, 2.8876953125, 3.19287109375, 3.498046875, 3.80322265625, 4.1083984375, 4.41357421875, 4.71875, 5.02392578125, 5.3291015625, 5.63427734375, 5.939453125, 6.24462890625, 6.5498046875, 6.85498046875, 7.16015625, 7.46533203125, 7.7705078125, 8.07568359375, 8.380859375, 8.68603515625, 8.9912109375, 9.29638671875, 9.6015625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 6.0, 4.0, 3.0, 4.0, 5.0, 2.0, 17.0, 19.0, 31.0, 37.0, 77.0, 94.0, 157.0, 258.0, 487.0, 952.0, 2253.0, 6040.0, 22066.0, 124205.0, 674022.0, 177094.0, 28503.0, 7136.0, 2599.0, 1124.0, 550.0, 300.0, 160.0, 113.0, 66.0, 48.0, 39.0, 20.0, 20.0, 20.0, 7.0, 5.0, 6.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-22.8125, -22.18896484375, -21.5654296875, -20.94189453125, -20.318359375, -19.69482421875, -19.0712890625, -18.44775390625, -17.82421875, -17.20068359375, -16.5771484375, -15.95361328125, -15.330078125, -14.70654296875, -14.0830078125, -13.45947265625, -12.8359375, -12.21240234375, -11.5888671875, -10.96533203125, -10.341796875, -9.71826171875, -9.0947265625, -8.47119140625, -7.84765625, -7.22412109375, -6.6005859375, -5.97705078125, -5.353515625, -4.72998046875, -4.1064453125, -3.48291015625, -2.859375, -2.23583984375, -1.6123046875, -0.98876953125, -0.365234375, 0.25830078125, 0.8818359375, 1.50537109375, 2.12890625, 2.75244140625, 3.3759765625, 3.99951171875, 4.623046875, 5.24658203125, 5.8701171875, 6.49365234375, 7.1171875, 7.74072265625, 8.3642578125, 8.98779296875, 9.611328125, 10.23486328125, 10.8583984375, 11.48193359375, 12.10546875, 12.72900390625, 13.3525390625, 13.97607421875, 14.599609375, 15.22314453125, 15.8466796875, 16.47021484375, 17.09375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 11.0, 8.0, 7.0, 6.0, 18.0, 16.0, 18.0, 22.0, 22.0, 30.0, 27.0, 42.0, 32.0, 45.0, 46.0, 60.0, 61.0, 50.0, 53.0, 54.0, 49.0, 42.0, 31.0, 40.0, 38.0, 24.0, 23.0, 21.0, 16.0, 18.0, 12.0, 12.0, 15.0, 7.0, 6.0, 6.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.390625, -25.576904296875, -24.76318359375, -23.949462890625, -23.1357421875, -22.322021484375, -21.50830078125, -20.694580078125, -19.880859375, -19.067138671875, -18.25341796875, -17.439697265625, -16.6259765625, -15.812255859375, -14.99853515625, -14.184814453125, -13.37109375, -12.557373046875, -11.74365234375, -10.929931640625, -10.1162109375, -9.302490234375, -8.48876953125, -7.675048828125, -6.861328125, -6.047607421875, -5.23388671875, -4.420166015625, -3.6064453125, -2.792724609375, -1.97900390625, -1.165283203125, -0.3515625, 0.462158203125, 1.27587890625, 2.089599609375, 2.9033203125, 3.717041015625, 4.53076171875, 5.344482421875, 6.158203125, 6.971923828125, 7.78564453125, 8.599365234375, 9.4130859375, 10.226806640625, 11.04052734375, 11.854248046875, 12.66796875, 13.481689453125, 14.29541015625, 15.109130859375, 15.9228515625, 16.736572265625, 17.55029296875, 18.364013671875, 19.177734375, 19.991455078125, 20.80517578125, 21.618896484375, 22.4326171875, 23.246337890625, 24.06005859375, 24.873779296875, 25.6875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 2.0, 0.0, 2.0, 3.0, 7.0, 13.0, 9.0, 27.0, 38.0, 61.0, 122.0, 274.0, 746.0, 2713.0, 25374.0, 904399.0, 107380.0, 5493.0, 1144.0, 409.0, 152.0, 73.0, 47.0, 23.0, 17.0, 11.0, 8.0, 3.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.1484375, -10.745849609375, -10.34326171875, -9.940673828125, -9.5380859375, -9.135498046875, -8.73291015625, -8.330322265625, -7.927734375, -7.525146484375, -7.12255859375, -6.719970703125, -6.3173828125, -5.914794921875, -5.51220703125, -5.109619140625, -4.70703125, -4.304443359375, -3.90185546875, -3.499267578125, -3.0966796875, -2.694091796875, -2.29150390625, -1.888916015625, -1.486328125, -1.083740234375, -0.68115234375, -0.278564453125, 0.1240234375, 0.526611328125, 0.92919921875, 1.331787109375, 1.734375, 2.136962890625, 2.53955078125, 2.942138671875, 3.3447265625, 3.747314453125, 4.14990234375, 4.552490234375, 4.955078125, 5.357666015625, 5.76025390625, 6.162841796875, 6.5654296875, 6.968017578125, 7.37060546875, 7.773193359375, 8.17578125, 8.578369140625, 8.98095703125, 9.383544921875, 9.7861328125, 10.188720703125, 10.59130859375, 10.993896484375, 11.396484375, 11.799072265625, 12.20166015625, 12.604248046875, 13.0068359375, 13.409423828125, 13.81201171875, 14.214599609375, 14.6171875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 3.0, 8.0, 7.0, 10.0, 11.0, 20.0, 16.0, 25.0, 30.0, 33.0, 63.0, 57.0, 64.0, 87.0, 80.0, 76.0, 74.0, 60.0, 43.0, 42.0, 30.0, 29.0, 25.0, 20.0, 8.0, 9.0, 8.0, 8.0, 10.0, 9.0, 5.0, 5.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0006632804870605469, -0.0006410554051399231, -0.0006188303232192993, -0.0005966052412986755, -0.0005743801593780518, -0.000552155077457428, -0.0005299299955368042, -0.0005077049136161804, -0.00048547983169555664, -0.00046325474977493286, -0.0004410296678543091, -0.0004188045859336853, -0.0003965795040130615, -0.00037435442209243774, -0.00035212934017181396, -0.0003299042582511902, -0.0003076791763305664, -0.0002854540944099426, -0.00026322901248931885, -0.00024100393056869507, -0.0002187788486480713, -0.0001965537667274475, -0.00017432868480682373, -0.00015210360288619995, -0.00012987852096557617, -0.00010765343904495239, -8.542835712432861e-05, -6.320327520370483e-05, -4.0978193283081055e-05, -1.8753111362457275e-05, 3.471970558166504e-06, 2.5697052478790283e-05, 4.792213439941406e-05, 7.014721632003784e-05, 9.237229824066162e-05, 0.0001145973801612854, 0.00013682246208190918, 0.00015904754400253296, 0.00018127262592315674, 0.00020349770784378052, 0.0002257227897644043, 0.0002479478716850281, 0.00027017295360565186, 0.00029239803552627563, 0.0003146231174468994, 0.0003368481993675232, 0.00035907328128814697, 0.00038129836320877075, 0.00040352344512939453, 0.0004257485270500183, 0.0004479736089706421, 0.00047019869089126587, 0.0004924237728118896, 0.0005146488547325134, 0.0005368739366531372, 0.000559099018573761, 0.0005813241004943848, 0.0006035491824150085, 0.0006257742643356323, 0.0006479993462562561, 0.0006702244281768799, 0.0006924495100975037, 0.0007146745920181274, 0.0007368996739387512, 0.000759124755859375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 5.0, 5.0, 10.0, 22.0, 47.0, 97.0, 334.0, 1638.0, 23971.0, 991396.0, 28726.0, 1705.0, 384.0, 125.0, 44.0, 20.0, 10.0, 16.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.984375, -15.403564453125, -14.82275390625, -14.241943359375, -13.6611328125, -13.080322265625, -12.49951171875, -11.918701171875, -11.337890625, -10.757080078125, -10.17626953125, -9.595458984375, -9.0146484375, -8.433837890625, -7.85302734375, -7.272216796875, -6.69140625, -6.110595703125, -5.52978515625, -4.948974609375, -4.3681640625, -3.787353515625, -3.20654296875, -2.625732421875, -2.044921875, -1.464111328125, -0.88330078125, -0.302490234375, 0.2783203125, 0.859130859375, 1.43994140625, 2.020751953125, 2.6015625, 3.182373046875, 3.76318359375, 4.343994140625, 4.9248046875, 5.505615234375, 6.08642578125, 6.667236328125, 7.248046875, 7.828857421875, 8.40966796875, 8.990478515625, 9.5712890625, 10.152099609375, 10.73291015625, 11.313720703125, 11.89453125, 12.475341796875, 13.05615234375, 13.636962890625, 14.2177734375, 14.798583984375, 15.37939453125, 15.960205078125, 16.541015625, 17.121826171875, 17.70263671875, 18.283447265625, 18.8642578125, 19.445068359375, 20.02587890625, 20.606689453125, 21.1875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 4.0, 5.0, 7.0, 12.0, 20.0, 37.0, 54.0, 108.0, 156.0, 184.0, 150.0, 98.0, 76.0, 37.0, 30.0, 16.0, 6.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-18.015625, -17.60107421875, -17.1865234375, -16.77197265625, -16.357421875, -15.94287109375, -15.5283203125, -15.11376953125, -14.69921875, -14.28466796875, -13.8701171875, -13.45556640625, -13.041015625, -12.62646484375, -12.2119140625, -11.79736328125, -11.3828125, -10.96826171875, -10.5537109375, -10.13916015625, -9.724609375, -9.31005859375, -8.8955078125, -8.48095703125, -8.06640625, -7.65185546875, -7.2373046875, -6.82275390625, -6.408203125, -5.99365234375, -5.5791015625, -5.16455078125, -4.75, -4.33544921875, -3.9208984375, -3.50634765625, -3.091796875, -2.67724609375, -2.2626953125, -1.84814453125, -1.43359375, -1.01904296875, -0.6044921875, -0.18994140625, 0.224609375, 0.63916015625, 1.0537109375, 1.46826171875, 1.8828125, 2.29736328125, 2.7119140625, 3.12646484375, 3.541015625, 3.95556640625, 4.3701171875, 4.78466796875, 5.19921875, 5.61376953125, 6.0283203125, 6.44287109375, 6.857421875, 7.27197265625, 7.6865234375, 8.10107421875, 8.515625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 7.0, 14.0, 20.0, 53.0, 112.0, 207.0, 211.0, 196.0, 105.0, 46.0, 12.0, 5.0, 8.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-137.77745056152344, -130.9923858642578, -124.20731353759766, -117.42224884033203, -110.63717651367188, -103.85211181640625, -97.06704711914062, -90.281982421875, -83.49691009521484, -76.71184539794922, -69.92677307128906, -63.14170837402344, -56.35663986206055, -49.571571350097656, -42.78650665283203, -36.00143814086914, -29.21636962890625, -22.43130111694336, -15.646234512329102, -8.861167907714844, -2.076099395751953, 4.7089691162109375, 11.494033813476562, 18.279102325439453, 25.064170837402344, 31.849239349365234, 38.634307861328125, 45.41937255859375, 52.20444107055664, 58.98950958251953, 65.77457427978516, 72.55964660644531, 79.34469604492188, 86.1297607421875, 92.91483306884766, 99.69989776611328, 106.48497009277344, 113.27003479003906, 120.05509948730469, 126.84016418457031, 133.625244140625, 140.41030883789062, 147.19537353515625, 153.98043823242188, 160.76551818847656, 167.5505828857422, 174.3356475830078, 181.12071228027344, 187.90577697753906, 194.6908416748047, 201.4759063720703, 208.260986328125, 215.04605102539062, 221.83111572265625, 228.61618041992188, 235.4012451171875, 242.18630981445312, 248.97137451171875, 255.75643920898438, 262.54150390625, 269.3265686035156, 276.11163330078125, 282.896728515625, 289.6817932128906, 296.46685791015625]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 7.0, 5.0, 3.0, 5.0, 10.0, 6.0, 16.0, 14.0, 14.0, 21.0, 27.0, 27.0, 24.0, 36.0, 29.0, 45.0, 34.0, 51.0, 62.0, 67.0, 53.0, 50.0, 56.0, 50.0, 36.0, 29.0, 37.0, 38.0, 38.0, 28.0, 26.0, 15.0, 19.0, 9.0, 6.0, 5.0, 3.0, 5.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-117.80905151367188, -114.03343200683594, -110.25780487060547, -106.48218536376953, -102.70655822753906, -98.93093872070312, -95.15531158447266, -91.37969207763672, -87.60406494140625, -83.82844543457031, -80.05281829833984, -76.2771987915039, -72.50157165527344, -68.7259521484375, -64.95032501220703, -61.174705505371094, -57.39908218383789, -53.62345886230469, -49.847835540771484, -46.07221221923828, -42.29658889770508, -38.520965576171875, -34.74534606933594, -30.9697208404541, -27.1940975189209, -23.418474197387695, -19.642850875854492, -15.867228507995605, -12.091605186462402, -8.315982818603516, -4.5403594970703125, -0.7647361755371094, 3.0108871459960938, 6.786510467529297, 10.5621337890625, 14.337756156921387, 18.113380432128906, 21.889001846313477, 25.66462516784668, 29.440248489379883, 33.21587371826172, 36.99149703979492, 40.767120361328125, 44.54274368286133, 48.31836700439453, 52.09398651123047, 55.86961364746094, 59.645233154296875, 63.42085647583008, 67.19647979736328, 70.97209930419922, 74.74772644042969, 78.52334594726562, 82.2989730834961, 86.07459259033203, 89.8502197265625, 93.62583923339844, 97.40145874023438, 101.17708587646484, 104.95270538330078, 108.72833251953125, 112.50395202636719, 116.27957916259766, 120.0551986694336, 123.83082580566406]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 0.0, 5.0, 9.0, 7.0, 12.0, 19.0, 20.0, 40.0, 47.0, 61.0, 110.0, 145.0, 212.0, 415.0, 750.0, 1788.0, 5701.0, 30167.0, 3522443.0, 604899.0, 19819.0, 4500.0, 1410.0, 654.0, 341.0, 205.0, 170.0, 103.0, 77.0, 45.0, 42.0, 23.0, 14.0, 10.0, 7.0, 3.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.578125, -24.776123046875, -23.97412109375, -23.172119140625, -22.3701171875, -21.568115234375, -20.76611328125, -19.964111328125, -19.162109375, -18.360107421875, -17.55810546875, -16.756103515625, -15.9541015625, -15.152099609375, -14.35009765625, -13.548095703125, -12.74609375, -11.944091796875, -11.14208984375, -10.340087890625, -9.5380859375, -8.736083984375, -7.93408203125, -7.132080078125, -6.330078125, -5.528076171875, -4.72607421875, -3.924072265625, -3.1220703125, -2.320068359375, -1.51806640625, -0.716064453125, 0.0859375, 0.887939453125, 1.68994140625, 2.491943359375, 3.2939453125, 4.095947265625, 4.89794921875, 5.699951171875, 6.501953125, 7.303955078125, 8.10595703125, 8.907958984375, 9.7099609375, 10.511962890625, 11.31396484375, 12.115966796875, 12.91796875, 13.719970703125, 14.52197265625, 15.323974609375, 16.1259765625, 16.927978515625, 17.72998046875, 18.531982421875, 19.333984375, 20.135986328125, 20.93798828125, 21.739990234375, 22.5419921875, 23.343994140625, 24.14599609375, 24.947998046875, 25.75]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 9.0, 9.0, 8.0, 14.0, 19.0, 12.0, 26.0, 27.0, 31.0, 41.0, 45.0, 63.0, 50.0, 62.0, 52.0, 65.0, 63.0, 60.0, 55.0, 46.0, 51.0, 41.0, 25.0, 32.0, 25.0, 23.0, 9.0, 12.0, 4.0, 12.0, 3.0, 4.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.8515625, -6.6632080078125, -6.474853515625, -6.2864990234375, -6.09814453125, -5.9097900390625, -5.721435546875, -5.5330810546875, -5.3447265625, -5.1563720703125, -4.968017578125, -4.7796630859375, -4.59130859375, -4.4029541015625, -4.214599609375, -4.0262451171875, -3.837890625, -3.6495361328125, -3.461181640625, -3.2728271484375, -3.08447265625, -2.8961181640625, -2.707763671875, -2.5194091796875, -2.3310546875, -2.1427001953125, -1.954345703125, -1.7659912109375, -1.57763671875, -1.3892822265625, -1.200927734375, -1.0125732421875, -0.82421875, -0.6358642578125, -0.447509765625, -0.2591552734375, -0.07080078125, 0.1175537109375, 0.305908203125, 0.4942626953125, 0.6826171875, 0.8709716796875, 1.059326171875, 1.2476806640625, 1.43603515625, 1.6243896484375, 1.812744140625, 2.0010986328125, 2.189453125, 2.3778076171875, 2.566162109375, 2.7545166015625, 2.94287109375, 3.1312255859375, 3.319580078125, 3.5079345703125, 3.6962890625, 3.8846435546875, 4.072998046875, 4.2613525390625, 4.44970703125, 4.6380615234375, 4.826416015625, 5.0147705078125, 5.203125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 7.0, 2.0, 2.0, 2.0, 9.0, 5.0, 7.0, 23.0, 31.0, 50.0, 120.0, 335.0, 1323.0, 6298.0, 57215.0, 3998235.0, 118472.0, 9682.0, 1760.0, 429.0, 139.0, 54.0, 28.0, 15.0, 13.0, 8.0, 8.0, 8.0, 2.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.921875, -30.97216796875, -30.0224609375, -29.07275390625, -28.123046875, -27.17333984375, -26.2236328125, -25.27392578125, -24.32421875, -23.37451171875, -22.4248046875, -21.47509765625, -20.525390625, -19.57568359375, -18.6259765625, -17.67626953125, -16.7265625, -15.77685546875, -14.8271484375, -13.87744140625, -12.927734375, -11.97802734375, -11.0283203125, -10.07861328125, -9.12890625, -8.17919921875, -7.2294921875, -6.27978515625, -5.330078125, -4.38037109375, -3.4306640625, -2.48095703125, -1.53125, -0.58154296875, 0.3681640625, 1.31787109375, 2.267578125, 3.21728515625, 4.1669921875, 5.11669921875, 6.06640625, 7.01611328125, 7.9658203125, 8.91552734375, 9.865234375, 10.81494140625, 11.7646484375, 12.71435546875, 13.6640625, 14.61376953125, 15.5634765625, 16.51318359375, 17.462890625, 18.41259765625, 19.3623046875, 20.31201171875, 21.26171875, 22.21142578125, 23.1611328125, 24.11083984375, 25.060546875, 26.01025390625, 26.9599609375, 27.90966796875, 28.859375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 0.0, 4.0, 2.0, 6.0, 5.0, 7.0, 9.0, 6.0, 8.0, 7.0, 16.0, 23.0, 42.0, 58.0, 86.0, 187.0, 905.0, 1781.0, 500.0, 138.0, 83.0, 63.0, 44.0, 25.0, 17.0, 14.0, 10.0, 10.0, 6.0, 4.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-19.625, -19.0693359375, -18.513671875, -17.9580078125, -17.40234375, -16.8466796875, -16.291015625, -15.7353515625, -15.1796875, -14.6240234375, -14.068359375, -13.5126953125, -12.95703125, -12.4013671875, -11.845703125, -11.2900390625, -10.734375, -10.1787109375, -9.623046875, -9.0673828125, -8.51171875, -7.9560546875, -7.400390625, -6.8447265625, -6.2890625, -5.7333984375, -5.177734375, -4.6220703125, -4.06640625, -3.5107421875, -2.955078125, -2.3994140625, -1.84375, -1.2880859375, -0.732421875, -0.1767578125, 0.37890625, 0.9345703125, 1.490234375, 2.0458984375, 2.6015625, 3.1572265625, 3.712890625, 4.2685546875, 4.82421875, 5.3798828125, 5.935546875, 6.4912109375, 7.046875, 7.6025390625, 8.158203125, 8.7138671875, 9.26953125, 9.8251953125, 10.380859375, 10.9365234375, 11.4921875, 12.0478515625, 12.603515625, 13.1591796875, 13.71484375, 14.2705078125, 14.826171875, 15.3818359375, 15.9375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 5.0, 9.0, 8.0, 22.0, 44.0, 88.0, 148.0, 198.0, 200.0, 127.0, 63.0, 30.0, 21.0, 12.0, 6.0, 6.0, 4.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-114.9828872680664, -110.6606674194336, -106.33843994140625, -102.01622009277344, -97.69400024414062, -93.37178039550781, -89.049560546875, -84.72733306884766, -80.40511322021484, -76.08289337158203, -71.76066589355469, -67.43844604492188, -63.11622619628906, -58.79400634765625, -54.47178268432617, -50.149559020996094, -45.82733917236328, -41.50511932373047, -37.18289566040039, -32.86067199707031, -28.5384521484375, -24.216230392456055, -19.89400863647461, -15.571786880493164, -11.249565124511719, -6.927343368530273, -2.605121612548828, 1.7171001434326172, 6.0393218994140625, 10.361543655395508, 14.683765411376953, 19.0059871673584, 23.328216552734375, 27.65043830871582, 31.972660064697266, 36.294883728027344, 40.617103576660156, 44.93932342529297, 49.26154708862305, 53.583770751953125, 57.90599060058594, 62.22821044921875, 66.55043029785156, 70.8726577758789, 75.19487762451172, 79.51709747314453, 83.83932495117188, 88.16154479980469, 92.4837646484375, 96.80598449707031, 101.12820434570312, 105.45043182373047, 109.77265167236328, 114.0948715209961, 118.41709899902344, 122.73931884765625, 127.06153869628906, 131.38375854492188, 135.7059783935547, 140.0281982421875, 144.35043334960938, 148.6726531982422, 152.994873046875, 157.3170928955078, 161.63931274414062]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 2.0, 6.0, 4.0, 10.0, 22.0, 15.0, 15.0, 15.0, 25.0, 19.0, 36.0, 26.0, 45.0, 47.0, 39.0, 52.0, 56.0, 54.0, 58.0, 55.0, 55.0, 38.0, 41.0, 46.0, 37.0, 36.0, 29.0, 27.0, 17.0, 15.0, 12.0, 12.0, 7.0, 12.0, 3.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.789066314697266, -56.751033782958984, -54.7130012512207, -52.674964904785156, -50.636932373046875, -48.598899841308594, -46.56086730957031, -44.52283477783203, -42.48480224609375, -40.44676971435547, -38.40873718261719, -36.370704650878906, -34.33266830444336, -32.29463577270508, -30.256603240966797, -28.218570709228516, -26.18053436279297, -24.142501831054688, -22.104467391967773, -20.066434860229492, -18.028400421142578, -15.990367889404297, -13.952335357666016, -11.914301872253418, -9.87626838684082, -7.838234901428223, -5.800201892852783, -3.7621688842773438, -1.724135398864746, 0.31389808654785156, 2.351930618286133, 4.3899641036987305, 6.428001403808594, 8.466034889221191, 10.504068374633789, 12.54210090637207, 14.580134391784668, 16.618167877197266, 18.656200408935547, 20.694232940673828, 22.732267379760742, 24.770299911499023, 26.808334350585938, 28.84636688232422, 30.8843994140625, 32.92243194580078, 34.96046447753906, 36.99850082397461, 39.03653335571289, 41.07456588745117, 43.11259841918945, 45.150634765625, 47.18866729736328, 49.22669982910156, 51.264732360839844, 53.302764892578125, 55.340797424316406, 57.37882995605469, 59.41686248779297, 61.45489501953125, 63.4929313659668, 65.53096008300781, 67.56900024414062, 69.6070327758789, 71.64506530761719]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 7.0, 13.0, 7.0, 19.0, 30.0, 49.0, 77.0, 106.0, 177.0, 316.0, 556.0, 1010.0, 1814.0, 3558.0, 7497.0, 17313.0, 43253.0, 114547.0, 296849.0, 335780.0, 136557.0, 51568.0, 20203.0, 8607.0, 3993.0, 1992.0, 1138.0, 609.0, 378.0, 224.0, 126.0, 62.0, 42.0, 32.0, 18.0, 16.0, 6.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.9453125, -9.653564453125, -9.36181640625, -9.070068359375, -8.7783203125, -8.486572265625, -8.19482421875, -7.903076171875, -7.611328125, -7.319580078125, -7.02783203125, -6.736083984375, -6.4443359375, -6.152587890625, -5.86083984375, -5.569091796875, -5.27734375, -4.985595703125, -4.69384765625, -4.402099609375, -4.1103515625, -3.818603515625, -3.52685546875, -3.235107421875, -2.943359375, -2.651611328125, -2.35986328125, -2.068115234375, -1.7763671875, -1.484619140625, -1.19287109375, -0.901123046875, -0.609375, -0.317626953125, -0.02587890625, 0.265869140625, 0.5576171875, 0.849365234375, 1.14111328125, 1.432861328125, 1.724609375, 2.016357421875, 2.30810546875, 2.599853515625, 2.8916015625, 3.183349609375, 3.47509765625, 3.766845703125, 4.05859375, 4.350341796875, 4.64208984375, 4.933837890625, 5.2255859375, 5.517333984375, 5.80908203125, 6.100830078125, 6.392578125, 6.684326171875, 6.97607421875, 7.267822265625, 7.5595703125, 7.851318359375, 8.14306640625, 8.434814453125, 8.7265625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 8.0, 2.0, 3.0, 6.0, 6.0, 15.0, 13.0, 12.0, 17.0, 31.0, 23.0, 26.0, 37.0, 34.0, 41.0, 48.0, 35.0, 39.0, 49.0, 46.0, 38.0, 57.0, 42.0, 52.0, 62.0, 42.0, 37.0, 29.0, 21.0, 28.0, 13.0, 22.0, 17.0, 14.0, 6.0, 7.0, 9.0, 8.0, 6.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-5.80859375, -5.651611328125, -5.49462890625, -5.337646484375, -5.1806640625, -5.023681640625, -4.86669921875, -4.709716796875, -4.552734375, -4.395751953125, -4.23876953125, -4.081787109375, -3.9248046875, -3.767822265625, -3.61083984375, -3.453857421875, -3.296875, -3.139892578125, -2.98291015625, -2.825927734375, -2.6689453125, -2.511962890625, -2.35498046875, -2.197998046875, -2.041015625, -1.884033203125, -1.72705078125, -1.570068359375, -1.4130859375, -1.256103515625, -1.09912109375, -0.942138671875, -0.78515625, -0.628173828125, -0.47119140625, -0.314208984375, -0.1572265625, -0.000244140625, 0.15673828125, 0.313720703125, 0.470703125, 0.627685546875, 0.78466796875, 0.941650390625, 1.0986328125, 1.255615234375, 1.41259765625, 1.569580078125, 1.7265625, 1.883544921875, 2.04052734375, 2.197509765625, 2.3544921875, 2.511474609375, 2.66845703125, 2.825439453125, 2.982421875, 3.139404296875, 3.29638671875, 3.453369140625, 3.6103515625, 3.767333984375, 3.92431640625, 4.081298828125, 4.23828125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 7.0, 6.0, 11.0, 19.0, 20.0, 26.0, 51.0, 64.0, 131.0, 191.0, 361.0, 642.0, 1292.0, 3310.0, 12283.0, 82704.0, 713906.0, 201570.0, 23326.0, 5035.0, 1709.0, 833.0, 453.0, 256.0, 132.0, 75.0, 52.0, 26.0, 25.0, 9.0, 11.0, 5.0, 6.0, 7.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.71875, -17.10107421875, -16.4833984375, -15.86572265625, -15.248046875, -14.63037109375, -14.0126953125, -13.39501953125, -12.77734375, -12.15966796875, -11.5419921875, -10.92431640625, -10.306640625, -9.68896484375, -9.0712890625, -8.45361328125, -7.8359375, -7.21826171875, -6.6005859375, -5.98291015625, -5.365234375, -4.74755859375, -4.1298828125, -3.51220703125, -2.89453125, -2.27685546875, -1.6591796875, -1.04150390625, -0.423828125, 0.19384765625, 0.8115234375, 1.42919921875, 2.046875, 2.66455078125, 3.2822265625, 3.89990234375, 4.517578125, 5.13525390625, 5.7529296875, 6.37060546875, 6.98828125, 7.60595703125, 8.2236328125, 8.84130859375, 9.458984375, 10.07666015625, 10.6943359375, 11.31201171875, 11.9296875, 12.54736328125, 13.1650390625, 13.78271484375, 14.400390625, 15.01806640625, 15.6357421875, 16.25341796875, 16.87109375, 17.48876953125, 18.1064453125, 18.72412109375, 19.341796875, 19.95947265625, 20.5771484375, 21.19482421875, 21.8125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 2.0, 5.0, 1.0, 8.0, 4.0, 7.0, 9.0, 11.0, 21.0, 34.0, 20.0, 26.0, 39.0, 41.0, 38.0, 44.0, 44.0, 41.0, 56.0, 53.0, 51.0, 37.0, 43.0, 51.0, 42.0, 42.0, 29.0, 34.0, 37.0, 20.0, 17.0, 22.0, 22.0, 18.0, 5.0, 9.0, 8.0, 6.0, 7.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.109375, -17.431396484375, -16.75341796875, -16.075439453125, -15.3974609375, -14.719482421875, -14.04150390625, -13.363525390625, -12.685546875, -12.007568359375, -11.32958984375, -10.651611328125, -9.9736328125, -9.295654296875, -8.61767578125, -7.939697265625, -7.26171875, -6.583740234375, -5.90576171875, -5.227783203125, -4.5498046875, -3.871826171875, -3.19384765625, -2.515869140625, -1.837890625, -1.159912109375, -0.48193359375, 0.196044921875, 0.8740234375, 1.552001953125, 2.22998046875, 2.907958984375, 3.5859375, 4.263916015625, 4.94189453125, 5.619873046875, 6.2978515625, 6.975830078125, 7.65380859375, 8.331787109375, 9.009765625, 9.687744140625, 10.36572265625, 11.043701171875, 11.7216796875, 12.399658203125, 13.07763671875, 13.755615234375, 14.43359375, 15.111572265625, 15.78955078125, 16.467529296875, 17.1455078125, 17.823486328125, 18.50146484375, 19.179443359375, 19.857421875, 20.535400390625, 21.21337890625, 21.891357421875, 22.5693359375, 23.247314453125, 23.92529296875, 24.603271484375, 25.28125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 1.0, 6.0, 6.0, 4.0, 12.0, 10.0, 13.0, 35.0, 54.0, 79.0, 115.0, 241.0, 527.0, 1319.0, 4564.0, 29646.0, 772191.0, 221815.0, 13422.0, 2762.0, 894.0, 366.0, 199.0, 91.0, 51.0, 38.0, 30.0, 15.0, 12.0, 15.0, 7.0, 8.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.96875, -8.66796875, -8.3671875, -8.06640625, -7.765625, -7.46484375, -7.1640625, -6.86328125, -6.5625, -6.26171875, -5.9609375, -5.66015625, -5.359375, -5.05859375, -4.7578125, -4.45703125, -4.15625, -3.85546875, -3.5546875, -3.25390625, -2.953125, -2.65234375, -2.3515625, -2.05078125, -1.75, -1.44921875, -1.1484375, -0.84765625, -0.546875, -0.24609375, 0.0546875, 0.35546875, 0.65625, 0.95703125, 1.2578125, 1.55859375, 1.859375, 2.16015625, 2.4609375, 2.76171875, 3.0625, 3.36328125, 3.6640625, 3.96484375, 4.265625, 4.56640625, 4.8671875, 5.16796875, 5.46875, 5.76953125, 6.0703125, 6.37109375, 6.671875, 6.97265625, 7.2734375, 7.57421875, 7.875, 8.17578125, 8.4765625, 8.77734375, 9.078125, 9.37890625, 9.6796875, 9.98046875, 10.28125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 8.0, 4.0, 7.0, 11.0, 17.0, 13.0, 28.0, 40.0, 42.0, 52.0, 82.0, 109.0, 130.0, 107.0, 104.0, 70.0, 46.0, 44.0, 18.0, 19.0, 17.0, 9.0, 5.0, 8.0, 5.0, 3.0, 2.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013637542724609375, -0.0013275966048240662, -0.0012914389371871948, -0.0012552812695503235, -0.0012191236019134521, -0.0011829659342765808, -0.0011468082666397095, -0.0011106505990028381, -0.0010744929313659668, -0.0010383352637290955, -0.0010021775960922241, -0.0009660199284553528, -0.0009298622608184814, -0.0008937045931816101, -0.0008575469255447388, -0.0008213892579078674, -0.0007852315902709961, -0.0007490739226341248, -0.0007129162549972534, -0.0006767585873603821, -0.0006406009197235107, -0.0006044432520866394, -0.0005682855844497681, -0.0005321279168128967, -0.0004959702491760254, -0.00045981258153915405, -0.0004236549139022827, -0.0003874972462654114, -0.00035133957862854004, -0.0003151819109916687, -0.00027902424335479736, -0.00024286657571792603, -0.0002067089080810547, -0.00017055124044418335, -0.000134393572807312, -9.823590517044067e-05, -6.207823753356934e-05, -2.5920569896697998e-05, 1.023709774017334e-05, 4.639476537704468e-05, 8.255243301391602e-05, 0.00011871010065078735, 0.0001548677682876587, 0.00019102543592453003, 0.00022718310356140137, 0.0002633407711982727, 0.00029949843883514404, 0.0003356561064720154, 0.0003718137741088867, 0.00040797144174575806, 0.0004441291093826294, 0.00048028677701950073, 0.0005164444446563721, 0.0005526021122932434, 0.0005887597799301147, 0.0006249174475669861, 0.0006610751152038574, 0.0006972327828407288, 0.0007333904504776001, 0.0007695481181144714, 0.0008057057857513428, 0.0008418634533882141, 0.0008780211210250854, 0.0009141787886619568, 0.0009503364562988281]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0, 6.0, 10.0, 15.0, 11.0, 18.0, 23.0, 46.0, 68.0, 124.0, 239.0, 471.0, 1236.0, 4068.0, 18809.0, 512764.0, 485606.0, 18710.0, 4058.0, 1218.0, 502.0, 215.0, 113.0, 62.0, 35.0, 29.0, 26.0, 18.0, 17.0, 9.0, 6.0, 2.0, 3.0, 3.0, 5.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-10.4765625, -10.1273193359375, -9.778076171875, -9.4288330078125, -9.07958984375, -8.7303466796875, -8.381103515625, -8.0318603515625, -7.6826171875, -7.3333740234375, -6.984130859375, -6.6348876953125, -6.28564453125, -5.9364013671875, -5.587158203125, -5.2379150390625, -4.888671875, -4.5394287109375, -4.190185546875, -3.8409423828125, -3.49169921875, -3.1424560546875, -2.793212890625, -2.4439697265625, -2.0947265625, -1.7454833984375, -1.396240234375, -1.0469970703125, -0.69775390625, -0.3485107421875, 0.000732421875, 0.3499755859375, 0.69921875, 1.0484619140625, 1.397705078125, 1.7469482421875, 2.09619140625, 2.4454345703125, 2.794677734375, 3.1439208984375, 3.4931640625, 3.8424072265625, 4.191650390625, 4.5408935546875, 4.89013671875, 5.2393798828125, 5.588623046875, 5.9378662109375, 6.287109375, 6.6363525390625, 6.985595703125, 7.3348388671875, 7.68408203125, 8.0333251953125, 8.382568359375, 8.7318115234375, 9.0810546875, 9.4302978515625, 9.779541015625, 10.1287841796875, 10.47802734375, 10.8272705078125, 11.176513671875, 11.5257568359375, 11.875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 1.0, 5.0, 6.0, 10.0, 10.0, 20.0, 20.0, 26.0, 32.0, 40.0, 55.0, 59.0, 87.0, 86.0, 97.0, 87.0, 79.0, 66.0, 53.0, 40.0, 23.0, 16.0, 27.0, 14.0, 13.0, 7.0, 6.0, 2.0, 7.0, 3.0, 2.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.87890625, -6.6656494140625, -6.452392578125, -6.2391357421875, -6.02587890625, -5.8126220703125, -5.599365234375, -5.3861083984375, -5.1728515625, -4.9595947265625, -4.746337890625, -4.5330810546875, -4.31982421875, -4.1065673828125, -3.893310546875, -3.6800537109375, -3.466796875, -3.2535400390625, -3.040283203125, -2.8270263671875, -2.61376953125, -2.4005126953125, -2.187255859375, -1.9739990234375, -1.7607421875, -1.5474853515625, -1.334228515625, -1.1209716796875, -0.90771484375, -0.6944580078125, -0.481201171875, -0.2679443359375, -0.0546875, 0.1585693359375, 0.371826171875, 0.5850830078125, 0.79833984375, 1.0115966796875, 1.224853515625, 1.4381103515625, 1.6513671875, 1.8646240234375, 2.077880859375, 2.2911376953125, 2.50439453125, 2.7176513671875, 2.930908203125, 3.1441650390625, 3.357421875, 3.5706787109375, 3.783935546875, 3.9971923828125, 4.21044921875, 4.4237060546875, 4.636962890625, 4.8502197265625, 5.0634765625, 5.2767333984375, 5.489990234375, 5.7032470703125, 5.91650390625, 6.1297607421875, 6.343017578125, 6.5562744140625, 6.76953125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 10.0, 37.0, 274.0, 524.0, 119.0, 29.0, 11.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-571.5399780273438, -559.1664428710938, -546.79296875, -534.41943359375, -522.0458984375, -509.6723937988281, -497.2988586425781, -484.92535400390625, -472.55181884765625, -460.1783142089844, -447.8047790527344, -435.4312744140625, -423.0577392578125, -410.6842346191406, -398.3106994628906, -385.93719482421875, -373.56365966796875, -361.1901550292969, -348.8166198730469, -336.443115234375, -324.069580078125, -311.6960754394531, -299.3225402832031, -286.94903564453125, -274.5755310058594, -262.2020263671875, -249.8284912109375, -237.45497131347656, -225.08145141601562, -212.7079315185547, -200.33441162109375, -187.96090698242188, -175.58737182617188, -163.21385192871094, -150.84033203125, -138.46681213378906, -126.09329223632812, -113.71977233886719, -101.34626007080078, -88.97274017333984, -76.5992202758789, -64.22570037841797, -51.85218048095703, -39.47866439819336, -27.105144500732422, -14.731624603271484, -2.3581085205078125, 10.015411376953125, 22.388931274414062, 34.762451171875, 47.13597106933594, 59.50948715209961, 71.88301086425781, 84.25653076171875, 96.63004302978516, 109.0035629272461, 121.37708282470703, 133.75059509277344, 146.12411499023438, 158.4976348876953, 170.87115478515625, 183.2446746826172, 195.61819458007812, 207.99171447753906, 220.365234375]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 5.0, 7.0, 5.0, 9.0, 11.0, 11.0, 10.0, 18.0, 13.0, 21.0, 39.0, 26.0, 25.0, 25.0, 37.0, 48.0, 54.0, 47.0, 46.0, 53.0, 56.0, 58.0, 47.0, 41.0, 27.0, 50.0, 21.0, 36.0, 30.0, 19.0, 16.0, 19.0, 15.0, 15.0, 12.0, 9.0, 5.0, 3.0, 6.0, 4.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-74.9045639038086, -72.42153930664062, -69.93852233886719, -67.45549774169922, -64.97247314453125, -62.48945617675781, -60.006431579589844, -57.52341079711914, -55.04039001464844, -52.557369232177734, -50.07434844970703, -47.59132385253906, -45.10830307006836, -42.625282287597656, -40.14225769042969, -37.659236907958984, -35.17621612548828, -32.69319534301758, -30.210172653198242, -27.727149963378906, -25.244129180908203, -22.7611083984375, -20.278085708618164, -17.795063018798828, -15.312042236328125, -12.829020500183105, -10.345998764038086, -7.862977027893066, -5.379955291748047, -2.8969335556030273, -0.4139118194580078, 2.069110870361328, 4.5521392822265625, 7.035161018371582, 9.518182754516602, 12.001204490661621, 14.48422622680664, 16.967247009277344, 19.45026969909668, 21.933292388916016, 24.41631317138672, 26.899333953857422, 29.382356643676758, 31.865379333496094, 34.3484001159668, 36.8314208984375, 39.31444549560547, 41.79746627807617, 44.280487060546875, 46.76350784301758, 49.24652862548828, 51.72955322265625, 54.21257400512695, 56.695594787597656, 59.178619384765625, 61.66164016723633, 64.14466094970703, 66.627685546875, 69.11070251464844, 71.5937271118164, 74.07675170898438, 76.55976867675781, 79.04279327392578, 81.52581787109375, 84.00883483886719]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 5.0, 6.0, 11.0, 14.0, 11.0, 17.0, 24.0, 38.0, 40.0, 70.0, 144.0, 316.0, 698.0, 2379.0, 11548.0, 161060.0, 3971409.0, 38552.0, 5458.0, 1423.0, 466.0, 217.0, 116.0, 86.0, 53.0, 28.0, 19.0, 20.0, 10.0, 8.0, 5.0, 8.0, 7.0, 4.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-24.078125, -23.3759765625, -22.673828125, -21.9716796875, -21.26953125, -20.5673828125, -19.865234375, -19.1630859375, -18.4609375, -17.7587890625, -17.056640625, -16.3544921875, -15.65234375, -14.9501953125, -14.248046875, -13.5458984375, -12.84375, -12.1416015625, -11.439453125, -10.7373046875, -10.03515625, -9.3330078125, -8.630859375, -7.9287109375, -7.2265625, -6.5244140625, -5.822265625, -5.1201171875, -4.41796875, -3.7158203125, -3.013671875, -2.3115234375, -1.609375, -0.9072265625, -0.205078125, 0.4970703125, 1.19921875, 1.9013671875, 2.603515625, 3.3056640625, 4.0078125, 4.7099609375, 5.412109375, 6.1142578125, 6.81640625, 7.5185546875, 8.220703125, 8.9228515625, 9.625, 10.3271484375, 11.029296875, 11.7314453125, 12.43359375, 13.1357421875, 13.837890625, 14.5400390625, 15.2421875, 15.9443359375, 16.646484375, 17.3486328125, 18.05078125, 18.7529296875, 19.455078125, 20.1572265625, 20.859375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 5.0, 9.0, 5.0, 14.0, 16.0, 26.0, 27.0, 45.0, 65.0, 53.0, 71.0, 68.0, 74.0, 91.0, 70.0, 68.0, 60.0, 53.0, 48.0, 34.0, 26.0, 19.0, 28.0, 13.0, 9.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.671875, -4.4427490234375, -4.213623046875, -3.9844970703125, -3.75537109375, -3.5262451171875, -3.297119140625, -3.0679931640625, -2.8388671875, -2.6097412109375, -2.380615234375, -2.1514892578125, -1.92236328125, -1.6932373046875, -1.464111328125, -1.2349853515625, -1.005859375, -0.7767333984375, -0.547607421875, -0.3184814453125, -0.08935546875, 0.1397705078125, 0.368896484375, 0.5980224609375, 0.8271484375, 1.0562744140625, 1.285400390625, 1.5145263671875, 1.74365234375, 1.9727783203125, 2.201904296875, 2.4310302734375, 2.66015625, 2.8892822265625, 3.118408203125, 3.3475341796875, 3.57666015625, 3.8057861328125, 4.034912109375, 4.2640380859375, 4.4931640625, 4.7222900390625, 4.951416015625, 5.1805419921875, 5.40966796875, 5.6387939453125, 5.867919921875, 6.0970458984375, 6.326171875, 6.5552978515625, 6.784423828125, 7.0135498046875, 7.24267578125, 7.4718017578125, 7.700927734375, 7.9300537109375, 8.1591796875, 8.3883056640625, 8.617431640625, 8.8465576171875, 9.07568359375, 9.3048095703125, 9.533935546875, 9.7630615234375, 9.9921875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 1.0, 5.0, 6.0, 23.0, 30.0, 48.0, 96.0, 204.0, 515.0, 1731.0, 8629.0, 65362.0, 3927009.0, 170838.0, 15574.0, 2961.0, 744.0, 270.0, 113.0, 52.0, 32.0, 13.0, 14.0, 5.0, 5.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-24.6875, -23.975341796875, -23.26318359375, -22.551025390625, -21.8388671875, -21.126708984375, -20.41455078125, -19.702392578125, -18.990234375, -18.278076171875, -17.56591796875, -16.853759765625, -16.1416015625, -15.429443359375, -14.71728515625, -14.005126953125, -13.29296875, -12.580810546875, -11.86865234375, -11.156494140625, -10.4443359375, -9.732177734375, -9.02001953125, -8.307861328125, -7.595703125, -6.883544921875, -6.17138671875, -5.459228515625, -4.7470703125, -4.034912109375, -3.32275390625, -2.610595703125, -1.8984375, -1.186279296875, -0.47412109375, 0.238037109375, 0.9501953125, 1.662353515625, 2.37451171875, 3.086669921875, 3.798828125, 4.510986328125, 5.22314453125, 5.935302734375, 6.6474609375, 7.359619140625, 8.07177734375, 8.783935546875, 9.49609375, 10.208251953125, 10.92041015625, 11.632568359375, 12.3447265625, 13.056884765625, 13.76904296875, 14.481201171875, 15.193359375, 15.905517578125, 16.61767578125, 17.329833984375, 18.0419921875, 18.754150390625, 19.46630859375, 20.178466796875, 20.890625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 5.0, 6.0, 6.0, 8.0, 7.0, 12.0, 20.0, 15.0, 30.0, 46.0, 62.0, 105.0, 263.0, 1015.0, 1671.0, 409.0, 163.0, 57.0, 49.0, 38.0, 13.0, 12.0, 14.0, 14.0, 11.0, 7.0, 5.0, 5.0, 3.0, 3.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-16.59375, -16.17041015625, -15.7470703125, -15.32373046875, -14.900390625, -14.47705078125, -14.0537109375, -13.63037109375, -13.20703125, -12.78369140625, -12.3603515625, -11.93701171875, -11.513671875, -11.09033203125, -10.6669921875, -10.24365234375, -9.8203125, -9.39697265625, -8.9736328125, -8.55029296875, -8.126953125, -7.70361328125, -7.2802734375, -6.85693359375, -6.43359375, -6.01025390625, -5.5869140625, -5.16357421875, -4.740234375, -4.31689453125, -3.8935546875, -3.47021484375, -3.046875, -2.62353515625, -2.2001953125, -1.77685546875, -1.353515625, -0.93017578125, -0.5068359375, -0.08349609375, 0.33984375, 0.76318359375, 1.1865234375, 1.60986328125, 2.033203125, 2.45654296875, 2.8798828125, 3.30322265625, 3.7265625, 4.14990234375, 4.5732421875, 4.99658203125, 5.419921875, 5.84326171875, 6.2666015625, 6.68994140625, 7.11328125, 7.53662109375, 7.9599609375, 8.38330078125, 8.806640625, 9.22998046875, 9.6533203125, 10.07666015625, 10.5]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 3.0, 12.0, 22.0, 58.0, 109.0, 237.0, 260.0, 140.0, 73.0, 34.0, 18.0, 10.0, 9.0, 5.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-112.82405090332031, -109.06523895263672, -105.30642700195312, -101.54762268066406, -97.78881072998047, -94.02999877929688, -90.27118682861328, -86.51237487792969, -82.75357055664062, -78.99475860595703, -75.23594665527344, -71.47714233398438, -67.71833038330078, -63.95951843261719, -60.200706481933594, -56.44189453125, -52.683082580566406, -48.92427062988281, -45.165462493896484, -41.40665054321289, -37.64784240722656, -33.88903045654297, -30.130218505859375, -26.371408462524414, -22.612598419189453, -18.853788375854492, -15.094977378845215, -11.336166381835938, -7.577356338500977, -3.8185462951660156, -0.059734344482421875, 3.699075698852539, 7.4578857421875, 11.216695785522461, 14.975506782531738, 18.734317779541016, 22.493127822875977, 26.251937866210938, 30.01074981689453, 33.769561767578125, 37.52836990356445, 41.28718185424805, 45.045989990234375, 48.80480194091797, 52.56361389160156, 56.32242202758789, 60.081233978271484, 63.84004211425781, 67.5988540649414, 71.357666015625, 75.1164779663086, 78.87528991699219, 82.63409423828125, 86.39290618896484, 90.15171813964844, 93.91053009033203, 97.66934204101562, 101.42815399169922, 105.18696594238281, 108.94577026367188, 112.70458221435547, 116.46339416503906, 120.22220611572266, 123.98101806640625, 127.73982238769531]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 5.0, 5.0, 13.0, 11.0, 7.0, 9.0, 15.0, 14.0, 23.0, 14.0, 29.0, 21.0, 31.0, 32.0, 32.0, 42.0, 37.0, 45.0, 40.0, 42.0, 48.0, 41.0, 54.0, 45.0, 40.0, 27.0, 39.0, 28.0, 28.0, 22.0, 26.0, 20.0, 23.0, 18.0, 16.0, 18.0, 9.0, 8.0, 6.0, 4.0, 2.0, 7.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-43.01543045043945, -41.7248420715332, -40.43425750732422, -39.14366912841797, -37.853084564208984, -36.562496185302734, -35.27191162109375, -33.9813232421875, -32.69073486328125, -31.400148391723633, -30.109561920166016, -28.8189754486084, -27.52838897705078, -26.23780059814453, -24.947214126586914, -23.656627655029297, -22.366043090820312, -21.075456619262695, -19.784870147705078, -18.49428367614746, -17.203697204589844, -15.91310977935791, -14.622522354125977, -13.33193588256836, -12.041349411010742, -10.750762939453125, -9.460176467895508, -8.169589042663574, -6.879002571105957, -5.58841609954834, -4.2978291511535645, -3.007242202758789, -1.7166519165039062, -0.42606520652770996, 0.8645215034484863, 2.1551082134246826, 3.445694923400879, 4.736281394958496, 6.0268683433532715, 7.317455291748047, 8.608041763305664, 9.898628234863281, 11.189214706420898, 12.479802131652832, 13.77038860321045, 15.060975074768066, 16.3515625, 17.642148971557617, 18.932735443115234, 20.22332191467285, 21.51390838623047, 22.804494857788086, 24.095081329345703, 25.385669708251953, 26.67625617980957, 27.966842651367188, 29.257429122924805, 30.548015594482422, 31.83860206604004, 33.129188537597656, 34.419776916503906, 35.71036148071289, 37.00094985961914, 38.291534423828125, 39.582122802734375]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 4.0, 5.0, 3.0, 4.0, 11.0, 14.0, 14.0, 43.0, 59.0, 111.0, 190.0, 331.0, 593.0, 1176.0, 2500.0, 5828.0, 14371.0, 38200.0, 108679.0, 304945.0, 359376.0, 135121.0, 46655.0, 17439.0, 6906.0, 3009.0, 1426.0, 714.0, 350.0, 191.0, 129.0, 50.0, 36.0, 25.0, 19.0, 13.0, 5.0, 8.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.1171875, -10.7708740234375, -10.424560546875, -10.0782470703125, -9.73193359375, -9.3856201171875, -9.039306640625, -8.6929931640625, -8.3466796875, -8.0003662109375, -7.654052734375, -7.3077392578125, -6.96142578125, -6.6151123046875, -6.268798828125, -5.9224853515625, -5.576171875, -5.2298583984375, -4.883544921875, -4.5372314453125, -4.19091796875, -3.8446044921875, -3.498291015625, -3.1519775390625, -2.8056640625, -2.4593505859375, -2.113037109375, -1.7667236328125, -1.42041015625, -1.0740966796875, -0.727783203125, -0.3814697265625, -0.03515625, 0.3111572265625, 0.657470703125, 1.0037841796875, 1.35009765625, 1.6964111328125, 2.042724609375, 2.3890380859375, 2.7353515625, 3.0816650390625, 3.427978515625, 3.7742919921875, 4.12060546875, 4.4669189453125, 4.813232421875, 5.1595458984375, 5.505859375, 5.8521728515625, 6.198486328125, 6.5447998046875, 6.89111328125, 7.2374267578125, 7.583740234375, 7.9300537109375, 8.2763671875, 8.6226806640625, 8.968994140625, 9.3153076171875, 9.66162109375, 10.0079345703125, 10.354248046875, 10.7005615234375, 11.046875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 3.0, 6.0, 4.0, 8.0, 8.0, 21.0, 17.0, 14.0, 22.0, 28.0, 37.0, 34.0, 41.0, 36.0, 38.0, 51.0, 40.0, 55.0, 49.0, 45.0, 46.0, 39.0, 50.0, 48.0, 34.0, 29.0, 30.0, 28.0, 26.0, 18.0, 13.0, 21.0, 20.0, 11.0, 8.0, 8.0, 7.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.8046875, -4.658447265625, -4.51220703125, -4.365966796875, -4.2197265625, -4.073486328125, -3.92724609375, -3.781005859375, -3.634765625, -3.488525390625, -3.34228515625, -3.196044921875, -3.0498046875, -2.903564453125, -2.75732421875, -2.611083984375, -2.46484375, -2.318603515625, -2.17236328125, -2.026123046875, -1.8798828125, -1.733642578125, -1.58740234375, -1.441162109375, -1.294921875, -1.148681640625, -1.00244140625, -0.856201171875, -0.7099609375, -0.563720703125, -0.41748046875, -0.271240234375, -0.125, 0.021240234375, 0.16748046875, 0.313720703125, 0.4599609375, 0.606201171875, 0.75244140625, 0.898681640625, 1.044921875, 1.191162109375, 1.33740234375, 1.483642578125, 1.6298828125, 1.776123046875, 1.92236328125, 2.068603515625, 2.21484375, 2.361083984375, 2.50732421875, 2.653564453125, 2.7998046875, 2.946044921875, 3.09228515625, 3.238525390625, 3.384765625, 3.531005859375, 3.67724609375, 3.823486328125, 3.9697265625, 4.115966796875, 4.26220703125, 4.408447265625, 4.5546875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 7.0, 2.0, 8.0, 13.0, 22.0, 11.0, 42.0, 51.0, 82.0, 124.0, 212.0, 519.0, 1087.0, 3514.0, 15861.0, 119728.0, 739656.0, 142887.0, 18573.0, 3777.0, 1192.0, 550.0, 255.0, 115.0, 91.0, 56.0, 28.0, 24.0, 15.0, 15.0, 10.0, 13.0, 4.0, 4.0, 5.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.3125, -21.647216796875, -20.98193359375, -20.316650390625, -19.6513671875, -18.986083984375, -18.32080078125, -17.655517578125, -16.990234375, -16.324951171875, -15.65966796875, -14.994384765625, -14.3291015625, -13.663818359375, -12.99853515625, -12.333251953125, -11.66796875, -11.002685546875, -10.33740234375, -9.672119140625, -9.0068359375, -8.341552734375, -7.67626953125, -7.010986328125, -6.345703125, -5.680419921875, -5.01513671875, -4.349853515625, -3.6845703125, -3.019287109375, -2.35400390625, -1.688720703125, -1.0234375, -0.358154296875, 0.30712890625, 0.972412109375, 1.6376953125, 2.302978515625, 2.96826171875, 3.633544921875, 4.298828125, 4.964111328125, 5.62939453125, 6.294677734375, 6.9599609375, 7.625244140625, 8.29052734375, 8.955810546875, 9.62109375, 10.286376953125, 10.95166015625, 11.616943359375, 12.2822265625, 12.947509765625, 13.61279296875, 14.278076171875, 14.943359375, 15.608642578125, 16.27392578125, 16.939208984375, 17.6044921875, 18.269775390625, 18.93505859375, 19.600341796875, 20.265625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 7.0, 6.0, 4.0, 4.0, 9.0, 11.0, 15.0, 18.0, 16.0, 18.0, 16.0, 28.0, 23.0, 46.0, 35.0, 39.0, 46.0, 51.0, 55.0, 45.0, 53.0, 46.0, 46.0, 48.0, 61.0, 35.0, 38.0, 27.0, 29.0, 31.0, 17.0, 15.0, 16.0, 10.0, 10.0, 6.0, 8.0, 3.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-16.328125, -15.781005859375, -15.23388671875, -14.686767578125, -14.1396484375, -13.592529296875, -13.04541015625, -12.498291015625, -11.951171875, -11.404052734375, -10.85693359375, -10.309814453125, -9.7626953125, -9.215576171875, -8.66845703125, -8.121337890625, -7.57421875, -7.027099609375, -6.47998046875, -5.932861328125, -5.3857421875, -4.838623046875, -4.29150390625, -3.744384765625, -3.197265625, -2.650146484375, -2.10302734375, -1.555908203125, -1.0087890625, -0.461669921875, 0.08544921875, 0.632568359375, 1.1796875, 1.726806640625, 2.27392578125, 2.821044921875, 3.3681640625, 3.915283203125, 4.46240234375, 5.009521484375, 5.556640625, 6.103759765625, 6.65087890625, 7.197998046875, 7.7451171875, 8.292236328125, 8.83935546875, 9.386474609375, 9.93359375, 10.480712890625, 11.02783203125, 11.574951171875, 12.1220703125, 12.669189453125, 13.21630859375, 13.763427734375, 14.310546875, 14.857666015625, 15.40478515625, 15.951904296875, 16.4990234375, 17.046142578125, 17.59326171875, 18.140380859375, 18.6875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 5.0, 12.0, 13.0, 18.0, 18.0, 21.0, 50.0, 72.0, 147.0, 306.0, 770.0, 2635.0, 18352.0, 739583.0, 273229.0, 10356.0, 1867.0, 559.0, 243.0, 122.0, 66.0, 32.0, 23.0, 14.0, 13.0, 6.0, 5.0, 4.0, 3.0, 5.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.984375, -8.623291015625, -8.26220703125, -7.901123046875, -7.5400390625, -7.178955078125, -6.81787109375, -6.456787109375, -6.095703125, -5.734619140625, -5.37353515625, -5.012451171875, -4.6513671875, -4.290283203125, -3.92919921875, -3.568115234375, -3.20703125, -2.845947265625, -2.48486328125, -2.123779296875, -1.7626953125, -1.401611328125, -1.04052734375, -0.679443359375, -0.318359375, 0.042724609375, 0.40380859375, 0.764892578125, 1.1259765625, 1.487060546875, 1.84814453125, 2.209228515625, 2.5703125, 2.931396484375, 3.29248046875, 3.653564453125, 4.0146484375, 4.375732421875, 4.73681640625, 5.097900390625, 5.458984375, 5.820068359375, 6.18115234375, 6.542236328125, 6.9033203125, 7.264404296875, 7.62548828125, 7.986572265625, 8.34765625, 8.708740234375, 9.06982421875, 9.430908203125, 9.7919921875, 10.153076171875, 10.51416015625, 10.875244140625, 11.236328125, 11.597412109375, 11.95849609375, 12.319580078125, 12.6806640625, 13.041748046875, 13.40283203125, 13.763916015625, 14.125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 8.0, 11.0, 15.0, 18.0, 46.0, 80.0, 88.0, 174.0, 219.0, 133.0, 93.0, 52.0, 31.0, 19.0, 17.0, 5.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002613067626953125, -0.0025446414947509766, -0.002476215362548828, -0.0024077892303466797, -0.0023393630981445312, -0.002270936965942383, -0.0022025108337402344, -0.002134084701538086, -0.0020656585693359375, -0.001997232437133789, -0.0019288063049316406, -0.0018603801727294922, -0.0017919540405273438, -0.0017235279083251953, -0.0016551017761230469, -0.0015866756439208984, -0.00151824951171875, -0.0014498233795166016, -0.0013813972473144531, -0.0013129711151123047, -0.0012445449829101562, -0.0011761188507080078, -0.0011076927185058594, -0.001039266586303711, -0.0009708404541015625, -0.0009024143218994141, -0.0008339881896972656, -0.0007655620574951172, -0.0006971359252929688, -0.0006287097930908203, -0.0005602836608886719, -0.0004918575286865234, -0.000423431396484375, -0.00035500526428222656, -0.0002865791320800781, -0.0002181529998779297, -0.00014972686767578125, -8.130073547363281e-05, -1.2874603271484375e-05, 5.555152893066406e-05, 0.0001239776611328125, 0.00019240379333496094, 0.0002608299255371094, 0.0003292560577392578, 0.00039768218994140625, 0.0004661083221435547, 0.0005345344543457031, 0.0006029605865478516, 0.00067138671875, 0.0007398128509521484, 0.0008082389831542969, 0.0008766651153564453, 0.0009450912475585938, 0.0010135173797607422, 0.0010819435119628906, 0.001150369644165039, 0.0012187957763671875, 0.001287221908569336, 0.0013556480407714844, 0.0014240741729736328, 0.0014925003051757812, 0.0015609264373779297, 0.0016293525695800781, 0.0016977787017822266, 0.001766204833984375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 12.0, 10.0, 13.0, 40.0, 60.0, 101.0, 193.0, 412.0, 1043.0, 3690.0, 25619.0, 618297.0, 374796.0, 19388.0, 3145.0, 941.0, 385.0, 194.0, 83.0, 47.0, 27.0, 16.0, 6.0, 10.0, 10.0, 5.0, 4.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-10.984375, -10.7093505859375, -10.434326171875, -10.1593017578125, -9.88427734375, -9.6092529296875, -9.334228515625, -9.0592041015625, -8.7841796875, -8.5091552734375, -8.234130859375, -7.9591064453125, -7.68408203125, -7.4090576171875, -7.134033203125, -6.8590087890625, -6.583984375, -6.3089599609375, -6.033935546875, -5.7589111328125, -5.48388671875, -5.2088623046875, -4.933837890625, -4.6588134765625, -4.3837890625, -4.1087646484375, -3.833740234375, -3.5587158203125, -3.28369140625, -3.0086669921875, -2.733642578125, -2.4586181640625, -2.18359375, -1.9085693359375, -1.633544921875, -1.3585205078125, -1.08349609375, -0.8084716796875, -0.533447265625, -0.2584228515625, 0.0166015625, 0.2916259765625, 0.566650390625, 0.8416748046875, 1.11669921875, 1.3917236328125, 1.666748046875, 1.9417724609375, 2.216796875, 2.4918212890625, 2.766845703125, 3.0418701171875, 3.31689453125, 3.5919189453125, 3.866943359375, 4.1419677734375, 4.4169921875, 4.6920166015625, 4.967041015625, 5.2420654296875, 5.51708984375, 5.7921142578125, 6.067138671875, 6.3421630859375, 6.6171875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 7.0, 6.0, 4.0, 7.0, 17.0, 26.0, 19.0, 43.0, 65.0, 97.0, 123.0, 131.0, 129.0, 98.0, 72.0, 51.0, 40.0, 26.0, 18.0, 5.0, 8.0, 2.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.1015625, -9.8258056640625, -9.550048828125, -9.2742919921875, -8.99853515625, -8.7227783203125, -8.447021484375, -8.1712646484375, -7.8955078125, -7.6197509765625, -7.343994140625, -7.0682373046875, -6.79248046875, -6.5167236328125, -6.240966796875, -5.9652099609375, -5.689453125, -5.4136962890625, -5.137939453125, -4.8621826171875, -4.58642578125, -4.3106689453125, -4.034912109375, -3.7591552734375, -3.4833984375, -3.2076416015625, -2.931884765625, -2.6561279296875, -2.38037109375, -2.1046142578125, -1.828857421875, -1.5531005859375, -1.27734375, -1.0015869140625, -0.725830078125, -0.4500732421875, -0.17431640625, 0.1014404296875, 0.377197265625, 0.6529541015625, 0.9287109375, 1.2044677734375, 1.480224609375, 1.7559814453125, 2.03173828125, 2.3074951171875, 2.583251953125, 2.8590087890625, 3.134765625, 3.4105224609375, 3.686279296875, 3.9620361328125, 4.23779296875, 4.5135498046875, 4.789306640625, 5.0650634765625, 5.3408203125, 5.6165771484375, 5.892333984375, 6.1680908203125, 6.44384765625, 6.7196044921875, 6.995361328125, 7.2711181640625, 7.546875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 5.0, 2.0, 7.0, 13.0, 23.0, 107.0, 239.0, 316.0, 164.0, 76.0, 34.0, 11.0, 6.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-169.85491943359375, -163.13082885742188, -156.40673828125, -149.68264770507812, -142.9585723876953, -136.23448181152344, -129.51039123535156, -122.78630065917969, -116.06221771240234, -109.33812713623047, -102.61404418945312, -95.88995361328125, -89.16586303710938, -82.44178009033203, -75.71768951416016, -68.99360656738281, -62.26951599121094, -55.54542922973633, -48.82134246826172, -42.097251892089844, -35.373165130615234, -28.649078369140625, -21.92498779296875, -15.20090103149414, -8.476814270019531, -1.7527265548706055, 4.97136116027832, 11.695449829101562, 18.419536590576172, 25.14362335205078, 31.867713928222656, 38.591800689697266, 45.315887451171875, 52.039974212646484, 58.764060974121094, 65.48815155029297, 72.21223449707031, 78.93632507324219, 85.66041564941406, 92.38450622558594, 99.10858917236328, 105.83267974853516, 112.5567626953125, 119.28085327148438, 126.00494384765625, 132.72903442382812, 139.453125, 146.1772003173828, 152.9012908935547, 159.62538146972656, 166.34947204589844, 173.07354736328125, 179.79763793945312, 186.521728515625, 193.24581909179688, 199.96990966796875, 206.69400024414062, 213.4180908203125, 220.14218139648438, 226.86627197265625, 233.59034729003906, 240.31443786621094, 247.0385284423828, 253.7626190185547, 260.4866943359375]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 3.0, 3.0, 4.0, 6.0, 12.0, 6.0, 10.0, 13.0, 17.0, 15.0, 22.0, 30.0, 25.0, 33.0, 25.0, 40.0, 34.0, 32.0, 27.0, 54.0, 52.0, 54.0, 54.0, 58.0, 42.0, 38.0, 25.0, 37.0, 22.0, 26.0, 20.0, 31.0, 19.0, 19.0, 17.0, 12.0, 9.0, 13.0, 12.0, 5.0, 4.0, 10.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-58.842262268066406, -56.85445785522461, -54.86664962768555, -52.87884521484375, -50.89104080200195, -48.903236389160156, -46.915428161621094, -44.9276237487793, -42.9398193359375, -40.9520149230957, -38.96420669555664, -36.976402282714844, -34.98859786987305, -33.00079345703125, -31.012985229492188, -29.02518081665039, -27.037372589111328, -25.0495662689209, -23.0617618560791, -21.073955535888672, -19.086151123046875, -17.098344802856445, -15.110538482666016, -13.122733116149902, -11.134927749633789, -9.147122383117676, -7.159316539764404, -5.171510696411133, -3.1837053298950195, -1.1958999633789062, 0.7919063568115234, 2.7797117233276367, 4.76751708984375, 6.755322456359863, 8.743127822875977, 10.730934143066406, 12.71873950958252, 14.706544876098633, 16.694351196289062, 18.68215560913086, 20.66996192932129, 22.65776824951172, 24.645572662353516, 26.633378982543945, 28.621185302734375, 30.608989715576172, 32.59679412841797, 34.58460235595703, 36.57240676879883, 38.560211181640625, 40.54801940917969, 42.535823822021484, 44.52362823486328, 46.511436462402344, 48.49924087524414, 50.48704528808594, 52.474853515625, 54.4626579284668, 56.45046615600586, 58.438270568847656, 60.42607498168945, 62.41387939453125, 64.40168762207031, 66.38949584960938, 68.3772964477539]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 4.0, 2.0, 9.0, 5.0, 9.0, 14.0, 27.0, 42.0, 45.0, 86.0, 130.0, 258.0, 423.0, 860.0, 1727.0, 3803.0, 10204.0, 34217.0, 202708.0, 3291668.0, 566757.0, 56181.0, 14907.0, 5390.0, 2264.0, 1086.0, 576.0, 314.0, 200.0, 139.0, 59.0, 43.0, 40.0, 22.0, 15.0, 11.0, 13.0, 4.0, 8.0, 6.0, 2.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-8.875, -8.585693359375, -8.29638671875, -8.007080078125, -7.7177734375, -7.428466796875, -7.13916015625, -6.849853515625, -6.560546875, -6.271240234375, -5.98193359375, -5.692626953125, -5.4033203125, -5.114013671875, -4.82470703125, -4.535400390625, -4.24609375, -3.956787109375, -3.66748046875, -3.378173828125, -3.0888671875, -2.799560546875, -2.51025390625, -2.220947265625, -1.931640625, -1.642333984375, -1.35302734375, -1.063720703125, -0.7744140625, -0.485107421875, -0.19580078125, 0.093505859375, 0.3828125, 0.672119140625, 0.96142578125, 1.250732421875, 1.5400390625, 1.829345703125, 2.11865234375, 2.407958984375, 2.697265625, 2.986572265625, 3.27587890625, 3.565185546875, 3.8544921875, 4.143798828125, 4.43310546875, 4.722412109375, 5.01171875, 5.301025390625, 5.59033203125, 5.879638671875, 6.1689453125, 6.458251953125, 6.74755859375, 7.036865234375, 7.326171875, 7.615478515625, 7.90478515625, 8.194091796875, 8.4833984375, 8.772705078125, 9.06201171875, 9.351318359375, 9.640625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 6.0, 1.0, 3.0, 6.0, 10.0, 9.0, 10.0, 18.0, 15.0, 24.0, 26.0, 31.0, 28.0, 41.0, 56.0, 42.0, 37.0, 42.0, 46.0, 48.0, 46.0, 45.0, 60.0, 45.0, 42.0, 40.0, 37.0, 23.0, 32.0, 22.0, 20.0, 17.0, 23.0, 13.0, 13.0, 7.0, 8.0, 6.0, 7.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.171875, -4.03802490234375, -3.9041748046875, -3.77032470703125, -3.636474609375, -3.50262451171875, -3.3687744140625, -3.23492431640625, -3.10107421875, -2.96722412109375, -2.8333740234375, -2.69952392578125, -2.565673828125, -2.43182373046875, -2.2979736328125, -2.16412353515625, -2.0302734375, -1.89642333984375, -1.7625732421875, -1.62872314453125, -1.494873046875, -1.36102294921875, -1.2271728515625, -1.09332275390625, -0.95947265625, -0.82562255859375, -0.6917724609375, -0.55792236328125, -0.424072265625, -0.29022216796875, -0.1563720703125, -0.02252197265625, 0.111328125, 0.24517822265625, 0.3790283203125, 0.51287841796875, 0.646728515625, 0.78057861328125, 0.9144287109375, 1.04827880859375, 1.18212890625, 1.31597900390625, 1.4498291015625, 1.58367919921875, 1.717529296875, 1.85137939453125, 1.9852294921875, 2.11907958984375, 2.2529296875, 2.38677978515625, 2.5206298828125, 2.65447998046875, 2.788330078125, 2.92218017578125, 3.0560302734375, 3.18988037109375, 3.32373046875, 3.45758056640625, 3.5914306640625, 3.72528076171875, 3.859130859375, 3.99298095703125, 4.1268310546875, 4.26068115234375, 4.39453125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 4.0, 3.0, 10.0, 8.0, 14.0, 35.0, 28.0, 91.0, 167.0, 407.0, 1142.0, 4367.0, 31229.0, 2000839.0, 2120961.0, 29494.0, 4017.0, 961.0, 259.0, 120.0, 54.0, 29.0, 19.0, 8.0, 8.0, 4.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-32.3125, -31.594482421875, -30.87646484375, -30.158447265625, -29.4404296875, -28.722412109375, -28.00439453125, -27.286376953125, -26.568359375, -25.850341796875, -25.13232421875, -24.414306640625, -23.6962890625, -22.978271484375, -22.26025390625, -21.542236328125, -20.82421875, -20.106201171875, -19.38818359375, -18.670166015625, -17.9521484375, -17.234130859375, -16.51611328125, -15.798095703125, -15.080078125, -14.362060546875, -13.64404296875, -12.926025390625, -12.2080078125, -11.489990234375, -10.77197265625, -10.053955078125, -9.3359375, -8.617919921875, -7.89990234375, -7.181884765625, -6.4638671875, -5.745849609375, -5.02783203125, -4.309814453125, -3.591796875, -2.873779296875, -2.15576171875, -1.437744140625, -0.7197265625, -0.001708984375, 0.71630859375, 1.434326171875, 2.15234375, 2.870361328125, 3.58837890625, 4.306396484375, 5.0244140625, 5.742431640625, 6.46044921875, 7.178466796875, 7.896484375, 8.614501953125, 9.33251953125, 10.050537109375, 10.7685546875, 11.486572265625, 12.20458984375, 12.922607421875, 13.640625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 0.0, 1.0, 4.0, 5.0, 9.0, 9.0, 15.0, 10.0, 27.0, 34.0, 40.0, 42.0, 80.0, 108.0, 163.0, 326.0, 758.0, 1215.0, 543.0, 246.0, 137.0, 89.0, 57.0, 38.0, 30.0, 23.0, 14.0, 10.0, 11.0, 7.0, 6.0, 4.0, 5.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-15.8359375, -15.452880859375, -15.06982421875, -14.686767578125, -14.3037109375, -13.920654296875, -13.53759765625, -13.154541015625, -12.771484375, -12.388427734375, -12.00537109375, -11.622314453125, -11.2392578125, -10.856201171875, -10.47314453125, -10.090087890625, -9.70703125, -9.323974609375, -8.94091796875, -8.557861328125, -8.1748046875, -7.791748046875, -7.40869140625, -7.025634765625, -6.642578125, -6.259521484375, -5.87646484375, -5.493408203125, -5.1103515625, -4.727294921875, -4.34423828125, -3.961181640625, -3.578125, -3.195068359375, -2.81201171875, -2.428955078125, -2.0458984375, -1.662841796875, -1.27978515625, -0.896728515625, -0.513671875, -0.130615234375, 0.25244140625, 0.635498046875, 1.0185546875, 1.401611328125, 1.78466796875, 2.167724609375, 2.55078125, 2.933837890625, 3.31689453125, 3.699951171875, 4.0830078125, 4.466064453125, 4.84912109375, 5.232177734375, 5.615234375, 5.998291015625, 6.38134765625, 6.764404296875, 7.1474609375, 7.530517578125, 7.91357421875, 8.296630859375, 8.6796875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 7.0, 12.0, 16.0, 66.0, 300.0, 413.0, 138.0, 30.0, 14.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-406.7867736816406, -398.69659423828125, -390.60638427734375, -382.5162048339844, -374.426025390625, -366.3358154296875, -358.2456359863281, -350.1554260253906, -342.06524658203125, -333.9750671386719, -325.8848571777344, -317.794677734375, -309.7044677734375, -301.6142883300781, -293.52410888671875, -285.43389892578125, -277.3437194824219, -269.2535400390625, -261.163330078125, -253.07315063476562, -244.9829559326172, -236.89276123046875, -228.80258178710938, -220.71238708496094, -212.6221923828125, -204.53199768066406, -196.44180297851562, -188.35162353515625, -180.2614288330078, -172.17123413085938, -164.0810546875, -155.99085998535156, -147.9006805419922, -139.81048583984375, -131.72030639648438, -123.63011169433594, -115.5399169921875, -107.44972229003906, -99.35953521728516, -91.26934814453125, -83.17915344238281, -75.08895874023438, -66.99877166748047, -58.9085807800293, -50.818389892578125, -42.72819900512695, -34.63800811767578, -26.54781723022461, -18.457626342773438, -10.367435455322266, -2.2772445678710938, 5.812946319580078, 13.90313720703125, 21.993328094482422, 30.083518981933594, 38.173709869384766, 46.26390075683594, 54.35409164428711, 62.44428253173828, 70.53446960449219, 78.62466430664062, 86.71485900878906, 94.80504608154297, 102.89523315429688, 110.98542785644531]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 2.0, 2.0, 5.0, 14.0, 10.0, 12.0, 11.0, 13.0, 21.0, 20.0, 20.0, 33.0, 32.0, 44.0, 37.0, 46.0, 41.0, 49.0, 51.0, 47.0, 49.0, 45.0, 45.0, 41.0, 45.0, 44.0, 35.0, 32.0, 31.0, 26.0, 20.0, 17.0, 15.0, 8.0, 8.0, 8.0, 2.0, 7.0, 2.0, 4.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.77496337890625, -45.157508850097656, -43.54005432128906, -41.92259979248047, -40.305145263671875, -38.68769073486328, -37.07023620605469, -35.452781677246094, -33.8353271484375, -32.217872619628906, -30.600418090820312, -28.98296356201172, -27.365509033203125, -25.74805450439453, -24.13060188293457, -22.513147354125977, -20.895694732666016, -19.278240203857422, -17.660785675048828, -16.043331146240234, -14.425877571105957, -12.808423042297363, -11.190969467163086, -9.573514938354492, -7.956060409545898, -6.338605880737305, -4.721151828765869, -3.1036977767944336, -1.4862432479858398, 0.1312112808227539, 1.7486648559570312, 3.366119384765625, 4.983573913574219, 6.6010284423828125, 8.218482971191406, 9.835936546325684, 11.453391075134277, 13.070845603942871, 14.688299179077148, 16.305753707885742, 17.923208236694336, 19.54066276550293, 21.158117294311523, 22.775569915771484, 24.393024444580078, 26.010478973388672, 27.627933502197266, 29.24538803100586, 30.862842559814453, 32.48029708862305, 34.09775161743164, 35.715206146240234, 37.33266067504883, 38.95011520385742, 40.56756591796875, 42.185020446777344, 43.80247497558594, 45.41992950439453, 47.037384033203125, 48.65483856201172, 50.27229309082031, 51.889747619628906, 53.5072021484375, 55.124656677246094, 56.74211120605469]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 7.0, 5.0, 14.0, 10.0, 25.0, 26.0, 48.0, 63.0, 89.0, 185.0, 266.0, 421.0, 682.0, 1211.0, 2424.0, 5150.0, 11225.0, 26893.0, 68002.0, 171647.0, 351085.0, 242338.0, 98458.0, 38667.0, 15846.0, 6834.0, 3097.0, 1587.0, 851.0, 514.0, 312.0, 230.0, 128.0, 68.0, 54.0, 36.0, 29.0, 10.0, 4.0, 5.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.9140625, -8.6138916015625, -8.313720703125, -8.0135498046875, -7.71337890625, -7.4132080078125, -7.113037109375, -6.8128662109375, -6.5126953125, -6.2125244140625, -5.912353515625, -5.6121826171875, -5.31201171875, -5.0118408203125, -4.711669921875, -4.4114990234375, -4.111328125, -3.8111572265625, -3.510986328125, -3.2108154296875, -2.91064453125, -2.6104736328125, -2.310302734375, -2.0101318359375, -1.7099609375, -1.4097900390625, -1.109619140625, -0.8094482421875, -0.50927734375, -0.2091064453125, 0.091064453125, 0.3912353515625, 0.69140625, 0.9915771484375, 1.291748046875, 1.5919189453125, 1.89208984375, 2.1922607421875, 2.492431640625, 2.7926025390625, 3.0927734375, 3.3929443359375, 3.693115234375, 3.9932861328125, 4.29345703125, 4.5936279296875, 4.893798828125, 5.1939697265625, 5.494140625, 5.7943115234375, 6.094482421875, 6.3946533203125, 6.69482421875, 6.9949951171875, 7.295166015625, 7.5953369140625, 7.8955078125, 8.1956787109375, 8.495849609375, 8.7960205078125, 9.09619140625, 9.3963623046875, 9.696533203125, 9.9967041015625, 10.296875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 2.0, 6.0, 5.0, 4.0, 5.0, 5.0, 8.0, 11.0, 12.0, 12.0, 22.0, 14.0, 29.0, 30.0, 34.0, 30.0, 40.0, 40.0, 41.0, 33.0, 41.0, 47.0, 43.0, 57.0, 46.0, 41.0, 47.0, 24.0, 32.0, 37.0, 38.0, 28.0, 26.0, 19.0, 15.0, 14.0, 9.0, 11.0, 12.0, 7.0, 4.0, 8.0, 2.0, 3.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.12890625, -4.005157470703125, -3.88140869140625, -3.757659912109375, -3.6339111328125, -3.510162353515625, -3.38641357421875, -3.262664794921875, -3.138916015625, -3.015167236328125, -2.89141845703125, -2.767669677734375, -2.6439208984375, -2.520172119140625, -2.39642333984375, -2.272674560546875, -2.14892578125, -2.025177001953125, -1.90142822265625, -1.777679443359375, -1.6539306640625, -1.530181884765625, -1.40643310546875, -1.282684326171875, -1.158935546875, -1.035186767578125, -0.91143798828125, -0.787689208984375, -0.6639404296875, -0.540191650390625, -0.41644287109375, -0.292694091796875, -0.1689453125, -0.045196533203125, 0.07855224609375, 0.202301025390625, 0.3260498046875, 0.449798583984375, 0.57354736328125, 0.697296142578125, 0.821044921875, 0.944793701171875, 1.06854248046875, 1.192291259765625, 1.3160400390625, 1.439788818359375, 1.56353759765625, 1.687286376953125, 1.81103515625, 1.934783935546875, 2.05853271484375, 2.182281494140625, 2.3060302734375, 2.429779052734375, 2.55352783203125, 2.677276611328125, 2.801025390625, 2.924774169921875, 3.04852294921875, 3.172271728515625, 3.2960205078125, 3.419769287109375, 3.54351806640625, 3.667266845703125, 3.791015625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 8.0, 3.0, 8.0, 12.0, 22.0, 29.0, 48.0, 63.0, 121.0, 200.0, 378.0, 741.0, 1612.0, 4729.0, 26825.0, 419419.0, 556449.0, 29531.0, 5057.0, 1639.0, 750.0, 408.0, 214.0, 106.0, 67.0, 33.0, 31.0, 14.0, 10.0, 14.0, 6.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.703125, -24.900390625, -24.09765625, -23.294921875, -22.4921875, -21.689453125, -20.88671875, -20.083984375, -19.28125, -18.478515625, -17.67578125, -16.873046875, -16.0703125, -15.267578125, -14.46484375, -13.662109375, -12.859375, -12.056640625, -11.25390625, -10.451171875, -9.6484375, -8.845703125, -8.04296875, -7.240234375, -6.4375, -5.634765625, -4.83203125, -4.029296875, -3.2265625, -2.423828125, -1.62109375, -0.818359375, -0.015625, 0.787109375, 1.58984375, 2.392578125, 3.1953125, 3.998046875, 4.80078125, 5.603515625, 6.40625, 7.208984375, 8.01171875, 8.814453125, 9.6171875, 10.419921875, 11.22265625, 12.025390625, 12.828125, 13.630859375, 14.43359375, 15.236328125, 16.0390625, 16.841796875, 17.64453125, 18.447265625, 19.25, 20.052734375, 20.85546875, 21.658203125, 22.4609375, 23.263671875, 24.06640625, 24.869140625, 25.671875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 5.0, 4.0, 4.0, 9.0, 14.0, 8.0, 15.0, 23.0, 28.0, 28.0, 31.0, 27.0, 41.0, 48.0, 45.0, 41.0, 44.0, 53.0, 41.0, 53.0, 45.0, 53.0, 60.0, 35.0, 34.0, 28.0, 23.0, 36.0, 27.0, 19.0, 12.0, 20.0, 12.0, 13.0, 10.0, 6.0, 3.0, 3.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.609375, -18.995361328125, -18.38134765625, -17.767333984375, -17.1533203125, -16.539306640625, -15.92529296875, -15.311279296875, -14.697265625, -14.083251953125, -13.46923828125, -12.855224609375, -12.2412109375, -11.627197265625, -11.01318359375, -10.399169921875, -9.78515625, -9.171142578125, -8.55712890625, -7.943115234375, -7.3291015625, -6.715087890625, -6.10107421875, -5.487060546875, -4.873046875, -4.259033203125, -3.64501953125, -3.031005859375, -2.4169921875, -1.802978515625, -1.18896484375, -0.574951171875, 0.0390625, 0.653076171875, 1.26708984375, 1.881103515625, 2.4951171875, 3.109130859375, 3.72314453125, 4.337158203125, 4.951171875, 5.565185546875, 6.17919921875, 6.793212890625, 7.4072265625, 8.021240234375, 8.63525390625, 9.249267578125, 9.86328125, 10.477294921875, 11.09130859375, 11.705322265625, 12.3193359375, 12.933349609375, 13.54736328125, 14.161376953125, 14.775390625, 15.389404296875, 16.00341796875, 16.617431640625, 17.2314453125, 17.845458984375, 18.45947265625, 19.073486328125, 19.6875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 3.0, 7.0, 2.0, 9.0, 10.0, 8.0, 15.0, 17.0, 30.0, 52.0, 90.0, 106.0, 290.0, 640.0, 1840.0, 7457.0, 129662.0, 887226.0, 16367.0, 2921.0, 947.0, 375.0, 168.0, 103.0, 70.0, 42.0, 25.0, 21.0, 13.0, 9.0, 10.0, 9.0, 2.0, 5.0, 4.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.03125, -18.440185546875, -17.84912109375, -17.258056640625, -16.6669921875, -16.075927734375, -15.48486328125, -14.893798828125, -14.302734375, -13.711669921875, -13.12060546875, -12.529541015625, -11.9384765625, -11.347412109375, -10.75634765625, -10.165283203125, -9.57421875, -8.983154296875, -8.39208984375, -7.801025390625, -7.2099609375, -6.618896484375, -6.02783203125, -5.436767578125, -4.845703125, -4.254638671875, -3.66357421875, -3.072509765625, -2.4814453125, -1.890380859375, -1.29931640625, -0.708251953125, -0.1171875, 0.473876953125, 1.06494140625, 1.656005859375, 2.2470703125, 2.838134765625, 3.42919921875, 4.020263671875, 4.611328125, 5.202392578125, 5.79345703125, 6.384521484375, 6.9755859375, 7.566650390625, 8.15771484375, 8.748779296875, 9.33984375, 9.930908203125, 10.52197265625, 11.113037109375, 11.7041015625, 12.295166015625, 12.88623046875, 13.477294921875, 14.068359375, 14.659423828125, 15.25048828125, 15.841552734375, 16.4326171875, 17.023681640625, 17.61474609375, 18.205810546875, 18.796875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 3.0, 8.0, 14.0, 20.0, 24.0, 54.0, 142.0, 261.0, 260.0, 98.0, 55.0, 20.0, 11.0, 11.0, 7.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004344940185546875, -0.004204094409942627, -0.004063248634338379, -0.003922402858734131, -0.003781557083129883, -0.0036407113075256348, -0.0034998655319213867, -0.0033590197563171387, -0.0032181739807128906, -0.0030773282051086426, -0.0029364824295043945, -0.0027956366539001465, -0.0026547908782958984, -0.0025139451026916504, -0.0023730993270874023, -0.0022322535514831543, -0.0020914077758789062, -0.0019505620002746582, -0.0018097162246704102, -0.0016688704490661621, -0.001528024673461914, -0.001387178897857666, -0.001246333122253418, -0.00110548734664917, -0.0009646415710449219, -0.0008237957954406738, -0.0006829500198364258, -0.0005421042442321777, -0.0004012584686279297, -0.00026041269302368164, -0.0001195669174194336, 2.1278858184814453e-05, 0.0001621246337890625, 0.00030297040939331055, 0.0004438161849975586, 0.0005846619606018066, 0.0007255077362060547, 0.0008663535118103027, 0.0010071992874145508, 0.0011480450630187988, 0.0012888908386230469, 0.001429736614227295, 0.001570582389831543, 0.001711428165435791, 0.001852273941040039, 0.001993119716644287, 0.002133965492248535, 0.002274811267852783, 0.0024156570434570312, 0.0025565028190612793, 0.0026973485946655273, 0.0028381943702697754, 0.0029790401458740234, 0.0031198859214782715, 0.0032607316970825195, 0.0034015774726867676, 0.0035424232482910156, 0.0036832690238952637, 0.0038241147994995117, 0.00396496057510376, 0.004105806350708008, 0.004246652126312256, 0.004387497901916504, 0.004528343677520752, 0.004669189453125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 7.0, 8.0, 6.0, 14.0, 15.0, 22.0, 29.0, 46.0, 63.0, 122.0, 263.0, 605.0, 1598.0, 5463.0, 112707.0, 914857.0, 9119.0, 2192.0, 754.0, 272.0, 157.0, 77.0, 62.0, 27.0, 22.0, 10.0, 6.0, 7.0, 7.0, 6.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-33.8125, -32.90234375, -31.9921875, -31.08203125, -30.171875, -29.26171875, -28.3515625, -27.44140625, -26.53125, -25.62109375, -24.7109375, -23.80078125, -22.890625, -21.98046875, -21.0703125, -20.16015625, -19.25, -18.33984375, -17.4296875, -16.51953125, -15.609375, -14.69921875, -13.7890625, -12.87890625, -11.96875, -11.05859375, -10.1484375, -9.23828125, -8.328125, -7.41796875, -6.5078125, -5.59765625, -4.6875, -3.77734375, -2.8671875, -1.95703125, -1.046875, -0.13671875, 0.7734375, 1.68359375, 2.59375, 3.50390625, 4.4140625, 5.32421875, 6.234375, 7.14453125, 8.0546875, 8.96484375, 9.875, 10.78515625, 11.6953125, 12.60546875, 13.515625, 14.42578125, 15.3359375, 16.24609375, 17.15625, 18.06640625, 18.9765625, 19.88671875, 20.796875, 21.70703125, 22.6171875, 23.52734375, 24.4375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 6.0, 4.0, 6.0, 6.0, 7.0, 5.0, 14.0, 34.0, 73.0, 154.0, 272.0, 223.0, 106.0, 47.0, 19.0, 10.0, 7.0, 3.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.25, -23.625732421875, -23.00146484375, -22.377197265625, -21.7529296875, -21.128662109375, -20.50439453125, -19.880126953125, -19.255859375, -18.631591796875, -18.00732421875, -17.383056640625, -16.7587890625, -16.134521484375, -15.51025390625, -14.885986328125, -14.26171875, -13.637451171875, -13.01318359375, -12.388916015625, -11.7646484375, -11.140380859375, -10.51611328125, -9.891845703125, -9.267578125, -8.643310546875, -8.01904296875, -7.394775390625, -6.7705078125, -6.146240234375, -5.52197265625, -4.897705078125, -4.2734375, -3.649169921875, -3.02490234375, -2.400634765625, -1.7763671875, -1.152099609375, -0.52783203125, 0.096435546875, 0.720703125, 1.344970703125, 1.96923828125, 2.593505859375, 3.2177734375, 3.842041015625, 4.46630859375, 5.090576171875, 5.71484375, 6.339111328125, 6.96337890625, 7.587646484375, 8.2119140625, 8.836181640625, 9.46044921875, 10.084716796875, 10.708984375, 11.333251953125, 11.95751953125, 12.581787109375, 13.2060546875, 13.830322265625, 14.45458984375, 15.078857421875, 15.703125]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 8.0, 17.0, 45.0, 155.0, 408.0, 234.0, 79.0, 24.0, 14.0, 7.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-273.2576599121094, -264.6259460449219, -255.9942169189453, -247.36248779296875, -238.73077392578125, -230.0990447998047, -221.46731567382812, -212.83560180664062, -204.20387268066406, -195.5721435546875, -186.9404296875, -178.30870056152344, -169.67697143554688, -161.04525756835938, -152.4135284423828, -143.78179931640625, -135.15008544921875, -126.51836395263672, -117.88664245605469, -109.25491333007812, -100.6231918334961, -91.99147033691406, -83.3597412109375, -74.72801971435547, -66.09629821777344, -57.464576721191406, -48.83285140991211, -40.20112609863281, -31.56940460205078, -22.93768310546875, -14.305957794189453, -5.674232482910156, 2.957489013671875, 11.589212417602539, 20.220935821533203, 28.852659225463867, 37.48438262939453, 46.11610412597656, 54.74782943725586, 63.379554748535156, 72.01127624511719, 80.64299774169922, 89.27471923828125, 97.90644836425781, 106.53816986083984, 115.16989135742188, 123.80162048339844, 132.433349609375, 141.0650634765625, 149.69679260253906, 158.32850646972656, 166.96023559570312, 175.59194946289062, 184.2236785888672, 192.85540771484375, 201.48712158203125, 210.1188507080078, 218.75057983398438, 227.38229370117188, 236.01402282714844, 244.645751953125, 253.2774658203125, 261.9091796875, 270.5409240722656, 279.1726379394531]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 3.0, 6.0, 6.0, 6.0, 7.0, 9.0, 14.0, 14.0, 17.0, 22.0, 26.0, 27.0, 44.0, 40.0, 44.0, 49.0, 51.0, 74.0, 85.0, 72.0, 46.0, 66.0, 36.0, 38.0, 29.0, 26.0, 24.0, 27.0, 23.0, 15.0, 9.0, 8.0, 12.0, 8.0, 5.0, 8.0, 4.0, 0.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-78.81991577148438, -76.06816864013672, -73.31642150878906, -70.5646743774414, -67.81292724609375, -65.0611801147461, -62.30943298339844, -59.55768585205078, -56.805938720703125, -54.05419158935547, -51.30244445800781, -48.550697326660156, -45.7989501953125, -43.047203063964844, -40.29545593261719, -37.54370880126953, -34.79196548461914, -32.040218353271484, -29.288471221923828, -26.536724090576172, -23.784976959228516, -21.03322982788086, -18.281484603881836, -15.52973747253418, -12.777990341186523, -10.026243209838867, -7.274496555328369, -4.522749900817871, -1.7710027694702148, 0.9807443618774414, 3.7324905395507812, 6.4842376708984375, 9.235984802246094, 11.98773193359375, 14.739479064941406, 17.491226196289062, 20.24297332763672, 22.994720458984375, 25.7464656829834, 28.498212814331055, 31.24995994567871, 34.001705169677734, 36.75345230102539, 39.50519943237305, 42.2569465637207, 45.00869369506836, 47.760440826416016, 50.51218795776367, 53.26393508911133, 56.015682220458984, 58.76742935180664, 61.5191764831543, 64.27091979980469, 67.02266693115234, 69.7744140625, 72.52616119384766, 75.27790832519531, 78.02965545654297, 80.78140258789062, 83.53314971923828, 86.28489685058594, 89.0366439819336, 91.78839111328125, 94.5401382446289, 97.29188537597656]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 7.0, 8.0, 15.0, 28.0, 50.0, 127.0, 259.0, 958.0, 4574.0, 116206.0, 4040094.0, 28837.0, 2161.0, 571.0, 212.0, 76.0, 35.0, 19.0, 14.0, 10.0, 4.0, 6.0, 1.0, 7.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.078125, -19.218017578125, -18.35791015625, -17.497802734375, -16.6376953125, -15.777587890625, -14.91748046875, -14.057373046875, -13.197265625, -12.337158203125, -11.47705078125, -10.616943359375, -9.7568359375, -8.896728515625, -8.03662109375, -7.176513671875, -6.31640625, -5.456298828125, -4.59619140625, -3.736083984375, -2.8759765625, -2.015869140625, -1.15576171875, -0.295654296875, 0.564453125, 1.424560546875, 2.28466796875, 3.144775390625, 4.0048828125, 4.864990234375, 5.72509765625, 6.585205078125, 7.4453125, 8.305419921875, 9.16552734375, 10.025634765625, 10.8857421875, 11.745849609375, 12.60595703125, 13.466064453125, 14.326171875, 15.186279296875, 16.04638671875, 16.906494140625, 17.7666015625, 18.626708984375, 19.48681640625, 20.346923828125, 21.20703125, 22.067138671875, 22.92724609375, 23.787353515625, 24.6474609375, 25.507568359375, 26.36767578125, 27.227783203125, 28.087890625, 28.947998046875, 29.80810546875, 30.668212890625, 31.5283203125, 32.388427734375, 33.24853515625, 34.108642578125, 34.96875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 6.0, 3.0, 6.0, 9.0, 13.0, 14.0, 22.0, 35.0, 53.0, 56.0, 75.0, 69.0, 80.0, 72.0, 90.0, 82.0, 71.0, 63.0, 56.0, 43.0, 26.0, 28.0, 15.0, 7.0, 10.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.93359375, -6.68377685546875, -6.4339599609375, -6.18414306640625, -5.934326171875, -5.68450927734375, -5.4346923828125, -5.18487548828125, -4.93505859375, -4.68524169921875, -4.4354248046875, -4.18560791015625, -3.935791015625, -3.68597412109375, -3.4361572265625, -3.18634033203125, -2.9365234375, -2.68670654296875, -2.4368896484375, -2.18707275390625, -1.937255859375, -1.68743896484375, -1.4376220703125, -1.18780517578125, -0.93798828125, -0.68817138671875, -0.4383544921875, -0.18853759765625, 0.061279296875, 0.31109619140625, 0.5609130859375, 0.81072998046875, 1.060546875, 1.31036376953125, 1.5601806640625, 1.80999755859375, 2.059814453125, 2.30963134765625, 2.5594482421875, 2.80926513671875, 3.05908203125, 3.30889892578125, 3.5587158203125, 3.80853271484375, 4.058349609375, 4.30816650390625, 4.5579833984375, 4.80780029296875, 5.0576171875, 5.30743408203125, 5.5572509765625, 5.80706787109375, 6.056884765625, 6.30670166015625, 6.5565185546875, 6.80633544921875, 7.05615234375, 7.30596923828125, 7.5557861328125, 7.80560302734375, 8.055419921875, 8.30523681640625, 8.5550537109375, 8.80487060546875, 9.0546875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 4.0, 9.0, 12.0, 21.0, 46.0, 86.0, 140.0, 286.0, 579.0, 1393.0, 5033.0, 29124.0, 751532.0, 3343946.0, 51407.0, 7324.0, 1909.0, 715.0, 306.0, 165.0, 93.0, 66.0, 36.0, 24.0, 8.0, 4.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-23.296875, -22.701416015625, -22.10595703125, -21.510498046875, -20.9150390625, -20.319580078125, -19.72412109375, -19.128662109375, -18.533203125, -17.937744140625, -17.34228515625, -16.746826171875, -16.1513671875, -15.555908203125, -14.96044921875, -14.364990234375, -13.76953125, -13.174072265625, -12.57861328125, -11.983154296875, -11.3876953125, -10.792236328125, -10.19677734375, -9.601318359375, -9.005859375, -8.410400390625, -7.81494140625, -7.219482421875, -6.6240234375, -6.028564453125, -5.43310546875, -4.837646484375, -4.2421875, -3.646728515625, -3.05126953125, -2.455810546875, -1.8603515625, -1.264892578125, -0.66943359375, -0.073974609375, 0.521484375, 1.116943359375, 1.71240234375, 2.307861328125, 2.9033203125, 3.498779296875, 4.09423828125, 4.689697265625, 5.28515625, 5.880615234375, 6.47607421875, 7.071533203125, 7.6669921875, 8.262451171875, 8.85791015625, 9.453369140625, 10.048828125, 10.644287109375, 11.23974609375, 11.835205078125, 12.4306640625, 13.026123046875, 13.62158203125, 14.217041015625, 14.8125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 5.0, 6.0, 11.0, 8.0, 24.0, 21.0, 38.0, 65.0, 76.0, 151.0, 304.0, 801.0, 1280.0, 664.0, 263.0, 131.0, 66.0, 45.0, 30.0, 26.0, 21.0, 16.0, 7.0, 3.0, 1.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.0234375, -14.55908203125, -14.0947265625, -13.63037109375, -13.166015625, -12.70166015625, -12.2373046875, -11.77294921875, -11.30859375, -10.84423828125, -10.3798828125, -9.91552734375, -9.451171875, -8.98681640625, -8.5224609375, -8.05810546875, -7.59375, -7.12939453125, -6.6650390625, -6.20068359375, -5.736328125, -5.27197265625, -4.8076171875, -4.34326171875, -3.87890625, -3.41455078125, -2.9501953125, -2.48583984375, -2.021484375, -1.55712890625, -1.0927734375, -0.62841796875, -0.1640625, 0.30029296875, 0.7646484375, 1.22900390625, 1.693359375, 2.15771484375, 2.6220703125, 3.08642578125, 3.55078125, 4.01513671875, 4.4794921875, 4.94384765625, 5.408203125, 5.87255859375, 6.3369140625, 6.80126953125, 7.265625, 7.72998046875, 8.1943359375, 8.65869140625, 9.123046875, 9.58740234375, 10.0517578125, 10.51611328125, 10.98046875, 11.44482421875, 11.9091796875, 12.37353515625, 12.837890625, 13.30224609375, 13.7666015625, 14.23095703125, 14.6953125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 8.0, 8.0, 13.0, 34.0, 69.0, 137.0, 246.0, 238.0, 134.0, 59.0, 29.0, 11.0, 10.0, 7.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-122.30014038085938, -117.5668716430664, -112.8335952758789, -108.10032653808594, -103.36705017089844, -98.63378143310547, -93.9005126953125, -89.167236328125, -84.43396759033203, -79.70069885253906, -74.96742248535156, -70.2341537475586, -65.50088500976562, -60.767608642578125, -56.034339904785156, -51.30106735229492, -46.56779479980469, -41.83452224731445, -37.10124969482422, -32.36798095703125, -27.634708404541016, -22.90143585205078, -18.16816520690918, -13.434894561767578, -8.701622009277344, -3.968350410461426, 0.7649211883544922, 5.49819278717041, 10.231464385986328, 14.964736938476562, 19.698007583618164, 24.431278228759766, 29.16455078125, 33.897823333740234, 38.63109588623047, 43.36436462402344, 48.09763717651367, 52.830909729003906, 57.564178466796875, 62.29745101928711, 67.03072357177734, 71.76399230957031, 76.49726867675781, 81.23053741455078, 85.96380615234375, 90.69708251953125, 95.43035125732422, 100.16361999511719, 104.89689636230469, 109.63016510009766, 114.36344146728516, 119.09671020507812, 123.82998657226562, 128.56326293945312, 133.29652404785156, 138.02980041503906, 142.7630615234375, 147.496337890625, 152.22959899902344, 156.96287536621094, 161.69615173339844, 166.42941284179688, 171.16268920898438, 175.89596557617188, 180.62924194335938]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 6.0, 7.0, 12.0, 7.0, 18.0, 14.0, 28.0, 24.0, 23.0, 21.0, 37.0, 37.0, 36.0, 41.0, 48.0, 49.0, 42.0, 57.0, 48.0, 53.0, 54.0, 35.0, 46.0, 37.0, 38.0, 29.0, 42.0, 24.0, 17.0, 10.0, 10.0, 13.0, 9.0, 5.0, 9.0, 8.0, 2.0, 5.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.42506408691406, -58.70603942871094, -56.98701095581055, -55.267982482910156, -53.54895782470703, -51.829933166503906, -50.110904693603516, -48.391876220703125, -46.6728515625, -44.953826904296875, -43.234798431396484, -41.515769958496094, -39.79674530029297, -38.077720642089844, -36.35869216918945, -34.63966369628906, -32.92063903808594, -31.20161247253418, -29.482585906982422, -27.763559341430664, -26.044532775878906, -24.32550621032715, -22.60647964477539, -20.887453079223633, -19.168426513671875, -17.449399948120117, -15.73037338256836, -14.011346817016602, -12.292320251464844, -10.573293685913086, -8.854267120361328, -7.13524055480957, -5.416217803955078, -3.6971912384033203, -1.9781646728515625, -0.2591381072998047, 1.4598884582519531, 3.178915023803711, 4.897941589355469, 6.616968154907227, 8.335994720458984, 10.055021286010742, 11.7740478515625, 13.493074417114258, 15.212100982666016, 16.931127548217773, 18.65015411376953, 20.36918067932129, 22.088207244873047, 23.807233810424805, 25.526260375976562, 27.24528694152832, 28.964313507080078, 30.683340072631836, 32.402366638183594, 34.12139129638672, 35.84041976928711, 37.5594482421875, 39.278472900390625, 40.99749755859375, 42.71652603149414, 44.43555450439453, 46.154579162597656, 47.87360382080078, 49.59263229370117]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 6.0, 5.0, 4.0, 8.0, 11.0, 11.0, 19.0, 31.0, 42.0, 67.0, 133.0, 189.0, 356.0, 871.0, 2378.0, 8041.0, 35562.0, 198531.0, 594056.0, 167263.0, 30052.0, 7161.0, 2138.0, 775.0, 354.0, 168.0, 107.0, 70.0, 39.0, 29.0, 26.0, 16.0, 12.0, 3.0, 8.0, 7.0, 4.0, 2.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.5, -15.89892578125, -15.2978515625, -14.69677734375, -14.095703125, -13.49462890625, -12.8935546875, -12.29248046875, -11.69140625, -11.09033203125, -10.4892578125, -9.88818359375, -9.287109375, -8.68603515625, -8.0849609375, -7.48388671875, -6.8828125, -6.28173828125, -5.6806640625, -5.07958984375, -4.478515625, -3.87744140625, -3.2763671875, -2.67529296875, -2.07421875, -1.47314453125, -0.8720703125, -0.27099609375, 0.330078125, 0.93115234375, 1.5322265625, 2.13330078125, 2.734375, 3.33544921875, 3.9365234375, 4.53759765625, 5.138671875, 5.73974609375, 6.3408203125, 6.94189453125, 7.54296875, 8.14404296875, 8.7451171875, 9.34619140625, 9.947265625, 10.54833984375, 11.1494140625, 11.75048828125, 12.3515625, 12.95263671875, 13.5537109375, 14.15478515625, 14.755859375, 15.35693359375, 15.9580078125, 16.55908203125, 17.16015625, 17.76123046875, 18.3623046875, 18.96337890625, 19.564453125, 20.16552734375, 20.7666015625, 21.36767578125, 21.96875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 2.0, 5.0, 8.0, 7.0, 16.0, 28.0, 37.0, 40.0, 48.0, 56.0, 55.0, 85.0, 91.0, 72.0, 79.0, 78.0, 63.0, 61.0, 46.0, 43.0, 26.0, 24.0, 14.0, 8.0, 9.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.0546875, -6.805419921875, -6.55615234375, -6.306884765625, -6.0576171875, -5.808349609375, -5.55908203125, -5.309814453125, -5.060546875, -4.811279296875, -4.56201171875, -4.312744140625, -4.0634765625, -3.814208984375, -3.56494140625, -3.315673828125, -3.06640625, -2.817138671875, -2.56787109375, -2.318603515625, -2.0693359375, -1.820068359375, -1.57080078125, -1.321533203125, -1.072265625, -0.822998046875, -0.57373046875, -0.324462890625, -0.0751953125, 0.174072265625, 0.42333984375, 0.672607421875, 0.921875, 1.171142578125, 1.42041015625, 1.669677734375, 1.9189453125, 2.168212890625, 2.41748046875, 2.666748046875, 2.916015625, 3.165283203125, 3.41455078125, 3.663818359375, 3.9130859375, 4.162353515625, 4.41162109375, 4.660888671875, 4.91015625, 5.159423828125, 5.40869140625, 5.657958984375, 5.9072265625, 6.156494140625, 6.40576171875, 6.655029296875, 6.904296875, 7.153564453125, 7.40283203125, 7.652099609375, 7.9013671875, 8.150634765625, 8.39990234375, 8.649169921875, 8.8984375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 7.0, 5.0, 7.0, 16.0, 30.0, 44.0, 58.0, 114.0, 221.0, 431.0, 1093.0, 3951.0, 27961.0, 799796.0, 199969.0, 11131.0, 2262.0, 751.0, 331.0, 159.0, 74.0, 47.0, 35.0, 15.0, 13.0, 11.0, 7.0, 3.0, 10.0, 6.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.75, -35.47412109375, -34.1982421875, -32.92236328125, -31.646484375, -30.37060546875, -29.0947265625, -27.81884765625, -26.54296875, -25.26708984375, -23.9912109375, -22.71533203125, -21.439453125, -20.16357421875, -18.8876953125, -17.61181640625, -16.3359375, -15.06005859375, -13.7841796875, -12.50830078125, -11.232421875, -9.95654296875, -8.6806640625, -7.40478515625, -6.12890625, -4.85302734375, -3.5771484375, -2.30126953125, -1.025390625, 0.25048828125, 1.5263671875, 2.80224609375, 4.078125, 5.35400390625, 6.6298828125, 7.90576171875, 9.181640625, 10.45751953125, 11.7333984375, 13.00927734375, 14.28515625, 15.56103515625, 16.8369140625, 18.11279296875, 19.388671875, 20.66455078125, 21.9404296875, 23.21630859375, 24.4921875, 25.76806640625, 27.0439453125, 28.31982421875, 29.595703125, 30.87158203125, 32.1474609375, 33.42333984375, 34.69921875, 35.97509765625, 37.2509765625, 38.52685546875, 39.802734375, 41.07861328125, 42.3544921875, 43.63037109375, 44.90625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 3.0, 3.0, 5.0, 3.0, 7.0, 9.0, 6.0, 10.0, 12.0, 19.0, 21.0, 39.0, 30.0, 42.0, 49.0, 55.0, 66.0, 62.0, 61.0, 57.0, 64.0, 61.0, 53.0, 58.0, 35.0, 31.0, 29.0, 24.0, 22.0, 20.0, 16.0, 13.0, 2.0, 2.0, 9.0, 1.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-23.21875, -22.426513671875, -21.63427734375, -20.842041015625, -20.0498046875, -19.257568359375, -18.46533203125, -17.673095703125, -16.880859375, -16.088623046875, -15.29638671875, -14.504150390625, -13.7119140625, -12.919677734375, -12.12744140625, -11.335205078125, -10.54296875, -9.750732421875, -8.95849609375, -8.166259765625, -7.3740234375, -6.581787109375, -5.78955078125, -4.997314453125, -4.205078125, -3.412841796875, -2.62060546875, -1.828369140625, -1.0361328125, -0.243896484375, 0.54833984375, 1.340576171875, 2.1328125, 2.925048828125, 3.71728515625, 4.509521484375, 5.3017578125, 6.093994140625, 6.88623046875, 7.678466796875, 8.470703125, 9.262939453125, 10.05517578125, 10.847412109375, 11.6396484375, 12.431884765625, 13.22412109375, 14.016357421875, 14.80859375, 15.600830078125, 16.39306640625, 17.185302734375, 17.9775390625, 18.769775390625, 19.56201171875, 20.354248046875, 21.146484375, 21.938720703125, 22.73095703125, 23.523193359375, 24.3154296875, 25.107666015625, 25.89990234375, 26.692138671875, 27.484375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 6.0, 8.0, 12.0, 20.0, 27.0, 50.0, 70.0, 146.0, 297.0, 651.0, 1542.0, 4709.0, 23782.0, 810142.0, 189769.0, 12117.0, 3122.0, 1078.0, 483.0, 214.0, 120.0, 65.0, 46.0, 24.0, 19.0, 9.0, 16.0, 5.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.296875, -18.7867431640625, -18.276611328125, -17.7664794921875, -17.25634765625, -16.7462158203125, -16.236083984375, -15.7259521484375, -15.2158203125, -14.7056884765625, -14.195556640625, -13.6854248046875, -13.17529296875, -12.6651611328125, -12.155029296875, -11.6448974609375, -11.134765625, -10.6246337890625, -10.114501953125, -9.6043701171875, -9.09423828125, -8.5841064453125, -8.073974609375, -7.5638427734375, -7.0537109375, -6.5435791015625, -6.033447265625, -5.5233154296875, -5.01318359375, -4.5030517578125, -3.992919921875, -3.4827880859375, -2.97265625, -2.4625244140625, -1.952392578125, -1.4422607421875, -0.93212890625, -0.4219970703125, 0.088134765625, 0.5982666015625, 1.1083984375, 1.6185302734375, 2.128662109375, 2.6387939453125, 3.14892578125, 3.6590576171875, 4.169189453125, 4.6793212890625, 5.189453125, 5.6995849609375, 6.209716796875, 6.7198486328125, 7.22998046875, 7.7401123046875, 8.250244140625, 8.7603759765625, 9.2705078125, 9.7806396484375, 10.290771484375, 10.8009033203125, 11.31103515625, 11.8211669921875, 12.331298828125, 12.8414306640625, 13.3515625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 7.0, 9.0, 11.0, 16.0, 18.0, 24.0, 52.0, 99.0, 140.0, 227.0, 159.0, 90.0, 47.0, 26.0, 19.0, 18.0, 12.0, 9.0, 5.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004344940185546875, -0.004237711429595947, -0.0041304826736450195, -0.004023253917694092, -0.003916025161743164, -0.0038087964057922363, -0.0037015676498413086, -0.003594338893890381, -0.003487110137939453, -0.0033798813819885254, -0.0032726526260375977, -0.00316542387008667, -0.003058195114135742, -0.0029509663581848145, -0.0028437376022338867, -0.002736508846282959, -0.0026292800903320312, -0.0025220513343811035, -0.0024148225784301758, -0.002307593822479248, -0.0022003650665283203, -0.0020931363105773926, -0.001985907554626465, -0.0018786787986755371, -0.0017714500427246094, -0.0016642212867736816, -0.001556992530822754, -0.0014497637748718262, -0.0013425350189208984, -0.0012353062629699707, -0.001128077507019043, -0.0010208487510681152, -0.0009136199951171875, -0.0008063912391662598, -0.000699162483215332, -0.0005919337272644043, -0.00048470497131347656, -0.00037747621536254883, -0.0002702474594116211, -0.00016301870346069336, -5.5789947509765625e-05, 5.143880844116211e-05, 0.00015866756439208984, 0.0002658963203430176, 0.0003731250762939453, 0.00048035383224487305, 0.0005875825881958008, 0.0006948113441467285, 0.0008020401000976562, 0.000909268856048584, 0.0010164976119995117, 0.0011237263679504395, 0.0012309551239013672, 0.001338183879852295, 0.0014454126358032227, 0.0015526413917541504, 0.0016598701477050781, 0.0017670989036560059, 0.0018743276596069336, 0.0019815564155578613, 0.002088785171508789, 0.002196013927459717, 0.0023032426834106445, 0.0024104714393615723, 0.0025177001953125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 8.0, 2.0, 6.0, 11.0, 9.0, 20.0, 21.0, 23.0, 33.0, 53.0, 69.0, 90.0, 145.0, 242.0, 371.0, 621.0, 1046.0, 1942.0, 4141.0, 10338.0, 40063.0, 530523.0, 401626.0, 38414.0, 10343.0, 3929.0, 1823.0, 1047.0, 581.0, 368.0, 196.0, 134.0, 102.0, 51.0, 46.0, 37.0, 16.0, 19.0, 9.0, 14.0, 10.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-10.046875, -9.7423095703125, -9.437744140625, -9.1331787109375, -8.82861328125, -8.5240478515625, -8.219482421875, -7.9149169921875, -7.6103515625, -7.3057861328125, -7.001220703125, -6.6966552734375, -6.39208984375, -6.0875244140625, -5.782958984375, -5.4783935546875, -5.173828125, -4.8692626953125, -4.564697265625, -4.2601318359375, -3.95556640625, -3.6510009765625, -3.346435546875, -3.0418701171875, -2.7373046875, -2.4327392578125, -2.128173828125, -1.8236083984375, -1.51904296875, -1.2144775390625, -0.909912109375, -0.6053466796875, -0.30078125, 0.0037841796875, 0.308349609375, 0.6129150390625, 0.91748046875, 1.2220458984375, 1.526611328125, 1.8311767578125, 2.1357421875, 2.4403076171875, 2.744873046875, 3.0494384765625, 3.35400390625, 3.6585693359375, 3.963134765625, 4.2677001953125, 4.572265625, 4.8768310546875, 5.181396484375, 5.4859619140625, 5.79052734375, 6.0950927734375, 6.399658203125, 6.7042236328125, 7.0087890625, 7.3133544921875, 7.617919921875, 7.9224853515625, 8.22705078125, 8.5316162109375, 8.836181640625, 9.1407470703125, 9.4453125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 9.0, 6.0, 1.0, 8.0, 9.0, 3.0, 14.0, 18.0, 17.0, 14.0, 22.0, 31.0, 50.0, 74.0, 115.0, 113.0, 111.0, 112.0, 80.0, 57.0, 33.0, 15.0, 19.0, 20.0, 10.0, 10.0, 9.0, 8.0, 7.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-11.6796875, -11.38818359375, -11.0966796875, -10.80517578125, -10.513671875, -10.22216796875, -9.9306640625, -9.63916015625, -9.34765625, -9.05615234375, -8.7646484375, -8.47314453125, -8.181640625, -7.89013671875, -7.5986328125, -7.30712890625, -7.015625, -6.72412109375, -6.4326171875, -6.14111328125, -5.849609375, -5.55810546875, -5.2666015625, -4.97509765625, -4.68359375, -4.39208984375, -4.1005859375, -3.80908203125, -3.517578125, -3.22607421875, -2.9345703125, -2.64306640625, -2.3515625, -2.06005859375, -1.7685546875, -1.47705078125, -1.185546875, -0.89404296875, -0.6025390625, -0.31103515625, -0.01953125, 0.27197265625, 0.5634765625, 0.85498046875, 1.146484375, 1.43798828125, 1.7294921875, 2.02099609375, 2.3125, 2.60400390625, 2.8955078125, 3.18701171875, 3.478515625, 3.77001953125, 4.0615234375, 4.35302734375, 4.64453125, 4.93603515625, 5.2275390625, 5.51904296875, 5.810546875, 6.10205078125, 6.3935546875, 6.68505859375, 6.9765625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 13.0, 20.0, 76.0, 318.0, 449.0, 91.0, 26.0, 4.0, 6.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-564.4317626953125, -551.3387451171875, -538.2456665039062, -525.1526489257812, -512.0595703125, -498.966552734375, -485.8735046386719, -472.78045654296875, -459.68743896484375, -446.5943908691406, -433.5013427734375, -420.4083251953125, -407.3152770996094, -394.22222900390625, -381.1291809082031, -368.0361328125, -354.9430847167969, -341.85003662109375, -328.7569885253906, -315.6639404296875, -302.5709228515625, -289.4778747558594, -276.38482666015625, -263.2917785644531, -250.19874572753906, -237.10569763183594, -224.01266479492188, -210.91961669921875, -197.82656860351562, -184.73353576660156, -171.64048767089844, -158.54745483398438, -145.45440673828125, -132.36135864257812, -119.26832580566406, -106.17527770996094, -93.08223724365234, -79.98919677734375, -66.89614868164062, -53.80310821533203, -40.71006774902344, -27.61702537536621, -14.523983001708984, -1.430938720703125, 11.662101745605469, 24.755142211914062, 37.84819030761719, 50.94123077392578, 64.03427124023438, 77.12731170654297, 90.22035217285156, 103.31340026855469, 116.40644073486328, 129.49948120117188, 142.592529296875, 155.68557739257812, 168.7786102294922, 181.8716583251953, 194.96469116210938, 208.0577392578125, 221.15078735351562, 234.2438201904297, 247.3368682861328, 260.4299011230469, 273.52294921875]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 7.0, 1.0, 6.0, 7.0, 5.0, 7.0, 5.0, 11.0, 14.0, 20.0, 20.0, 23.0, 23.0, 23.0, 27.0, 22.0, 28.0, 37.0, 54.0, 65.0, 78.0, 81.0, 68.0, 47.0, 53.0, 45.0, 33.0, 21.0, 29.0, 25.0, 21.0, 19.0, 11.0, 15.0, 15.0, 11.0, 9.0, 9.0, 6.0, 6.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-91.65325927734375, -88.95291900634766, -86.25257873535156, -83.55223846435547, -80.85189819335938, -78.15155792236328, -75.45121765136719, -72.7508773803711, -70.050537109375, -67.3501968383789, -64.64985656738281, -61.94951629638672, -59.249176025390625, -56.54883575439453, -53.84849548339844, -51.148155212402344, -48.44781494140625, -45.747474670410156, -43.04713439941406, -40.34679412841797, -37.646453857421875, -34.94611358642578, -32.24577331542969, -29.545433044433594, -26.8450927734375, -24.144752502441406, -21.444412231445312, -18.74407196044922, -16.043731689453125, -13.343391418457031, -10.643051147460938, -7.942710876464844, -5.242378234863281, -2.5420379638671875, 0.15830230712890625, 2.858642578125, 5.558982849121094, 8.259323120117188, 10.959663391113281, 13.660003662109375, 16.36034393310547, 19.060684204101562, 21.761024475097656, 24.46136474609375, 27.161705017089844, 29.862045288085938, 32.56238555908203, 35.262725830078125, 37.96306610107422, 40.66340637207031, 43.363746643066406, 46.0640869140625, 48.764427185058594, 51.46476745605469, 54.16510772705078, 56.865447998046875, 59.56578826904297, 62.26612854003906, 64.96646881103516, 67.66680908203125, 70.36714935302734, 73.06748962402344, 75.76782989501953, 78.46817016601562, 81.16851043701172]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 6.0, 3.0, 8.0, 9.0, 13.0, 32.0, 35.0, 69.0, 132.0, 378.0, 1319.0, 6963.0, 1256620.0, 2918526.0, 8186.0, 1314.0, 319.0, 159.0, 70.0, 43.0, 21.0, 13.0, 12.0, 7.0, 11.0, 5.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-26.078125, -24.993408203125, -23.90869140625, -22.823974609375, -21.7392578125, -20.654541015625, -19.56982421875, -18.485107421875, -17.400390625, -16.315673828125, -15.23095703125, -14.146240234375, -13.0615234375, -11.976806640625, -10.89208984375, -9.807373046875, -8.72265625, -7.637939453125, -6.55322265625, -5.468505859375, -4.3837890625, -3.299072265625, -2.21435546875, -1.129638671875, -0.044921875, 1.039794921875, 2.12451171875, 3.209228515625, 4.2939453125, 5.378662109375, 6.46337890625, 7.548095703125, 8.6328125, 9.717529296875, 10.80224609375, 11.886962890625, 12.9716796875, 14.056396484375, 15.14111328125, 16.225830078125, 17.310546875, 18.395263671875, 19.47998046875, 20.564697265625, 21.6494140625, 22.734130859375, 23.81884765625, 24.903564453125, 25.98828125, 27.072998046875, 28.15771484375, 29.242431640625, 30.3271484375, 31.411865234375, 32.49658203125, 33.581298828125, 34.666015625, 35.750732421875, 36.83544921875, 37.920166015625, 39.0048828125, 40.089599609375, 41.17431640625, 42.259033203125, 43.34375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 9.0, 4.0, 5.0, 9.0, 15.0, 27.0, 47.0, 41.0, 41.0, 72.0, 82.0, 83.0, 77.0, 77.0, 87.0, 88.0, 63.0, 55.0, 34.0, 38.0, 20.0, 16.0, 9.0, 7.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.25390625, -6.99322509765625, -6.7325439453125, -6.47186279296875, -6.211181640625, -5.95050048828125, -5.6898193359375, -5.42913818359375, -5.16845703125, -4.90777587890625, -4.6470947265625, -4.38641357421875, -4.125732421875, -3.86505126953125, -3.6043701171875, -3.34368896484375, -3.0830078125, -2.82232666015625, -2.5616455078125, -2.30096435546875, -2.040283203125, -1.77960205078125, -1.5189208984375, -1.25823974609375, -0.99755859375, -0.73687744140625, -0.4761962890625, -0.21551513671875, 0.045166015625, 0.30584716796875, 0.5665283203125, 0.82720947265625, 1.087890625, 1.34857177734375, 1.6092529296875, 1.86993408203125, 2.130615234375, 2.39129638671875, 2.6519775390625, 2.91265869140625, 3.17333984375, 3.43402099609375, 3.6947021484375, 3.95538330078125, 4.216064453125, 4.47674560546875, 4.7374267578125, 4.99810791015625, 5.2587890625, 5.51947021484375, 5.7801513671875, 6.04083251953125, 6.301513671875, 6.56219482421875, 6.8228759765625, 7.08355712890625, 7.34423828125, 7.60491943359375, 7.8656005859375, 8.12628173828125, 8.386962890625, 8.64764404296875, 8.9083251953125, 9.16900634765625, 9.4296875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 2.0, 8.0, 5.0, 14.0, 17.0, 21.0, 49.0, 95.0, 169.0, 331.0, 851.0, 3665.0, 53112.0, 4115424.0, 17222.0, 2155.0, 620.0, 260.0, 126.0, 67.0, 28.0, 18.0, 12.0, 12.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.65625, -48.02099609375, -46.3857421875, -44.75048828125, -43.115234375, -41.47998046875, -39.8447265625, -38.20947265625, -36.57421875, -34.93896484375, -33.3037109375, -31.66845703125, -30.033203125, -28.39794921875, -26.7626953125, -25.12744140625, -23.4921875, -21.85693359375, -20.2216796875, -18.58642578125, -16.951171875, -15.31591796875, -13.6806640625, -12.04541015625, -10.41015625, -8.77490234375, -7.1396484375, -5.50439453125, -3.869140625, -2.23388671875, -0.5986328125, 1.03662109375, 2.671875, 4.30712890625, 5.9423828125, 7.57763671875, 9.212890625, 10.84814453125, 12.4833984375, 14.11865234375, 15.75390625, 17.38916015625, 19.0244140625, 20.65966796875, 22.294921875, 23.93017578125, 25.5654296875, 27.20068359375, 28.8359375, 30.47119140625, 32.1064453125, 33.74169921875, 35.376953125, 37.01220703125, 38.6474609375, 40.28271484375, 41.91796875, 43.55322265625, 45.1884765625, 46.82373046875, 48.458984375, 50.09423828125, 51.7294921875, 53.36474609375, 55.0]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 3.0, 5.0, 4.0, 3.0, 7.0, 5.0, 16.0, 15.0, 46.0, 49.0, 125.0, 355.0, 1512.0, 1354.0, 352.0, 97.0, 52.0, 32.0, 13.0, 16.0, 10.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-28.40625, -27.658447265625, -26.91064453125, -26.162841796875, -25.4150390625, -24.667236328125, -23.91943359375, -23.171630859375, -22.423828125, -21.676025390625, -20.92822265625, -20.180419921875, -19.4326171875, -18.684814453125, -17.93701171875, -17.189208984375, -16.44140625, -15.693603515625, -14.94580078125, -14.197998046875, -13.4501953125, -12.702392578125, -11.95458984375, -11.206787109375, -10.458984375, -9.711181640625, -8.96337890625, -8.215576171875, -7.4677734375, -6.719970703125, -5.97216796875, -5.224365234375, -4.4765625, -3.728759765625, -2.98095703125, -2.233154296875, -1.4853515625, -0.737548828125, 0.01025390625, 0.758056640625, 1.505859375, 2.253662109375, 3.00146484375, 3.749267578125, 4.4970703125, 5.244873046875, 5.99267578125, 6.740478515625, 7.48828125, 8.236083984375, 8.98388671875, 9.731689453125, 10.4794921875, 11.227294921875, 11.97509765625, 12.722900390625, 13.470703125, 14.218505859375, 14.96630859375, 15.714111328125, 16.4619140625, 17.209716796875, 17.95751953125, 18.705322265625, 19.453125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 0.0, 4.0, 5.0, 12.0, 38.0, 145.0, 496.0, 238.0, 54.0, 9.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-499.31146240234375, -486.387939453125, -473.4644470214844, -460.5409240722656, -447.6174011230469, -434.69390869140625, -421.7703857421875, -408.84686279296875, -395.92333984375, -382.99981689453125, -370.0763244628906, -357.1528015136719, -344.2292785644531, -331.3057861328125, -318.38226318359375, -305.458740234375, -292.5352478027344, -279.6117248535156, -266.688232421875, -253.76470947265625, -240.8411865234375, -227.9176788330078, -214.99417114257812, -202.07064819335938, -189.1471405029297, -176.2236328125, -163.30010986328125, -150.37660217285156, -137.45309448242188, -124.52957153320312, -111.60606384277344, -98.68254852294922, -85.75906372070312, -72.8355484008789, -59.91203689575195, -46.988525390625, -34.06501007080078, -21.141494750976562, -8.217987060546875, 4.705528259277344, 17.629043579101562, 30.55255699157715, 43.476070404052734, 56.39958190917969, 69.3230972290039, 82.24661254882812, 95.17012023925781, 108.09363555908203, 121.01715087890625, 133.94065856933594, 146.8641815185547, 159.78768920898438, 172.71121215820312, 185.6347198486328, 198.5582275390625, 211.48175048828125, 224.40525817871094, 237.32876586914062, 250.25228881835938, 263.17578125, 276.09930419921875, 289.0228271484375, 301.94635009765625, 314.8698425292969, 327.7933654785156]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 6.0, 9.0, 16.0, 25.0, 56.0, 75.0, 104.0, 106.0, 118.0, 112.0, 102.0, 110.0, 71.0, 46.0, 21.0, 14.0, 8.0, 6.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-185.2910919189453, -180.87242126464844, -176.4537353515625, -172.03506469726562, -167.6163787841797, -163.1977081298828, -158.77902221679688, -154.3603515625, -149.94166564941406, -145.5229949951172, -141.10430908203125, -136.68563842773438, -132.26695251464844, -127.84827423095703, -123.42959594726562, -119.01092529296875, -114.59224700927734, -110.17356872558594, -105.75489044189453, -101.33621215820312, -96.91753387451172, -92.49885559082031, -88.08018493652344, -83.6614990234375, -79.24282836914062, -74.82415008544922, -70.40547180175781, -65.9867935180664, -61.568115234375, -57.149436950683594, -52.73076248168945, -48.31208419799805, -43.893402099609375, -39.47472381591797, -35.05604553222656, -30.63736915588379, -26.218690872192383, -21.800012588500977, -17.381336212158203, -12.962657928466797, -8.54397964477539, -4.125301837921143, 0.29337596893310547, 4.712053298950195, 9.130731582641602, 13.549409866333008, 17.96808624267578, 22.386764526367188, 26.805442810058594, 31.22412109375, 35.642799377441406, 40.06147766113281, 44.48015594482422, 48.898834228515625, 53.317508697509766, 57.73618698120117, 62.15486526489258, 66.57353973388672, 70.99221801757812, 75.41089630126953, 79.82957458496094, 84.24825286865234, 88.66693115234375, 93.08560943603516, 97.50428771972656]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 5.0, 5.0, 3.0, 5.0, 7.0, 9.0, 15.0, 25.0, 24.0, 32.0, 46.0, 70.0, 106.0, 181.0, 319.0, 719.0, 1892.0, 5800.0, 20584.0, 88750.0, 416790.0, 399890.0, 84503.0, 19814.0, 5560.0, 1850.0, 698.0, 357.0, 151.0, 103.0, 65.0, 54.0, 40.0, 20.0, 16.0, 18.0, 7.0, 8.0, 5.0, 5.0, 1.0, 4.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.5, -15.94970703125, -15.3994140625, -14.84912109375, -14.298828125, -13.74853515625, -13.1982421875, -12.64794921875, -12.09765625, -11.54736328125, -10.9970703125, -10.44677734375, -9.896484375, -9.34619140625, -8.7958984375, -8.24560546875, -7.6953125, -7.14501953125, -6.5947265625, -6.04443359375, -5.494140625, -4.94384765625, -4.3935546875, -3.84326171875, -3.29296875, -2.74267578125, -2.1923828125, -1.64208984375, -1.091796875, -0.54150390625, 0.0087890625, 0.55908203125, 1.109375, 1.65966796875, 2.2099609375, 2.76025390625, 3.310546875, 3.86083984375, 4.4111328125, 4.96142578125, 5.51171875, 6.06201171875, 6.6123046875, 7.16259765625, 7.712890625, 8.26318359375, 8.8134765625, 9.36376953125, 9.9140625, 10.46435546875, 11.0146484375, 11.56494140625, 12.115234375, 12.66552734375, 13.2158203125, 13.76611328125, 14.31640625, 14.86669921875, 15.4169921875, 15.96728515625, 16.517578125, 17.06787109375, 17.6181640625, 18.16845703125, 18.71875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 6.0, 8.0, 3.0, 9.0, 10.0, 21.0, 24.0, 20.0, 40.0, 39.0, 50.0, 74.0, 60.0, 73.0, 81.0, 67.0, 67.0, 67.0, 75.0, 52.0, 43.0, 39.0, 29.0, 23.0, 11.0, 2.0, 9.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6953125, -6.444580078125, -6.19384765625, -5.943115234375, -5.6923828125, -5.441650390625, -5.19091796875, -4.940185546875, -4.689453125, -4.438720703125, -4.18798828125, -3.937255859375, -3.6865234375, -3.435791015625, -3.18505859375, -2.934326171875, -2.68359375, -2.432861328125, -2.18212890625, -1.931396484375, -1.6806640625, -1.429931640625, -1.17919921875, -0.928466796875, -0.677734375, -0.427001953125, -0.17626953125, 0.074462890625, 0.3251953125, 0.575927734375, 0.82666015625, 1.077392578125, 1.328125, 1.578857421875, 1.82958984375, 2.080322265625, 2.3310546875, 2.581787109375, 2.83251953125, 3.083251953125, 3.333984375, 3.584716796875, 3.83544921875, 4.086181640625, 4.3369140625, 4.587646484375, 4.83837890625, 5.089111328125, 5.33984375, 5.590576171875, 5.84130859375, 6.092041015625, 6.3427734375, 6.593505859375, 6.84423828125, 7.094970703125, 7.345703125, 7.596435546875, 7.84716796875, 8.097900390625, 8.3486328125, 8.599365234375, 8.85009765625, 9.100830078125, 9.3515625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 0.0, 3.0, 1.0, 5.0, 0.0, 9.0, 10.0, 15.0, 13.0, 31.0, 46.0, 62.0, 117.0, 189.0, 388.0, 908.0, 2130.0, 6444.0, 25070.0, 142922.0, 705152.0, 131401.0, 23957.0, 6074.0, 1971.0, 763.0, 374.0, 185.0, 104.0, 76.0, 49.0, 22.0, 22.0, 15.0, 11.0, 4.0, 2.0, 4.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-18.703125, -18.04638671875, -17.3896484375, -16.73291015625, -16.076171875, -15.41943359375, -14.7626953125, -14.10595703125, -13.44921875, -12.79248046875, -12.1357421875, -11.47900390625, -10.822265625, -10.16552734375, -9.5087890625, -8.85205078125, -8.1953125, -7.53857421875, -6.8818359375, -6.22509765625, -5.568359375, -4.91162109375, -4.2548828125, -3.59814453125, -2.94140625, -2.28466796875, -1.6279296875, -0.97119140625, -0.314453125, 0.34228515625, 0.9990234375, 1.65576171875, 2.3125, 2.96923828125, 3.6259765625, 4.28271484375, 4.939453125, 5.59619140625, 6.2529296875, 6.90966796875, 7.56640625, 8.22314453125, 8.8798828125, 9.53662109375, 10.193359375, 10.85009765625, 11.5068359375, 12.16357421875, 12.8203125, 13.47705078125, 14.1337890625, 14.79052734375, 15.447265625, 16.10400390625, 16.7607421875, 17.41748046875, 18.07421875, 18.73095703125, 19.3876953125, 20.04443359375, 20.701171875, 21.35791015625, 22.0146484375, 22.67138671875, 23.328125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 5.0, 5.0, 3.0, 8.0, 15.0, 16.0, 14.0, 18.0, 21.0, 19.0, 29.0, 32.0, 30.0, 42.0, 52.0, 38.0, 54.0, 44.0, 72.0, 47.0, 64.0, 56.0, 41.0, 47.0, 35.0, 25.0, 26.0, 18.0, 25.0, 16.0, 21.0, 17.0, 13.0, 9.0, 11.0, 4.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.140625, -20.532470703125, -19.92431640625, -19.316162109375, -18.7080078125, -18.099853515625, -17.49169921875, -16.883544921875, -16.275390625, -15.667236328125, -15.05908203125, -14.450927734375, -13.8427734375, -13.234619140625, -12.62646484375, -12.018310546875, -11.41015625, -10.802001953125, -10.19384765625, -9.585693359375, -8.9775390625, -8.369384765625, -7.76123046875, -7.153076171875, -6.544921875, -5.936767578125, -5.32861328125, -4.720458984375, -4.1123046875, -3.504150390625, -2.89599609375, -2.287841796875, -1.6796875, -1.071533203125, -0.46337890625, 0.144775390625, 0.7529296875, 1.361083984375, 1.96923828125, 2.577392578125, 3.185546875, 3.793701171875, 4.40185546875, 5.010009765625, 5.6181640625, 6.226318359375, 6.83447265625, 7.442626953125, 8.05078125, 8.658935546875, 9.26708984375, 9.875244140625, 10.4833984375, 11.091552734375, 11.69970703125, 12.307861328125, 12.916015625, 13.524169921875, 14.13232421875, 14.740478515625, 15.3486328125, 15.956787109375, 16.56494140625, 17.173095703125, 17.78125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 5.0, 5.0, 5.0, 7.0, 8.0, 21.0, 14.0, 32.0, 43.0, 67.0, 109.0, 169.0, 293.0, 569.0, 1007.0, 2160.0, 4761.0, 11764.0, 34432.0, 117818.0, 547521.0, 229541.0, 63895.0, 20256.0, 7521.0, 3218.0, 1502.0, 772.0, 405.0, 245.0, 141.0, 90.0, 56.0, 38.0, 24.0, 18.0, 8.0, 3.0, 6.0, 3.0, 3.0, 3.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-5.37109375, -5.2249755859375, -5.078857421875, -4.9327392578125, -4.78662109375, -4.6405029296875, -4.494384765625, -4.3482666015625, -4.2021484375, -4.0560302734375, -3.909912109375, -3.7637939453125, -3.61767578125, -3.4715576171875, -3.325439453125, -3.1793212890625, -3.033203125, -2.8870849609375, -2.740966796875, -2.5948486328125, -2.44873046875, -2.3026123046875, -2.156494140625, -2.0103759765625, -1.8642578125, -1.7181396484375, -1.572021484375, -1.4259033203125, -1.27978515625, -1.1336669921875, -0.987548828125, -0.8414306640625, -0.6953125, -0.5491943359375, -0.403076171875, -0.2569580078125, -0.11083984375, 0.0352783203125, 0.181396484375, 0.3275146484375, 0.4736328125, 0.6197509765625, 0.765869140625, 0.9119873046875, 1.05810546875, 1.2042236328125, 1.350341796875, 1.4964599609375, 1.642578125, 1.7886962890625, 1.934814453125, 2.0809326171875, 2.22705078125, 2.3731689453125, 2.519287109375, 2.6654052734375, 2.8115234375, 2.9576416015625, 3.103759765625, 3.2498779296875, 3.39599609375, 3.5421142578125, 3.688232421875, 3.8343505859375, 3.98046875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 7.0, 3.0, 3.0, 7.0, 11.0, 21.0, 23.0, 61.0, 94.0, 145.0, 177.0, 155.0, 124.0, 70.0, 40.0, 21.0, 16.0, 11.0, 5.0, 3.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0027141571044921875, -0.00261610746383667, -0.0025180578231811523, -0.0024200081825256348, -0.002321958541870117, -0.0022239089012145996, -0.002125859260559082, -0.0020278096199035645, -0.0019297599792480469, -0.0018317103385925293, -0.0017336606979370117, -0.0016356110572814941, -0.0015375614166259766, -0.001439511775970459, -0.0013414621353149414, -0.0012434124946594238, -0.0011453628540039062, -0.0010473132133483887, -0.0009492635726928711, -0.0008512139320373535, -0.0007531642913818359, -0.0006551146507263184, -0.0005570650100708008, -0.0004590153694152832, -0.0003609657287597656, -0.00026291608810424805, -0.00016486644744873047, -6.681680679321289e-05, 3.123283386230469e-05, 0.00012928247451782227, 0.00022733211517333984, 0.0003253817558288574, 0.000423431396484375, 0.0005214810371398926, 0.0006195306777954102, 0.0007175803184509277, 0.0008156299591064453, 0.0009136795997619629, 0.0010117292404174805, 0.001109778881072998, 0.0012078285217285156, 0.0013058781623840332, 0.0014039278030395508, 0.0015019774436950684, 0.001600027084350586, 0.0016980767250061035, 0.001796126365661621, 0.0018941760063171387, 0.0019922256469726562, 0.002090275287628174, 0.0021883249282836914, 0.002286374568939209, 0.0023844242095947266, 0.002482473850250244, 0.0025805234909057617, 0.0026785731315612793, 0.002776622772216797, 0.0028746724128723145, 0.002972722053527832, 0.0030707716941833496, 0.003168821334838867, 0.0032668709754943848, 0.0033649206161499023, 0.00346297025680542, 0.0035610198974609375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 6.0, 5.0, 7.0, 12.0, 23.0, 31.0, 39.0, 98.0, 137.0, 317.0, 622.0, 1262.0, 3181.0, 10019.0, 47333.0, 371450.0, 545934.0, 51603.0, 10574.0, 3334.0, 1288.0, 610.0, 301.0, 137.0, 86.0, 56.0, 36.0, 17.0, 22.0, 4.0, 4.0, 4.0, 6.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.89453125, -7.64801025390625, -7.4014892578125, -7.15496826171875, -6.908447265625, -6.66192626953125, -6.4154052734375, -6.16888427734375, -5.92236328125, -5.67584228515625, -5.4293212890625, -5.18280029296875, -4.936279296875, -4.68975830078125, -4.4432373046875, -4.19671630859375, -3.9501953125, -3.70367431640625, -3.4571533203125, -3.21063232421875, -2.964111328125, -2.71759033203125, -2.4710693359375, -2.22454833984375, -1.97802734375, -1.73150634765625, -1.4849853515625, -1.23846435546875, -0.991943359375, -0.74542236328125, -0.4989013671875, -0.25238037109375, -0.005859375, 0.24066162109375, 0.4871826171875, 0.73370361328125, 0.980224609375, 1.22674560546875, 1.4732666015625, 1.71978759765625, 1.96630859375, 2.21282958984375, 2.4593505859375, 2.70587158203125, 2.952392578125, 3.19891357421875, 3.4454345703125, 3.69195556640625, 3.9384765625, 4.18499755859375, 4.4315185546875, 4.67803955078125, 4.924560546875, 5.17108154296875, 5.4176025390625, 5.66412353515625, 5.91064453125, 6.15716552734375, 6.4036865234375, 6.65020751953125, 6.896728515625, 7.14324951171875, 7.3897705078125, 7.63629150390625, 7.8828125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 2.0, 4.0, 14.0, 7.0, 16.0, 20.0, 23.0, 36.0, 56.0, 48.0, 63.0, 69.0, 86.0, 87.0, 91.0, 75.0, 62.0, 53.0, 40.0, 39.0, 27.0, 20.0, 14.0, 10.0, 8.0, 5.0, 6.0, 2.0, 3.0, 7.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.125, -4.93402099609375, -4.7430419921875, -4.55206298828125, -4.361083984375, -4.17010498046875, -3.9791259765625, -3.78814697265625, -3.59716796875, -3.40618896484375, -3.2152099609375, -3.02423095703125, -2.833251953125, -2.64227294921875, -2.4512939453125, -2.26031494140625, -2.0693359375, -1.87835693359375, -1.6873779296875, -1.49639892578125, -1.305419921875, -1.11444091796875, -0.9234619140625, -0.73248291015625, -0.54150390625, -0.35052490234375, -0.1595458984375, 0.03143310546875, 0.222412109375, 0.41339111328125, 0.6043701171875, 0.79534912109375, 0.986328125, 1.17730712890625, 1.3682861328125, 1.55926513671875, 1.750244140625, 1.94122314453125, 2.1322021484375, 2.32318115234375, 2.51416015625, 2.70513916015625, 2.8961181640625, 3.08709716796875, 3.278076171875, 3.46905517578125, 3.6600341796875, 3.85101318359375, 4.0419921875, 4.23297119140625, 4.4239501953125, 4.61492919921875, 4.805908203125, 4.99688720703125, 5.1878662109375, 5.37884521484375, 5.56982421875, 5.76080322265625, 5.9517822265625, 6.14276123046875, 6.333740234375, 6.52471923828125, 6.7156982421875, 6.90667724609375, 7.09765625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 3.0, 1.0, 2.0, 7.0, 8.0, 12.0, 14.0, 27.0, 43.0, 84.0, 107.0, 243.0, 207.0, 115.0, 59.0, 27.0, 13.0, 15.0, 4.0, 6.0, 5.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-114.07264709472656, -109.68798828125, -105.30332946777344, -100.91867065429688, -96.53401184082031, -92.14935302734375, -87.76469421386719, -83.38003540039062, -78.99537658691406, -74.6107177734375, -70.22605895996094, -65.84140014648438, -61.45674133300781, -57.07208251953125, -52.68742370605469, -48.302764892578125, -43.91810607910156, -39.533447265625, -35.14878845214844, -30.764129638671875, -26.379470825195312, -21.99481201171875, -17.610153198242188, -13.225494384765625, -8.840835571289062, -4.4561767578125, -0.0715179443359375, 4.313140869140625, 8.697799682617188, 13.08245849609375, 17.467117309570312, 21.851776123046875, 26.2364501953125, 30.621109008789062, 35.005767822265625, 39.39042663574219, 43.77508544921875, 48.15974426269531, 52.544403076171875, 56.92906188964844, 61.313720703125, 65.69837951660156, 70.08303833007812, 74.46769714355469, 78.85235595703125, 83.23701477050781, 87.62167358398438, 92.00633239746094, 96.3909912109375, 100.77565002441406, 105.16030883789062, 109.54496765136719, 113.92962646484375, 118.31428527832031, 122.69894409179688, 127.08360290527344, 131.46826171875, 135.85292053222656, 140.23757934570312, 144.6222381591797, 149.00689697265625, 153.3915557861328, 157.77621459960938, 162.16087341308594, 166.5455322265625]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 7.0, 4.0, 5.0, 6.0, 7.0, 5.0, 8.0, 8.0, 16.0, 19.0, 22.0, 25.0, 12.0, 24.0, 18.0, 23.0, 25.0, 37.0, 37.0, 55.0, 58.0, 70.0, 81.0, 51.0, 57.0, 29.0, 28.0, 33.0, 22.0, 26.0, 23.0, 15.0, 18.0, 21.0, 16.0, 19.0, 14.0, 13.0, 7.0, 9.0, 6.0, 4.0, 6.0, 6.0, 2.0, 5.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-67.41326141357422, -65.29957580566406, -63.185890197753906, -61.07220458984375, -58.958518981933594, -56.84483337402344, -54.731143951416016, -52.61745834350586, -50.5037727355957, -48.39008712768555, -46.27640151977539, -44.162715911865234, -42.04902648925781, -39.935340881347656, -37.8216552734375, -35.707969665527344, -33.59428405761719, -31.48059844970703, -29.366912841796875, -27.253225326538086, -25.13953971862793, -23.025854110717773, -20.912166595458984, -18.798480987548828, -16.684795379638672, -14.571109771728516, -12.457423210144043, -10.34373664855957, -8.230051040649414, -6.116365432739258, -4.002678871154785, -1.8889923095703125, 0.2246856689453125, 2.338371753692627, 4.452057838439941, 6.565743923187256, 8.67943000793457, 10.793115615844727, 12.9068021774292, 15.020488739013672, 17.134174346923828, 19.247859954833984, 21.36154556274414, 23.47523307800293, 25.588918685913086, 27.702604293823242, 29.81629180908203, 31.929977416992188, 34.043663024902344, 36.1573486328125, 38.271034240722656, 40.38471984863281, 42.49840545654297, 44.612091064453125, 46.72578048706055, 48.8394660949707, 50.95315170288086, 53.066837310791016, 55.18052291870117, 57.29420852661133, 59.40789794921875, 61.521583557128906, 63.63526916503906, 65.74895477294922, 67.86264038085938]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 4.0, 8.0, 6.0, 9.0, 16.0, 15.0, 26.0, 51.0, 89.0, 174.0, 404.0, 1025.0, 4016.0, 38227.0, 4076819.0, 66782.0, 4625.0, 1087.0, 404.0, 229.0, 93.0, 49.0, 30.0, 27.0, 20.0, 8.0, 10.0, 15.0, 3.0, 1.0, 2.0, 4.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.984375, -26.889892578125, -25.79541015625, -24.700927734375, -23.6064453125, -22.511962890625, -21.41748046875, -20.322998046875, -19.228515625, -18.134033203125, -17.03955078125, -15.945068359375, -14.8505859375, -13.756103515625, -12.66162109375, -11.567138671875, -10.47265625, -9.378173828125, -8.28369140625, -7.189208984375, -6.0947265625, -5.000244140625, -3.90576171875, -2.811279296875, -1.716796875, -0.622314453125, 0.47216796875, 1.566650390625, 2.6611328125, 3.755615234375, 4.85009765625, 5.944580078125, 7.0390625, 8.133544921875, 9.22802734375, 10.322509765625, 11.4169921875, 12.511474609375, 13.60595703125, 14.700439453125, 15.794921875, 16.889404296875, 17.98388671875, 19.078369140625, 20.1728515625, 21.267333984375, 22.36181640625, 23.456298828125, 24.55078125, 25.645263671875, 26.73974609375, 27.834228515625, 28.9287109375, 30.023193359375, 31.11767578125, 32.212158203125, 33.306640625, 34.401123046875, 35.49560546875, 36.590087890625, 37.6845703125, 38.779052734375, 39.87353515625, 40.968017578125, 42.0625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 5.0, 3.0, 3.0, 3.0, 4.0, 15.0, 9.0, 17.0, 21.0, 18.0, 15.0, 31.0, 26.0, 44.0, 48.0, 46.0, 58.0, 61.0, 62.0, 62.0, 70.0, 48.0, 49.0, 47.0, 45.0, 34.0, 39.0, 26.0, 16.0, 21.0, 20.0, 15.0, 8.0, 7.0, 3.0, 6.0, 0.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.21484375, -5.02288818359375, -4.8309326171875, -4.63897705078125, -4.447021484375, -4.25506591796875, -4.0631103515625, -3.87115478515625, -3.67919921875, -3.48724365234375, -3.2952880859375, -3.10333251953125, -2.911376953125, -2.71942138671875, -2.5274658203125, -2.33551025390625, -2.1435546875, -1.95159912109375, -1.7596435546875, -1.56768798828125, -1.375732421875, -1.18377685546875, -0.9918212890625, -0.79986572265625, -0.60791015625, -0.41595458984375, -0.2239990234375, -0.03204345703125, 0.159912109375, 0.35186767578125, 0.5438232421875, 0.73577880859375, 0.927734375, 1.11968994140625, 1.3116455078125, 1.50360107421875, 1.695556640625, 1.88751220703125, 2.0794677734375, 2.27142333984375, 2.46337890625, 2.65533447265625, 2.8472900390625, 3.03924560546875, 3.231201171875, 3.42315673828125, 3.6151123046875, 3.80706787109375, 3.9990234375, 4.19097900390625, 4.3829345703125, 4.57489013671875, 4.766845703125, 4.95880126953125, 5.1507568359375, 5.34271240234375, 5.53466796875, 5.72662353515625, 5.9185791015625, 6.11053466796875, 6.302490234375, 6.49444580078125, 6.6864013671875, 6.87835693359375, 7.0703125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 11.0, 8.0, 29.0, 38.0, 80.0, 281.0, 1172.0, 15874.0, 4137523.0, 37065.0, 1641.0, 341.0, 119.0, 48.0, 22.0, 12.0, 8.0, 5.0, 4.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.6875, -57.6708984375, -55.654296875, -53.6376953125, -51.62109375, -49.6044921875, -47.587890625, -45.5712890625, -43.5546875, -41.5380859375, -39.521484375, -37.5048828125, -35.48828125, -33.4716796875, -31.455078125, -29.4384765625, -27.421875, -25.4052734375, -23.388671875, -21.3720703125, -19.35546875, -17.3388671875, -15.322265625, -13.3056640625, -11.2890625, -9.2724609375, -7.255859375, -5.2392578125, -3.22265625, -1.2060546875, 0.810546875, 2.8271484375, 4.84375, 6.8603515625, 8.876953125, 10.8935546875, 12.91015625, 14.9267578125, 16.943359375, 18.9599609375, 20.9765625, 22.9931640625, 25.009765625, 27.0263671875, 29.04296875, 31.0595703125, 33.076171875, 35.0927734375, 37.109375, 39.1259765625, 41.142578125, 43.1591796875, 45.17578125, 47.1923828125, 49.208984375, 51.2255859375, 53.2421875, 55.2587890625, 57.275390625, 59.2919921875, 61.30859375, 63.3251953125, 65.341796875, 67.3583984375, 69.375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 3.0, 4.0, 7.0, 10.0, 12.0, 15.0, 29.0, 44.0, 72.0, 169.0, 441.0, 1272.0, 1256.0, 403.0, 135.0, 75.0, 41.0, 26.0, 20.0, 17.0, 8.0, 4.0, 8.0, 1.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0], "bins": [-31.328125, -30.632568359375, -29.93701171875, -29.241455078125, -28.5458984375, -27.850341796875, -27.15478515625, -26.459228515625, -25.763671875, -25.068115234375, -24.37255859375, -23.677001953125, -22.9814453125, -22.285888671875, -21.59033203125, -20.894775390625, -20.19921875, -19.503662109375, -18.80810546875, -18.112548828125, -17.4169921875, -16.721435546875, -16.02587890625, -15.330322265625, -14.634765625, -13.939208984375, -13.24365234375, -12.548095703125, -11.8525390625, -11.156982421875, -10.46142578125, -9.765869140625, -9.0703125, -8.374755859375, -7.67919921875, -6.983642578125, -6.2880859375, -5.592529296875, -4.89697265625, -4.201416015625, -3.505859375, -2.810302734375, -2.11474609375, -1.419189453125, -0.7236328125, -0.028076171875, 0.66748046875, 1.363037109375, 2.05859375, 2.754150390625, 3.44970703125, 4.145263671875, 4.8408203125, 5.536376953125, 6.23193359375, 6.927490234375, 7.623046875, 8.318603515625, 9.01416015625, 9.709716796875, 10.4052734375, 11.100830078125, 11.79638671875, 12.491943359375, 13.1875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 8.0, 6.0, 24.0, 49.0, 145.0, 357.0, 278.0, 95.0, 30.0, 6.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-370.10137939453125, -361.2460021972656, -352.390625, -343.53521728515625, -334.6798400878906, -325.824462890625, -316.9690856933594, -308.11370849609375, -299.25830078125, -290.4029235839844, -281.54754638671875, -272.692138671875, -263.8367614746094, -254.98138427734375, -246.12600708007812, -237.2706298828125, -228.41525268554688, -219.55987548828125, -210.70448303222656, -201.84910583496094, -192.99371337890625, -184.13833618164062, -175.282958984375, -166.42758178710938, -157.5721893310547, -148.71681213378906, -139.86141967773438, -131.00604248046875, -122.1506576538086, -113.29527282714844, -104.43989562988281, -95.58451080322266, -86.7291259765625, -77.87374114990234, -69.01835632324219, -60.16297912597656, -51.307594299316406, -42.45220947265625, -33.59682846069336, -24.74144744873047, -15.886062622070312, -7.030679702758789, 1.8247032165527344, 10.680086135864258, 19.53546905517578, 28.390853881835938, 37.24623489379883, 46.10161590576172, 54.957000732421875, 63.81238555908203, 72.66777038574219, 81.52314758300781, 90.37853240966797, 99.23391723632812, 108.08929443359375, 116.9446792602539, 125.80006408691406, 134.6554412841797, 143.51083374023438, 152.3662109375, 161.22158813476562, 170.0769805908203, 178.93235778808594, 187.78775024414062, 196.64312744140625]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 5.0, 4.0, 2.0, 7.0, 5.0, 7.0, 13.0, 16.0, 25.0, 40.0, 33.0, 33.0, 48.0, 42.0, 52.0, 64.0, 44.0, 64.0, 65.0, 64.0, 51.0, 63.0, 56.0, 39.0, 36.0, 29.0, 29.0, 21.0, 16.0, 14.0, 8.0, 6.0, 4.0, 2.0, 4.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.507728576660156, -50.88240051269531, -48.257076263427734, -45.631752014160156, -43.00642395019531, -40.38109588623047, -37.75577163696289, -35.13044738769531, -32.50511932373047, -29.879793167114258, -27.254467010498047, -24.629140853881836, -22.003814697265625, -19.378488540649414, -16.753162384033203, -14.127836227416992, -11.502510070800781, -8.87718391418457, -6.251857757568359, -3.6265316009521484, -1.0012054443359375, 1.6241207122802734, 4.249446868896484, 6.874773025512695, 9.500099182128906, 12.125425338745117, 14.750751495361328, 17.37607765197754, 20.00140380859375, 22.62672996520996, 25.252056121826172, 27.877382278442383, 30.502716064453125, 33.12804412841797, 35.75336837768555, 38.378692626953125, 41.00402069091797, 43.62934875488281, 46.25467300415039, 48.87999725341797, 51.50532531738281, 54.130653381347656, 56.755977630615234, 59.38130187988281, 62.006629943847656, 64.6319580078125, 67.25727844238281, 69.88260650634766, 72.5079345703125, 75.13326263427734, 77.75859069824219, 80.3839111328125, 83.00923919677734, 85.63456726074219, 88.2598876953125, 90.88521575927734, 93.51054382324219, 96.13587188720703, 98.76119995117188, 101.38652038574219, 104.01184844970703, 106.63717651367188, 109.26249694824219, 111.88782501220703, 114.51315307617188]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 3.0, 11.0, 12.0, 20.0, 24.0, 42.0, 57.0, 105.0, 239.0, 565.0, 1369.0, 3835.0, 13551.0, 62005.0, 453556.0, 434106.0, 59748.0, 13094.0, 3844.0, 1305.0, 536.0, 227.0, 97.0, 63.0, 38.0, 28.0, 18.0, 8.0, 18.0, 10.0, 2.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.796875, -26.031005859375, -25.26513671875, -24.499267578125, -23.7333984375, -22.967529296875, -22.20166015625, -21.435791015625, -20.669921875, -19.904052734375, -19.13818359375, -18.372314453125, -17.6064453125, -16.840576171875, -16.07470703125, -15.308837890625, -14.54296875, -13.777099609375, -13.01123046875, -12.245361328125, -11.4794921875, -10.713623046875, -9.94775390625, -9.181884765625, -8.416015625, -7.650146484375, -6.88427734375, -6.118408203125, -5.3525390625, -4.586669921875, -3.82080078125, -3.054931640625, -2.2890625, -1.523193359375, -0.75732421875, 0.008544921875, 0.7744140625, 1.540283203125, 2.30615234375, 3.072021484375, 3.837890625, 4.603759765625, 5.36962890625, 6.135498046875, 6.9013671875, 7.667236328125, 8.43310546875, 9.198974609375, 9.96484375, 10.730712890625, 11.49658203125, 12.262451171875, 13.0283203125, 13.794189453125, 14.56005859375, 15.325927734375, 16.091796875, 16.857666015625, 17.62353515625, 18.389404296875, 19.1552734375, 19.921142578125, 20.68701171875, 21.452880859375, 22.21875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 4.0, 4.0, 2.0, 5.0, 7.0, 11.0, 10.0, 4.0, 10.0, 25.0, 19.0, 21.0, 29.0, 26.0, 34.0, 40.0, 46.0, 47.0, 58.0, 55.0, 45.0, 65.0, 48.0, 57.0, 48.0, 35.0, 46.0, 31.0, 35.0, 30.0, 16.0, 17.0, 19.0, 11.0, 10.0, 4.0, 10.0, 3.0, 3.0, 6.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.12890625, -4.93731689453125, -4.7457275390625, -4.55413818359375, -4.362548828125, -4.17095947265625, -3.9793701171875, -3.78778076171875, -3.59619140625, -3.40460205078125, -3.2130126953125, -3.02142333984375, -2.829833984375, -2.63824462890625, -2.4466552734375, -2.25506591796875, -2.0634765625, -1.87188720703125, -1.6802978515625, -1.48870849609375, -1.297119140625, -1.10552978515625, -0.9139404296875, -0.72235107421875, -0.53076171875, -0.33917236328125, -0.1475830078125, 0.04400634765625, 0.235595703125, 0.42718505859375, 0.6187744140625, 0.81036376953125, 1.001953125, 1.19354248046875, 1.3851318359375, 1.57672119140625, 1.768310546875, 1.95989990234375, 2.1514892578125, 2.34307861328125, 2.53466796875, 2.72625732421875, 2.9178466796875, 3.10943603515625, 3.301025390625, 3.49261474609375, 3.6842041015625, 3.87579345703125, 4.0673828125, 4.25897216796875, 4.4505615234375, 4.64215087890625, 4.833740234375, 5.02532958984375, 5.2169189453125, 5.40850830078125, 5.60009765625, 5.79168701171875, 5.9832763671875, 6.17486572265625, 6.366455078125, 6.55804443359375, 6.7496337890625, 6.94122314453125, 7.1328125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 5.0, 11.0, 11.0, 23.0, 29.0, 45.0, 76.0, 132.0, 253.0, 404.0, 1046.0, 3320.0, 13112.0, 86666.0, 813140.0, 108972.0, 15359.0, 3678.0, 1252.0, 446.0, 233.0, 135.0, 76.0, 54.0, 21.0, 26.0, 8.0, 12.0, 4.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.796875, -21.828857421875, -20.86083984375, -19.892822265625, -18.9248046875, -17.956787109375, -16.98876953125, -16.020751953125, -15.052734375, -14.084716796875, -13.11669921875, -12.148681640625, -11.1806640625, -10.212646484375, -9.24462890625, -8.276611328125, -7.30859375, -6.340576171875, -5.37255859375, -4.404541015625, -3.4365234375, -2.468505859375, -1.50048828125, -0.532470703125, 0.435546875, 1.403564453125, 2.37158203125, 3.339599609375, 4.3076171875, 5.275634765625, 6.24365234375, 7.211669921875, 8.1796875, 9.147705078125, 10.11572265625, 11.083740234375, 12.0517578125, 13.019775390625, 13.98779296875, 14.955810546875, 15.923828125, 16.891845703125, 17.85986328125, 18.827880859375, 19.7958984375, 20.763916015625, 21.73193359375, 22.699951171875, 23.66796875, 24.635986328125, 25.60400390625, 26.572021484375, 27.5400390625, 28.508056640625, 29.47607421875, 30.444091796875, 31.412109375, 32.380126953125, 33.34814453125, 34.316162109375, 35.2841796875, 36.252197265625, 37.22021484375, 38.188232421875, 39.15625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 3.0, 3.0, 5.0, 6.0, 8.0, 5.0, 7.0, 14.0, 20.0, 20.0, 36.0, 38.0, 45.0, 58.0, 58.0, 64.0, 64.0, 62.0, 47.0, 70.0, 56.0, 60.0, 34.0, 45.0, 34.0, 26.0, 29.0, 17.0, 8.0, 16.0, 12.0, 8.0, 5.0, 6.0, 3.0, 1.0, 2.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.0625, -29.175537109375, -28.28857421875, -27.401611328125, -26.5146484375, -25.627685546875, -24.74072265625, -23.853759765625, -22.966796875, -22.079833984375, -21.19287109375, -20.305908203125, -19.4189453125, -18.531982421875, -17.64501953125, -16.758056640625, -15.87109375, -14.984130859375, -14.09716796875, -13.210205078125, -12.3232421875, -11.436279296875, -10.54931640625, -9.662353515625, -8.775390625, -7.888427734375, -7.00146484375, -6.114501953125, -5.2275390625, -4.340576171875, -3.45361328125, -2.566650390625, -1.6796875, -0.792724609375, 0.09423828125, 0.981201171875, 1.8681640625, 2.755126953125, 3.64208984375, 4.529052734375, 5.416015625, 6.302978515625, 7.18994140625, 8.076904296875, 8.9638671875, 9.850830078125, 10.73779296875, 11.624755859375, 12.51171875, 13.398681640625, 14.28564453125, 15.172607421875, 16.0595703125, 16.946533203125, 17.83349609375, 18.720458984375, 19.607421875, 20.494384765625, 21.38134765625, 22.268310546875, 23.1552734375, 24.042236328125, 24.92919921875, 25.816162109375, 26.703125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 5.0, 4.0, 4.0, 7.0, 8.0, 8.0, 16.0, 22.0, 28.0, 47.0, 51.0, 85.0, 110.0, 191.0, 350.0, 571.0, 1057.0, 2067.0, 4742.0, 12713.0, 44287.0, 239084.0, 641694.0, 71216.0, 18173.0, 6284.0, 2604.0, 1310.0, 681.0, 416.0, 260.0, 142.0, 82.0, 74.0, 49.0, 28.0, 16.0, 19.0, 10.0, 10.0, 8.0, 8.0, 6.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0], "bins": [-7.44140625, -7.22357177734375, -7.0057373046875, -6.78790283203125, -6.570068359375, -6.35223388671875, -6.1343994140625, -5.91656494140625, -5.69873046875, -5.48089599609375, -5.2630615234375, -5.04522705078125, -4.827392578125, -4.60955810546875, -4.3917236328125, -4.17388916015625, -3.9560546875, -3.73822021484375, -3.5203857421875, -3.30255126953125, -3.084716796875, -2.86688232421875, -2.6490478515625, -2.43121337890625, -2.21337890625, -1.99554443359375, -1.7777099609375, -1.55987548828125, -1.342041015625, -1.12420654296875, -0.9063720703125, -0.68853759765625, -0.470703125, -0.25286865234375, -0.0350341796875, 0.18280029296875, 0.400634765625, 0.61846923828125, 0.8363037109375, 1.05413818359375, 1.27197265625, 1.48980712890625, 1.7076416015625, 1.92547607421875, 2.143310546875, 2.36114501953125, 2.5789794921875, 2.79681396484375, 3.0146484375, 3.23248291015625, 3.4503173828125, 3.66815185546875, 3.885986328125, 4.10382080078125, 4.3216552734375, 4.53948974609375, 4.75732421875, 4.97515869140625, 5.1929931640625, 5.41082763671875, 5.628662109375, 5.84649658203125, 6.0643310546875, 6.28216552734375, 6.5]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 0.0, 2.0, 5.0, 10.0, 17.0, 23.0, 27.0, 61.0, 101.0, 207.0, 230.0, 127.0, 76.0, 48.0, 22.0, 23.0, 6.0, 6.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0034961700439453125, -0.0033760368824005127, -0.003255903720855713, -0.003135770559310913, -0.0030156373977661133, -0.0028955042362213135, -0.0027753710746765137, -0.002655237913131714, -0.002535104751586914, -0.0024149715900421143, -0.0022948384284973145, -0.0021747052669525146, -0.002054572105407715, -0.001934438943862915, -0.0018143057823181152, -0.0016941726207733154, -0.0015740394592285156, -0.0014539062976837158, -0.001333773136138916, -0.0012136399745941162, -0.0010935068130493164, -0.0009733736515045166, -0.0008532404899597168, -0.000733107328414917, -0.0006129741668701172, -0.0004928410053253174, -0.0003727078437805176, -0.0002525746822357178, -0.00013244152069091797, -1.2308359146118164e-05, 0.00010782480239868164, 0.00022795796394348145, 0.00034809112548828125, 0.00046822428703308105, 0.0005883574485778809, 0.0007084906101226807, 0.0008286237716674805, 0.0009487569332122803, 0.00106889009475708, 0.0011890232563018799, 0.0013091564178466797, 0.0014292895793914795, 0.0015494227409362793, 0.001669555902481079, 0.001789689064025879, 0.0019098222255706787, 0.0020299553871154785, 0.0021500885486602783, 0.002270221710205078, 0.002390354871749878, 0.0025104880332946777, 0.0026306211948394775, 0.0027507543563842773, 0.002870887517929077, 0.002991020679473877, 0.0031111538410186768, 0.0032312870025634766, 0.0033514201641082764, 0.003471553325653076, 0.003591686487197876, 0.0037118196487426758, 0.0038319528102874756, 0.003952085971832275, 0.004072219133377075, 0.004192352294921875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 2.0, 12.0, 12.0, 28.0, 41.0, 55.0, 123.0, 233.0, 482.0, 1281.0, 3712.0, 16768.0, 152892.0, 813034.0, 48007.0, 8158.0, 2212.0, 790.0, 317.0, 164.0, 78.0, 50.0, 42.0, 19.0, 15.0, 13.0, 10.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3671875, -9.0106201171875, -8.654052734375, -8.2974853515625, -7.94091796875, -7.5843505859375, -7.227783203125, -6.8712158203125, -6.5146484375, -6.1580810546875, -5.801513671875, -5.4449462890625, -5.08837890625, -4.7318115234375, -4.375244140625, -4.0186767578125, -3.662109375, -3.3055419921875, -2.948974609375, -2.5924072265625, -2.23583984375, -1.8792724609375, -1.522705078125, -1.1661376953125, -0.8095703125, -0.4530029296875, -0.096435546875, 0.2601318359375, 0.61669921875, 0.9732666015625, 1.329833984375, 1.6864013671875, 2.04296875, 2.3995361328125, 2.756103515625, 3.1126708984375, 3.46923828125, 3.8258056640625, 4.182373046875, 4.5389404296875, 4.8955078125, 5.2520751953125, 5.608642578125, 5.9652099609375, 6.32177734375, 6.6783447265625, 7.034912109375, 7.3914794921875, 7.748046875, 8.1046142578125, 8.461181640625, 8.8177490234375, 9.17431640625, 9.5308837890625, 9.887451171875, 10.2440185546875, 10.6005859375, 10.9571533203125, 11.313720703125, 11.6702880859375, 12.02685546875, 12.3834228515625, 12.739990234375, 13.0965576171875, 13.453125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 5.0, 3.0, 4.0, 6.0, 5.0, 7.0, 8.0, 7.0, 10.0, 9.0, 12.0, 20.0, 28.0, 22.0, 31.0, 54.0, 54.0, 67.0, 74.0, 92.0, 88.0, 72.0, 75.0, 53.0, 31.0, 28.0, 23.0, 19.0, 16.0, 8.0, 10.0, 10.0, 9.0, 8.0, 9.0, 6.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.69140625, -5.51690673828125, -5.3424072265625, -5.16790771484375, -4.993408203125, -4.81890869140625, -4.6444091796875, -4.46990966796875, -4.29541015625, -4.12091064453125, -3.9464111328125, -3.77191162109375, -3.597412109375, -3.42291259765625, -3.2484130859375, -3.07391357421875, -2.8994140625, -2.72491455078125, -2.5504150390625, -2.37591552734375, -2.201416015625, -2.02691650390625, -1.8524169921875, -1.67791748046875, -1.50341796875, -1.32891845703125, -1.1544189453125, -0.97991943359375, -0.805419921875, -0.63092041015625, -0.4564208984375, -0.28192138671875, -0.107421875, 0.06707763671875, 0.2415771484375, 0.41607666015625, 0.590576171875, 0.76507568359375, 0.9395751953125, 1.11407470703125, 1.28857421875, 1.46307373046875, 1.6375732421875, 1.81207275390625, 1.986572265625, 2.16107177734375, 2.3355712890625, 2.51007080078125, 2.6845703125, 2.85906982421875, 3.0335693359375, 3.20806884765625, 3.382568359375, 3.55706787109375, 3.7315673828125, 3.90606689453125, 4.08056640625, 4.25506591796875, 4.4295654296875, 4.60406494140625, 4.778564453125, 4.95306396484375, 5.1275634765625, 5.30206298828125, 5.4765625]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 2.0, 8.0, 20.0, 34.0, 55.0, 122.0, 308.0, 235.0, 119.0, 48.0, 27.0, 13.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-130.7552947998047, -124.18218231201172, -117.60906982421875, -111.03596496582031, -104.46284484863281, -97.88973999023438, -91.3166275024414, -84.74351501464844, -78.17040252685547, -71.5972900390625, -65.02417755126953, -58.45106887817383, -51.87795639038086, -45.30484390258789, -38.73173522949219, -32.15862274169922, -25.58551025390625, -19.01239776611328, -12.439287185668945, -5.866176605224609, 0.7069358825683594, 7.280048370361328, 13.853157043457031, 20.42626953125, 26.99938201904297, 33.57249450683594, 40.145606994628906, 46.71871566772461, 53.29182815551758, 59.86494064331055, 66.43804931640625, 73.01116180419922, 79.58428955078125, 86.15740203857422, 92.73051452636719, 99.30361938476562, 105.87673950195312, 112.44984436035156, 119.02295684814453, 125.5960693359375, 132.169189453125, 138.74229431152344, 145.31541442871094, 151.88851928710938, 158.46163940429688, 165.0347442626953, 171.60784912109375, 178.18096923828125, 184.7540740966797, 191.32717895507812, 197.90029907226562, 204.47340393066406, 211.04652404785156, 217.61962890625, 224.1927490234375, 230.76585388183594, 237.33895874023438, 243.9120635986328, 250.4851837158203, 257.05828857421875, 263.63140869140625, 270.20452880859375, 276.7776184082031, 283.3507385253906, 289.9238586425781]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 5.0, 7.0, 3.0, 10.0, 3.0, 4.0, 7.0, 10.0, 7.0, 16.0, 17.0, 15.0, 25.0, 21.0, 30.0, 40.0, 29.0, 41.0, 50.0, 96.0, 111.0, 87.0, 60.0, 40.0, 33.0, 34.0, 33.0, 19.0, 35.0, 19.0, 17.0, 13.0, 14.0, 8.0, 12.0, 12.0, 3.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-90.29438781738281, -87.5201187133789, -84.74585723876953, -81.97158813476562, -79.19731903076172, -76.42304992675781, -73.64878845214844, -70.87451934814453, -68.10025024414062, -65.32598114013672, -62.55171585083008, -59.77745056152344, -57.00318145751953, -54.22891616821289, -51.45465087890625, -48.680381774902344, -45.90612030029297, -43.13185501098633, -40.35758590698242, -37.58332061767578, -34.809051513671875, -32.034786224365234, -29.260520935058594, -26.48625373840332, -23.711986541748047, -20.937719345092773, -18.1634521484375, -15.38918685913086, -12.614919662475586, -9.840652465820312, -7.066387176513672, -4.292119979858398, -1.5178451538085938, 1.2564215660095215, 4.030688285827637, 6.804954528808594, 9.579221725463867, 12.35348892211914, 15.127754211425781, 17.902021408081055, 20.676288604736328, 23.4505558013916, 26.224822998046875, 28.999088287353516, 31.77335548400879, 34.54762268066406, 37.3218879699707, 40.096153259277344, 42.87042236328125, 45.64468765258789, 48.4189567565918, 51.19322204589844, 53.967491149902344, 56.741756439208984, 59.516021728515625, 62.29029083251953, 65.06455993652344, 67.83882904052734, 70.61309051513672, 73.38735961914062, 76.16162872314453, 78.93589782714844, 81.71015930175781, 84.48442840576172, 87.2586898803711]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 8.0, 0.0, 8.0, 13.0, 24.0, 47.0, 87.0, 170.0, 436.0, 1246.0, 5195.0, 66813.0, 4081665.0, 33562.0, 3549.0, 904.0, 300.0, 103.0, 58.0, 34.0, 19.0, 16.0, 9.0, 6.0, 9.0, 2.0, 1.0, 6.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.875, -33.50244140625, -32.1298828125, -30.75732421875, -29.384765625, -28.01220703125, -26.6396484375, -25.26708984375, -23.89453125, -22.52197265625, -21.1494140625, -19.77685546875, -18.404296875, -17.03173828125, -15.6591796875, -14.28662109375, -12.9140625, -11.54150390625, -10.1689453125, -8.79638671875, -7.423828125, -6.05126953125, -4.6787109375, -3.30615234375, -1.93359375, -0.56103515625, 0.8115234375, 2.18408203125, 3.556640625, 4.92919921875, 6.3017578125, 7.67431640625, 9.046875, 10.41943359375, 11.7919921875, 13.16455078125, 14.537109375, 15.90966796875, 17.2822265625, 18.65478515625, 20.02734375, 21.39990234375, 22.7724609375, 24.14501953125, 25.517578125, 26.89013671875, 28.2626953125, 29.63525390625, 31.0078125, 32.38037109375, 33.7529296875, 35.12548828125, 36.498046875, 37.87060546875, 39.2431640625, 40.61572265625, 41.98828125, 43.36083984375, 44.7333984375, 46.10595703125, 47.478515625, 48.85107421875, 50.2236328125, 51.59619140625, 52.96875]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 3.0, 3.0, 3.0, 3.0, 9.0, 9.0, 11.0, 8.0, 13.0, 17.0, 22.0, 25.0, 35.0, 32.0, 59.0, 47.0, 48.0, 54.0, 74.0, 50.0, 63.0, 50.0, 54.0, 66.0, 40.0, 42.0, 31.0, 30.0, 25.0, 20.0, 10.0, 13.0, 10.0, 4.0, 9.0, 5.0, 5.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.22265625, -7.0133056640625, -6.803955078125, -6.5946044921875, -6.38525390625, -6.1759033203125, -5.966552734375, -5.7572021484375, -5.5478515625, -5.3385009765625, -5.129150390625, -4.9197998046875, -4.71044921875, -4.5010986328125, -4.291748046875, -4.0823974609375, -3.873046875, -3.6636962890625, -3.454345703125, -3.2449951171875, -3.03564453125, -2.8262939453125, -2.616943359375, -2.4075927734375, -2.1982421875, -1.9888916015625, -1.779541015625, -1.5701904296875, -1.36083984375, -1.1514892578125, -0.942138671875, -0.7327880859375, -0.5234375, -0.3140869140625, -0.104736328125, 0.1046142578125, 0.31396484375, 0.5233154296875, 0.732666015625, 0.9420166015625, 1.1513671875, 1.3607177734375, 1.570068359375, 1.7794189453125, 1.98876953125, 2.1981201171875, 2.407470703125, 2.6168212890625, 2.826171875, 3.0355224609375, 3.244873046875, 3.4542236328125, 3.66357421875, 3.8729248046875, 4.082275390625, 4.2916259765625, 4.5009765625, 4.7103271484375, 4.919677734375, 5.1290283203125, 5.33837890625, 5.5477294921875, 5.757080078125, 5.9664306640625, 6.17578125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 3.0, 4.0, 3.0, 7.0, 4.0, 14.0, 14.0, 21.0, 35.0, 66.0, 101.0, 180.0, 487.0, 1352.0, 5275.0, 40123.0, 3687162.0, 437392.0, 17350.0, 3119.0, 872.0, 332.0, 163.0, 80.0, 42.0, 25.0, 19.0, 12.0, 10.0, 3.0, 3.0, 3.0, 5.0, 3.0, 1.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-33.03125, -31.9931640625, -30.955078125, -29.9169921875, -28.87890625, -27.8408203125, -26.802734375, -25.7646484375, -24.7265625, -23.6884765625, -22.650390625, -21.6123046875, -20.57421875, -19.5361328125, -18.498046875, -17.4599609375, -16.421875, -15.3837890625, -14.345703125, -13.3076171875, -12.26953125, -11.2314453125, -10.193359375, -9.1552734375, -8.1171875, -7.0791015625, -6.041015625, -5.0029296875, -3.96484375, -2.9267578125, -1.888671875, -0.8505859375, 0.1875, 1.2255859375, 2.263671875, 3.3017578125, 4.33984375, 5.3779296875, 6.416015625, 7.4541015625, 8.4921875, 9.5302734375, 10.568359375, 11.6064453125, 12.64453125, 13.6826171875, 14.720703125, 15.7587890625, 16.796875, 17.8349609375, 18.873046875, 19.9111328125, 20.94921875, 21.9873046875, 23.025390625, 24.0634765625, 25.1015625, 26.1396484375, 27.177734375, 28.2158203125, 29.25390625, 30.2919921875, 31.330078125, 32.3681640625, 33.40625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 5.0, 2.0, 2.0, 5.0, 2.0, 8.0, 12.0, 6.0, 13.0, 22.0, 30.0, 32.0, 60.0, 77.0, 121.0, 254.0, 541.0, 991.0, 890.0, 437.0, 193.0, 133.0, 68.0, 42.0, 44.0, 24.0, 12.0, 17.0, 10.0, 3.0, 8.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-20.0, -19.42822265625, -18.8564453125, -18.28466796875, -17.712890625, -17.14111328125, -16.5693359375, -15.99755859375, -15.42578125, -14.85400390625, -14.2822265625, -13.71044921875, -13.138671875, -12.56689453125, -11.9951171875, -11.42333984375, -10.8515625, -10.27978515625, -9.7080078125, -9.13623046875, -8.564453125, -7.99267578125, -7.4208984375, -6.84912109375, -6.27734375, -5.70556640625, -5.1337890625, -4.56201171875, -3.990234375, -3.41845703125, -2.8466796875, -2.27490234375, -1.703125, -1.13134765625, -0.5595703125, 0.01220703125, 0.583984375, 1.15576171875, 1.7275390625, 2.29931640625, 2.87109375, 3.44287109375, 4.0146484375, 4.58642578125, 5.158203125, 5.72998046875, 6.3017578125, 6.87353515625, 7.4453125, 8.01708984375, 8.5888671875, 9.16064453125, 9.732421875, 10.30419921875, 10.8759765625, 11.44775390625, 12.01953125, 12.59130859375, 13.1630859375, 13.73486328125, 14.306640625, 14.87841796875, 15.4501953125, 16.02197265625, 16.59375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 5.0, 2.0, 9.0, 8.0, 11.0, 16.0, 54.0, 103.0, 157.0, 250.0, 180.0, 103.0, 48.0, 28.0, 18.0, 8.0, 5.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-269.1133117675781, -263.5760803222656, -258.0388488769531, -252.50161743164062, -246.96438598632812, -241.42715454101562, -235.88992309570312, -230.35269165039062, -224.81546020507812, -219.27822875976562, -213.74099731445312, -208.20376586914062, -202.66653442382812, -197.12930297851562, -191.59207153320312, -186.05484008789062, -180.51760864257812, -174.98037719726562, -169.44314575195312, -163.90591430664062, -158.36868286132812, -152.83145141601562, -147.29421997070312, -141.75698852539062, -136.21974182128906, -130.68251037597656, -125.14527893066406, -119.60804748535156, -114.07081604003906, -108.53358459472656, -102.99635314941406, -97.45912170410156, -91.92188262939453, -86.38465118408203, -80.84741973876953, -75.31018829345703, -69.77295684814453, -64.23572540283203, -58.698490142822266, -53.161258697509766, -47.624027252197266, -42.086795806884766, -36.549564361572266, -31.012331008911133, -25.475099563598633, -19.937868118286133, -14.400634765625, -8.8634033203125, -3.326171875, 2.211060047149658, 7.748291969299316, 13.285524368286133, 18.822755813598633, 24.359987258911133, 29.897220611572266, 35.434452056884766, 40.971683502197266, 46.508914947509766, 52.046146392822266, 57.58338165283203, 63.12061309814453, 68.65784454345703, 74.19507598876953, 79.73230743408203, 85.26953887939453]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 5.0, 8.0, 11.0, 17.0, 12.0, 15.0, 23.0, 21.0, 28.0, 26.0, 34.0, 30.0, 35.0, 37.0, 43.0, 46.0, 38.0, 58.0, 37.0, 41.0, 49.0, 44.0, 34.0, 43.0, 38.0, 34.0, 32.0, 36.0, 26.0, 19.0, 15.0, 14.0, 12.0, 6.0, 11.0, 5.0, 4.0, 5.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-70.44347381591797, -68.26459503173828, -66.0857162475586, -63.90683364868164, -61.72795486450195, -59.549076080322266, -57.37019348144531, -55.191314697265625, -53.01243591308594, -50.83355712890625, -48.65467834472656, -46.47579574584961, -44.29691696166992, -42.118038177490234, -39.93915557861328, -37.760276794433594, -35.581398010253906, -33.40251922607422, -31.2236385345459, -29.044757843017578, -26.86587905883789, -24.687000274658203, -22.508119583129883, -20.329238891601562, -18.150360107421875, -15.971480369567871, -13.792600631713867, -11.613720893859863, -9.43484115600586, -7.2559614181518555, -5.077081680297852, -2.8982019424438477, -0.7193145751953125, 1.4595651626586914, 3.6384449005126953, 5.817324638366699, 7.996204376220703, 10.175084114074707, 12.353963851928711, 14.532843589782715, 16.71172332763672, 18.890602111816406, 21.069482803344727, 23.248363494873047, 25.427242279052734, 27.606121063232422, 29.785001754760742, 31.963882446289062, 34.14276123046875, 36.32164001464844, 38.500518798828125, 40.67940139770508, 42.858280181884766, 45.03715896606445, 47.216041564941406, 49.394920349121094, 51.57379913330078, 53.75267791748047, 55.931556701660156, 58.11043930053711, 60.2893180847168, 62.468196868896484, 64.64707946777344, 66.82595825195312, 69.00483703613281]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 10.0, 4.0, 13.0, 9.0, 22.0, 34.0, 72.0, 126.0, 214.0, 423.0, 964.0, 2232.0, 5724.0, 16776.0, 62531.0, 326492.0, 501080.0, 95472.0, 23578.0, 7568.0, 2861.0, 1163.0, 551.0, 291.0, 132.0, 81.0, 46.0, 36.0, 18.0, 15.0, 7.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.453125, -17.773193359375, -17.09326171875, -16.413330078125, -15.7333984375, -15.053466796875, -14.37353515625, -13.693603515625, -13.013671875, -12.333740234375, -11.65380859375, -10.973876953125, -10.2939453125, -9.614013671875, -8.93408203125, -8.254150390625, -7.57421875, -6.894287109375, -6.21435546875, -5.534423828125, -4.8544921875, -4.174560546875, -3.49462890625, -2.814697265625, -2.134765625, -1.454833984375, -0.77490234375, -0.094970703125, 0.5849609375, 1.264892578125, 1.94482421875, 2.624755859375, 3.3046875, 3.984619140625, 4.66455078125, 5.344482421875, 6.0244140625, 6.704345703125, 7.38427734375, 8.064208984375, 8.744140625, 9.424072265625, 10.10400390625, 10.783935546875, 11.4638671875, 12.143798828125, 12.82373046875, 13.503662109375, 14.18359375, 14.863525390625, 15.54345703125, 16.223388671875, 16.9033203125, 17.583251953125, 18.26318359375, 18.943115234375, 19.623046875, 20.302978515625, 20.98291015625, 21.662841796875, 22.3427734375, 23.022705078125, 23.70263671875, 24.382568359375, 25.0625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 1.0, 2.0, 3.0, 6.0, 7.0, 12.0, 11.0, 12.0, 14.0, 20.0, 16.0, 24.0, 32.0, 26.0, 38.0, 29.0, 57.0, 43.0, 60.0, 50.0, 44.0, 44.0, 52.0, 43.0, 39.0, 47.0, 35.0, 32.0, 30.0, 38.0, 23.0, 24.0, 24.0, 15.0, 13.0, 9.0, 7.0, 7.0, 7.0, 5.0, 1.0, 3.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.7265625, -5.535888671875, -5.34521484375, -5.154541015625, -4.9638671875, -4.773193359375, -4.58251953125, -4.391845703125, -4.201171875, -4.010498046875, -3.81982421875, -3.629150390625, -3.4384765625, -3.247802734375, -3.05712890625, -2.866455078125, -2.67578125, -2.485107421875, -2.29443359375, -2.103759765625, -1.9130859375, -1.722412109375, -1.53173828125, -1.341064453125, -1.150390625, -0.959716796875, -0.76904296875, -0.578369140625, -0.3876953125, -0.197021484375, -0.00634765625, 0.184326171875, 0.375, 0.565673828125, 0.75634765625, 0.947021484375, 1.1376953125, 1.328369140625, 1.51904296875, 1.709716796875, 1.900390625, 2.091064453125, 2.28173828125, 2.472412109375, 2.6630859375, 2.853759765625, 3.04443359375, 3.235107421875, 3.42578125, 3.616455078125, 3.80712890625, 3.997802734375, 4.1884765625, 4.379150390625, 4.56982421875, 4.760498046875, 4.951171875, 5.141845703125, 5.33251953125, 5.523193359375, 5.7138671875, 5.904541015625, 6.09521484375, 6.285888671875, 6.4765625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 10.0, 4.0, 10.0, 21.0, 27.0, 37.0, 41.0, 78.0, 104.0, 153.0, 258.0, 470.0, 934.0, 1984.0, 6263.0, 28690.0, 259447.0, 695365.0, 41463.0, 8184.0, 2538.0, 1033.0, 592.0, 296.0, 197.0, 88.0, 88.0, 52.0, 34.0, 23.0, 19.0, 13.0, 13.0, 5.0, 4.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.765625, -27.946044921875, -27.12646484375, -26.306884765625, -25.4873046875, -24.667724609375, -23.84814453125, -23.028564453125, -22.208984375, -21.389404296875, -20.56982421875, -19.750244140625, -18.9306640625, -18.111083984375, -17.29150390625, -16.471923828125, -15.65234375, -14.832763671875, -14.01318359375, -13.193603515625, -12.3740234375, -11.554443359375, -10.73486328125, -9.915283203125, -9.095703125, -8.276123046875, -7.45654296875, -6.636962890625, -5.8173828125, -4.997802734375, -4.17822265625, -3.358642578125, -2.5390625, -1.719482421875, -0.89990234375, -0.080322265625, 0.7392578125, 1.558837890625, 2.37841796875, 3.197998046875, 4.017578125, 4.837158203125, 5.65673828125, 6.476318359375, 7.2958984375, 8.115478515625, 8.93505859375, 9.754638671875, 10.57421875, 11.393798828125, 12.21337890625, 13.032958984375, 13.8525390625, 14.672119140625, 15.49169921875, 16.311279296875, 17.130859375, 17.950439453125, 18.77001953125, 19.589599609375, 20.4091796875, 21.228759765625, 22.04833984375, 22.867919921875, 23.6875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 9.0, 9.0, 7.0, 18.0, 18.0, 27.0, 25.0, 23.0, 26.0, 43.0, 44.0, 41.0, 61.0, 51.0, 59.0, 64.0, 51.0, 59.0, 45.0, 56.0, 47.0, 33.0, 41.0, 27.0, 25.0, 23.0, 13.0, 17.0, 7.0, 9.0, 4.0, 6.0, 3.0, 5.0, 1.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.078125, -23.33447265625, -22.5908203125, -21.84716796875, -21.103515625, -20.35986328125, -19.6162109375, -18.87255859375, -18.12890625, -17.38525390625, -16.6416015625, -15.89794921875, -15.154296875, -14.41064453125, -13.6669921875, -12.92333984375, -12.1796875, -11.43603515625, -10.6923828125, -9.94873046875, -9.205078125, -8.46142578125, -7.7177734375, -6.97412109375, -6.23046875, -5.48681640625, -4.7431640625, -3.99951171875, -3.255859375, -2.51220703125, -1.7685546875, -1.02490234375, -0.28125, 0.46240234375, 1.2060546875, 1.94970703125, 2.693359375, 3.43701171875, 4.1806640625, 4.92431640625, 5.66796875, 6.41162109375, 7.1552734375, 7.89892578125, 8.642578125, 9.38623046875, 10.1298828125, 10.87353515625, 11.6171875, 12.36083984375, 13.1044921875, 13.84814453125, 14.591796875, 15.33544921875, 16.0791015625, 16.82275390625, 17.56640625, 18.31005859375, 19.0537109375, 19.79736328125, 20.541015625, 21.28466796875, 22.0283203125, 22.77197265625, 23.515625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 6.0, 5.0, 10.0, 11.0, 13.0, 12.0, 33.0, 29.0, 52.0, 76.0, 93.0, 153.0, 232.0, 313.0, 576.0, 969.0, 1796.0, 3639.0, 8976.0, 27669.0, 127669.0, 732104.0, 104296.0, 24199.0, 8006.0, 3419.0, 1709.0, 963.0, 505.0, 317.0, 212.0, 140.0, 111.0, 67.0, 43.0, 33.0, 27.0, 20.0, 14.0, 12.0, 13.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0], "bins": [-6.8359375, -6.63153076171875, -6.4271240234375, -6.22271728515625, -6.018310546875, -5.81390380859375, -5.6094970703125, -5.40509033203125, -5.20068359375, -4.99627685546875, -4.7918701171875, -4.58746337890625, -4.383056640625, -4.17864990234375, -3.9742431640625, -3.76983642578125, -3.5654296875, -3.36102294921875, -3.1566162109375, -2.95220947265625, -2.747802734375, -2.54339599609375, -2.3389892578125, -2.13458251953125, -1.93017578125, -1.72576904296875, -1.5213623046875, -1.31695556640625, -1.112548828125, -0.90814208984375, -0.7037353515625, -0.49932861328125, -0.294921875, -0.09051513671875, 0.1138916015625, 0.31829833984375, 0.522705078125, 0.72711181640625, 0.9315185546875, 1.13592529296875, 1.34033203125, 1.54473876953125, 1.7491455078125, 1.95355224609375, 2.157958984375, 2.36236572265625, 2.5667724609375, 2.77117919921875, 2.9755859375, 3.17999267578125, 3.3843994140625, 3.58880615234375, 3.793212890625, 3.99761962890625, 4.2020263671875, 4.40643310546875, 4.61083984375, 4.81524658203125, 5.0196533203125, 5.22406005859375, 5.428466796875, 5.63287353515625, 5.8372802734375, 6.04168701171875, 6.24609375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 7.0, 7.0, 11.0, 27.0, 36.0, 49.0, 89.0, 140.0, 209.0, 149.0, 96.0, 60.0, 45.0, 23.0, 19.0, 7.0, 11.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004573822021484375, -0.004433929920196533, -0.004294037818908691, -0.00415414571762085, -0.004014253616333008, -0.003874361515045166, -0.0037344694137573242, -0.0035945773124694824, -0.0034546852111816406, -0.003314793109893799, -0.003174901008605957, -0.0030350089073181152, -0.0028951168060302734, -0.0027552247047424316, -0.00261533260345459, -0.002475440502166748, -0.0023355484008789062, -0.0021956562995910645, -0.0020557641983032227, -0.0019158720970153809, -0.001775979995727539, -0.0016360878944396973, -0.0014961957931518555, -0.0013563036918640137, -0.0012164115905761719, -0.00107651948928833, -0.0009366273880004883, -0.0007967352867126465, -0.0006568431854248047, -0.0005169510841369629, -0.0003770589828491211, -0.0002371668815612793, -9.72747802734375e-05, 4.26173210144043e-05, 0.0001825094223022461, 0.0003224015235900879, 0.0004622936248779297, 0.0006021857261657715, 0.0007420778274536133, 0.0008819699287414551, 0.0010218620300292969, 0.0011617541313171387, 0.0013016462326049805, 0.0014415383338928223, 0.001581430435180664, 0.0017213225364685059, 0.0018612146377563477, 0.0020011067390441895, 0.0021409988403320312, 0.002280890941619873, 0.002420783042907715, 0.0025606751441955566, 0.0027005672454833984, 0.0028404593467712402, 0.002980351448059082, 0.003120243549346924, 0.0032601356506347656, 0.0034000277519226074, 0.0035399198532104492, 0.003679811954498291, 0.003819704055786133, 0.003959596157073975, 0.004099488258361816, 0.004239380359649658, 0.0043792724609375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 6.0, 4.0, 12.0, 15.0, 24.0, 30.0, 54.0, 142.0, 281.0, 654.0, 1760.0, 6576.0, 54517.0, 916660.0, 58184.0, 6636.0, 1791.0, 640.0, 266.0, 136.0, 58.0, 34.0, 37.0, 10.0, 10.0, 5.0, 5.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.578125, -12.136962890625, -11.69580078125, -11.254638671875, -10.8134765625, -10.372314453125, -9.93115234375, -9.489990234375, -9.048828125, -8.607666015625, -8.16650390625, -7.725341796875, -7.2841796875, -6.843017578125, -6.40185546875, -5.960693359375, -5.51953125, -5.078369140625, -4.63720703125, -4.196044921875, -3.7548828125, -3.313720703125, -2.87255859375, -2.431396484375, -1.990234375, -1.549072265625, -1.10791015625, -0.666748046875, -0.2255859375, 0.215576171875, 0.65673828125, 1.097900390625, 1.5390625, 1.980224609375, 2.42138671875, 2.862548828125, 3.3037109375, 3.744873046875, 4.18603515625, 4.627197265625, 5.068359375, 5.509521484375, 5.95068359375, 6.391845703125, 6.8330078125, 7.274169921875, 7.71533203125, 8.156494140625, 8.59765625, 9.038818359375, 9.47998046875, 9.921142578125, 10.3623046875, 10.803466796875, 11.24462890625, 11.685791015625, 12.126953125, 12.568115234375, 13.00927734375, 13.450439453125, 13.8916015625, 14.332763671875, 14.77392578125, 15.215087890625, 15.65625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 3.0, 1.0, 1.0, 6.0, 4.0, 4.0, 7.0, 5.0, 9.0, 7.0, 10.0, 13.0, 20.0, 26.0, 15.0, 27.0, 44.0, 40.0, 46.0, 59.0, 82.0, 89.0, 92.0, 78.0, 60.0, 53.0, 44.0, 34.0, 20.0, 26.0, 22.0, 8.0, 8.0, 6.0, 10.0, 5.0, 4.0, 3.0, 3.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.63671875, -4.48333740234375, -4.3299560546875, -4.17657470703125, -4.023193359375, -3.86981201171875, -3.7164306640625, -3.56304931640625, -3.40966796875, -3.25628662109375, -3.1029052734375, -2.94952392578125, -2.796142578125, -2.64276123046875, -2.4893798828125, -2.33599853515625, -2.1826171875, -2.02923583984375, -1.8758544921875, -1.72247314453125, -1.569091796875, -1.41571044921875, -1.2623291015625, -1.10894775390625, -0.95556640625, -0.80218505859375, -0.6488037109375, -0.49542236328125, -0.342041015625, -0.18865966796875, -0.0352783203125, 0.11810302734375, 0.271484375, 0.42486572265625, 0.5782470703125, 0.73162841796875, 0.885009765625, 1.03839111328125, 1.1917724609375, 1.34515380859375, 1.49853515625, 1.65191650390625, 1.8052978515625, 1.95867919921875, 2.112060546875, 2.26544189453125, 2.4188232421875, 2.57220458984375, 2.7255859375, 2.87896728515625, 3.0323486328125, 3.18572998046875, 3.339111328125, 3.49249267578125, 3.6458740234375, 3.79925537109375, 3.95263671875, 4.10601806640625, 4.2593994140625, 4.41278076171875, 4.566162109375, 4.71954345703125, 4.8729248046875, 5.02630615234375, 5.1796875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 10.0, 3.0, 7.0, 6.0, 13.0, 31.0, 49.0, 84.0, 162.0, 355.0, 117.0, 74.0, 43.0, 15.0, 11.0, 6.0, 7.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-128.86544799804688, -123.31143188476562, -117.75741577148438, -112.20339965820312, -106.64938354492188, -101.09536743164062, -95.54135131835938, -89.98733520507812, -84.43331909179688, -78.87930297851562, -73.32528686523438, -67.77127075195312, -62.217254638671875, -56.663238525390625, -51.10922622680664, -45.55521011352539, -40.001197814941406, -34.447181701660156, -28.893165588378906, -23.33915138244629, -17.78513526916504, -12.231119155883789, -6.677104949951172, -1.1230888366699219, 4.430927276611328, 9.984943389892578, 15.538958549499512, 21.092973709106445, 26.646989822387695, 32.20100402832031, 37.75502014160156, 43.30903625488281, 48.86305236816406, 54.41706848144531, 59.97108459472656, 65.52510070800781, 71.07911682128906, 76.63313293457031, 82.18714904785156, 87.74116516113281, 93.29518127441406, 98.84919738769531, 104.40321350097656, 109.95722961425781, 115.51124572753906, 121.06526184082031, 126.61927795410156, 132.1732940673828, 137.727294921875, 143.28131103515625, 148.8353271484375, 154.38934326171875, 159.943359375, 165.49737548828125, 171.0513916015625, 176.60540771484375, 182.159423828125, 187.71343994140625, 193.2674560546875, 198.82147216796875, 204.37548828125, 209.92950439453125, 215.4835205078125, 221.03753662109375, 226.591552734375]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 1.0, 2.0, 5.0, 8.0, 11.0, 11.0, 12.0, 11.0, 15.0, 15.0, 18.0, 11.0, 19.0, 19.0, 25.0, 26.0, 31.0, 26.0, 35.0, 47.0, 82.0, 141.0, 88.0, 50.0, 30.0, 30.0, 25.0, 25.0, 28.0, 26.0, 18.0, 13.0, 12.0, 16.0, 9.0, 7.0, 11.0, 13.0, 5.0, 9.0, 5.0, 5.0, 3.0, 2.0, 0.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.51902770996094, -73.26681518554688, -71.01461029052734, -68.76239776611328, -66.51018524169922, -64.25798034667969, -62.005767822265625, -59.75355911254883, -57.50135040283203, -55.249141693115234, -52.99692916870117, -50.744720458984375, -48.49251174926758, -46.24030303955078, -43.98809051513672, -41.73588180541992, -39.48366928100586, -37.23146057128906, -34.979248046875, -32.7270393371582, -30.474830627441406, -28.222620010375977, -25.970409393310547, -23.71820068359375, -21.46599006652832, -19.21377944946289, -16.961570739746094, -14.709360122680664, -12.45715045928955, -10.204940795898438, -7.952730178833008, -5.7005205154418945, -3.4483108520507812, -1.1961009502410889, 1.0561089515686035, 3.308319091796875, 5.560528755187988, 7.812738418579102, 10.064949035644531, 12.317158699035645, 14.569368362426758, 16.821578979492188, 19.073787689208984, 21.325998306274414, 23.578208923339844, 25.83041763305664, 28.08262825012207, 30.3348388671875, 32.5870475769043, 34.839256286621094, 37.091468811035156, 39.34367752075195, 41.59588623046875, 43.84809875488281, 46.10030746459961, 48.352516174316406, 50.60472869873047, 52.856937408447266, 55.10914993286133, 57.361358642578125, 59.61356735229492, 61.86577606201172, 64.11798858642578, 66.37020111083984, 68.62240600585938]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 8.0, 16.0, 16.0, 27.0, 39.0, 100.0, 171.0, 451.0, 1106.0, 3727.0, 16572.0, 236275.0, 3724634.0, 191659.0, 14697.0, 3038.0, 977.0, 359.0, 151.0, 92.0, 58.0, 30.0, 18.0, 16.0, 10.0, 9.0, 5.0, 7.0, 5.0, 6.0, 1.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.875, -21.97705078125, -21.0791015625, -20.18115234375, -19.283203125, -18.38525390625, -17.4873046875, -16.58935546875, -15.69140625, -14.79345703125, -13.8955078125, -12.99755859375, -12.099609375, -11.20166015625, -10.3037109375, -9.40576171875, -8.5078125, -7.60986328125, -6.7119140625, -5.81396484375, -4.916015625, -4.01806640625, -3.1201171875, -2.22216796875, -1.32421875, -0.42626953125, 0.4716796875, 1.36962890625, 2.267578125, 3.16552734375, 4.0634765625, 4.96142578125, 5.859375, 6.75732421875, 7.6552734375, 8.55322265625, 9.451171875, 10.34912109375, 11.2470703125, 12.14501953125, 13.04296875, 13.94091796875, 14.8388671875, 15.73681640625, 16.634765625, 17.53271484375, 18.4306640625, 19.32861328125, 20.2265625, 21.12451171875, 22.0224609375, 22.92041015625, 23.818359375, 24.71630859375, 25.6142578125, 26.51220703125, 27.41015625, 28.30810546875, 29.2060546875, 30.10400390625, 31.001953125, 31.89990234375, 32.7978515625, 33.69580078125, 34.59375]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 3.0, 3.0, 10.0, 8.0, 6.0, 10.0, 9.0, 11.0, 17.0, 14.0, 18.0, 27.0, 22.0, 33.0, 42.0, 35.0, 33.0, 42.0, 40.0, 55.0, 34.0, 29.0, 35.0, 39.0, 47.0, 42.0, 43.0, 29.0, 33.0, 26.0, 23.0, 28.0, 27.0, 23.0, 18.0, 14.0, 12.0, 16.0, 13.0, 8.0, 4.0, 5.0, 7.0, 4.0, 4.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0], "bins": [-5.25, -5.0916748046875, -4.933349609375, -4.7750244140625, -4.61669921875, -4.4583740234375, -4.300048828125, -4.1417236328125, -3.9833984375, -3.8250732421875, -3.666748046875, -3.5084228515625, -3.35009765625, -3.1917724609375, -3.033447265625, -2.8751220703125, -2.716796875, -2.5584716796875, -2.400146484375, -2.2418212890625, -2.08349609375, -1.9251708984375, -1.766845703125, -1.6085205078125, -1.4501953125, -1.2918701171875, -1.133544921875, -0.9752197265625, -0.81689453125, -0.6585693359375, -0.500244140625, -0.3419189453125, -0.18359375, -0.0252685546875, 0.133056640625, 0.2913818359375, 0.44970703125, 0.6080322265625, 0.766357421875, 0.9246826171875, 1.0830078125, 1.2413330078125, 1.399658203125, 1.5579833984375, 1.71630859375, 1.8746337890625, 2.032958984375, 2.1912841796875, 2.349609375, 2.5079345703125, 2.666259765625, 2.8245849609375, 2.98291015625, 3.1412353515625, 3.299560546875, 3.4578857421875, 3.6162109375, 3.7745361328125, 3.932861328125, 4.0911865234375, 4.24951171875, 4.4078369140625, 4.566162109375, 4.7244873046875, 4.8828125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 8.0, 13.0, 13.0, 43.0, 50.0, 104.0, 236.0, 499.0, 1489.0, 7314.0, 803798.0, 3368459.0, 9514.0, 1637.0, 562.0, 263.0, 128.0, 70.0, 30.0, 15.0, 13.0, 7.0, 7.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.5625, -71.46435546875, -69.3662109375, -67.26806640625, -65.169921875, -63.07177734375, -60.9736328125, -58.87548828125, -56.77734375, -54.67919921875, -52.5810546875, -50.48291015625, -48.384765625, -46.28662109375, -44.1884765625, -42.09033203125, -39.9921875, -37.89404296875, -35.7958984375, -33.69775390625, -31.599609375, -29.50146484375, -27.4033203125, -25.30517578125, -23.20703125, -21.10888671875, -19.0107421875, -16.91259765625, -14.814453125, -12.71630859375, -10.6181640625, -8.52001953125, -6.421875, -4.32373046875, -2.2255859375, -0.12744140625, 1.970703125, 4.06884765625, 6.1669921875, 8.26513671875, 10.36328125, 12.46142578125, 14.5595703125, 16.65771484375, 18.755859375, 20.85400390625, 22.9521484375, 25.05029296875, 27.1484375, 29.24658203125, 31.3447265625, 33.44287109375, 35.541015625, 37.63916015625, 39.7373046875, 41.83544921875, 43.93359375, 46.03173828125, 48.1298828125, 50.22802734375, 52.326171875, 54.42431640625, 56.5224609375, 58.62060546875, 60.71875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 9.0, 9.0, 18.0, 33.0, 63.0, 85.0, 144.0, 284.0, 656.0, 1249.0, 800.0, 363.0, 158.0, 98.0, 46.0, 33.0, 8.0, 16.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.65625, -40.41943359375, -39.1826171875, -37.94580078125, -36.708984375, -35.47216796875, -34.2353515625, -32.99853515625, -31.76171875, -30.52490234375, -29.2880859375, -28.05126953125, -26.814453125, -25.57763671875, -24.3408203125, -23.10400390625, -21.8671875, -20.63037109375, -19.3935546875, -18.15673828125, -16.919921875, -15.68310546875, -14.4462890625, -13.20947265625, -11.97265625, -10.73583984375, -9.4990234375, -8.26220703125, -7.025390625, -5.78857421875, -4.5517578125, -3.31494140625, -2.078125, -0.84130859375, 0.3955078125, 1.63232421875, 2.869140625, 4.10595703125, 5.3427734375, 6.57958984375, 7.81640625, 9.05322265625, 10.2900390625, 11.52685546875, 12.763671875, 14.00048828125, 15.2373046875, 16.47412109375, 17.7109375, 18.94775390625, 20.1845703125, 21.42138671875, 22.658203125, 23.89501953125, 25.1318359375, 26.36865234375, 27.60546875, 28.84228515625, 30.0791015625, 31.31591796875, 32.552734375, 33.78955078125, 35.0263671875, 36.26318359375, 37.5]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 8.0, 7.0, 11.0, 20.0, 28.0, 50.0, 84.0, 128.0, 187.0, 168.0, 122.0, 69.0, 42.0, 20.0, 17.0, 12.0, 5.0, 5.0, 3.0, 3.0, 4.0, 0.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-281.06365966796875, -273.0006408691406, -264.9375915527344, -256.87457275390625, -248.81155395507812, -240.74851989746094, -232.68548583984375, -224.62246704101562, -216.55943298339844, -208.49639892578125, -200.43338012695312, -192.37034606933594, -184.30731201171875, -176.24429321289062, -168.18125915527344, -160.11822509765625, -152.05520629882812, -143.99217224121094, -135.9291534423828, -127.86611938476562, -119.80309295654297, -111.74006652832031, -103.67703247070312, -95.61400604248047, -87.55097961425781, -79.48795318603516, -71.4249267578125, -63.36189270019531, -55.298866271972656, -47.23583984375, -39.17280960083008, -31.109779357910156, -23.0467529296875, -14.983724594116211, -6.920696258544922, 1.1423320770263672, 9.205360412597656, 17.268386840820312, 25.331417083740234, 33.394447326660156, 41.45747375488281, 49.52050018310547, 57.58353042602539, 65.64656066894531, 73.70958709716797, 81.77261352539062, 89.83564758300781, 97.89867401123047, 105.96170043945312, 114.02472686767578, 122.08775329589844, 130.15078735351562, 138.21380615234375, 146.27684020996094, 154.33987426757812, 162.40289306640625, 170.46592712402344, 178.52896118164062, 186.59197998046875, 194.65501403808594, 202.71804809570312, 210.78106689453125, 218.84410095214844, 226.90713500976562, 234.97015380859375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 1.0, 5.0, 7.0, 5.0, 12.0, 17.0, 19.0, 31.0, 29.0, 24.0, 40.0, 50.0, 49.0, 35.0, 54.0, 61.0, 68.0, 64.0, 54.0, 49.0, 49.0, 55.0, 29.0, 34.0, 35.0, 30.0, 24.0, 14.0, 4.0, 17.0, 11.0, 6.0, 10.0, 3.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-141.9376220703125, -137.2917022705078, -132.64578247070312, -127.99987030029297, -123.35395812988281, -118.70803833007812, -114.06211853027344, -109.41619873046875, -104.7702865600586, -100.1243667602539, -95.47845458984375, -90.83253479003906, -86.18661499023438, -81.54070281982422, -76.89478302001953, -72.24887084960938, -67.60295104980469, -62.957035064697266, -58.311119079589844, -53.665199279785156, -49.019283294677734, -44.37336730957031, -39.727447509765625, -35.0815315246582, -30.43561553955078, -25.78969955444336, -21.143781661987305, -16.49786376953125, -11.851947784423828, -7.206031799316406, -2.5601139068603516, 2.085803985595703, 6.731719970703125, 11.377636909484863, 16.0235538482666, 20.669471740722656, 25.315387725830078, 29.9613037109375, 34.60722351074219, 39.25313949584961, 43.89905548095703, 48.54497146606445, 53.190887451171875, 57.83680725097656, 62.482723236083984, 67.1286392211914, 71.7745590209961, 76.42047119140625, 81.06639099121094, 85.71231079101562, 90.35822296142578, 95.00414276123047, 99.65005493164062, 104.29597473144531, 108.94189453125, 113.58781433105469, 118.23372650146484, 122.87964630126953, 127.52555847167969, 132.17147827148438, 136.81739807128906, 141.46331787109375, 146.10922241210938, 150.75514221191406, 155.40106201171875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 9.0, 8.0, 10.0, 18.0, 31.0, 36.0, 52.0, 96.0, 128.0, 248.0, 479.0, 821.0, 1944.0, 4743.0, 15508.0, 74149.0, 757627.0, 155095.0, 25423.0, 7097.0, 2570.0, 1089.0, 589.0, 315.0, 163.0, 111.0, 62.0, 35.0, 29.0, 20.0, 13.0, 9.0, 7.0, 6.0, 5.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.546875, -22.779296875, -22.01171875, -21.244140625, -20.4765625, -19.708984375, -18.94140625, -18.173828125, -17.40625, -16.638671875, -15.87109375, -15.103515625, -14.3359375, -13.568359375, -12.80078125, -12.033203125, -11.265625, -10.498046875, -9.73046875, -8.962890625, -8.1953125, -7.427734375, -6.66015625, -5.892578125, -5.125, -4.357421875, -3.58984375, -2.822265625, -2.0546875, -1.287109375, -0.51953125, 0.248046875, 1.015625, 1.783203125, 2.55078125, 3.318359375, 4.0859375, 4.853515625, 5.62109375, 6.388671875, 7.15625, 7.923828125, 8.69140625, 9.458984375, 10.2265625, 10.994140625, 11.76171875, 12.529296875, 13.296875, 14.064453125, 14.83203125, 15.599609375, 16.3671875, 17.134765625, 17.90234375, 18.669921875, 19.4375, 20.205078125, 20.97265625, 21.740234375, 22.5078125, 23.275390625, 24.04296875, 24.810546875, 25.578125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 9.0, 7.0, 17.0, 16.0, 35.0, 34.0, 39.0, 63.0, 61.0, 87.0, 82.0, 91.0, 88.0, 76.0, 76.0, 45.0, 40.0, 45.0, 32.0, 20.0, 13.0, 11.0, 8.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.0234375, -12.622802734375, -12.22216796875, -11.821533203125, -11.4208984375, -11.020263671875, -10.61962890625, -10.218994140625, -9.818359375, -9.417724609375, -9.01708984375, -8.616455078125, -8.2158203125, -7.815185546875, -7.41455078125, -7.013916015625, -6.61328125, -6.212646484375, -5.81201171875, -5.411376953125, -5.0107421875, -4.610107421875, -4.20947265625, -3.808837890625, -3.408203125, -3.007568359375, -2.60693359375, -2.206298828125, -1.8056640625, -1.405029296875, -1.00439453125, -0.603759765625, -0.203125, 0.197509765625, 0.59814453125, 0.998779296875, 1.3994140625, 1.800048828125, 2.20068359375, 2.601318359375, 3.001953125, 3.402587890625, 3.80322265625, 4.203857421875, 4.6044921875, 5.005126953125, 5.40576171875, 5.806396484375, 6.20703125, 6.607666015625, 7.00830078125, 7.408935546875, 7.8095703125, 8.210205078125, 8.61083984375, 9.011474609375, 9.412109375, 9.812744140625, 10.21337890625, 10.614013671875, 11.0146484375, 11.415283203125, 11.81591796875, 12.216552734375, 12.6171875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 5.0, 6.0, 10.0, 12.0, 11.0, 22.0, 22.0, 34.0, 42.0, 64.0, 95.0, 132.0, 237.0, 445.0, 820.0, 1757.0, 4649.0, 17136.0, 135081.0, 847181.0, 29365.0, 6862.0, 2313.0, 975.0, 495.0, 277.0, 162.0, 101.0, 79.0, 56.0, 26.0, 21.0, 23.0, 10.0, 5.0, 8.0, 2.0, 7.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.421875, -19.69677734375, -18.9716796875, -18.24658203125, -17.521484375, -16.79638671875, -16.0712890625, -15.34619140625, -14.62109375, -13.89599609375, -13.1708984375, -12.44580078125, -11.720703125, -10.99560546875, -10.2705078125, -9.54541015625, -8.8203125, -8.09521484375, -7.3701171875, -6.64501953125, -5.919921875, -5.19482421875, -4.4697265625, -3.74462890625, -3.01953125, -2.29443359375, -1.5693359375, -0.84423828125, -0.119140625, 0.60595703125, 1.3310546875, 2.05615234375, 2.78125, 3.50634765625, 4.2314453125, 4.95654296875, 5.681640625, 6.40673828125, 7.1318359375, 7.85693359375, 8.58203125, 9.30712890625, 10.0322265625, 10.75732421875, 11.482421875, 12.20751953125, 12.9326171875, 13.65771484375, 14.3828125, 15.10791015625, 15.8330078125, 16.55810546875, 17.283203125, 18.00830078125, 18.7333984375, 19.45849609375, 20.18359375, 20.90869140625, 21.6337890625, 22.35888671875, 23.083984375, 23.80908203125, 24.5341796875, 25.25927734375, 25.984375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 5.0, 3.0, 2.0, 9.0, 9.0, 9.0, 10.0, 14.0, 19.0, 27.0, 31.0, 35.0, 54.0, 49.0, 81.0, 126.0, 120.0, 93.0, 72.0, 49.0, 48.0, 27.0, 24.0, 24.0, 13.0, 8.0, 9.0, 10.0, 8.0, 1.0, 6.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.75, -41.29736328125, -39.8447265625, -38.39208984375, -36.939453125, -35.48681640625, -34.0341796875, -32.58154296875, -31.12890625, -29.67626953125, -28.2236328125, -26.77099609375, -25.318359375, -23.86572265625, -22.4130859375, -20.96044921875, -19.5078125, -18.05517578125, -16.6025390625, -15.14990234375, -13.697265625, -12.24462890625, -10.7919921875, -9.33935546875, -7.88671875, -6.43408203125, -4.9814453125, -3.52880859375, -2.076171875, -0.62353515625, 0.8291015625, 2.28173828125, 3.734375, 5.18701171875, 6.6396484375, 8.09228515625, 9.544921875, 10.99755859375, 12.4501953125, 13.90283203125, 15.35546875, 16.80810546875, 18.2607421875, 19.71337890625, 21.166015625, 22.61865234375, 24.0712890625, 25.52392578125, 26.9765625, 28.42919921875, 29.8818359375, 31.33447265625, 32.787109375, 34.23974609375, 35.6923828125, 37.14501953125, 38.59765625, 40.05029296875, 41.5029296875, 42.95556640625, 44.408203125, 45.86083984375, 47.3134765625, 48.76611328125, 50.21875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 6.0, 4.0, 7.0, 9.0, 10.0, 8.0, 15.0, 23.0, 28.0, 42.0, 51.0, 62.0, 103.0, 176.0, 313.0, 514.0, 1050.0, 2603.0, 8631.0, 52634.0, 915961.0, 52835.0, 8403.0, 2649.0, 1024.0, 511.0, 327.0, 181.0, 99.0, 75.0, 44.0, 36.0, 30.0, 19.0, 19.0, 11.0, 11.0, 10.0, 6.0, 6.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-6.6328125, -6.4405517578125, -6.248291015625, -6.0560302734375, -5.86376953125, -5.6715087890625, -5.479248046875, -5.2869873046875, -5.0947265625, -4.9024658203125, -4.710205078125, -4.5179443359375, -4.32568359375, -4.1334228515625, -3.941162109375, -3.7489013671875, -3.556640625, -3.3643798828125, -3.172119140625, -2.9798583984375, -2.78759765625, -2.5953369140625, -2.403076171875, -2.2108154296875, -2.0185546875, -1.8262939453125, -1.634033203125, -1.4417724609375, -1.24951171875, -1.0572509765625, -0.864990234375, -0.6727294921875, -0.48046875, -0.2882080078125, -0.095947265625, 0.0963134765625, 0.28857421875, 0.4808349609375, 0.673095703125, 0.8653564453125, 1.0576171875, 1.2498779296875, 1.442138671875, 1.6343994140625, 1.82666015625, 2.0189208984375, 2.211181640625, 2.4034423828125, 2.595703125, 2.7879638671875, 2.980224609375, 3.1724853515625, 3.36474609375, 3.5570068359375, 3.749267578125, 3.9415283203125, 4.1337890625, 4.3260498046875, 4.518310546875, 4.7105712890625, 4.90283203125, 5.0950927734375, 5.287353515625, 5.4796142578125, 5.671875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 5.0, 10.0, 14.0, 6.0, 11.0, 28.0, 41.0, 70.0, 99.0, 137.0, 189.0, 135.0, 83.0, 47.0, 37.0, 34.0, 17.0, 12.0, 9.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.002765655517578125, -0.002684950828552246, -0.002604246139526367, -0.0025235414505004883, -0.0024428367614746094, -0.0023621320724487305, -0.0022814273834228516, -0.0022007226943969727, -0.0021200180053710938, -0.002039313316345215, -0.001958608627319336, -0.001877903938293457, -0.0017971992492675781, -0.0017164945602416992, -0.0016357898712158203, -0.0015550851821899414, -0.0014743804931640625, -0.0013936758041381836, -0.0013129711151123047, -0.0012322664260864258, -0.0011515617370605469, -0.001070857048034668, -0.000990152359008789, -0.0009094476699829102, -0.0008287429809570312, -0.0007480382919311523, -0.0006673336029052734, -0.0005866289138793945, -0.0005059242248535156, -0.0004252195358276367, -0.0003445148468017578, -0.0002638101577758789, -0.00018310546875, -0.0001024007797241211, -2.1696090698242188e-05, 5.900859832763672e-05, 0.00013971328735351562, 0.00022041797637939453, 0.00030112266540527344, 0.00038182735443115234, 0.00046253204345703125, 0.0005432367324829102, 0.0006239414215087891, 0.000704646110534668, 0.0007853507995605469, 0.0008660554885864258, 0.0009467601776123047, 0.0010274648666381836, 0.0011081695556640625, 0.0011888742446899414, 0.0012695789337158203, 0.0013502836227416992, 0.0014309883117675781, 0.001511693000793457, 0.001592397689819336, 0.0016731023788452148, 0.0017538070678710938, 0.0018345117568969727, 0.0019152164459228516, 0.0019959211349487305, 0.0020766258239746094, 0.0021573305130004883, 0.002238035202026367, 0.002318739891052246, 0.002399444580078125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 5.0, 3.0, 1.0, 9.0, 7.0, 9.0, 23.0, 29.0, 40.0, 87.0, 125.0, 241.0, 492.0, 1199.0, 3478.0, 17525.0, 767829.0, 237635.0, 14577.0, 3151.0, 1082.0, 463.0, 211.0, 129.0, 90.0, 48.0, 20.0, 18.0, 10.0, 9.0, 2.0, 3.0, 6.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.83984375, -4.66668701171875, -4.4935302734375, -4.32037353515625, -4.147216796875, -3.97406005859375, -3.8009033203125, -3.62774658203125, -3.45458984375, -3.28143310546875, -3.1082763671875, -2.93511962890625, -2.761962890625, -2.58880615234375, -2.4156494140625, -2.24249267578125, -2.0693359375, -1.89617919921875, -1.7230224609375, -1.54986572265625, -1.376708984375, -1.20355224609375, -1.0303955078125, -0.85723876953125, -0.68408203125, -0.51092529296875, -0.3377685546875, -0.16461181640625, 0.008544921875, 0.18170166015625, 0.3548583984375, 0.52801513671875, 0.701171875, 0.87432861328125, 1.0474853515625, 1.22064208984375, 1.393798828125, 1.56695556640625, 1.7401123046875, 1.91326904296875, 2.08642578125, 2.25958251953125, 2.4327392578125, 2.60589599609375, 2.779052734375, 2.95220947265625, 3.1253662109375, 3.29852294921875, 3.4716796875, 3.64483642578125, 3.8179931640625, 3.99114990234375, 4.164306640625, 4.33746337890625, 4.5106201171875, 4.68377685546875, 4.85693359375, 5.03009033203125, 5.2032470703125, 5.37640380859375, 5.549560546875, 5.72271728515625, 5.8958740234375, 6.06903076171875, 6.2421875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 5.0, 4.0, 2.0, 11.0, 12.0, 10.0, 6.0, 13.0, 33.0, 42.0, 43.0, 49.0, 84.0, 76.0, 93.0, 112.0, 68.0, 62.0, 50.0, 38.0, 27.0, 30.0, 18.0, 16.0, 15.0, 12.0, 12.0, 8.0, 8.0, 7.0, 3.0, 1.0, 5.0, 5.0, 3.0, 2.0, 1.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.05078125, -2.948486328125, -2.84619140625, -2.743896484375, -2.6416015625, -2.539306640625, -2.43701171875, -2.334716796875, -2.232421875, -2.130126953125, -2.02783203125, -1.925537109375, -1.8232421875, -1.720947265625, -1.61865234375, -1.516357421875, -1.4140625, -1.311767578125, -1.20947265625, -1.107177734375, -1.0048828125, -0.902587890625, -0.80029296875, -0.697998046875, -0.595703125, -0.493408203125, -0.39111328125, -0.288818359375, -0.1865234375, -0.084228515625, 0.01806640625, 0.120361328125, 0.22265625, 0.324951171875, 0.42724609375, 0.529541015625, 0.6318359375, 0.734130859375, 0.83642578125, 0.938720703125, 1.041015625, 1.143310546875, 1.24560546875, 1.347900390625, 1.4501953125, 1.552490234375, 1.65478515625, 1.757080078125, 1.859375, 1.961669921875, 2.06396484375, 2.166259765625, 2.2685546875, 2.370849609375, 2.47314453125, 2.575439453125, 2.677734375, 2.780029296875, 2.88232421875, 2.984619140625, 3.0869140625, 3.189208984375, 3.29150390625, 3.393798828125, 3.49609375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 4.0, 9.0, 9.0, 18.0, 16.0, 21.0, 27.0, 40.0, 67.0, 115.0, 417.0, 81.0, 52.0, 34.0, 25.0, 16.0, 12.0, 8.0, 6.0, 1.0, 8.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.13442993164062, -69.05243682861328, -65.97045135498047, -62.888458251953125, -59.80646514892578, -56.7244758605957, -53.642486572265625, -50.56049346923828, -47.47850036621094, -44.39651107788086, -41.314517974853516, -38.23252868652344, -35.150535583496094, -32.068546295166016, -28.986555099487305, -25.904563903808594, -22.822574615478516, -19.740583419799805, -16.658592224121094, -13.5766019821167, -10.494610786437988, -7.412619590759277, -4.330629348754883, -1.2486381530761719, 1.833353042602539, 4.91534423828125, 7.997334957122803, 11.079325675964355, 14.161316871643066, 17.243309020996094, 20.325298309326172, 23.407289505004883, 26.489280700683594, 29.571271896362305, 32.653263092041016, 35.735252380371094, 38.81724548339844, 41.899234771728516, 44.981224060058594, 48.06321716308594, 51.14521026611328, 54.22719955444336, 57.3091926574707, 60.39118194580078, 63.473175048828125, 66.55516815185547, 69.63715362548828, 72.71914672851562, 75.80113220214844, 78.88312530517578, 81.9651107788086, 85.04710388183594, 88.12909698486328, 91.21109008789062, 94.29307556152344, 97.37506866455078, 100.45706176757812, 103.53905487060547, 106.62104034423828, 109.70303344726562, 112.78502655029297, 115.86701965332031, 118.94900512695312, 122.03099822998047, 125.11299133300781]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 4.0, 9.0, 5.0, 4.0, 9.0, 13.0, 15.0, 13.0, 21.0, 16.0, 20.0, 30.0, 32.0, 29.0, 52.0, 195.0, 262.0, 72.0, 22.0, 15.0, 22.0, 31.0, 18.0, 20.0, 13.0, 10.0, 6.0, 5.0, 8.0, 5.0, 12.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-95.41090393066406, -92.34678649902344, -89.28266906738281, -86.21855163574219, -83.15443420410156, -80.09031677246094, -77.02619934082031, -73.96207427978516, -70.89795684814453, -67.8338394165039, -64.76972198486328, -61.705604553222656, -58.641483306884766, -55.57736587524414, -52.513248443603516, -49.449127197265625, -46.385013580322266, -43.32089614868164, -40.256778717041016, -37.192657470703125, -34.1285400390625, -31.064422607421875, -28.00030517578125, -24.936185836791992, -21.872068405151367, -18.807950973510742, -15.743831634521484, -12.67971420288086, -9.615595817565918, -6.551477432250977, -3.4873600006103516, -0.42324066162109375, 2.6408767700195312, 5.704995155334473, 8.769113540649414, 11.833230972290039, 14.89734935760498, 17.961467742919922, 21.025585174560547, 24.089704513549805, 27.15382194519043, 30.217939376831055, 33.28205871582031, 36.34617614746094, 39.41029357910156, 42.47441101074219, 45.53852844238281, 48.6026496887207, 51.66676712036133, 54.73088455200195, 57.79500198364258, 60.85912322998047, 63.923240661621094, 66.98735809326172, 70.05147552490234, 73.11559295654297, 76.1797103881836, 79.24382781982422, 82.30794525146484, 85.37206268310547, 88.4361801147461, 91.50030517578125, 94.56442260742188, 97.6285400390625, 100.69265747070312]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 5.0, 7.0, 10.0, 16.0, 15.0, 19.0, 30.0, 38.0, 50.0, 61.0, 190.0, 268.0, 84.0, 55.0, 44.0, 26.0, 26.0, 21.0, 10.0, 7.0, 4.0, 12.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.9609375, -8.5548095703125, -8.148681640625, -7.7425537109375, -7.33642578125, -6.9302978515625, -6.524169921875, -6.1180419921875, -5.7119140625, -5.3057861328125, -4.899658203125, -4.4935302734375, -4.08740234375, -3.6812744140625, -3.275146484375, -2.8690185546875, -2.462890625, -2.0567626953125, -1.650634765625, -1.2445068359375, -0.83837890625, -0.4322509765625, -0.026123046875, 0.3800048828125, 0.7861328125, 1.1922607421875, 1.598388671875, 2.0045166015625, 2.41064453125, 2.8167724609375, 3.222900390625, 3.6290283203125, 4.03515625, 4.4412841796875, 4.847412109375, 5.2535400390625, 5.65966796875, 6.0657958984375, 6.471923828125, 6.8780517578125, 7.2841796875, 7.6903076171875, 8.096435546875, 8.5025634765625, 8.90869140625, 9.3148193359375, 9.720947265625, 10.1270751953125, 10.533203125, 10.9393310546875, 11.345458984375, 11.7515869140625, 12.15771484375, 12.5638427734375, 12.969970703125, 13.3760986328125, 13.7822265625, 14.1883544921875, 14.594482421875, 15.0006103515625, 15.40673828125, 15.8128662109375, 16.218994140625, 16.6251220703125, 17.03125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 2.0, 0.0, 1.0, 4.0, 5.0, 9.0, 16.0, 30.0, 64.0, 193.0, 1149.0, 8147985.0, 237717.0, 1093.0, 194.0, 50.0, 28.0, 20.0, 13.0, 5.0, 9.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-310.53485107421875, -303.31011962890625, -296.0853576660156, -288.8606262207031, -281.6358642578125, -274.4111328125, -267.1863708496094, -259.9616394042969, -252.73687744140625, -245.5121307373047, -238.28738403320312, -231.06263732910156, -223.837890625, -216.61314392089844, -209.38839721679688, -202.16366577148438, -194.9389190673828, -187.71417236328125, -180.4894256591797, -173.26467895507812, -166.03993225097656, -158.815185546875, -151.5904541015625, -144.36569213867188, -137.14096069335938, -129.9162139892578, -122.69146728515625, -115.46672058105469, -108.24197387695312, -101.01722717285156, -93.79248809814453, -86.56774139404297, -79.34298706054688, -72.11824035644531, -64.89349365234375, -57.66875076293945, -50.44400405883789, -43.21925735473633, -35.99451446533203, -28.76976776123047, -21.545021057128906, -14.32027530670166, -7.095529556274414, 0.12921524047851562, 7.353961944580078, 14.57870864868164, 21.803451538085938, 29.0281982421875, 36.25294494628906, 43.477691650390625, 50.70243835449219, 57.927181243896484, 65.15193176269531, 72.37667846679688, 79.6014175415039, 86.82616424560547, 94.05091094970703, 101.2756576538086, 108.50040435791016, 115.72514343261719, 122.94989013671875, 130.1746368408203, 137.39938354492188, 144.62413024902344, 151.848876953125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 5.0, 2.0, 2.0, 5.0, 8.0, 5.0, 8.0, 12.0, 8.0, 8.0, 5.0, 6.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 4.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-175.32557678222656, -170.28524780273438, -165.2449188232422, -160.20458984375, -155.1642608642578, -150.12393188476562, -145.08360290527344, -140.04327392578125, -135.00294494628906, -129.96261596679688, -124.92228698730469, -119.8819580078125, -114.84162902832031, -109.80130004882812, -104.76097106933594, -99.72064208984375, -94.68031311035156, -89.63998413085938, -84.59965515136719, -79.559326171875, -74.51899719238281, -69.47866821289062, -64.43833923339844, -59.39801025390625, -54.35768127441406, -49.317352294921875, -44.27702331542969, -39.2366943359375, -34.19636535644531, -29.156036376953125, -24.115707397460938, -19.07537841796875, -14.035049438476562, -8.994720458984375, -3.9543914794921875, 1.0859375, 6.1262664794921875, 11.166595458984375, 16.206924438476562, 21.24725341796875, 26.287582397460938, 31.327911376953125, 36.36824035644531, 41.4085693359375, 46.44889831542969, 51.489227294921875, 56.52955627441406, 61.56988525390625, 66.61021423339844, 71.65054321289062, 76.69087219238281, 81.731201171875, 86.77153015136719, 91.81185913085938, 96.85218811035156, 101.89251708984375, 106.93284606933594, 111.97317504882812, 117.01350402832031, 122.0538330078125, 127.09416198730469, 132.13449096679688, 137.17481994628906, 142.21514892578125, 147.25547790527344]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 7.0, 4.0, 1.0, 9.0, 10.0, 13.0, 20.0, 30.0, 66.0, 128.0, 289.0, 754.0, 3007.0, 20586.0, 307493.0, 176904.0, 11825.0, 2004.0, 602.0, 249.0, 118.0, 55.0, 38.0, 23.0, 14.0, 7.0, 4.0, 5.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-162.625, -157.962890625, -153.30078125, -148.638671875, -143.9765625, -139.314453125, -134.65234375, -129.990234375, -125.328125, -120.666015625, -116.00390625, -111.341796875, -106.6796875, -102.017578125, -97.35546875, -92.693359375, -88.03125, -83.369140625, -78.70703125, -74.044921875, -69.3828125, -64.720703125, -60.05859375, -55.396484375, -50.734375, -46.072265625, -41.41015625, -36.748046875, -32.0859375, -27.423828125, -22.76171875, -18.099609375, -13.4375, -8.775390625, -4.11328125, 0.548828125, 5.2109375, 9.873046875, 14.53515625, 19.197265625, 23.859375, 28.521484375, 33.18359375, 37.845703125, 42.5078125, 47.169921875, 51.83203125, 56.494140625, 61.15625, 65.818359375, 70.48046875, 75.142578125, 79.8046875, 84.466796875, 89.12890625, 93.791015625, 98.453125, 103.115234375, 107.77734375, 112.439453125, 117.1015625, 121.763671875, 126.42578125, 131.087890625, 135.75]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 6.0, 7.0, 6.0, 13.0, 13.0, 25.0, 25.0, 52.0, 65.0, 69.0, 69.0, 106.0, 90.0, 102.0, 88.0, 67.0, 55.0, 46.0, 22.0, 17.0, 18.0, 12.0, 10.0, 9.0, 4.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3984375, -12.0169677734375, -11.635498046875, -11.2540283203125, -10.87255859375, -10.4910888671875, -10.109619140625, -9.7281494140625, -9.3466796875, -8.9652099609375, -8.583740234375, -8.2022705078125, -7.82080078125, -7.4393310546875, -7.057861328125, -6.6763916015625, -6.294921875, -5.9134521484375, -5.531982421875, -5.1505126953125, -4.76904296875, -4.3875732421875, -4.006103515625, -3.6246337890625, -3.2431640625, -2.8616943359375, -2.480224609375, -2.0987548828125, -1.71728515625, -1.3358154296875, -0.954345703125, -0.5728759765625, -0.19140625, 0.1900634765625, 0.571533203125, 0.9530029296875, 1.33447265625, 1.7159423828125, 2.097412109375, 2.4788818359375, 2.8603515625, 3.2418212890625, 3.623291015625, 4.0047607421875, 4.38623046875, 4.7677001953125, 5.149169921875, 5.5306396484375, 5.912109375, 6.2935791015625, 6.675048828125, 7.0565185546875, 7.43798828125, 7.8194580078125, 8.200927734375, 8.5823974609375, 8.9638671875, 9.3453369140625, 9.726806640625, 10.1082763671875, 10.48974609375, 10.8712158203125, 11.252685546875, 11.6341552734375, 12.015625]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 2.0, 4.0, 4.0, 9.0, 22.0, 63.0, 140.0, 113.0, 61.0, 26.0, 15.0, 12.0, 9.0, 4.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-133.50978088378906, -129.83786010742188, -126.16593933105469, -122.4940185546875, -118.82209014892578, -115.1501693725586, -111.4782485961914, -107.80632781982422, -104.13440704345703, -100.46248626708984, -96.79056549072266, -93.11863708496094, -89.44671630859375, -85.77479553222656, -82.10287475585938, -78.43095397949219, -74.759033203125, -71.08711242675781, -67.41519165039062, -63.74326705932617, -60.071346282958984, -56.39942169189453, -52.727500915527344, -49.055580139160156, -45.38365173339844, -41.71173095703125, -38.0398063659668, -34.36788558959961, -30.695964813232422, -27.0240421295166, -23.35211944580078, -19.680198669433594, -16.008277893066406, -12.336356163024902, -8.664434432983398, -4.992511749267578, -1.3205900192260742, 2.3513317108154297, 6.02325439453125, 9.695175170898438, 13.367097854614258, 17.039020538330078, 20.710941314697266, 24.382863998413086, 28.054786682128906, 31.726707458496094, 35.39862823486328, 39.07054901123047, 42.74247360229492, 46.41439437866211, 50.08631896972656, 53.75823974609375, 57.43016052246094, 61.102081298828125, 64.77400207519531, 68.4459228515625, 72.11785125732422, 75.7897720336914, 79.4616928100586, 83.13362121582031, 86.8055419921875, 90.47746276855469, 94.14938354492188, 97.82130432128906, 101.49322509765625]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 4.0, 1.0, 4.0, 4.0, 3.0, 2.0, 6.0, 0.0, 6.0, 16.0, 41.0, 63.0, 80.0, 93.0, 61.0, 35.0, 17.0, 12.0, 5.0, 5.0, 7.0, 3.0, 6.0, 4.0, 3.0, 1.0, 2.0, 1.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.763465881347656, -35.23151397705078, -33.699562072753906, -32.1676139831543, -30.635662078857422, -29.103710174560547, -27.571758270263672, -26.03980827331543, -24.507858276367188, -22.975906372070312, -21.44395637512207, -19.912004470825195, -18.380054473876953, -16.848102569580078, -15.31615161895752, -13.784200668334961, -12.252248764038086, -10.720297813415527, -9.188346862792969, -7.656395435333252, -6.124444484710693, -4.592493534088135, -3.060542106628418, -1.5285911560058594, 0.0033597946166992188, 1.5353108644485474, 3.0672619342803955, 4.599213123321533, 6.131164073944092, 7.66311502456665, 9.195066452026367, 10.727017402648926, 12.258968353271484, 13.790919303894043, 15.322870254516602, 16.854822158813477, 18.38677215576172, 19.918724060058594, 21.45067596435547, 22.98262596130371, 24.514575958251953, 26.046527862548828, 27.57847785949707, 29.110429763793945, 30.642379760742188, 32.17433166503906, 33.70628356933594, 35.23823547363281, 36.77018737792969, 38.30213928222656, 39.83409118652344, 41.36603927612305, 42.89799118041992, 44.4299430847168, 45.96189498901367, 47.49384307861328, 49.025794982910156, 50.55774688720703, 52.089698791503906, 53.621646881103516, 55.15359878540039, 56.685550689697266, 58.21750259399414, 59.74945068359375, 61.281402587890625]}, "_wandb": {"runtime": 2368}}