diff --git "a/wandb/run-20220301_082052-1y1by2yf/files/wandb-summary.json" "b/wandb/run-20220301_082052-1y1by2yf/files/wandb-summary.json" --- "a/wandb/run-20220301_082052-1y1by2yf/files/wandb-summary.json" +++ "b/wandb/run-20220301_082052-1y1by2yf/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 4.3963, "train/learning_rate": 2.976e-05, "train/epoch": 0.42, "train/global_step": 500, "_runtime": 2827, "_timestamp": 1646125679, "_step": 500, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 9.0, 70.0, 377.0, 448.0, 100.0, 11.0, 0.0, 1.0, 1.0], "bins": [-268.59259033203125, -263.96728515625, -259.3419494628906, -254.7166290283203, -250.09130859375, -245.4659881591797, -240.84066772460938, -236.21534729003906, -231.59002685546875, -226.96470642089844, -222.33938598632812, -217.7140655517578, -213.0887451171875, -208.4634246826172, -203.83810424804688, -199.21278381347656, -194.58746337890625, -189.96214294433594, -185.33682250976562, -180.7115020751953, -176.086181640625, -171.4608612060547, -166.83554077148438, -162.21022033691406, -157.58489990234375, -152.95957946777344, -148.33425903320312, -143.7089385986328, -139.0836181640625, -134.4582977294922, -129.83297729492188, -125.20765686035156, -120.58234405517578, -115.95702362060547, -111.33170318603516, -106.70638275146484, -102.08106231689453, -97.45574188232422, -92.8304214477539, -88.2051010131836, -83.57978057861328, -78.95446014404297, -74.32913970947266, -69.70381927490234, -65.07849884033203, -60.45317840576172, -55.827857971191406, -51.202537536621094, -46.57721710205078, -41.95189666748047, -37.326576232910156, -32.701255798339844, -28.07593536376953, -23.45061492919922, -18.825294494628906, -14.199974060058594, -9.574655532836914, -4.949335098266602, -0.32401466369628906, 4.301305770874023, 8.926626205444336, 13.551946640014648, 18.17726707458496, 22.802587509155273, 27.427907943725586]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 4.0, 8.0, 5.0, 15.0, 14.0, 17.0, 15.0, 10.0, 23.0, 20.0, 25.0, 23.0, 28.0, 28.0, 36.0, 37.0, 30.0, 43.0, 35.0, 40.0, 58.0, 34.0, 43.0, 38.0, 41.0, 37.0, 31.0, 32.0, 23.0, 24.0, 25.0, 26.0, 24.0, 12.0, 17.0, 17.0, 9.0, 9.0, 8.0, 8.0, 7.0, 7.0, 3.0, 4.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-47.99211120605469, -46.43101119995117, -44.869911193847656, -43.308815002441406, -41.74771499633789, -40.186614990234375, -38.62551498413086, -37.064414978027344, -35.503318786621094, -33.94221878051758, -32.38111877441406, -30.82002067565918, -29.258922576904297, -27.69782257080078, -26.136722564697266, -24.57562255859375, -23.014522552490234, -21.45342254638672, -19.892324447631836, -18.33122444152832, -16.770126342773438, -15.209026336669922, -13.647926330566406, -12.086827278137207, -10.525728225708008, -8.964629173278809, -7.403529644012451, -5.842430114746094, -4.2813310623168945, -2.7202320098876953, -1.1591320037841797, 0.40196704864501953, 1.9630622863769531, 3.5241615772247314, 5.08526086807251, 6.646360397338867, 8.207459449768066, 9.768558502197266, 11.329658508300781, 12.89075756072998, 14.45185661315918, 16.012956619262695, 17.574054718017578, 19.135154724121094, 20.69625473022461, 22.257352828979492, 23.818452835083008, 25.37955093383789, 26.940650939941406, 28.501750946044922, 30.062849044799805, 31.62394905090332, 33.1850471496582, 34.74614715576172, 36.307247161865234, 37.86834716796875, 39.429443359375, 40.990543365478516, 42.55164337158203, 44.11273956298828, 45.6738395690918, 47.23493957519531, 48.79603958129883, 50.357139587402344, 51.91823959350586]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 1.0, 6.0, 2.0, 7.0, 9.0, 13.0, 8.0, 15.0, 13.0, 17.0, 16.0, 19.0, 20.0, 27.0, 26.0, 28.0, 44.0, 30.0, 36.0, 37.0, 39.0, 31.0, 39.0, 52.0, 35.0, 47.0, 51.0, 37.0, 30.0, 32.0, 27.0, 19.0, 23.0, 32.0, 18.0, 19.0, 15.0, 11.0, 13.0, 11.0, 14.0, 15.0, 4.0, 3.0, 3.0, 2.0, 2.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0], "bins": [-2.884765625, -2.797698974609375, -2.71063232421875, -2.623565673828125, -2.5364990234375, -2.449432373046875, -2.36236572265625, -2.275299072265625, -2.188232421875, -2.101165771484375, -2.01409912109375, -1.927032470703125, -1.8399658203125, -1.752899169921875, -1.66583251953125, -1.578765869140625, -1.49169921875, -1.404632568359375, -1.31756591796875, -1.230499267578125, -1.1434326171875, -1.056365966796875, -0.96929931640625, -0.882232666015625, -0.795166015625, -0.708099365234375, -0.62103271484375, -0.533966064453125, -0.4468994140625, -0.359832763671875, -0.27276611328125, -0.185699462890625, -0.0986328125, -0.011566162109375, 0.07550048828125, 0.162567138671875, 0.2496337890625, 0.336700439453125, 0.42376708984375, 0.510833740234375, 0.597900390625, 0.684967041015625, 0.77203369140625, 0.859100341796875, 0.9461669921875, 1.033233642578125, 1.12030029296875, 1.207366943359375, 1.29443359375, 1.381500244140625, 1.46856689453125, 1.555633544921875, 1.6427001953125, 1.729766845703125, 1.81683349609375, 1.903900146484375, 1.990966796875, 2.078033447265625, 2.16510009765625, 2.252166748046875, 2.3392333984375, 2.426300048828125, 2.51336669921875, 2.600433349609375, 2.6875]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 1.0, 5.0, 7.0, 8.0, 5.0, 4.0, 7.0, 12.0, 26.0, 26.0, 40.0, 42.0, 48.0, 84.0, 101.0, 136.0, 147.0, 215.0, 316.0, 498.0, 704.0, 1240.0, 1910.0, 3408.0, 6862.0, 16326.0, 52557.0, 301008.0, 2268364.0, 1332880.0, 147828.0, 33911.0, 12204.0, 5375.0, 2869.0, 1678.0, 1028.0, 712.0, 491.0, 329.0, 201.0, 155.0, 127.0, 101.0, 71.0, 61.0, 35.0, 33.0, 35.0, 14.0, 11.0, 8.0, 5.0, 9.0, 1.0, 5.0, 2.0, 4.0, 4.0, 2.0], "bins": [-9.6015625, -9.30908203125, -9.0166015625, -8.72412109375, -8.431640625, -8.13916015625, -7.8466796875, -7.55419921875, -7.26171875, -6.96923828125, -6.6767578125, -6.38427734375, -6.091796875, -5.79931640625, -5.5068359375, -5.21435546875, -4.921875, -4.62939453125, -4.3369140625, -4.04443359375, -3.751953125, -3.45947265625, -3.1669921875, -2.87451171875, -2.58203125, -2.28955078125, -1.9970703125, -1.70458984375, -1.412109375, -1.11962890625, -0.8271484375, -0.53466796875, -0.2421875, 0.05029296875, 0.3427734375, 0.63525390625, 0.927734375, 1.22021484375, 1.5126953125, 1.80517578125, 2.09765625, 2.39013671875, 2.6826171875, 2.97509765625, 3.267578125, 3.56005859375, 3.8525390625, 4.14501953125, 4.4375, 4.72998046875, 5.0224609375, 5.31494140625, 5.607421875, 5.89990234375, 6.1923828125, 6.48486328125, 6.77734375, 7.06982421875, 7.3623046875, 7.65478515625, 7.947265625, 8.23974609375, 8.5322265625, 8.82470703125, 9.1171875]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 3.0, 10.0, 15.0, 54.0, 102.0, 287.0, 739.0, 1439.0, 856.0, 343.0, 149.0, 43.0, 28.0, 10.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.15625, -42.119140625, -41.08203125, -40.044921875, -39.0078125, -37.970703125, -36.93359375, -35.896484375, -34.859375, -33.822265625, -32.78515625, -31.748046875, -30.7109375, -29.673828125, -28.63671875, -27.599609375, -26.5625, -25.525390625, -24.48828125, -23.451171875, -22.4140625, -21.376953125, -20.33984375, -19.302734375, -18.265625, -17.228515625, -16.19140625, -15.154296875, -14.1171875, -13.080078125, -12.04296875, -11.005859375, -9.96875, -8.931640625, -7.89453125, -6.857421875, -5.8203125, -4.783203125, -3.74609375, -2.708984375, -1.671875, -0.634765625, 0.40234375, 1.439453125, 2.4765625, 3.513671875, 4.55078125, 5.587890625, 6.625, 7.662109375, 8.69921875, 9.736328125, 10.7734375, 11.810546875, 12.84765625, 13.884765625, 14.921875, 15.958984375, 16.99609375, 18.033203125, 19.0703125, 20.107421875, 21.14453125, 22.181640625, 23.21875]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 6.0, 13.0, 28.0, 75.0, 254.0, 846.0, 4298.0, 4171038.0, 15974.0, 1217.0, 354.0, 117.0, 32.0, 24.0, 8.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-127.8125, -123.7744140625, -119.736328125, -115.6982421875, -111.66015625, -107.6220703125, -103.583984375, -99.5458984375, -95.5078125, -91.4697265625, -87.431640625, -83.3935546875, -79.35546875, -75.3173828125, -71.279296875, -67.2412109375, -63.203125, -59.1650390625, -55.126953125, -51.0888671875, -47.05078125, -43.0126953125, -38.974609375, -34.9365234375, -30.8984375, -26.8603515625, -22.822265625, -18.7841796875, -14.74609375, -10.7080078125, -6.669921875, -2.6318359375, 1.40625, 5.4443359375, 9.482421875, 13.5205078125, 17.55859375, 21.5966796875, 25.634765625, 29.6728515625, 33.7109375, 37.7490234375, 41.787109375, 45.8251953125, 49.86328125, 53.9013671875, 57.939453125, 61.9775390625, 66.015625, 70.0537109375, 74.091796875, 78.1298828125, 82.16796875, 86.2060546875, 90.244140625, 94.2822265625, 98.3203125, 102.3583984375, 106.396484375, 110.4345703125, 114.47265625, 118.5107421875, 122.548828125, 126.5869140625, 130.625]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 8.0, 20.0, 107.0, 258.0, 382.0, 176.0, 48.0, 15.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-118.37948608398438, -115.2860336303711, -112.19258117675781, -109.09912109375, -106.00566864013672, -102.91221618652344, -99.81876373291016, -96.72531127929688, -93.63185119628906, -90.53839874267578, -87.4449462890625, -84.35148620605469, -81.2580337524414, -78.16458129882812, -75.07112884521484, -71.97767639160156, -68.88422393798828, -65.790771484375, -62.69731521606445, -59.60386276245117, -56.510406494140625, -53.416954040527344, -50.32350158691406, -47.23004913330078, -44.136592864990234, -41.04314041137695, -37.949684143066406, -34.856231689453125, -31.76277732849121, -28.669322967529297, -25.575870513916016, -22.4824161529541, -19.38896942138672, -16.295515060424805, -13.202061653137207, -10.10860824584961, -7.015153884887695, -3.9216995239257812, -0.8282470703125, 2.265207290649414, 5.358661651611328, 8.452116012573242, 11.54556941986084, 14.639022827148438, 17.73247718811035, 20.825931549072266, 23.919384002685547, 27.01283836364746, 30.106292724609375, 33.199745178222656, 36.2932014465332, 39.386653900146484, 42.48011016845703, 45.57356262207031, 48.667015075683594, 51.760467529296875, 54.85392379760742, 57.9473762512207, 61.04083251953125, 64.13428497314453, 67.22773742675781, 70.32119750976562, 73.41464233398438, 76.50810241699219, 79.60155487060547]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 9.0, 6.0, 10.0, 8.0, 12.0, 22.0, 11.0, 38.0, 26.0, 25.0, 36.0, 36.0, 49.0, 31.0, 45.0, 48.0, 35.0, 49.0, 33.0, 45.0, 39.0, 45.0, 35.0, 36.0, 38.0, 31.0, 42.0, 30.0, 21.0, 18.0, 13.0, 21.0, 24.0, 8.0, 14.0, 5.0, 2.0, 5.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.15552520751953, -37.875423431396484, -36.59531784057617, -35.315216064453125, -34.03511428833008, -32.75501251220703, -31.47490692138672, -30.194805145263672, -28.914701461791992, -27.634597778320312, -26.354496002197266, -25.074392318725586, -23.794288635253906, -22.51418685913086, -21.23408317565918, -19.9539794921875, -18.673877716064453, -17.393774032592773, -16.113672256469727, -14.833568572998047, -13.553465843200684, -12.27336311340332, -10.99325942993164, -9.713156700134277, -8.433053970336914, -7.152951240539551, -5.872848033905029, -4.592744827270508, -3.3126420974731445, -2.0325393676757812, -0.7524361610412598, 0.5276670455932617, 1.807769775390625, 3.0878727436065674, 4.36797571182251, 5.648078918457031, 6.9281816482543945, 8.208284378051758, 9.488388061523438, 10.7684907913208, 12.048593521118164, 13.328696250915527, 14.60879898071289, 15.88890266418457, 17.16900634765625, 18.449108123779297, 19.729211807250977, 21.009315490722656, 22.289417266845703, 23.569520950317383, 24.84962272644043, 26.12972640991211, 27.409828186035156, 28.689931869506836, 29.970035552978516, 31.250137329101562, 32.530242919921875, 33.81034469604492, 35.090450286865234, 36.37055206298828, 37.65065383911133, 38.930755615234375, 40.21086120605469, 41.490962982177734, 42.77106475830078]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 2.0, 3.0, 2.0, 4.0, 2.0, 7.0, 10.0, 16.0, 12.0, 15.0, 19.0, 28.0, 24.0, 21.0, 25.0, 35.0, 43.0, 42.0, 39.0, 46.0, 51.0, 41.0, 45.0, 43.0, 45.0, 39.0, 43.0, 48.0, 36.0, 34.0, 29.0, 28.0, 22.0, 27.0, 22.0, 15.0, 16.0, 4.0, 5.0, 9.0, 3.0, 8.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.609375, -3.5010986328125, -3.392822265625, -3.2845458984375, -3.17626953125, -3.0679931640625, -2.959716796875, -2.8514404296875, -2.7431640625, -2.6348876953125, -2.526611328125, -2.4183349609375, -2.31005859375, -2.2017822265625, -2.093505859375, -1.9852294921875, -1.876953125, -1.7686767578125, -1.660400390625, -1.5521240234375, -1.44384765625, -1.3355712890625, -1.227294921875, -1.1190185546875, -1.0107421875, -0.9024658203125, -0.794189453125, -0.6859130859375, -0.57763671875, -0.4693603515625, -0.361083984375, -0.2528076171875, -0.14453125, -0.0362548828125, 0.072021484375, 0.1802978515625, 0.28857421875, 0.3968505859375, 0.505126953125, 0.6134033203125, 0.7216796875, 0.8299560546875, 0.938232421875, 1.0465087890625, 1.15478515625, 1.2630615234375, 1.371337890625, 1.4796142578125, 1.587890625, 1.6961669921875, 1.804443359375, 1.9127197265625, 2.02099609375, 2.1292724609375, 2.237548828125, 2.3458251953125, 2.4541015625, 2.5623779296875, 2.670654296875, 2.7789306640625, 2.88720703125, 2.9954833984375, 3.103759765625, 3.2120361328125, 3.3203125]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 6.0, 4.0, 9.0, 21.0, 27.0, 29.0, 51.0, 72.0, 99.0, 160.0, 210.0, 361.0, 527.0, 833.0, 1320.0, 2068.0, 3450.0, 5770.0, 9793.0, 17405.0, 31274.0, 59105.0, 116141.0, 218182.0, 258485.0, 152598.0, 77748.0, 40244.0, 21884.0, 12409.0, 7043.0, 4219.0, 2574.0, 1568.0, 1020.0, 599.0, 433.0, 276.0, 170.0, 118.0, 78.0, 59.0, 42.0, 24.0, 14.0, 13.0, 13.0, 5.0, 6.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.363037109375, -0.3510169982910156, -0.33899688720703125, -0.3269767761230469, -0.3149566650390625, -0.3029365539550781, -0.29091644287109375, -0.2788963317871094, -0.266876220703125, -0.2548561096191406, -0.24283599853515625, -0.23081588745117188, -0.2187957763671875, -0.20677566528320312, -0.19475555419921875, -0.18273544311523438, -0.17071533203125, -0.15869522094726562, -0.14667510986328125, -0.13465499877929688, -0.1226348876953125, -0.11061477661132812, -0.09859466552734375, -0.08657455444335938, -0.074554443359375, -0.06253433227539062, -0.05051422119140625, -0.038494110107421875, -0.0264739990234375, -0.014453887939453125, -0.00243377685546875, 0.009586334228515625, 0.0216064453125, 0.033626556396484375, 0.04564666748046875, 0.057666778564453125, 0.0696868896484375, 0.08170700073242188, 0.09372711181640625, 0.10574722290039062, 0.117767333984375, 0.12978744506835938, 0.14180755615234375, 0.15382766723632812, 0.1658477783203125, 0.17786788940429688, 0.18988800048828125, 0.20190811157226562, 0.21392822265625, 0.22594833374023438, 0.23796844482421875, 0.24998855590820312, 0.2620086669921875, 0.2740287780761719, 0.28604888916015625, 0.2980690002441406, 0.310089111328125, 0.3221092224121094, 0.33412933349609375, 0.3461494445800781, 0.3581695556640625, 0.3701896667480469, 0.38220977783203125, 0.3942298889160156, 0.40625]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 4.0, 1.0, 3.0, 1.0, 1.0, 5.0, 5.0, 9.0, 9.0, 10.0, 23.0, 9.0, 12.0, 15.0, 18.0, 14.0, 18.0, 23.0, 32.0, 26.0, 35.0, 27.0, 39.0, 27.0, 31.0, 41.0, 39.0, 1062.0, 38.0, 39.0, 29.0, 31.0, 31.0, 26.0, 25.0, 32.0, 22.0, 35.0, 25.0, 26.0, 30.0, 23.0, 14.0, 17.0, 8.0, 11.0, 11.0, 4.0, 8.0, 2.0, 2.0, 4.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0], "bins": [-1.7734375, -1.7162017822265625, -1.658966064453125, -1.6017303466796875, -1.54449462890625, -1.4872589111328125, -1.430023193359375, -1.3727874755859375, -1.3155517578125, -1.2583160400390625, -1.201080322265625, -1.1438446044921875, -1.08660888671875, -1.0293731689453125, -0.972137451171875, -0.9149017333984375, -0.857666015625, -0.8004302978515625, -0.743194580078125, -0.6859588623046875, -0.62872314453125, -0.5714874267578125, -0.514251708984375, -0.4570159912109375, -0.3997802734375, -0.3425445556640625, -0.285308837890625, -0.2280731201171875, -0.17083740234375, -0.1136016845703125, -0.056365966796875, 0.0008697509765625, 0.05810546875, 0.1153411865234375, 0.172576904296875, 0.2298126220703125, 0.28704833984375, 0.3442840576171875, 0.401519775390625, 0.4587554931640625, 0.5159912109375, 0.5732269287109375, 0.630462646484375, 0.6876983642578125, 0.74493408203125, 0.8021697998046875, 0.859405517578125, 0.9166412353515625, 0.973876953125, 1.0311126708984375, 1.088348388671875, 1.1455841064453125, 1.20281982421875, 1.2600555419921875, 1.317291259765625, 1.3745269775390625, 1.4317626953125, 1.4889984130859375, 1.546234130859375, 1.6034698486328125, 1.66070556640625, 1.7179412841796875, 1.775177001953125, 1.8324127197265625, 1.8896484375]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 2.0, 11.0, 7.0, 9.0, 9.0, 16.0, 52.0, 62.0, 64.0, 132.0, 180.0, 259.0, 371.0, 598.0, 965.0, 1353.0, 2169.0, 3073.0, 4734.0, 7357.0, 11798.0, 18582.0, 30382.0, 49936.0, 82156.0, 132468.0, 1234795.0, 187769.0, 125672.0, 77517.0, 46836.0, 28676.0, 17595.0, 11026.0, 7116.0, 4550.0, 2997.0, 1965.0, 1332.0, 894.0, 539.0, 397.0, 242.0, 158.0, 92.0, 62.0, 56.0, 36.0, 26.0, 19.0, 9.0, 6.0, 6.0, 4.0, 2.0, 2.0], "bins": [-0.30126953125, -0.2926483154296875, -0.284027099609375, -0.2754058837890625, -0.26678466796875, -0.2581634521484375, -0.249542236328125, -0.2409210205078125, -0.2322998046875, -0.2236785888671875, -0.215057373046875, -0.2064361572265625, -0.19781494140625, -0.1891937255859375, -0.180572509765625, -0.1719512939453125, -0.163330078125, -0.1547088623046875, -0.146087646484375, -0.1374664306640625, -0.12884521484375, -0.1202239990234375, -0.111602783203125, -0.1029815673828125, -0.0943603515625, -0.0857391357421875, -0.077117919921875, -0.0684967041015625, -0.05987548828125, -0.0512542724609375, -0.042633056640625, -0.0340118408203125, -0.025390625, -0.0167694091796875, -0.008148193359375, 0.0004730224609375, 0.00909423828125, 0.0177154541015625, 0.026336669921875, 0.0349578857421875, 0.0435791015625, 0.0522003173828125, 0.060821533203125, 0.0694427490234375, 0.07806396484375, 0.0866851806640625, 0.095306396484375, 0.1039276123046875, 0.112548828125, 0.1211700439453125, 0.129791259765625, 0.1384124755859375, 0.14703369140625, 0.1556549072265625, 0.164276123046875, 0.1728973388671875, 0.1815185546875, 0.1901397705078125, 0.198760986328125, 0.2073822021484375, 0.21600341796875, 0.2246246337890625, 0.233245849609375, 0.2418670654296875, 0.25048828125]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 4.0, 1.0, 6.0, 6.0, 13.0, 5.0, 10.0, 13.0, 17.0, 18.0, 15.0, 23.0, 24.0, 29.0, 40.0, 43.0, 29.0, 29.0, 34.0, 42.0, 39.0, 39.0, 40.0, 36.0, 41.0, 40.0, 40.0, 50.0, 28.0, 30.0, 29.0, 24.0, 22.0, 21.0, 25.0, 17.0, 13.0, 10.0, 10.0, 9.0, 9.0, 9.0, 7.0, 4.0, 8.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.0004277229309082031, -0.00041572004556655884, -0.00040371716022491455, -0.00039171427488327026, -0.000379711389541626, -0.0003677085041999817, -0.0003557056188583374, -0.0003437027335166931, -0.00033169984817504883, -0.00031969696283340454, -0.00030769407749176025, -0.00029569119215011597, -0.0002836883068084717, -0.0002716854214668274, -0.0002596825361251831, -0.0002476796507835388, -0.00023567676544189453, -0.00022367388010025024, -0.00021167099475860596, -0.00019966810941696167, -0.00018766522407531738, -0.0001756623387336731, -0.0001636594533920288, -0.00015165656805038452, -0.00013965368270874023, -0.00012765079736709595, -0.00011564791202545166, -0.00010364502668380737, -9.164214134216309e-05, -7.96392560005188e-05, -6.763637065887451e-05, -5.5633485317230225e-05, -4.363059997558594e-05, -3.162771463394165e-05, -1.9624829292297363e-05, -7.621943950653076e-06, 4.380941390991211e-06, 1.6383826732635498e-05, 2.8386712074279785e-05, 4.038959741592407e-05, 5.239248275756836e-05, 6.439536809921265e-05, 7.639825344085693e-05, 8.840113878250122e-05, 0.00010040402412414551, 0.0001124069094657898, 0.00012440979480743408, 0.00013641268014907837, 0.00014841556549072266, 0.00016041845083236694, 0.00017242133617401123, 0.00018442422151565552, 0.0001964271068572998, 0.0002084299921989441, 0.00022043287754058838, 0.00023243576288223267, 0.00024443864822387695, 0.00025644153356552124, 0.00026844441890716553, 0.0002804473042488098, 0.0002924501895904541, 0.0003044530749320984, 0.0003164559602737427, 0.00032845884561538696, 0.00034046173095703125]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 7.0, 7.0, 10.0, 8.0, 18.0, 17.0, 28.0, 18.0, 27.0, 41.0, 30.0, 62.0, 64.0, 64.0, 72.0, 103.0, 116.0, 156.0, 195.0, 277.0, 352.0, 496.0, 1092.0, 439657.0, 602372.0, 1178.0, 472.0, 342.0, 244.0, 185.0, 148.0, 126.0, 86.0, 84.0, 66.0, 60.0, 45.0, 50.0, 35.0, 34.0, 23.0, 28.0, 15.0, 18.0, 9.0, 7.0, 4.0, 7.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0066375732421875, -0.006416499614715576, -0.006195425987243652, -0.0059743523597717285, -0.005753278732299805, -0.005532205104827881, -0.005311131477355957, -0.005090057849884033, -0.004868984222412109, -0.0046479105949401855, -0.004426836967468262, -0.004205763339996338, -0.003984689712524414, -0.0037636160850524902, -0.0035425424575805664, -0.0033214688301086426, -0.0031003952026367188, -0.002879321575164795, -0.002658247947692871, -0.0024371743202209473, -0.0022161006927490234, -0.0019950270652770996, -0.0017739534378051758, -0.001552879810333252, -0.0013318061828613281, -0.0011107325553894043, -0.0008896589279174805, -0.0006685853004455566, -0.0004475116729736328, -0.00022643804550170898, -5.364418029785156e-06, 0.00021570920944213867, 0.0004367828369140625, 0.0006578564643859863, 0.0008789300918579102, 0.001100003719329834, 0.0013210773468017578, 0.0015421509742736816, 0.0017632246017456055, 0.0019842982292175293, 0.002205371856689453, 0.002426445484161377, 0.0026475191116333008, 0.0028685927391052246, 0.0030896663665771484, 0.0033107399940490723, 0.003531813621520996, 0.00375288724899292, 0.003973960876464844, 0.004195034503936768, 0.004416108131408691, 0.004637181758880615, 0.004858255386352539, 0.005079329013824463, 0.005300402641296387, 0.0055214762687683105, 0.005742549896240234, 0.005963623523712158, 0.006184697151184082, 0.006405770778656006, 0.00662684440612793, 0.0068479180335998535, 0.007068991661071777, 0.007290065288543701, 0.007511138916015625]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 14.0, 567.0, 428.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009308363078162074, -0.0008816313347779214, -0.0008324263617396355, -0.0007832214469090104, -0.0007340164738707244, -0.0006848115008324385, -0.0006356065860018134, -0.0005864016129635274, -0.0005371966399252415, -0.0004879916668869555, -0.0004387867229525, -0.00038958177901804447, -0.0003403768059797585, -0.00029117183294147253, -0.00024196688900701702, -0.0001927619450725615, -0.00014355697203427553, -9.435201354790479e-05, -4.514705506153405e-05, 4.057903424836695e-06, 5.326286191120744e-05, 0.00010246783494949341, 0.00015167277888394892, 0.00020087772281840444, 0.0002500826958566904, 0.0002992876688949764, 0.0003484926128294319, 0.0003976975567638874, 0.0004469025298021734, 0.0004961075028404593, 0.0005453124176710844, 0.0005945173907093704, 0.0006437224801629782, 0.0006929274532012641, 0.0007421324262395501, 0.0007913373410701752, 0.0008405423141084611, 0.0008897472871467471, 0.0009389522019773722, 0.000988157233223319, 0.0010373621480539441, 0.0010865670628845692, 0.001135772094130516, 0.0011849770089611411, 0.0012341819237917662, 0.001283386955037713, 0.001332591869868338, 0.0013817967846989632, 0.00143100181594491, 0.001480206730775535, 0.001529411762021482, 0.001578616676852107, 0.001627821708098054, 0.001677026622928679, 0.001726231537759304, 0.001775436569005251, 0.001824641483835876, 0.001873846398666501, 0.001923051429912448, 0.001972256461158395, 0.002021461259573698, 0.002070666290819645, 0.002119871322065592, 0.002169076120480895, 0.002218281151726842]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 5.0, 10.0, 6.0, 9.0, 13.0, 18.0, 20.0, 13.0, 23.0, 17.0, 24.0, 31.0, 19.0, 26.0, 38.0, 37.0, 51.0, 40.0, 39.0, 42.0, 34.0, 40.0, 36.0, 35.0, 39.0, 34.0, 44.0, 33.0, 26.0, 24.0, 21.0, 22.0, 23.0, 18.0, 22.0, 9.0, 11.0, 6.0, 8.0, 5.0, 6.0, 9.0, 4.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00023990869522094727, -0.00023235194385051727, -0.00022479519248008728, -0.0002172384411096573, -0.0002096816897392273, -0.0002021249383687973, -0.0001945681869983673, -0.00018701143562793732, -0.00017945468425750732, -0.00017189793288707733, -0.00016434118151664734, -0.00015678443014621735, -0.00014922767877578735, -0.00014167092740535736, -0.00013411417603492737, -0.00012655742466449738, -0.00011900067329406738, -0.00011144392192363739, -0.0001038871705532074, -9.63304191827774e-05, -8.877366781234741e-05, -8.121691644191742e-05, -7.366016507148743e-05, -6.610341370105743e-05, -5.854666233062744e-05, -5.098991096019745e-05, -4.3433159589767456e-05, -3.587640821933746e-05, -2.831965684890747e-05, -2.0762905478477478e-05, -1.3206154108047485e-05, -5.649402737617493e-06, 1.9073486328125e-06, 9.464100003242493e-06, 1.7020851373672485e-05, 2.4577602744102478e-05, 3.213435411453247e-05, 3.969110548496246e-05, 4.7247856855392456e-05, 5.480460822582245e-05, 6.236135959625244e-05, 6.991811096668243e-05, 7.747486233711243e-05, 8.503161370754242e-05, 9.258836507797241e-05, 0.0001001451164484024, 0.0001077018678188324, 0.00011525861918926239, 0.00012281537055969238, 0.00013037212193012238, 0.00013792887330055237, 0.00014548562467098236, 0.00015304237604141235, 0.00016059912741184235, 0.00016815587878227234, 0.00017571263015270233, 0.00018326938152313232, 0.00019082613289356232, 0.0001983828842639923, 0.0002059396356344223, 0.0002134963870048523, 0.0002210531383752823, 0.00022860988974571228, 0.00023616664111614227, 0.00024372339248657227]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 2.0, 3.0, 2.0, 4.0, 2.0, 7.0, 10.0, 16.0, 12.0, 15.0, 19.0, 28.0, 24.0, 21.0, 25.0, 35.0, 43.0, 42.0, 39.0, 46.0, 51.0, 41.0, 45.0, 43.0, 45.0, 39.0, 43.0, 48.0, 36.0, 34.0, 29.0, 28.0, 22.0, 27.0, 22.0, 15.0, 16.0, 4.0, 5.0, 9.0, 3.0, 8.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.609375, -3.5010986328125, -3.392822265625, -3.2845458984375, -3.17626953125, -3.0679931640625, -2.959716796875, -2.8514404296875, -2.7431640625, -2.6348876953125, -2.526611328125, -2.4183349609375, -2.31005859375, -2.2017822265625, -2.093505859375, -1.9852294921875, -1.876953125, -1.7686767578125, -1.660400390625, -1.5521240234375, -1.44384765625, -1.3355712890625, -1.227294921875, -1.1190185546875, -1.0107421875, -0.9024658203125, -0.794189453125, -0.6859130859375, -0.57763671875, -0.4693603515625, -0.361083984375, -0.2528076171875, -0.14453125, -0.0362548828125, 0.072021484375, 0.1802978515625, 0.28857421875, 0.3968505859375, 0.505126953125, 0.6134033203125, 0.7216796875, 0.8299560546875, 0.938232421875, 1.0465087890625, 1.15478515625, 1.2630615234375, 1.371337890625, 1.4796142578125, 1.587890625, 1.6961669921875, 1.804443359375, 1.9127197265625, 2.02099609375, 2.1292724609375, 2.237548828125, 2.3458251953125, 2.4541015625, 2.5623779296875, 2.670654296875, 2.7789306640625, 2.88720703125, 2.9954833984375, 3.103759765625, 3.2120361328125, 3.3203125]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 7.0, 13.0, 19.0, 11.0, 31.0, 36.0, 48.0, 70.0, 109.0, 167.0, 215.0, 324.0, 472.0, 625.0, 935.0, 1439.0, 2130.0, 3551.0, 6250.0, 12784.0, 38346.0, 736301.0, 199202.0, 22381.0, 9584.0, 4896.0, 2866.0, 1807.0, 1266.0, 817.0, 569.0, 383.0, 245.0, 182.0, 162.0, 90.0, 60.0, 42.0, 41.0, 22.0, 23.0, 13.0, 8.0, 9.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.25, -18.644775390625, -18.03955078125, -17.434326171875, -16.8291015625, -16.223876953125, -15.61865234375, -15.013427734375, -14.408203125, -13.802978515625, -13.19775390625, -12.592529296875, -11.9873046875, -11.382080078125, -10.77685546875, -10.171630859375, -9.56640625, -8.961181640625, -8.35595703125, -7.750732421875, -7.1455078125, -6.540283203125, -5.93505859375, -5.329833984375, -4.724609375, -4.119384765625, -3.51416015625, -2.908935546875, -2.3037109375, -1.698486328125, -1.09326171875, -0.488037109375, 0.1171875, 0.722412109375, 1.32763671875, 1.932861328125, 2.5380859375, 3.143310546875, 3.74853515625, 4.353759765625, 4.958984375, 5.564208984375, 6.16943359375, 6.774658203125, 7.3798828125, 7.985107421875, 8.59033203125, 9.195556640625, 9.80078125, 10.406005859375, 11.01123046875, 11.616455078125, 12.2216796875, 12.826904296875, 13.43212890625, 14.037353515625, 14.642578125, 15.247802734375, 15.85302734375, 16.458251953125, 17.0634765625, 17.668701171875, 18.27392578125, 18.879150390625, 19.484375]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 3.0, 7.0, 6.0, 9.0, 16.0, 14.0, 12.0, 18.0, 26.0, 24.0, 34.0, 42.0, 38.0, 39.0, 52.0, 68.0, 72.0, 190.0, 1595.0, 256.0, 105.0, 60.0, 49.0, 49.0, 40.0, 32.0, 24.0, 27.0, 27.0, 22.0, 20.0, 20.0, 8.0, 10.0, 6.0, 9.0, 4.0, 6.0, 2.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.90625, -10.5718994140625, -10.237548828125, -9.9031982421875, -9.56884765625, -9.2344970703125, -8.900146484375, -8.5657958984375, -8.2314453125, -7.8970947265625, -7.562744140625, -7.2283935546875, -6.89404296875, -6.5596923828125, -6.225341796875, -5.8909912109375, -5.556640625, -5.2222900390625, -4.887939453125, -4.5535888671875, -4.21923828125, -3.8848876953125, -3.550537109375, -3.2161865234375, -2.8818359375, -2.5474853515625, -2.213134765625, -1.8787841796875, -1.54443359375, -1.2100830078125, -0.875732421875, -0.5413818359375, -0.20703125, 0.1273193359375, 0.461669921875, 0.7960205078125, 1.13037109375, 1.4647216796875, 1.799072265625, 2.1334228515625, 2.4677734375, 2.8021240234375, 3.136474609375, 3.4708251953125, 3.80517578125, 4.1395263671875, 4.473876953125, 4.8082275390625, 5.142578125, 5.4769287109375, 5.811279296875, 6.1456298828125, 6.47998046875, 6.8143310546875, 7.148681640625, 7.4830322265625, 7.8173828125, 8.1517333984375, 8.486083984375, 8.8204345703125, 9.15478515625, 9.4891357421875, 9.823486328125, 10.1578369140625, 10.4921875]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 3.0, 3.0, 4.0, 8.0, 7.0, 11.0, 11.0, 13.0, 9.0, 26.0, 24.0, 27.0, 26.0, 38.0, 55.0, 69.0, 93.0, 234.0, 746.0, 24061.0, 3116189.0, 3052.0, 447.0, 169.0, 83.0, 57.0, 37.0, 45.0, 23.0, 34.0, 19.0, 16.0, 16.0, 14.0, 6.0, 11.0, 5.0, 4.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-47.625, -46.1044921875, -44.583984375, -43.0634765625, -41.54296875, -40.0224609375, -38.501953125, -36.9814453125, -35.4609375, -33.9404296875, -32.419921875, -30.8994140625, -29.37890625, -27.8583984375, -26.337890625, -24.8173828125, -23.296875, -21.7763671875, -20.255859375, -18.7353515625, -17.21484375, -15.6943359375, -14.173828125, -12.6533203125, -11.1328125, -9.6123046875, -8.091796875, -6.5712890625, -5.05078125, -3.5302734375, -2.009765625, -0.4892578125, 1.03125, 2.5517578125, 4.072265625, 5.5927734375, 7.11328125, 8.6337890625, 10.154296875, 11.6748046875, 13.1953125, 14.7158203125, 16.236328125, 17.7568359375, 19.27734375, 20.7978515625, 22.318359375, 23.8388671875, 25.359375, 26.8798828125, 28.400390625, 29.9208984375, 31.44140625, 32.9619140625, 34.482421875, 36.0029296875, 37.5234375, 39.0439453125, 40.564453125, 42.0849609375, 43.60546875, 45.1259765625, 46.646484375, 48.1669921875, 49.6875]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 134.0, 884.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.57590103149414, -21.71120262145996, -14.846504211425781, -7.981805801391602, -1.1171073913574219, 5.747592926025391, 12.612289428710938, 19.476985931396484, 26.341686248779297, 33.206382751464844, 40.071083068847656, 46.93578338623047, 53.800479888916016, 60.66518020629883, 67.52987670898438, 74.39457702636719, 81.25927734375, 88.12397766113281, 94.98867797851562, 101.8533706665039, 108.71807098388672, 115.58277130126953, 122.44746398925781, 129.31216430664062, 136.17686462402344, 143.04156494140625, 149.90626525878906, 156.77096557617188, 163.63565063476562, 170.5003662109375, 177.36505126953125, 184.22975158691406, 191.09445190429688, 197.9591522216797, 204.8238525390625, 211.6885528564453, 218.55325317382812, 225.41793823242188, 232.2826385498047, 239.1473388671875, 246.0120391845703, 252.87673950195312, 259.7414245605469, 266.60614013671875, 273.4708251953125, 280.3355407714844, 287.2002258300781, 294.06494140625, 300.92962646484375, 307.7943115234375, 314.6590270996094, 321.5237121582031, 328.388427734375, 335.25311279296875, 342.1178283691406, 348.9825134277344, 355.84722900390625, 362.7119140625, 369.5766296386719, 376.4413146972656, 383.3060302734375, 390.17071533203125, 397.0354309082031, 403.9001159667969, 410.7648010253906]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 2.0, 2.0, 5.0, 8.0, 11.0, 8.0, 7.0, 16.0, 7.0, 9.0, 28.0, 19.0, 22.0, 24.0, 27.0, 25.0, 38.0, 33.0, 42.0, 47.0, 42.0, 43.0, 54.0, 49.0, 39.0, 37.0, 32.0, 48.0, 35.0, 32.0, 31.0, 23.0, 34.0, 20.0, 20.0, 12.0, 10.0, 14.0, 5.0, 12.0, 11.0, 7.0, 5.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-28.854663848876953, -27.87007713317871, -26.8854923248291, -25.90090560913086, -24.91632080078125, -23.931734085083008, -22.947147369384766, -21.962562561035156, -20.977975845336914, -19.993389129638672, -19.008804321289062, -18.02421760559082, -17.039630889892578, -16.05504608154297, -15.070459365844727, -14.0858736038208, -13.101287841796875, -12.11670207977295, -11.132116317749023, -10.147529602050781, -9.162943840026855, -8.17835807800293, -7.193771839141846, -6.209185600280762, -5.224599838256836, -4.24001407623291, -3.255427837371826, -2.2708418369293213, -1.2862558364868164, -0.3016700744628906, 0.6829161643981934, 1.6675024032592773, 2.652088165283203, 3.636674165725708, 4.621260166168213, 5.605846405029297, 6.590432167053223, 7.575017929077148, 8.55960464477539, 9.544190406799316, 10.528776168823242, 11.513361930847168, 12.497947692871094, 13.482534408569336, 14.467120170593262, 15.451705932617188, 16.43629264831543, 17.420879364013672, 18.40546417236328, 19.390050888061523, 20.374635696411133, 21.359222412109375, 22.343807220458984, 23.328393936157227, 24.31298065185547, 25.297565460205078, 26.28215217590332, 27.266738891601562, 28.251323699951172, 29.235910415649414, 30.220497131347656, 31.205081939697266, 32.189666748046875, 33.17425537109375, 34.15884017944336]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 5.0, 10.0, 9.0, 14.0, 14.0, 17.0, 19.0, 17.0, 32.0, 30.0, 13.0, 28.0, 35.0, 61.0, 36.0, 46.0, 43.0, 45.0, 45.0, 45.0, 30.0, 43.0, 59.0, 37.0, 31.0, 32.0, 33.0, 33.0, 20.0, 24.0, 19.0, 18.0, 19.0, 8.0, 6.0, 7.0, 2.0, 7.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.828125, -3.71685791015625, -3.6055908203125, -3.49432373046875, -3.383056640625, -3.27178955078125, -3.1605224609375, -3.04925537109375, -2.93798828125, -2.82672119140625, -2.7154541015625, -2.60418701171875, -2.492919921875, -2.38165283203125, -2.2703857421875, -2.15911865234375, -2.0478515625, -1.93658447265625, -1.8253173828125, -1.71405029296875, -1.602783203125, -1.49151611328125, -1.3802490234375, -1.26898193359375, -1.15771484375, -1.04644775390625, -0.9351806640625, -0.82391357421875, -0.712646484375, -0.60137939453125, -0.4901123046875, -0.37884521484375, -0.267578125, -0.15631103515625, -0.0450439453125, 0.06622314453125, 0.177490234375, 0.28875732421875, 0.4000244140625, 0.51129150390625, 0.62255859375, 0.73382568359375, 0.8450927734375, 0.95635986328125, 1.067626953125, 1.17889404296875, 1.2901611328125, 1.40142822265625, 1.5126953125, 1.62396240234375, 1.7352294921875, 1.84649658203125, 1.957763671875, 2.06903076171875, 2.1802978515625, 2.29156494140625, 2.40283203125, 2.51409912109375, 2.6253662109375, 2.73663330078125, 2.847900390625, 2.95916748046875, 3.0704345703125, 3.18170166015625, 3.29296875]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 2.0, 2.0, 6.0, 2.0, 9.0, 7.0, 10.0, 10.0, 16.0, 25.0, 33.0, 44.0, 64.0, 91.0, 114.0, 201.0, 296.0, 519.0, 845.0, 1539.0, 3283.0, 6847.0, 18271.0, 74757.0, 1247968.0, 2663385.0, 133226.0, 25450.0, 8815.0, 3976.0, 1859.0, 1038.0, 538.0, 324.0, 205.0, 136.0, 100.0, 83.0, 53.0, 40.0, 20.0, 22.0, 13.0, 10.0, 13.0, 5.0, 6.0, 6.0, 6.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.78125, -15.23974609375, -14.6982421875, -14.15673828125, -13.615234375, -13.07373046875, -12.5322265625, -11.99072265625, -11.44921875, -10.90771484375, -10.3662109375, -9.82470703125, -9.283203125, -8.74169921875, -8.2001953125, -7.65869140625, -7.1171875, -6.57568359375, -6.0341796875, -5.49267578125, -4.951171875, -4.40966796875, -3.8681640625, -3.32666015625, -2.78515625, -2.24365234375, -1.7021484375, -1.16064453125, -0.619140625, -0.07763671875, 0.4638671875, 1.00537109375, 1.546875, 2.08837890625, 2.6298828125, 3.17138671875, 3.712890625, 4.25439453125, 4.7958984375, 5.33740234375, 5.87890625, 6.42041015625, 6.9619140625, 7.50341796875, 8.044921875, 8.58642578125, 9.1279296875, 9.66943359375, 10.2109375, 10.75244140625, 11.2939453125, 11.83544921875, 12.376953125, 12.91845703125, 13.4599609375, 14.00146484375, 14.54296875, 15.08447265625, 15.6259765625, 16.16748046875, 16.708984375, 17.25048828125, 17.7919921875, 18.33349609375, 18.875]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 6.0, 11.0, 13.0, 19.0, 34.0, 50.0, 66.0, 91.0, 146.0, 218.0, 342.0, 513.0, 686.0, 622.0, 405.0, 277.0, 183.0, 121.0, 82.0, 56.0, 45.0, 30.0, 22.0, 12.0, 6.0, 4.0, 5.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.8828125, -13.3209228515625, -12.759033203125, -12.1971435546875, -11.63525390625, -11.0733642578125, -10.511474609375, -9.9495849609375, -9.3876953125, -8.8258056640625, -8.263916015625, -7.7020263671875, -7.14013671875, -6.5782470703125, -6.016357421875, -5.4544677734375, -4.892578125, -4.3306884765625, -3.768798828125, -3.2069091796875, -2.64501953125, -2.0831298828125, -1.521240234375, -0.9593505859375, -0.3974609375, 0.1644287109375, 0.726318359375, 1.2882080078125, 1.85009765625, 2.4119873046875, 2.973876953125, 3.5357666015625, 4.09765625, 4.6595458984375, 5.221435546875, 5.7833251953125, 6.34521484375, 6.9071044921875, 7.468994140625, 8.0308837890625, 8.5927734375, 9.1546630859375, 9.716552734375, 10.2784423828125, 10.84033203125, 11.4022216796875, 11.964111328125, 12.5260009765625, 13.087890625, 13.6497802734375, 14.211669921875, 14.7735595703125, 15.33544921875, 15.8973388671875, 16.459228515625, 17.0211181640625, 17.5830078125, 18.1448974609375, 18.706787109375, 19.2686767578125, 19.83056640625, 20.3924560546875, 20.954345703125, 21.5162353515625, 22.078125]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 5.0, 6.0, 14.0, 14.0, 22.0, 34.0, 54.0, 91.0, 127.0, 219.0, 459.0, 2227.0, 4037848.0, 151558.0, 894.0, 286.0, 160.0, 101.0, 55.0, 38.0, 27.0, 15.0, 15.0, 7.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-119.0, -116.0107421875, -113.021484375, -110.0322265625, -107.04296875, -104.0537109375, -101.064453125, -98.0751953125, -95.0859375, -92.0966796875, -89.107421875, -86.1181640625, -83.12890625, -80.1396484375, -77.150390625, -74.1611328125, -71.171875, -68.1826171875, -65.193359375, -62.2041015625, -59.21484375, -56.2255859375, -53.236328125, -50.2470703125, -47.2578125, -44.2685546875, -41.279296875, -38.2900390625, -35.30078125, -32.3115234375, -29.322265625, -26.3330078125, -23.34375, -20.3544921875, -17.365234375, -14.3759765625, -11.38671875, -8.3974609375, -5.408203125, -2.4189453125, 0.5703125, 3.5595703125, 6.548828125, 9.5380859375, 12.52734375, 15.5166015625, 18.505859375, 21.4951171875, 24.484375, 27.4736328125, 30.462890625, 33.4521484375, 36.44140625, 39.4306640625, 42.419921875, 45.4091796875, 48.3984375, 51.3876953125, 54.376953125, 57.3662109375, 60.35546875, 63.3447265625, 66.333984375, 69.3232421875, 72.3125]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 14.0, 43.0, 154.0, 270.0, 324.0, 139.0, 56.0, 9.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-125.48699188232422, -122.87354278564453, -120.26010131835938, -117.64665222167969, -115.033203125, -112.41975402832031, -109.80631256103516, -107.19286346435547, -104.57942199707031, -101.96597290039062, -99.35253143310547, -96.73908233642578, -94.1256332397461, -91.51219177246094, -88.89874267578125, -86.28529357910156, -83.67184448242188, -81.05839538574219, -78.44495391845703, -75.83150482177734, -73.21805572509766, -70.6046142578125, -67.99116516113281, -65.37771606445312, -62.7642707824707, -60.15082550048828, -57.537376403808594, -54.92393112182617, -52.31048583984375, -49.69703674316406, -47.08359146118164, -44.47014617919922, -41.8567008972168, -39.243255615234375, -36.62980651855469, -34.016361236572266, -31.40291404724121, -28.789466857910156, -26.176021575927734, -23.56257438659668, -20.949127197265625, -18.33568000793457, -15.722233772277832, -13.108787536621094, -10.495340347290039, -7.881893157958984, -5.268446922302246, -2.655000686645508, -0.041553497314453125, 2.5718932151794434, 5.18533992767334, 7.798786640167236, 10.412233352661133, 13.025680541992188, 15.639126777648926, 18.252573013305664, 20.86602020263672, 23.479467391967773, 26.092914581298828, 28.70635986328125, 31.319807052612305, 33.93325424194336, 36.54669952392578, 39.16014862060547, 41.77359390258789]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 1.0, 3.0, 5.0, 7.0, 2.0, 6.0, 7.0, 6.0, 7.0, 10.0, 9.0, 15.0, 12.0, 13.0, 16.0, 22.0, 21.0, 27.0, 23.0, 24.0, 40.0, 33.0, 38.0, 30.0, 40.0, 39.0, 48.0, 46.0, 41.0, 49.0, 36.0, 30.0, 37.0, 29.0, 25.0, 21.0, 24.0, 26.0, 19.0, 20.0, 13.0, 11.0, 15.0, 15.0, 9.0, 7.0, 7.0, 9.0, 5.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-40.972190856933594, -39.57497787475586, -38.177764892578125, -36.78055191040039, -35.383338928222656, -33.986122131347656, -32.58891296386719, -31.191696166992188, -29.794483184814453, -28.39727020263672, -27.000057220458984, -25.60284423828125, -24.205629348754883, -22.80841636657715, -21.411203384399414, -20.013988494873047, -18.616777420043945, -17.21956443786621, -15.82235050201416, -14.425137519836426, -13.027923583984375, -11.63071060180664, -10.233497619628906, -8.836283683776855, -7.439070701599121, -6.0418572425842285, -4.644643783569336, -3.2474308013916016, -1.850217342376709, -0.4530038833618164, 0.944209098815918, 2.3414230346679688, 3.738636016845703, 5.135849475860596, 6.533062934875488, 7.930275917053223, 9.327489852905273, 10.724702835083008, 12.121915817260742, 13.519129753112793, 14.916342735290527, 16.313556671142578, 17.710769653320312, 19.107982635498047, 20.50519561767578, 21.902408599853516, 23.29962158203125, 24.696836471557617, 26.09404945373535, 27.491262435913086, 28.88847541809082, 30.285690307617188, 31.682903289794922, 33.080116271972656, 34.47732925415039, 35.874542236328125, 37.27175521850586, 38.668968200683594, 40.06618118286133, 41.46339416503906, 42.8606071472168, 44.25782012939453, 45.65503692626953, 47.052249908447266, 48.449462890625]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 4.0, 2.0, 7.0, 6.0, 8.0, 10.0, 10.0, 15.0, 8.0, 20.0, 23.0, 24.0, 17.0, 20.0, 26.0, 32.0, 41.0, 31.0, 41.0, 39.0, 41.0, 48.0, 44.0, 49.0, 42.0, 41.0, 48.0, 36.0, 28.0, 32.0, 30.0, 28.0, 26.0, 22.0, 20.0, 25.0, 13.0, 12.0, 9.0, 8.0, 5.0, 3.0, 4.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.49609375, -3.388092041015625, -3.28009033203125, -3.172088623046875, -3.0640869140625, -2.956085205078125, -2.84808349609375, -2.740081787109375, -2.632080078125, -2.524078369140625, -2.41607666015625, -2.308074951171875, -2.2000732421875, -2.092071533203125, -1.98406982421875, -1.876068115234375, -1.76806640625, -1.660064697265625, -1.55206298828125, -1.444061279296875, -1.3360595703125, -1.228057861328125, -1.12005615234375, -1.012054443359375, -0.904052734375, -0.796051025390625, -0.68804931640625, -0.580047607421875, -0.4720458984375, -0.364044189453125, -0.25604248046875, -0.148040771484375, -0.0400390625, 0.067962646484375, 0.17596435546875, 0.283966064453125, 0.3919677734375, 0.499969482421875, 0.60797119140625, 0.715972900390625, 0.823974609375, 0.931976318359375, 1.03997802734375, 1.147979736328125, 1.2559814453125, 1.363983154296875, 1.47198486328125, 1.579986572265625, 1.68798828125, 1.795989990234375, 1.90399169921875, 2.011993408203125, 2.1199951171875, 2.227996826171875, 2.33599853515625, 2.444000244140625, 2.552001953125, 2.660003662109375, 2.76800537109375, 2.876007080078125, 2.9840087890625, 3.092010498046875, 3.20001220703125, 3.308013916015625, 3.416015625]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 5.0, 0.0, 7.0, 10.0, 7.0, 16.0, 27.0, 38.0, 49.0, 82.0, 115.0, 137.0, 234.0, 340.0, 540.0, 811.0, 1216.0, 1840.0, 2901.0, 4486.0, 7440.0, 12522.0, 21665.0, 39086.0, 74661.0, 146630.0, 248752.0, 221178.0, 120993.0, 62254.0, 33006.0, 18734.0, 10759.0, 6550.0, 4019.0, 2606.0, 1658.0, 1102.0, 666.0, 452.0, 320.0, 201.0, 165.0, 90.0, 63.0, 40.0, 33.0, 22.0, 15.0, 8.0, 5.0, 5.0, 4.0, 2.0, 0.0, 2.0], "bins": [-0.423828125, -0.4116706848144531, -0.39951324462890625, -0.3873558044433594, -0.3751983642578125, -0.3630409240722656, -0.35088348388671875, -0.3387260437011719, -0.326568603515625, -0.3144111633300781, -0.30225372314453125, -0.2900962829589844, -0.2779388427734375, -0.2657814025878906, -0.25362396240234375, -0.24146652221679688, -0.22930908203125, -0.21715164184570312, -0.20499420166015625, -0.19283676147460938, -0.1806793212890625, -0.16852188110351562, -0.15636444091796875, -0.14420700073242188, -0.132049560546875, -0.11989212036132812, -0.10773468017578125, -0.09557723999023438, -0.0834197998046875, -0.07126235961914062, -0.05910491943359375, -0.046947479248046875, -0.0347900390625, -0.022632598876953125, -0.01047515869140625, 0.001682281494140625, 0.0138397216796875, 0.025997161865234375, 0.03815460205078125, 0.050312042236328125, 0.062469482421875, 0.07462692260742188, 0.08678436279296875, 0.09894180297851562, 0.1110992431640625, 0.12325668334960938, 0.13541412353515625, 0.14757156372070312, 0.15972900390625, 0.17188644409179688, 0.18404388427734375, 0.19620132446289062, 0.2083587646484375, 0.22051620483398438, 0.23267364501953125, 0.24483108520507812, 0.256988525390625, 0.2691459655761719, 0.28130340576171875, 0.2934608459472656, 0.3056182861328125, 0.3177757263183594, 0.32993316650390625, 0.3420906066894531, 0.354248046875]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 5.0, 11.0, 7.0, 3.0, 9.0, 7.0, 13.0, 17.0, 15.0, 14.0, 21.0, 16.0, 25.0, 28.0, 30.0, 33.0, 35.0, 33.0, 32.0, 53.0, 41.0, 1074.0, 58.0, 41.0, 46.0, 41.0, 37.0, 41.0, 26.0, 31.0, 31.0, 38.0, 14.0, 18.0, 17.0, 17.0, 10.0, 7.0, 7.0, 7.0, 5.0, 5.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.158203125, -2.089691162109375, -2.02117919921875, -1.952667236328125, -1.8841552734375, -1.815643310546875, -1.74713134765625, -1.678619384765625, -1.610107421875, -1.541595458984375, -1.47308349609375, -1.404571533203125, -1.3360595703125, -1.267547607421875, -1.19903564453125, -1.130523681640625, -1.06201171875, -0.993499755859375, -0.92498779296875, -0.856475830078125, -0.7879638671875, -0.719451904296875, -0.65093994140625, -0.582427978515625, -0.513916015625, -0.445404052734375, -0.37689208984375, -0.308380126953125, -0.2398681640625, -0.171356201171875, -0.10284423828125, -0.034332275390625, 0.0341796875, 0.102691650390625, 0.17120361328125, 0.239715576171875, 0.3082275390625, 0.376739501953125, 0.44525146484375, 0.513763427734375, 0.582275390625, 0.650787353515625, 0.71929931640625, 0.787811279296875, 0.8563232421875, 0.924835205078125, 0.99334716796875, 1.061859130859375, 1.13037109375, 1.198883056640625, 1.26739501953125, 1.335906982421875, 1.4044189453125, 1.472930908203125, 1.54144287109375, 1.609954833984375, 1.678466796875, 1.746978759765625, 1.81549072265625, 1.884002685546875, 1.9525146484375, 2.021026611328125, 2.08953857421875, 2.158050537109375, 2.2265625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 6.0, 4.0, 2.0, 5.0, 8.0, 12.0, 19.0, 28.0, 42.0, 72.0, 115.0, 148.0, 208.0, 310.0, 467.0, 709.0, 1067.0, 1607.0, 2324.0, 3433.0, 5420.0, 8337.0, 12935.0, 20349.0, 32523.0, 52896.0, 85190.0, 135111.0, 1233073.0, 175344.0, 122155.0, 76493.0, 46919.0, 28637.0, 17862.0, 11591.0, 7406.0, 4840.0, 3223.0, 2035.0, 1407.0, 927.0, 633.0, 413.0, 275.0, 191.0, 129.0, 75.0, 52.0, 43.0, 28.0, 13.0, 13.0, 8.0, 8.0, 5.0, 0.0, 2.0, 1.0], "bins": [-0.292236328125, -0.2836112976074219, -0.27498626708984375, -0.2663612365722656, -0.2577362060546875, -0.24911117553710938, -0.24048614501953125, -0.23186111450195312, -0.223236083984375, -0.21461105346679688, -0.20598602294921875, -0.19736099243164062, -0.1887359619140625, -0.18011093139648438, -0.17148590087890625, -0.16286087036132812, -0.15423583984375, -0.14561080932617188, -0.13698577880859375, -0.12836074829101562, -0.1197357177734375, -0.11111068725585938, -0.10248565673828125, -0.09386062622070312, -0.085235595703125, -0.07661056518554688, -0.06798553466796875, -0.059360504150390625, -0.0507354736328125, -0.042110443115234375, -0.03348541259765625, -0.024860382080078125, -0.0162353515625, -0.007610321044921875, 0.00101470947265625, 0.009639739990234375, 0.0182647705078125, 0.026889801025390625, 0.03551483154296875, 0.044139862060546875, 0.052764892578125, 0.061389923095703125, 0.07001495361328125, 0.07863998413085938, 0.0872650146484375, 0.09589004516601562, 0.10451507568359375, 0.11314010620117188, 0.12176513671875, 0.13039016723632812, 0.13901519775390625, 0.14764022827148438, 0.1562652587890625, 0.16489028930664062, 0.17351531982421875, 0.18214035034179688, 0.190765380859375, 0.19939041137695312, 0.20801544189453125, 0.21664047241210938, 0.2252655029296875, 0.23389053344726562, 0.24251556396484375, 0.2511405944824219, 0.259765625]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 5.0, 4.0, 2.0, 1.0, 6.0, 7.0, 12.0, 15.0, 19.0, 6.0, 11.0, 12.0, 14.0, 23.0, 28.0, 26.0, 37.0, 39.0, 37.0, 42.0, 40.0, 33.0, 44.0, 39.0, 41.0, 42.0, 43.0, 39.0, 45.0, 28.0, 33.0, 32.0, 39.0, 29.0, 25.0, 19.0, 21.0, 17.0, 11.0, 8.0, 11.0, 7.0, 8.0, 3.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003657341003417969, -0.00035266950726509094, -0.000339604914188385, -0.0003265403211116791, -0.00031347572803497314, -0.0003004111349582672, -0.0002873465418815613, -0.00027428194880485535, -0.0002612173557281494, -0.0002481527626514435, -0.00023508816957473755, -0.00022202357649803162, -0.00020895898342132568, -0.00019589439034461975, -0.00018282979726791382, -0.00016976520419120789, -0.00015670061111450195, -0.00014363601803779602, -0.0001305714249610901, -0.00011750683188438416, -0.00010444223880767822, -9.137764573097229e-05, -7.831305265426636e-05, -6.524845957756042e-05, -5.218386650085449e-05, -3.911927342414856e-05, -2.6054680347442627e-05, -1.2990087270736694e-05, 7.450580596923828e-08, 1.3139098882675171e-05, 2.6203691959381104e-05, 3.9268285036087036e-05, 5.233287811279297e-05, 6.53974711894989e-05, 7.846206426620483e-05, 9.152665734291077e-05, 0.0001045912504196167, 0.00011765584349632263, 0.00013072043657302856, 0.0001437850296497345, 0.00015684962272644043, 0.00016991421580314636, 0.0001829788088798523, 0.00019604340195655823, 0.00020910799503326416, 0.0002221725881099701, 0.00023523718118667603, 0.00024830177426338196, 0.0002613663673400879, 0.0002744309604167938, 0.00028749555349349976, 0.0003005601465702057, 0.0003136247396469116, 0.00032668933272361755, 0.0003397539258003235, 0.0003528185188770294, 0.00036588311195373535, 0.0003789477050304413, 0.0003920122981071472, 0.00040507689118385315, 0.0004181414842605591, 0.000431206077337265, 0.00044427067041397095, 0.0004573352634906769, 0.0004703998565673828]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 7.0, 5.0, 4.0, 5.0, 4.0, 13.0, 9.0, 9.0, 19.0, 20.0, 39.0, 46.0, 58.0, 54.0, 100.0, 104.0, 129.0, 179.0, 255.0, 456.0, 949.0, 92393.0, 950393.0, 1529.0, 602.0, 251.0, 184.0, 153.0, 122.0, 99.0, 87.0, 81.0, 36.0, 38.0, 24.0, 17.0, 11.0, 16.0, 10.0, 9.0, 10.0, 12.0, 6.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0090179443359375, -0.008728742599487305, -0.00843954086303711, -0.008150339126586914, -0.007861137390136719, -0.0075719356536865234, -0.007282733917236328, -0.006993532180786133, -0.0067043304443359375, -0.006415128707885742, -0.006125926971435547, -0.0058367252349853516, -0.005547523498535156, -0.005258321762084961, -0.004969120025634766, -0.00467991828918457, -0.004390716552734375, -0.00410151481628418, -0.0038123130798339844, -0.003523111343383789, -0.0032339096069335938, -0.0029447078704833984, -0.002655506134033203, -0.002366304397583008, -0.0020771026611328125, -0.0017879009246826172, -0.0014986991882324219, -0.0012094974517822266, -0.0009202957153320312, -0.0006310939788818359, -0.0003418922424316406, -5.269050598144531e-05, 0.00023651123046875, 0.0005257129669189453, 0.0008149147033691406, 0.001104116439819336, 0.0013933181762695312, 0.0016825199127197266, 0.001971721649169922, 0.002260923385620117, 0.0025501251220703125, 0.002839326858520508, 0.003128528594970703, 0.0034177303314208984, 0.0037069320678710938, 0.003996133804321289, 0.004285335540771484, 0.00457453727722168, 0.004863739013671875, 0.00515294075012207, 0.005442142486572266, 0.005731344223022461, 0.006020545959472656, 0.0063097476959228516, 0.006598949432373047, 0.006888151168823242, 0.0071773529052734375, 0.007466554641723633, 0.007755756378173828, 0.008044958114624023, 0.008334159851074219, 0.008623361587524414, 0.00891256332397461, 0.009201765060424805, 0.009490966796875]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 7.0, 127.0, 662.0, 216.0, 4.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00026136671658605337, -0.00021434942027553916, -0.00016733213851694018, -0.00012031485675834119, -7.329756044782698e-05, -2.628026413731277e-05, 2.0737003069370985e-05, 6.77542993798852e-05, 0.00011477159569039941, 0.00016178889200091362, 0.0002088061737595126, 0.0002558234555181116, 0.0003028407518286258, 0.00034985804813914, 0.00039687531534582376, 0.000443892611656338, 0.0004909099079668522, 0.0005379272042773664, 0.0005849445005878806, 0.0006319617386907339, 0.000678979093208909, 0.0007259963313117623, 0.0007730136276222765, 0.0008200309239327908, 0.000867048220243305, 0.0009140655165538192, 0.0009610828128643334, 0.0010081001091748476, 0.001055117347277701, 0.001102134701795876, 0.0011491519398987293, 0.0011961692944169044, 0.001243186416104436, 0.0012902036542072892, 0.0013372210087254643, 0.0013842382468283176, 0.0014312556013464928, 0.001478272839449346, 0.0015252900775521994, 0.0015723074320703745, 0.0016193247865885496, 0.001666342024691403, 0.001713359379209578, 0.0017603766173124313, 0.0018073939718306065, 0.0018544112099334598, 0.001901428448036313, 0.0019484458025544882, 0.0019954629242420197, 0.0020424802787601948, 0.0020894974004477262, 0.0021365147549659014, 0.0021835321094840765, 0.0022305494640022516, 0.002277566585689783, 0.0023245839402079582, 0.0023716012947261333, 0.0024186186492443085, 0.00246563577093184, 0.002512653125450015, 0.00255967047996819, 0.0026066878344863653, 0.002653704956173897, 0.002700722310692072, 0.002747739665210247]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 1.0, 7.0, 6.0, 5.0, 7.0, 6.0, 14.0, 14.0, 24.0, 17.0, 23.0, 29.0, 22.0, 23.0, 25.0, 39.0, 39.0, 32.0, 32.0, 28.0, 46.0, 41.0, 43.0, 45.0, 46.0, 44.0, 37.0, 35.0, 29.0, 37.0, 31.0, 30.0, 26.0, 25.0, 19.0, 12.0, 20.0, 8.0, 7.0, 9.0, 7.0, 1.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.00026220083236694336, -0.00025414954870939255, -0.00024609826505184174, -0.00023804698139429092, -0.0002299956977367401, -0.0002219444140791893, -0.0002138931304216385, -0.00020584184676408768, -0.00019779056310653687, -0.00018973927944898605, -0.00018168799579143524, -0.00017363671213388443, -0.00016558542847633362, -0.0001575341448187828, -0.000149482861161232, -0.00014143157750368118, -0.00013338029384613037, -0.00012532901018857956, -0.00011727772653102875, -0.00010922644287347794, -0.00010117515921592712, -9.312387555837631e-05, -8.50725919008255e-05, -7.702130824327469e-05, -6.897002458572388e-05, -6.0918740928173065e-05, -5.2867457270622253e-05, -4.481617361307144e-05, -3.676488995552063e-05, -2.8713606297969818e-05, -2.0662322640419006e-05, -1.2611038982868195e-05, -4.559755325317383e-06, 3.491528332233429e-06, 1.154281198978424e-05, 1.9594095647335052e-05, 2.7645379304885864e-05, 3.5696662962436676e-05, 4.374794661998749e-05, 5.17992302775383e-05, 5.985051393508911e-05, 6.790179759263992e-05, 7.595308125019073e-05, 8.400436490774155e-05, 9.205564856529236e-05, 0.00010010693222284317, 0.00010815821588039398, 0.0001162094995379448, 0.0001242607831954956, 0.00013231206685304642, 0.00014036335051059723, 0.00014841463416814804, 0.00015646591782569885, 0.00016451720148324966, 0.00017256848514080048, 0.0001806197687983513, 0.0001886710524559021, 0.0001967223361134529, 0.00020477361977100372, 0.00021282490342855453, 0.00022087618708610535, 0.00022892747074365616, 0.00023697875440120697, 0.0002450300380587578, 0.0002530813217163086]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 4.0, 2.0, 7.0, 6.0, 8.0, 10.0, 10.0, 15.0, 8.0, 20.0, 23.0, 24.0, 17.0, 20.0, 26.0, 32.0, 41.0, 31.0, 41.0, 39.0, 41.0, 48.0, 44.0, 49.0, 42.0, 41.0, 48.0, 36.0, 28.0, 32.0, 30.0, 28.0, 26.0, 22.0, 20.0, 25.0, 13.0, 12.0, 9.0, 8.0, 5.0, 3.0, 4.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.49609375, -3.388092041015625, -3.28009033203125, -3.172088623046875, -3.0640869140625, -2.956085205078125, -2.84808349609375, -2.740081787109375, -2.632080078125, -2.524078369140625, -2.41607666015625, -2.308074951171875, -2.2000732421875, -2.092071533203125, -1.98406982421875, -1.876068115234375, -1.76806640625, -1.660064697265625, -1.55206298828125, -1.444061279296875, -1.3360595703125, -1.228057861328125, -1.12005615234375, -1.012054443359375, -0.904052734375, -0.796051025390625, -0.68804931640625, -0.580047607421875, -0.4720458984375, -0.364044189453125, -0.25604248046875, -0.148040771484375, -0.0400390625, 0.067962646484375, 0.17596435546875, 0.283966064453125, 0.3919677734375, 0.499969482421875, 0.60797119140625, 0.715972900390625, 0.823974609375, 0.931976318359375, 1.03997802734375, 1.147979736328125, 1.2559814453125, 1.363983154296875, 1.47198486328125, 1.579986572265625, 1.68798828125, 1.795989990234375, 1.90399169921875, 2.011993408203125, 2.1199951171875, 2.227996826171875, 2.33599853515625, 2.444000244140625, 2.552001953125, 2.660003662109375, 2.76800537109375, 2.876007080078125, 2.9840087890625, 3.092010498046875, 3.20001220703125, 3.308013916015625, 3.416015625]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 5.0, 1.0, 3.0, 7.0, 4.0, 4.0, 10.0, 16.0, 15.0, 24.0, 25.0, 40.0, 40.0, 69.0, 89.0, 145.0, 193.0, 243.0, 417.0, 588.0, 1060.0, 1917.0, 4013.0, 9350.0, 24606.0, 74632.0, 260686.0, 447155.0, 148856.0, 44999.0, 15885.0, 6495.0, 2981.0, 1547.0, 814.0, 514.0, 331.0, 230.0, 150.0, 106.0, 78.0, 61.0, 57.0, 21.0, 19.0, 18.0, 16.0, 13.0, 5.0, 2.0, 4.0, 3.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.3515625, -3.24774169921875, -3.1439208984375, -3.04010009765625, -2.936279296875, -2.83245849609375, -2.7286376953125, -2.62481689453125, -2.52099609375, -2.41717529296875, -2.3133544921875, -2.20953369140625, -2.105712890625, -2.00189208984375, -1.8980712890625, -1.79425048828125, -1.6904296875, -1.58660888671875, -1.4827880859375, -1.37896728515625, -1.275146484375, -1.17132568359375, -1.0675048828125, -0.96368408203125, -0.85986328125, -0.75604248046875, -0.6522216796875, -0.54840087890625, -0.444580078125, -0.34075927734375, -0.2369384765625, -0.13311767578125, -0.029296875, 0.07452392578125, 0.1783447265625, 0.28216552734375, 0.385986328125, 0.48980712890625, 0.5936279296875, 0.69744873046875, 0.80126953125, 0.90509033203125, 1.0089111328125, 1.11273193359375, 1.216552734375, 1.32037353515625, 1.4241943359375, 1.52801513671875, 1.6318359375, 1.73565673828125, 1.8394775390625, 1.94329833984375, 2.047119140625, 2.15093994140625, 2.2547607421875, 2.35858154296875, 2.46240234375, 2.56622314453125, 2.6700439453125, 2.77386474609375, 2.877685546875, 2.98150634765625, 3.0853271484375, 3.18914794921875, 3.29296875]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 6.0, 4.0, 4.0, 7.0, 13.0, 9.0, 11.0, 11.0, 16.0, 21.0, 21.0, 24.0, 28.0, 30.0, 30.0, 42.0, 43.0, 50.0, 60.0, 76.0, 237.0, 1688.0, 118.0, 66.0, 65.0, 46.0, 36.0, 40.0, 53.0, 21.0, 26.0, 29.0, 24.0, 19.0, 15.0, 12.0, 14.0, 7.0, 4.0, 4.0, 2.0, 7.0, 5.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.390625, -10.023681640625, -9.65673828125, -9.289794921875, -8.9228515625, -8.555908203125, -8.18896484375, -7.822021484375, -7.455078125, -7.088134765625, -6.72119140625, -6.354248046875, -5.9873046875, -5.620361328125, -5.25341796875, -4.886474609375, -4.51953125, -4.152587890625, -3.78564453125, -3.418701171875, -3.0517578125, -2.684814453125, -2.31787109375, -1.950927734375, -1.583984375, -1.217041015625, -0.85009765625, -0.483154296875, -0.1162109375, 0.250732421875, 0.61767578125, 0.984619140625, 1.3515625, 1.718505859375, 2.08544921875, 2.452392578125, 2.8193359375, 3.186279296875, 3.55322265625, 3.920166015625, 4.287109375, 4.654052734375, 5.02099609375, 5.387939453125, 5.7548828125, 6.121826171875, 6.48876953125, 6.855712890625, 7.22265625, 7.589599609375, 7.95654296875, 8.323486328125, 8.6904296875, 9.057373046875, 9.42431640625, 9.791259765625, 10.158203125, 10.525146484375, 10.89208984375, 11.259033203125, 11.6259765625, 11.992919921875, 12.35986328125, 12.726806640625, 13.09375]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 7.0, 3.0, 4.0, 4.0, 6.0, 8.0, 13.0, 15.0, 16.0, 22.0, 28.0, 37.0, 37.0, 55.0, 65.0, 94.0, 141.0, 318.0, 823.0, 3395.0, 78479.0, 3045815.0, 13373.0, 1718.0, 535.0, 235.0, 105.0, 78.0, 53.0, 43.0, 25.0, 26.0, 23.0, 17.0, 19.0, 11.0, 13.0, 5.0, 11.0, 10.0, 6.0, 3.0, 6.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-29.796875, -28.95263671875, -28.1083984375, -27.26416015625, -26.419921875, -25.57568359375, -24.7314453125, -23.88720703125, -23.04296875, -22.19873046875, -21.3544921875, -20.51025390625, -19.666015625, -18.82177734375, -17.9775390625, -17.13330078125, -16.2890625, -15.44482421875, -14.6005859375, -13.75634765625, -12.912109375, -12.06787109375, -11.2236328125, -10.37939453125, -9.53515625, -8.69091796875, -7.8466796875, -7.00244140625, -6.158203125, -5.31396484375, -4.4697265625, -3.62548828125, -2.78125, -1.93701171875, -1.0927734375, -0.24853515625, 0.595703125, 1.43994140625, 2.2841796875, 3.12841796875, 3.97265625, 4.81689453125, 5.6611328125, 6.50537109375, 7.349609375, 8.19384765625, 9.0380859375, 9.88232421875, 10.7265625, 11.57080078125, 12.4150390625, 13.25927734375, 14.103515625, 14.94775390625, 15.7919921875, 16.63623046875, 17.48046875, 18.32470703125, 19.1689453125, 20.01318359375, 20.857421875, 21.70166015625, 22.5458984375, 23.39013671875, 24.234375]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 19.0, 54.0, 159.0, 301.0, 265.0, 131.0, 53.0, 21.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.19638729095459, -10.334346771240234, -9.472307205200195, -8.610267639160156, -7.748227119445801, -6.8861870765686035, -6.024147033691406, -5.162106990814209, -4.300066947937012, -3.4380269050598145, -2.575986862182617, -1.71394681930542, -0.8519067764282227, 0.01013326644897461, 0.8721733093261719, 1.7342133522033691, 2.5962533950805664, 3.4582934379577637, 4.320333480834961, 5.182373523712158, 6.0444135665893555, 6.906453609466553, 7.76849365234375, 8.630533218383789, 9.492573738098145, 10.3546142578125, 11.216653823852539, 12.078693389892578, 12.940733909606934, 13.802774429321289, 14.664813995361328, 15.526853561401367, 16.388893127441406, 17.250932693481445, 18.112972259521484, 18.975013732910156, 19.837053298950195, 20.699092864990234, 21.561134338378906, 22.423173904418945, 23.285213470458984, 24.147253036499023, 25.009292602539062, 25.871334075927734, 26.733373641967773, 27.595413208007812, 28.457454681396484, 29.319494247436523, 30.181533813476562, 31.0435733795166, 31.90561294555664, 32.76765441894531, 33.62969207763672, 34.49173355102539, 35.35377502441406, 36.21581268310547, 37.07785415649414, 37.93989562988281, 38.80193328857422, 39.66397476196289, 40.52601623535156, 41.38805389404297, 42.25009536743164, 43.11213302612305, 43.97417449951172]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 4.0, 7.0, 7.0, 11.0, 9.0, 6.0, 24.0, 24.0, 21.0, 29.0, 28.0, 37.0, 30.0, 38.0, 41.0, 52.0, 44.0, 58.0, 46.0, 52.0, 45.0, 44.0, 32.0, 39.0, 28.0, 29.0, 24.0, 25.0, 30.0, 23.0, 21.0, 11.0, 15.0, 18.0, 11.0, 11.0, 4.0, 8.0, 3.0, 3.0, 3.0, 7.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-44.0554084777832, -42.83355712890625, -41.61170959472656, -40.38985824584961, -39.168006896972656, -37.94615936279297, -36.724308013916016, -35.50245666503906, -34.280609130859375, -33.05875778198242, -31.8369083404541, -30.61505889892578, -29.393207550048828, -28.171358108520508, -26.949508666992188, -25.727657318115234, -24.50580596923828, -23.28395652770996, -22.062105178833008, -20.840255737304688, -19.618404388427734, -18.396554946899414, -17.174705505371094, -15.952855110168457, -14.73100471496582, -13.509154319763184, -12.287303924560547, -11.065454483032227, -9.84360408782959, -8.621753692626953, -7.399903774261475, -6.178053855895996, -4.956207275390625, -3.7343571186065674, -2.5125069618225098, -1.2906568050384521, -0.06880664825439453, 1.1530437469482422, 2.3748936653137207, 3.596743583679199, 4.818593978881836, 6.040444374084473, 7.262294292449951, 8.48414421081543, 9.705994606018066, 10.927845001220703, 12.149694442749023, 13.37154483795166, 14.593395233154297, 15.815245628356934, 17.03709602355957, 18.25894546508789, 19.480796813964844, 20.702646255493164, 21.924495697021484, 23.146347045898438, 24.368196487426758, 25.590045928955078, 26.81189727783203, 28.03374671936035, 29.255596160888672, 30.477447509765625, 31.699296951293945, 32.921146392822266, 34.14299774169922]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 5.0, 3.0, 6.0, 10.0, 10.0, 9.0, 13.0, 11.0, 20.0, 17.0, 22.0, 23.0, 24.0, 20.0, 22.0, 44.0, 41.0, 42.0, 38.0, 41.0, 39.0, 46.0, 51.0, 42.0, 38.0, 43.0, 39.0, 37.0, 36.0, 32.0, 25.0, 22.0, 21.0, 22.0, 20.0, 15.0, 15.0, 10.0, 8.0, 4.0, 5.0, 4.0, 4.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.7265625, -3.61553955078125, -3.5045166015625, -3.39349365234375, -3.282470703125, -3.17144775390625, -3.0604248046875, -2.94940185546875, -2.83837890625, -2.72735595703125, -2.6163330078125, -2.50531005859375, -2.394287109375, -2.28326416015625, -2.1722412109375, -2.06121826171875, -1.9501953125, -1.83917236328125, -1.7281494140625, -1.61712646484375, -1.506103515625, -1.39508056640625, -1.2840576171875, -1.17303466796875, -1.06201171875, -0.95098876953125, -0.8399658203125, -0.72894287109375, -0.617919921875, -0.50689697265625, -0.3958740234375, -0.28485107421875, -0.173828125, -0.06280517578125, 0.0482177734375, 0.15924072265625, 0.270263671875, 0.38128662109375, 0.4923095703125, 0.60333251953125, 0.71435546875, 0.82537841796875, 0.9364013671875, 1.04742431640625, 1.158447265625, 1.26947021484375, 1.3804931640625, 1.49151611328125, 1.6025390625, 1.71356201171875, 1.8245849609375, 1.93560791015625, 2.046630859375, 2.15765380859375, 2.2686767578125, 2.37969970703125, 2.49072265625, 2.60174560546875, 2.7127685546875, 2.82379150390625, 2.934814453125, 3.04583740234375, 3.1568603515625, 3.26788330078125, 3.37890625]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 7.0, 5.0, 8.0, 4.0, 6.0, 13.0, 15.0, 23.0, 25.0, 27.0, 31.0, 57.0, 72.0, 101.0, 185.0, 278.0, 665.0, 2425.0, 16219.0, 221239.0, 3094830.0, 811660.0, 39460.0, 4801.0, 1032.0, 418.0, 222.0, 111.0, 83.0, 64.0, 54.0, 36.0, 30.0, 19.0, 16.0, 14.0, 9.0, 5.0, 6.0, 5.0, 2.0, 3.0, 1.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.1796875, -11.755126953125, -11.33056640625, -10.906005859375, -10.4814453125, -10.056884765625, -9.63232421875, -9.207763671875, -8.783203125, -8.358642578125, -7.93408203125, -7.509521484375, -7.0849609375, -6.660400390625, -6.23583984375, -5.811279296875, -5.38671875, -4.962158203125, -4.53759765625, -4.113037109375, -3.6884765625, -3.263916015625, -2.83935546875, -2.414794921875, -1.990234375, -1.565673828125, -1.14111328125, -0.716552734375, -0.2919921875, 0.132568359375, 0.55712890625, 0.981689453125, 1.40625, 1.830810546875, 2.25537109375, 2.679931640625, 3.1044921875, 3.529052734375, 3.95361328125, 4.378173828125, 4.802734375, 5.227294921875, 5.65185546875, 6.076416015625, 6.5009765625, 6.925537109375, 7.35009765625, 7.774658203125, 8.19921875, 8.623779296875, 9.04833984375, 9.472900390625, 9.8974609375, 10.322021484375, 10.74658203125, 11.171142578125, 11.595703125, 12.020263671875, 12.44482421875, 12.869384765625, 13.2939453125, 13.718505859375, 14.14306640625, 14.567626953125, 14.9921875]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 6.0, 11.0, 14.0, 17.0, 42.0, 38.0, 88.0, 114.0, 176.0, 288.0, 441.0, 618.0, 714.0, 526.0, 343.0, 250.0, 153.0, 78.0, 59.0, 41.0, 26.0, 14.0, 6.0, 7.0, 3.0, 3.0, 3.0, 5.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-23.5625, -23.0164794921875, -22.470458984375, -21.9244384765625, -21.37841796875, -20.8323974609375, -20.286376953125, -19.7403564453125, -19.1943359375, -18.6483154296875, -18.102294921875, -17.5562744140625, -17.01025390625, -16.4642333984375, -15.918212890625, -15.3721923828125, -14.826171875, -14.2801513671875, -13.734130859375, -13.1881103515625, -12.64208984375, -12.0960693359375, -11.550048828125, -11.0040283203125, -10.4580078125, -9.9119873046875, -9.365966796875, -8.8199462890625, -8.27392578125, -7.7279052734375, -7.181884765625, -6.6358642578125, -6.08984375, -5.5438232421875, -4.997802734375, -4.4517822265625, -3.90576171875, -3.3597412109375, -2.813720703125, -2.2677001953125, -1.7216796875, -1.1756591796875, -0.629638671875, -0.0836181640625, 0.46240234375, 1.0084228515625, 1.554443359375, 2.1004638671875, 2.646484375, 3.1925048828125, 3.738525390625, 4.2845458984375, 4.83056640625, 5.3765869140625, 5.922607421875, 6.4686279296875, 7.0146484375, 7.5606689453125, 8.106689453125, 8.6527099609375, 9.19873046875, 9.7447509765625, 10.290771484375, 10.8367919921875, 11.3828125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 2.0, 6.0, 17.0, 21.0, 34.0, 70.0, 126.0, 245.0, 625.0, 7115.0, 4111363.0, 73030.0, 970.0, 316.0, 152.0, 92.0, 37.0, 33.0, 15.0, 10.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.0, -49.70703125, -47.4140625, -45.12109375, -42.828125, -40.53515625, -38.2421875, -35.94921875, -33.65625, -31.36328125, -29.0703125, -26.77734375, -24.484375, -22.19140625, -19.8984375, -17.60546875, -15.3125, -13.01953125, -10.7265625, -8.43359375, -6.140625, -3.84765625, -1.5546875, 0.73828125, 3.03125, 5.32421875, 7.6171875, 9.91015625, 12.203125, 14.49609375, 16.7890625, 19.08203125, 21.375, 23.66796875, 25.9609375, 28.25390625, 30.546875, 32.83984375, 35.1328125, 37.42578125, 39.71875, 42.01171875, 44.3046875, 46.59765625, 48.890625, 51.18359375, 53.4765625, 55.76953125, 58.0625, 60.35546875, 62.6484375, 64.94140625, 67.234375, 69.52734375, 71.8203125, 74.11328125, 76.40625, 78.69921875, 80.9921875, 83.28515625, 85.578125, 87.87109375, 90.1640625, 92.45703125, 94.75]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 8.0, 56.0, 242.0, 426.0, 236.0, 42.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-155.42294311523438, -151.27183532714844, -147.1207275390625, -142.96961975097656, -138.81851196289062, -134.6674041748047, -130.51629638671875, -126.36518859863281, -122.21408081054688, -118.06297302246094, -113.911865234375, -109.76075744628906, -105.60964965820312, -101.45854187011719, -97.30743408203125, -93.15632629394531, -89.00521087646484, -84.8541030883789, -80.70299530029297, -76.55188751220703, -72.4007797241211, -68.24967193603516, -64.09855651855469, -59.947452545166016, -55.79634475708008, -51.64523696899414, -47.4941291809082, -43.343017578125, -39.19190979003906, -35.040802001953125, -30.889694213867188, -26.73858642578125, -22.58747100830078, -18.436363220214844, -14.28525447845459, -10.134145736694336, -5.983037948608398, -1.831930160522461, 2.3191795349121094, 6.470287322998047, 10.621395111083984, 14.772502899169922, 18.92361068725586, 23.07472038269043, 27.225828170776367, 31.376935958862305, 35.528045654296875, 39.67915344238281, 43.83026123046875, 47.98136901855469, 52.132476806640625, 56.28358459472656, 60.4346923828125, 64.58580017089844, 68.73690795898438, 72.88801574707031, 77.03912353515625, 81.19023132324219, 85.34133911132812, 89.49244689941406, 93.6435546875, 97.79466247558594, 101.94577026367188, 106.09687805175781, 110.24799346923828]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 6.0, 7.0, 7.0, 12.0, 7.0, 9.0, 11.0, 13.0, 16.0, 15.0, 20.0, 19.0, 20.0, 25.0, 33.0, 28.0, 28.0, 35.0, 31.0, 30.0, 40.0, 40.0, 40.0, 41.0, 42.0, 46.0, 33.0, 33.0, 37.0, 37.0, 26.0, 29.0, 24.0, 15.0, 21.0, 22.0, 19.0, 11.0, 13.0, 13.0, 7.0, 5.0, 10.0, 6.0, 3.0, 2.0, 4.0, 3.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0], "bins": [-36.650146484375, -35.53551483154297, -34.42088317871094, -33.306251525878906, -32.191619873046875, -31.07698631286621, -29.96235466003418, -28.84772300720215, -27.733089447021484, -26.618457794189453, -25.503826141357422, -24.38919448852539, -23.274560928344727, -22.159929275512695, -21.045297622680664, -19.930665969848633, -18.8160343170166, -17.70140266418457, -16.58677101135254, -15.472138404846191, -14.357505798339844, -13.242874145507812, -12.128242492675781, -11.01361083984375, -9.898978233337402, -8.784346580505371, -7.669713973999023, -6.555082321166992, -5.440450191497803, -4.325818061828613, -3.211186408996582, -2.0965542793273926, -0.9819221496582031, 0.13270986080169678, 1.2473418712615967, 2.361973762512207, 3.4766058921813965, 4.591238021850586, 5.705869674682617, 6.820501804351807, 7.935133934020996, 9.049765586853027, 10.164398193359375, 11.279029846191406, 12.393661499023438, 13.508294105529785, 14.622925758361816, 15.737558364868164, 16.852190017700195, 17.966821670532227, 19.081453323364258, 20.196086883544922, 21.310718536376953, 22.425350189208984, 23.539981842041016, 24.654613494873047, 25.769245147705078, 26.88387680053711, 27.99850845336914, 29.113140106201172, 30.227773666381836, 31.342405319213867, 32.45703887939453, 33.57167053222656, 34.686302185058594]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 6.0, 5.0, 7.0, 7.0, 11.0, 10.0, 13.0, 20.0, 19.0, 17.0, 21.0, 29.0, 26.0, 19.0, 28.0, 28.0, 27.0, 36.0, 37.0, 46.0, 41.0, 36.0, 31.0, 34.0, 42.0, 47.0, 36.0, 31.0, 39.0, 26.0, 21.0, 34.0, 24.0, 22.0, 23.0, 14.0, 18.0, 13.0, 10.0, 7.0, 8.0, 7.0, 5.0, 7.0, 1.0, 5.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-3.33984375, -3.238555908203125, -3.13726806640625, -3.035980224609375, -2.9346923828125, -2.833404541015625, -2.73211669921875, -2.630828857421875, -2.529541015625, -2.428253173828125, -2.32696533203125, -2.225677490234375, -2.1243896484375, -2.023101806640625, -1.92181396484375, -1.820526123046875, -1.71923828125, -1.617950439453125, -1.51666259765625, -1.415374755859375, -1.3140869140625, -1.212799072265625, -1.11151123046875, -1.010223388671875, -0.908935546875, -0.807647705078125, -0.70635986328125, -0.605072021484375, -0.5037841796875, -0.402496337890625, -0.30120849609375, -0.199920654296875, -0.0986328125, 0.002655029296875, 0.10394287109375, 0.205230712890625, 0.3065185546875, 0.407806396484375, 0.50909423828125, 0.610382080078125, 0.711669921875, 0.812957763671875, 0.91424560546875, 1.015533447265625, 1.1168212890625, 1.218109130859375, 1.31939697265625, 1.420684814453125, 1.52197265625, 1.623260498046875, 1.72454833984375, 1.825836181640625, 1.9271240234375, 2.028411865234375, 2.12969970703125, 2.230987548828125, 2.332275390625, 2.433563232421875, 2.53485107421875, 2.636138916015625, 2.7374267578125, 2.838714599609375, 2.94000244140625, 3.041290283203125, 3.142578125]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 4.0, 3.0, 8.0, 22.0, 24.0, 48.0, 57.0, 89.0, 122.0, 173.0, 256.0, 381.0, 516.0, 733.0, 1073.0, 1469.0, 2089.0, 3204.0, 4725.0, 7022.0, 10653.0, 16507.0, 26382.0, 42866.0, 72003.0, 120525.0, 179969.0, 194702.0, 139932.0, 85328.0, 50365.0, 30915.0, 19061.0, 12237.0, 8157.0, 5307.0, 3630.0, 2464.0, 1654.0, 1098.0, 855.0, 601.0, 435.0, 292.0, 172.0, 156.0, 83.0, 73.0, 42.0, 29.0, 23.0, 12.0, 14.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.337890625, -0.3277015686035156, -0.31751251220703125, -0.3073234558105469, -0.2971343994140625, -0.2869453430175781, -0.27675628662109375, -0.2665672302246094, -0.256378173828125, -0.24618911743164062, -0.23600006103515625, -0.22581100463867188, -0.2156219482421875, -0.20543289184570312, -0.19524383544921875, -0.18505477905273438, -0.17486572265625, -0.16467666625976562, -0.15448760986328125, -0.14429855346679688, -0.1341094970703125, -0.12392044067382812, -0.11373138427734375, -0.10354232788085938, -0.093353271484375, -0.08316421508789062, -0.07297515869140625, -0.06278610229492188, -0.0525970458984375, -0.042407989501953125, -0.03221893310546875, -0.022029876708984375, -0.0118408203125, -0.001651763916015625, 0.00853729248046875, 0.018726348876953125, 0.0289154052734375, 0.039104461669921875, 0.04929351806640625, 0.059482574462890625, 0.069671630859375, 0.07986068725585938, 0.09004974365234375, 0.10023880004882812, 0.1104278564453125, 0.12061691284179688, 0.13080596923828125, 0.14099502563476562, 0.15118408203125, 0.16137313842773438, 0.17156219482421875, 0.18175125122070312, 0.1919403076171875, 0.20212936401367188, 0.21231842041015625, 0.22250747680664062, 0.232696533203125, 0.24288558959960938, 0.25307464599609375, 0.2632637023925781, 0.2734527587890625, 0.2836418151855469, 0.29383087158203125, 0.3040199279785156, 0.314208984375]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 7.0, 4.0, 4.0, 6.0, 11.0, 9.0, 12.0, 8.0, 10.0, 17.0, 26.0, 20.0, 23.0, 17.0, 20.0, 33.0, 31.0, 29.0, 31.0, 34.0, 45.0, 34.0, 45.0, 37.0, 1065.0, 36.0, 42.0, 41.0, 28.0, 27.0, 33.0, 38.0, 36.0, 12.0, 22.0, 17.0, 16.0, 15.0, 14.0, 13.0, 15.0, 9.0, 5.0, 9.0, 6.0, 5.0, 5.0, 4.0, 3.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-2.0546875, -1.9926910400390625, -1.930694580078125, -1.8686981201171875, -1.80670166015625, -1.7447052001953125, -1.682708740234375, -1.6207122802734375, -1.5587158203125, -1.4967193603515625, -1.434722900390625, -1.3727264404296875, -1.31072998046875, -1.2487335205078125, -1.186737060546875, -1.1247406005859375, -1.062744140625, -1.0007476806640625, -0.938751220703125, -0.8767547607421875, -0.81475830078125, -0.7527618408203125, -0.690765380859375, -0.6287689208984375, -0.5667724609375, -0.5047760009765625, -0.442779541015625, -0.3807830810546875, -0.31878662109375, -0.2567901611328125, -0.194793701171875, -0.1327972412109375, -0.07080078125, -0.0088043212890625, 0.053192138671875, 0.1151885986328125, 0.17718505859375, 0.2391815185546875, 0.301177978515625, 0.3631744384765625, 0.4251708984375, 0.4871673583984375, 0.549163818359375, 0.6111602783203125, 0.67315673828125, 0.7351531982421875, 0.797149658203125, 0.8591461181640625, 0.921142578125, 0.9831390380859375, 1.045135498046875, 1.1071319580078125, 1.16912841796875, 1.2311248779296875, 1.293121337890625, 1.3551177978515625, 1.4171142578125, 1.4791107177734375, 1.541107177734375, 1.6031036376953125, 1.66510009765625, 1.7270965576171875, 1.789093017578125, 1.8510894775390625, 1.9130859375]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 11.0, 10.0, 17.0, 37.0, 46.0, 93.0, 121.0, 205.0, 337.0, 519.0, 891.0, 1442.0, 2360.0, 3915.0, 6286.0, 10754.0, 18243.0, 31661.0, 56273.0, 103985.0, 184302.0, 1285118.0, 171728.0, 95325.0, 51946.0, 29210.0, 16867.0, 9900.0, 6113.0, 3636.0, 2243.0, 1367.0, 804.0, 530.0, 322.0, 189.0, 109.0, 81.0, 53.0, 26.0, 24.0, 14.0, 8.0, 5.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32275390625, -0.3114013671875, -0.300048828125, -0.2886962890625, -0.27734375, -0.2659912109375, -0.254638671875, -0.2432861328125, -0.23193359375, -0.2205810546875, -0.209228515625, -0.1978759765625, -0.1865234375, -0.1751708984375, -0.163818359375, -0.1524658203125, -0.14111328125, -0.1297607421875, -0.118408203125, -0.1070556640625, -0.095703125, -0.0843505859375, -0.072998046875, -0.0616455078125, -0.05029296875, -0.0389404296875, -0.027587890625, -0.0162353515625, -0.0048828125, 0.0064697265625, 0.017822265625, 0.0291748046875, 0.04052734375, 0.0518798828125, 0.063232421875, 0.0745849609375, 0.0859375, 0.0972900390625, 0.108642578125, 0.1199951171875, 0.13134765625, 0.1427001953125, 0.154052734375, 0.1654052734375, 0.1767578125, 0.1881103515625, 0.199462890625, 0.2108154296875, 0.22216796875, 0.2335205078125, 0.244873046875, 0.2562255859375, 0.267578125, 0.2789306640625, 0.290283203125, 0.3016357421875, 0.31298828125, 0.3243408203125, 0.335693359375, 0.3470458984375, 0.3583984375, 0.3697509765625, 0.381103515625, 0.3924560546875, 0.40380859375]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 3.0, 6.0, 3.0, 5.0, 6.0, 10.0, 9.0, 8.0, 7.0, 16.0, 30.0, 24.0, 26.0, 28.0, 31.0, 26.0, 38.0, 31.0, 42.0, 47.0, 39.0, 44.0, 44.0, 39.0, 38.0, 47.0, 37.0, 33.0, 34.0, 36.0, 29.0, 28.0, 29.0, 24.0, 18.0, 11.0, 18.0, 8.0, 8.0, 11.0, 7.0, 6.0, 8.0, 3.0, 4.0, 2.0, 2.0, 5.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.0004627704620361328, -0.0004489533603191376, -0.00043513625860214233, -0.0004213191568851471, -0.00040750205516815186, -0.0003936849534511566, -0.0003798678517341614, -0.00036605075001716614, -0.0003522336483001709, -0.00033841654658317566, -0.0003245994448661804, -0.0003107823431491852, -0.00029696524143218994, -0.0002831481397151947, -0.00026933103799819946, -0.0002555139362812042, -0.00024169683456420898, -0.00022787973284721375, -0.0002140626311302185, -0.00020024552941322327, -0.00018642842769622803, -0.0001726113259792328, -0.00015879422426223755, -0.0001449771225452423, -0.00013116002082824707, -0.00011734291911125183, -0.00010352581739425659, -8.970871567726135e-05, -7.589161396026611e-05, -6.207451224327087e-05, -4.8257410526275635e-05, -3.4440308809280396e-05, -2.0623207092285156e-05, -6.806105375289917e-06, 7.010996341705322e-06, 2.082809805870056e-05, 3.46451997756958e-05, 4.846230149269104e-05, 6.227940320968628e-05, 7.609650492668152e-05, 8.991360664367676e-05, 0.000103730708360672, 0.00011754781007766724, 0.00013136491179466248, 0.00014518201351165771, 0.00015899911522865295, 0.0001728162169456482, 0.00018663331866264343, 0.00020045042037963867, 0.0002142675220966339, 0.00022808462381362915, 0.0002419017255306244, 0.00025571882724761963, 0.00026953592896461487, 0.0002833530306816101, 0.00029717013239860535, 0.0003109872341156006, 0.0003248043358325958, 0.00033862143754959106, 0.0003524385392665863, 0.00036625564098358154, 0.0003800727427005768, 0.000393889844417572, 0.00040770694613456726, 0.0004215240478515625]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 6.0, 4.0, 7.0, 6.0, 19.0, 12.0, 18.0, 23.0, 21.0, 38.0, 56.0, 59.0, 73.0, 101.0, 118.0, 150.0, 206.0, 376.0, 890.0, 68014.0, 974916.0, 1763.0, 561.0, 269.0, 193.0, 147.0, 119.0, 82.0, 76.0, 59.0, 42.0, 34.0, 18.0, 22.0, 12.0, 14.0, 11.0, 6.0, 2.0, 3.0, 3.0, 2.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.01091766357421875, -0.010589122772216797, -0.010260581970214844, -0.00993204116821289, -0.009603500366210938, -0.009274959564208984, -0.008946418762207031, -0.008617877960205078, -0.008289337158203125, -0.007960796356201172, -0.007632255554199219, -0.007303714752197266, -0.0069751739501953125, -0.006646633148193359, -0.006318092346191406, -0.005989551544189453, -0.0056610107421875, -0.005332469940185547, -0.005003929138183594, -0.004675388336181641, -0.0043468475341796875, -0.004018306732177734, -0.0036897659301757812, -0.003361225128173828, -0.003032684326171875, -0.002704143524169922, -0.0023756027221679688, -0.0020470619201660156, -0.0017185211181640625, -0.0013899803161621094, -0.0010614395141601562, -0.0007328987121582031, -0.00040435791015625, -7.581710815429688e-05, 0.00025272369384765625, 0.0005812644958496094, 0.0009098052978515625, 0.0012383460998535156, 0.0015668869018554688, 0.0018954277038574219, 0.002223968505859375, 0.002552509307861328, 0.0028810501098632812, 0.0032095909118652344, 0.0035381317138671875, 0.0038666725158691406, 0.004195213317871094, 0.004523754119873047, 0.004852294921875, 0.005180835723876953, 0.005509376525878906, 0.005837917327880859, 0.0061664581298828125, 0.006494998931884766, 0.006823539733886719, 0.007152080535888672, 0.007480621337890625, 0.007809162139892578, 0.008137702941894531, 0.008466243743896484, 0.008794784545898438, 0.00912332534790039, 0.009451866149902344, 0.009780406951904297, 0.01010894775390625]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 151.0, 656.0, 190.0, 12.0, 3.0], "bins": [-0.0034860901068896055, -0.0034285029396414757, -0.003370915772393346, -0.0033133288379758596, -0.00325574167072773, -0.0031981545034796, -0.00314056733623147, -0.003082980401813984, -0.003025393234565854, -0.0029678060673177242, -0.0029102189000695944, -0.002852631965652108, -0.0027950447984039783, -0.0027374576311558485, -0.0026798704639077187, -0.0026222835294902325, -0.0025646963622421026, -0.0025071091949939728, -0.002449522027745843, -0.0023919350933283567, -0.002334347926080227, -0.002276760758832097, -0.002219173591583967, -0.002161586657166481, -0.002103999489918351, -0.0020464123226702213, -0.0019888251554220915, -0.0019312381045892835, -0.0018736510537564754, -0.0018160638865083456, -0.0017584768356755376, -0.0017008896684274077, -0.001643302384763956, -0.0015857152175158262, -0.0015281281666830182, -0.0014705409994348884, -0.0014129539486020803, -0.0013553667813539505, -0.0012977797305211425, -0.0012401925632730126, -0.0011826055124402046, -0.0011250183451920748, -0.0010674312943592668, -0.001009844127111137, -0.0009522570762783289, -0.000894669909030199, -0.000837082858197391, -0.0007794956909492612, -0.0007219086401164532, -0.0006643215310759842, -0.0006067344220355153, -0.0005491473129950464, -0.0004915602039545774, -0.00043397306581027806, -0.0003763859567698091, -0.0003187988477293402, -0.00026121173868887126, -0.00020362462964840233, -0.0001460375206079334, -8.845039701554924e-05, -3.086328797508031e-05, 2.6723835617303848e-05, 8.431094465777278e-05, 0.0001418980536982417, 0.00019948516273871064]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 2.0, 10.0, 9.0, 7.0, 10.0, 13.0, 14.0, 26.0, 18.0, 18.0, 17.0, 18.0, 25.0, 35.0, 34.0, 37.0, 29.0, 36.0, 43.0, 49.0, 49.0, 41.0, 62.0, 43.0, 30.0, 30.0, 31.0, 35.0, 23.0, 25.0, 26.0, 20.0, 16.0, 11.0, 16.0, 16.0, 17.0, 7.0, 9.0, 12.0, 10.0, 4.0, 6.0, 6.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0002422928810119629, -0.00023375451564788818, -0.00022521615028381348, -0.00021667778491973877, -0.00020813941955566406, -0.00019960105419158936, -0.00019106268882751465, -0.00018252432346343994, -0.00017398595809936523, -0.00016544759273529053, -0.00015690922737121582, -0.0001483708620071411, -0.0001398324966430664, -0.0001312941312789917, -0.000122755765914917, -0.00011421740055084229, -0.00010567903518676758, -9.714066982269287e-05, -8.860230445861816e-05, -8.006393909454346e-05, -7.152557373046875e-05, -6.298720836639404e-05, -5.4448843002319336e-05, -4.591047763824463e-05, -3.737211227416992e-05, -2.8833746910095215e-05, -2.0295381546020508e-05, -1.17570161819458e-05, -3.2186508178710938e-06, 5.319714546203613e-06, 1.385807991027832e-05, 2.2396445274353027e-05, 3.0934810638427734e-05, 3.947317600250244e-05, 4.801154136657715e-05, 5.6549906730651855e-05, 6.508827209472656e-05, 7.362663745880127e-05, 8.216500282287598e-05, 9.070336818695068e-05, 9.924173355102539e-05, 0.0001077800989151001, 0.0001163184642791748, 0.0001248568296432495, 0.00013339519500732422, 0.00014193356037139893, 0.00015047192573547363, 0.00015901029109954834, 0.00016754865646362305, 0.00017608702182769775, 0.00018462538719177246, 0.00019316375255584717, 0.00020170211791992188, 0.00021024048328399658, 0.0002187788486480713, 0.000227317214012146, 0.0002358555793762207, 0.0002443939447402954, 0.0002529323101043701, 0.0002614706754684448, 0.00027000904083251953, 0.00027854740619659424, 0.00028708577156066895, 0.00029562413692474365, 0.00030416250228881836]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 6.0, 5.0, 7.0, 7.0, 11.0, 10.0, 13.0, 20.0, 19.0, 17.0, 21.0, 29.0, 26.0, 19.0, 28.0, 28.0, 27.0, 36.0, 37.0, 46.0, 41.0, 36.0, 31.0, 34.0, 42.0, 47.0, 36.0, 31.0, 39.0, 26.0, 21.0, 34.0, 24.0, 22.0, 23.0, 14.0, 18.0, 13.0, 10.0, 7.0, 8.0, 7.0, 5.0, 7.0, 1.0, 5.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-3.33984375, -3.238555908203125, -3.13726806640625, -3.035980224609375, -2.9346923828125, -2.833404541015625, -2.73211669921875, -2.630828857421875, -2.529541015625, -2.428253173828125, -2.32696533203125, -2.225677490234375, -2.1243896484375, -2.023101806640625, -1.92181396484375, -1.820526123046875, -1.71923828125, -1.617950439453125, -1.51666259765625, -1.415374755859375, -1.3140869140625, -1.212799072265625, -1.11151123046875, -1.010223388671875, -0.908935546875, -0.807647705078125, -0.70635986328125, -0.605072021484375, -0.5037841796875, -0.402496337890625, -0.30120849609375, -0.199920654296875, -0.0986328125, 0.002655029296875, 0.10394287109375, 0.205230712890625, 0.3065185546875, 0.407806396484375, 0.50909423828125, 0.610382080078125, 0.711669921875, 0.812957763671875, 0.91424560546875, 1.015533447265625, 1.1168212890625, 1.218109130859375, 1.31939697265625, 1.420684814453125, 1.52197265625, 1.623260498046875, 1.72454833984375, 1.825836181640625, 1.9271240234375, 2.028411865234375, 2.12969970703125, 2.230987548828125, 2.332275390625, 2.433563232421875, 2.53485107421875, 2.636138916015625, 2.7374267578125, 2.838714599609375, 2.94000244140625, 3.041290283203125, 3.142578125]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 9.0, 9.0, 6.0, 15.0, 18.0, 27.0, 31.0, 41.0, 71.0, 122.0, 156.0, 206.0, 354.0, 495.0, 764.0, 1173.0, 2067.0, 3507.0, 6867.0, 14705.0, 35515.0, 95709.0, 307007.0, 385888.0, 116273.0, 42576.0, 17093.0, 7930.0, 3923.0, 2136.0, 1344.0, 805.0, 512.0, 395.0, 259.0, 165.0, 119.0, 82.0, 56.0, 36.0, 26.0, 20.0, 18.0, 9.0, 7.0, 6.0, 5.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.640625, -2.555694580078125, -2.47076416015625, -2.385833740234375, -2.3009033203125, -2.215972900390625, -2.13104248046875, -2.046112060546875, -1.961181640625, -1.876251220703125, -1.79132080078125, -1.706390380859375, -1.6214599609375, -1.536529541015625, -1.45159912109375, -1.366668701171875, -1.28173828125, -1.196807861328125, -1.11187744140625, -1.026947021484375, -0.9420166015625, -0.857086181640625, -0.77215576171875, -0.687225341796875, -0.602294921875, -0.517364501953125, -0.43243408203125, -0.347503662109375, -0.2625732421875, -0.177642822265625, -0.09271240234375, -0.007781982421875, 0.0771484375, 0.162078857421875, 0.24700927734375, 0.331939697265625, 0.4168701171875, 0.501800537109375, 0.58673095703125, 0.671661376953125, 0.756591796875, 0.841522216796875, 0.92645263671875, 1.011383056640625, 1.0963134765625, 1.181243896484375, 1.26617431640625, 1.351104736328125, 1.43603515625, 1.520965576171875, 1.60589599609375, 1.690826416015625, 1.7757568359375, 1.860687255859375, 1.94561767578125, 2.030548095703125, 2.115478515625, 2.200408935546875, 2.28533935546875, 2.370269775390625, 2.4552001953125, 2.540130615234375, 2.62506103515625, 2.709991455078125, 2.794921875]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 4.0, 4.0, 3.0, 9.0, 13.0, 9.0, 6.0, 14.0, 17.0, 15.0, 16.0, 14.0, 34.0, 32.0, 30.0, 28.0, 35.0, 43.0, 34.0, 45.0, 75.0, 105.0, 1657.0, 243.0, 93.0, 73.0, 53.0, 37.0, 49.0, 27.0, 34.0, 30.0, 22.0, 30.0, 21.0, 23.0, 23.0, 10.0, 7.0, 8.0, 8.0, 5.0, 5.0, 5.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.9453125, -11.5574951171875, -11.169677734375, -10.7818603515625, -10.39404296875, -10.0062255859375, -9.618408203125, -9.2305908203125, -8.8427734375, -8.4549560546875, -8.067138671875, -7.6793212890625, -7.29150390625, -6.9036865234375, -6.515869140625, -6.1280517578125, -5.740234375, -5.3524169921875, -4.964599609375, -4.5767822265625, -4.18896484375, -3.8011474609375, -3.413330078125, -3.0255126953125, -2.6376953125, -2.2498779296875, -1.862060546875, -1.4742431640625, -1.08642578125, -0.6986083984375, -0.310791015625, 0.0770263671875, 0.46484375, 0.8526611328125, 1.240478515625, 1.6282958984375, 2.01611328125, 2.4039306640625, 2.791748046875, 3.1795654296875, 3.5673828125, 3.9552001953125, 4.343017578125, 4.7308349609375, 5.11865234375, 5.5064697265625, 5.894287109375, 6.2821044921875, 6.669921875, 7.0577392578125, 7.445556640625, 7.8333740234375, 8.22119140625, 8.6090087890625, 8.996826171875, 9.3846435546875, 9.7724609375, 10.1602783203125, 10.548095703125, 10.9359130859375, 11.32373046875, 11.7115478515625, 12.099365234375, 12.4871826171875, 12.875]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 7.0, 8.0, 5.0, 14.0, 10.0, 16.0, 24.0, 25.0, 30.0, 36.0, 30.0, 55.0, 60.0, 100.0, 164.0, 235.0, 493.0, 1336.0, 7872.0, 526154.0, 2593056.0, 12799.0, 1735.0, 566.0, 270.0, 134.0, 103.0, 67.0, 47.0, 46.0, 43.0, 25.0, 18.0, 21.0, 17.0, 13.0, 14.0, 6.0, 16.0, 6.0, 8.0, 5.0, 3.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-19.578125, -18.948486328125, -18.31884765625, -17.689208984375, -17.0595703125, -16.429931640625, -15.80029296875, -15.170654296875, -14.541015625, -13.911376953125, -13.28173828125, -12.652099609375, -12.0224609375, -11.392822265625, -10.76318359375, -10.133544921875, -9.50390625, -8.874267578125, -8.24462890625, -7.614990234375, -6.9853515625, -6.355712890625, -5.72607421875, -5.096435546875, -4.466796875, -3.837158203125, -3.20751953125, -2.577880859375, -1.9482421875, -1.318603515625, -0.68896484375, -0.059326171875, 0.5703125, 1.199951171875, 1.82958984375, 2.459228515625, 3.0888671875, 3.718505859375, 4.34814453125, 4.977783203125, 5.607421875, 6.237060546875, 6.86669921875, 7.496337890625, 8.1259765625, 8.755615234375, 9.38525390625, 10.014892578125, 10.64453125, 11.274169921875, 11.90380859375, 12.533447265625, 13.1630859375, 13.792724609375, 14.42236328125, 15.052001953125, 15.681640625, 16.311279296875, 16.94091796875, 17.570556640625, 18.2001953125, 18.829833984375, 19.45947265625, 20.089111328125, 20.71875]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 72.0, 751.0, 182.0, 8.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.508129119873047, -26.452463150024414, -23.39679718017578, -20.341129302978516, -17.285463333129883, -14.22979736328125, -11.174129486083984, -8.118463516235352, -5.062797546386719, -2.0071310997009277, 1.0485353469848633, 4.1042022705078125, 7.159868240356445, 10.215534210205078, 13.271202087402344, 16.326868057250977, 19.38253402709961, 22.438199996948242, 25.493865966796875, 28.54953384399414, 31.605199813842773, 34.660865783691406, 37.71653366088867, 40.77220153808594, 43.82786560058594, 46.8835334777832, 49.9391975402832, 52.99486541748047, 56.05052947998047, 59.106197357177734, 62.161865234375, 65.217529296875, 68.273193359375, 71.328857421875, 74.38452911376953, 77.44019317626953, 80.49585723876953, 83.55152893066406, 86.60719299316406, 89.66285705566406, 92.71852111816406, 95.77418518066406, 98.8298568725586, 101.8855209350586, 104.9411849975586, 107.99685668945312, 111.05252075195312, 114.10818481445312, 117.16385650634766, 120.21952056884766, 123.27519226074219, 126.33085632324219, 129.3865203857422, 132.4421844482422, 135.49786376953125, 138.55352783203125, 141.60919189453125, 144.66485595703125, 147.72052001953125, 150.77618408203125, 153.8318634033203, 156.8875274658203, 159.9431915283203, 162.9988555908203, 166.0545196533203]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 0.0, 6.0, 5.0, 9.0, 11.0, 9.0, 14.0, 10.0, 25.0, 18.0, 24.0, 23.0, 27.0, 27.0, 37.0, 28.0, 29.0, 36.0, 39.0, 37.0, 45.0, 46.0, 41.0, 28.0, 37.0, 43.0, 38.0, 46.0, 34.0, 24.0, 23.0, 25.0, 19.0, 19.0, 15.0, 18.0, 15.0, 13.0, 14.0, 12.0, 11.0, 3.0, 5.0, 1.0, 5.0, 4.0, 1.0, 5.0, 4.0, 0.0, 0.0, 2.0, 0.0, 3.0], "bins": [-42.91389083862305, -41.59577941894531, -40.277671813964844, -38.95956039428711, -37.64145278930664, -36.323341369628906, -35.00523376464844, -33.6871223449707, -32.36901092529297, -31.050901412963867, -29.732791900634766, -28.414682388305664, -27.096572875976562, -25.778461456298828, -24.460351943969727, -23.142242431640625, -21.824134826660156, -20.506025314331055, -19.187915802001953, -17.86980628967285, -16.55169677734375, -15.233586311340332, -13.915475845336914, -12.597366333007812, -11.279256820678711, -9.96114730834961, -8.643037796020508, -7.32492733001709, -6.006817817687988, -4.688708305358887, -3.370598316192627, -2.052488327026367, -0.7343826293945312, 0.5837271213531494, 1.90183687210083, 3.2199466228485107, 4.538056373596191, 5.856165885925293, 7.174275875091553, 8.492385864257812, 9.810495376586914, 11.128604888916016, 12.446714401245117, 13.764824867248535, 15.082934379577637, 16.401042938232422, 17.719154357910156, 19.037263870239258, 20.35537338256836, 21.67348289489746, 22.991592407226562, 24.309701919555664, 25.627811431884766, 26.9459228515625, 28.2640323638916, 29.582141876220703, 30.900251388549805, 32.218360900878906, 33.53647232055664, 34.85457992553711, 36.172691345214844, 37.49079895019531, 38.80891036987305, 40.12702178955078, 41.44512939453125]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 5.0, 6.0, 8.0, 8.0, 6.0, 12.0, 19.0, 21.0, 17.0, 19.0, 28.0, 35.0, 18.0, 28.0, 21.0, 26.0, 37.0, 41.0, 49.0, 45.0, 31.0, 33.0, 38.0, 48.0, 43.0, 32.0, 35.0, 39.0, 33.0, 25.0, 19.0, 27.0, 19.0, 22.0, 21.0, 17.0, 16.0, 10.0, 6.0, 6.0, 8.0, 7.0, 4.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.490234375, -3.381622314453125, -3.27301025390625, -3.164398193359375, -3.0557861328125, -2.947174072265625, -2.83856201171875, -2.729949951171875, -2.621337890625, -2.512725830078125, -2.40411376953125, -2.295501708984375, -2.1868896484375, -2.078277587890625, -1.96966552734375, -1.861053466796875, -1.75244140625, -1.643829345703125, -1.53521728515625, -1.426605224609375, -1.3179931640625, -1.209381103515625, -1.10076904296875, -0.992156982421875, -0.883544921875, -0.774932861328125, -0.66632080078125, -0.557708740234375, -0.4490966796875, -0.340484619140625, -0.23187255859375, -0.123260498046875, -0.0146484375, 0.093963623046875, 0.20257568359375, 0.311187744140625, 0.4197998046875, 0.528411865234375, 0.63702392578125, 0.745635986328125, 0.854248046875, 0.962860107421875, 1.07147216796875, 1.180084228515625, 1.2886962890625, 1.397308349609375, 1.50592041015625, 1.614532470703125, 1.72314453125, 1.831756591796875, 1.94036865234375, 2.048980712890625, 2.1575927734375, 2.266204833984375, 2.37481689453125, 2.483428955078125, 2.592041015625, 2.700653076171875, 2.80926513671875, 2.917877197265625, 3.0264892578125, 3.135101318359375, 3.24371337890625, 3.352325439453125, 3.4609375]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 1.0, 1.0, 5.0, 3.0, 8.0, 7.0, 12.0, 10.0, 12.0, 12.0, 12.0, 20.0, 14.0, 29.0, 22.0, 27.0, 21.0, 39.0, 54.0, 97.0, 228.0, 881.0, 7478.0, 237980.0, 3779848.0, 159991.0, 6010.0, 835.0, 220.0, 77.0, 63.0, 37.0, 29.0, 32.0, 22.0, 23.0, 22.0, 19.0, 17.0, 7.0, 16.0, 13.0, 3.0, 9.0, 0.0, 6.0, 3.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-21.375, -20.736083984375, -20.09716796875, -19.458251953125, -18.8193359375, -18.180419921875, -17.54150390625, -16.902587890625, -16.263671875, -15.624755859375, -14.98583984375, -14.346923828125, -13.7080078125, -13.069091796875, -12.43017578125, -11.791259765625, -11.15234375, -10.513427734375, -9.87451171875, -9.235595703125, -8.5966796875, -7.957763671875, -7.31884765625, -6.679931640625, -6.041015625, -5.402099609375, -4.76318359375, -4.124267578125, -3.4853515625, -2.846435546875, -2.20751953125, -1.568603515625, -0.9296875, -0.290771484375, 0.34814453125, 0.987060546875, 1.6259765625, 2.264892578125, 2.90380859375, 3.542724609375, 4.181640625, 4.820556640625, 5.45947265625, 6.098388671875, 6.7373046875, 7.376220703125, 8.01513671875, 8.654052734375, 9.29296875, 9.931884765625, 10.57080078125, 11.209716796875, 11.8486328125, 12.487548828125, 13.12646484375, 13.765380859375, 14.404296875, 15.043212890625, 15.68212890625, 16.321044921875, 16.9599609375, 17.598876953125, 18.23779296875, 18.876708984375, 19.515625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 6.0, 4.0, 5.0, 14.0, 13.0, 27.0, 33.0, 44.0, 74.0, 113.0, 174.0, 253.0, 319.0, 510.0, 617.0, 539.0, 444.0, 298.0, 211.0, 110.0, 87.0, 57.0, 51.0, 20.0, 16.0, 21.0, 5.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.7421875, -14.3050537109375, -13.867919921875, -13.4307861328125, -12.99365234375, -12.5565185546875, -12.119384765625, -11.6822509765625, -11.2451171875, -10.8079833984375, -10.370849609375, -9.9337158203125, -9.49658203125, -9.0594482421875, -8.622314453125, -8.1851806640625, -7.748046875, -7.3109130859375, -6.873779296875, -6.4366455078125, -5.99951171875, -5.5623779296875, -5.125244140625, -4.6881103515625, -4.2509765625, -3.8138427734375, -3.376708984375, -2.9395751953125, -2.50244140625, -2.0653076171875, -1.628173828125, -1.1910400390625, -0.75390625, -0.3167724609375, 0.120361328125, 0.5574951171875, 0.99462890625, 1.4317626953125, 1.868896484375, 2.3060302734375, 2.7431640625, 3.1802978515625, 3.617431640625, 4.0545654296875, 4.49169921875, 4.9288330078125, 5.365966796875, 5.8031005859375, 6.240234375, 6.6773681640625, 7.114501953125, 7.5516357421875, 7.98876953125, 8.4259033203125, 8.863037109375, 9.3001708984375, 9.7373046875, 10.1744384765625, 10.611572265625, 11.0487060546875, 11.48583984375, 11.9229736328125, 12.360107421875, 12.7972412109375, 13.234375]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 9.0, 17.0, 32.0, 38.0, 76.0, 105.0, 205.0, 399.0, 1260.0, 88550.0, 4089718.0, 12351.0, 794.0, 318.0, 165.0, 85.0, 57.0, 38.0, 19.0, 8.0, 11.0, 5.0, 3.0, 4.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-59.46875, -57.44189453125, -55.4150390625, -53.38818359375, -51.361328125, -49.33447265625, -47.3076171875, -45.28076171875, -43.25390625, -41.22705078125, -39.2001953125, -37.17333984375, -35.146484375, -33.11962890625, -31.0927734375, -29.06591796875, -27.0390625, -25.01220703125, -22.9853515625, -20.95849609375, -18.931640625, -16.90478515625, -14.8779296875, -12.85107421875, -10.82421875, -8.79736328125, -6.7705078125, -4.74365234375, -2.716796875, -0.68994140625, 1.3369140625, 3.36376953125, 5.390625, 7.41748046875, 9.4443359375, 11.47119140625, 13.498046875, 15.52490234375, 17.5517578125, 19.57861328125, 21.60546875, 23.63232421875, 25.6591796875, 27.68603515625, 29.712890625, 31.73974609375, 33.7666015625, 35.79345703125, 37.8203125, 39.84716796875, 41.8740234375, 43.90087890625, 45.927734375, 47.95458984375, 49.9814453125, 52.00830078125, 54.03515625, 56.06201171875, 58.0888671875, 60.11572265625, 62.142578125, 64.16943359375, 66.1962890625, 68.22314453125, 70.25]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [14.0, 102.0, 341.0, 419.0, 124.0, 16.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.621432304382324, -9.83110523223877, -5.040778160095215, -0.25045108795166016, 4.5398759841918945, 9.33020305633545, 14.120530128479004, 18.91085433959961, 23.701183319091797, 28.49151039123535, 33.281837463378906, 38.072166442871094, 42.862491607666016, 47.65281677246094, 52.443145751953125, 57.23347091674805, 62.023799896240234, 66.81412506103516, 71.60445404052734, 76.39478302001953, 81.18510437011719, 85.97543334960938, 90.76576232910156, 95.55609130859375, 100.34642028808594, 105.13674926757812, 109.92707824707031, 114.71739959716797, 119.50772857666016, 124.29805755615234, 129.08837890625, 133.8787078857422, 138.66903686523438, 143.45936584472656, 148.24969482421875, 153.04002380371094, 157.83035278320312, 162.62066650390625, 167.41099548339844, 172.20132446289062, 176.9916534423828, 181.781982421875, 186.5723114013672, 191.36264038085938, 196.1529541015625, 200.9432830810547, 205.73361206054688, 210.52394104003906, 215.31427001953125, 220.10459899902344, 224.89492797851562, 229.6852569580078, 234.4755859375, 239.26589965820312, 244.0562286376953, 248.8465576171875, 253.6368865966797, 258.4272155761719, 263.217529296875, 268.00787353515625, 272.7981872558594, 277.5885314941406, 282.37884521484375, 287.169189453125, 291.9595031738281]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 0.0, 2.0, 5.0, 9.0, 6.0, 10.0, 8.0, 18.0, 21.0, 13.0, 16.0, 20.0, 21.0, 26.0, 19.0, 22.0, 32.0, 27.0, 34.0, 39.0, 36.0, 47.0, 35.0, 34.0, 37.0, 45.0, 37.0, 41.0, 32.0, 31.0, 34.0, 35.0, 36.0, 36.0, 24.0, 24.0, 9.0, 17.0, 12.0, 16.0, 13.0, 9.0, 4.0, 3.0, 4.0, 3.0, 1.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.776397705078125, -32.67884063720703, -31.581283569335938, -30.483728408813477, -29.386171340942383, -28.28861427307129, -27.191059112548828, -26.093502044677734, -24.99594497680664, -23.898387908935547, -22.800830841064453, -21.703275680541992, -20.6057186126709, -19.508161544799805, -18.410606384277344, -17.31304931640625, -16.215492248535156, -15.117935180664062, -14.020379066467285, -12.922822952270508, -11.825265884399414, -10.72770881652832, -9.630152702331543, -8.532596588134766, -7.435039520263672, -6.337482929229736, -5.239926338195801, -4.142369747161865, -3.0448131561279297, -1.9472565650939941, -0.8496999740600586, 0.24785661697387695, 1.3454132080078125, 2.442969799041748, 3.5405263900756836, 4.638082981109619, 5.735639572143555, 6.83319616317749, 7.930752754211426, 9.028308868408203, 10.125865936279297, 11.22342300415039, 12.320979118347168, 13.418535232543945, 14.516092300415039, 15.613649368286133, 16.711204528808594, 17.808761596679688, 18.90631866455078, 20.003875732421875, 21.10143280029297, 22.19898796081543, 23.296545028686523, 24.394102096557617, 25.491657257080078, 26.589214324951172, 27.686771392822266, 28.78432846069336, 29.881885528564453, 30.979440689086914, 32.076995849609375, 33.17455291748047, 34.27210998535156, 35.369667053222656, 36.46722412109375]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 7.0, 1.0, 6.0, 5.0, 5.0, 3.0, 7.0, 10.0, 11.0, 18.0, 14.0, 25.0, 23.0, 32.0, 33.0, 26.0, 26.0, 30.0, 34.0, 40.0, 50.0, 44.0, 33.0, 47.0, 42.0, 39.0, 40.0, 45.0, 45.0, 43.0, 23.0, 23.0, 34.0, 22.0, 27.0, 21.0, 18.0, 18.0, 3.0, 10.0, 7.0, 6.0, 4.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1015625, -3.977935791015625, -3.85430908203125, -3.730682373046875, -3.6070556640625, -3.483428955078125, -3.35980224609375, -3.236175537109375, -3.112548828125, -2.988922119140625, -2.86529541015625, -2.741668701171875, -2.6180419921875, -2.494415283203125, -2.37078857421875, -2.247161865234375, -2.12353515625, -1.999908447265625, -1.87628173828125, -1.752655029296875, -1.6290283203125, -1.505401611328125, -1.38177490234375, -1.258148193359375, -1.134521484375, -1.010894775390625, -0.88726806640625, -0.763641357421875, -0.6400146484375, -0.516387939453125, -0.39276123046875, -0.269134521484375, -0.1455078125, -0.021881103515625, 0.10174560546875, 0.225372314453125, 0.3489990234375, 0.472625732421875, 0.59625244140625, 0.719879150390625, 0.843505859375, 0.967132568359375, 1.09075927734375, 1.214385986328125, 1.3380126953125, 1.461639404296875, 1.58526611328125, 1.708892822265625, 1.83251953125, 1.956146240234375, 2.07977294921875, 2.203399658203125, 2.3270263671875, 2.450653076171875, 2.57427978515625, 2.697906494140625, 2.821533203125, 2.945159912109375, 3.06878662109375, 3.192413330078125, 3.3160400390625, 3.439666748046875, 3.56329345703125, 3.686920166015625, 3.810546875]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 4.0, 13.0, 5.0, 11.0, 20.0, 23.0, 51.0, 56.0, 66.0, 104.0, 153.0, 226.0, 303.0, 423.0, 638.0, 816.0, 1263.0, 1730.0, 2722.0, 3995.0, 6162.0, 9334.0, 14807.0, 23498.0, 39231.0, 67609.0, 119456.0, 192108.0, 211359.0, 144131.0, 83082.0, 47134.0, 28241.0, 17306.0, 10943.0, 6950.0, 4695.0, 3132.0, 2009.0, 1503.0, 945.0, 711.0, 437.0, 334.0, 240.0, 156.0, 119.0, 114.0, 58.0, 43.0, 36.0, 18.0, 16.0, 15.0, 9.0, 1.0, 2.0, 3.0, 2.0, 1.0], "bins": [-0.379150390625, -0.3673667907714844, -0.35558319091796875, -0.3437995910644531, -0.3320159912109375, -0.3202323913574219, -0.30844879150390625, -0.2966651916503906, -0.284881591796875, -0.2730979919433594, -0.26131439208984375, -0.24953079223632812, -0.2377471923828125, -0.22596359252929688, -0.21417999267578125, -0.20239639282226562, -0.19061279296875, -0.17882919311523438, -0.16704559326171875, -0.15526199340820312, -0.1434783935546875, -0.13169479370117188, -0.11991119384765625, -0.10812759399414062, -0.096343994140625, -0.08456039428710938, -0.07277679443359375, -0.060993194580078125, -0.0492095947265625, -0.037425994873046875, -0.02564239501953125, -0.013858795166015625, -0.0020751953125, 0.009708404541015625, 0.02149200439453125, 0.033275604248046875, 0.0450592041015625, 0.056842803955078125, 0.06862640380859375, 0.08041000366210938, 0.092193603515625, 0.10397720336914062, 0.11576080322265625, 0.12754440307617188, 0.1393280029296875, 0.15111160278320312, 0.16289520263671875, 0.17467880249023438, 0.18646240234375, 0.19824600219726562, 0.21002960205078125, 0.22181320190429688, 0.2335968017578125, 0.24538040161132812, 0.25716400146484375, 0.2689476013183594, 0.280731201171875, 0.2925148010253906, 0.30429840087890625, 0.3160820007324219, 0.3278656005859375, 0.3396492004394531, 0.35143280029296875, 0.3632164001464844, 0.375]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 5.0, 2.0, 1.0, 1.0, 4.0, 7.0, 8.0, 10.0, 13.0, 16.0, 19.0, 25.0, 20.0, 35.0, 30.0, 40.0, 27.0, 31.0, 44.0, 30.0, 37.0, 36.0, 39.0, 1063.0, 41.0, 43.0, 54.0, 34.0, 37.0, 30.0, 25.0, 29.0, 29.0, 25.0, 25.0, 16.0, 22.0, 19.0, 11.0, 10.0, 7.0, 6.0, 4.0, 3.0, 7.0, 3.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.392578125, -2.318511962890625, -2.24444580078125, -2.170379638671875, -2.0963134765625, -2.022247314453125, -1.94818115234375, -1.874114990234375, -1.800048828125, -1.725982666015625, -1.65191650390625, -1.577850341796875, -1.5037841796875, -1.429718017578125, -1.35565185546875, -1.281585693359375, -1.20751953125, -1.133453369140625, -1.05938720703125, -0.985321044921875, -0.9112548828125, -0.837188720703125, -0.76312255859375, -0.689056396484375, -0.614990234375, -0.540924072265625, -0.46685791015625, -0.392791748046875, -0.3187255859375, -0.244659423828125, -0.17059326171875, -0.096527099609375, -0.0224609375, 0.051605224609375, 0.12567138671875, 0.199737548828125, 0.2738037109375, 0.347869873046875, 0.42193603515625, 0.496002197265625, 0.570068359375, 0.644134521484375, 0.71820068359375, 0.792266845703125, 0.8663330078125, 0.940399169921875, 1.01446533203125, 1.088531494140625, 1.16259765625, 1.236663818359375, 1.31072998046875, 1.384796142578125, 1.4588623046875, 1.532928466796875, 1.60699462890625, 1.681060791015625, 1.755126953125, 1.829193115234375, 1.90325927734375, 1.977325439453125, 2.0513916015625, 2.125457763671875, 2.19952392578125, 2.273590087890625, 2.34765625]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 8.0, 7.0, 16.0, 24.0, 33.0, 46.0, 79.0, 111.0, 161.0, 264.0, 393.0, 597.0, 886.0, 1396.0, 2192.0, 3443.0, 5556.0, 8842.0, 14473.0, 24010.0, 40426.0, 68795.0, 116382.0, 183026.0, 1254920.0, 148513.0, 89269.0, 52821.0, 31228.0, 18490.0, 11431.0, 6887.0, 4412.0, 2787.0, 1804.0, 1124.0, 786.0, 501.0, 318.0, 225.0, 149.0, 94.0, 62.0, 45.0, 30.0, 26.0, 14.0, 10.0, 6.0, 5.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0], "bins": [-0.349853515625, -0.3390045166015625, -0.328155517578125, -0.3173065185546875, -0.30645751953125, -0.2956085205078125, -0.284759521484375, -0.2739105224609375, -0.2630615234375, -0.2522125244140625, -0.241363525390625, -0.2305145263671875, -0.21966552734375, -0.2088165283203125, -0.197967529296875, -0.1871185302734375, -0.17626953125, -0.1654205322265625, -0.154571533203125, -0.1437225341796875, -0.13287353515625, -0.1220245361328125, -0.111175537109375, -0.1003265380859375, -0.0894775390625, -0.0786285400390625, -0.067779541015625, -0.0569305419921875, -0.04608154296875, -0.0352325439453125, -0.024383544921875, -0.0135345458984375, -0.002685546875, 0.0081634521484375, 0.019012451171875, 0.0298614501953125, 0.04071044921875, 0.0515594482421875, 0.062408447265625, 0.0732574462890625, 0.0841064453125, 0.0949554443359375, 0.105804443359375, 0.1166534423828125, 0.12750244140625, 0.1383514404296875, 0.149200439453125, 0.1600494384765625, 0.1708984375, 0.1817474365234375, 0.192596435546875, 0.2034454345703125, 0.21429443359375, 0.2251434326171875, 0.235992431640625, 0.2468414306640625, 0.2576904296875, 0.2685394287109375, 0.279388427734375, 0.2902374267578125, 0.30108642578125, 0.3119354248046875, 0.322784423828125, 0.3336334228515625, 0.344482421875]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 7.0, 4.0, 14.0, 3.0, 19.0, 14.0, 22.0, 27.0, 27.0, 27.0, 21.0, 36.0, 34.0, 40.0, 48.0, 49.0, 55.0, 53.0, 49.0, 52.0, 56.0, 42.0, 41.0, 33.0, 34.0, 36.0, 29.0, 28.0, 15.0, 22.0, 15.0, 14.0, 4.0, 8.0, 9.0, 4.0, 4.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004818439483642578, -0.0004656873643398285, -0.00044953078031539917, -0.00043337419629096985, -0.00041721761226654053, -0.0004010610282421112, -0.0003849044442176819, -0.00036874786019325256, -0.00035259127616882324, -0.0003364346921443939, -0.0003202781081199646, -0.0003041215240955353, -0.00028796494007110596, -0.00027180835604667664, -0.0002556517720222473, -0.000239495187997818, -0.00022333860397338867, -0.00020718201994895935, -0.00019102543592453003, -0.0001748688519001007, -0.0001587122678756714, -0.00014255568385124207, -0.00012639909982681274, -0.00011024251580238342, -9.40859317779541e-05, -7.792934775352478e-05, -6.177276372909546e-05, -4.561617970466614e-05, -2.9459595680236816e-05, -1.3303011655807495e-05, 2.853572368621826e-06, 1.9010156393051147e-05, 3.516674041748047e-05, 5.132332444190979e-05, 6.747990846633911e-05, 8.363649249076843e-05, 9.979307651519775e-05, 0.00011594966053962708, 0.0001321062445640564, 0.00014826282858848572, 0.00016441941261291504, 0.00018057599663734436, 0.00019673258066177368, 0.000212889164686203, 0.00022904574871063232, 0.00024520233273506165, 0.00026135891675949097, 0.0002775155007839203, 0.0002936720848083496, 0.00030982866883277893, 0.00032598525285720825, 0.0003421418368816376, 0.0003582984209060669, 0.0003744550049304962, 0.00039061158895492554, 0.00040676817297935486, 0.0004229247570037842, 0.0004390813410282135, 0.0004552379250526428, 0.00047139450907707214, 0.00048755109310150146, 0.0005037076771259308, 0.0005198642611503601, 0.0005360208451747894, 0.0005521774291992188]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 8.0, 7.0, 14.0, 12.0, 16.0, 16.0, 14.0, 20.0, 30.0, 38.0, 53.0, 74.0, 85.0, 112.0, 143.0, 227.0, 337.0, 592.0, 2178.0, 889139.0, 152841.0, 1047.0, 461.0, 287.0, 187.0, 144.0, 101.0, 83.0, 65.0, 48.0, 32.0, 27.0, 20.0, 26.0, 17.0, 6.0, 14.0, 5.0, 3.0, 7.0, 3.0, 9.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00959014892578125, -0.00927889347076416, -0.00896763801574707, -0.00865638256072998, -0.00834512710571289, -0.0080338716506958, -0.007722616195678711, -0.007411360740661621, -0.007100105285644531, -0.006788849830627441, -0.0064775943756103516, -0.006166338920593262, -0.005855083465576172, -0.005543828010559082, -0.005232572555541992, -0.004921317100524902, -0.0046100616455078125, -0.004298806190490723, -0.003987550735473633, -0.003676295280456543, -0.003365039825439453, -0.0030537843704223633, -0.0027425289154052734, -0.0024312734603881836, -0.0021200180053710938, -0.001808762550354004, -0.001497507095336914, -0.0011862516403198242, -0.0008749961853027344, -0.0005637407302856445, -0.0002524852752685547, 5.8770179748535156e-05, 0.000370025634765625, 0.0006812810897827148, 0.0009925365447998047, 0.0013037919998168945, 0.0016150474548339844, 0.0019263029098510742, 0.002237558364868164, 0.002548813819885254, 0.0028600692749023438, 0.0031713247299194336, 0.0034825801849365234, 0.0037938356399536133, 0.004105091094970703, 0.004416346549987793, 0.004727602005004883, 0.005038857460021973, 0.0053501129150390625, 0.005661368370056152, 0.005972623825073242, 0.006283879280090332, 0.006595134735107422, 0.006906390190124512, 0.0072176456451416016, 0.007528901100158691, 0.007840156555175781, 0.008151412010192871, 0.008462667465209961, 0.00877392292022705, 0.00908517837524414, 0.00939643383026123, 0.00970768928527832, 0.01001894474029541, 0.0103302001953125]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 16.0, 86.0, 374.0, 397.0, 124.0, 19.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009585164953023195, -0.0009150714031420648, -0.0008716263109818101, -0.0008281812770292163, -0.0007847361266613007, -0.0007412910927087069, -0.0006978460005484521, -0.0006544009083881974, -0.0006109558162279427, -0.000567510724067688, -0.0005240656319074333, -0.000480620568851009, -0.0004371754766907543, -0.0003937303845304996, -0.0003502853214740753, -0.0003068402293138206, -0.0002633951371535659, -0.00021995004499331117, -0.00017650496738497168, -0.0001330598897766322, -8.961479761637747e-05, -4.6169705456122756e-05, -2.724642399698496e-06, 4.072044976055622e-05, 8.416554192081094e-05, 0.00012761063408106565, 0.00017105571168940514, 0.00021450078929774463, 0.00025794588145799935, 0.00030139097361825407, 0.0003448360366746783, 0.00038828112883493304, 0.00043172610457986593, 0.00047517119674012065, 0.0005186162889003754, 0.0005620613228529692, 0.0006055064732208848, 0.0006489515071734786, 0.0006923965993337333, 0.000735841691493988, 0.0007792867836542428, 0.0008227318758144975, 0.0008661769679747522, 0.0009096220601350069, 0.0009530670940876007, 0.0009965122444555163, 0.0010399572784081101, 0.0010834024287760258, 0.0011268474627286196, 0.0011702924966812134, 0.001213737647049129, 0.0012571826810017228, 0.0013006278313696384, 0.0013440728653222322, 0.001387517899274826, 0.0014309630496427417, 0.0014744082000106573, 0.0015178532339632511, 0.0015612983843311667, 0.0016047434182837605, 0.0016481885686516762, 0.00169163360260427, 0.0017350786365568638, 0.0017785237869247794, 0.0018219688208773732]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 6.0, 7.0, 6.0, 9.0, 14.0, 9.0, 22.0, 21.0, 26.0, 24.0, 37.0, 42.0, 27.0, 39.0, 41.0, 39.0, 38.0, 48.0, 32.0, 48.0, 34.0, 42.0, 40.0, 32.0, 36.0, 33.0, 28.0, 26.0, 28.0, 26.0, 21.0, 22.0, 14.0, 19.0, 16.0, 8.0, 6.0, 9.0, 5.0, 4.0, 8.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00028693675994873047, -0.00027785543352365494, -0.0002687741070985794, -0.0002596927806735039, -0.00025061145424842834, -0.00024153012782335281, -0.00023244880139827728, -0.00022336747497320175, -0.00021428614854812622, -0.0002052048221230507, -0.00019612349569797516, -0.00018704216927289963, -0.0001779608428478241, -0.00016887951642274857, -0.00015979818999767303, -0.0001507168635725975, -0.00014163553714752197, -0.00013255421072244644, -0.0001234728842973709, -0.00011439155787229538, -0.00010531023144721985, -9.622890502214432e-05, -8.714757859706879e-05, -7.806625217199326e-05, -6.898492574691772e-05, -5.9903599321842194e-05, -5.082227289676666e-05, -4.174094647169113e-05, -3.26596200466156e-05, -2.357829362154007e-05, -1.4496967196464539e-05, -5.4156407713890076e-06, 3.6656856536865234e-06, 1.2747012078762054e-05, 2.1828338503837585e-05, 3.0909664928913116e-05, 3.999099135398865e-05, 4.907231777906418e-05, 5.815364420413971e-05, 6.723497062921524e-05, 7.631629705429077e-05, 8.53976234793663e-05, 9.447894990444183e-05, 0.00010356027632951736, 0.0001126416027545929, 0.00012172292917966843, 0.00013080425560474396, 0.0001398855820298195, 0.00014896690845489502, 0.00015804823487997055, 0.00016712956130504608, 0.0001762108877301216, 0.00018529221415519714, 0.00019437354058027267, 0.0002034548670053482, 0.00021253619343042374, 0.00022161751985549927, 0.0002306988462805748, 0.00023978017270565033, 0.00024886149913072586, 0.0002579428255558014, 0.0002670241519808769, 0.00027610547840595245, 0.000285186804831028, 0.0002942681312561035]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 7.0, 1.0, 6.0, 5.0, 5.0, 3.0, 7.0, 10.0, 11.0, 18.0, 14.0, 25.0, 23.0, 32.0, 33.0, 26.0, 26.0, 30.0, 34.0, 40.0, 50.0, 44.0, 33.0, 47.0, 42.0, 39.0, 40.0, 45.0, 45.0, 43.0, 23.0, 23.0, 34.0, 22.0, 27.0, 21.0, 18.0, 18.0, 3.0, 10.0, 7.0, 6.0, 4.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1015625, -3.977935791015625, -3.85430908203125, -3.730682373046875, -3.6070556640625, -3.483428955078125, -3.35980224609375, -3.236175537109375, -3.112548828125, -2.988922119140625, -2.86529541015625, -2.741668701171875, -2.6180419921875, -2.494415283203125, -2.37078857421875, -2.247161865234375, -2.12353515625, -1.999908447265625, -1.87628173828125, -1.752655029296875, -1.6290283203125, -1.505401611328125, -1.38177490234375, -1.258148193359375, -1.134521484375, -1.010894775390625, -0.88726806640625, -0.763641357421875, -0.6400146484375, -0.516387939453125, -0.39276123046875, -0.269134521484375, -0.1455078125, -0.021881103515625, 0.10174560546875, 0.225372314453125, 0.3489990234375, 0.472625732421875, 0.59625244140625, 0.719879150390625, 0.843505859375, 0.967132568359375, 1.09075927734375, 1.214385986328125, 1.3380126953125, 1.461639404296875, 1.58526611328125, 1.708892822265625, 1.83251953125, 1.956146240234375, 2.07977294921875, 2.203399658203125, 2.3270263671875, 2.450653076171875, 2.57427978515625, 2.697906494140625, 2.821533203125, 2.945159912109375, 3.06878662109375, 3.192413330078125, 3.3160400390625, 3.439666748046875, 3.56329345703125, 3.686920166015625, 3.810546875]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 6.0, 5.0, 5.0, 17.0, 18.0, 26.0, 36.0, 40.0, 48.0, 77.0, 119.0, 159.0, 221.0, 284.0, 465.0, 658.0, 1132.0, 2067.0, 3767.0, 7651.0, 17661.0, 51968.0, 201991.0, 517528.0, 167059.0, 44173.0, 15778.0, 6998.0, 3573.0, 1920.0, 1051.0, 625.0, 404.0, 305.0, 229.0, 128.0, 82.0, 78.0, 50.0, 40.0, 36.0, 26.0, 19.0, 10.0, 6.0, 5.0, 6.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-3.25390625, -3.156585693359375, -3.05926513671875, -2.961944580078125, -2.8646240234375, -2.767303466796875, -2.66998291015625, -2.572662353515625, -2.475341796875, -2.378021240234375, -2.28070068359375, -2.183380126953125, -2.0860595703125, -1.988739013671875, -1.89141845703125, -1.794097900390625, -1.69677734375, -1.599456787109375, -1.50213623046875, -1.404815673828125, -1.3074951171875, -1.210174560546875, -1.11285400390625, -1.015533447265625, -0.918212890625, -0.820892333984375, -0.72357177734375, -0.626251220703125, -0.5289306640625, -0.431610107421875, -0.33428955078125, -0.236968994140625, -0.1396484375, -0.042327880859375, 0.05499267578125, 0.152313232421875, 0.2496337890625, 0.346954345703125, 0.44427490234375, 0.541595458984375, 0.638916015625, 0.736236572265625, 0.83355712890625, 0.930877685546875, 1.0281982421875, 1.125518798828125, 1.22283935546875, 1.320159912109375, 1.41748046875, 1.514801025390625, 1.61212158203125, 1.709442138671875, 1.8067626953125, 1.904083251953125, 2.00140380859375, 2.098724365234375, 2.196044921875, 2.293365478515625, 2.39068603515625, 2.488006591796875, 2.5853271484375, 2.682647705078125, 2.77996826171875, 2.877288818359375, 2.974609375]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 1.0, 3.0, 0.0, 5.0, 3.0, 3.0, 5.0, 7.0, 7.0, 9.0, 8.0, 14.0, 8.0, 10.0, 13.0, 18.0, 17.0, 32.0, 24.0, 32.0, 42.0, 23.0, 36.0, 38.0, 36.0, 70.0, 139.0, 1820.0, 125.0, 55.0, 52.0, 43.0, 40.0, 32.0, 39.0, 35.0, 32.0, 23.0, 27.0, 16.0, 27.0, 15.0, 15.0, 11.0, 6.0, 13.0, 5.0, 7.0, 3.0, 7.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-11.421875, -11.047607421875, -10.67333984375, -10.299072265625, -9.9248046875, -9.550537109375, -9.17626953125, -8.802001953125, -8.427734375, -8.053466796875, -7.67919921875, -7.304931640625, -6.9306640625, -6.556396484375, -6.18212890625, -5.807861328125, -5.43359375, -5.059326171875, -4.68505859375, -4.310791015625, -3.9365234375, -3.562255859375, -3.18798828125, -2.813720703125, -2.439453125, -2.065185546875, -1.69091796875, -1.316650390625, -0.9423828125, -0.568115234375, -0.19384765625, 0.180419921875, 0.5546875, 0.928955078125, 1.30322265625, 1.677490234375, 2.0517578125, 2.426025390625, 2.80029296875, 3.174560546875, 3.548828125, 3.923095703125, 4.29736328125, 4.671630859375, 5.0458984375, 5.420166015625, 5.79443359375, 6.168701171875, 6.54296875, 6.917236328125, 7.29150390625, 7.665771484375, 8.0400390625, 8.414306640625, 8.78857421875, 9.162841796875, 9.537109375, 9.911376953125, 10.28564453125, 10.659912109375, 11.0341796875, 11.408447265625, 11.78271484375, 12.156982421875, 12.53125]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 1.0, 5.0, 6.0, 8.0, 5.0, 11.0, 8.0, 12.0, 12.0, 18.0, 24.0, 11.0, 30.0, 30.0, 44.0, 49.0, 77.0, 110.0, 162.0, 205.0, 360.0, 862.0, 5243.0, 629185.0, 2499526.0, 7533.0, 1014.0, 384.0, 218.0, 116.0, 100.0, 87.0, 45.0, 36.0, 34.0, 23.0, 19.0, 15.0, 10.0, 8.0, 15.0, 8.0, 10.0, 3.0, 7.0, 8.0, 3.0, 2.0, 1.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0], "bins": [-20.0, -19.39501953125, -18.7900390625, -18.18505859375, -17.580078125, -16.97509765625, -16.3701171875, -15.76513671875, -15.16015625, -14.55517578125, -13.9501953125, -13.34521484375, -12.740234375, -12.13525390625, -11.5302734375, -10.92529296875, -10.3203125, -9.71533203125, -9.1103515625, -8.50537109375, -7.900390625, -7.29541015625, -6.6904296875, -6.08544921875, -5.48046875, -4.87548828125, -4.2705078125, -3.66552734375, -3.060546875, -2.45556640625, -1.8505859375, -1.24560546875, -0.640625, -0.03564453125, 0.5693359375, 1.17431640625, 1.779296875, 2.38427734375, 2.9892578125, 3.59423828125, 4.19921875, 4.80419921875, 5.4091796875, 6.01416015625, 6.619140625, 7.22412109375, 7.8291015625, 8.43408203125, 9.0390625, 9.64404296875, 10.2490234375, 10.85400390625, 11.458984375, 12.06396484375, 12.6689453125, 13.27392578125, 13.87890625, 14.48388671875, 15.0888671875, 15.69384765625, 16.298828125, 16.90380859375, 17.5087890625, 18.11376953125, 18.71875]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [6.0, 30.0, 191.0, 416.0, 292.0, 68.0, 13.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.445855617523193, -3.247065544128418, -2.0482752323150635, -0.849484920501709, 0.3493051528930664, 1.5480952262878418, 2.7468857765197754, 3.9456753730773926, 5.144465923309326, 6.343255996704102, 7.542046546936035, 8.740837097167969, 9.939626693725586, 11.138416290283203, 12.337207794189453, 13.53599739074707, 14.734786987304688, 15.933577537536621, 17.132368087768555, 18.331157684326172, 19.52994728088379, 20.728736877441406, 21.927528381347656, 23.126317977905273, 24.325109481811523, 25.52389907836914, 26.72269058227539, 27.921480178833008, 29.120269775390625, 30.319061279296875, 31.517850875854492, 32.71664047241211, 33.91543197631836, 35.11422348022461, 36.313011169433594, 37.511802673339844, 38.710594177246094, 39.90938186645508, 41.10817337036133, 42.30696105957031, 43.50575256347656, 44.70454406738281, 45.9033317565918, 47.10212326049805, 48.3009147644043, 49.49970245361328, 50.69849395751953, 51.89728546142578, 53.09607696533203, 54.29486846923828, 55.493656158447266, 56.692447662353516, 57.891239166259766, 59.09002685546875, 60.288818359375, 61.48760986328125, 62.686397552490234, 63.885189056396484, 65.08397674560547, 66.28276824951172, 67.48155975341797, 68.68035125732422, 69.87913513183594, 71.07792663574219, 72.27671813964844]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 7.0, 8.0, 3.0, 3.0, 7.0, 8.0, 15.0, 13.0, 20.0, 23.0, 24.0, 21.0, 28.0, 26.0, 36.0, 34.0, 37.0, 38.0, 25.0, 51.0, 40.0, 34.0, 21.0, 51.0, 35.0, 43.0, 46.0, 39.0, 48.0, 33.0, 30.0, 21.0, 26.0, 14.0, 12.0, 15.0, 18.0, 6.0, 10.0, 14.0, 4.0, 5.0, 4.0, 5.0, 0.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.279701232910156, -37.03469467163086, -35.78969192504883, -34.54468536376953, -33.299678802490234, -32.05467224121094, -30.809669494628906, -29.56466293334961, -28.319658279418945, -27.07465362548828, -25.829647064208984, -24.58464241027832, -23.339637756347656, -22.09463119506836, -20.849626541137695, -19.60462188720703, -18.359615325927734, -17.11461067199707, -15.869604110717773, -14.62459945678711, -13.379593849182129, -12.134588241577148, -10.889583587646484, -9.644577980041504, -8.399572372436523, -7.154566764831543, -5.909561634063721, -4.664556503295898, -3.419550895690918, -2.1745452880859375, -0.9295401573181152, 0.31546497344970703, 1.5604705810546875, 2.805475950241089, 4.05048131942749, 5.2954864501953125, 6.540492057800293, 7.785497665405273, 9.030502319335938, 10.275507926940918, 11.520513534545898, 12.765519142150879, 14.01052474975586, 15.255529403686523, 16.500534057617188, 17.745540618896484, 18.99054527282715, 20.235549926757812, 21.48055648803711, 22.725561141967773, 23.97056770324707, 25.215572357177734, 26.46057891845703, 27.705583572387695, 28.95058822631836, 30.195594787597656, 31.44059944152832, 32.685604095458984, 33.93061065673828, 35.17561721801758, 36.42061996459961, 37.665626525878906, 38.9106330871582, 40.155635833740234, 41.40064239501953]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 4.0, 6.0, 4.0, 5.0, 4.0, 9.0, 9.0, 13.0, 18.0, 25.0, 21.0, 30.0, 30.0, 31.0, 26.0, 20.0, 36.0, 48.0, 50.0, 36.0, 45.0, 46.0, 45.0, 32.0, 52.0, 38.0, 40.0, 44.0, 26.0, 29.0, 32.0, 29.0, 23.0, 23.0, 18.0, 12.0, 12.0, 8.0, 4.0, 7.0, 4.0, 2.0, 5.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.26953125, -4.141815185546875, -4.01409912109375, -3.886383056640625, -3.7586669921875, -3.630950927734375, -3.50323486328125, -3.375518798828125, -3.247802734375, -3.120086669921875, -2.99237060546875, -2.864654541015625, -2.7369384765625, -2.609222412109375, -2.48150634765625, -2.353790283203125, -2.22607421875, -2.098358154296875, -1.97064208984375, -1.842926025390625, -1.7152099609375, -1.587493896484375, -1.45977783203125, -1.332061767578125, -1.204345703125, -1.076629638671875, -0.94891357421875, -0.821197509765625, -0.6934814453125, -0.565765380859375, -0.43804931640625, -0.310333251953125, -0.1826171875, -0.054901123046875, 0.07281494140625, 0.200531005859375, 0.3282470703125, 0.455963134765625, 0.58367919921875, 0.711395263671875, 0.839111328125, 0.966827392578125, 1.09454345703125, 1.222259521484375, 1.3499755859375, 1.477691650390625, 1.60540771484375, 1.733123779296875, 1.86083984375, 1.988555908203125, 2.11627197265625, 2.243988037109375, 2.3717041015625, 2.499420166015625, 2.62713623046875, 2.754852294921875, 2.882568359375, 3.010284423828125, 3.13800048828125, 3.265716552734375, 3.3934326171875, 3.521148681640625, 3.64886474609375, 3.776580810546875, 3.904296875]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 5.0, 4.0, 6.0, 10.0, 7.0, 10.0, 15.0, 15.0, 19.0, 27.0, 43.0, 53.0, 79.0, 136.0, 272.0, 533.0, 1413.0, 4567.0, 16822.0, 79618.0, 641392.0, 2390473.0, 913123.0, 115399.0, 21520.0, 5560.0, 1751.0, 598.0, 308.0, 165.0, 93.0, 54.0, 38.0, 26.0, 30.0, 18.0, 21.0, 16.0, 11.0, 10.0, 4.0, 3.0, 6.0, 2.0, 0.0, 1.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.7578125, -8.4970703125, -8.236328125, -7.9755859375, -7.71484375, -7.4541015625, -7.193359375, -6.9326171875, -6.671875, -6.4111328125, -6.150390625, -5.8896484375, -5.62890625, -5.3681640625, -5.107421875, -4.8466796875, -4.5859375, -4.3251953125, -4.064453125, -3.8037109375, -3.54296875, -3.2822265625, -3.021484375, -2.7607421875, -2.5, -2.2392578125, -1.978515625, -1.7177734375, -1.45703125, -1.1962890625, -0.935546875, -0.6748046875, -0.4140625, -0.1533203125, 0.107421875, 0.3681640625, 0.62890625, 0.8896484375, 1.150390625, 1.4111328125, 1.671875, 1.9326171875, 2.193359375, 2.4541015625, 2.71484375, 2.9755859375, 3.236328125, 3.4970703125, 3.7578125, 4.0185546875, 4.279296875, 4.5400390625, 4.80078125, 5.0615234375, 5.322265625, 5.5830078125, 5.84375, 6.1044921875, 6.365234375, 6.6259765625, 6.88671875, 7.1474609375, 7.408203125, 7.6689453125, 7.9296875]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 5.0, 5.0, 7.0, 8.0, 20.0, 41.0, 66.0, 104.0, 141.0, 226.0, 329.0, 522.0, 696.0, 635.0, 432.0, 316.0, 187.0, 130.0, 76.0, 40.0, 27.0, 23.0, 13.0, 7.0, 4.0, 8.0, 6.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.140625, -20.634033203125, -20.12744140625, -19.620849609375, -19.1142578125, -18.607666015625, -18.10107421875, -17.594482421875, -17.087890625, -16.581298828125, -16.07470703125, -15.568115234375, -15.0615234375, -14.554931640625, -14.04833984375, -13.541748046875, -13.03515625, -12.528564453125, -12.02197265625, -11.515380859375, -11.0087890625, -10.502197265625, -9.99560546875, -9.489013671875, -8.982421875, -8.475830078125, -7.96923828125, -7.462646484375, -6.9560546875, -6.449462890625, -5.94287109375, -5.436279296875, -4.9296875, -4.423095703125, -3.91650390625, -3.409912109375, -2.9033203125, -2.396728515625, -1.89013671875, -1.383544921875, -0.876953125, -0.370361328125, 0.13623046875, 0.642822265625, 1.1494140625, 1.656005859375, 2.16259765625, 2.669189453125, 3.17578125, 3.682373046875, 4.18896484375, 4.695556640625, 5.2021484375, 5.708740234375, 6.21533203125, 6.721923828125, 7.228515625, 7.735107421875, 8.24169921875, 8.748291015625, 9.2548828125, 9.761474609375, 10.26806640625, 10.774658203125, 11.28125]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 5.0, 2.0, 2.0, 5.0, 11.0, 12.0, 9.0, 21.0, 29.0, 40.0, 44.0, 103.0, 165.0, 294.0, 805.0, 5023.0, 1167677.0, 3011089.0, 7398.0, 831.0, 282.0, 142.0, 93.0, 66.0, 37.0, 21.0, 23.0, 23.0, 9.0, 10.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.5625, -32.921875, -31.28125, -29.640625, -28.0, -26.359375, -24.71875, -23.078125, -21.4375, -19.796875, -18.15625, -16.515625, -14.875, -13.234375, -11.59375, -9.953125, -8.3125, -6.671875, -5.03125, -3.390625, -1.75, -0.109375, 1.53125, 3.171875, 4.8125, 6.453125, 8.09375, 9.734375, 11.375, 13.015625, 14.65625, 16.296875, 17.9375, 19.578125, 21.21875, 22.859375, 24.5, 26.140625, 27.78125, 29.421875, 31.0625, 32.703125, 34.34375, 35.984375, 37.625, 39.265625, 40.90625, 42.546875, 44.1875, 45.828125, 47.46875, 49.109375, 50.75, 52.390625, 54.03125, 55.671875, 57.3125, 58.953125, 60.59375, 62.234375, 63.875, 65.515625, 67.15625, 68.796875, 70.4375]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 84.0, 511.0, 382.0, 37.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-376.8096618652344, -369.2497863769531, -361.6899108886719, -354.1300354003906, -346.5701599121094, -339.0102844238281, -331.4504089355469, -323.89056396484375, -316.3306884765625, -308.77081298828125, -301.2109375, -293.65106201171875, -286.0911865234375, -278.53131103515625, -270.971435546875, -263.41156005859375, -255.8516845703125, -248.29180908203125, -240.73193359375, -233.17205810546875, -225.6121826171875, -218.05230712890625, -210.49244689941406, -202.9325714111328, -195.37269592285156, -187.8128204345703, -180.25294494628906, -172.6930694580078, -165.13320922851562, -157.57333374023438, -150.01345825195312, -142.45358276367188, -134.89370727539062, -127.33383178710938, -119.77395629882812, -112.2140884399414, -104.65421295166016, -97.0943374633789, -89.53446960449219, -81.97459411621094, -74.41471099853516, -66.8548355102539, -59.29496383666992, -51.73509216308594, -44.17521667480469, -36.61534118652344, -29.055469512939453, -21.49559783935547, -13.935722351074219, -6.375848770141602, 1.1840248107910156, 8.743898391723633, 16.30377197265625, 23.8636474609375, 31.423519134521484, 38.98339080810547, 46.54326629638672, 54.10314178466797, 61.66301345825195, 69.22288513183594, 76.78276062011719, 84.34263610839844, 91.90251159667969, 99.4623794555664, 107.02225494384766]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 5.0, 2.0, 5.0, 8.0, 4.0, 9.0, 10.0, 14.0, 12.0, 20.0, 14.0, 22.0, 23.0, 23.0, 29.0, 24.0, 33.0, 30.0, 27.0, 29.0, 31.0, 34.0, 26.0, 43.0, 34.0, 37.0, 39.0, 46.0, 35.0, 32.0, 21.0, 33.0, 26.0, 32.0, 20.0, 24.0, 22.0, 18.0, 27.0, 14.0, 12.0, 14.0, 8.0, 10.0, 8.0, 4.0, 5.0, 2.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.246925354003906, -30.21388053894043, -29.180835723876953, -28.14779281616211, -27.114748001098633, -26.081703186035156, -25.04865837097168, -24.015613555908203, -22.98257064819336, -21.949525833129883, -20.916481018066406, -19.883438110351562, -18.850393295288086, -17.81734848022461, -16.784303665161133, -15.751258850097656, -14.71821403503418, -13.685169219970703, -12.652125358581543, -11.619080543518066, -10.586036682128906, -9.55299186706543, -8.519947052001953, -7.486902713775635, -6.453858375549316, -5.420814037322998, -4.38776969909668, -3.354724884033203, -2.3216805458068848, -1.2886362075805664, -0.25559139251708984, 0.7774529457092285, 1.8104972839355469, 2.8435416221618652, 3.8765861988067627, 4.90963077545166, 5.9426751136779785, 6.975719451904297, 8.008764266967773, 9.04180908203125, 10.07485294342041, 11.107897758483887, 12.140941619873047, 13.173986434936523, 14.20703125, 15.24007511138916, 16.273120880126953, 17.306163787841797, 18.339208602905273, 19.37225341796875, 20.405298233032227, 21.438343048095703, 22.471385955810547, 23.504430770874023, 24.5374755859375, 25.570520401000977, 26.603565216064453, 27.63661003112793, 28.669654846191406, 29.70269775390625, 30.735742568969727, 31.768787384033203, 32.80183410644531, 33.834877014160156, 34.867919921875]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 2.0, 4.0, 7.0, 7.0, 8.0, 13.0, 11.0, 18.0, 15.0, 16.0, 21.0, 18.0, 26.0, 29.0, 29.0, 38.0, 46.0, 31.0, 34.0, 42.0, 30.0, 45.0, 46.0, 46.0, 26.0, 42.0, 34.0, 31.0, 41.0, 32.0, 28.0, 25.0, 25.0, 22.0, 25.0, 20.0, 12.0, 11.0, 4.0, 8.0, 11.0, 4.0, 5.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.94921875, -3.828948974609375, -3.70867919921875, -3.588409423828125, -3.4681396484375, -3.347869873046875, -3.22760009765625, -3.107330322265625, -2.987060546875, -2.866790771484375, -2.74652099609375, -2.626251220703125, -2.5059814453125, -2.385711669921875, -2.26544189453125, -2.145172119140625, -2.02490234375, -1.904632568359375, -1.78436279296875, -1.664093017578125, -1.5438232421875, -1.423553466796875, -1.30328369140625, -1.183013916015625, -1.062744140625, -0.942474365234375, -0.82220458984375, -0.701934814453125, -0.5816650390625, -0.461395263671875, -0.34112548828125, -0.220855712890625, -0.1005859375, 0.019683837890625, 0.13995361328125, 0.260223388671875, 0.3804931640625, 0.500762939453125, 0.62103271484375, 0.741302490234375, 0.861572265625, 0.981842041015625, 1.10211181640625, 1.222381591796875, 1.3426513671875, 1.462921142578125, 1.58319091796875, 1.703460693359375, 1.82373046875, 1.944000244140625, 2.06427001953125, 2.184539794921875, 2.3048095703125, 2.425079345703125, 2.54534912109375, 2.665618896484375, 2.785888671875, 2.906158447265625, 3.02642822265625, 3.146697998046875, 3.2669677734375, 3.387237548828125, 3.50750732421875, 3.627777099609375, 3.748046875]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 7.0, 8.0, 12.0, 11.0, 25.0, 27.0, 47.0, 62.0, 100.0, 144.0, 261.0, 337.0, 521.0, 793.0, 1328.0, 2144.0, 3362.0, 5722.0, 9853.0, 17710.0, 32354.0, 62722.0, 125658.0, 234050.0, 253066.0, 143436.0, 70715.0, 36801.0, 19857.0, 11090.0, 6323.0, 3725.0, 2261.0, 1426.0, 899.0, 593.0, 376.0, 249.0, 154.0, 109.0, 58.0, 55.0, 37.0, 29.0, 11.0, 10.0, 8.0, 5.0, 4.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.496337890625, -0.48087310791015625, -0.4654083251953125, -0.44994354248046875, -0.434478759765625, -0.41901397705078125, -0.4035491943359375, -0.38808441162109375, -0.37261962890625, -0.35715484619140625, -0.3416900634765625, -0.32622528076171875, -0.310760498046875, -0.29529571533203125, -0.2798309326171875, -0.26436614990234375, -0.2489013671875, -0.23343658447265625, -0.2179718017578125, -0.20250701904296875, -0.187042236328125, -0.17157745361328125, -0.1561126708984375, -0.14064788818359375, -0.12518310546875, -0.10971832275390625, -0.0942535400390625, -0.07878875732421875, -0.063323974609375, -0.04785919189453125, -0.0323944091796875, -0.01692962646484375, -0.00146484375, 0.01399993896484375, 0.0294647216796875, 0.04492950439453125, 0.060394287109375, 0.07585906982421875, 0.0913238525390625, 0.10678863525390625, 0.12225341796875, 0.13771820068359375, 0.1531829833984375, 0.16864776611328125, 0.184112548828125, 0.19957733154296875, 0.2150421142578125, 0.23050689697265625, 0.2459716796875, 0.26143646240234375, 0.2769012451171875, 0.29236602783203125, 0.307830810546875, 0.32329559326171875, 0.3387603759765625, 0.35422515869140625, 0.36968994140625, 0.38515472412109375, 0.4006195068359375, 0.41608428955078125, 0.431549072265625, 0.44701385498046875, 0.4624786376953125, 0.47794342041015625, 0.493408203125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 7.0, 4.0, 1.0, 2.0, 9.0, 7.0, 14.0, 10.0, 10.0, 13.0, 13.0, 16.0, 15.0, 26.0, 26.0, 22.0, 28.0, 31.0, 27.0, 35.0, 31.0, 44.0, 27.0, 30.0, 29.0, 1052.0, 32.0, 26.0, 34.0, 32.0, 29.0, 32.0, 36.0, 28.0, 29.0, 25.0, 26.0, 23.0, 19.0, 20.0, 14.0, 16.0, 15.0, 13.0, 7.0, 8.0, 7.0, 3.0, 7.0, 5.0, 1.0, 5.0, 4.0, 3.0, 1.0, 3.0], "bins": [-2.158203125, -2.093597412109375, -2.02899169921875, -1.964385986328125, -1.8997802734375, -1.835174560546875, -1.77056884765625, -1.705963134765625, -1.641357421875, -1.576751708984375, -1.51214599609375, -1.447540283203125, -1.3829345703125, -1.318328857421875, -1.25372314453125, -1.189117431640625, -1.12451171875, -1.059906005859375, -0.99530029296875, -0.930694580078125, -0.8660888671875, -0.801483154296875, -0.73687744140625, -0.672271728515625, -0.607666015625, -0.543060302734375, -0.47845458984375, -0.413848876953125, -0.3492431640625, -0.284637451171875, -0.22003173828125, -0.155426025390625, -0.0908203125, -0.026214599609375, 0.03839111328125, 0.102996826171875, 0.1676025390625, 0.232208251953125, 0.29681396484375, 0.361419677734375, 0.426025390625, 0.490631103515625, 0.55523681640625, 0.619842529296875, 0.6844482421875, 0.749053955078125, 0.81365966796875, 0.878265380859375, 0.94287109375, 1.007476806640625, 1.07208251953125, 1.136688232421875, 1.2012939453125, 1.265899658203125, 1.33050537109375, 1.395111083984375, 1.459716796875, 1.524322509765625, 1.58892822265625, 1.653533935546875, 1.7181396484375, 1.782745361328125, 1.84735107421875, 1.911956787109375, 1.9765625]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 6.0, 4.0, 5.0, 13.0, 15.0, 20.0, 34.0, 51.0, 73.0, 130.0, 185.0, 248.0, 447.0, 673.0, 1113.0, 1692.0, 2698.0, 4180.0, 6731.0, 11148.0, 18659.0, 31882.0, 54903.0, 95719.0, 159837.0, 1262561.0, 178885.0, 109956.0, 63647.0, 36718.0, 21271.0, 12726.0, 7754.0, 4836.0, 3080.0, 1874.0, 1243.0, 756.0, 451.0, 325.0, 198.0, 137.0, 95.0, 53.0, 34.0, 26.0, 16.0, 9.0, 13.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.341796875, -0.33026123046875, -0.3187255859375, -0.30718994140625, -0.295654296875, -0.28411865234375, -0.2725830078125, -0.26104736328125, -0.24951171875, -0.23797607421875, -0.2264404296875, -0.21490478515625, -0.203369140625, -0.19183349609375, -0.1802978515625, -0.16876220703125, -0.1572265625, -0.14569091796875, -0.1341552734375, -0.12261962890625, -0.111083984375, -0.09954833984375, -0.0880126953125, -0.07647705078125, -0.06494140625, -0.05340576171875, -0.0418701171875, -0.03033447265625, -0.018798828125, -0.00726318359375, 0.0042724609375, 0.01580810546875, 0.02734375, 0.03887939453125, 0.0504150390625, 0.06195068359375, 0.073486328125, 0.08502197265625, 0.0965576171875, 0.10809326171875, 0.11962890625, 0.13116455078125, 0.1427001953125, 0.15423583984375, 0.165771484375, 0.17730712890625, 0.1888427734375, 0.20037841796875, 0.2119140625, 0.22344970703125, 0.2349853515625, 0.24652099609375, 0.258056640625, 0.26959228515625, 0.2811279296875, 0.29266357421875, 0.30419921875, 0.31573486328125, 0.3272705078125, 0.33880615234375, 0.350341796875, 0.36187744140625, 0.3734130859375, 0.38494873046875, 0.396484375]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 5.0, 4.0, 5.0, 3.0, 2.0, 11.0, 8.0, 15.0, 15.0, 22.0, 11.0, 10.0, 34.0, 16.0, 30.0, 36.0, 25.0, 28.0, 47.0, 41.0, 48.0, 51.0, 42.0, 54.0, 38.0, 36.0, 32.0, 47.0, 31.0, 41.0, 25.0, 18.0, 27.0, 29.0, 19.0, 15.0, 17.0, 15.0, 8.0, 7.0, 9.0, 7.0, 8.0, 3.0, 2.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004105567932128906, -0.00039696693420410156, -0.0003833770751953125, -0.00036978721618652344, -0.0003561973571777344, -0.0003426074981689453, -0.00032901763916015625, -0.0003154277801513672, -0.0003018379211425781, -0.00028824806213378906, -0.000274658203125, -0.00026106834411621094, -0.0002474784851074219, -0.0002338886260986328, -0.00022029876708984375, -0.0002067089080810547, -0.00019311904907226562, -0.00017952919006347656, -0.0001659393310546875, -0.00015234947204589844, -0.00013875961303710938, -0.0001251697540283203, -0.00011157989501953125, -9.799003601074219e-05, -8.440017700195312e-05, -7.081031799316406e-05, -5.7220458984375e-05, -4.363059997558594e-05, -3.0040740966796875e-05, -1.6450881958007812e-05, -2.86102294921875e-06, 1.0728836059570312e-05, 2.4318695068359375e-05, 3.790855407714844e-05, 5.14984130859375e-05, 6.508827209472656e-05, 7.867813110351562e-05, 9.226799011230469e-05, 0.00010585784912109375, 0.00011944770812988281, 0.00013303756713867188, 0.00014662742614746094, 0.00016021728515625, 0.00017380714416503906, 0.00018739700317382812, 0.0002009868621826172, 0.00021457672119140625, 0.0002281665802001953, 0.00024175643920898438, 0.00025534629821777344, 0.0002689361572265625, 0.00028252601623535156, 0.0002961158752441406, 0.0003097057342529297, 0.00032329559326171875, 0.0003368854522705078, 0.0003504753112792969, 0.00036406517028808594, 0.000377655029296875, 0.00039124488830566406, 0.0004048347473144531, 0.0004184246063232422, 0.00043201446533203125, 0.0004456043243408203, 0.0004591941833496094]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 6.0, 11.0, 16.0, 8.0, 18.0, 20.0, 26.0, 34.0, 44.0, 57.0, 70.0, 104.0, 161.0, 224.0, 326.0, 683.0, 3342.0, 981674.0, 59425.0, 909.0, 464.0, 266.0, 167.0, 120.0, 90.0, 64.0, 38.0, 53.0, 28.0, 24.0, 11.0, 11.0, 13.0, 12.0, 6.0, 7.0, 10.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0106353759765625, -0.01029980182647705, -0.009964227676391602, -0.009628653526306152, -0.009293079376220703, -0.008957505226135254, -0.008621931076049805, -0.008286356925964355, -0.007950782775878906, -0.007615208625793457, -0.007279634475708008, -0.006944060325622559, -0.006608486175537109, -0.00627291202545166, -0.005937337875366211, -0.005601763725280762, -0.0052661895751953125, -0.004930615425109863, -0.004595041275024414, -0.004259467124938965, -0.003923892974853516, -0.0035883188247680664, -0.003252744674682617, -0.002917170524597168, -0.0025815963745117188, -0.0022460222244262695, -0.0019104480743408203, -0.001574873924255371, -0.0012392997741699219, -0.0009037256240844727, -0.0005681514739990234, -0.00023257732391357422, 0.000102996826171875, 0.0004385709762573242, 0.0007741451263427734, 0.0011097192764282227, 0.0014452934265136719, 0.001780867576599121, 0.0021164417266845703, 0.0024520158767700195, 0.0027875900268554688, 0.003123164176940918, 0.003458738327026367, 0.0037943124771118164, 0.004129886627197266, 0.004465460777282715, 0.004801034927368164, 0.005136609077453613, 0.0054721832275390625, 0.005807757377624512, 0.006143331527709961, 0.00647890567779541, 0.006814479827880859, 0.007150053977966309, 0.007485628128051758, 0.007821202278137207, 0.008156776428222656, 0.008492350578308105, 0.008827924728393555, 0.009163498878479004, 0.009499073028564453, 0.009834647178649902, 0.010170221328735352, 0.0105057954788208, 0.01084136962890625]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 152.0, 652.0, 197.0, 13.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0024344755802303553, -0.0023640389554202557, -0.002293602330610156, -0.0022231657058000565, -0.0021527293138206005, -0.002082292689010501, -0.0020118560642004013, -0.0019414194393903017, -0.001870982814580202, -0.0018005461897701025, -0.001730109564960003, -0.0016596730565652251, -0.0015892364317551255, -0.001518799806945026, -0.0014483632985502481, -0.0013779266737401485, -0.001307490048930049, -0.0012370534241199493, -0.0011666167993098497, -0.001096180290915072, -0.0010257436661049724, -0.0009553070412948728, -0.0008848704746924341, -0.0008144339080899954, -0.0007439972832798958, -0.0006735606584697962, -0.0006031240918673575, -0.0005326875252649188, -0.0004622509004548192, -0.00039181430474855006, -0.0003213777090422809, -0.0002509411424398422, -0.00018050428479909897, -0.00011006768909282982, -3.963109338656068e-05, 3.0805502319708467e-05, 0.00010124209802597761, 0.00017167869373224676, 0.0002421152894385159, 0.0003125518560409546, 0.0003829884808510542, 0.00045342507655732334, 0.0005238616722635925, 0.0005942982388660312, 0.0006647348636761308, 0.0007351714884862304, 0.0008056080550886691, 0.0008760446216911077, 0.0009464812465012074, 0.001016917871311307, 0.0010873544961214066, 0.0011577910045161843, 0.001228227629326284, 0.0012986642541363835, 0.0013691007625311613, 0.001439537387341261, 0.0015099740121513605, 0.0015804106369614601, 0.0016508472617715597, 0.0017212837701663375, 0.001791720394976437, 0.0018621570197865367, 0.0019325935281813145, 0.002003030152991414, 0.0020734667778015137]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 8.0, 2.0, 3.0, 7.0, 6.0, 14.0, 8.0, 6.0, 18.0, 11.0, 21.0, 18.0, 38.0, 22.0, 23.0, 26.0, 33.0, 28.0, 33.0, 41.0, 40.0, 36.0, 38.0, 37.0, 51.0, 41.0, 41.0, 36.0, 33.0, 28.0, 31.0, 29.0, 33.0, 23.0, 25.0, 21.0, 17.0, 19.0, 9.0, 10.0, 11.0, 10.0, 10.0, 3.0, 5.0, 6.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0002688169479370117, -0.00026031024754047394, -0.00025180354714393616, -0.00024329684674739838, -0.0002347901463508606, -0.00022628344595432281, -0.00021777674555778503, -0.00020927004516124725, -0.00020076334476470947, -0.0001922566443681717, -0.0001837499439716339, -0.00017524324357509613, -0.00016673654317855835, -0.00015822984278202057, -0.0001497231423854828, -0.000141216441988945, -0.00013270974159240723, -0.00012420304119586945, -0.00011569634079933167, -0.00010718964040279388, -9.86829400062561e-05, -9.017623960971832e-05, -8.166953921318054e-05, -7.316283881664276e-05, -6.465613842010498e-05, -5.61494380235672e-05, -4.764273762702942e-05, -3.913603723049164e-05, -3.062933683395386e-05, -2.2122636437416077e-05, -1.3615936040878296e-05, -5.109235644340515e-06, 3.3974647521972656e-06, 1.1904165148735046e-05, 2.0410865545272827e-05, 2.8917565941810608e-05, 3.742426633834839e-05, 4.593096673488617e-05, 5.443766713142395e-05, 6.294436752796173e-05, 7.145106792449951e-05, 7.995776832103729e-05, 8.846446871757507e-05, 9.697116911411285e-05, 0.00010547786951065063, 0.00011398456990718842, 0.0001224912703037262, 0.00013099797070026398, 0.00013950467109680176, 0.00014801137149333954, 0.00015651807188987732, 0.0001650247722864151, 0.00017353147268295288, 0.00018203817307949066, 0.00019054487347602844, 0.00019905157387256622, 0.000207558274269104, 0.00021606497466564178, 0.00022457167506217957, 0.00023307837545871735, 0.00024158507585525513, 0.0002500917762517929, 0.0002585984766483307, 0.00026710517704486847, 0.00027561187744140625]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 2.0, 4.0, 7.0, 7.0, 8.0, 13.0, 11.0, 18.0, 15.0, 16.0, 21.0, 18.0, 26.0, 29.0, 29.0, 38.0, 46.0, 31.0, 34.0, 42.0, 30.0, 45.0, 46.0, 46.0, 26.0, 42.0, 34.0, 31.0, 41.0, 32.0, 28.0, 25.0, 25.0, 22.0, 25.0, 20.0, 12.0, 11.0, 4.0, 8.0, 11.0, 4.0, 5.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.94921875, -3.828948974609375, -3.70867919921875, -3.588409423828125, -3.4681396484375, -3.347869873046875, -3.22760009765625, -3.107330322265625, -2.987060546875, -2.866790771484375, -2.74652099609375, -2.626251220703125, -2.5059814453125, -2.385711669921875, -2.26544189453125, -2.145172119140625, -2.02490234375, -1.904632568359375, -1.78436279296875, -1.664093017578125, -1.5438232421875, -1.423553466796875, -1.30328369140625, -1.183013916015625, -1.062744140625, -0.942474365234375, -0.82220458984375, -0.701934814453125, -0.5816650390625, -0.461395263671875, -0.34112548828125, -0.220855712890625, -0.1005859375, 0.019683837890625, 0.13995361328125, 0.260223388671875, 0.3804931640625, 0.500762939453125, 0.62103271484375, 0.741302490234375, 0.861572265625, 0.981842041015625, 1.10211181640625, 1.222381591796875, 1.3426513671875, 1.462921142578125, 1.58319091796875, 1.703460693359375, 1.82373046875, 1.944000244140625, 2.06427001953125, 2.184539794921875, 2.3048095703125, 2.425079345703125, 2.54534912109375, 2.665618896484375, 2.785888671875, 2.906158447265625, 3.02642822265625, 3.146697998046875, 3.2669677734375, 3.387237548828125, 3.50750732421875, 3.627777099609375, 3.748046875]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 2.0, 2.0, 3.0, 4.0, 9.0, 12.0, 12.0, 32.0, 37.0, 46.0, 84.0, 101.0, 211.0, 296.0, 509.0, 830.0, 1398.0, 2533.0, 4431.0, 8322.0, 16855.0, 37285.0, 89433.0, 225022.0, 351387.0, 178748.0, 70638.0, 29885.0, 14092.0, 7065.0, 3917.0, 2194.0, 1221.0, 680.0, 479.0, 267.0, 186.0, 103.0, 72.0, 57.0, 24.0, 18.0, 21.0, 8.0, 9.0, 6.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.466796875, -2.390594482421875, -2.31439208984375, -2.238189697265625, -2.1619873046875, -2.085784912109375, -2.00958251953125, -1.933380126953125, -1.857177734375, -1.780975341796875, -1.70477294921875, -1.628570556640625, -1.5523681640625, -1.476165771484375, -1.39996337890625, -1.323760986328125, -1.24755859375, -1.171356201171875, -1.09515380859375, -1.018951416015625, -0.9427490234375, -0.866546630859375, -0.79034423828125, -0.714141845703125, -0.637939453125, -0.561737060546875, -0.48553466796875, -0.409332275390625, -0.3331298828125, -0.256927490234375, -0.18072509765625, -0.104522705078125, -0.0283203125, 0.047882080078125, 0.12408447265625, 0.200286865234375, 0.2764892578125, 0.352691650390625, 0.42889404296875, 0.505096435546875, 0.581298828125, 0.657501220703125, 0.73370361328125, 0.809906005859375, 0.8861083984375, 0.962310791015625, 1.03851318359375, 1.114715576171875, 1.19091796875, 1.267120361328125, 1.34332275390625, 1.419525146484375, 1.4957275390625, 1.571929931640625, 1.64813232421875, 1.724334716796875, 1.800537109375, 1.876739501953125, 1.95294189453125, 2.029144287109375, 2.1053466796875, 2.181549072265625, 2.25775146484375, 2.333953857421875, 2.41015625]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 7.0, 11.0, 13.0, 8.0, 14.0, 23.0, 20.0, 15.0, 34.0, 45.0, 45.0, 55.0, 60.0, 68.0, 124.0, 1588.0, 396.0, 116.0, 76.0, 48.0, 57.0, 33.0, 34.0, 25.0, 29.0, 25.0, 22.0, 14.0, 14.0, 12.0, 10.0, 4.0, 1.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.96875, -17.405517578125, -16.84228515625, -16.279052734375, -15.7158203125, -15.152587890625, -14.58935546875, -14.026123046875, -13.462890625, -12.899658203125, -12.33642578125, -11.773193359375, -11.2099609375, -10.646728515625, -10.08349609375, -9.520263671875, -8.95703125, -8.393798828125, -7.83056640625, -7.267333984375, -6.7041015625, -6.140869140625, -5.57763671875, -5.014404296875, -4.451171875, -3.887939453125, -3.32470703125, -2.761474609375, -2.1982421875, -1.635009765625, -1.07177734375, -0.508544921875, 0.0546875, 0.617919921875, 1.18115234375, 1.744384765625, 2.3076171875, 2.870849609375, 3.43408203125, 3.997314453125, 4.560546875, 5.123779296875, 5.68701171875, 6.250244140625, 6.8134765625, 7.376708984375, 7.93994140625, 8.503173828125, 9.06640625, 9.629638671875, 10.19287109375, 10.756103515625, 11.3193359375, 11.882568359375, 12.44580078125, 13.009033203125, 13.572265625, 14.135498046875, 14.69873046875, 15.261962890625, 15.8251953125, 16.388427734375, 16.95166015625, 17.514892578125, 18.078125]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 7.0, 6.0, 13.0, 13.0, 19.0, 29.0, 39.0, 32.0, 32.0, 75.0, 86.0, 172.0, 301.0, 699.0, 4853.0, 2491327.0, 643064.0, 3556.0, 620.0, 270.0, 159.0, 86.0, 64.0, 47.0, 27.0, 24.0, 20.0, 18.0, 14.0, 12.0, 9.0, 4.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.5, -27.578857421875, -26.65771484375, -25.736572265625, -24.8154296875, -23.894287109375, -22.97314453125, -22.052001953125, -21.130859375, -20.209716796875, -19.28857421875, -18.367431640625, -17.4462890625, -16.525146484375, -15.60400390625, -14.682861328125, -13.76171875, -12.840576171875, -11.91943359375, -10.998291015625, -10.0771484375, -9.156005859375, -8.23486328125, -7.313720703125, -6.392578125, -5.471435546875, -4.55029296875, -3.629150390625, -2.7080078125, -1.786865234375, -0.86572265625, 0.055419921875, 0.9765625, 1.897705078125, 2.81884765625, 3.739990234375, 4.6611328125, 5.582275390625, 6.50341796875, 7.424560546875, 8.345703125, 9.266845703125, 10.18798828125, 11.109130859375, 12.0302734375, 12.951416015625, 13.87255859375, 14.793701171875, 15.71484375, 16.635986328125, 17.55712890625, 18.478271484375, 19.3994140625, 20.320556640625, 21.24169921875, 22.162841796875, 23.083984375, 24.005126953125, 24.92626953125, 25.847412109375, 26.7685546875, 27.689697265625, 28.61083984375, 29.531982421875, 30.453125]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 8.0, 34.0, 97.0, 249.0, 342.0, 197.0, 67.0, 18.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.961304664611816, -13.64436149597168, -12.327418327331543, -11.010475158691406, -9.693531036376953, -8.376588821411133, -7.05964469909668, -5.742701530456543, -4.425758361816406, -3.1088151931762695, -1.7918717861175537, -0.4749283790588379, 0.8420147895812988, 2.1589579582214355, 3.4759016036987305, 4.792844772338867, 6.109787940979004, 7.426731109619141, 8.743674278259277, 10.060617446899414, 11.377561569213867, 12.694503784179688, 14.01144790649414, 15.328391075134277, 16.645334243774414, 17.962278366088867, 19.279220581054688, 20.59616470336914, 21.91310691833496, 23.230051040649414, 24.546993255615234, 25.863937377929688, 27.18088150024414, 28.497825622558594, 29.814767837524414, 31.131711959838867, 32.44865417480469, 33.76559829711914, 35.082542419433594, 36.39948272705078, 37.716426849365234, 39.03337097167969, 40.35031509399414, 41.66725540161133, 42.98419952392578, 44.301143646240234, 45.61808776855469, 46.935028076171875, 48.251976013183594, 49.56892013549805, 50.8858642578125, 52.20280456542969, 53.51974868774414, 54.836692810058594, 56.15363693237305, 57.4705810546875, 58.78752136230469, 60.10446548461914, 61.421409606933594, 62.73834991455078, 64.0552978515625, 65.37223815917969, 66.68917846679688, 68.0061264038086, 69.32306671142578]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 3.0, 4.0, 4.0, 10.0, 8.0, 8.0, 8.0, 16.0, 12.0, 8.0, 22.0, 20.0, 17.0, 24.0, 23.0, 28.0, 40.0, 45.0, 29.0, 36.0, 47.0, 37.0, 41.0, 46.0, 34.0, 34.0, 32.0, 33.0, 35.0, 30.0, 27.0, 31.0, 26.0, 29.0, 25.0, 20.0, 14.0, 19.0, 17.0, 12.0, 12.0, 7.0, 7.0, 7.0, 4.0, 4.0, 8.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-43.115684509277344, -41.81609344482422, -40.516502380371094, -39.21691131591797, -37.917320251464844, -36.61772918701172, -35.318138122558594, -34.01854705810547, -32.718955993652344, -31.41936492919922, -30.119773864746094, -28.82018280029297, -27.520591735839844, -26.22100067138672, -24.92140769958496, -23.621816635131836, -22.322223663330078, -21.022632598876953, -19.723041534423828, -18.423450469970703, -17.123859405517578, -15.824267387390137, -14.524675369262695, -13.22508430480957, -11.925493240356445, -10.62590217590332, -9.326311111450195, -8.026719093322754, -6.727128028869629, -5.427536964416504, -4.127945423126221, -2.8283538818359375, -1.5287628173828125, -0.2291715145111084, 1.0704197883605957, 2.3700110912323, 3.669602394104004, 4.969193458557129, 6.268784999847412, 7.568376541137695, 8.86796760559082, 10.167558670043945, 11.46714973449707, 12.766741752624512, 14.066332817077637, 15.365923881530762, 16.665515899658203, 17.965106964111328, 19.264698028564453, 20.564289093017578, 21.863880157470703, 23.163471221923828, 24.463062286376953, 25.762653350830078, 27.062246322631836, 28.36183738708496, 29.661428451538086, 30.96101951599121, 32.26061248779297, 33.560203552246094, 34.85979461669922, 36.159385681152344, 37.45897674560547, 38.758567810058594, 40.05815887451172]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 7.0, 2.0, 4.0, 0.0, 3.0, 7.0, 7.0, 5.0, 16.0, 10.0, 17.0, 9.0, 20.0, 22.0, 17.0, 31.0, 26.0, 31.0, 36.0, 36.0, 43.0, 26.0, 38.0, 54.0, 42.0, 50.0, 37.0, 30.0, 34.0, 26.0, 47.0, 36.0, 36.0, 30.0, 27.0, 24.0, 27.0, 19.0, 12.0, 17.0, 13.0, 7.0, 7.0, 5.0, 3.0, 7.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.16015625, -4.033416748046875, -3.90667724609375, -3.779937744140625, -3.6531982421875, -3.526458740234375, -3.39971923828125, -3.272979736328125, -3.146240234375, -3.019500732421875, -2.89276123046875, -2.766021728515625, -2.6392822265625, -2.512542724609375, -2.38580322265625, -2.259063720703125, -2.13232421875, -2.005584716796875, -1.87884521484375, -1.752105712890625, -1.6253662109375, -1.498626708984375, -1.37188720703125, -1.245147705078125, -1.118408203125, -0.991668701171875, -0.86492919921875, -0.738189697265625, -0.6114501953125, -0.484710693359375, -0.35797119140625, -0.231231689453125, -0.1044921875, 0.022247314453125, 0.14898681640625, 0.275726318359375, 0.4024658203125, 0.529205322265625, 0.65594482421875, 0.782684326171875, 0.909423828125, 1.036163330078125, 1.16290283203125, 1.289642333984375, 1.4163818359375, 1.543121337890625, 1.66986083984375, 1.796600341796875, 1.92333984375, 2.050079345703125, 2.17681884765625, 2.303558349609375, 2.4302978515625, 2.557037353515625, 2.68377685546875, 2.810516357421875, 2.937255859375, 3.063995361328125, 3.19073486328125, 3.317474365234375, 3.4442138671875, 3.570953369140625, 3.69769287109375, 3.824432373046875, 3.951171875]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 1.0, 4.0, 6.0, 6.0, 12.0, 10.0, 12.0, 17.0, 6.0, 16.0, 29.0, 30.0, 36.0, 55.0, 70.0, 118.0, 225.0, 536.0, 1668.0, 9040.0, 74454.0, 1513751.0, 2424288.0, 151583.0, 14238.0, 2616.0, 708.0, 261.0, 129.0, 88.0, 53.0, 50.0, 22.0, 25.0, 22.0, 19.0, 18.0, 13.0, 12.0, 6.0, 6.0, 5.0, 4.0, 6.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-13.484375, -13.0772705078125, -12.670166015625, -12.2630615234375, -11.85595703125, -11.4488525390625, -11.041748046875, -10.6346435546875, -10.2275390625, -9.8204345703125, -9.413330078125, -9.0062255859375, -8.59912109375, -8.1920166015625, -7.784912109375, -7.3778076171875, -6.970703125, -6.5635986328125, -6.156494140625, -5.7493896484375, -5.34228515625, -4.9351806640625, -4.528076171875, -4.1209716796875, -3.7138671875, -3.3067626953125, -2.899658203125, -2.4925537109375, -2.08544921875, -1.6783447265625, -1.271240234375, -0.8641357421875, -0.45703125, -0.0499267578125, 0.357177734375, 0.7642822265625, 1.17138671875, 1.5784912109375, 1.985595703125, 2.3927001953125, 2.7998046875, 3.2069091796875, 3.614013671875, 4.0211181640625, 4.42822265625, 4.8353271484375, 5.242431640625, 5.6495361328125, 6.056640625, 6.4637451171875, 6.870849609375, 7.2779541015625, 7.68505859375, 8.0921630859375, 8.499267578125, 8.9063720703125, 9.3134765625, 9.7205810546875, 10.127685546875, 10.5347900390625, 10.94189453125, 11.3489990234375, 11.756103515625, 12.1632080078125, 12.5703125]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 12.0, 6.0, 7.0, 21.0, 23.0, 28.0, 30.0, 39.0, 65.0, 89.0, 122.0, 193.0, 215.0, 270.0, 405.0, 486.0, 464.0, 454.0, 305.0, 241.0, 169.0, 107.0, 93.0, 64.0, 48.0, 37.0, 25.0, 21.0, 12.0, 10.0, 0.0, 3.0, 7.0, 6.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.96875, -9.5997314453125, -9.230712890625, -8.8616943359375, -8.49267578125, -8.1236572265625, -7.754638671875, -7.3856201171875, -7.0166015625, -6.6475830078125, -6.278564453125, -5.9095458984375, -5.54052734375, -5.1715087890625, -4.802490234375, -4.4334716796875, -4.064453125, -3.6954345703125, -3.326416015625, -2.9573974609375, -2.58837890625, -2.2193603515625, -1.850341796875, -1.4813232421875, -1.1123046875, -0.7432861328125, -0.374267578125, -0.0052490234375, 0.36376953125, 0.7327880859375, 1.101806640625, 1.4708251953125, 1.83984375, 2.2088623046875, 2.577880859375, 2.9468994140625, 3.31591796875, 3.6849365234375, 4.053955078125, 4.4229736328125, 4.7919921875, 5.1610107421875, 5.530029296875, 5.8990478515625, 6.26806640625, 6.6370849609375, 7.006103515625, 7.3751220703125, 7.744140625, 8.1131591796875, 8.482177734375, 8.8511962890625, 9.22021484375, 9.5892333984375, 9.958251953125, 10.3272705078125, 10.6962890625, 11.0653076171875, 11.434326171875, 11.8033447265625, 12.17236328125, 12.5413818359375, 12.910400390625, 13.2794189453125, 13.6484375]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 10.0, 11.0, 18.0, 15.0, 24.0, 31.0, 39.0, 68.0, 54.0, 104.0, 147.0, 256.0, 486.0, 1416.0, 8974.0, 559015.0, 3582444.0, 36891.0, 2563.0, 737.0, 342.0, 188.0, 125.0, 83.0, 59.0, 43.0, 38.0, 30.0, 21.0, 10.0, 10.0, 6.0, 7.0, 5.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.25, -36.056640625, -34.86328125, -33.669921875, -32.4765625, -31.283203125, -30.08984375, -28.896484375, -27.703125, -26.509765625, -25.31640625, -24.123046875, -22.9296875, -21.736328125, -20.54296875, -19.349609375, -18.15625, -16.962890625, -15.76953125, -14.576171875, -13.3828125, -12.189453125, -10.99609375, -9.802734375, -8.609375, -7.416015625, -6.22265625, -5.029296875, -3.8359375, -2.642578125, -1.44921875, -0.255859375, 0.9375, 2.130859375, 3.32421875, 4.517578125, 5.7109375, 6.904296875, 8.09765625, 9.291015625, 10.484375, 11.677734375, 12.87109375, 14.064453125, 15.2578125, 16.451171875, 17.64453125, 18.837890625, 20.03125, 21.224609375, 22.41796875, 23.611328125, 24.8046875, 25.998046875, 27.19140625, 28.384765625, 29.578125, 30.771484375, 31.96484375, 33.158203125, 34.3515625, 35.544921875, 36.73828125, 37.931640625, 39.125]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 8.0, 25.0, 56.0, 133.0, 208.0, 241.0, 184.0, 89.0, 41.0, 23.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.3055648803711, -70.2851333618164, -67.26470184326172, -64.24427032470703, -61.22383499145508, -58.20340347290039, -55.18296813964844, -52.16253662109375, -49.14210510253906, -46.121673583984375, -43.10124206542969, -40.080806732177734, -37.06037521362305, -34.03994369506836, -31.01951026916504, -27.99907684326172, -24.97864532470703, -21.958213806152344, -18.937780380249023, -15.91734790802002, -12.896915435791016, -9.876482963562012, -6.856050491333008, -3.8356170654296875, -0.815185546875, 2.205246925354004, 5.225679397583008, 8.246111869812012, 11.266544342041016, 14.28697681427002, 17.307409286499023, 20.327842712402344, 23.3482666015625, 26.368698120117188, 29.389131546020508, 32.40956497192383, 35.429996490478516, 38.4504280090332, 41.470863342285156, 44.491294860839844, 47.51172637939453, 50.53215789794922, 53.552589416503906, 56.57302474975586, 59.59345626831055, 62.613887786865234, 65.63432312011719, 68.65475463867188, 71.67518615722656, 74.69561767578125, 77.71604919433594, 80.73648071289062, 83.75691223144531, 86.77735137939453, 89.79778289794922, 92.8182144165039, 95.8386459350586, 98.85907745361328, 101.87950897216797, 104.89994049072266, 107.92037963867188, 110.94081115722656, 113.96124267578125, 116.98167419433594, 120.00210571289062]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 10.0, 3.0, 5.0, 3.0, 14.0, 11.0, 12.0, 16.0, 17.0, 14.0, 26.0, 23.0, 34.0, 32.0, 33.0, 29.0, 33.0, 37.0, 35.0, 35.0, 42.0, 33.0, 38.0, 34.0, 42.0, 49.0, 30.0, 32.0, 30.0, 33.0, 30.0, 29.0, 25.0, 20.0, 33.0, 9.0, 10.0, 10.0, 7.0, 12.0, 5.0, 5.0, 9.0, 3.0, 1.0, 5.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-36.41150665283203, -35.32534408569336, -34.23918151855469, -33.153018951416016, -32.066856384277344, -30.98069190979004, -29.894529342651367, -28.808366775512695, -27.72220230102539, -26.63603973388672, -25.549877166748047, -24.463714599609375, -23.37755012512207, -22.2913875579834, -21.205224990844727, -20.119062423706055, -19.032899856567383, -17.94673728942871, -16.86057472229004, -15.77441120147705, -14.688247680664062, -13.60208511352539, -12.515922546386719, -11.429759979248047, -10.343596458435059, -9.257433891296387, -8.171270370483398, -7.085107803344727, -5.9989447593688965, -4.912781715393066, -3.8266191482543945, -2.7404561042785645, -1.6542930603027344, -0.5681301355361938, 0.5180327892303467, 1.6041955947875977, 2.6903586387634277, 3.776521682739258, 4.86268424987793, 5.94884729385376, 7.03501033782959, 8.121172904968262, 9.20733642578125, 10.293498992919922, 11.379661560058594, 12.465825080871582, 13.551987648010254, 14.638151168823242, 15.724313735961914, 16.810476303100586, 17.896638870239258, 18.982803344726562, 20.068965911865234, 21.155128479003906, 22.241291046142578, 23.32745361328125, 24.413616180419922, 25.499778747558594, 26.585941314697266, 27.672103881835938, 28.758268356323242, 29.844430923461914, 30.930593490600586, 32.01675796508789, 33.10292053222656]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 4.0, 7.0, 2.0, 6.0, 3.0, 9.0, 12.0, 13.0, 10.0, 16.0, 14.0, 36.0, 24.0, 29.0, 20.0, 36.0, 25.0, 34.0, 39.0, 34.0, 37.0, 53.0, 46.0, 44.0, 40.0, 37.0, 47.0, 27.0, 41.0, 21.0, 30.0, 25.0, 39.0, 23.0, 20.0, 15.0, 11.0, 14.0, 5.0, 10.0, 8.0, 10.0, 8.0, 7.0, 6.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-4.28515625, -4.158294677734375, -4.03143310546875, -3.904571533203125, -3.7777099609375, -3.650848388671875, -3.52398681640625, -3.397125244140625, -3.270263671875, -3.143402099609375, -3.01654052734375, -2.889678955078125, -2.7628173828125, -2.635955810546875, -2.50909423828125, -2.382232666015625, -2.25537109375, -2.128509521484375, -2.00164794921875, -1.874786376953125, -1.7479248046875, -1.621063232421875, -1.49420166015625, -1.367340087890625, -1.240478515625, -1.113616943359375, -0.98675537109375, -0.859893798828125, -0.7330322265625, -0.606170654296875, -0.47930908203125, -0.352447509765625, -0.2255859375, -0.098724365234375, 0.02813720703125, 0.154998779296875, 0.2818603515625, 0.408721923828125, 0.53558349609375, 0.662445068359375, 0.789306640625, 0.916168212890625, 1.04302978515625, 1.169891357421875, 1.2967529296875, 1.423614501953125, 1.55047607421875, 1.677337646484375, 1.80419921875, 1.931060791015625, 2.05792236328125, 2.184783935546875, 2.3116455078125, 2.438507080078125, 2.56536865234375, 2.692230224609375, 2.819091796875, 2.945953369140625, 3.07281494140625, 3.199676513671875, 3.3265380859375, 3.453399658203125, 3.58026123046875, 3.707122802734375, 3.833984375]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 8.0, 10.0, 11.0, 11.0, 12.0, 26.0, 42.0, 46.0, 70.0, 108.0, 136.0, 210.0, 283.0, 407.0, 576.0, 864.0, 1173.0, 1645.0, 2414.0, 3443.0, 5322.0, 7618.0, 11451.0, 17432.0, 26818.0, 42257.0, 68941.0, 115071.0, 176224.0, 193745.0, 140055.0, 85021.0, 51545.0, 32445.0, 20739.0, 13684.0, 9163.0, 5970.0, 4242.0, 2866.0, 1846.0, 1357.0, 992.0, 661.0, 467.0, 351.0, 216.0, 169.0, 112.0, 87.0, 66.0, 47.0, 26.0, 23.0, 11.0, 10.0, 9.0, 11.0, 4.0, 3.0, 1.0], "bins": [-0.37939453125, -0.36761474609375, -0.3558349609375, -0.34405517578125, -0.332275390625, -0.32049560546875, -0.3087158203125, -0.29693603515625, -0.28515625, -0.27337646484375, -0.2615966796875, -0.24981689453125, -0.238037109375, -0.22625732421875, -0.2144775390625, -0.20269775390625, -0.19091796875, -0.17913818359375, -0.1673583984375, -0.15557861328125, -0.143798828125, -0.13201904296875, -0.1202392578125, -0.10845947265625, -0.0966796875, -0.08489990234375, -0.0731201171875, -0.06134033203125, -0.049560546875, -0.03778076171875, -0.0260009765625, -0.01422119140625, -0.00244140625, 0.00933837890625, 0.0211181640625, 0.03289794921875, 0.044677734375, 0.05645751953125, 0.0682373046875, 0.08001708984375, 0.091796875, 0.10357666015625, 0.1153564453125, 0.12713623046875, 0.138916015625, 0.15069580078125, 0.1624755859375, 0.17425537109375, 0.18603515625, 0.19781494140625, 0.2095947265625, 0.22137451171875, 0.233154296875, 0.24493408203125, 0.2567138671875, 0.26849365234375, 0.2802734375, 0.29205322265625, 0.3038330078125, 0.31561279296875, 0.327392578125, 0.33917236328125, 0.3509521484375, 0.36273193359375, 0.37451171875]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 12.0, 6.0, 6.0, 7.0, 12.0, 14.0, 14.0, 23.0, 23.0, 14.0, 27.0, 42.0, 27.0, 46.0, 43.0, 47.0, 46.0, 37.0, 1072.0, 52.0, 55.0, 37.0, 51.0, 39.0, 41.0, 40.0, 36.0, 22.0, 22.0, 12.0, 17.0, 27.0, 12.0, 8.0, 12.0, 6.0, 6.0, 4.0, 1.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.791015625, -2.694091796875, -2.59716796875, -2.500244140625, -2.4033203125, -2.306396484375, -2.20947265625, -2.112548828125, -2.015625, -1.918701171875, -1.82177734375, -1.724853515625, -1.6279296875, -1.531005859375, -1.43408203125, -1.337158203125, -1.240234375, -1.143310546875, -1.04638671875, -0.949462890625, -0.8525390625, -0.755615234375, -0.65869140625, -0.561767578125, -0.46484375, -0.367919921875, -0.27099609375, -0.174072265625, -0.0771484375, 0.019775390625, 0.11669921875, 0.213623046875, 0.310546875, 0.407470703125, 0.50439453125, 0.601318359375, 0.6982421875, 0.795166015625, 0.89208984375, 0.989013671875, 1.0859375, 1.182861328125, 1.27978515625, 1.376708984375, 1.4736328125, 1.570556640625, 1.66748046875, 1.764404296875, 1.861328125, 1.958251953125, 2.05517578125, 2.152099609375, 2.2490234375, 2.345947265625, 2.44287109375, 2.539794921875, 2.63671875, 2.733642578125, 2.83056640625, 2.927490234375, 3.0244140625, 3.121337890625, 3.21826171875, 3.315185546875, 3.412109375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 0.0, 3.0, 3.0, 11.0, 10.0, 18.0, 30.0, 35.0, 76.0, 94.0, 168.0, 265.0, 410.0, 673.0, 1167.0, 1882.0, 2969.0, 5238.0, 8911.0, 15507.0, 26908.0, 48579.0, 89090.0, 160749.0, 1284638.0, 195408.0, 112865.0, 61623.0, 33821.0, 19063.0, 10936.0, 6385.0, 3748.0, 2203.0, 1395.0, 856.0, 499.0, 340.0, 216.0, 120.0, 84.0, 48.0, 32.0, 26.0, 14.0, 10.0, 4.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42236328125, -0.4086036682128906, -0.39484405517578125, -0.3810844421386719, -0.3673248291015625, -0.3535652160644531, -0.33980560302734375, -0.3260459899902344, -0.312286376953125, -0.2985267639160156, -0.28476715087890625, -0.2710075378417969, -0.2572479248046875, -0.24348831176757812, -0.22972869873046875, -0.21596908569335938, -0.20220947265625, -0.18844985961914062, -0.17469024658203125, -0.16093063354492188, -0.1471710205078125, -0.13341140747070312, -0.11965179443359375, -0.10589218139648438, -0.092132568359375, -0.07837295532226562, -0.06461334228515625, -0.050853729248046875, -0.0370941162109375, -0.023334503173828125, -0.00957489013671875, 0.004184722900390625, 0.0179443359375, 0.031703948974609375, 0.04546356201171875, 0.059223175048828125, 0.0729827880859375, 0.08674240112304688, 0.10050201416015625, 0.11426162719726562, 0.128021240234375, 0.14178085327148438, 0.15554046630859375, 0.16930007934570312, 0.1830596923828125, 0.19681930541992188, 0.21057891845703125, 0.22433853149414062, 0.23809814453125, 0.2518577575683594, 0.26561737060546875, 0.2793769836425781, 0.2931365966796875, 0.3068962097167969, 0.32065582275390625, 0.3344154357910156, 0.348175048828125, 0.3619346618652344, 0.37569427490234375, 0.3894538879394531, 0.4032135009765625, 0.4169731140136719, 0.43073272705078125, 0.4444923400878906, 0.458251953125]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 9.0, 2.0, 3.0, 5.0, 10.0, 15.0, 14.0, 14.0, 12.0, 22.0, 21.0, 30.0, 18.0, 26.0, 30.0, 25.0, 37.0, 43.0, 45.0, 44.0, 47.0, 40.0, 39.0, 44.0, 42.0, 51.0, 46.0, 43.0, 25.0, 45.0, 31.0, 21.0, 9.0, 16.0, 8.0, 19.0, 10.0, 9.0, 4.0, 5.0, 8.0, 6.0, 5.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005526542663574219, -0.0005359575152397156, -0.0005192607641220093, -0.000502564013004303, -0.0004858672618865967, -0.0004691705107688904, -0.0004524737596511841, -0.0004357770085334778, -0.0004190802574157715, -0.0004023835062980652, -0.0003856867551803589, -0.0003689900040626526, -0.0003522932529449463, -0.00033559650182724, -0.0003188997507095337, -0.0003022029995918274, -0.0002855062484741211, -0.0002688094973564148, -0.0002521127462387085, -0.0002354159951210022, -0.0002187192440032959, -0.0002020224928855896, -0.0001853257417678833, -0.000168628990650177, -0.0001519322395324707, -0.0001352354884147644, -0.0001185387372970581, -0.0001018419861793518, -8.514523506164551e-05, -6.844848394393921e-05, -5.175173282623291e-05, -3.505498170852661e-05, -1.8358230590820312e-05, -1.6614794731140137e-06, 1.5035271644592285e-05, 3.1732022762298584e-05, 4.842877388000488e-05, 6.512552499771118e-05, 8.182227611541748e-05, 9.851902723312378e-05, 0.00011521577835083008, 0.00013191252946853638, 0.00014860928058624268, 0.00016530603170394897, 0.00018200278282165527, 0.00019869953393936157, 0.00021539628505706787, 0.00023209303617477417, 0.00024878978729248047, 0.00026548653841018677, 0.00028218328952789307, 0.00029888004064559937, 0.00031557679176330566, 0.00033227354288101196, 0.00034897029399871826, 0.00036566704511642456, 0.00038236379623413086, 0.00039906054735183716, 0.00041575729846954346, 0.00043245404958724976, 0.00044915080070495605, 0.00046584755182266235, 0.00048254430294036865, 0.000499241054058075, 0.0005159378051757812]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 5.0, 9.0, 6.0, 6.0, 6.0, 10.0, 15.0, 20.0, 22.0, 32.0, 37.0, 57.0, 85.0, 100.0, 108.0, 165.0, 232.0, 442.0, 931.0, 40875.0, 997990.0, 5403.0, 759.0, 379.0, 250.0, 161.0, 110.0, 72.0, 54.0, 46.0, 39.0, 21.0, 25.0, 14.0, 20.0, 10.0, 8.0, 7.0, 7.0, 4.0, 1.0, 6.0, 2.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.01122283935546875, -0.010853171348571777, -0.010483503341674805, -0.010113835334777832, -0.00974416732788086, -0.009374499320983887, -0.009004831314086914, -0.008635163307189941, -0.008265495300292969, -0.007895827293395996, -0.0075261592864990234, -0.007156491279602051, -0.006786823272705078, -0.0064171552658081055, -0.006047487258911133, -0.00567781925201416, -0.0053081512451171875, -0.004938483238220215, -0.004568815231323242, -0.0041991472244262695, -0.003829479217529297, -0.0034598112106323242, -0.0030901432037353516, -0.002720475196838379, -0.0023508071899414062, -0.0019811391830444336, -0.001611471176147461, -0.0012418031692504883, -0.0008721351623535156, -0.000502467155456543, -0.0001327991485595703, 0.00023686885833740234, 0.000606536865234375, 0.0009762048721313477, 0.0013458728790283203, 0.001715540885925293, 0.0020852088928222656, 0.0024548768997192383, 0.002824544906616211, 0.0031942129135131836, 0.0035638809204101562, 0.003933548927307129, 0.0043032169342041016, 0.004672884941101074, 0.005042552947998047, 0.0054122209548950195, 0.005781888961791992, 0.006151556968688965, 0.0065212249755859375, 0.00689089298248291, 0.007260560989379883, 0.0076302289962768555, 0.007999897003173828, 0.0083695650100708, 0.008739233016967773, 0.009108901023864746, 0.009478569030761719, 0.009848237037658691, 0.010217905044555664, 0.010587573051452637, 0.01095724105834961, 0.011326909065246582, 0.011696577072143555, 0.012066245079040527, 0.0124359130859375]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 11.0, 68.0, 310.0, 460.0, 138.0, 25.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.003090477315708995, -0.003034519497305155, -0.0029785616789013147, -0.0029226038604974747, -0.0028666462749242783, -0.002810688456520438, -0.002754730638116598, -0.002698772819712758, -0.002642815001308918, -0.002586857182905078, -0.002530899364501238, -0.0024749417789280415, -0.0024189839605242014, -0.0023630261421203613, -0.0023070683237165213, -0.002251110505312681, -0.002195152919739485, -0.0021391951013356447, -0.0020832372829318047, -0.0020272796973586082, -0.001971321878954768, -0.0019153640605509281, -0.001859406242147088, -0.001803448423743248, -0.001747490605339408, -0.0016915327869355679, -0.0016355750849470496, -0.0015796172665432096, -0.0015236594481393695, -0.0014677017461508512, -0.0014117439277470112, -0.0013557861093431711, -0.0012998281745240092, -0.0012438703561201692, -0.001187912654131651, -0.0011319548357278109, -0.0010759970173239708, -0.0010200391989201307, -0.0009640814969316125, -0.0009081236785277724, -0.0008521659183315933, -0.0007962081581354141, -0.0007402503397315741, -0.0006842925795353949, -0.0006283348193392158, -0.0005723770009353757, -0.0005164192407391965, -0.00046046145143918693, -0.0004045036621391773, -0.0003485458728391677, -0.0002925880835391581, -0.00023663032334297895, -0.00018067253404296935, -0.00012471474474295974, -6.875698454678059e-05, -1.2799195246770978e-05, 4.315859405323863e-05, 9.911637607729062e-05, 0.00015507415810134262, 0.000211031932849437, 0.0002669897221494466, 0.0003229475114494562, 0.00037890527164563537, 0.000434863060945645, 0.0004908208502456546]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 10.0, 2.0, 8.0, 12.0, 13.0, 16.0, 15.0, 14.0, 22.0, 17.0, 30.0, 42.0, 44.0, 52.0, 55.0, 39.0, 47.0, 44.0, 48.0, 49.0, 43.0, 39.0, 49.0, 41.0, 30.0, 27.0, 23.0, 24.0, 31.0, 23.0, 15.0, 17.0, 14.0, 10.0, 8.0, 7.0, 4.0, 3.0, 3.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0], "bins": [-0.00043088197708129883, -0.0004191724583506584, -0.000407462939620018, -0.0003957534208893776, -0.0003840439021587372, -0.00037233438342809677, -0.00036062486469745636, -0.00034891534596681595, -0.00033720582723617554, -0.0003254963085055351, -0.0003137867897748947, -0.0003020772710442543, -0.0002903677523136139, -0.0002786582335829735, -0.00026694871485233307, -0.00025523919612169266, -0.00024352967739105225, -0.00023182015866041183, -0.00022011063992977142, -0.000208401121199131, -0.0001966916024684906, -0.0001849820837378502, -0.00017327256500720978, -0.00016156304627656937, -0.00014985352754592896, -0.00013814400881528854, -0.00012643449008464813, -0.00011472497135400772, -0.00010301545262336731, -9.13059338927269e-05, -7.959641516208649e-05, -6.788689643144608e-05, -5.6177377700805664e-05, -4.446785897016525e-05, -3.275834023952484e-05, -2.104882150888443e-05, -9.339302778244019e-06, 2.370215952396393e-06, 1.4079734683036804e-05, 2.5789253413677216e-05, 3.749877214431763e-05, 4.920829087495804e-05, 6.091780960559845e-05, 7.262732833623886e-05, 8.433684706687927e-05, 9.604636579751968e-05, 0.0001077558845281601, 0.0001194654032588005, 0.00013117492198944092, 0.00014288444072008133, 0.00015459395945072174, 0.00016630347818136215, 0.00017801299691200256, 0.00018972251564264297, 0.00020143203437328339, 0.0002131415531039238, 0.0002248510718345642, 0.00023656059056520462, 0.00024827010929584503, 0.00025997962802648544, 0.00027168914675712585, 0.00028339866548776627, 0.0002951081842184067, 0.0003068177029490471, 0.0003185272216796875]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 4.0, 7.0, 2.0, 6.0, 3.0, 9.0, 12.0, 13.0, 10.0, 16.0, 14.0, 36.0, 24.0, 29.0, 20.0, 36.0, 25.0, 34.0, 39.0, 34.0, 37.0, 53.0, 46.0, 44.0, 40.0, 37.0, 47.0, 27.0, 41.0, 21.0, 30.0, 25.0, 39.0, 23.0, 20.0, 15.0, 11.0, 14.0, 5.0, 10.0, 8.0, 10.0, 8.0, 7.0, 6.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-4.28515625, -4.158294677734375, -4.03143310546875, -3.904571533203125, -3.7777099609375, -3.650848388671875, -3.52398681640625, -3.397125244140625, -3.270263671875, -3.143402099609375, -3.01654052734375, -2.889678955078125, -2.7628173828125, -2.635955810546875, -2.50909423828125, -2.382232666015625, -2.25537109375, -2.128509521484375, -2.00164794921875, -1.874786376953125, -1.7479248046875, -1.621063232421875, -1.49420166015625, -1.367340087890625, -1.240478515625, -1.113616943359375, -0.98675537109375, -0.859893798828125, -0.7330322265625, -0.606170654296875, -0.47930908203125, -0.352447509765625, -0.2255859375, -0.098724365234375, 0.02813720703125, 0.154998779296875, 0.2818603515625, 0.408721923828125, 0.53558349609375, 0.662445068359375, 0.789306640625, 0.916168212890625, 1.04302978515625, 1.169891357421875, 1.2967529296875, 1.423614501953125, 1.55047607421875, 1.677337646484375, 1.80419921875, 1.931060791015625, 2.05792236328125, 2.184783935546875, 2.3116455078125, 2.438507080078125, 2.56536865234375, 2.692230224609375, 2.819091796875, 2.945953369140625, 3.07281494140625, 3.199676513671875, 3.3265380859375, 3.453399658203125, 3.58026123046875, 3.707122802734375, 3.833984375]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 7.0, 9.0, 8.0, 14.0, 24.0, 19.0, 30.0, 39.0, 47.0, 71.0, 115.0, 173.0, 251.0, 418.0, 620.0, 946.0, 1520.0, 2561.0, 4390.0, 7900.0, 15107.0, 31929.0, 80521.0, 285475.0, 422972.0, 111334.0, 40651.0, 18858.0, 9609.0, 5237.0, 2797.0, 1773.0, 1033.0, 707.0, 423.0, 289.0, 233.0, 110.0, 109.0, 70.0, 53.0, 32.0, 22.0, 15.0, 15.0, 10.0, 5.0, 2.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.3515625, -4.22027587890625, -4.0889892578125, -3.95770263671875, -3.826416015625, -3.69512939453125, -3.5638427734375, -3.43255615234375, -3.30126953125, -3.16998291015625, -3.0386962890625, -2.90740966796875, -2.776123046875, -2.64483642578125, -2.5135498046875, -2.38226318359375, -2.2509765625, -2.11968994140625, -1.9884033203125, -1.85711669921875, -1.725830078125, -1.59454345703125, -1.4632568359375, -1.33197021484375, -1.20068359375, -1.06939697265625, -0.9381103515625, -0.80682373046875, -0.675537109375, -0.54425048828125, -0.4129638671875, -0.28167724609375, -0.150390625, -0.01910400390625, 0.1121826171875, 0.24346923828125, 0.374755859375, 0.50604248046875, 0.6373291015625, 0.76861572265625, 0.89990234375, 1.03118896484375, 1.1624755859375, 1.29376220703125, 1.425048828125, 1.55633544921875, 1.6876220703125, 1.81890869140625, 1.9501953125, 2.08148193359375, 2.2127685546875, 2.34405517578125, 2.475341796875, 2.60662841796875, 2.7379150390625, 2.86920166015625, 3.00048828125, 3.13177490234375, 3.2630615234375, 3.39434814453125, 3.525634765625, 3.65692138671875, 3.7882080078125, 3.91949462890625, 4.05078125]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 3.0, 2.0, 6.0, 6.0, 6.0, 8.0, 10.0, 14.0, 15.0, 23.0, 16.0, 26.0, 28.0, 30.0, 25.0, 31.0, 23.0, 20.0, 43.0, 52.0, 76.0, 120.0, 421.0, 1460.0, 123.0, 66.0, 36.0, 40.0, 40.0, 42.0, 24.0, 32.0, 28.0, 26.0, 21.0, 20.0, 12.0, 13.0, 16.0, 6.0, 12.0, 6.0, 8.0, 6.0, 0.0, 5.0, 3.0, 4.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-15.2109375, -14.7503662109375, -14.289794921875, -13.8292236328125, -13.36865234375, -12.9080810546875, -12.447509765625, -11.9869384765625, -11.5263671875, -11.0657958984375, -10.605224609375, -10.1446533203125, -9.68408203125, -9.2235107421875, -8.762939453125, -8.3023681640625, -7.841796875, -7.3812255859375, -6.920654296875, -6.4600830078125, -5.99951171875, -5.5389404296875, -5.078369140625, -4.6177978515625, -4.1572265625, -3.6966552734375, -3.236083984375, -2.7755126953125, -2.31494140625, -1.8543701171875, -1.393798828125, -0.9332275390625, -0.47265625, -0.0120849609375, 0.448486328125, 0.9090576171875, 1.36962890625, 1.8302001953125, 2.290771484375, 2.7513427734375, 3.2119140625, 3.6724853515625, 4.133056640625, 4.5936279296875, 5.05419921875, 5.5147705078125, 5.975341796875, 6.4359130859375, 6.896484375, 7.3570556640625, 7.817626953125, 8.2781982421875, 8.73876953125, 9.1993408203125, 9.659912109375, 10.1204833984375, 10.5810546875, 11.0416259765625, 11.502197265625, 11.9627685546875, 12.42333984375, 12.8839111328125, 13.344482421875, 13.8050537109375, 14.265625]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 7.0, 8.0, 5.0, 7.0, 12.0, 10.0, 18.0, 17.0, 20.0, 24.0, 39.0, 41.0, 72.0, 105.0, 134.0, 201.0, 339.0, 756.0, 5662.0, 757036.0, 2371905.0, 7332.0, 895.0, 346.0, 206.0, 136.0, 106.0, 58.0, 52.0, 36.0, 30.0, 26.0, 20.0, 9.0, 13.0, 7.0, 7.0, 4.0, 7.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.203125, -27.160400390625, -26.11767578125, -25.074951171875, -24.0322265625, -22.989501953125, -21.94677734375, -20.904052734375, -19.861328125, -18.818603515625, -17.77587890625, -16.733154296875, -15.6904296875, -14.647705078125, -13.60498046875, -12.562255859375, -11.51953125, -10.476806640625, -9.43408203125, -8.391357421875, -7.3486328125, -6.305908203125, -5.26318359375, -4.220458984375, -3.177734375, -2.135009765625, -1.09228515625, -0.049560546875, 0.9931640625, 2.035888671875, 3.07861328125, 4.121337890625, 5.1640625, 6.206787109375, 7.24951171875, 8.292236328125, 9.3349609375, 10.377685546875, 11.42041015625, 12.463134765625, 13.505859375, 14.548583984375, 15.59130859375, 16.634033203125, 17.6767578125, 18.719482421875, 19.76220703125, 20.804931640625, 21.84765625, 22.890380859375, 23.93310546875, 24.975830078125, 26.0185546875, 27.061279296875, 28.10400390625, 29.146728515625, 30.189453125, 31.232177734375, 32.27490234375, 33.317626953125, 34.3603515625, 35.403076171875, 36.44580078125, 37.488525390625, 38.53125]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 8.0, 238.0, 729.0, 41.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.848793029785156, -20.982648849487305, -16.116504669189453, -11.250358581542969, -6.384214401245117, -1.5180702209472656, 3.3480758666992188, 8.214218139648438, 13.080364227294922, 17.946508407592773, 22.812652587890625, 27.67879867553711, 32.544944763183594, 37.41108703613281, 42.2772331237793, 47.143375396728516, 52.009521484375, 56.875667572021484, 61.7418098449707, 66.60795593261719, 71.4740982055664, 76.34024047851562, 81.20639038085938, 86.0725326538086, 90.93867492675781, 95.80481719970703, 100.67096710205078, 105.537109375, 110.40325164794922, 115.26939392089844, 120.13554382324219, 125.0016860961914, 129.8678436279297, 134.73399353027344, 139.60012817382812, 144.46627807617188, 149.33242797851562, 154.1985626220703, 159.06471252441406, 163.93084716796875, 168.7969970703125, 173.66314697265625, 178.52928161621094, 183.3954315185547, 188.26158142089844, 193.12771606445312, 197.99386596679688, 202.86001586914062, 207.72616577148438, 212.59231567382812, 217.4584503173828, 222.32460021972656, 227.1907501220703, 232.056884765625, 236.92303466796875, 241.7891845703125, 246.6553192138672, 251.52146911621094, 256.3876037597656, 261.2537536621094, 266.1199035644531, 270.9860534667969, 275.8521728515625, 280.71832275390625, 285.58447265625]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 5.0, 2.0, 3.0, 1.0, 3.0, 4.0, 4.0, 8.0, 2.0, 8.0, 7.0, 14.0, 15.0, 17.0, 14.0, 21.0, 28.0, 30.0, 23.0, 43.0, 44.0, 44.0, 49.0, 45.0, 43.0, 52.0, 51.0, 53.0, 43.0, 37.0, 31.0, 39.0, 30.0, 29.0, 37.0, 28.0, 13.0, 14.0, 20.0, 8.0, 10.0, 12.0, 8.0, 7.0, 7.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-48.049686431884766, -46.38274383544922, -44.71580123901367, -43.048858642578125, -41.38191604614258, -39.71497344970703, -38.048030853271484, -36.38108825683594, -34.71414566040039, -33.047203063964844, -31.380260467529297, -29.71331787109375, -28.046375274658203, -26.379432678222656, -24.71249008178711, -23.045547485351562, -21.378604888916016, -19.71166229248047, -18.044719696044922, -16.377777099609375, -14.710834503173828, -13.043891906738281, -11.376949310302734, -9.710006713867188, -8.04306411743164, -6.376121520996094, -4.709178924560547, -3.042236328125, -1.3752937316894531, 0.29164886474609375, 1.9585914611816406, 3.6255340576171875, 5.29248046875, 6.959423065185547, 8.626365661621094, 10.29330825805664, 11.960250854492188, 13.627193450927734, 15.294136047363281, 16.961078643798828, 18.628021240234375, 20.294963836669922, 21.96190643310547, 23.628849029541016, 25.295791625976562, 26.96273422241211, 28.629676818847656, 30.296619415283203, 31.96356201171875, 33.6305046081543, 35.297447204589844, 36.96438980102539, 38.63133239746094, 40.298274993896484, 41.96521759033203, 43.63216018676758, 45.299102783203125, 46.96604537963867, 48.63298797607422, 50.299930572509766, 51.96687316894531, 53.63381576538086, 55.300758361816406, 56.96770095825195, 58.6346435546875]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 6.0, 3.0, 7.0, 6.0, 11.0, 8.0, 8.0, 9.0, 19.0, 21.0, 28.0, 25.0, 26.0, 21.0, 35.0, 25.0, 26.0, 45.0, 32.0, 34.0, 39.0, 46.0, 38.0, 58.0, 37.0, 43.0, 32.0, 29.0, 27.0, 32.0, 33.0, 18.0, 26.0, 22.0, 19.0, 16.0, 16.0, 11.0, 7.0, 10.0, 11.0, 3.0, 9.0, 4.0, 7.0, 3.0, 5.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0], "bins": [-4.09375, -3.966552734375, -3.83935546875, -3.712158203125, -3.5849609375, -3.457763671875, -3.33056640625, -3.203369140625, -3.076171875, -2.948974609375, -2.82177734375, -2.694580078125, -2.5673828125, -2.440185546875, -2.31298828125, -2.185791015625, -2.05859375, -1.931396484375, -1.80419921875, -1.677001953125, -1.5498046875, -1.422607421875, -1.29541015625, -1.168212890625, -1.041015625, -0.913818359375, -0.78662109375, -0.659423828125, -0.5322265625, -0.405029296875, -0.27783203125, -0.150634765625, -0.0234375, 0.103759765625, 0.23095703125, 0.358154296875, 0.4853515625, 0.612548828125, 0.73974609375, 0.866943359375, 0.994140625, 1.121337890625, 1.24853515625, 1.375732421875, 1.5029296875, 1.630126953125, 1.75732421875, 1.884521484375, 2.01171875, 2.138916015625, 2.26611328125, 2.393310546875, 2.5205078125, 2.647705078125, 2.77490234375, 2.902099609375, 3.029296875, 3.156494140625, 3.28369140625, 3.410888671875, 3.5380859375, 3.665283203125, 3.79248046875, 3.919677734375, 4.046875]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 5.0, 3.0, 6.0, 8.0, 6.0, 21.0, 23.0, 33.0, 33.0, 46.0, 73.0, 119.0, 187.0, 299.0, 511.0, 958.0, 1773.0, 3606.0, 8383.0, 20899.0, 60818.0, 225443.0, 813275.0, 1607746.0, 1022222.0, 301651.0, 80704.0, 25844.0, 10148.0, 4497.0, 2237.0, 1068.0, 558.0, 350.0, 239.0, 145.0, 101.0, 70.0, 33.0, 39.0, 33.0, 23.0, 10.0, 11.0, 8.0, 5.0, 4.0, 3.0, 3.0, 4.0, 4.0, 2.0, 1.0], "bins": [-6.0078125, -5.834228515625, -5.66064453125, -5.487060546875, -5.3134765625, -5.139892578125, -4.96630859375, -4.792724609375, -4.619140625, -4.445556640625, -4.27197265625, -4.098388671875, -3.9248046875, -3.751220703125, -3.57763671875, -3.404052734375, -3.23046875, -3.056884765625, -2.88330078125, -2.709716796875, -2.5361328125, -2.362548828125, -2.18896484375, -2.015380859375, -1.841796875, -1.668212890625, -1.49462890625, -1.321044921875, -1.1474609375, -0.973876953125, -0.80029296875, -0.626708984375, -0.453125, -0.279541015625, -0.10595703125, 0.067626953125, 0.2412109375, 0.414794921875, 0.58837890625, 0.761962890625, 0.935546875, 1.109130859375, 1.28271484375, 1.456298828125, 1.6298828125, 1.803466796875, 1.97705078125, 2.150634765625, 2.32421875, 2.497802734375, 2.67138671875, 2.844970703125, 3.0185546875, 3.192138671875, 3.36572265625, 3.539306640625, 3.712890625, 3.886474609375, 4.06005859375, 4.233642578125, 4.4072265625, 4.580810546875, 4.75439453125, 4.927978515625, 5.1015625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 2.0, 2.0, 5.0, 6.0, 11.0, 15.0, 18.0, 25.0, 27.0, 40.0, 48.0, 61.0, 71.0, 77.0, 122.0, 141.0, 175.0, 237.0, 295.0, 321.0, 366.0, 367.0, 329.0, 269.0, 257.0, 158.0, 148.0, 108.0, 82.0, 64.0, 48.0, 37.0, 32.0, 27.0, 22.0, 16.0, 12.0, 9.0, 7.0, 10.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-9.078125, -8.79296875, -8.5078125, -8.22265625, -7.9375, -7.65234375, -7.3671875, -7.08203125, -6.796875, -6.51171875, -6.2265625, -5.94140625, -5.65625, -5.37109375, -5.0859375, -4.80078125, -4.515625, -4.23046875, -3.9453125, -3.66015625, -3.375, -3.08984375, -2.8046875, -2.51953125, -2.234375, -1.94921875, -1.6640625, -1.37890625, -1.09375, -0.80859375, -0.5234375, -0.23828125, 0.046875, 0.33203125, 0.6171875, 0.90234375, 1.1875, 1.47265625, 1.7578125, 2.04296875, 2.328125, 2.61328125, 2.8984375, 3.18359375, 3.46875, 3.75390625, 4.0390625, 4.32421875, 4.609375, 4.89453125, 5.1796875, 5.46484375, 5.75, 6.03515625, 6.3203125, 6.60546875, 6.890625, 7.17578125, 7.4609375, 7.74609375, 8.03125, 8.31640625, 8.6015625, 8.88671875, 9.171875]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 0.0, 10.0, 4.0, 3.0, 11.0, 10.0, 16.0, 35.0, 30.0, 40.0, 61.0, 63.0, 112.0, 137.0, 252.0, 482.0, 2212.0, 37150.0, 3582177.0, 560950.0, 8544.0, 991.0, 319.0, 185.0, 133.0, 84.0, 66.0, 50.0, 33.0, 35.0, 22.0, 21.0, 11.0, 7.0, 10.0, 10.0, 1.0, 2.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-35.5, -34.30810546875, -33.1162109375, -31.92431640625, -30.732421875, -29.54052734375, -28.3486328125, -27.15673828125, -25.96484375, -24.77294921875, -23.5810546875, -22.38916015625, -21.197265625, -20.00537109375, -18.8134765625, -17.62158203125, -16.4296875, -15.23779296875, -14.0458984375, -12.85400390625, -11.662109375, -10.47021484375, -9.2783203125, -8.08642578125, -6.89453125, -5.70263671875, -4.5107421875, -3.31884765625, -2.126953125, -0.93505859375, 0.2568359375, 1.44873046875, 2.640625, 3.83251953125, 5.0244140625, 6.21630859375, 7.408203125, 8.60009765625, 9.7919921875, 10.98388671875, 12.17578125, 13.36767578125, 14.5595703125, 15.75146484375, 16.943359375, 18.13525390625, 19.3271484375, 20.51904296875, 21.7109375, 22.90283203125, 24.0947265625, 25.28662109375, 26.478515625, 27.67041015625, 28.8623046875, 30.05419921875, 31.24609375, 32.43798828125, 33.6298828125, 34.82177734375, 36.013671875, 37.20556640625, 38.3974609375, 39.58935546875, 40.78125]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 9.0, 39.0, 114.0, 290.0, 308.0, 183.0, 53.0, 11.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-138.5034637451172, -134.05325317382812, -129.60304260253906, -125.15283203125, -120.70262145996094, -116.25241088867188, -111.80220794677734, -107.35199737548828, -102.90178680419922, -98.45157623291016, -94.0013656616211, -89.55115509033203, -85.1009521484375, -80.65074157714844, -76.20053100585938, -71.75032043457031, -67.30010986328125, -62.84989929199219, -58.399688720703125, -53.94948196411133, -49.499271392822266, -45.0490608215332, -40.598854064941406, -36.148643493652344, -31.69843292236328, -27.24822235107422, -22.79801368713379, -18.34780502319336, -13.897594451904297, -9.447383880615234, -4.997175216674805, -0.546966552734375, 3.90325927734375, 8.353468894958496, 12.803678512573242, 17.253887176513672, 21.704097747802734, 26.154308319091797, 30.604516983032227, 35.054725646972656, 39.50493621826172, 43.95514678955078, 48.405357360839844, 52.85556411743164, 57.3057746887207, 61.755985260009766, 66.20619201660156, 70.65640258789062, 75.10661315917969, 79.55682373046875, 84.00703430175781, 88.45724487304688, 92.90745544433594, 97.357666015625, 101.80786895751953, 106.2580795288086, 110.70829010009766, 115.15850067138672, 119.60871124267578, 124.05892181396484, 128.50912475585938, 132.95933532714844, 137.4095458984375, 141.85975646972656, 146.30996704101562]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 6.0, 2.0, 9.0, 3.0, 8.0, 6.0, 13.0, 16.0, 7.0, 24.0, 25.0, 16.0, 28.0, 20.0, 26.0, 23.0, 31.0, 35.0, 42.0, 38.0, 35.0, 42.0, 41.0, 37.0, 43.0, 44.0, 44.0, 29.0, 34.0, 34.0, 43.0, 24.0, 30.0, 30.0, 24.0, 23.0, 11.0, 14.0, 5.0, 10.0, 4.0, 7.0, 6.0, 2.0, 4.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-36.172996520996094, -35.0078125, -33.842628479003906, -32.67744445800781, -31.51226234436035, -30.347078323364258, -29.181894302368164, -28.016712188720703, -26.85152816772461, -25.686344146728516, -24.521160125732422, -23.355976104736328, -22.190793991088867, -21.025609970092773, -19.86042594909668, -18.69524383544922, -17.530057907104492, -16.3648738861084, -15.199690818786621, -14.034506797790527, -12.86932373046875, -11.704139709472656, -10.538955688476562, -9.373772621154785, -8.208588600158691, -7.043405055999756, -5.87822151184082, -4.713037490844727, -3.547853946685791, -2.3826704025268555, -1.2174863815307617, -0.052303314208984375, 1.1128807067871094, 2.278064250946045, 3.4432480335235596, 4.608431816101074, 5.77361536026001, 6.938798904418945, 8.103982925415039, 9.269165992736816, 10.43435001373291, 11.599534034729004, 12.764717102050781, 13.929901123046875, 15.095085144042969, 16.260269165039062, 17.425453186035156, 18.590635299682617, 19.75581932067871, 20.921003341674805, 22.0861873626709, 23.25136947631836, 24.416553497314453, 25.581737518310547, 26.74692153930664, 27.912105560302734, 29.077289581298828, 30.242473602294922, 31.407657623291016, 32.57284164428711, 33.7380256652832, 34.90320587158203, 36.068389892578125, 37.23357391357422, 38.39875793457031]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 6.0, 7.0, 8.0, 12.0, 7.0, 12.0, 16.0, 14.0, 12.0, 23.0, 20.0, 29.0, 30.0, 39.0, 21.0, 35.0, 41.0, 38.0, 33.0, 59.0, 35.0, 40.0, 37.0, 38.0, 41.0, 53.0, 41.0, 32.0, 19.0, 28.0, 32.0, 23.0, 7.0, 16.0, 19.0, 15.0, 12.0, 13.0, 7.0, 4.0, 7.0, 4.0, 4.0, 8.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.046875, -3.911865234375, -3.77685546875, -3.641845703125, -3.5068359375, -3.371826171875, -3.23681640625, -3.101806640625, -2.966796875, -2.831787109375, -2.69677734375, -2.561767578125, -2.4267578125, -2.291748046875, -2.15673828125, -2.021728515625, -1.88671875, -1.751708984375, -1.61669921875, -1.481689453125, -1.3466796875, -1.211669921875, -1.07666015625, -0.941650390625, -0.806640625, -0.671630859375, -0.53662109375, -0.401611328125, -0.2666015625, -0.131591796875, 0.00341796875, 0.138427734375, 0.2734375, 0.408447265625, 0.54345703125, 0.678466796875, 0.8134765625, 0.948486328125, 1.08349609375, 1.218505859375, 1.353515625, 1.488525390625, 1.62353515625, 1.758544921875, 1.8935546875, 2.028564453125, 2.16357421875, 2.298583984375, 2.43359375, 2.568603515625, 2.70361328125, 2.838623046875, 2.9736328125, 3.108642578125, 3.24365234375, 3.378662109375, 3.513671875, 3.648681640625, 3.78369140625, 3.918701171875, 4.0537109375, 4.188720703125, 4.32373046875, 4.458740234375, 4.59375]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 7.0, 11.0, 12.0, 12.0, 40.0, 47.0, 83.0, 107.0, 162.0, 265.0, 413.0, 584.0, 932.0, 1472.0, 2233.0, 3506.0, 5545.0, 8758.0, 14325.0, 23110.0, 38570.0, 65822.0, 120182.0, 203384.0, 221437.0, 143056.0, 78274.0, 45272.0, 26610.0, 16394.0, 10241.0, 6348.0, 4108.0, 2559.0, 1580.0, 1085.0, 660.0, 467.0, 322.0, 188.0, 123.0, 92.0, 55.0, 50.0, 18.0, 16.0, 11.0, 5.0, 2.0, 6.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.51416015625, -0.4991035461425781, -0.48404693603515625, -0.4689903259277344, -0.4539337158203125, -0.4388771057128906, -0.42382049560546875, -0.4087638854980469, -0.393707275390625, -0.3786506652832031, -0.36359405517578125, -0.3485374450683594, -0.3334808349609375, -0.3184242248535156, -0.30336761474609375, -0.2883110046386719, -0.27325439453125, -0.2581977844238281, -0.24314117431640625, -0.22808456420898438, -0.2130279541015625, -0.19797134399414062, -0.18291473388671875, -0.16785812377929688, -0.152801513671875, -0.13774490356445312, -0.12268829345703125, -0.10763168334960938, -0.0925750732421875, -0.07751846313476562, -0.06246185302734375, -0.047405242919921875, -0.0323486328125, -0.017292022705078125, -0.00223541259765625, 0.012821197509765625, 0.0278778076171875, 0.042934417724609375, 0.05799102783203125, 0.07304763793945312, 0.088104248046875, 0.10316085815429688, 0.11821746826171875, 0.13327407836914062, 0.1483306884765625, 0.16338729858398438, 0.17844390869140625, 0.19350051879882812, 0.20855712890625, 0.22361373901367188, 0.23867034912109375, 0.2537269592285156, 0.2687835693359375, 0.2838401794433594, 0.29889678955078125, 0.3139533996582031, 0.329010009765625, 0.3440666198730469, 0.35912322998046875, 0.3741798400878906, 0.3892364501953125, 0.4042930603027344, 0.41934967041015625, 0.4344062805175781, 0.449462890625]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 4.0, 4.0, 1.0, 11.0, 8.0, 14.0, 12.0, 10.0, 9.0, 19.0, 17.0, 25.0, 36.0, 30.0, 40.0, 35.0, 31.0, 48.0, 61.0, 44.0, 1081.0, 56.0, 43.0, 48.0, 34.0, 38.0, 38.0, 27.0, 41.0, 39.0, 26.0, 19.0, 15.0, 12.0, 8.0, 14.0, 13.0, 7.0, 3.0, 4.0, 4.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-3.419921875, -3.324859619140625, -3.22979736328125, -3.134735107421875, -3.0396728515625, -2.944610595703125, -2.84954833984375, -2.754486083984375, -2.659423828125, -2.564361572265625, -2.46929931640625, -2.374237060546875, -2.2791748046875, -2.184112548828125, -2.08905029296875, -1.993988037109375, -1.89892578125, -1.803863525390625, -1.70880126953125, -1.613739013671875, -1.5186767578125, -1.423614501953125, -1.32855224609375, -1.233489990234375, -1.138427734375, -1.043365478515625, -0.94830322265625, -0.853240966796875, -0.7581787109375, -0.663116455078125, -0.56805419921875, -0.472991943359375, -0.3779296875, -0.282867431640625, -0.18780517578125, -0.092742919921875, 0.0023193359375, 0.097381591796875, 0.19244384765625, 0.287506103515625, 0.382568359375, 0.477630615234375, 0.57269287109375, 0.667755126953125, 0.7628173828125, 0.857879638671875, 0.95294189453125, 1.048004150390625, 1.14306640625, 1.238128662109375, 1.33319091796875, 1.428253173828125, 1.5233154296875, 1.618377685546875, 1.71343994140625, 1.808502197265625, 1.903564453125, 1.998626708984375, 2.09368896484375, 2.188751220703125, 2.2838134765625, 2.378875732421875, 2.47393798828125, 2.569000244140625, 2.6640625]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 8.0, 5.0, 10.0, 14.0, 19.0, 33.0, 42.0, 76.0, 83.0, 151.0, 215.0, 304.0, 535.0, 761.0, 1142.0, 1812.0, 2741.0, 4326.0, 6668.0, 10746.0, 17049.0, 28075.0, 46337.0, 77456.0, 130346.0, 1092744.0, 349261.0, 128851.0, 77138.0, 46082.0, 27842.0, 16997.0, 10452.0, 6697.0, 4222.0, 2748.0, 1761.0, 1101.0, 767.0, 515.0, 330.0, 219.0, 159.0, 104.0, 60.0, 52.0, 23.0, 27.0, 8.0, 14.0, 5.0, 4.0, 4.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.396484375, -0.38368988037109375, -0.3708953857421875, -0.35810089111328125, -0.345306396484375, -0.33251190185546875, -0.3197174072265625, -0.30692291259765625, -0.29412841796875, -0.28133392333984375, -0.2685394287109375, -0.25574493408203125, -0.242950439453125, -0.23015594482421875, -0.2173614501953125, -0.20456695556640625, -0.1917724609375, -0.17897796630859375, -0.1661834716796875, -0.15338897705078125, -0.140594482421875, -0.12779998779296875, -0.1150054931640625, -0.10221099853515625, -0.08941650390625, -0.07662200927734375, -0.0638275146484375, -0.05103302001953125, -0.038238525390625, -0.02544403076171875, -0.0126495361328125, 0.00014495849609375, 0.012939453125, 0.02573394775390625, 0.0385284423828125, 0.05132293701171875, 0.064117431640625, 0.07691192626953125, 0.0897064208984375, 0.10250091552734375, 0.11529541015625, 0.12808990478515625, 0.1408843994140625, 0.15367889404296875, 0.166473388671875, 0.17926788330078125, 0.1920623779296875, 0.20485687255859375, 0.2176513671875, 0.23044586181640625, 0.2432403564453125, 0.25603485107421875, 0.268829345703125, 0.28162384033203125, 0.2944183349609375, 0.30721282958984375, 0.32000732421875, 0.33280181884765625, 0.3455963134765625, 0.35839080810546875, 0.371185302734375, 0.38397979736328125, 0.3967742919921875, 0.40956878662109375, 0.42236328125]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 6.0, 4.0, 8.0, 9.0, 11.0, 10.0, 17.0, 10.0, 17.0, 13.0, 17.0, 28.0, 24.0, 21.0, 32.0, 36.0, 37.0, 27.0, 26.0, 54.0, 47.0, 36.0, 45.0, 45.0, 36.0, 35.0, 36.0, 37.0, 36.0, 38.0, 25.0, 26.0, 24.0, 16.0, 10.0, 14.0, 10.0, 14.0, 14.0, 7.0, 13.0, 7.0, 5.0, 6.0, 1.0, 2.0, 4.0, 5.0, 2.0, 3.0, 2.0], "bins": [-0.000579833984375, -0.0005631446838378906, -0.0005464553833007812, -0.0005297660827636719, -0.0005130767822265625, -0.0004963874816894531, -0.00047969818115234375, -0.0004630088806152344, -0.000446319580078125, -0.0004296302795410156, -0.00041294097900390625, -0.0003962516784667969, -0.0003795623779296875, -0.0003628730773925781, -0.00034618377685546875, -0.0003294944763183594, -0.00031280517578125, -0.0002961158752441406, -0.00027942657470703125, -0.0002627372741699219, -0.0002460479736328125, -0.00022935867309570312, -0.00021266937255859375, -0.00019598007202148438, -0.000179290771484375, -0.00016260147094726562, -0.00014591217041015625, -0.00012922286987304688, -0.0001125335693359375, -9.584426879882812e-05, -7.915496826171875e-05, -6.246566772460938e-05, -4.57763671875e-05, -2.9087066650390625e-05, -1.239776611328125e-05, 4.291534423828125e-06, 2.09808349609375e-05, 3.7670135498046875e-05, 5.435943603515625e-05, 7.104873657226562e-05, 8.7738037109375e-05, 0.00010442733764648438, 0.00012111663818359375, 0.00013780593872070312, 0.0001544952392578125, 0.00017118453979492188, 0.00018787384033203125, 0.00020456314086914062, 0.00022125244140625, 0.00023794174194335938, 0.00025463104248046875, 0.0002713203430175781, 0.0002880096435546875, 0.0003046989440917969, 0.00032138824462890625, 0.0003380775451660156, 0.000354766845703125, 0.0003714561462402344, 0.00038814544677734375, 0.0004048347473144531, 0.0004215240478515625, 0.0004382133483886719, 0.00045490264892578125, 0.0004715919494628906, 0.00048828125]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 5.0, 5.0, 4.0, 9.0, 7.0, 8.0, 16.0, 9.0, 13.0, 18.0, 16.0, 26.0, 28.0, 52.0, 65.0, 87.0, 108.0, 205.0, 266.0, 466.0, 1078.0, 79021.0, 961652.0, 3467.0, 728.0, 370.0, 240.0, 157.0, 114.0, 84.0, 42.0, 44.0, 16.0, 18.0, 20.0, 25.0, 12.0, 11.0, 9.0, 10.0, 7.0, 4.0, 4.0, 2.0, 1.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01114654541015625, -0.010752439498901367, -0.010358333587646484, -0.009964227676391602, -0.009570121765136719, -0.009176015853881836, -0.008781909942626953, -0.00838780403137207, -0.007993698120117188, -0.007599592208862305, -0.007205486297607422, -0.006811380386352539, -0.006417274475097656, -0.0060231685638427734, -0.005629062652587891, -0.005234956741333008, -0.004840850830078125, -0.004446744918823242, -0.004052639007568359, -0.0036585330963134766, -0.0032644271850585938, -0.002870321273803711, -0.002476215362548828, -0.0020821094512939453, -0.0016880035400390625, -0.0012938976287841797, -0.0008997917175292969, -0.0005056858062744141, -0.00011157989501953125, 0.00028252601623535156, 0.0006766319274902344, 0.0010707378387451172, 0.00146484375, 0.0018589496612548828, 0.0022530555725097656, 0.0026471614837646484, 0.0030412673950195312, 0.003435373306274414, 0.003829479217529297, 0.00422358512878418, 0.0046176910400390625, 0.005011796951293945, 0.005405902862548828, 0.005800008773803711, 0.006194114685058594, 0.0065882205963134766, 0.006982326507568359, 0.007376432418823242, 0.007770538330078125, 0.008164644241333008, 0.00855875015258789, 0.008952856063842773, 0.009346961975097656, 0.009741067886352539, 0.010135173797607422, 0.010529279708862305, 0.010923385620117188, 0.01131749153137207, 0.011711597442626953, 0.012105703353881836, 0.012499809265136719, 0.012893915176391602, 0.013288021087646484, 0.013682126998901367, 0.01407623291015625]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 12.0, 45.0, 196.0, 341.0, 238.0, 126.0, 39.0, 9.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018014187226071954, -0.0017620956059545279, -0.0017227723728865385, -0.001683449256233871, -0.0016441261395812035, -0.0016048029065132141, -0.0015654797898605466, -0.001526156673207879, -0.0014868334401398897, -0.0014475103234872222, -0.0014081870904192328, -0.0013688639737665653, -0.0013295408571138978, -0.0012902176240459085, -0.001250894507393241, -0.0012115712743252516, -0.0011722482740879059, -0.0011329251574352384, -0.001093601924367249, -0.0010542788077145815, -0.001014955691061914, -0.0009756324579939246, -0.0009363093413412571, -0.0008969861664809287, -0.0008576629916206002, -0.0008183398167602718, -0.0007790167001076043, -0.0007396935252472758, -0.0007003703503869474, -0.000661047175526619, -0.0006217240588739514, -0.000582400884013623, -0.0005430777091532946, -0.0005037545342929661, -0.00046443138853646815, -0.00042510824277997017, -0.00038578506791964173, -0.00034646192216314375, -0.0003071387764066458, -0.00026781560154631734, -0.00022849245578981936, -0.00018916929548140615, -0.00014984613517299294, -0.00011052298941649497, -7.119982910808176e-05, -3.187666879966855e-05, 7.446476956829429e-06, 4.6769651817157865e-05, 8.609279757365584e-05, 0.00012541595788206905, 0.00016473911819048226, 0.00020406226394698024, 0.00024338542425539345, 0.00028270858456380665, 0.00032203173032030463, 0.00036135490518063307, 0.00040067805093713105, 0.000440001196693629, 0.00047932437155395746, 0.000518647488206625, 0.0005579706630669534, 0.0005972938379272819, 0.0006366169545799494, 0.0006759401876479387, 0.0007152633043006063]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 3.0, 3.0, 8.0, 8.0, 12.0, 9.0, 13.0, 18.0, 33.0, 27.0, 28.0, 31.0, 33.0, 32.0, 36.0, 51.0, 41.0, 54.0, 61.0, 44.0, 42.0, 45.0, 48.0, 38.0, 31.0, 36.0, 33.0, 21.0, 25.0, 26.0, 20.0, 32.0, 18.0, 12.0, 10.0, 8.0, 8.0, 5.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.00042742490768432617, -0.0004142066463828087, -0.0004009883850812912, -0.0003877701237797737, -0.0003745518624782562, -0.00036133360117673874, -0.00034811533987522125, -0.00033489707857370377, -0.0003216788172721863, -0.0003084605559706688, -0.0002952422946691513, -0.0002820240333676338, -0.00026880577206611633, -0.00025558751076459885, -0.00024236924946308136, -0.00022915098816156387, -0.0002159327268600464, -0.0002027144655585289, -0.00018949620425701141, -0.00017627794295549393, -0.00016305968165397644, -0.00014984142035245895, -0.00013662315905094147, -0.00012340489774942398, -0.0001101866364479065, -9.696837514638901e-05, -8.375011384487152e-05, -7.053185254335403e-05, -5.731359124183655e-05, -4.409532994031906e-05, -3.0877068638801575e-05, -1.7658807337284088e-05, -4.4405460357666016e-06, 8.777715265750885e-06, 2.199597656726837e-05, 3.521423786878586e-05, 4.8432499170303345e-05, 6.165076047182083e-05, 7.486902177333832e-05, 8.80872830748558e-05, 0.00010130554437637329, 0.00011452380567789078, 0.00012774206697940826, 0.00014096032828092575, 0.00015417858958244324, 0.00016739685088396072, 0.0001806151121854782, 0.0001938333734869957, 0.00020705163478851318, 0.00022026989609003067, 0.00023348815739154816, 0.00024670641869306564, 0.00025992467999458313, 0.0002731429412961006, 0.0002863612025976181, 0.0002995794638991356, 0.0003127977252006531, 0.00032601598650217056, 0.00033923424780368805, 0.00035245250910520554, 0.000365670770406723, 0.0003788890317082405, 0.000392107293009758, 0.0004053255543112755, 0.00041854381561279297]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 6.0, 7.0, 8.0, 12.0, 7.0, 12.0, 16.0, 14.0, 12.0, 23.0, 20.0, 29.0, 30.0, 39.0, 21.0, 35.0, 41.0, 38.0, 33.0, 59.0, 35.0, 40.0, 37.0, 38.0, 41.0, 53.0, 41.0, 32.0, 19.0, 28.0, 32.0, 23.0, 7.0, 16.0, 19.0, 15.0, 12.0, 13.0, 7.0, 4.0, 7.0, 4.0, 4.0, 8.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.046875, -3.911865234375, -3.77685546875, -3.641845703125, -3.5068359375, -3.371826171875, -3.23681640625, -3.101806640625, -2.966796875, -2.831787109375, -2.69677734375, -2.561767578125, -2.4267578125, -2.291748046875, -2.15673828125, -2.021728515625, -1.88671875, -1.751708984375, -1.61669921875, -1.481689453125, -1.3466796875, -1.211669921875, -1.07666015625, -0.941650390625, -0.806640625, -0.671630859375, -0.53662109375, -0.401611328125, -0.2666015625, -0.131591796875, 0.00341796875, 0.138427734375, 0.2734375, 0.408447265625, 0.54345703125, 0.678466796875, 0.8134765625, 0.948486328125, 1.08349609375, 1.218505859375, 1.353515625, 1.488525390625, 1.62353515625, 1.758544921875, 1.8935546875, 2.028564453125, 2.16357421875, 2.298583984375, 2.43359375, 2.568603515625, 2.70361328125, 2.838623046875, 2.9736328125, 3.108642578125, 3.24365234375, 3.378662109375, 3.513671875, 3.648681640625, 3.78369140625, 3.918701171875, 4.0537109375, 4.188720703125, 4.32373046875, 4.458740234375, 4.59375]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 0.0, 4.0, 8.0, 4.0, 7.0, 10.0, 10.0, 24.0, 19.0, 28.0, 49.0, 62.0, 90.0, 154.0, 217.0, 331.0, 564.0, 841.0, 1312.0, 2537.0, 4593.0, 9490.0, 20666.0, 50845.0, 142375.0, 397320.0, 265708.0, 87821.0, 33873.0, 14415.0, 6831.0, 3396.0, 1897.0, 1088.0, 638.0, 421.0, 270.0, 191.0, 131.0, 87.0, 53.0, 57.0, 35.0, 23.0, 20.0, 11.0, 8.0, 7.0, 5.0, 7.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.74609375, -3.628204345703125, -3.51031494140625, -3.392425537109375, -3.2745361328125, -3.156646728515625, -3.03875732421875, -2.920867919921875, -2.802978515625, -2.685089111328125, -2.56719970703125, -2.449310302734375, -2.3314208984375, -2.213531494140625, -2.09564208984375, -1.977752685546875, -1.85986328125, -1.741973876953125, -1.62408447265625, -1.506195068359375, -1.3883056640625, -1.270416259765625, -1.15252685546875, -1.034637451171875, -0.916748046875, -0.798858642578125, -0.68096923828125, -0.563079833984375, -0.4451904296875, -0.327301025390625, -0.20941162109375, -0.091522216796875, 0.0263671875, 0.144256591796875, 0.26214599609375, 0.380035400390625, 0.4979248046875, 0.615814208984375, 0.73370361328125, 0.851593017578125, 0.969482421875, 1.087371826171875, 1.20526123046875, 1.323150634765625, 1.4410400390625, 1.558929443359375, 1.67681884765625, 1.794708251953125, 1.91259765625, 2.030487060546875, 2.14837646484375, 2.266265869140625, 2.3841552734375, 2.502044677734375, 2.61993408203125, 2.737823486328125, 2.855712890625, 2.973602294921875, 3.09149169921875, 3.209381103515625, 3.3272705078125, 3.445159912109375, 3.56304931640625, 3.680938720703125, 3.798828125]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 6.0, 4.0, 6.0, 13.0, 10.0, 16.0, 16.0, 17.0, 15.0, 16.0, 19.0, 29.0, 34.0, 42.0, 48.0, 68.0, 47.0, 101.0, 368.0, 1561.0, 157.0, 67.0, 44.0, 40.0, 41.0, 28.0, 38.0, 29.0, 28.0, 22.0, 22.0, 15.0, 7.0, 21.0, 17.0, 4.0, 10.0, 9.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-14.796875, -14.306640625, -13.81640625, -13.326171875, -12.8359375, -12.345703125, -11.85546875, -11.365234375, -10.875, -10.384765625, -9.89453125, -9.404296875, -8.9140625, -8.423828125, -7.93359375, -7.443359375, -6.953125, -6.462890625, -5.97265625, -5.482421875, -4.9921875, -4.501953125, -4.01171875, -3.521484375, -3.03125, -2.541015625, -2.05078125, -1.560546875, -1.0703125, -0.580078125, -0.08984375, 0.400390625, 0.890625, 1.380859375, 1.87109375, 2.361328125, 2.8515625, 3.341796875, 3.83203125, 4.322265625, 4.8125, 5.302734375, 5.79296875, 6.283203125, 6.7734375, 7.263671875, 7.75390625, 8.244140625, 8.734375, 9.224609375, 9.71484375, 10.205078125, 10.6953125, 11.185546875, 11.67578125, 12.166015625, 12.65625, 13.146484375, 13.63671875, 14.126953125, 14.6171875, 15.107421875, 15.59765625, 16.087890625, 16.578125]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 5.0, 13.0, 10.0, 16.0, 25.0, 17.0, 16.0, 26.0, 30.0, 56.0, 63.0, 98.0, 136.0, 180.0, 304.0, 677.0, 3723.0, 302143.0, 2828386.0, 7787.0, 920.0, 375.0, 200.0, 135.0, 80.0, 65.0, 43.0, 25.0, 35.0, 27.0, 13.0, 20.0, 11.0, 9.0, 7.0, 8.0, 2.0, 3.0, 4.0, 4.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-36.75, -35.67333984375, -34.5966796875, -33.52001953125, -32.443359375, -31.36669921875, -30.2900390625, -29.21337890625, -28.13671875, -27.06005859375, -25.9833984375, -24.90673828125, -23.830078125, -22.75341796875, -21.6767578125, -20.60009765625, -19.5234375, -18.44677734375, -17.3701171875, -16.29345703125, -15.216796875, -14.14013671875, -13.0634765625, -11.98681640625, -10.91015625, -9.83349609375, -8.7568359375, -7.68017578125, -6.603515625, -5.52685546875, -4.4501953125, -3.37353515625, -2.296875, -1.22021484375, -0.1435546875, 0.93310546875, 2.009765625, 3.08642578125, 4.1630859375, 5.23974609375, 6.31640625, 7.39306640625, 8.4697265625, 9.54638671875, 10.623046875, 11.69970703125, 12.7763671875, 13.85302734375, 14.9296875, 16.00634765625, 17.0830078125, 18.15966796875, 19.236328125, 20.31298828125, 21.3896484375, 22.46630859375, 23.54296875, 24.61962890625, 25.6962890625, 26.77294921875, 27.849609375, 28.92626953125, 30.0029296875, 31.07958984375, 32.15625]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 7.0, 15.0, 22.0, 37.0, 47.0, 68.0, 110.0, 120.0, 116.0, 108.0, 104.0, 85.0, 60.0, 40.0, 28.0, 18.0, 13.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.82720375061035, -18.2998104095459, -17.772415161132812, -17.24502182006836, -16.717628479003906, -16.190235137939453, -15.662840843200684, -15.135446548461914, -14.608053207397461, -14.080659866333008, -13.553265571594238, -13.025871276855469, -12.498477935791016, -11.971084594726562, -11.443690299987793, -10.916296005249023, -10.38890266418457, -9.861509323120117, -9.334115028381348, -8.806720733642578, -8.279327392578125, -7.751933574676514, -7.224539756774902, -6.697145938873291, -6.16975212097168, -5.642358303070068, -5.114964485168457, -4.587570667266846, -4.060176849365234, -3.532783031463623, -3.0053892135620117, -2.4779953956604004, -1.9506034851074219, -1.4232096672058105, -0.8958158493041992, -0.3684220314025879, 0.15897178649902344, 0.6863656044006348, 1.213759422302246, 1.7411532402038574, 2.2685470581054688, 2.79594087600708, 3.3233346939086914, 3.8507285118103027, 4.378122329711914, 4.905516147613525, 5.432909965515137, 5.960303783416748, 6.487697601318359, 7.015091419219971, 7.542485237121582, 8.069879531860352, 8.597272872924805, 9.124666213989258, 9.652060508728027, 10.179454803466797, 10.70684814453125, 11.234241485595703, 11.761635780334473, 12.289030075073242, 12.816423416137695, 13.343816757202148, 13.871211051940918, 14.398605346679688, 14.92599868774414]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 6.0, 14.0, 6.0, 4.0, 13.0, 16.0, 18.0, 15.0, 20.0, 27.0, 26.0, 17.0, 28.0, 28.0, 30.0, 30.0, 36.0, 43.0, 36.0, 41.0, 45.0, 43.0, 39.0, 41.0, 30.0, 37.0, 33.0, 44.0, 39.0, 30.0, 21.0, 18.0, 16.0, 15.0, 18.0, 14.0, 15.0, 8.0, 6.0, 11.0, 8.0, 3.0, 3.0, 6.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0], "bins": [-31.9434814453125, -30.816221237182617, -29.688961029052734, -28.56170082092285, -27.43444061279297, -26.30718231201172, -25.179922103881836, -24.052661895751953, -22.92540168762207, -21.798141479492188, -20.670881271362305, -19.543621063232422, -18.416362762451172, -17.289100646972656, -16.161842346191406, -15.034582138061523, -13.90732192993164, -12.780061721801758, -11.652801513671875, -10.525542259216309, -9.398282051086426, -8.271021842956543, -7.143762111663818, -6.016502380371094, -4.889242172241211, -3.7619822025299072, -2.6347222328186035, -1.5074622631072998, -0.3802022933959961, 0.7470579147338867, 1.8743176460266113, 3.001577377319336, 4.128841400146484, 5.256101608276367, 6.383361339569092, 7.510621070861816, 8.6378812789917, 9.765141487121582, 10.892400741577148, 12.019660949707031, 13.146921157836914, 14.274181365966797, 15.40144157409668, 16.528701782226562, 17.655960083007812, 18.783222198486328, 19.910480499267578, 21.03774070739746, 22.165000915527344, 23.292261123657227, 24.41952133178711, 25.546781539916992, 26.674041748046875, 27.801300048828125, 28.928560256958008, 30.05582046508789, 31.183080673217773, 32.310340881347656, 33.437599182128906, 34.56486129760742, 35.69211959838867, 36.81938171386719, 37.94664001464844, 39.07389831542969, 40.2011604309082]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 7.0, 5.0, 3.0, 12.0, 4.0, 9.0, 11.0, 12.0, 14.0, 16.0, 18.0, 23.0, 19.0, 22.0, 20.0, 40.0, 44.0, 32.0, 33.0, 35.0, 46.0, 45.0, 49.0, 32.0, 35.0, 41.0, 42.0, 45.0, 38.0, 28.0, 39.0, 26.0, 23.0, 16.0, 23.0, 12.0, 12.0, 11.0, 14.0, 13.0, 7.0, 7.0, 7.0, 2.0, 4.0, 6.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-4.38671875, -4.2486572265625, -4.110595703125, -3.9725341796875, -3.83447265625, -3.6964111328125, -3.558349609375, -3.4202880859375, -3.2822265625, -3.1441650390625, -3.006103515625, -2.8680419921875, -2.72998046875, -2.5919189453125, -2.453857421875, -2.3157958984375, -2.177734375, -2.0396728515625, -1.901611328125, -1.7635498046875, -1.62548828125, -1.4874267578125, -1.349365234375, -1.2113037109375, -1.0732421875, -0.9351806640625, -0.797119140625, -0.6590576171875, -0.52099609375, -0.3829345703125, -0.244873046875, -0.1068115234375, 0.03125, 0.1693115234375, 0.307373046875, 0.4454345703125, 0.58349609375, 0.7215576171875, 0.859619140625, 0.9976806640625, 1.1357421875, 1.2738037109375, 1.411865234375, 1.5499267578125, 1.68798828125, 1.8260498046875, 1.964111328125, 2.1021728515625, 2.240234375, 2.3782958984375, 2.516357421875, 2.6544189453125, 2.79248046875, 2.9305419921875, 3.068603515625, 3.2066650390625, 3.3447265625, 3.4827880859375, 3.620849609375, 3.7589111328125, 3.89697265625, 4.0350341796875, 4.173095703125, 4.3111572265625, 4.44921875]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 1.0, 8.0, 6.0, 10.0, 10.0, 12.0, 11.0, 10.0, 17.0, 22.0, 28.0, 36.0, 38.0, 47.0, 72.0, 81.0, 91.0, 169.0, 484.0, 2641.0, 78058.0, 3749061.0, 356037.0, 5799.0, 722.0, 257.0, 121.0, 94.0, 50.0, 47.0, 48.0, 33.0, 26.0, 17.0, 35.0, 13.0, 11.0, 11.0, 9.0, 5.0, 9.0, 8.0, 5.0, 3.0, 7.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-23.265625, -22.50634765625, -21.7470703125, -20.98779296875, -20.228515625, -19.46923828125, -18.7099609375, -17.95068359375, -17.19140625, -16.43212890625, -15.6728515625, -14.91357421875, -14.154296875, -13.39501953125, -12.6357421875, -11.87646484375, -11.1171875, -10.35791015625, -9.5986328125, -8.83935546875, -8.080078125, -7.32080078125, -6.5615234375, -5.80224609375, -5.04296875, -4.28369140625, -3.5244140625, -2.76513671875, -2.005859375, -1.24658203125, -0.4873046875, 0.27197265625, 1.03125, 1.79052734375, 2.5498046875, 3.30908203125, 4.068359375, 4.82763671875, 5.5869140625, 6.34619140625, 7.10546875, 7.86474609375, 8.6240234375, 9.38330078125, 10.142578125, 10.90185546875, 11.6611328125, 12.42041015625, 13.1796875, 13.93896484375, 14.6982421875, 15.45751953125, 16.216796875, 16.97607421875, 17.7353515625, 18.49462890625, 19.25390625, 20.01318359375, 20.7724609375, 21.53173828125, 22.291015625, 23.05029296875, 23.8095703125, 24.56884765625, 25.328125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 13.0, 17.0, 35.0, 49.0, 118.0, 179.0, 331.0, 517.0, 781.0, 746.0, 547.0, 310.0, 190.0, 112.0, 63.0, 38.0, 13.0, 8.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-28.984375, -28.3677978515625, -27.751220703125, -27.1346435546875, -26.51806640625, -25.9014892578125, -25.284912109375, -24.6683349609375, -24.0517578125, -23.4351806640625, -22.818603515625, -22.2020263671875, -21.58544921875, -20.9688720703125, -20.352294921875, -19.7357177734375, -19.119140625, -18.5025634765625, -17.885986328125, -17.2694091796875, -16.65283203125, -16.0362548828125, -15.419677734375, -14.8031005859375, -14.1865234375, -13.5699462890625, -12.953369140625, -12.3367919921875, -11.72021484375, -11.1036376953125, -10.487060546875, -9.8704833984375, -9.25390625, -8.6373291015625, -8.020751953125, -7.4041748046875, -6.78759765625, -6.1710205078125, -5.554443359375, -4.9378662109375, -4.3212890625, -3.7047119140625, -3.088134765625, -2.4715576171875, -1.85498046875, -1.2384033203125, -0.621826171875, -0.0052490234375, 0.611328125, 1.2279052734375, 1.844482421875, 2.4610595703125, 3.07763671875, 3.6942138671875, 4.310791015625, 4.9273681640625, 5.5439453125, 6.1605224609375, 6.777099609375, 7.3936767578125, 8.01025390625, 8.6268310546875, 9.243408203125, 9.8599853515625, 10.4765625]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 6.0, 15.0, 21.0, 31.0, 74.0, 143.0, 232.0, 455.0, 1393.0, 69106.0, 4113156.0, 7961.0, 868.0, 356.0, 199.0, 117.0, 69.0, 44.0, 16.0, 8.0, 11.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.84375, -48.56689453125, -46.2900390625, -44.01318359375, -41.736328125, -39.45947265625, -37.1826171875, -34.90576171875, -32.62890625, -30.35205078125, -28.0751953125, -25.79833984375, -23.521484375, -21.24462890625, -18.9677734375, -16.69091796875, -14.4140625, -12.13720703125, -9.8603515625, -7.58349609375, -5.306640625, -3.02978515625, -0.7529296875, 1.52392578125, 3.80078125, 6.07763671875, 8.3544921875, 10.63134765625, 12.908203125, 15.18505859375, 17.4619140625, 19.73876953125, 22.015625, 24.29248046875, 26.5693359375, 28.84619140625, 31.123046875, 33.39990234375, 35.6767578125, 37.95361328125, 40.23046875, 42.50732421875, 44.7841796875, 47.06103515625, 49.337890625, 51.61474609375, 53.8916015625, 56.16845703125, 58.4453125, 60.72216796875, 62.9990234375, 65.27587890625, 67.552734375, 69.82958984375, 72.1064453125, 74.38330078125, 76.66015625, 78.93701171875, 81.2138671875, 83.49072265625, 85.767578125, 88.04443359375, 90.3212890625, 92.59814453125, 94.875]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 36.0, 185.0, 348.0, 310.0, 114.0, 15.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-235.33694458007812, -230.20626831054688, -225.07559204101562, -219.94493103027344, -214.8142547607422, -209.68357849121094, -204.5529022216797, -199.4222412109375, -194.29156494140625, -189.160888671875, -184.03021240234375, -178.89955139160156, -173.7688751220703, -168.63819885253906, -163.5075225830078, -158.37686157226562, -153.24618530273438, -148.11550903320312, -142.98483276367188, -137.8541717529297, -132.72349548339844, -127.59281921386719, -122.46214294433594, -117.33147430419922, -112.20079040527344, -107.07011413574219, -101.93944549560547, -96.80876922607422, -91.6781005859375, -86.54742431640625, -81.416748046875, -76.28607940673828, -71.15541076660156, -66.02473449707031, -60.894065856933594, -55.763389587402344, -50.632720947265625, -45.502044677734375, -40.37137222290039, -35.240699768066406, -30.110027313232422, -24.979354858398438, -19.848682403564453, -14.718008041381836, -9.587335586547852, -4.456663131713867, 0.67401123046875, 5.804683685302734, 10.935356140136719, 16.066028594970703, 21.196701049804688, 26.327375411987305, 31.45804786682129, 36.588722229003906, 41.71939468383789, 46.850067138671875, 51.98073959350586, 57.111412048339844, 62.24208450317383, 67.37275695800781, 72.50343322753906, 77.63410186767578, 82.76477813720703, 87.89544677734375, 93.026123046875]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 4.0, 6.0, 4.0, 6.0, 7.0, 7.0, 22.0, 12.0, 13.0, 10.0, 19.0, 15.0, 22.0, 19.0, 24.0, 16.0, 36.0, 26.0, 24.0, 25.0, 38.0, 21.0, 35.0, 30.0, 32.0, 37.0, 30.0, 45.0, 27.0, 34.0, 33.0, 33.0, 37.0, 35.0, 26.0, 28.0, 23.0, 21.0, 18.0, 18.0, 7.0, 13.0, 14.0, 5.0, 6.0, 7.0, 6.0, 5.0, 7.0, 9.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0], "bins": [-32.60755157470703, -31.63173484802246, -30.65591812133789, -29.68010139465332, -28.70428466796875, -27.728469848632812, -26.752653121948242, -25.776836395263672, -24.8010196685791, -23.82520294189453, -22.84938621520996, -21.87356948852539, -20.897754669189453, -19.92193603515625, -18.946121215820312, -17.970304489135742, -16.994487762451172, -16.0186710357666, -15.042854309082031, -14.067038536071777, -13.091221809387207, -12.115405082702637, -11.139589309692383, -10.163772583007812, -9.187955856323242, -8.212139129638672, -7.23632287979126, -6.260506629943848, -5.284689903259277, -4.308873176574707, -3.333056926727295, -2.357240676879883, -1.3814239501953125, -0.4056074619293213, 0.5702090263366699, 1.5460255146026611, 2.5218420028686523, 3.4976587295532227, 4.473474979400635, 5.449291229248047, 6.425107955932617, 7.4009246826171875, 8.376741409301758, 9.352557182312012, 10.328373908996582, 11.304190635681152, 12.280006408691406, 13.255823135375977, 14.231639862060547, 15.207456588745117, 16.183273315429688, 17.159090042114258, 18.134906768798828, 19.110721588134766, 20.086538314819336, 21.062355041503906, 22.038171768188477, 23.013988494873047, 23.989805221557617, 24.965621948242188, 25.941436767578125, 26.917255401611328, 27.893070220947266, 28.868886947631836, 29.844703674316406]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 5.0, 6.0, 8.0, 10.0, 11.0, 15.0, 21.0, 13.0, 18.0, 12.0, 17.0, 20.0, 29.0, 28.0, 32.0, 33.0, 51.0, 35.0, 42.0, 44.0, 49.0, 44.0, 44.0, 41.0, 35.0, 38.0, 39.0, 45.0, 29.0, 36.0, 25.0, 16.0, 19.0, 12.0, 13.0, 14.0, 13.0, 11.0, 6.0, 6.0, 4.0, 2.0, 5.0, 1.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-4.40234375, -4.26031494140625, -4.1182861328125, -3.97625732421875, -3.834228515625, -3.69219970703125, -3.5501708984375, -3.40814208984375, -3.26611328125, -3.12408447265625, -2.9820556640625, -2.84002685546875, -2.697998046875, -2.55596923828125, -2.4139404296875, -2.27191162109375, -2.1298828125, -1.98785400390625, -1.8458251953125, -1.70379638671875, -1.561767578125, -1.41973876953125, -1.2777099609375, -1.13568115234375, -0.99365234375, -0.85162353515625, -0.7095947265625, -0.56756591796875, -0.425537109375, -0.28350830078125, -0.1414794921875, 0.00054931640625, 0.142578125, 0.28460693359375, 0.4266357421875, 0.56866455078125, 0.710693359375, 0.85272216796875, 0.9947509765625, 1.13677978515625, 1.27880859375, 1.42083740234375, 1.5628662109375, 1.70489501953125, 1.846923828125, 1.98895263671875, 2.1309814453125, 2.27301025390625, 2.4150390625, 2.55706787109375, 2.6990966796875, 2.84112548828125, 2.983154296875, 3.12518310546875, 3.2672119140625, 3.40924072265625, 3.55126953125, 3.69329833984375, 3.8353271484375, 3.97735595703125, 4.119384765625, 4.26141357421875, 4.4034423828125, 4.54547119140625, 4.6875]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 4.0, 11.0, 15.0, 25.0, 36.0, 34.0, 71.0, 109.0, 127.0, 225.0, 296.0, 463.0, 668.0, 960.0, 1497.0, 2164.0, 3156.0, 4830.0, 7162.0, 10483.0, 16308.0, 25807.0, 42110.0, 70920.0, 121713.0, 190680.0, 202225.0, 137557.0, 79694.0, 46764.0, 28617.0, 18219.0, 11845.0, 7899.0, 5174.0, 3499.0, 2322.0, 1543.0, 1086.0, 725.0, 503.0, 340.0, 212.0, 168.0, 91.0, 71.0, 36.0, 36.0, 19.0, 16.0, 10.0, 6.0, 9.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.476318359375, -0.4619331359863281, -0.44754791259765625, -0.4331626892089844, -0.4187774658203125, -0.4043922424316406, -0.39000701904296875, -0.3756217956542969, -0.361236572265625, -0.3468513488769531, -0.33246612548828125, -0.3180809020996094, -0.3036956787109375, -0.2893104553222656, -0.27492523193359375, -0.2605400085449219, -0.24615478515625, -0.23176956176757812, -0.21738433837890625, -0.20299911499023438, -0.1886138916015625, -0.17422866821289062, -0.15984344482421875, -0.14545822143554688, -0.131072998046875, -0.11668777465820312, -0.10230255126953125, -0.08791732788085938, -0.0735321044921875, -0.059146881103515625, -0.04476165771484375, -0.030376434326171875, -0.0159912109375, -0.001605987548828125, 0.01277923583984375, 0.027164459228515625, 0.0415496826171875, 0.055934906005859375, 0.07032012939453125, 0.08470535278320312, 0.099090576171875, 0.11347579956054688, 0.12786102294921875, 0.14224624633789062, 0.1566314697265625, 0.17101669311523438, 0.18540191650390625, 0.19978713989257812, 0.21417236328125, 0.22855758666992188, 0.24294281005859375, 0.2573280334472656, 0.2717132568359375, 0.2860984802246094, 0.30048370361328125, 0.3148689270019531, 0.329254150390625, 0.3436393737792969, 0.35802459716796875, 0.3724098205566406, 0.3867950439453125, 0.4011802673339844, 0.41556549072265625, 0.4299507141113281, 0.4443359375]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 5.0, 3.0, 6.0, 8.0, 2.0, 7.0, 9.0, 12.0, 18.0, 17.0, 21.0, 14.0, 20.0, 34.0, 31.0, 33.0, 36.0, 42.0, 30.0, 40.0, 45.0, 40.0, 1068.0, 42.0, 41.0, 38.0, 34.0, 40.0, 35.0, 26.0, 29.0, 22.0, 33.0, 18.0, 30.0, 22.0, 16.0, 13.0, 10.0, 13.0, 6.0, 4.0, 4.0, 4.0, 4.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-2.701171875, -2.6123046875, -2.5234375, -2.4345703125, -2.345703125, -2.2568359375, -2.16796875, -2.0791015625, -1.990234375, -1.9013671875, -1.8125, -1.7236328125, -1.634765625, -1.5458984375, -1.45703125, -1.3681640625, -1.279296875, -1.1904296875, -1.1015625, -1.0126953125, -0.923828125, -0.8349609375, -0.74609375, -0.6572265625, -0.568359375, -0.4794921875, -0.390625, -0.3017578125, -0.212890625, -0.1240234375, -0.03515625, 0.0537109375, 0.142578125, 0.2314453125, 0.3203125, 0.4091796875, 0.498046875, 0.5869140625, 0.67578125, 0.7646484375, 0.853515625, 0.9423828125, 1.03125, 1.1201171875, 1.208984375, 1.2978515625, 1.38671875, 1.4755859375, 1.564453125, 1.6533203125, 1.7421875, 1.8310546875, 1.919921875, 2.0087890625, 2.09765625, 2.1865234375, 2.275390625, 2.3642578125, 2.453125, 2.5419921875, 2.630859375, 2.7197265625, 2.80859375, 2.8974609375, 2.986328125]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 11.0, 17.0, 19.0, 26.0, 32.0, 46.0, 87.0, 118.0, 224.0, 295.0, 462.0, 702.0, 1099.0, 1732.0, 2748.0, 4347.0, 7248.0, 11785.0, 19886.0, 33933.0, 59909.0, 103860.0, 171600.0, 1265654.0, 168875.0, 101556.0, 58193.0, 33187.0, 19614.0, 11431.0, 7053.0, 4166.0, 2645.0, 1669.0, 999.0, 648.0, 404.0, 299.0, 180.0, 119.0, 99.0, 53.0, 39.0, 16.0, 14.0, 18.0, 6.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.4443359375, -0.4302215576171875, -0.416107177734375, -0.4019927978515625, -0.38787841796875, -0.3737640380859375, -0.359649658203125, -0.3455352783203125, -0.3314208984375, -0.3173065185546875, -0.303192138671875, -0.2890777587890625, -0.27496337890625, -0.2608489990234375, -0.246734619140625, -0.2326202392578125, -0.218505859375, -0.2043914794921875, -0.190277099609375, -0.1761627197265625, -0.16204833984375, -0.1479339599609375, -0.133819580078125, -0.1197052001953125, -0.1055908203125, -0.0914764404296875, -0.077362060546875, -0.0632476806640625, -0.04913330078125, -0.0350189208984375, -0.020904541015625, -0.0067901611328125, 0.00732421875, 0.0214385986328125, 0.035552978515625, 0.0496673583984375, 0.06378173828125, 0.0778961181640625, 0.092010498046875, 0.1061248779296875, 0.1202392578125, 0.1343536376953125, 0.148468017578125, 0.1625823974609375, 0.17669677734375, 0.1908111572265625, 0.204925537109375, 0.2190399169921875, 0.233154296875, 0.2472686767578125, 0.261383056640625, 0.2754974365234375, 0.28961181640625, 0.3037261962890625, 0.317840576171875, 0.3319549560546875, 0.3460693359375, 0.3601837158203125, 0.374298095703125, 0.3884124755859375, 0.40252685546875, 0.4166412353515625, 0.430755615234375, 0.4448699951171875, 0.458984375]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 5.0, 2.0, 4.0, 15.0, 7.0, 9.0, 10.0, 20.0, 17.0, 30.0, 34.0, 33.0, 32.0, 40.0, 37.0, 57.0, 51.0, 60.0, 66.0, 48.0, 34.0, 48.0, 48.0, 35.0, 44.0, 32.0, 48.0, 21.0, 34.0, 23.0, 14.0, 14.0, 10.0, 8.0, 6.0, 7.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00075531005859375, -0.0007317662239074707, -0.0007082223892211914, -0.0006846785545349121, -0.0006611347198486328, -0.0006375908851623535, -0.0006140470504760742, -0.0005905032157897949, -0.0005669593811035156, -0.0005434155464172363, -0.000519871711730957, -0.0004963278770446777, -0.00047278404235839844, -0.00044924020767211914, -0.00042569637298583984, -0.00040215253829956055, -0.00037860870361328125, -0.00035506486892700195, -0.00033152103424072266, -0.00030797719955444336, -0.00028443336486816406, -0.00026088953018188477, -0.00023734569549560547, -0.00021380186080932617, -0.00019025802612304688, -0.00016671419143676758, -0.00014317035675048828, -0.00011962652206420898, -9.608268737792969e-05, -7.253885269165039e-05, -4.8995018005371094e-05, -2.5451183319091797e-05, -1.9073486328125e-06, 2.1636486053466797e-05, 4.5180320739746094e-05, 6.872415542602539e-05, 9.226799011230469e-05, 0.00011581182479858398, 0.00013935565948486328, 0.00016289949417114258, 0.00018644332885742188, 0.00020998716354370117, 0.00023353099822998047, 0.00025707483291625977, 0.00028061866760253906, 0.00030416250228881836, 0.00032770633697509766, 0.00035125017166137695, 0.00037479400634765625, 0.00039833784103393555, 0.00042188167572021484, 0.00044542551040649414, 0.00046896934509277344, 0.0004925131797790527, 0.000516057014465332, 0.0005396008491516113, 0.0005631446838378906, 0.0005866885185241699, 0.0006102323532104492, 0.0006337761878967285, 0.0006573200225830078, 0.0006808638572692871, 0.0007044076919555664, 0.0007279515266418457, 0.000751495361328125]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 7.0, 4.0, 11.0, 10.0, 12.0, 11.0, 16.0, 20.0, 27.0, 35.0, 33.0, 44.0, 78.0, 105.0, 188.0, 286.0, 535.0, 1346.0, 232150.0, 809933.0, 1984.0, 701.0, 350.0, 198.0, 129.0, 70.0, 57.0, 42.0, 36.0, 23.0, 18.0, 16.0, 17.0, 10.0, 17.0, 9.0, 5.0, 6.0, 10.0, 4.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01517486572265625, -0.014716863632202148, -0.014258861541748047, -0.013800859451293945, -0.013342857360839844, -0.012884855270385742, -0.01242685317993164, -0.011968851089477539, -0.011510848999023438, -0.011052846908569336, -0.010594844818115234, -0.010136842727661133, -0.009678840637207031, -0.00922083854675293, -0.008762836456298828, -0.008304834365844727, -0.007846832275390625, -0.0073888301849365234, -0.006930828094482422, -0.00647282600402832, -0.006014823913574219, -0.005556821823120117, -0.005098819732666016, -0.004640817642211914, -0.0041828155517578125, -0.003724813461303711, -0.0032668113708496094, -0.002808809280395508, -0.0023508071899414062, -0.0018928050994873047, -0.0014348030090332031, -0.0009768009185791016, -0.000518798828125, -6.079673767089844e-05, 0.0003972053527832031, 0.0008552074432373047, 0.0013132095336914062, 0.0017712116241455078, 0.0022292137145996094, 0.002687215805053711, 0.0031452178955078125, 0.003603219985961914, 0.004061222076416016, 0.004519224166870117, 0.004977226257324219, 0.00543522834777832, 0.005893230438232422, 0.0063512325286865234, 0.006809234619140625, 0.0072672367095947266, 0.007725238800048828, 0.00818324089050293, 0.008641242980957031, 0.009099245071411133, 0.009557247161865234, 0.010015249252319336, 0.010473251342773438, 0.010931253433227539, 0.01138925552368164, 0.011847257614135742, 0.012305259704589844, 0.012763261795043945, 0.013221263885498047, 0.013679265975952148, 0.01413726806640625]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 15.0, 33.0, 136.0, 261.0, 265.0, 197.0, 70.0, 22.0, 10.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014417300699278712, -0.0014030232559889555, -0.0013643165584653616, -0.0013256098609417677, -0.001286903047002852, -0.0012481962330639362, -0.0012094895355403423, -0.0011707828380167484, -0.0011320760240778327, -0.001093369210138917, -0.001054662512615323, -0.0010159558150917292, -0.0009772490011528134, -0.0009385422454215586, -0.0008998354896903038, -0.000861128733959049, -0.0008224219782277942, -0.0007837152224965394, -0.0007450084667652845, -0.0007063017110340297, -0.0006675949553027749, -0.0006288881995715201, -0.0005901814438402653, -0.0005514746881090105, -0.0005127679323777556, -0.0004740611766465008, -0.000435354420915246, -0.0003966476651839912, -0.0003579409094527364, -0.00031923415372148156, -0.00028052739799022675, -0.00024182064225897193, -0.0002031137701123953, -0.00016440701438114047, -0.00012570025864988565, -8.699350291863084e-05, -4.828674718737602e-05, -9.579991456121206e-06, 2.912676427513361e-05, 6.783352000638843e-05, 0.00010654027573764324, 0.00014524703146889806, 0.00018395378720015287, 0.0002226605429314077, 0.0002613672986626625, 0.0003000740543939173, 0.00033878081012517214, 0.00037748756585642695, 0.00041619432158768177, 0.0004549010773189366, 0.0004936078330501914, 0.0005323145887814462, 0.000571021344512701, 0.0006097281002439559, 0.0006484348559752107, 0.0006871416117064655, 0.0007258483674377203, 0.0007645551231689751, 0.0008032618789002299, 0.0008419686346314847, 0.0008806753903627396, 0.0009193821460939944, 0.0009580889018252492, 0.000996795715764165, 0.0010355024132877588]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 1.0, 3.0, 1.0, 5.0, 5.0, 10.0, 8.0, 8.0, 5.0, 11.0, 17.0, 10.0, 20.0, 14.0, 18.0, 32.0, 23.0, 38.0, 38.0, 39.0, 39.0, 40.0, 33.0, 41.0, 41.0, 33.0, 26.0, 37.0, 46.0, 42.0, 28.0, 35.0, 37.0, 27.0, 29.0, 20.0, 29.0, 22.0, 21.0, 9.0, 12.0, 14.0, 8.0, 6.0, 6.0, 8.0, 5.0, 6.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003584623336791992, -0.00034604407846927643, -0.00033362582325935364, -0.00032120756804943085, -0.00030878931283950806, -0.00029637105762958527, -0.0002839528024196625, -0.0002715345472097397, -0.0002591162919998169, -0.0002466980367898941, -0.0002342797815799713, -0.00022186152637004852, -0.00020944327116012573, -0.00019702501595020294, -0.00018460676074028015, -0.00017218850553035736, -0.00015977025032043457, -0.00014735199511051178, -0.000134933739900589, -0.0001225154846906662, -0.00011009722948074341, -9.767897427082062e-05, -8.526071906089783e-05, -7.284246385097504e-05, -6.0424208641052246e-05, -4.8005953431129456e-05, -3.5587698221206665e-05, -2.3169443011283875e-05, -1.0751187801361084e-05, 1.6670674085617065e-06, 1.4085322618484497e-05, 2.6503577828407288e-05, 3.892183303833008e-05, 5.134008824825287e-05, 6.375834345817566e-05, 7.617659866809845e-05, 8.859485387802124e-05, 0.00010101310908794403, 0.00011343136429786682, 0.0001258496195077896, 0.0001382678747177124, 0.0001506861299276352, 0.00016310438513755798, 0.00017552264034748077, 0.00018794089555740356, 0.00020035915076732635, 0.00021277740597724915, 0.00022519566118717194, 0.00023761391639709473, 0.0002500321716070175, 0.0002624504268169403, 0.0002748686820268631, 0.0002872869372367859, 0.0002997051924467087, 0.00031212344765663147, 0.00032454170286655426, 0.00033695995807647705, 0.00034937821328639984, 0.00036179646849632263, 0.0003742147237062454, 0.0003866329789161682, 0.000399051234126091, 0.0004114694893360138, 0.0004238877445459366, 0.0004363059997558594]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 5.0, 6.0, 8.0, 10.0, 11.0, 15.0, 21.0, 13.0, 18.0, 12.0, 17.0, 20.0, 29.0, 28.0, 32.0, 33.0, 51.0, 35.0, 42.0, 44.0, 49.0, 44.0, 44.0, 41.0, 35.0, 38.0, 39.0, 45.0, 29.0, 36.0, 25.0, 16.0, 19.0, 12.0, 13.0, 14.0, 13.0, 11.0, 6.0, 6.0, 4.0, 2.0, 5.0, 1.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-4.40234375, -4.26031494140625, -4.1182861328125, -3.97625732421875, -3.834228515625, -3.69219970703125, -3.5501708984375, -3.40814208984375, -3.26611328125, -3.12408447265625, -2.9820556640625, -2.84002685546875, -2.697998046875, -2.55596923828125, -2.4139404296875, -2.27191162109375, -2.1298828125, -1.98785400390625, -1.8458251953125, -1.70379638671875, -1.561767578125, -1.41973876953125, -1.2777099609375, -1.13568115234375, -0.99365234375, -0.85162353515625, -0.7095947265625, -0.56756591796875, -0.425537109375, -0.28350830078125, -0.1414794921875, 0.00054931640625, 0.142578125, 0.28460693359375, 0.4266357421875, 0.56866455078125, 0.710693359375, 0.85272216796875, 0.9947509765625, 1.13677978515625, 1.27880859375, 1.42083740234375, 1.5628662109375, 1.70489501953125, 1.846923828125, 1.98895263671875, 2.1309814453125, 2.27301025390625, 2.4150390625, 2.55706787109375, 2.6990966796875, 2.84112548828125, 2.983154296875, 3.12518310546875, 3.2672119140625, 3.40924072265625, 3.55126953125, 3.69329833984375, 3.8353271484375, 3.97735595703125, 4.119384765625, 4.26141357421875, 4.4034423828125, 4.54547119140625, 4.6875]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 10.0, 8.0, 10.0, 8.0, 25.0, 21.0, 30.0, 46.0, 70.0, 117.0, 181.0, 269.0, 412.0, 632.0, 977.0, 1541.0, 2478.0, 3979.0, 6349.0, 10371.0, 17231.0, 30881.0, 62314.0, 147775.0, 356523.0, 222834.0, 87357.0, 40521.0, 21857.0, 12836.0, 7778.0, 4775.0, 2970.0, 1951.0, 1210.0, 748.0, 474.0, 332.0, 215.0, 143.0, 105.0, 63.0, 44.0, 22.0, 18.0, 21.0, 10.0, 6.0, 2.0, 3.0, 2.0, 5.0, 4.0, 1.0], "bins": [-3.001953125, -2.91546630859375, -2.8289794921875, -2.74249267578125, -2.656005859375, -2.56951904296875, -2.4830322265625, -2.39654541015625, -2.31005859375, -2.22357177734375, -2.1370849609375, -2.05059814453125, -1.964111328125, -1.87762451171875, -1.7911376953125, -1.70465087890625, -1.6181640625, -1.53167724609375, -1.4451904296875, -1.35870361328125, -1.272216796875, -1.18572998046875, -1.0992431640625, -1.01275634765625, -0.92626953125, -0.83978271484375, -0.7532958984375, -0.66680908203125, -0.580322265625, -0.49383544921875, -0.4073486328125, -0.32086181640625, -0.234375, -0.14788818359375, -0.0614013671875, 0.02508544921875, 0.111572265625, 0.19805908203125, 0.2845458984375, 0.37103271484375, 0.45751953125, 0.54400634765625, 0.6304931640625, 0.71697998046875, 0.803466796875, 0.88995361328125, 0.9764404296875, 1.06292724609375, 1.1494140625, 1.23590087890625, 1.3223876953125, 1.40887451171875, 1.495361328125, 1.58184814453125, 1.6683349609375, 1.75482177734375, 1.84130859375, 1.92779541015625, 2.0142822265625, 2.10076904296875, 2.187255859375, 2.27374267578125, 2.3602294921875, 2.44671630859375, 2.533203125]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 10.0, 8.0, 14.0, 4.0, 13.0, 9.0, 13.0, 23.0, 26.0, 19.0, 25.0, 27.0, 33.0, 25.0, 34.0, 39.0, 39.0, 41.0, 78.0, 180.0, 1635.0, 208.0, 68.0, 56.0, 46.0, 35.0, 35.0, 39.0, 26.0, 29.0, 38.0, 17.0, 24.0, 17.0, 22.0, 17.0, 11.0, 12.0, 10.0, 6.0, 9.0, 3.0, 5.0, 8.0, 5.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.609375, -13.1644287109375, -12.719482421875, -12.2745361328125, -11.82958984375, -11.3846435546875, -10.939697265625, -10.4947509765625, -10.0498046875, -9.6048583984375, -9.159912109375, -8.7149658203125, -8.27001953125, -7.8250732421875, -7.380126953125, -6.9351806640625, -6.490234375, -6.0452880859375, -5.600341796875, -5.1553955078125, -4.71044921875, -4.2655029296875, -3.820556640625, -3.3756103515625, -2.9306640625, -2.4857177734375, -2.040771484375, -1.5958251953125, -1.15087890625, -0.7059326171875, -0.260986328125, 0.1839599609375, 0.62890625, 1.0738525390625, 1.518798828125, 1.9637451171875, 2.40869140625, 2.8536376953125, 3.298583984375, 3.7435302734375, 4.1884765625, 4.6334228515625, 5.078369140625, 5.5233154296875, 5.96826171875, 6.4132080078125, 6.858154296875, 7.3031005859375, 7.748046875, 8.1929931640625, 8.637939453125, 9.0828857421875, 9.52783203125, 9.9727783203125, 10.417724609375, 10.8626708984375, 11.3076171875, 11.7525634765625, 12.197509765625, 12.6424560546875, 13.08740234375, 13.5323486328125, 13.977294921875, 14.4222412109375, 14.8671875]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 4.0, 4.0, 2.0, 4.0, 4.0, 9.0, 13.0, 19.0, 26.0, 44.0, 67.0, 79.0, 116.0, 204.0, 407.0, 1054.0, 46131.0, 3091058.0, 5089.0, 612.0, 309.0, 167.0, 86.0, 48.0, 38.0, 42.0, 23.0, 12.0, 6.0, 9.0, 8.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-63.65625, -61.85205078125, -60.0478515625, -58.24365234375, -56.439453125, -54.63525390625, -52.8310546875, -51.02685546875, -49.22265625, -47.41845703125, -45.6142578125, -43.81005859375, -42.005859375, -40.20166015625, -38.3974609375, -36.59326171875, -34.7890625, -32.98486328125, -31.1806640625, -29.37646484375, -27.572265625, -25.76806640625, -23.9638671875, -22.15966796875, -20.35546875, -18.55126953125, -16.7470703125, -14.94287109375, -13.138671875, -11.33447265625, -9.5302734375, -7.72607421875, -5.921875, -4.11767578125, -2.3134765625, -0.50927734375, 1.294921875, 3.09912109375, 4.9033203125, 6.70751953125, 8.51171875, 10.31591796875, 12.1201171875, 13.92431640625, 15.728515625, 17.53271484375, 19.3369140625, 21.14111328125, 22.9453125, 24.74951171875, 26.5537109375, 28.35791015625, 30.162109375, 31.96630859375, 33.7705078125, 35.57470703125, 37.37890625, 39.18310546875, 40.9873046875, 42.79150390625, 44.595703125, 46.39990234375, 48.2041015625, 50.00830078125, 51.8125]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 28.0, 778.0, 211.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-305.2459716796875, -299.4556884765625, -293.6654052734375, -287.8751525878906, -282.0848693847656, -276.2945861816406, -270.5043029785156, -264.7140197753906, -258.92376708984375, -253.13348388671875, -247.3432159423828, -241.5529327392578, -235.76266479492188, -229.97238159179688, -224.18209838867188, -218.39181518554688, -212.60153198242188, -206.81124877929688, -201.02098083496094, -195.23069763183594, -189.4404296875, -183.650146484375, -177.85986328125, -172.069580078125, -166.27931213378906, -160.48902893066406, -154.69876098632812, -148.90847778320312, -143.11819458007812, -137.3279266357422, -131.5376434326172, -125.74736785888672, -119.95708465576172, -114.16680908203125, -108.37652587890625, -102.58625030517578, -96.79597473144531, -91.00569915771484, -85.21542358398438, -79.42514038085938, -73.6348648071289, -67.84458923339844, -62.0543098449707, -56.26403045654297, -50.4737548828125, -44.68347930908203, -38.8931999206543, -33.10292053222656, -27.312644958496094, -21.522367477416992, -15.73208999633789, -9.941812515258789, -4.1515350341796875, 1.638742446899414, 7.429019927978516, 13.21929931640625, 19.00957489013672, 24.79985237121582, 30.590129852294922, 36.380409240722656, 42.170684814453125, 47.960960388183594, 53.75123977661133, 59.54151916503906, 65.33179473876953]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 5.0, 4.0, 6.0, 4.0, 7.0, 8.0, 9.0, 7.0, 16.0, 24.0, 25.0, 25.0, 25.0, 45.0, 28.0, 39.0, 42.0, 38.0, 41.0, 44.0, 39.0, 44.0, 37.0, 44.0, 40.0, 39.0, 44.0, 31.0, 35.0, 28.0, 35.0, 30.0, 25.0, 23.0, 22.0, 16.0, 8.0, 13.0, 6.0, 2.0, 1.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.61305236816406, -48.06504821777344, -46.51704025268555, -44.96903610229492, -43.4210319519043, -41.873023986816406, -40.32501983642578, -38.777015686035156, -37.22901153564453, -35.681007385253906, -34.132999420166016, -32.58499526977539, -31.036991119384766, -29.488985061645508, -27.94097900390625, -26.392974853515625, -24.844966888427734, -23.296960830688477, -21.74895668029785, -20.200950622558594, -18.65294647216797, -17.10494041442871, -15.556934356689453, -14.008929252624512, -12.46092414855957, -10.912919044494629, -9.364913940429688, -7.81690788269043, -6.268902778625488, -4.720897674560547, -3.172891616821289, -1.6248865127563477, -0.07688140869140625, 1.4711239337921143, 3.0191292762756348, 4.567134857177734, 6.115139961242676, 7.663145065307617, 9.211151123046875, 10.759156227111816, 12.307161331176758, 13.8551664352417, 15.40317153930664, 16.9511775970459, 18.499183654785156, 20.04718780517578, 21.59519386291504, 23.143199920654297, 24.691204071044922, 26.23921012878418, 27.787214279174805, 29.335220336914062, 30.883224487304688, 32.43122863769531, 33.9792366027832, 35.52724075317383, 37.07524871826172, 38.623252868652344, 40.171260833740234, 41.71926498413086, 43.267269134521484, 44.815277099609375, 46.36328125, 47.911285400390625, 49.45928955078125]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 4.0, 4.0, 9.0, 11.0, 6.0, 17.0, 22.0, 18.0, 14.0, 14.0, 14.0, 21.0, 29.0, 40.0, 38.0, 40.0, 33.0, 44.0, 43.0, 52.0, 48.0, 46.0, 42.0, 38.0, 43.0, 42.0, 36.0, 44.0, 25.0, 26.0, 26.0, 17.0, 21.0, 13.0, 11.0, 8.0, 12.0, 12.0, 2.0, 6.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-4.9375, -4.781005859375, -4.62451171875, -4.468017578125, -4.3115234375, -4.155029296875, -3.99853515625, -3.842041015625, -3.685546875, -3.529052734375, -3.37255859375, -3.216064453125, -3.0595703125, -2.903076171875, -2.74658203125, -2.590087890625, -2.43359375, -2.277099609375, -2.12060546875, -1.964111328125, -1.8076171875, -1.651123046875, -1.49462890625, -1.338134765625, -1.181640625, -1.025146484375, -0.86865234375, -0.712158203125, -0.5556640625, -0.399169921875, -0.24267578125, -0.086181640625, 0.0703125, 0.226806640625, 0.38330078125, 0.539794921875, 0.6962890625, 0.852783203125, 1.00927734375, 1.165771484375, 1.322265625, 1.478759765625, 1.63525390625, 1.791748046875, 1.9482421875, 2.104736328125, 2.26123046875, 2.417724609375, 2.57421875, 2.730712890625, 2.88720703125, 3.043701171875, 3.2001953125, 3.356689453125, 3.51318359375, 3.669677734375, 3.826171875, 3.982666015625, 4.13916015625, 4.295654296875, 4.4521484375, 4.608642578125, 4.76513671875, 4.921630859375, 5.078125]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 5.0, 8.0, 10.0, 13.0, 14.0, 30.0, 33.0, 39.0, 42.0, 52.0, 59.0, 108.0, 148.0, 253.0, 531.0, 1148.0, 3715.0, 15193.0, 93876.0, 806701.0, 2388524.0, 777209.0, 85657.0, 14581.0, 3748.0, 1226.0, 527.0, 271.0, 144.0, 106.0, 63.0, 52.0, 50.0, 31.0, 22.0, 23.0, 16.0, 12.0, 10.0, 6.0, 5.0, 12.0, 3.0, 2.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.03125, -8.7249755859375, -8.418701171875, -8.1124267578125, -7.80615234375, -7.4998779296875, -7.193603515625, -6.8873291015625, -6.5810546875, -6.2747802734375, -5.968505859375, -5.6622314453125, -5.35595703125, -5.0496826171875, -4.743408203125, -4.4371337890625, -4.130859375, -3.8245849609375, -3.518310546875, -3.2120361328125, -2.90576171875, -2.5994873046875, -2.293212890625, -1.9869384765625, -1.6806640625, -1.3743896484375, -1.068115234375, -0.7618408203125, -0.45556640625, -0.1492919921875, 0.156982421875, 0.4632568359375, 0.76953125, 1.0758056640625, 1.382080078125, 1.6883544921875, 1.99462890625, 2.3009033203125, 2.607177734375, 2.9134521484375, 3.2197265625, 3.5260009765625, 3.832275390625, 4.1385498046875, 4.44482421875, 4.7510986328125, 5.057373046875, 5.3636474609375, 5.669921875, 5.9761962890625, 6.282470703125, 6.5887451171875, 6.89501953125, 7.2012939453125, 7.507568359375, 7.8138427734375, 8.1201171875, 8.4263916015625, 8.732666015625, 9.0389404296875, 9.34521484375, 9.6514892578125, 9.957763671875, 10.2640380859375, 10.5703125]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 14.0, 8.0, 11.0, 15.0, 28.0, 35.0, 48.0, 60.0, 85.0, 112.0, 164.0, 203.0, 271.0, 349.0, 402.0, 470.0, 432.0, 352.0, 261.0, 200.0, 148.0, 113.0, 76.0, 64.0, 41.0, 21.0, 20.0, 16.0, 19.0, 9.0, 4.0, 6.0, 3.0, 5.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.2421875, -9.8946533203125, -9.547119140625, -9.1995849609375, -8.85205078125, -8.5045166015625, -8.156982421875, -7.8094482421875, -7.4619140625, -7.1143798828125, -6.766845703125, -6.4193115234375, -6.07177734375, -5.7242431640625, -5.376708984375, -5.0291748046875, -4.681640625, -4.3341064453125, -3.986572265625, -3.6390380859375, -3.29150390625, -2.9439697265625, -2.596435546875, -2.2489013671875, -1.9013671875, -1.5538330078125, -1.206298828125, -0.8587646484375, -0.51123046875, -0.1636962890625, 0.183837890625, 0.5313720703125, 0.87890625, 1.2264404296875, 1.573974609375, 1.9215087890625, 2.26904296875, 2.6165771484375, 2.964111328125, 3.3116455078125, 3.6591796875, 4.0067138671875, 4.354248046875, 4.7017822265625, 5.04931640625, 5.3968505859375, 5.744384765625, 6.0919189453125, 6.439453125, 6.7869873046875, 7.134521484375, 7.4820556640625, 7.82958984375, 8.1771240234375, 8.524658203125, 8.8721923828125, 9.2197265625, 9.5672607421875, 9.914794921875, 10.2623291015625, 10.60986328125, 10.9573974609375, 11.304931640625, 11.6524658203125, 12.0]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 5.0, 6.0, 8.0, 6.0, 7.0, 8.0, 8.0, 9.0, 16.0, 19.0, 37.0, 42.0, 51.0, 69.0, 84.0, 108.0, 153.0, 301.0, 632.0, 1508.0, 11253.0, 973081.0, 3174743.0, 28149.0, 2152.0, 704.0, 358.0, 229.0, 121.0, 84.0, 73.0, 65.0, 55.0, 33.0, 26.0, 24.0, 14.0, 9.0, 6.0, 9.0, 8.0, 6.0, 4.0, 3.0, 0.0, 2.0, 1.0, 3.0], "bins": [-43.8125, -42.66357421875, -41.5146484375, -40.36572265625, -39.216796875, -38.06787109375, -36.9189453125, -35.77001953125, -34.62109375, -33.47216796875, -32.3232421875, -31.17431640625, -30.025390625, -28.87646484375, -27.7275390625, -26.57861328125, -25.4296875, -24.28076171875, -23.1318359375, -21.98291015625, -20.833984375, -19.68505859375, -18.5361328125, -17.38720703125, -16.23828125, -15.08935546875, -13.9404296875, -12.79150390625, -11.642578125, -10.49365234375, -9.3447265625, -8.19580078125, -7.046875, -5.89794921875, -4.7490234375, -3.60009765625, -2.451171875, -1.30224609375, -0.1533203125, 0.99560546875, 2.14453125, 3.29345703125, 4.4423828125, 5.59130859375, 6.740234375, 7.88916015625, 9.0380859375, 10.18701171875, 11.3359375, 12.48486328125, 13.6337890625, 14.78271484375, 15.931640625, 17.08056640625, 18.2294921875, 19.37841796875, 20.52734375, 21.67626953125, 22.8251953125, 23.97412109375, 25.123046875, 26.27197265625, 27.4208984375, 28.56982421875, 29.71875]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 15.0, 67.0, 209.0, 403.0, 236.0, 65.0, 16.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.55224609375, -89.45958709716797, -84.36692810058594, -79.2742691040039, -74.18161010742188, -69.08895111083984, -63.99629211425781, -58.90363311767578, -53.81097412109375, -48.71831512451172, -43.62565612792969, -38.532997131347656, -33.440338134765625, -28.347679138183594, -23.255020141601562, -18.16236114501953, -13.0697021484375, -7.977043151855469, -2.8843841552734375, 2.2082748413085938, 7.300933837890625, 12.393592834472656, 17.486251831054688, 22.57891082763672, 27.67156982421875, 32.76422882080078, 37.85688781738281, 42.949546813964844, 48.042205810546875, 53.134864807128906, 58.22752380371094, 63.32018280029297, 68.412841796875, 73.50550079345703, 78.59815979003906, 83.6908187866211, 88.78347778320312, 93.87613677978516, 98.96879577636719, 104.06145477294922, 109.15411376953125, 114.24677276611328, 119.33943176269531, 124.43209075927734, 129.52474975585938, 134.61740112304688, 139.71006774902344, 144.802734375, 149.8953857421875, 154.988037109375, 160.08070373535156, 165.17337036132812, 170.26602172851562, 175.35867309570312, 180.4513397216797, 185.54400634765625, 190.63665771484375, 195.72930908203125, 200.8219757080078, 205.91464233398438, 211.00729370117188, 216.09994506835938, 221.19261169433594, 226.2852783203125, 231.3779296875]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 6.0, 3.0, 3.0, 4.0, 8.0, 8.0, 12.0, 6.0, 19.0, 10.0, 17.0, 22.0, 18.0, 28.0, 27.0, 22.0, 26.0, 36.0, 38.0, 47.0, 37.0, 38.0, 38.0, 41.0, 38.0, 32.0, 37.0, 34.0, 27.0, 28.0, 24.0, 36.0, 21.0, 29.0, 26.0, 24.0, 17.0, 12.0, 13.0, 17.0, 14.0, 6.0, 8.0, 13.0, 9.0, 4.0, 4.0, 3.0, 3.0, 4.0, 4.0, 3.0, 1.0, 4.0, 3.0, 0.0, 2.0], "bins": [-31.283584594726562, -30.273103713989258, -29.262622833251953, -28.25214385986328, -27.241662979125977, -26.231182098388672, -25.220703125, -24.210222244262695, -23.19974136352539, -22.189260482788086, -21.17877960205078, -20.16830062866211, -19.157819747924805, -18.1473388671875, -17.136859893798828, -16.126379013061523, -15.115898132324219, -14.105417251586914, -13.094937324523926, -12.084457397460938, -11.073976516723633, -10.063495635986328, -9.05301570892334, -8.042535781860352, -7.032054901123047, -6.0215744972229, -5.011094093322754, -4.000613689422607, -2.990133285522461, -1.9796528816223145, -0.969172477722168, 0.041307926177978516, 1.051788330078125, 2.0622687339782715, 3.072749137878418, 4.0832295417785645, 5.093709945678711, 6.104190349578857, 7.114670753479004, 8.125150680541992, 9.135631561279297, 10.146112442016602, 11.15659236907959, 12.167072296142578, 13.177553176879883, 14.188034057617188, 15.198513984680176, 16.208993911743164, 17.21947479248047, 18.229955673217773, 19.240436553955078, 20.25091552734375, 21.261396408081055, 22.27187728881836, 23.28235626220703, 24.292837142944336, 25.30331802368164, 26.313798904418945, 27.32427978515625, 28.334758758544922, 29.345239639282227, 30.35572052001953, 31.366199493408203, 32.37668228149414, 33.38716125488281]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 2.0, 3.0, 8.0, 7.0, 4.0, 10.0, 11.0, 12.0, 18.0, 24.0, 27.0, 31.0, 21.0, 23.0, 24.0, 35.0, 30.0, 45.0, 46.0, 41.0, 52.0, 39.0, 37.0, 52.0, 50.0, 37.0, 36.0, 36.0, 41.0, 29.0, 41.0, 15.0, 26.0, 20.0, 10.0, 15.0, 6.0, 6.0, 8.0, 8.0, 4.0, 8.0, 1.0, 4.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.98828125, -4.83038330078125, -4.6724853515625, -4.51458740234375, -4.356689453125, -4.19879150390625, -4.0408935546875, -3.88299560546875, -3.72509765625, -3.56719970703125, -3.4093017578125, -3.25140380859375, -3.093505859375, -2.93560791015625, -2.7777099609375, -2.61981201171875, -2.4619140625, -2.30401611328125, -2.1461181640625, -1.98822021484375, -1.830322265625, -1.67242431640625, -1.5145263671875, -1.35662841796875, -1.19873046875, -1.04083251953125, -0.8829345703125, -0.72503662109375, -0.567138671875, -0.40924072265625, -0.2513427734375, -0.09344482421875, 0.064453125, 0.22235107421875, 0.3802490234375, 0.53814697265625, 0.696044921875, 0.85394287109375, 1.0118408203125, 1.16973876953125, 1.32763671875, 1.48553466796875, 1.6434326171875, 1.80133056640625, 1.959228515625, 2.11712646484375, 2.2750244140625, 2.43292236328125, 2.5908203125, 2.74871826171875, 2.9066162109375, 3.06451416015625, 3.222412109375, 3.38031005859375, 3.5382080078125, 3.69610595703125, 3.85400390625, 4.01190185546875, 4.1697998046875, 4.32769775390625, 4.485595703125, 4.64349365234375, 4.8013916015625, 4.95928955078125, 5.1171875]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 5.0, 8.0, 11.0, 14.0, 19.0, 40.0, 59.0, 92.0, 153.0, 243.0, 356.0, 511.0, 803.0, 1218.0, 1779.0, 2629.0, 3873.0, 5874.0, 8848.0, 13442.0, 20534.0, 32312.0, 52394.0, 88191.0, 149286.0, 203849.0, 175959.0, 110906.0, 64773.0, 39094.0, 24509.0, 15716.0, 10190.0, 6885.0, 4506.0, 3131.0, 2019.0, 1443.0, 1006.0, 646.0, 436.0, 282.0, 196.0, 110.0, 74.0, 59.0, 27.0, 17.0, 17.0, 8.0, 8.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.4228515625, -0.4086151123046875, -0.394378662109375, -0.3801422119140625, -0.36590576171875, -0.3516693115234375, -0.337432861328125, -0.3231964111328125, -0.3089599609375, -0.2947235107421875, -0.280487060546875, -0.2662506103515625, -0.25201416015625, -0.2377777099609375, -0.223541259765625, -0.2093048095703125, -0.195068359375, -0.1808319091796875, -0.166595458984375, -0.1523590087890625, -0.13812255859375, -0.1238861083984375, -0.109649658203125, -0.0954132080078125, -0.0811767578125, -0.0669403076171875, -0.052703857421875, -0.0384674072265625, -0.02423095703125, -0.0099945068359375, 0.004241943359375, 0.0184783935546875, 0.03271484375, 0.0469512939453125, 0.061187744140625, 0.0754241943359375, 0.08966064453125, 0.1038970947265625, 0.118133544921875, 0.1323699951171875, 0.1466064453125, 0.1608428955078125, 0.175079345703125, 0.1893157958984375, 0.20355224609375, 0.2177886962890625, 0.232025146484375, 0.2462615966796875, 0.260498046875, 0.2747344970703125, 0.288970947265625, 0.3032073974609375, 0.31744384765625, 0.3316802978515625, 0.345916748046875, 0.3601531982421875, 0.3743896484375, 0.3886260986328125, 0.402862548828125, 0.4170989990234375, 0.43133544921875, 0.4455718994140625, 0.459808349609375, 0.4740447998046875, 0.48828125]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 1.0, 4.0, 5.0, 5.0, 11.0, 5.0, 9.0, 6.0, 15.0, 17.0, 17.0, 16.0, 19.0, 28.0, 27.0, 24.0, 51.0, 31.0, 49.0, 29.0, 36.0, 49.0, 44.0, 1080.0, 47.0, 37.0, 31.0, 35.0, 30.0, 42.0, 35.0, 31.0, 27.0, 20.0, 25.0, 13.0, 16.0, 21.0, 8.0, 5.0, 9.0, 5.0, 4.0, 1.0, 3.0, 2.0, 0.0, 3.0, 0.0, 4.0], "bins": [-3.546875, -3.451019287109375, -3.35516357421875, -3.259307861328125, -3.1634521484375, -3.067596435546875, -2.97174072265625, -2.875885009765625, -2.780029296875, -2.684173583984375, -2.58831787109375, -2.492462158203125, -2.3966064453125, -2.300750732421875, -2.20489501953125, -2.109039306640625, -2.01318359375, -1.917327880859375, -1.82147216796875, -1.725616455078125, -1.6297607421875, -1.533905029296875, -1.43804931640625, -1.342193603515625, -1.246337890625, -1.150482177734375, -1.05462646484375, -0.958770751953125, -0.8629150390625, -0.767059326171875, -0.67120361328125, -0.575347900390625, -0.4794921875, -0.383636474609375, -0.28778076171875, -0.191925048828125, -0.0960693359375, -0.000213623046875, 0.09564208984375, 0.191497802734375, 0.287353515625, 0.383209228515625, 0.47906494140625, 0.574920654296875, 0.6707763671875, 0.766632080078125, 0.86248779296875, 0.958343505859375, 1.05419921875, 1.150054931640625, 1.24591064453125, 1.341766357421875, 1.4376220703125, 1.533477783203125, 1.62933349609375, 1.725189208984375, 1.821044921875, 1.916900634765625, 2.01275634765625, 2.108612060546875, 2.2044677734375, 2.300323486328125, 2.39617919921875, 2.492034912109375, 2.587890625]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 7.0, 11.0, 20.0, 20.0, 34.0, 56.0, 50.0, 102.0, 136.0, 231.0, 361.0, 517.0, 786.0, 1253.0, 1785.0, 2930.0, 4392.0, 7095.0, 10943.0, 18072.0, 29858.0, 50008.0, 86892.0, 143769.0, 1253806.0, 186731.0, 119517.0, 70720.0, 41291.0, 24427.0, 15126.0, 9309.0, 5879.0, 3817.0, 2508.0, 1609.0, 1023.0, 726.0, 453.0, 286.0, 193.0, 140.0, 91.0, 59.0, 29.0, 19.0, 15.0, 9.0, 11.0, 3.0, 6.0, 5.0, 3.0, 3.0], "bins": [-0.49755859375, -0.4832649230957031, -0.46897125244140625, -0.4546775817871094, -0.4403839111328125, -0.4260902404785156, -0.41179656982421875, -0.3975028991699219, -0.383209228515625, -0.3689155578613281, -0.35462188720703125, -0.3403282165527344, -0.3260345458984375, -0.3117408752441406, -0.29744720458984375, -0.2831535339355469, -0.26885986328125, -0.2545661926269531, -0.24027252197265625, -0.22597885131835938, -0.2116851806640625, -0.19739151000976562, -0.18309783935546875, -0.16880416870117188, -0.154510498046875, -0.14021682739257812, -0.12592315673828125, -0.11162948608398438, -0.0973358154296875, -0.08304214477539062, -0.06874847412109375, -0.054454803466796875, -0.0401611328125, -0.025867462158203125, -0.01157379150390625, 0.002719879150390625, 0.0170135498046875, 0.031307220458984375, 0.04560089111328125, 0.059894561767578125, 0.074188232421875, 0.08848190307617188, 0.10277557373046875, 0.11706924438476562, 0.1313629150390625, 0.14565658569335938, 0.15995025634765625, 0.17424392700195312, 0.18853759765625, 0.20283126831054688, 0.21712493896484375, 0.23141860961914062, 0.2457122802734375, 0.2600059509277344, 0.27429962158203125, 0.2885932922363281, 0.302886962890625, 0.3171806335449219, 0.33147430419921875, 0.3457679748535156, 0.3600616455078125, 0.3743553161621094, 0.38864898681640625, 0.4029426574707031, 0.417236328125]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 2.0, 4.0, 9.0, 6.0, 5.0, 9.0, 9.0, 16.0, 18.0, 15.0, 30.0, 19.0, 33.0, 37.0, 42.0, 37.0, 37.0, 42.0, 29.0, 51.0, 39.0, 46.0, 40.0, 47.0, 41.0, 41.0, 34.0, 32.0, 40.0, 24.0, 28.0, 20.0, 20.0, 21.0, 22.0, 17.0, 8.0, 10.0, 6.0, 9.0, 4.0, 0.0, 5.0, 4.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005669593811035156, -0.0005471333861351013, -0.000527307391166687, -0.0005074813961982727, -0.0004876554012298584, -0.0004678294062614441, -0.0004480034112930298, -0.0004281774163246155, -0.00040835142135620117, -0.00038852542638778687, -0.00036869943141937256, -0.00034887343645095825, -0.00032904744148254395, -0.00030922144651412964, -0.00028939545154571533, -0.000269569456577301, -0.0002497434616088867, -0.0002299174666404724, -0.0002100914716720581, -0.0001902654767036438, -0.0001704394817352295, -0.00015061348676681519, -0.00013078749179840088, -0.00011096149682998657, -9.113550186157227e-05, -7.130950689315796e-05, -5.148351192474365e-05, -3.1657516956329346e-05, -1.1831521987915039e-05, 7.994472980499268e-06, 2.7820467948913574e-05, 4.764646291732788e-05, 6.747245788574219e-05, 8.72984528541565e-05, 0.0001071244478225708, 0.0001269504427909851, 0.00014677643775939941, 0.00016660243272781372, 0.00018642842769622803, 0.00020625442266464233, 0.00022608041763305664, 0.00024590641260147095, 0.00026573240756988525, 0.00028555840253829956, 0.00030538439750671387, 0.0003252103924751282, 0.0003450363874435425, 0.0003648623824119568, 0.0003846883773803711, 0.0004045143723487854, 0.0004243403673171997, 0.000444166362285614, 0.0004639923572540283, 0.0004838183522224426, 0.0005036443471908569, 0.0005234703421592712, 0.0005432963371276855, 0.0005631223320960999, 0.0005829483270645142, 0.0006027743220329285, 0.0006226003170013428, 0.0006424263119697571, 0.0006622523069381714, 0.0006820783019065857, 0.000701904296875]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 3.0, 6.0, 11.0, 4.0, 10.0, 8.0, 14.0, 13.0, 25.0, 22.0, 32.0, 25.0, 45.0, 50.0, 71.0, 106.0, 177.0, 304.0, 592.0, 1498.0, 278841.0, 762770.0, 2092.0, 763.0, 362.0, 190.0, 117.0, 64.0, 66.0, 66.0, 42.0, 34.0, 25.0, 21.0, 14.0, 21.0, 13.0, 7.0, 4.0, 6.0, 4.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0], "bins": [-0.0149078369140625, -0.014483332633972168, -0.014058828353881836, -0.013634324073791504, -0.013209819793701172, -0.01278531551361084, -0.012360811233520508, -0.011936306953430176, -0.011511802673339844, -0.011087298393249512, -0.01066279411315918, -0.010238289833068848, -0.009813785552978516, -0.009389281272888184, -0.008964776992797852, -0.00854027271270752, -0.008115768432617188, -0.0076912641525268555, -0.0072667598724365234, -0.006842255592346191, -0.006417751312255859, -0.005993247032165527, -0.005568742752075195, -0.005144238471984863, -0.004719734191894531, -0.004295229911804199, -0.003870725631713867, -0.003446221351623535, -0.003021717071533203, -0.002597212791442871, -0.002172708511352539, -0.001748204231262207, -0.001323699951171875, -0.000899195671081543, -0.00047469139099121094, -5.0187110900878906e-05, 0.0003743171691894531, 0.0007988214492797852, 0.0012233257293701172, 0.0016478300094604492, 0.0020723342895507812, 0.0024968385696411133, 0.0029213428497314453, 0.0033458471298217773, 0.0037703514099121094, 0.004194855690002441, 0.0046193599700927734, 0.0050438642501831055, 0.0054683685302734375, 0.0058928728103637695, 0.0063173770904541016, 0.006741881370544434, 0.007166385650634766, 0.007590889930725098, 0.00801539421081543, 0.008439898490905762, 0.008864402770996094, 0.009288907051086426, 0.009713411331176758, 0.01013791561126709, 0.010562419891357422, 0.010986924171447754, 0.011411428451538086, 0.011835932731628418, 0.01226043701171875]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 27.0, 219.0, 473.0, 252.0, 39.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0030095879919826984, -0.0029419763013720512, -0.002874364610761404, -0.002806752920150757, -0.0027391412295401096, -0.002671529771760106, -0.002603918081149459, -0.0025363063905388117, -0.0024686946999281645, -0.0024010830093175173, -0.00233347131870687, -0.002265859628096223, -0.0021982481703162193, -0.002130636479705572, -0.002063024789094925, -0.0019954130984842777, -0.0019278014078736305, -0.0018601897172629833, -0.0017925780266523361, -0.0017249664524570107, -0.0016573547618463635, -0.0015897430712357163, -0.001522131497040391, -0.0014545198064297438, -0.0013869081158190966, -0.0013192964252084494, -0.0012516847345978022, -0.0011840731604024768, -0.0011164614697918296, -0.0010488497791811824, -0.000981238204985857, -0.0009136265143752098, -0.0008460148237645626, -0.0007784031331539154, -0.0007107915007509291, -0.0006431798683479428, -0.0005755681777372956, -0.0005079564871266484, -0.00044034485472366214, -0.0003727331932168454, -0.00030512153171002865, -0.0002375098702032119, -0.00016989820869639516, -0.00010228654718957841, -3.467488568276167e-05, 3.2936775824055076e-05, 0.00010054843733087182, 0.00016816009883768857, 0.0002357717603445053, 0.00030338342185132205, 0.0003709950833581388, 0.00043860674486495554, 0.0005062184063717723, 0.0005738300969824195, 0.0006414417293854058, 0.0007090533617883921, 0.0007766650523990393, 0.0008442767430096865, 0.0009118883754126728, 0.000979500007815659, 0.0010471116984263062, 0.0011147233890369534, 0.0011823349632322788, 0.001249946653842926, 0.0013175583444535732]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 4.0, 3.0, 4.0, 5.0, 6.0, 17.0, 7.0, 13.0, 14.0, 13.0, 28.0, 30.0, 16.0, 27.0, 37.0, 30.0, 31.0, 42.0, 40.0, 30.0, 31.0, 36.0, 40.0, 37.0, 43.0, 43.0, 34.0, 47.0, 35.0, 39.0, 24.0, 32.0, 27.0, 29.0, 16.0, 20.0, 11.0, 16.0, 9.0, 12.0, 8.0, 6.0, 5.0, 4.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00037866830825805664, -0.0003670603036880493, -0.000355452299118042, -0.00034384429454803467, -0.00033223628997802734, -0.00032062828540802, -0.0003090202808380127, -0.00029741227626800537, -0.00028580427169799805, -0.0002741962671279907, -0.0002625882625579834, -0.0002509802579879761, -0.00023937225341796875, -0.00022776424884796143, -0.0002161562442779541, -0.00020454823970794678, -0.00019294023513793945, -0.00018133223056793213, -0.0001697242259979248, -0.00015811622142791748, -0.00014650821685791016, -0.00013490021228790283, -0.0001232922077178955, -0.00011168420314788818, -0.00010007619857788086, -8.846819400787354e-05, -7.686018943786621e-05, -6.525218486785889e-05, -5.364418029785156e-05, -4.203617572784424e-05, -3.0428171157836914e-05, -1.882016658782959e-05, -7.212162017822266e-06, 4.395842552185059e-06, 1.6003847122192383e-05, 2.7611851692199707e-05, 3.921985626220703e-05, 5.0827860832214355e-05, 6.243586540222168e-05, 7.4043869972229e-05, 8.565187454223633e-05, 9.725987911224365e-05, 0.00010886788368225098, 0.0001204758882522583, 0.00013208389282226562, 0.00014369189739227295, 0.00015529990196228027, 0.0001669079065322876, 0.00017851591110229492, 0.00019012391567230225, 0.00020173192024230957, 0.0002133399248123169, 0.00022494792938232422, 0.00023655593395233154, 0.00024816393852233887, 0.0002597719430923462, 0.0002713799476623535, 0.00028298795223236084, 0.00029459595680236816, 0.0003062039613723755, 0.0003178119659423828, 0.00032941997051239014, 0.00034102797508239746, 0.0003526359796524048, 0.0003642439842224121]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 2.0, 3.0, 8.0, 7.0, 4.0, 10.0, 11.0, 12.0, 18.0, 24.0, 27.0, 31.0, 21.0, 24.0, 23.0, 35.0, 30.0, 45.0, 46.0, 41.0, 52.0, 39.0, 37.0, 52.0, 50.0, 37.0, 36.0, 36.0, 41.0, 29.0, 41.0, 15.0, 26.0, 20.0, 10.0, 15.0, 6.0, 6.0, 8.0, 8.0, 4.0, 8.0, 1.0, 4.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.98828125, -4.83038330078125, -4.6724853515625, -4.51458740234375, -4.356689453125, -4.19879150390625, -4.0408935546875, -3.88299560546875, -3.72509765625, -3.56719970703125, -3.4093017578125, -3.25140380859375, -3.093505859375, -2.93560791015625, -2.7777099609375, -2.61981201171875, -2.4619140625, -2.30401611328125, -2.1461181640625, -1.98822021484375, -1.830322265625, -1.67242431640625, -1.5145263671875, -1.35662841796875, -1.19873046875, -1.04083251953125, -0.8829345703125, -0.72503662109375, -0.567138671875, -0.40924072265625, -0.2513427734375, -0.09344482421875, 0.064453125, 0.22235107421875, 0.3802490234375, 0.53814697265625, 0.696044921875, 0.85394287109375, 1.0118408203125, 1.16973876953125, 1.32763671875, 1.48553466796875, 1.6434326171875, 1.80133056640625, 1.959228515625, 2.11712646484375, 2.2750244140625, 2.43292236328125, 2.5908203125, 2.74871826171875, 2.9066162109375, 3.06451416015625, 3.222412109375, 3.38031005859375, 3.5382080078125, 3.69610595703125, 3.85400390625, 4.01190185546875, 4.1697998046875, 4.32769775390625, 4.485595703125, 4.64349365234375, 4.8013916015625, 4.95928955078125, 5.1171875]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 5.0, 11.0, 17.0, 5.0, 19.0, 24.0, 36.0, 33.0, 62.0, 86.0, 121.0, 158.0, 242.0, 355.0, 552.0, 794.0, 1239.0, 1996.0, 3454.0, 5908.0, 10772.0, 19765.0, 36994.0, 71715.0, 155838.0, 307937.0, 223811.0, 98569.0, 48909.0, 26163.0, 13823.0, 7798.0, 4380.0, 2549.0, 1462.0, 942.0, 612.0, 427.0, 303.0, 180.0, 131.0, 98.0, 71.0, 42.0, 43.0, 30.0, 19.0, 21.0, 11.0, 9.0, 10.0, 1.0, 1.0, 3.0, 5.0, 1.0, 0.0, 2.0], "bins": [-2.853515625, -2.7635498046875, -2.673583984375, -2.5836181640625, -2.49365234375, -2.4036865234375, -2.313720703125, -2.2237548828125, -2.1337890625, -2.0438232421875, -1.953857421875, -1.8638916015625, -1.77392578125, -1.6839599609375, -1.593994140625, -1.5040283203125, -1.4140625, -1.3240966796875, -1.234130859375, -1.1441650390625, -1.05419921875, -0.9642333984375, -0.874267578125, -0.7843017578125, -0.6943359375, -0.6043701171875, -0.514404296875, -0.4244384765625, -0.33447265625, -0.2445068359375, -0.154541015625, -0.0645751953125, 0.025390625, 0.1153564453125, 0.205322265625, 0.2952880859375, 0.38525390625, 0.4752197265625, 0.565185546875, 0.6551513671875, 0.7451171875, 0.8350830078125, 0.925048828125, 1.0150146484375, 1.10498046875, 1.1949462890625, 1.284912109375, 1.3748779296875, 1.46484375, 1.5548095703125, 1.644775390625, 1.7347412109375, 1.82470703125, 1.9146728515625, 2.004638671875, 2.0946044921875, 2.1845703125, 2.2745361328125, 2.364501953125, 2.4544677734375, 2.54443359375, 2.6343994140625, 2.724365234375, 2.8143310546875, 2.904296875]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 5.0, 4.0, 4.0, 7.0, 10.0, 17.0, 21.0, 15.0, 21.0, 27.0, 28.0, 22.0, 30.0, 43.0, 37.0, 48.0, 49.0, 74.0, 159.0, 1669.0, 232.0, 90.0, 44.0, 54.0, 34.0, 46.0, 43.0, 31.0, 25.0, 28.0, 26.0, 13.0, 23.0, 18.0, 12.0, 10.0, 13.0, 7.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-21.234375, -20.63916015625, -20.0439453125, -19.44873046875, -18.853515625, -18.25830078125, -17.6630859375, -17.06787109375, -16.47265625, -15.87744140625, -15.2822265625, -14.68701171875, -14.091796875, -13.49658203125, -12.9013671875, -12.30615234375, -11.7109375, -11.11572265625, -10.5205078125, -9.92529296875, -9.330078125, -8.73486328125, -8.1396484375, -7.54443359375, -6.94921875, -6.35400390625, -5.7587890625, -5.16357421875, -4.568359375, -3.97314453125, -3.3779296875, -2.78271484375, -2.1875, -1.59228515625, -0.9970703125, -0.40185546875, 0.193359375, 0.78857421875, 1.3837890625, 1.97900390625, 2.57421875, 3.16943359375, 3.7646484375, 4.35986328125, 4.955078125, 5.55029296875, 6.1455078125, 6.74072265625, 7.3359375, 7.93115234375, 8.5263671875, 9.12158203125, 9.716796875, 10.31201171875, 10.9072265625, 11.50244140625, 12.09765625, 12.69287109375, 13.2880859375, 13.88330078125, 14.478515625, 15.07373046875, 15.6689453125, 16.26416015625, 16.859375]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 9.0, 10.0, 21.0, 27.0, 44.0, 38.0, 55.0, 106.0, 154.0, 234.0, 345.0, 1096.0, 17095.0, 3118100.0, 6680.0, 723.0, 331.0, 207.0, 147.0, 76.0, 62.0, 51.0, 36.0, 15.0, 11.0, 7.0, 4.0, 4.0, 3.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-53.4375, -51.4130859375, -49.388671875, -47.3642578125, -45.33984375, -43.3154296875, -41.291015625, -39.2666015625, -37.2421875, -35.2177734375, -33.193359375, -31.1689453125, -29.14453125, -27.1201171875, -25.095703125, -23.0712890625, -21.046875, -19.0224609375, -16.998046875, -14.9736328125, -12.94921875, -10.9248046875, -8.900390625, -6.8759765625, -4.8515625, -2.8271484375, -0.802734375, 1.2216796875, 3.24609375, 5.2705078125, 7.294921875, 9.3193359375, 11.34375, 13.3681640625, 15.392578125, 17.4169921875, 19.44140625, 21.4658203125, 23.490234375, 25.5146484375, 27.5390625, 29.5634765625, 31.587890625, 33.6123046875, 35.63671875, 37.6611328125, 39.685546875, 41.7099609375, 43.734375, 45.7587890625, 47.783203125, 49.8076171875, 51.83203125, 53.8564453125, 55.880859375, 57.9052734375, 59.9296875, 61.9541015625, 63.978515625, 66.0029296875, 68.02734375, 70.0517578125, 72.076171875, 74.1005859375, 76.125]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 20.0, 128.0, 345.0, 376.0, 120.0, 22.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.070805549621582, -10.061518669128418, -8.052231788635254, -6.04294490814209, -4.033658027648926, -2.0243711471557617, -0.015084266662597656, 1.9942026138305664, 4.0034894943237305, 6.0127763748168945, 8.022063255310059, 10.031350135803223, 12.040637016296387, 14.04992389678955, 16.05921173095703, 18.068496704101562, 20.07778549194336, 22.087072372436523, 24.096359252929688, 26.10564613342285, 28.114933013916016, 30.12421989440918, 32.133506774902344, 34.142791748046875, 36.15208053588867, 38.16136932373047, 40.170654296875, 42.17993927001953, 44.18922805786133, 46.198516845703125, 48.207801818847656, 50.21708679199219, 52.22637176513672, 54.23565673828125, 56.24494552612305, 58.254234313964844, 60.263519287109375, 62.272804260253906, 64.28208923339844, 66.2913818359375, 68.30066680908203, 70.30995178222656, 72.31924438476562, 74.32852935791016, 76.33781433105469, 78.34709930419922, 80.35638427734375, 82.36567687988281, 84.37496185302734, 86.38424682617188, 88.39353942871094, 90.40282440185547, 92.412109375, 94.42139434814453, 96.43067932128906, 98.43997192382812, 100.44925689697266, 102.45854187011719, 104.46783447265625, 106.47711944580078, 108.48640441894531, 110.49568939208984, 112.50497436523438, 114.51426696777344, 116.52355194091797]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 4.0, 5.0, 5.0, 6.0, 8.0, 5.0, 13.0, 7.0, 11.0, 18.0, 10.0, 20.0, 24.0, 26.0, 20.0, 23.0, 25.0, 29.0, 40.0, 44.0, 30.0, 35.0, 48.0, 35.0, 36.0, 35.0, 42.0, 43.0, 30.0, 23.0, 43.0, 34.0, 21.0, 30.0, 29.0, 18.0, 19.0, 20.0, 12.0, 14.0, 14.0, 8.0, 11.0, 5.0, 7.0, 6.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.655174255371094, -36.42484664916992, -35.19451904296875, -33.964195251464844, -32.73386764526367, -31.5035400390625, -30.273212432861328, -29.042884826660156, -27.812559127807617, -26.582231521606445, -25.351905822753906, -24.121578216552734, -22.891250610351562, -21.660924911499023, -20.43059730529785, -19.200271606445312, -17.96994400024414, -16.73961639404297, -15.50929069519043, -14.278963088989258, -13.048636436462402, -11.818309783935547, -10.587982177734375, -9.35765552520752, -8.127328872680664, -6.897002220153809, -5.666675090789795, -4.436347961425781, -3.206021308898926, -1.9756946563720703, -0.7453675270080566, 0.48495960235595703, 1.7152862548828125, 2.945613145828247, 4.175940036773682, 5.406267166137695, 6.636593818664551, 7.866920471191406, 9.097248077392578, 10.327574729919434, 11.557901382446289, 12.788228034973145, 14.0185546875, 15.248882293701172, 16.479209899902344, 17.709535598754883, 18.939863204956055, 20.170188903808594, 21.400516510009766, 22.630844116210938, 23.861169815063477, 25.09149742126465, 26.321823120117188, 27.55215072631836, 28.78247833251953, 30.012805938720703, 31.243131637573242, 32.47345733642578, 33.70378494262695, 34.934112548828125, 36.1644401550293, 37.39476776123047, 38.625091552734375, 39.85541915893555, 41.08574676513672]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 7.0, 5.0, 5.0, 5.0, 7.0, 9.0, 8.0, 14.0, 17.0, 12.0, 22.0, 22.0, 26.0, 25.0, 28.0, 29.0, 36.0, 38.0, 31.0, 47.0, 46.0, 46.0, 41.0, 52.0, 47.0, 38.0, 44.0, 39.0, 41.0, 33.0, 35.0, 24.0, 29.0, 20.0, 18.0, 9.0, 7.0, 9.0, 7.0, 8.0, 8.0, 5.0, 6.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-5.4609375, -5.297119140625, -5.13330078125, -4.969482421875, -4.8056640625, -4.641845703125, -4.47802734375, -4.314208984375, -4.150390625, -3.986572265625, -3.82275390625, -3.658935546875, -3.4951171875, -3.331298828125, -3.16748046875, -3.003662109375, -2.83984375, -2.676025390625, -2.51220703125, -2.348388671875, -2.1845703125, -2.020751953125, -1.85693359375, -1.693115234375, -1.529296875, -1.365478515625, -1.20166015625, -1.037841796875, -0.8740234375, -0.710205078125, -0.54638671875, -0.382568359375, -0.21875, -0.054931640625, 0.10888671875, 0.272705078125, 0.4365234375, 0.600341796875, 0.76416015625, 0.927978515625, 1.091796875, 1.255615234375, 1.41943359375, 1.583251953125, 1.7470703125, 1.910888671875, 2.07470703125, 2.238525390625, 2.40234375, 2.566162109375, 2.72998046875, 2.893798828125, 3.0576171875, 3.221435546875, 3.38525390625, 3.549072265625, 3.712890625, 3.876708984375, 4.04052734375, 4.204345703125, 4.3681640625, 4.531982421875, 4.69580078125, 4.859619140625, 5.0234375]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 8.0, 5.0, 4.0, 14.0, 5.0, 9.0, 11.0, 19.0, 18.0, 17.0, 25.0, 24.0, 26.0, 28.0, 35.0, 54.0, 83.0, 248.0, 1667.0, 22756.0, 1821488.0, 2314023.0, 30919.0, 2036.0, 352.0, 109.0, 56.0, 33.0, 33.0, 33.0, 31.0, 20.0, 20.0, 11.0, 11.0, 10.0, 15.0, 6.0, 6.0, 5.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-22.78125, -22.091796875, -21.40234375, -20.712890625, -20.0234375, -19.333984375, -18.64453125, -17.955078125, -17.265625, -16.576171875, -15.88671875, -15.197265625, -14.5078125, -13.818359375, -13.12890625, -12.439453125, -11.75, -11.060546875, -10.37109375, -9.681640625, -8.9921875, -8.302734375, -7.61328125, -6.923828125, -6.234375, -5.544921875, -4.85546875, -4.166015625, -3.4765625, -2.787109375, -2.09765625, -1.408203125, -0.71875, -0.029296875, 0.66015625, 1.349609375, 2.0390625, 2.728515625, 3.41796875, 4.107421875, 4.796875, 5.486328125, 6.17578125, 6.865234375, 7.5546875, 8.244140625, 8.93359375, 9.623046875, 10.3125, 11.001953125, 11.69140625, 12.380859375, 13.0703125, 13.759765625, 14.44921875, 15.138671875, 15.828125, 16.517578125, 17.20703125, 17.896484375, 18.5859375, 19.275390625, 19.96484375, 20.654296875, 21.34375]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 7.0, 5.0, 8.0, 16.0, 13.0, 13.0, 16.0, 21.0, 38.0, 30.0, 58.0, 87.0, 107.0, 100.0, 144.0, 192.0, 221.0, 322.0, 376.0, 381.0, 387.0, 286.0, 261.0, 243.0, 149.0, 145.0, 115.0, 86.0, 68.0, 43.0, 34.0, 25.0, 22.0, 12.0, 15.0, 7.0, 6.0, 8.0, 4.0, 6.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.8125, -8.5262451171875, -8.239990234375, -7.9537353515625, -7.66748046875, -7.3812255859375, -7.094970703125, -6.8087158203125, -6.5224609375, -6.2362060546875, -5.949951171875, -5.6636962890625, -5.37744140625, -5.0911865234375, -4.804931640625, -4.5186767578125, -4.232421875, -3.9461669921875, -3.659912109375, -3.3736572265625, -3.08740234375, -2.8011474609375, -2.514892578125, -2.2286376953125, -1.9423828125, -1.6561279296875, -1.369873046875, -1.0836181640625, -0.79736328125, -0.5111083984375, -0.224853515625, 0.0614013671875, 0.34765625, 0.6339111328125, 0.920166015625, 1.2064208984375, 1.49267578125, 1.7789306640625, 2.065185546875, 2.3514404296875, 2.6376953125, 2.9239501953125, 3.210205078125, 3.4964599609375, 3.78271484375, 4.0689697265625, 4.355224609375, 4.6414794921875, 4.927734375, 5.2139892578125, 5.500244140625, 5.7864990234375, 6.07275390625, 6.3590087890625, 6.645263671875, 6.9315185546875, 7.2177734375, 7.5040283203125, 7.790283203125, 8.0765380859375, 8.36279296875, 8.6490478515625, 8.935302734375, 9.2215576171875, 9.5078125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 6.0, 8.0, 14.0, 15.0, 17.0, 21.0, 34.0, 34.0, 53.0, 92.0, 117.0, 168.0, 293.0, 554.0, 1752.0, 77603.0, 4053120.0, 57467.0, 1553.0, 531.0, 260.0, 164.0, 116.0, 74.0, 62.0, 46.0, 36.0, 16.0, 11.0, 13.0, 7.0, 10.0, 7.0, 1.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.8125, -44.35693359375, -42.9013671875, -41.44580078125, -39.990234375, -38.53466796875, -37.0791015625, -35.62353515625, -34.16796875, -32.71240234375, -31.2568359375, -29.80126953125, -28.345703125, -26.89013671875, -25.4345703125, -23.97900390625, -22.5234375, -21.06787109375, -19.6123046875, -18.15673828125, -16.701171875, -15.24560546875, -13.7900390625, -12.33447265625, -10.87890625, -9.42333984375, -7.9677734375, -6.51220703125, -5.056640625, -3.60107421875, -2.1455078125, -0.68994140625, 0.765625, 2.22119140625, 3.6767578125, 5.13232421875, 6.587890625, 8.04345703125, 9.4990234375, 10.95458984375, 12.41015625, 13.86572265625, 15.3212890625, 16.77685546875, 18.232421875, 19.68798828125, 21.1435546875, 22.59912109375, 24.0546875, 25.51025390625, 26.9658203125, 28.42138671875, 29.876953125, 31.33251953125, 32.7880859375, 34.24365234375, 35.69921875, 37.15478515625, 38.6103515625, 40.06591796875, 41.521484375, 42.97705078125, 44.4326171875, 45.88818359375, 47.34375]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 8.0, 14.0, 17.0, 24.0, 45.0, 32.0, 39.0, 47.0, 51.0, 61.0, 78.0, 75.0, 77.0, 82.0, 72.0, 52.0, 58.0, 43.0, 41.0, 18.0, 14.0, 14.0, 10.0, 9.0, 2.0, 7.0, 8.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-36.07414627075195, -35.18165969848633, -34.2891731262207, -33.39668655395508, -32.50419998168945, -31.61171531677246, -30.719228744506836, -29.82674217224121, -28.934255599975586, -28.04176902770996, -27.149282455444336, -26.256797790527344, -25.36431121826172, -24.471824645996094, -23.57933807373047, -22.686851501464844, -21.79436492919922, -20.901878356933594, -20.00939178466797, -19.116905212402344, -18.22442054748535, -17.331933975219727, -16.4394474029541, -15.546960830688477, -14.654476165771484, -13.76198959350586, -12.86950397491455, -11.977017402648926, -11.0845308303833, -10.192045211791992, -9.299558639526367, -8.407072067260742, -7.514585494995117, -6.62209939956665, -5.729612827301025, -4.837126731872559, -3.9446403980255127, -3.052154064178467, -2.15966796875, -1.267181396484375, -0.3746953010559082, 0.5177909731864929, 1.410277247428894, 2.3027634620666504, 3.1952497959136963, 4.087736129760742, 4.980222225189209, 5.872708797454834, 6.765194892883301, 7.657680988311768, 8.550167083740234, 9.44265365600586, 10.335140228271484, 11.22762680053711, 12.120112419128418, 13.012598991394043, 13.905084609985352, 14.797571182250977, 15.690056800842285, 16.582542419433594, 17.47502899169922, 18.367515563964844, 19.26000213623047, 20.152488708496094, 21.04497528076172]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 3.0, 2.0, 3.0, 4.0, 3.0, 8.0, 12.0, 15.0, 7.0, 15.0, 14.0, 14.0, 28.0, 25.0, 20.0, 35.0, 31.0, 43.0, 39.0, 42.0, 45.0, 43.0, 45.0, 56.0, 52.0, 55.0, 45.0, 37.0, 30.0, 31.0, 31.0, 21.0, 25.0, 35.0, 21.0, 21.0, 13.0, 10.0, 10.0, 10.0, 5.0, 3.0, 2.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-38.3475341796875, -37.14813232421875, -35.94873046875, -34.74932861328125, -33.5499267578125, -32.35052490234375, -31.151124954223633, -29.951723098754883, -28.752321243286133, -27.552919387817383, -26.353517532348633, -25.154115676879883, -23.954715728759766, -22.755313873291016, -21.555912017822266, -20.356510162353516, -19.157108306884766, -17.957706451416016, -16.758304595947266, -15.558903694152832, -14.359501838684082, -13.160099983215332, -11.960699081420898, -10.761297225952148, -9.561895370483398, -8.362493515014648, -7.163092136383057, -5.963690757751465, -4.764288902282715, -3.564887046813965, -2.365485668182373, -1.1660842895507812, 0.033321380615234375, 1.2327229976654053, 2.432124614715576, 3.631526231765747, 4.830927848815918, 6.030329704284668, 7.22973108291626, 8.429132461547852, 9.628534317016602, 10.827936172485352, 12.027338027954102, 13.226738929748535, 14.426140785217285, 15.625542640686035, 16.82494354248047, 18.02434539794922, 19.22374725341797, 20.42314910888672, 21.62255096435547, 22.82195281982422, 24.02135467529297, 25.22075653076172, 26.420156478881836, 27.619558334350586, 28.818960189819336, 30.018362045288086, 31.217763900756836, 32.41716384887695, 33.6165657043457, 34.81596755981445, 36.0153694152832, 37.21477127075195, 38.4141731262207]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 0.0, 1.0, 2.0, 3.0, 1.0, 9.0, 9.0, 6.0, 7.0, 12.0, 6.0, 12.0, 14.0, 17.0, 20.0, 19.0, 27.0, 21.0, 41.0, 19.0, 38.0, 35.0, 48.0, 42.0, 32.0, 28.0, 33.0, 40.0, 40.0, 32.0, 41.0, 42.0, 35.0, 38.0, 31.0, 35.0, 23.0, 30.0, 28.0, 18.0, 11.0, 5.0, 14.0, 7.0, 3.0, 5.0, 5.0, 5.0, 7.0, 2.0, 3.0, 2.0, 1.0, 5.0, 1.0, 1.0, 1.0, 3.0], "bins": [-4.69140625, -4.5482177734375, -4.405029296875, -4.2618408203125, -4.11865234375, -3.9754638671875, -3.832275390625, -3.6890869140625, -3.5458984375, -3.4027099609375, -3.259521484375, -3.1163330078125, -2.97314453125, -2.8299560546875, -2.686767578125, -2.5435791015625, -2.400390625, -2.2572021484375, -2.114013671875, -1.9708251953125, -1.82763671875, -1.6844482421875, -1.541259765625, -1.3980712890625, -1.2548828125, -1.1116943359375, -0.968505859375, -0.8253173828125, -0.68212890625, -0.5389404296875, -0.395751953125, -0.2525634765625, -0.109375, 0.0338134765625, 0.177001953125, 0.3201904296875, 0.46337890625, 0.6065673828125, 0.749755859375, 0.8929443359375, 1.0361328125, 1.1793212890625, 1.322509765625, 1.4656982421875, 1.60888671875, 1.7520751953125, 1.895263671875, 2.0384521484375, 2.181640625, 2.3248291015625, 2.468017578125, 2.6112060546875, 2.75439453125, 2.8975830078125, 3.040771484375, 3.1839599609375, 3.3271484375, 3.4703369140625, 3.613525390625, 3.7567138671875, 3.89990234375, 4.0430908203125, 4.186279296875, 4.3294677734375, 4.47265625]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 6.0, 10.0, 17.0, 13.0, 27.0, 36.0, 58.0, 88.0, 139.0, 183.0, 259.0, 384.0, 557.0, 757.0, 1104.0, 1620.0, 2383.0, 3361.0, 4827.0, 6816.0, 10252.0, 14389.0, 21508.0, 31966.0, 48919.0, 76643.0, 120037.0, 167883.0, 171818.0, 125690.0, 80786.0, 51037.0, 33137.0, 22250.0, 15217.0, 10407.0, 7355.0, 5026.0, 3560.0, 2479.0, 1766.0, 1203.0, 804.0, 535.0, 402.0, 278.0, 183.0, 118.0, 94.0, 57.0, 40.0, 31.0, 20.0, 10.0, 10.0, 5.0, 2.0, 2.0, 3.0, 0.0, 1.0], "bins": [-0.413330078125, -0.4000205993652344, -0.38671112060546875, -0.3734016418457031, -0.3600921630859375, -0.3467826843261719, -0.33347320556640625, -0.3201637268066406, -0.306854248046875, -0.2935447692871094, -0.28023529052734375, -0.2669258117675781, -0.2536163330078125, -0.24030685424804688, -0.22699737548828125, -0.21368789672851562, -0.20037841796875, -0.18706893920898438, -0.17375946044921875, -0.16044998168945312, -0.1471405029296875, -0.13383102416992188, -0.12052154541015625, -0.10721206665039062, -0.093902587890625, -0.08059310913085938, -0.06728363037109375, -0.053974151611328125, -0.0406646728515625, -0.027355194091796875, -0.01404571533203125, -0.000736236572265625, 0.0125732421875, 0.025882720947265625, 0.03919219970703125, 0.052501678466796875, 0.0658111572265625, 0.07912063598632812, 0.09243011474609375, 0.10573959350585938, 0.119049072265625, 0.13235855102539062, 0.14566802978515625, 0.15897750854492188, 0.1722869873046875, 0.18559646606445312, 0.19890594482421875, 0.21221542358398438, 0.22552490234375, 0.23883438110351562, 0.25214385986328125, 0.2654533386230469, 0.2787628173828125, 0.2920722961425781, 0.30538177490234375, 0.3186912536621094, 0.332000732421875, 0.3453102111816406, 0.35861968994140625, 0.3719291687011719, 0.3852386474609375, 0.3985481262207031, 0.41185760498046875, 0.4251670837402344, 0.4384765625]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 6.0, 1.0, 5.0, 8.0, 11.0, 9.0, 10.0, 13.0, 9.0, 17.0, 15.0, 28.0, 25.0, 24.0, 34.0, 19.0, 30.0, 36.0, 39.0, 38.0, 34.0, 42.0, 31.0, 42.0, 1055.0, 30.0, 39.0, 37.0, 31.0, 37.0, 33.0, 30.0, 22.0, 22.0, 30.0, 21.0, 22.0, 12.0, 17.0, 7.0, 8.0, 8.0, 10.0, 9.0, 8.0, 4.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-2.96875, -2.87957763671875, -2.7904052734375, -2.70123291015625, -2.612060546875, -2.52288818359375, -2.4337158203125, -2.34454345703125, -2.25537109375, -2.16619873046875, -2.0770263671875, -1.98785400390625, -1.898681640625, -1.80950927734375, -1.7203369140625, -1.63116455078125, -1.5419921875, -1.45281982421875, -1.3636474609375, -1.27447509765625, -1.185302734375, -1.09613037109375, -1.0069580078125, -0.91778564453125, -0.82861328125, -0.73944091796875, -0.6502685546875, -0.56109619140625, -0.471923828125, -0.38275146484375, -0.2935791015625, -0.20440673828125, -0.115234375, -0.02606201171875, 0.0631103515625, 0.15228271484375, 0.241455078125, 0.33062744140625, 0.4197998046875, 0.50897216796875, 0.59814453125, 0.68731689453125, 0.7764892578125, 0.86566162109375, 0.954833984375, 1.04400634765625, 1.1331787109375, 1.22235107421875, 1.3115234375, 1.40069580078125, 1.4898681640625, 1.57904052734375, 1.668212890625, 1.75738525390625, 1.8465576171875, 1.93572998046875, 2.02490234375, 2.11407470703125, 2.2032470703125, 2.29241943359375, 2.381591796875, 2.47076416015625, 2.5599365234375, 2.64910888671875, 2.73828125]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 7.0, 12.0, 15.0, 26.0, 31.0, 45.0, 59.0, 106.0, 159.0, 217.0, 346.0, 529.0, 801.0, 1184.0, 1880.0, 2965.0, 4607.0, 7077.0, 11188.0, 18055.0, 30106.0, 49439.0, 81782.0, 129334.0, 879731.0, 536587.0, 129731.0, 81288.0, 49613.0, 30153.0, 18331.0, 11498.0, 7180.0, 4452.0, 3001.0, 1949.0, 1175.0, 787.0, 547.0, 373.0, 233.0, 203.0, 116.0, 70.0, 45.0, 34.0, 21.0, 18.0, 11.0, 8.0, 1.0, 2.0, 3.0, 4.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.43701171875, -0.42291259765625, -0.4088134765625, -0.39471435546875, -0.380615234375, -0.36651611328125, -0.3524169921875, -0.33831787109375, -0.32421875, -0.31011962890625, -0.2960205078125, -0.28192138671875, -0.267822265625, -0.25372314453125, -0.2396240234375, -0.22552490234375, -0.21142578125, -0.19732666015625, -0.1832275390625, -0.16912841796875, -0.155029296875, -0.14093017578125, -0.1268310546875, -0.11273193359375, -0.0986328125, -0.08453369140625, -0.0704345703125, -0.05633544921875, -0.042236328125, -0.02813720703125, -0.0140380859375, 6.103515625e-05, 0.01416015625, 0.02825927734375, 0.0423583984375, 0.05645751953125, 0.070556640625, 0.08465576171875, 0.0987548828125, 0.11285400390625, 0.126953125, 0.14105224609375, 0.1551513671875, 0.16925048828125, 0.183349609375, 0.19744873046875, 0.2115478515625, 0.22564697265625, 0.23974609375, 0.25384521484375, 0.2679443359375, 0.28204345703125, 0.296142578125, 0.31024169921875, 0.3243408203125, 0.33843994140625, 0.3525390625, 0.36663818359375, 0.3807373046875, 0.39483642578125, 0.408935546875, 0.42303466796875, 0.4371337890625, 0.45123291015625, 0.46533203125]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 4.0, 4.0, 7.0, 10.0, 11.0, 12.0, 7.0, 12.0, 26.0, 13.0, 21.0, 35.0, 29.0, 53.0, 44.0, 49.0, 47.0, 49.0, 52.0, 45.0, 42.0, 45.0, 36.0, 46.0, 43.0, 42.0, 31.0, 21.0, 20.0, 24.0, 35.0, 16.0, 14.0, 15.0, 7.0, 9.0, 9.0, 5.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.0008029937744140625, -0.0007797330617904663, -0.0007564723491668701, -0.0007332116365432739, -0.0007099509239196777, -0.0006866902112960815, -0.0006634294986724854, -0.0006401687860488892, -0.000616908073425293, -0.0005936473608016968, -0.0005703866481781006, -0.0005471259355545044, -0.0005238652229309082, -0.000500604510307312, -0.0004773437976837158, -0.00045408308506011963, -0.00043082237243652344, -0.00040756165981292725, -0.00038430094718933105, -0.00036104023456573486, -0.00033777952194213867, -0.0003145188093185425, -0.0002912580966949463, -0.0002679973840713501, -0.0002447366714477539, -0.00022147595882415771, -0.00019821524620056152, -0.00017495453357696533, -0.00015169382095336914, -0.00012843310832977295, -0.00010517239570617676, -8.191168308258057e-05, -5.8650970458984375e-05, -3.5390257835388184e-05, -1.2129545211791992e-05, 1.11311674118042e-05, 3.439188003540039e-05, 5.765259265899658e-05, 8.091330528259277e-05, 0.00010417401790618896, 0.00012743473052978516, 0.00015069544315338135, 0.00017395615577697754, 0.00019721686840057373, 0.00022047758102416992, 0.0002437382936477661, 0.0002669990062713623, 0.0002902597188949585, 0.0003135204315185547, 0.0003367811441421509, 0.00036004185676574707, 0.00038330256938934326, 0.00040656328201293945, 0.00042982399463653564, 0.00045308470726013184, 0.00047634541988372803, 0.0004996061325073242, 0.0005228668451309204, 0.0005461275577545166, 0.0005693882703781128, 0.000592648983001709, 0.0006159096956253052, 0.0006391704082489014, 0.0006624311208724976, 0.0006856918334960938]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 8.0, 5.0, 6.0, 10.0, 9.0, 7.0, 11.0, 21.0, 25.0, 24.0, 26.0, 30.0, 43.0, 67.0, 66.0, 140.0, 235.0, 463.0, 1289.0, 236119.0, 806749.0, 1785.0, 631.0, 268.0, 121.0, 88.0, 60.0, 57.0, 40.0, 30.0, 28.0, 19.0, 15.0, 14.0, 9.0, 5.0, 6.0, 3.0, 6.0, 8.0, 2.0, 2.0, 3.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01505279541015625, -0.014517426490783691, -0.013982057571411133, -0.013446688652038574, -0.012911319732666016, -0.012375950813293457, -0.011840581893920898, -0.01130521297454834, -0.010769844055175781, -0.010234475135803223, -0.009699106216430664, -0.009163737297058105, -0.008628368377685547, -0.008092999458312988, -0.00755763053894043, -0.007022261619567871, -0.0064868927001953125, -0.005951523780822754, -0.005416154861450195, -0.004880785942077637, -0.004345417022705078, -0.0038100481033325195, -0.003274679183959961, -0.0027393102645874023, -0.0022039413452148438, -0.0016685724258422852, -0.0011332035064697266, -0.000597834587097168, -6.246566772460938e-05, 0.0004729032516479492, 0.0010082721710205078, 0.0015436410903930664, 0.002079010009765625, 0.0026143789291381836, 0.003149747848510742, 0.0036851167678833008, 0.004220485687255859, 0.004755854606628418, 0.0052912235260009766, 0.005826592445373535, 0.006361961364746094, 0.006897330284118652, 0.007432699203491211, 0.00796806812286377, 0.008503437042236328, 0.009038805961608887, 0.009574174880981445, 0.010109543800354004, 0.010644912719726562, 0.011180281639099121, 0.01171565055847168, 0.012251019477844238, 0.012786388397216797, 0.013321757316589355, 0.013857126235961914, 0.014392495155334473, 0.014927864074707031, 0.01546323299407959, 0.01599860191345215, 0.016533970832824707, 0.017069339752197266, 0.017604708671569824, 0.018140077590942383, 0.01867544651031494, 0.0192108154296875]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 31.0, 538.0, 435.0, 12.0, 2.0, 0.0, 2.0], "bins": [-0.007607099134474993, -0.007478008978068829, -0.007348918356001377, -0.007219828199595213, -0.007090738043189049, -0.006961647421121597, -0.006832557264715433, -0.006703467108309269, -0.0065743764862418175, -0.006445286329835653, -0.006316195707768202, -0.006187105551362038, -0.0060580153949558735, -0.005928924772888422, -0.005799834616482258, -0.005670744460076094, -0.0055416543036699295, -0.005412564147263765, -0.005283473525196314, -0.00515438336879015, -0.0050252932123839855, -0.004896202590316534, -0.00476711243391037, -0.004638022277504206, -0.004508931655436754, -0.00437984149903059, -0.004250750876963139, -0.004121660720556974, -0.00399257056415081, -0.0038634799420833588, -0.0037343897856771946, -0.0036052993964403868, -0.0034762087743729353, -0.0033471183851361275, -0.0032180282287299633, -0.0030889378394931555, -0.0029598474502563477, -0.0028307572938501835, -0.0027016669046133757, -0.002572576515376568, -0.0024434863589704037, -0.002314395969733596, -0.0021853058133274317, -0.002056215424090624, -0.001927125034853816, -0.00179803476203233, -0.001668944489210844, -0.0015398540999740362, -0.0014107637107372284, -0.0012816734379157424, -0.0011525830486789346, -0.0010234927758574486, -0.0008944024448283017, -0.0007653121137991548, -0.0006362218409776688, -0.0005071315099485219, -0.00037804123712703586, -0.00024895090609788895, -0.0001198606041725725, 9.22969775274396e-06, 0.00013832002878189087, 0.0002674103598110378, 0.0003965006326325238, 0.0005255909636616707, 0.0006546812946908176]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 11.0, 2.0, 10.0, 12.0, 7.0, 15.0, 13.0, 19.0, 14.0, 12.0, 29.0, 27.0, 22.0, 25.0, 42.0, 37.0, 41.0, 40.0, 36.0, 41.0, 36.0, 40.0, 36.0, 49.0, 34.0, 48.0, 27.0, 34.0, 31.0, 39.0, 29.0, 24.0, 16.0, 20.0, 14.0, 10.0, 15.0, 7.0, 13.0, 9.0, 4.0, 2.0, 7.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0004176497459411621, -0.0004044706001877785, -0.00039129145443439484, -0.0003781123086810112, -0.00036493316292762756, -0.0003517540171742439, -0.0003385748714208603, -0.00032539572566747665, -0.000312216579914093, -0.0002990374341607094, -0.00028585828840732574, -0.0002726791426539421, -0.00025949999690055847, -0.00024632085114717484, -0.0002331417053937912, -0.00021996255964040756, -0.00020678341388702393, -0.0001936042681336403, -0.00018042512238025665, -0.00016724597662687302, -0.00015406683087348938, -0.00014088768512010574, -0.0001277085393667221, -0.00011452939361333847, -0.00010135024785995483, -8.81711021065712e-05, -7.499195635318756e-05, -6.181281059980392e-05, -4.863366484642029e-05, -3.545451909303665e-05, -2.2275373339653015e-05, -9.096227586269379e-06, 4.082918167114258e-06, 1.7262063920497894e-05, 3.044120967388153e-05, 4.362035542726517e-05, 5.6799501180648804e-05, 6.997864693403244e-05, 8.315779268741608e-05, 9.633693844079971e-05, 0.00010951608419418335, 0.00012269522994756699, 0.00013587437570095062, 0.00014905352145433426, 0.0001622326672077179, 0.00017541181296110153, 0.00018859095871448517, 0.0002017701044678688, 0.00021494925022125244, 0.00022812839597463608, 0.00024130754172801971, 0.00025448668748140335, 0.000267665833234787, 0.0002808449789881706, 0.00029402412474155426, 0.0003072032704949379, 0.00032038241624832153, 0.00033356156200170517, 0.0003467407077550888, 0.00035991985350847244, 0.0003730989992618561, 0.0003862781450152397, 0.00039945729076862335, 0.000412636436522007, 0.0004258155822753906]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 0.0, 1.0, 2.0, 3.0, 1.0, 9.0, 9.0, 6.0, 7.0, 12.0, 6.0, 12.0, 14.0, 17.0, 20.0, 19.0, 27.0, 21.0, 40.0, 20.0, 38.0, 35.0, 48.0, 42.0, 32.0, 28.0, 33.0, 40.0, 40.0, 32.0, 42.0, 41.0, 35.0, 38.0, 31.0, 35.0, 23.0, 30.0, 28.0, 18.0, 11.0, 5.0, 14.0, 7.0, 3.0, 5.0, 5.0, 5.0, 7.0, 2.0, 3.0, 2.0, 1.0, 5.0, 1.0, 1.0, 1.0, 3.0], "bins": [-4.69140625, -4.5482177734375, -4.405029296875, -4.2618408203125, -4.11865234375, -3.9754638671875, -3.832275390625, -3.6890869140625, -3.5458984375, -3.4027099609375, -3.259521484375, -3.1163330078125, -2.97314453125, -2.8299560546875, -2.686767578125, -2.5435791015625, -2.400390625, -2.2572021484375, -2.114013671875, -1.9708251953125, -1.82763671875, -1.6844482421875, -1.541259765625, -1.3980712890625, -1.2548828125, -1.1116943359375, -0.968505859375, -0.8253173828125, -0.68212890625, -0.5389404296875, -0.395751953125, -0.2525634765625, -0.109375, 0.0338134765625, 0.177001953125, 0.3201904296875, 0.46337890625, 0.6065673828125, 0.749755859375, 0.8929443359375, 1.0361328125, 1.1793212890625, 1.322509765625, 1.4656982421875, 1.60888671875, 1.7520751953125, 1.895263671875, 2.0384521484375, 2.181640625, 2.3248291015625, 2.468017578125, 2.6112060546875, 2.75439453125, 2.8975830078125, 3.040771484375, 3.1839599609375, 3.3271484375, 3.4703369140625, 3.613525390625, 3.7567138671875, 3.89990234375, 4.0430908203125, 4.186279296875, 4.3294677734375, 4.47265625]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 1.0, 3.0, 7.0, 9.0, 12.0, 8.0, 14.0, 21.0, 27.0, 27.0, 54.0, 64.0, 84.0, 126.0, 198.0, 282.0, 396.0, 583.0, 1053.0, 1866.0, 3450.0, 6983.0, 15917.0, 37001.0, 93026.0, 238151.0, 372498.0, 163972.0, 63619.0, 25961.0, 11330.0, 5264.0, 2569.0, 1469.0, 833.0, 518.0, 366.0, 249.0, 142.0, 121.0, 76.0, 62.0, 40.0, 19.0, 20.0, 22.0, 14.0, 14.0, 7.0, 6.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.611328125, -3.488067626953125, -3.36480712890625, -3.241546630859375, -3.1182861328125, -2.995025634765625, -2.87176513671875, -2.748504638671875, -2.625244140625, -2.501983642578125, -2.37872314453125, -2.255462646484375, -2.1322021484375, -2.008941650390625, -1.88568115234375, -1.762420654296875, -1.63916015625, -1.515899658203125, -1.39263916015625, -1.269378662109375, -1.1461181640625, -1.022857666015625, -0.89959716796875, -0.776336669921875, -0.653076171875, -0.529815673828125, -0.40655517578125, -0.283294677734375, -0.1600341796875, -0.036773681640625, 0.08648681640625, 0.209747314453125, 0.3330078125, 0.456268310546875, 0.57952880859375, 0.702789306640625, 0.8260498046875, 0.949310302734375, 1.07257080078125, 1.195831298828125, 1.319091796875, 1.442352294921875, 1.56561279296875, 1.688873291015625, 1.8121337890625, 1.935394287109375, 2.05865478515625, 2.181915283203125, 2.30517578125, 2.428436279296875, 2.55169677734375, 2.674957275390625, 2.7982177734375, 2.921478271484375, 3.04473876953125, 3.167999267578125, 3.291259765625, 3.414520263671875, 3.53778076171875, 3.661041259765625, 3.7843017578125, 3.907562255859375, 4.03082275390625, 4.154083251953125, 4.27734375]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 0.0, 4.0, 6.0, 1.0, 8.0, 2.0, 5.0, 9.0, 6.0, 12.0, 17.0, 16.0, 19.0, 24.0, 33.0, 34.0, 34.0, 39.0, 42.0, 40.0, 53.0, 57.0, 152.0, 1601.0, 297.0, 117.0, 53.0, 53.0, 31.0, 39.0, 29.0, 27.0, 21.0, 31.0, 33.0, 20.0, 24.0, 16.0, 14.0, 7.0, 5.0, 3.0, 5.0, 3.0, 5.0, 4.0, 2.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.1171875, -13.6090087890625, -13.100830078125, -12.5926513671875, -12.08447265625, -11.5762939453125, -11.068115234375, -10.5599365234375, -10.0517578125, -9.5435791015625, -9.035400390625, -8.5272216796875, -8.01904296875, -7.5108642578125, -7.002685546875, -6.4945068359375, -5.986328125, -5.4781494140625, -4.969970703125, -4.4617919921875, -3.95361328125, -3.4454345703125, -2.937255859375, -2.4290771484375, -1.9208984375, -1.4127197265625, -0.904541015625, -0.3963623046875, 0.11181640625, 0.6199951171875, 1.128173828125, 1.6363525390625, 2.14453125, 2.6527099609375, 3.160888671875, 3.6690673828125, 4.17724609375, 4.6854248046875, 5.193603515625, 5.7017822265625, 6.2099609375, 6.7181396484375, 7.226318359375, 7.7344970703125, 8.24267578125, 8.7508544921875, 9.259033203125, 9.7672119140625, 10.275390625, 10.7835693359375, 11.291748046875, 11.7999267578125, 12.30810546875, 12.8162841796875, 13.324462890625, 13.8326416015625, 14.3408203125, 14.8489990234375, 15.357177734375, 15.8653564453125, 16.37353515625, 16.8817138671875, 17.389892578125, 17.8980712890625, 18.40625]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 7.0, 10.0, 7.0, 4.0, 14.0, 17.0, 37.0, 49.0, 42.0, 53.0, 62.0, 76.0, 131.0, 147.0, 244.0, 366.0, 670.0, 3596.0, 1964206.0, 1170782.0, 3330.0, 654.0, 362.0, 222.0, 155.0, 114.0, 90.0, 56.0, 47.0, 27.0, 34.0, 16.0, 15.0, 8.0, 10.0, 7.0, 6.0, 8.0, 8.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-40.9375, -39.6962890625, -38.455078125, -37.2138671875, -35.97265625, -34.7314453125, -33.490234375, -32.2490234375, -31.0078125, -29.7666015625, -28.525390625, -27.2841796875, -26.04296875, -24.8017578125, -23.560546875, -22.3193359375, -21.078125, -19.8369140625, -18.595703125, -17.3544921875, -16.11328125, -14.8720703125, -13.630859375, -12.3896484375, -11.1484375, -9.9072265625, -8.666015625, -7.4248046875, -6.18359375, -4.9423828125, -3.701171875, -2.4599609375, -1.21875, 0.0224609375, 1.263671875, 2.5048828125, 3.74609375, 4.9873046875, 6.228515625, 7.4697265625, 8.7109375, 9.9521484375, 11.193359375, 12.4345703125, 13.67578125, 14.9169921875, 16.158203125, 17.3994140625, 18.640625, 19.8818359375, 21.123046875, 22.3642578125, 23.60546875, 24.8466796875, 26.087890625, 27.3291015625, 28.5703125, 29.8115234375, 31.052734375, 32.2939453125, 33.53515625, 34.7763671875, 36.017578125, 37.2587890625, 38.5]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 16.0, 100.0, 449.0, 393.0, 51.0, 8.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.818111419677734, -13.15771484375, -10.497318267822266, -7.836922645568848, -5.176526069641113, -2.516129493713379, 0.14426612854003906, 2.8046627044677734, 5.465059280395508, 8.125455856323242, 10.785852432250977, 13.446248054504395, 16.106643676757812, 18.767040252685547, 21.42743682861328, 24.087833404541016, 26.74822998046875, 29.408626556396484, 32.06902313232422, 34.72941970825195, 37.38981628417969, 40.05021286010742, 42.710609436035156, 45.371002197265625, 48.031402587890625, 50.69179916381836, 53.352195739746094, 56.01259231567383, 58.67298889160156, 61.3333854675293, 63.99378204345703, 66.6541748046875, 69.31456756591797, 71.97496032714844, 74.63536071777344, 77.2957534790039, 79.9561538696289, 82.61654663085938, 85.27694702148438, 87.93733978271484, 90.59774017333984, 93.25813293457031, 95.91853332519531, 98.57892608642578, 101.23932647705078, 103.89971923828125, 106.56011962890625, 109.22051239013672, 111.88090515136719, 114.54129791259766, 117.20169830322266, 119.86209106445312, 122.52249145507812, 125.1828842163086, 127.8432846069336, 130.50367736816406, 133.16407775878906, 135.82447814941406, 138.48486328125, 141.145263671875, 143.8056640625, 146.466064453125, 149.12644958496094, 151.78684997558594, 154.44725036621094]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 8.0, 10.0, 6.0, 6.0, 8.0, 13.0, 15.0, 13.0, 16.0, 14.0, 20.0, 21.0, 30.0, 27.0, 39.0, 23.0, 27.0, 39.0, 29.0, 37.0, 36.0, 32.0, 40.0, 29.0, 43.0, 31.0, 34.0, 36.0, 35.0, 44.0, 31.0, 32.0, 23.0, 18.0, 17.0, 17.0, 20.0, 13.0, 15.0, 8.0, 10.0, 7.0, 6.0, 7.0, 5.0, 5.0, 4.0, 1.0, 3.0, 3.0, 0.0, 0.0, 2.0], "bins": [-44.21326446533203, -42.90032958984375, -41.5873908996582, -40.27445602416992, -38.96152114868164, -37.648582458496094, -36.33564758300781, -35.02271270751953, -33.70977783203125, -32.39684295654297, -31.083906173706055, -29.77096939086914, -28.45803451538086, -27.145097732543945, -25.83216094970703, -24.51922607421875, -23.206287384033203, -21.89335060119629, -20.580415725708008, -19.267478942871094, -17.954544067382812, -16.6416072845459, -15.328670501708984, -14.015734672546387, -12.702798843383789, -11.389863014221191, -10.076927185058594, -8.76399040222168, -7.451054573059082, -6.138118743896484, -4.8251824378967285, -3.5122461318969727, -2.1993064880371094, -0.8863704204559326, 0.42656564712524414, 1.739501714706421, 3.0524377822875977, 4.365373611450195, 5.678309917449951, 6.991246223449707, 8.304182052612305, 9.617117881774902, 10.9300537109375, 12.242990493774414, 13.555926322937012, 14.86886215209961, 16.181798934936523, 17.494735717773438, 18.80767059326172, 20.120607376098633, 21.433542251586914, 22.746479034423828, 24.05941390991211, 25.372350692749023, 26.685287475585938, 27.99822235107422, 29.311159133911133, 30.624095916748047, 31.937030792236328, 33.24996566772461, 34.562904357910156, 35.87583923339844, 37.18877410888672, 38.501712799072266, 39.81464767456055]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 8.0, 5.0, 9.0, 16.0, 10.0, 15.0, 12.0, 8.0, 19.0, 24.0, 21.0, 30.0, 17.0, 34.0, 31.0, 44.0, 40.0, 32.0, 30.0, 38.0, 37.0, 28.0, 34.0, 33.0, 39.0, 44.0, 36.0, 32.0, 37.0, 27.0, 34.0, 34.0, 25.0, 21.0, 19.0, 9.0, 14.0, 7.0, 4.0, 11.0, 1.0, 4.0, 5.0, 4.0, 4.0, 3.0, 5.0, 0.0, 3.0, 5.0, 1.0, 1.0, 1.0], "bins": [-4.8359375, -4.68646240234375, -4.5369873046875, -4.38751220703125, -4.238037109375, -4.08856201171875, -3.9390869140625, -3.78961181640625, -3.64013671875, -3.49066162109375, -3.3411865234375, -3.19171142578125, -3.042236328125, -2.89276123046875, -2.7432861328125, -2.59381103515625, -2.4443359375, -2.29486083984375, -2.1453857421875, -1.99591064453125, -1.846435546875, -1.69696044921875, -1.5474853515625, -1.39801025390625, -1.24853515625, -1.09906005859375, -0.9495849609375, -0.80010986328125, -0.650634765625, -0.50115966796875, -0.3516845703125, -0.20220947265625, -0.052734375, 0.09674072265625, 0.2462158203125, 0.39569091796875, 0.545166015625, 0.69464111328125, 0.8441162109375, 0.99359130859375, 1.14306640625, 1.29254150390625, 1.4420166015625, 1.59149169921875, 1.740966796875, 1.89044189453125, 2.0399169921875, 2.18939208984375, 2.3388671875, 2.48834228515625, 2.6378173828125, 2.78729248046875, 2.936767578125, 3.08624267578125, 3.2357177734375, 3.38519287109375, 3.53466796875, 3.68414306640625, 3.8336181640625, 3.98309326171875, 4.132568359375, 4.28204345703125, 4.4315185546875, 4.58099365234375, 4.73046875]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 6.0, 9.0, 9.0, 10.0, 6.0, 7.0, 17.0, 22.0, 22.0, 19.0, 17.0, 23.0, 25.0, 41.0, 63.0, 85.0, 248.0, 542.0, 2317.0, 18886.0, 646418.0, 3249619.0, 262902.0, 10393.0, 1565.0, 453.0, 160.0, 97.0, 56.0, 33.0, 25.0, 33.0, 26.0, 17.0, 21.0, 13.0, 13.0, 5.0, 11.0, 7.0, 8.0, 3.0, 4.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 1.0], "bins": [-17.890625, -17.338134765625, -16.78564453125, -16.233154296875, -15.6806640625, -15.128173828125, -14.57568359375, -14.023193359375, -13.470703125, -12.918212890625, -12.36572265625, -11.813232421875, -11.2607421875, -10.708251953125, -10.15576171875, -9.603271484375, -9.05078125, -8.498291015625, -7.94580078125, -7.393310546875, -6.8408203125, -6.288330078125, -5.73583984375, -5.183349609375, -4.630859375, -4.078369140625, -3.52587890625, -2.973388671875, -2.4208984375, -1.868408203125, -1.31591796875, -0.763427734375, -0.2109375, 0.341552734375, 0.89404296875, 1.446533203125, 1.9990234375, 2.551513671875, 3.10400390625, 3.656494140625, 4.208984375, 4.761474609375, 5.31396484375, 5.866455078125, 6.4189453125, 6.971435546875, 7.52392578125, 8.076416015625, 8.62890625, 9.181396484375, 9.73388671875, 10.286376953125, 10.8388671875, 11.391357421875, 11.94384765625, 12.496337890625, 13.048828125, 13.601318359375, 14.15380859375, 14.706298828125, 15.2587890625, 15.811279296875, 16.36376953125, 16.916259765625, 17.46875]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 5.0, 10.0, 14.0, 21.0, 21.0, 43.0, 71.0, 90.0, 131.0, 239.0, 343.0, 459.0, 611.0, 597.0, 479.0, 333.0, 217.0, 143.0, 83.0, 53.0, 33.0, 14.0, 20.0, 20.0, 12.0, 6.0, 6.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.9765625, -14.5067138671875, -14.036865234375, -13.5670166015625, -13.09716796875, -12.6273193359375, -12.157470703125, -11.6876220703125, -11.2177734375, -10.7479248046875, -10.278076171875, -9.8082275390625, -9.33837890625, -8.8685302734375, -8.398681640625, -7.9288330078125, -7.458984375, -6.9891357421875, -6.519287109375, -6.0494384765625, -5.57958984375, -5.1097412109375, -4.639892578125, -4.1700439453125, -3.7001953125, -3.2303466796875, -2.760498046875, -2.2906494140625, -1.82080078125, -1.3509521484375, -0.881103515625, -0.4112548828125, 0.05859375, 0.5284423828125, 0.998291015625, 1.4681396484375, 1.93798828125, 2.4078369140625, 2.877685546875, 3.3475341796875, 3.8173828125, 4.2872314453125, 4.757080078125, 5.2269287109375, 5.69677734375, 6.1666259765625, 6.636474609375, 7.1063232421875, 7.576171875, 8.0460205078125, 8.515869140625, 8.9857177734375, 9.45556640625, 9.9254150390625, 10.395263671875, 10.8651123046875, 11.3349609375, 11.8048095703125, 12.274658203125, 12.7445068359375, 13.21435546875, 13.6842041015625, 14.154052734375, 14.6239013671875, 15.09375]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 4.0, 7.0, 11.0, 17.0, 12.0, 23.0, 31.0, 52.0, 53.0, 80.0, 126.0, 142.0, 216.0, 343.0, 513.0, 1264.0, 32397.0, 4056707.0, 98886.0, 1740.0, 553.0, 335.0, 211.0, 134.0, 126.0, 82.0, 49.0, 50.0, 32.0, 26.0, 20.0, 17.0, 9.0, 6.0, 7.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.03125, -51.45263671875, -49.8740234375, -48.29541015625, -46.716796875, -45.13818359375, -43.5595703125, -41.98095703125, -40.40234375, -38.82373046875, -37.2451171875, -35.66650390625, -34.087890625, -32.50927734375, -30.9306640625, -29.35205078125, -27.7734375, -26.19482421875, -24.6162109375, -23.03759765625, -21.458984375, -19.88037109375, -18.3017578125, -16.72314453125, -15.14453125, -13.56591796875, -11.9873046875, -10.40869140625, -8.830078125, -7.25146484375, -5.6728515625, -4.09423828125, -2.515625, -0.93701171875, 0.6416015625, 2.22021484375, 3.798828125, 5.37744140625, 6.9560546875, 8.53466796875, 10.11328125, 11.69189453125, 13.2705078125, 14.84912109375, 16.427734375, 18.00634765625, 19.5849609375, 21.16357421875, 22.7421875, 24.32080078125, 25.8994140625, 27.47802734375, 29.056640625, 30.63525390625, 32.2138671875, 33.79248046875, 35.37109375, 36.94970703125, 38.5283203125, 40.10693359375, 41.685546875, 43.26416015625, 44.8427734375, 46.42138671875, 48.0]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 22.0, 358.0, 548.0, 86.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-128.99755859375, -121.0228500366211, -113.04813385009766, -105.07342529296875, -97.09871673583984, -89.12400817871094, -81.1492919921875, -73.1745834350586, -65.19987487792969, -57.225162506103516, -49.25045394897461, -41.27574157714844, -33.30103302001953, -25.32632064819336, -17.351608276367188, -9.376899719238281, -1.4021835327148438, 6.5725274085998535, 14.54723834991455, 22.521949768066406, 30.496660232543945, 38.471370697021484, 46.446083068847656, 54.42079162597656, 62.395503997802734, 70.3702163696289, 78.34492492675781, 86.31964111328125, 94.29434967041016, 102.26905822753906, 110.2437744140625, 118.21847534179688, 126.19319152832031, 134.16790771484375, 142.14260864257812, 150.11732482910156, 158.092041015625, 166.06674194335938, 174.0414581298828, 182.01617431640625, 189.99087524414062, 197.96559143066406, 205.94029235839844, 213.91500854492188, 221.8897247314453, 229.8644256591797, 237.83914184570312, 245.8138427734375, 253.78857421875, 261.7632751464844, 269.7380065917969, 277.71270751953125, 285.6874084472656, 293.6621398925781, 301.6368408203125, 309.6115417480469, 317.58624267578125, 325.5609436035156, 333.5356750488281, 341.5103759765625, 349.4850769042969, 357.4598083496094, 365.43450927734375, 373.4092102050781, 381.3839416503906]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 3.0, 5.0, 5.0, 5.0, 11.0, 17.0, 14.0, 18.0, 12.0, 23.0, 21.0, 35.0, 16.0, 36.0, 45.0, 25.0, 27.0, 41.0, 44.0, 44.0, 50.0, 40.0, 41.0, 38.0, 44.0, 29.0, 37.0, 26.0, 31.0, 25.0, 32.0, 24.0, 23.0, 19.0, 15.0, 10.0, 15.0, 9.0, 14.0, 5.0, 7.0, 4.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-33.35020446777344, -32.268035888671875, -31.18586540222168, -30.103696823120117, -29.021526336669922, -27.93935775756836, -26.857189178466797, -25.775020599365234, -24.69285011291504, -23.610681533813477, -22.52851104736328, -21.44634246826172, -20.364173889160156, -19.28200340270996, -18.1998348236084, -17.117664337158203, -16.03549575805664, -14.953326225280762, -13.871156692504883, -12.78898811340332, -11.706818580627441, -10.624649047851562, -9.54248046875, -8.460310935974121, -7.378141403198242, -6.295971870422363, -5.213802814483643, -4.131633758544922, -3.049464225769043, -1.967294692993164, -0.8851256370544434, 0.19704341888427734, 1.2792129516601562, 2.361382246017456, 3.443551540374756, 4.525720596313477, 5.6078901290893555, 6.690059661865234, 7.772228717803955, 8.854397773742676, 9.936567306518555, 11.018736839294434, 12.100906372070312, 13.183074951171875, 14.265244483947754, 15.347414016723633, 16.429582595825195, 17.51175308227539, 18.593921661376953, 19.676090240478516, 20.75826072692871, 21.840429306030273, 22.92259979248047, 24.00476837158203, 25.086936950683594, 26.169105529785156, 27.25127601623535, 28.333444595336914, 29.41561508178711, 30.497783660888672, 31.579952239990234, 32.66212463378906, 33.744293212890625, 34.82646179199219, 35.90863037109375]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 6.0, 4.0, 2.0, 6.0, 11.0, 8.0, 12.0, 14.0, 11.0, 17.0, 21.0, 17.0, 24.0, 23.0, 30.0, 25.0, 23.0, 21.0, 44.0, 37.0, 33.0, 43.0, 40.0, 28.0, 39.0, 39.0, 45.0, 42.0, 35.0, 31.0, 38.0, 34.0, 34.0, 23.0, 31.0, 23.0, 18.0, 14.0, 6.0, 12.0, 5.0, 12.0, 2.0, 6.0, 3.0, 0.0, 6.0, 1.0, 2.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.72265625, -4.5728759765625, -4.423095703125, -4.2733154296875, -4.12353515625, -3.9737548828125, -3.823974609375, -3.6741943359375, -3.5244140625, -3.3746337890625, -3.224853515625, -3.0750732421875, -2.92529296875, -2.7755126953125, -2.625732421875, -2.4759521484375, -2.326171875, -2.1763916015625, -2.026611328125, -1.8768310546875, -1.72705078125, -1.5772705078125, -1.427490234375, -1.2777099609375, -1.1279296875, -0.9781494140625, -0.828369140625, -0.6785888671875, -0.52880859375, -0.3790283203125, -0.229248046875, -0.0794677734375, 0.0703125, 0.2200927734375, 0.369873046875, 0.5196533203125, 0.66943359375, 0.8192138671875, 0.968994140625, 1.1187744140625, 1.2685546875, 1.4183349609375, 1.568115234375, 1.7178955078125, 1.86767578125, 2.0174560546875, 2.167236328125, 2.3170166015625, 2.466796875, 2.6165771484375, 2.766357421875, 2.9161376953125, 3.06591796875, 3.2156982421875, 3.365478515625, 3.5152587890625, 3.6650390625, 3.8148193359375, 3.964599609375, 4.1143798828125, 4.26416015625, 4.4139404296875, 4.563720703125, 4.7135009765625, 4.86328125]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 5.0, 8.0, 21.0, 29.0, 34.0, 61.0, 72.0, 111.0, 152.0, 232.0, 325.0, 467.0, 674.0, 944.0, 1302.0, 1842.0, 2565.0, 3543.0, 5196.0, 7272.0, 10451.0, 14950.0, 22459.0, 33539.0, 50886.0, 79570.0, 123273.0, 170668.0, 168320.0, 119844.0, 77075.0, 49602.0, 32413.0, 21656.0, 14678.0, 10145.0, 7082.0, 4970.0, 3475.0, 2581.0, 1786.0, 1260.0, 927.0, 610.0, 449.0, 348.0, 195.0, 184.0, 108.0, 66.0, 46.0, 37.0, 15.0, 15.0, 18.0, 7.0, 1.0, 0.0, 3.0, 1.0, 1.0], "bins": [-0.41943359375, -0.4058876037597656, -0.39234161376953125, -0.3787956237792969, -0.3652496337890625, -0.3517036437988281, -0.33815765380859375, -0.3246116638183594, -0.311065673828125, -0.2975196838378906, -0.28397369384765625, -0.2704277038574219, -0.2568817138671875, -0.24333572387695312, -0.22978973388671875, -0.21624374389648438, -0.20269775390625, -0.18915176391601562, -0.17560577392578125, -0.16205978393554688, -0.1485137939453125, -0.13496780395507812, -0.12142181396484375, -0.10787582397460938, -0.094329833984375, -0.08078384399414062, -0.06723785400390625, -0.053691864013671875, -0.0401458740234375, -0.026599884033203125, -0.01305389404296875, 0.000492095947265625, 0.0140380859375, 0.027584075927734375, 0.04113006591796875, 0.054676055908203125, 0.0682220458984375, 0.08176803588867188, 0.09531402587890625, 0.10886001586914062, 0.122406005859375, 0.13595199584960938, 0.14949798583984375, 0.16304397583007812, 0.1765899658203125, 0.19013595581054688, 0.20368194580078125, 0.21722793579101562, 0.23077392578125, 0.24431991577148438, 0.25786590576171875, 0.2714118957519531, 0.2849578857421875, 0.2985038757324219, 0.31204986572265625, 0.3255958557128906, 0.339141845703125, 0.3526878356933594, 0.36623382568359375, 0.3797798156738281, 0.3933258056640625, 0.4068717956542969, 0.42041778564453125, 0.4339637756347656, 0.447509765625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 2.0, 3.0, 4.0, 13.0, 10.0, 7.0, 11.0, 24.0, 16.0, 23.0, 16.0, 20.0, 28.0, 31.0, 32.0, 33.0, 34.0, 40.0, 36.0, 37.0, 48.0, 1075.0, 38.0, 54.0, 42.0, 34.0, 37.0, 32.0, 33.0, 18.0, 29.0, 18.0, 27.0, 22.0, 16.0, 17.0, 19.0, 11.0, 6.0, 5.0, 5.0, 4.0, 6.0, 2.0, 3.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.279296875, -3.175750732421875, -3.07220458984375, -2.968658447265625, -2.8651123046875, -2.761566162109375, -2.65802001953125, -2.554473876953125, -2.450927734375, -2.347381591796875, -2.24383544921875, -2.140289306640625, -2.0367431640625, -1.933197021484375, -1.82965087890625, -1.726104736328125, -1.62255859375, -1.519012451171875, -1.41546630859375, -1.311920166015625, -1.2083740234375, -1.104827880859375, -1.00128173828125, -0.897735595703125, -0.794189453125, -0.690643310546875, -0.58709716796875, -0.483551025390625, -0.3800048828125, -0.276458740234375, -0.17291259765625, -0.069366455078125, 0.0341796875, 0.137725830078125, 0.24127197265625, 0.344818115234375, 0.4483642578125, 0.551910400390625, 0.65545654296875, 0.759002685546875, 0.862548828125, 0.966094970703125, 1.06964111328125, 1.173187255859375, 1.2767333984375, 1.380279541015625, 1.48382568359375, 1.587371826171875, 1.69091796875, 1.794464111328125, 1.89801025390625, 2.001556396484375, 2.1051025390625, 2.208648681640625, 2.31219482421875, 2.415740966796875, 2.519287109375, 2.622833251953125, 2.72637939453125, 2.829925537109375, 2.9334716796875, 3.037017822265625, 3.14056396484375, 3.244110107421875, 3.34765625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 7.0, 5.0, 9.0, 12.0, 20.0, 23.0, 36.0, 53.0, 71.0, 131.0, 160.0, 257.0, 396.0, 608.0, 935.0, 1413.0, 2174.0, 3299.0, 5255.0, 8430.0, 13501.0, 21840.0, 35490.0, 58861.0, 95956.0, 151841.0, 1246572.0, 167845.0, 108738.0, 66367.0, 40953.0, 24627.0, 15095.0, 9333.0, 5991.0, 3749.0, 2403.0, 1565.0, 1082.0, 636.0, 467.0, 320.0, 200.0, 128.0, 95.0, 63.0, 43.0, 27.0, 17.0, 12.0, 12.0, 8.0, 4.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.458251953125, -0.44329071044921875, -0.4283294677734375, -0.41336822509765625, -0.398406982421875, -0.38344573974609375, -0.3684844970703125, -0.35352325439453125, -0.33856201171875, -0.32360076904296875, -0.3086395263671875, -0.29367828369140625, -0.278717041015625, -0.26375579833984375, -0.2487945556640625, -0.23383331298828125, -0.2188720703125, -0.20391082763671875, -0.1889495849609375, -0.17398834228515625, -0.159027099609375, -0.14406585693359375, -0.1291046142578125, -0.11414337158203125, -0.09918212890625, -0.08422088623046875, -0.0692596435546875, -0.05429840087890625, -0.039337158203125, -0.02437591552734375, -0.0094146728515625, 0.00554656982421875, 0.0205078125, 0.03546905517578125, 0.0504302978515625, 0.06539154052734375, 0.080352783203125, 0.09531402587890625, 0.1102752685546875, 0.12523651123046875, 0.14019775390625, 0.15515899658203125, 0.1701202392578125, 0.18508148193359375, 0.200042724609375, 0.21500396728515625, 0.2299652099609375, 0.24492645263671875, 0.2598876953125, 0.27484893798828125, 0.2898101806640625, 0.30477142333984375, 0.319732666015625, 0.33469390869140625, 0.3496551513671875, 0.36461639404296875, 0.37957763671875, 0.39453887939453125, 0.4095001220703125, 0.42446136474609375, 0.439422607421875, 0.45438385009765625, 0.4693450927734375, 0.48430633544921875, 0.499267578125]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 5.0, 6.0, 2.0, 6.0, 4.0, 11.0, 10.0, 14.0, 15.0, 14.0, 16.0, 29.0, 25.0, 26.0, 34.0, 29.0, 32.0, 45.0, 45.0, 27.0, 48.0, 44.0, 45.0, 38.0, 29.0, 40.0, 51.0, 33.0, 32.0, 34.0, 27.0, 26.0, 30.0, 29.0, 15.0, 17.0, 16.0, 8.0, 13.0, 9.0, 5.0, 11.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006694793701171875, -0.0006475299596786499, -0.0006255805492401123, -0.0006036311388015747, -0.0005816817283630371, -0.0005597323179244995, -0.0005377829074859619, -0.0005158334970474243, -0.0004938840866088867, -0.0004719346761703491, -0.0004499852657318115, -0.0004280358552932739, -0.00040608644485473633, -0.00038413703441619873, -0.00036218762397766113, -0.00034023821353912354, -0.00031828880310058594, -0.00029633939266204834, -0.00027438998222351074, -0.00025244057178497314, -0.00023049116134643555, -0.00020854175090789795, -0.00018659234046936035, -0.00016464293003082275, -0.00014269351959228516, -0.00012074410915374756, -9.879469871520996e-05, -7.684528827667236e-05, -5.4895877838134766e-05, -3.294646739959717e-05, -1.099705696105957e-05, 1.0952353477478027e-05, 3.2901763916015625e-05, 5.485117435455322e-05, 7.680058479309082e-05, 9.874999523162842e-05, 0.00012069940567016602, 0.0001426488161087036, 0.0001645982265472412, 0.0001865476369857788, 0.0002084970474243164, 0.000230446457862854, 0.0002523958683013916, 0.0002743452787399292, 0.0002962946891784668, 0.0003182440996170044, 0.000340193510055542, 0.0003621429204940796, 0.0003840923309326172, 0.0004060417413711548, 0.0004279911518096924, 0.00044994056224823, 0.0004718899726867676, 0.0004938393831253052, 0.0005157887935638428, 0.0005377382040023804, 0.000559687614440918, 0.0005816370248794556, 0.0006035864353179932, 0.0006255358457565308, 0.0006474852561950684, 0.000669434666633606, 0.0006913840770721436, 0.0007133334875106812, 0.0007352828979492188]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 6.0, 7.0, 11.0, 13.0, 8.0, 12.0, 21.0, 21.0, 29.0, 29.0, 37.0, 52.0, 56.0, 68.0, 87.0, 150.0, 306.0, 818.0, 4147.0, 1018393.0, 22157.0, 1043.0, 408.0, 159.0, 106.0, 75.0, 58.0, 42.0, 43.0, 37.0, 27.0, 25.0, 25.0, 14.0, 10.0, 14.0, 9.0, 1.0, 7.0, 2.0, 5.0, 10.0, 3.0, 3.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.0182342529296875, -0.017722368240356445, -0.01721048355102539, -0.016698598861694336, -0.01618671417236328, -0.015674829483032227, -0.015162944793701172, -0.014651060104370117, -0.014139175415039062, -0.013627290725708008, -0.013115406036376953, -0.012603521347045898, -0.012091636657714844, -0.011579751968383789, -0.011067867279052734, -0.01055598258972168, -0.010044097900390625, -0.00953221321105957, -0.009020328521728516, -0.008508443832397461, -0.007996559143066406, -0.0074846744537353516, -0.006972789764404297, -0.006460905075073242, -0.0059490203857421875, -0.005437135696411133, -0.004925251007080078, -0.0044133663177490234, -0.0039014816284179688, -0.003389596939086914, -0.0028777122497558594, -0.0023658275604248047, -0.00185394287109375, -0.0013420581817626953, -0.0008301734924316406, -0.00031828880310058594, 0.00019359588623046875, 0.0007054805755615234, 0.0012173652648925781, 0.0017292499542236328, 0.0022411346435546875, 0.002753019332885742, 0.003264904022216797, 0.0037767887115478516, 0.004288673400878906, 0.004800558090209961, 0.005312442779541016, 0.00582432746887207, 0.006336212158203125, 0.00684809684753418, 0.007359981536865234, 0.007871866226196289, 0.008383750915527344, 0.008895635604858398, 0.009407520294189453, 0.009919404983520508, 0.010431289672851562, 0.010943174362182617, 0.011455059051513672, 0.011966943740844727, 0.012478828430175781, 0.012990713119506836, 0.01350259780883789, 0.014014482498168945, 0.0145263671875]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 12.0, 76.0, 216.0, 336.0, 227.0, 112.0, 25.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002292017685249448, -0.0022468240931630135, -0.002201630501076579, -0.0021564369089901447, -0.0021112433169037104, -0.002066049724817276, -0.0020208561327308416, -0.0019756625406444073, -0.001930468948557973, -0.0018852753564715385, -0.0018400817643851042, -0.0017948881722986698, -0.0017496945802122355, -0.001704500988125801, -0.0016593073960393667, -0.0016141138039529324, -0.001568920211866498, -0.0015237266197800636, -0.0014785330276936293, -0.001433339435607195, -0.0013881458435207605, -0.0013429522514343262, -0.0012977586593478918, -0.0012525650672614574, -0.001207371475175023, -0.0011621778830885887, -0.0011169842910021544, -0.00107179069891572, -0.0010265971068292856, -0.0009814035147428513, -0.0009362099226564169, -0.0008910163305699825, -0.0008458227384835482, -0.0008006291463971138, -0.0007554355543106794, -0.0007102419622242451, -0.0006650483701378107, -0.0006198547780513763, -0.000574661185964942, -0.0005294675938785076, -0.00048427400179207325, -0.0004390804097056389, -0.0003938868176192045, -0.00034869322553277016, -0.0003034996334463358, -0.00025830604135990143, -0.00021311244927346706, -0.0001679188571870327, -0.00012272526510059834, -7.753167301416397e-05, -3.233808092772961e-05, 1.2855511158704758e-05, 5.804910324513912e-05, 0.00010324269533157349, 0.00014843628741800785, 0.00019362987950444221, 0.00023882347159087658, 0.00028401706367731094, 0.0003292106557637453, 0.00037440424785017967, 0.00041959783993661404, 0.0004647914320230484, 0.0005099850241094828, 0.0005551786161959171, 0.0006003722082823515]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 3.0, 8.0, 8.0, 3.0, 9.0, 9.0, 16.0, 13.0, 25.0, 19.0, 24.0, 20.0, 20.0, 36.0, 31.0, 35.0, 30.0, 26.0, 41.0, 41.0, 51.0, 29.0, 50.0, 38.0, 33.0, 39.0, 33.0, 27.0, 35.0, 32.0, 26.0, 27.0, 19.0, 23.0, 10.0, 24.0, 19.0, 13.0, 13.0, 14.0, 8.0, 1.0, 5.0, 6.0, 7.0, 4.0, 0.0, 1.0, 3.0, 0.0, 2.0], "bins": [-0.00045299530029296875, -0.00044030509889125824, -0.00042761489748954773, -0.0004149246960878372, -0.0004022344946861267, -0.0003895442932844162, -0.0003768540918827057, -0.0003641638904809952, -0.00035147368907928467, -0.00033878348767757416, -0.00032609328627586365, -0.00031340308487415314, -0.0003007128834724426, -0.0002880226820707321, -0.0002753324806690216, -0.0002626422792673111, -0.0002499520778656006, -0.00023726187646389008, -0.00022457167506217957, -0.00021188147366046906, -0.00019919127225875854, -0.00018650107085704803, -0.00017381086945533752, -0.00016112066805362701, -0.0001484304666519165, -0.000135740265250206, -0.00012305006384849548, -0.00011035986244678497, -9.766966104507446e-05, -8.497945964336395e-05, -7.228925824165344e-05, -5.959905683994293e-05, -4.690885543823242e-05, -3.421865403652191e-05, -2.15284526348114e-05, -8.838251233100891e-06, 3.851950168609619e-06, 1.654215157032013e-05, 2.923235297203064e-05, 4.192255437374115e-05, 5.461275577545166e-05, 6.730295717716217e-05, 7.999315857887268e-05, 9.268335998058319e-05, 0.0001053735613822937, 0.00011806376278400421, 0.00013075396418571472, 0.00014344416558742523, 0.00015613436698913574, 0.00016882456839084625, 0.00018151476979255676, 0.00019420497119426727, 0.00020689517259597778, 0.0002195853739976883, 0.0002322755753993988, 0.0002449657768011093, 0.0002576559782028198, 0.00027034617960453033, 0.00028303638100624084, 0.00029572658240795135, 0.00030841678380966187, 0.0003211069852113724, 0.0003337971866130829, 0.0003464873880147934, 0.0003591775894165039]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 6.0, 4.0, 2.0, 6.0, 12.0, 7.0, 12.0, 14.0, 11.0, 17.0, 21.0, 17.0, 24.0, 23.0, 30.0, 25.0, 23.0, 21.0, 44.0, 37.0, 33.0, 43.0, 40.0, 28.0, 39.0, 39.0, 45.0, 42.0, 35.0, 31.0, 38.0, 34.0, 34.0, 23.0, 30.0, 24.0, 18.0, 14.0, 6.0, 12.0, 5.0, 12.0, 2.0, 6.0, 3.0, 0.0, 6.0, 1.0, 2.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.72265625, -4.5728759765625, -4.423095703125, -4.2733154296875, -4.12353515625, -3.9737548828125, -3.823974609375, -3.6741943359375, -3.5244140625, -3.3746337890625, -3.224853515625, -3.0750732421875, -2.92529296875, -2.7755126953125, -2.625732421875, -2.4759521484375, -2.326171875, -2.1763916015625, -2.026611328125, -1.8768310546875, -1.72705078125, -1.5772705078125, -1.427490234375, -1.2777099609375, -1.1279296875, -0.9781494140625, -0.828369140625, -0.6785888671875, -0.52880859375, -0.3790283203125, -0.229248046875, -0.0794677734375, 0.0703125, 0.2200927734375, 0.369873046875, 0.5196533203125, 0.66943359375, 0.8192138671875, 0.968994140625, 1.1187744140625, 1.2685546875, 1.4183349609375, 1.568115234375, 1.7178955078125, 1.86767578125, 2.0174560546875, 2.167236328125, 2.3170166015625, 2.466796875, 2.6165771484375, 2.766357421875, 2.9161376953125, 3.06591796875, 3.2156982421875, 3.365478515625, 3.5152587890625, 3.6650390625, 3.8148193359375, 3.964599609375, 4.1143798828125, 4.26416015625, 4.4139404296875, 4.563720703125, 4.7135009765625, 4.86328125]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 7.0, 6.0, 16.0, 13.0, 16.0, 26.0, 39.0, 50.0, 49.0, 101.0, 114.0, 194.0, 265.0, 429.0, 674.0, 1178.0, 2232.0, 4337.0, 8992.0, 21264.0, 54326.0, 151047.0, 382083.0, 261987.0, 95871.0, 35058.0, 14269.0, 6549.0, 3160.0, 1654.0, 886.0, 561.0, 318.0, 237.0, 156.0, 102.0, 78.0, 69.0, 29.0, 35.0, 22.0, 18.0, 14.0, 9.0, 7.0, 8.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.322265625, -3.210693359375, -3.09912109375, -2.987548828125, -2.8759765625, -2.764404296875, -2.65283203125, -2.541259765625, -2.4296875, -2.318115234375, -2.20654296875, -2.094970703125, -1.9833984375, -1.871826171875, -1.76025390625, -1.648681640625, -1.537109375, -1.425537109375, -1.31396484375, -1.202392578125, -1.0908203125, -0.979248046875, -0.86767578125, -0.756103515625, -0.64453125, -0.532958984375, -0.42138671875, -0.309814453125, -0.1982421875, -0.086669921875, 0.02490234375, 0.136474609375, 0.248046875, 0.359619140625, 0.47119140625, 0.582763671875, 0.6943359375, 0.805908203125, 0.91748046875, 1.029052734375, 1.140625, 1.252197265625, 1.36376953125, 1.475341796875, 1.5869140625, 1.698486328125, 1.81005859375, 1.921630859375, 2.033203125, 2.144775390625, 2.25634765625, 2.367919921875, 2.4794921875, 2.591064453125, 2.70263671875, 2.814208984375, 2.92578125, 3.037353515625, 3.14892578125, 3.260498046875, 3.3720703125, 3.483642578125, 3.59521484375, 3.706787109375, 3.818359375]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 8.0, 5.0, 6.0, 13.0, 10.0, 24.0, 19.0, 16.0, 21.0, 28.0, 26.0, 37.0, 34.0, 45.0, 62.0, 56.0, 71.0, 177.0, 1616.0, 255.0, 85.0, 61.0, 50.0, 48.0, 36.0, 32.0, 34.0, 29.0, 15.0, 24.0, 16.0, 16.0, 12.0, 12.0, 14.0, 6.0, 14.0, 7.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-17.34375, -16.8115234375, -16.279296875, -15.7470703125, -15.21484375, -14.6826171875, -14.150390625, -13.6181640625, -13.0859375, -12.5537109375, -12.021484375, -11.4892578125, -10.95703125, -10.4248046875, -9.892578125, -9.3603515625, -8.828125, -8.2958984375, -7.763671875, -7.2314453125, -6.69921875, -6.1669921875, -5.634765625, -5.1025390625, -4.5703125, -4.0380859375, -3.505859375, -2.9736328125, -2.44140625, -1.9091796875, -1.376953125, -0.8447265625, -0.3125, 0.2197265625, 0.751953125, 1.2841796875, 1.81640625, 2.3486328125, 2.880859375, 3.4130859375, 3.9453125, 4.4775390625, 5.009765625, 5.5419921875, 6.07421875, 6.6064453125, 7.138671875, 7.6708984375, 8.203125, 8.7353515625, 9.267578125, 9.7998046875, 10.33203125, 10.8642578125, 11.396484375, 11.9287109375, 12.4609375, 12.9931640625, 13.525390625, 14.0576171875, 14.58984375, 15.1220703125, 15.654296875, 16.1865234375, 16.71875]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 7.0, 5.0, 1.0, 6.0, 11.0, 7.0, 14.0, 24.0, 41.0, 46.0, 84.0, 103.0, 150.0, 254.0, 436.0, 896.0, 38153.0, 3101657.0, 2404.0, 535.0, 322.0, 189.0, 124.0, 77.0, 61.0, 35.0, 32.0, 11.0, 7.0, 7.0, 6.0, 4.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-73.5625, -71.53271484375, -69.5029296875, -67.47314453125, -65.443359375, -63.41357421875, -61.3837890625, -59.35400390625, -57.32421875, -55.29443359375, -53.2646484375, -51.23486328125, -49.205078125, -47.17529296875, -45.1455078125, -43.11572265625, -41.0859375, -39.05615234375, -37.0263671875, -34.99658203125, -32.966796875, -30.93701171875, -28.9072265625, -26.87744140625, -24.84765625, -22.81787109375, -20.7880859375, -18.75830078125, -16.728515625, -14.69873046875, -12.6689453125, -10.63916015625, -8.609375, -6.57958984375, -4.5498046875, -2.52001953125, -0.490234375, 1.53955078125, 3.5693359375, 5.59912109375, 7.62890625, 9.65869140625, 11.6884765625, 13.71826171875, 15.748046875, 17.77783203125, 19.8076171875, 21.83740234375, 23.8671875, 25.89697265625, 27.9267578125, 29.95654296875, 31.986328125, 34.01611328125, 36.0458984375, 38.07568359375, 40.10546875, 42.13525390625, 44.1650390625, 46.19482421875, 48.224609375, 50.25439453125, 52.2841796875, 54.31396484375, 56.34375]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [2.0, 5.0, 12.0, 93.0, 216.0, 333.0, 237.0, 77.0, 31.0, 7.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.776172637939453, -6.392247676849365, -5.008322715759277, -3.6243977546691895, -2.2404727935791016, -0.8565478324890137, 0.5273771286010742, 1.9113025665283203, 3.29522705078125, 4.679152011871338, 6.063076972961426, 7.447001934051514, 8.830926895141602, 10.214851379394531, 11.598776817321777, 12.982702255249023, 14.366626739501953, 15.750551223754883, 17.134475708007812, 18.518402099609375, 19.902326583862305, 21.286251068115234, 22.670177459716797, 24.054101943969727, 25.438026428222656, 26.821950912475586, 28.205875396728516, 29.589801788330078, 30.973726272583008, 32.35765075683594, 33.7415771484375, 35.12550354003906, 36.509429931640625, 37.89335632324219, 39.277278900146484, 40.66120529174805, 42.045127868652344, 43.429054260253906, 44.81298065185547, 46.19690704345703, 47.58082962036133, 48.96475601196289, 50.34867858886719, 51.73260498046875, 53.11653137207031, 54.50045394897461, 55.88438034057617, 57.26830291748047, 58.65222930908203, 60.036155700683594, 61.42007827758789, 62.80400466918945, 64.18792724609375, 65.57185363769531, 66.95578002929688, 68.33970642089844, 69.7236328125, 71.10755920410156, 72.49148559570312, 73.87540435791016, 75.25933074951172, 76.64325714111328, 78.02718353271484, 79.4111099243164, 80.79502868652344]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 6.0, 5.0, 9.0, 7.0, 6.0, 7.0, 6.0, 17.0, 13.0, 22.0, 16.0, 24.0, 27.0, 27.0, 32.0, 33.0, 40.0, 32.0, 37.0, 38.0, 45.0, 40.0, 43.0, 28.0, 31.0, 39.0, 32.0, 40.0, 25.0, 27.0, 30.0, 19.0, 30.0, 23.0, 21.0, 14.0, 14.0, 20.0, 16.0, 12.0, 9.0, 8.0, 8.0, 4.0, 6.0, 3.0, 4.0, 6.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-40.71058654785156, -39.452144622802734, -38.193702697753906, -36.93525695800781, -35.676815032958984, -34.418373107910156, -33.15993118286133, -31.901487350463867, -30.643043518066406, -29.384601593017578, -28.126157760620117, -26.86771583557129, -25.609272003173828, -24.350830078125, -23.092388153076172, -21.83394432067871, -20.575502395629883, -19.317060470581055, -18.058616638183594, -16.800174713134766, -15.541730880737305, -14.283288955688477, -13.024846076965332, -11.766403198242188, -10.507960319519043, -9.249517440795898, -7.991074562072754, -6.732632160186768, -5.474189281463623, -4.2157464027404785, -2.957304000854492, -1.6988611221313477, -0.4404182434082031, 0.8180245161056519, 2.076467275619507, 3.3349099159240723, 4.593352794647217, 5.851795673370361, 7.110238075256348, 8.368680953979492, 9.627123832702637, 10.885566711425781, 12.144009590148926, 13.40245246887207, 14.660894393920898, 15.91933822631836, 17.177780151367188, 18.436222076416016, 19.694665908813477, 20.953107833862305, 22.211551666259766, 23.469993591308594, 24.728437423706055, 25.986879348754883, 27.245323181152344, 28.503765106201172, 29.76220703125, 31.020648956298828, 32.279090881347656, 33.53753662109375, 34.79597854614258, 36.054420471191406, 37.312862396240234, 38.57130432128906, 39.829750061035156]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 7.0, 4.0, 7.0, 15.0, 9.0, 7.0, 10.0, 17.0, 14.0, 19.0, 24.0, 21.0, 28.0, 22.0, 31.0, 23.0, 24.0, 34.0, 36.0, 46.0, 31.0, 43.0, 37.0, 30.0, 48.0, 42.0, 43.0, 47.0, 38.0, 30.0, 31.0, 32.0, 23.0, 27.0, 21.0, 17.0, 12.0, 6.0, 8.0, 10.0, 10.0, 1.0, 8.0, 3.0, 3.0, 2.0, 3.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.08203125, -4.91998291015625, -4.7579345703125, -4.59588623046875, -4.433837890625, -4.27178955078125, -4.1097412109375, -3.94769287109375, -3.78564453125, -3.62359619140625, -3.4615478515625, -3.29949951171875, -3.137451171875, -2.97540283203125, -2.8133544921875, -2.65130615234375, -2.4892578125, -2.32720947265625, -2.1651611328125, -2.00311279296875, -1.841064453125, -1.67901611328125, -1.5169677734375, -1.35491943359375, -1.19287109375, -1.03082275390625, -0.8687744140625, -0.70672607421875, -0.544677734375, -0.38262939453125, -0.2205810546875, -0.05853271484375, 0.103515625, 0.26556396484375, 0.4276123046875, 0.58966064453125, 0.751708984375, 0.91375732421875, 1.0758056640625, 1.23785400390625, 1.39990234375, 1.56195068359375, 1.7239990234375, 1.88604736328125, 2.048095703125, 2.21014404296875, 2.3721923828125, 2.53424072265625, 2.6962890625, 2.85833740234375, 3.0203857421875, 3.18243408203125, 3.344482421875, 3.50653076171875, 3.6685791015625, 3.83062744140625, 3.99267578125, 4.15472412109375, 4.3167724609375, 4.47882080078125, 4.640869140625, 4.80291748046875, 4.9649658203125, 5.12701416015625, 5.2890625]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 7.0, 4.0, 7.0, 11.0, 7.0, 8.0, 10.0, 15.0, 16.0, 23.0, 23.0, 35.0, 34.0, 58.0, 81.0, 145.0, 295.0, 655.0, 2225.0, 11727.0, 166493.0, 2284078.0, 1626856.0, 90693.0, 7894.0, 1698.0, 541.0, 212.0, 137.0, 68.0, 51.0, 45.0, 33.0, 23.0, 18.0, 15.0, 9.0, 9.0, 4.0, 8.0, 5.0, 1.0, 3.0, 6.0, 1.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.0234375, -13.5838623046875, -13.144287109375, -12.7047119140625, -12.26513671875, -11.8255615234375, -11.385986328125, -10.9464111328125, -10.5068359375, -10.0672607421875, -9.627685546875, -9.1881103515625, -8.74853515625, -8.3089599609375, -7.869384765625, -7.4298095703125, -6.990234375, -6.5506591796875, -6.111083984375, -5.6715087890625, -5.23193359375, -4.7923583984375, -4.352783203125, -3.9132080078125, -3.4736328125, -3.0340576171875, -2.594482421875, -2.1549072265625, -1.71533203125, -1.2757568359375, -0.836181640625, -0.3966064453125, 0.04296875, 0.4825439453125, 0.922119140625, 1.3616943359375, 1.80126953125, 2.2408447265625, 2.680419921875, 3.1199951171875, 3.5595703125, 3.9991455078125, 4.438720703125, 4.8782958984375, 5.31787109375, 5.7574462890625, 6.197021484375, 6.6365966796875, 7.076171875, 7.5157470703125, 7.955322265625, 8.3948974609375, 8.83447265625, 9.2740478515625, 9.713623046875, 10.1531982421875, 10.5927734375, 11.0323486328125, 11.471923828125, 11.9114990234375, 12.35107421875, 12.7906494140625, 13.230224609375, 13.6697998046875, 14.109375]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 5.0, 5.0, 9.0, 14.0, 25.0, 39.0, 41.0, 68.0, 72.0, 107.0, 123.0, 193.0, 282.0, 367.0, 511.0, 512.0, 449.0, 319.0, 244.0, 192.0, 124.0, 103.0, 74.0, 55.0, 38.0, 30.0, 21.0, 10.0, 10.0, 9.0, 5.0, 7.0, 3.0, 3.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.1171875, -10.76220703125, -10.4072265625, -10.05224609375, -9.697265625, -9.34228515625, -8.9873046875, -8.63232421875, -8.27734375, -7.92236328125, -7.5673828125, -7.21240234375, -6.857421875, -6.50244140625, -6.1474609375, -5.79248046875, -5.4375, -5.08251953125, -4.7275390625, -4.37255859375, -4.017578125, -3.66259765625, -3.3076171875, -2.95263671875, -2.59765625, -2.24267578125, -1.8876953125, -1.53271484375, -1.177734375, -0.82275390625, -0.4677734375, -0.11279296875, 0.2421875, 0.59716796875, 0.9521484375, 1.30712890625, 1.662109375, 2.01708984375, 2.3720703125, 2.72705078125, 3.08203125, 3.43701171875, 3.7919921875, 4.14697265625, 4.501953125, 4.85693359375, 5.2119140625, 5.56689453125, 5.921875, 6.27685546875, 6.6318359375, 6.98681640625, 7.341796875, 7.69677734375, 8.0517578125, 8.40673828125, 8.76171875, 9.11669921875, 9.4716796875, 9.82666015625, 10.181640625, 10.53662109375, 10.8916015625, 11.24658203125, 11.6015625]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 2.0, 1.0, 2.0, 2.0, 4.0, 5.0, 4.0, 5.0, 11.0, 9.0, 16.0, 21.0, 26.0, 25.0, 37.0, 47.0, 58.0, 70.0, 99.0, 129.0, 170.0, 197.0, 282.0, 471.0, 1114.0, 20563.0, 3751003.0, 414324.0, 3542.0, 671.0, 363.0, 233.0, 175.0, 140.0, 96.0, 81.0, 69.0, 49.0, 35.0, 40.0, 21.0, 20.0, 14.0, 12.0, 5.0, 6.0, 6.0, 3.0, 2.0, 6.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-42.84375, -41.5361328125, -40.228515625, -38.9208984375, -37.61328125, -36.3056640625, -34.998046875, -33.6904296875, -32.3828125, -31.0751953125, -29.767578125, -28.4599609375, -27.15234375, -25.8447265625, -24.537109375, -23.2294921875, -21.921875, -20.6142578125, -19.306640625, -17.9990234375, -16.69140625, -15.3837890625, -14.076171875, -12.7685546875, -11.4609375, -10.1533203125, -8.845703125, -7.5380859375, -6.23046875, -4.9228515625, -3.615234375, -2.3076171875, -1.0, 0.3076171875, 1.615234375, 2.9228515625, 4.23046875, 5.5380859375, 6.845703125, 8.1533203125, 9.4609375, 10.7685546875, 12.076171875, 13.3837890625, 14.69140625, 15.9990234375, 17.306640625, 18.6142578125, 19.921875, 21.2294921875, 22.537109375, 23.8447265625, 25.15234375, 26.4599609375, 27.767578125, 29.0751953125, 30.3828125, 31.6904296875, 32.998046875, 34.3056640625, 35.61328125, 36.9208984375, 38.228515625, 39.5361328125, 40.84375]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 10.0, 37.0, 117.0, 325.0, 321.0, 157.0, 38.0, 10.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.4826431274414, -67.50001525878906, -63.51738739013672, -59.534759521484375, -55.55213165283203, -51.56950378417969, -47.586875915527344, -43.604248046875, -39.621620178222656, -35.63899230957031, -31.65636444091797, -27.673736572265625, -23.69110870361328, -19.708480834960938, -15.725852966308594, -11.74322509765625, -7.760597229003906, -3.7779693603515625, 0.20465850830078125, 4.187286376953125, 8.169914245605469, 12.152542114257812, 16.135169982910156, 20.1177978515625, 24.100425720214844, 28.083053588867188, 32.06568145751953, 36.048309326171875, 40.03093719482422, 44.01356506347656, 47.996192932128906, 51.97882080078125, 55.96144104003906, 59.944068908691406, 63.92669677734375, 67.9093246459961, 71.89195251464844, 75.87458038330078, 79.85720825195312, 83.83983612060547, 87.82246398925781, 91.80509185791016, 95.7877197265625, 99.77034759521484, 103.75297546386719, 107.73560333251953, 111.71823120117188, 115.70085906982422, 119.68348693847656, 123.6661148071289, 127.64874267578125, 131.63137817382812, 135.61399841308594, 139.59661865234375, 143.57925415039062, 147.5618896484375, 151.5445098876953, 155.52713012695312, 159.509765625, 163.49240112304688, 167.4750213623047, 171.4576416015625, 175.44027709960938, 179.42291259765625, 183.40553283691406]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 4.0, 8.0, 10.0, 8.0, 7.0, 11.0, 7.0, 19.0, 15.0, 18.0, 15.0, 22.0, 24.0, 24.0, 28.0, 28.0, 38.0, 29.0, 27.0, 31.0, 36.0, 35.0, 48.0, 32.0, 33.0, 38.0, 43.0, 39.0, 39.0, 33.0, 32.0, 34.0, 23.0, 17.0, 22.0, 24.0, 17.0, 13.0, 10.0, 11.0, 4.0, 9.0, 6.0, 10.0, 5.0, 7.0, 8.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.828853607177734, -30.778804779052734, -29.728755950927734, -28.678707122802734, -27.628658294677734, -26.578609466552734, -25.528562545776367, -24.478513717651367, -23.428464889526367, -22.378416061401367, -21.328367233276367, -20.278318405151367, -19.228271484375, -18.17822265625, -17.128173828125, -16.078125, -15.028076171875, -13.97802734375, -12.927978515625, -11.877930641174316, -10.827881813049316, -9.777832984924316, -8.727785110473633, -7.677736282348633, -6.627687454223633, -5.577638626098633, -4.527590274810791, -3.47754168510437, -2.427493095397949, -1.3774442672729492, -0.3273959159851074, 0.7226524353027344, 1.7726974487304688, 2.8227460384368896, 3.8727946281433105, 4.922842979431152, 5.972891807556152, 7.022940635681152, 8.072988510131836, 9.123037338256836, 10.173086166381836, 11.223134994506836, 12.273183822631836, 13.32323169708252, 14.37328052520752, 15.42332935333252, 16.473377227783203, 17.523426055908203, 18.573474884033203, 19.623523712158203, 20.673572540283203, 21.723621368408203, 22.773670196533203, 23.823719024658203, 24.87376594543457, 25.92381477355957, 26.97386360168457, 28.02391242980957, 29.07396125793457, 30.12401008605957, 31.174057006835938, 32.22410583496094, 33.27415466308594, 34.32420349121094, 35.37425231933594]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 2.0, 5.0, 8.0, 10.0, 12.0, 12.0, 9.0, 16.0, 9.0, 16.0, 24.0, 14.0, 25.0, 29.0, 22.0, 35.0, 31.0, 36.0, 42.0, 43.0, 36.0, 38.0, 33.0, 42.0, 47.0, 40.0, 45.0, 38.0, 36.0, 39.0, 38.0, 36.0, 20.0, 18.0, 23.0, 15.0, 13.0, 9.0, 13.0, 3.0, 5.0, 4.0, 4.0, 0.0, 3.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.875, -4.71319580078125, -4.5513916015625, -4.38958740234375, -4.227783203125, -4.06597900390625, -3.9041748046875, -3.74237060546875, -3.58056640625, -3.41876220703125, -3.2569580078125, -3.09515380859375, -2.933349609375, -2.77154541015625, -2.6097412109375, -2.44793701171875, -2.2861328125, -2.12432861328125, -1.9625244140625, -1.80072021484375, -1.638916015625, -1.47711181640625, -1.3153076171875, -1.15350341796875, -0.99169921875, -0.82989501953125, -0.6680908203125, -0.50628662109375, -0.344482421875, -0.18267822265625, -0.0208740234375, 0.14093017578125, 0.302734375, 0.46453857421875, 0.6263427734375, 0.78814697265625, 0.949951171875, 1.11175537109375, 1.2735595703125, 1.43536376953125, 1.59716796875, 1.75897216796875, 1.9207763671875, 2.08258056640625, 2.244384765625, 2.40618896484375, 2.5679931640625, 2.72979736328125, 2.8916015625, 3.05340576171875, 3.2152099609375, 3.37701416015625, 3.538818359375, 3.70062255859375, 3.8624267578125, 4.02423095703125, 4.18603515625, 4.34783935546875, 4.5096435546875, 4.67144775390625, 4.833251953125, 4.99505615234375, 5.1568603515625, 5.31866455078125, 5.48046875]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 12.0, 18.0, 12.0, 28.0, 56.0, 48.0, 86.0, 117.0, 216.0, 289.0, 447.0, 672.0, 999.0, 1486.0, 2269.0, 3547.0, 5495.0, 8466.0, 13231.0, 21392.0, 34685.0, 57360.0, 98395.0, 163407.0, 211497.0, 167804.0, 100997.0, 59006.0, 35657.0, 21892.0, 13974.0, 8734.0, 5657.0, 3631.0, 2372.0, 1557.0, 1039.0, 654.0, 440.0, 295.0, 194.0, 143.0, 95.0, 56.0, 55.0, 20.0, 22.0, 12.0, 5.0, 6.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.5068359375, -0.490234375, -0.4736328125, -0.45703125, -0.4404296875, -0.423828125, -0.4072265625, -0.390625, -0.3740234375, -0.357421875, -0.3408203125, -0.32421875, -0.3076171875, -0.291015625, -0.2744140625, -0.2578125, -0.2412109375, -0.224609375, -0.2080078125, -0.19140625, -0.1748046875, -0.158203125, -0.1416015625, -0.125, -0.1083984375, -0.091796875, -0.0751953125, -0.05859375, -0.0419921875, -0.025390625, -0.0087890625, 0.0078125, 0.0244140625, 0.041015625, 0.0576171875, 0.07421875, 0.0908203125, 0.107421875, 0.1240234375, 0.140625, 0.1572265625, 0.173828125, 0.1904296875, 0.20703125, 0.2236328125, 0.240234375, 0.2568359375, 0.2734375, 0.2900390625, 0.306640625, 0.3232421875, 0.33984375, 0.3564453125, 0.373046875, 0.3896484375, 0.40625, 0.4228515625, 0.439453125, 0.4560546875, 0.47265625, 0.4892578125, 0.505859375, 0.5224609375, 0.5390625, 0.5556640625]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 7.0, 3.0, 6.0, 9.0, 7.0, 17.0, 13.0, 15.0, 20.0, 18.0, 15.0, 20.0, 21.0, 29.0, 32.0, 28.0, 37.0, 41.0, 44.0, 47.0, 49.0, 1078.0, 31.0, 49.0, 39.0, 37.0, 36.0, 40.0, 35.0, 36.0, 28.0, 16.0, 23.0, 18.0, 16.0, 13.0, 12.0, 7.0, 7.0, 6.0, 3.0, 7.0, 2.0, 5.0, 1.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-3.21484375, -3.10943603515625, -3.0040283203125, -2.89862060546875, -2.793212890625, -2.68780517578125, -2.5823974609375, -2.47698974609375, -2.37158203125, -2.26617431640625, -2.1607666015625, -2.05535888671875, -1.949951171875, -1.84454345703125, -1.7391357421875, -1.63372802734375, -1.5283203125, -1.42291259765625, -1.3175048828125, -1.21209716796875, -1.106689453125, -1.00128173828125, -0.8958740234375, -0.79046630859375, -0.68505859375, -0.57965087890625, -0.4742431640625, -0.36883544921875, -0.263427734375, -0.15802001953125, -0.0526123046875, 0.05279541015625, 0.158203125, 0.26361083984375, 0.3690185546875, 0.47442626953125, 0.579833984375, 0.68524169921875, 0.7906494140625, 0.89605712890625, 1.00146484375, 1.10687255859375, 1.2122802734375, 1.31768798828125, 1.423095703125, 1.52850341796875, 1.6339111328125, 1.73931884765625, 1.8447265625, 1.95013427734375, 2.0555419921875, 2.16094970703125, 2.266357421875, 2.37176513671875, 2.4771728515625, 2.58258056640625, 2.68798828125, 2.79339599609375, 2.8988037109375, 3.00421142578125, 3.109619140625, 3.21502685546875, 3.3204345703125, 3.42584228515625, 3.53125]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 4.0, 6.0, 9.0, 16.0, 28.0, 33.0, 42.0, 81.0, 132.0, 185.0, 272.0, 416.0, 684.0, 1010.0, 1550.0, 2353.0, 3652.0, 5945.0, 9262.0, 14653.0, 23742.0, 39090.0, 63196.0, 104441.0, 164127.0, 1247698.0, 156700.0, 99117.0, 60494.0, 37171.0, 22506.0, 14093.0, 8718.0, 5566.0, 3582.0, 2367.0, 1531.0, 891.0, 617.0, 405.0, 252.0, 163.0, 115.0, 79.0, 40.0, 36.0, 28.0, 12.0, 7.0, 3.0, 6.0, 6.0, 5.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.4814453125, -0.46660614013671875, -0.4517669677734375, -0.43692779541015625, -0.422088623046875, -0.40724945068359375, -0.3924102783203125, -0.37757110595703125, -0.36273193359375, -0.34789276123046875, -0.3330535888671875, -0.31821441650390625, -0.303375244140625, -0.28853607177734375, -0.2736968994140625, -0.25885772705078125, -0.2440185546875, -0.22917938232421875, -0.2143402099609375, -0.19950103759765625, -0.184661865234375, -0.16982269287109375, -0.1549835205078125, -0.14014434814453125, -0.12530517578125, -0.11046600341796875, -0.0956268310546875, -0.08078765869140625, -0.065948486328125, -0.05110931396484375, -0.0362701416015625, -0.02143096923828125, -0.006591796875, 0.00824737548828125, 0.0230865478515625, 0.03792572021484375, 0.052764892578125, 0.06760406494140625, 0.0824432373046875, 0.09728240966796875, 0.11212158203125, 0.12696075439453125, 0.1417999267578125, 0.15663909912109375, 0.171478271484375, 0.18631744384765625, 0.2011566162109375, 0.21599578857421875, 0.2308349609375, 0.24567413330078125, 0.2605133056640625, 0.27535247802734375, 0.290191650390625, 0.30503082275390625, 0.3198699951171875, 0.33470916748046875, 0.34954833984375, 0.36438751220703125, 0.3792266845703125, 0.39406585693359375, 0.408905029296875, 0.42374420166015625, 0.4385833740234375, 0.45342254638671875, 0.46826171875]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 5.0, 8.0, 11.0, 16.0, 9.0, 24.0, 14.0, 17.0, 15.0, 13.0, 28.0, 28.0, 24.0, 27.0, 42.0, 22.0, 48.0, 42.0, 34.0, 42.0, 44.0, 35.0, 36.0, 44.0, 36.0, 42.0, 40.0, 31.0, 24.0, 25.0, 27.0, 20.0, 20.0, 12.0, 15.0, 13.0, 15.0, 17.0, 6.0, 6.0, 6.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.0006718635559082031, -0.0006514489650726318, -0.0006310343742370605, -0.0006106197834014893, -0.000590205192565918, -0.0005697906017303467, -0.0005493760108947754, -0.0005289614200592041, -0.0005085468292236328, -0.0004881322383880615, -0.00046771764755249023, -0.00044730305671691895, -0.00042688846588134766, -0.00040647387504577637, -0.0003860592842102051, -0.0003656446933746338, -0.0003452301025390625, -0.0003248155117034912, -0.0003044009208679199, -0.00028398633003234863, -0.00026357173919677734, -0.00024315714836120605, -0.00022274255752563477, -0.00020232796669006348, -0.0001819133758544922, -0.0001614987850189209, -0.0001410841941833496, -0.00012066960334777832, -0.00010025501251220703, -7.984042167663574e-05, -5.942583084106445e-05, -3.9011240005493164e-05, -1.8596649169921875e-05, 1.817941665649414e-06, 2.2232532501220703e-05, 4.264712333679199e-05, 6.306171417236328e-05, 8.347630500793457e-05, 0.00010389089584350586, 0.00012430548667907715, 0.00014472007751464844, 0.00016513466835021973, 0.00018554925918579102, 0.0002059638500213623, 0.0002263784408569336, 0.0002467930316925049, 0.00026720762252807617, 0.00028762221336364746, 0.00030803680419921875, 0.00032845139503479004, 0.00034886598587036133, 0.0003692805767059326, 0.0003896951675415039, 0.0004101097583770752, 0.0004305243492126465, 0.0004509389400482178, 0.00047135353088378906, 0.0004917681217193604, 0.0005121827125549316, 0.0005325973033905029, 0.0005530118942260742, 0.0005734264850616455, 0.0005938410758972168, 0.0006142556667327881, 0.0006346702575683594]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 7.0, 8.0, 5.0, 13.0, 9.0, 16.0, 8.0, 26.0, 13.0, 33.0, 26.0, 40.0, 39.0, 50.0, 68.0, 73.0, 85.0, 146.0, 322.0, 792.0, 3307.0, 961850.0, 79201.0, 1277.0, 420.0, 175.0, 111.0, 69.0, 65.0, 52.0, 44.0, 32.0, 30.0, 26.0, 19.0, 12.0, 13.0, 17.0, 17.0, 9.0, 7.0, 5.0, 2.0, 1.0, 1.0, 4.0, 1.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.01458740234375, -0.014112710952758789, -0.013638019561767578, -0.013163328170776367, -0.012688636779785156, -0.012213945388793945, -0.011739253997802734, -0.011264562606811523, -0.010789871215820312, -0.010315179824829102, -0.00984048843383789, -0.00936579704284668, -0.008891105651855469, -0.008416414260864258, -0.007941722869873047, -0.007467031478881836, -0.006992340087890625, -0.006517648696899414, -0.006042957305908203, -0.005568265914916992, -0.005093574523925781, -0.00461888313293457, -0.004144191741943359, -0.0036695003509521484, -0.0031948089599609375, -0.0027201175689697266, -0.0022454261779785156, -0.0017707347869873047, -0.0012960433959960938, -0.0008213520050048828, -0.0003466606140136719, 0.00012803077697753906, 0.00060272216796875, 0.001077413558959961, 0.0015521049499511719, 0.002026796340942383, 0.0025014877319335938, 0.0029761791229248047, 0.0034508705139160156, 0.0039255619049072266, 0.0044002532958984375, 0.0048749446868896484, 0.005349636077880859, 0.00582432746887207, 0.006299018859863281, 0.006773710250854492, 0.007248401641845703, 0.007723093032836914, 0.008197784423828125, 0.008672475814819336, 0.009147167205810547, 0.009621858596801758, 0.010096549987792969, 0.01057124137878418, 0.01104593276977539, 0.011520624160766602, 0.011995315551757812, 0.012470006942749023, 0.012944698333740234, 0.013419389724731445, 0.013894081115722656, 0.014368772506713867, 0.014843463897705078, 0.015318155288696289, 0.0157928466796875]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 7.0, 21.0, 72.0, 188.0, 283.0, 258.0, 122.0, 42.0, 12.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0020624916069209576, -0.002022620989009738, -0.0019827503710985184, -0.0019428798696026206, -0.001903009251691401, -0.0018631387501955032, -0.0018232681322842836, -0.001783397514373064, -0.0017435270128771663, -0.0017036563949659467, -0.001663785893470049, -0.0016239152755588293, -0.0015840446576476097, -0.001544174156151712, -0.0015043035382404923, -0.0014644330367445946, -0.001424562418833375, -0.0013846918009221554, -0.0013448212994262576, -0.001304950681515038, -0.0012650800636038184, -0.0012252095621079206, -0.001185338944196701, -0.0011454683262854815, -0.0011055977083742619, -0.0010657270904630423, -0.0010258565889671445, -0.000985985971055925, -0.0009461154113523662, -0.0009062448516488075, -0.0008663742337375879, -0.0008265036740340292, -0.0007866330561228096, -0.000746762496419251, -0.0007068918785080314, -0.0006670213188044727, -0.000627150759100914, -0.0005872801411896944, -0.0005474095814861357, -0.000507539021782577, -0.0004676684329751879, -0.00042779784416779876, -0.0003879272844642401, -0.00034805669565685093, -0.0003081861068494618, -0.0002683155471459031, -0.00022844495833851397, -0.0001885743986349553, -0.00014870380982756615, -0.00010883323557209224, -6.896265404066071e-05, -2.9092072509229183e-05, 1.0778501746244729e-05, 5.064907600171864e-05, 9.051966480910778e-05, 0.00013039022451266646, 0.0001702608133200556, 0.00021013138757552952, 0.00025000196183100343, 0.00028987255063839257, 0.0003297431394457817, 0.0003696136991493404, 0.00040948428795672953, 0.0004493548476602882, 0.0004892254364676774]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 3.0, 7.0, 5.0, 6.0, 9.0, 18.0, 15.0, 18.0, 21.0, 21.0, 27.0, 28.0, 28.0, 44.0, 34.0, 30.0, 56.0, 41.0, 32.0, 41.0, 47.0, 36.0, 38.0, 54.0, 36.0, 41.0, 33.0, 35.0, 31.0, 22.0, 24.0, 21.0, 20.0, 18.0, 11.0, 9.0, 8.0, 7.0, 8.0, 7.0, 5.0, 6.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00044918060302734375, -0.00043433625251054764, -0.0004194919019937515, -0.0004046475514769554, -0.0003898032009601593, -0.0003749588504433632, -0.0003601144999265671, -0.00034527014940977097, -0.00033042579889297485, -0.00031558144837617874, -0.00030073709785938263, -0.0002858927473425865, -0.0002710483968257904, -0.0002562040463089943, -0.00024135969579219818, -0.00022651534527540207, -0.00021167099475860596, -0.00019682664424180984, -0.00018198229372501373, -0.00016713794320821762, -0.0001522935926914215, -0.0001374492421746254, -0.00012260489165782928, -0.00010776054114103317, -9.291619062423706e-05, -7.807184010744095e-05, -6.322748959064484e-05, -4.8383139073848724e-05, -3.353878855705261e-05, -1.86944380402565e-05, -3.850087523460388e-06, 1.0994262993335724e-05, 2.5838613510131836e-05, 4.068296402692795e-05, 5.552731454372406e-05, 7.037166506052017e-05, 8.521601557731628e-05, 0.0001000603660941124, 0.00011490471661090851, 0.00012974906712770462, 0.00014459341764450073, 0.00015943776816129684, 0.00017428211867809296, 0.00018912646919488907, 0.00020397081971168518, 0.0002188151702284813, 0.0002336595207452774, 0.0002485038712620735, 0.00026334822177886963, 0.00027819257229566574, 0.00029303692281246185, 0.00030788127332925797, 0.0003227256238460541, 0.0003375699743628502, 0.0003524143248796463, 0.0003672586753964424, 0.0003821030259132385, 0.00039694737643003464, 0.00041179172694683075, 0.00042663607746362686, 0.000441480427980423, 0.0004563247784972191, 0.0004711691290140152, 0.0004860134795308113, 0.0005008578300476074]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 2.0, 5.0, 8.0, 10.0, 12.0, 12.0, 9.0, 16.0, 9.0, 16.0, 24.0, 14.0, 25.0, 29.0, 22.0, 35.0, 31.0, 36.0, 42.0, 43.0, 36.0, 38.0, 33.0, 42.0, 47.0, 40.0, 45.0, 38.0, 36.0, 39.0, 38.0, 36.0, 20.0, 18.0, 23.0, 15.0, 13.0, 9.0, 13.0, 3.0, 5.0, 4.0, 4.0, 0.0, 3.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.875, -4.71319580078125, -4.5513916015625, -4.38958740234375, -4.227783203125, -4.06597900390625, -3.9041748046875, -3.74237060546875, -3.58056640625, -3.41876220703125, -3.2569580078125, -3.09515380859375, -2.933349609375, -2.77154541015625, -2.6097412109375, -2.44793701171875, -2.2861328125, -2.12432861328125, -1.9625244140625, -1.80072021484375, -1.638916015625, -1.47711181640625, -1.3153076171875, -1.15350341796875, -0.99169921875, -0.82989501953125, -0.6680908203125, -0.50628662109375, -0.344482421875, -0.18267822265625, -0.0208740234375, 0.14093017578125, 0.302734375, 0.46453857421875, 0.6263427734375, 0.78814697265625, 0.949951171875, 1.11175537109375, 1.2735595703125, 1.43536376953125, 1.59716796875, 1.75897216796875, 1.9207763671875, 2.08258056640625, 2.244384765625, 2.40618896484375, 2.5679931640625, 2.72979736328125, 2.8916015625, 3.05340576171875, 3.2152099609375, 3.37701416015625, 3.538818359375, 3.70062255859375, 3.8624267578125, 4.02423095703125, 4.18603515625, 4.34783935546875, 4.5096435546875, 4.67144775390625, 4.833251953125, 4.99505615234375, 5.1568603515625, 5.31866455078125, 5.48046875]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 2.0, 5.0, 10.0, 12.0, 17.0, 15.0, 18.0, 25.0, 26.0, 56.0, 65.0, 80.0, 147.0, 183.0, 316.0, 569.0, 1182.0, 2533.0, 6239.0, 18158.0, 68212.0, 333566.0, 480532.0, 98372.0, 23980.0, 7947.0, 3072.0, 1354.0, 677.0, 405.0, 243.0, 160.0, 123.0, 68.0, 60.0, 32.0, 28.0, 23.0, 15.0, 4.0, 6.0, 4.0, 6.0, 0.0, 4.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.75390625, -4.5960693359375, -4.438232421875, -4.2803955078125, -4.12255859375, -3.9647216796875, -3.806884765625, -3.6490478515625, -3.4912109375, -3.3333740234375, -3.175537109375, -3.0177001953125, -2.85986328125, -2.7020263671875, -2.544189453125, -2.3863525390625, -2.228515625, -2.0706787109375, -1.912841796875, -1.7550048828125, -1.59716796875, -1.4393310546875, -1.281494140625, -1.1236572265625, -0.9658203125, -0.8079833984375, -0.650146484375, -0.4923095703125, -0.33447265625, -0.1766357421875, -0.018798828125, 0.1390380859375, 0.296875, 0.4547119140625, 0.612548828125, 0.7703857421875, 0.92822265625, 1.0860595703125, 1.243896484375, 1.4017333984375, 1.5595703125, 1.7174072265625, 1.875244140625, 2.0330810546875, 2.19091796875, 2.3487548828125, 2.506591796875, 2.6644287109375, 2.822265625, 2.9801025390625, 3.137939453125, 3.2957763671875, 3.45361328125, 3.6114501953125, 3.769287109375, 3.9271240234375, 4.0849609375, 4.2427978515625, 4.400634765625, 4.5584716796875, 4.71630859375, 4.8741455078125, 5.031982421875, 5.1898193359375, 5.34765625]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 4.0, 6.0, 8.0, 9.0, 13.0, 13.0, 7.0, 20.0, 14.0, 13.0, 18.0, 31.0, 27.0, 23.0, 22.0, 28.0, 35.0, 33.0, 41.0, 46.0, 62.0, 227.0, 1687.0, 176.0, 58.0, 52.0, 38.0, 50.0, 35.0, 36.0, 28.0, 29.0, 19.0, 25.0, 18.0, 16.0, 11.0, 16.0, 11.0, 5.0, 5.0, 10.0, 8.0, 6.0, 3.0, 5.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-16.265625, -15.7640380859375, -15.262451171875, -14.7608642578125, -14.25927734375, -13.7576904296875, -13.256103515625, -12.7545166015625, -12.2529296875, -11.7513427734375, -11.249755859375, -10.7481689453125, -10.24658203125, -9.7449951171875, -9.243408203125, -8.7418212890625, -8.240234375, -7.7386474609375, -7.237060546875, -6.7354736328125, -6.23388671875, -5.7322998046875, -5.230712890625, -4.7291259765625, -4.2275390625, -3.7259521484375, -3.224365234375, -2.7227783203125, -2.22119140625, -1.7196044921875, -1.218017578125, -0.7164306640625, -0.21484375, 0.2867431640625, 0.788330078125, 1.2899169921875, 1.79150390625, 2.2930908203125, 2.794677734375, 3.2962646484375, 3.7978515625, 4.2994384765625, 4.801025390625, 5.3026123046875, 5.80419921875, 6.3057861328125, 6.807373046875, 7.3089599609375, 7.810546875, 8.3121337890625, 8.813720703125, 9.3153076171875, 9.81689453125, 10.3184814453125, 10.820068359375, 11.3216552734375, 11.8232421875, 12.3248291015625, 12.826416015625, 13.3280029296875, 13.82958984375, 14.3311767578125, 14.832763671875, 15.3343505859375, 15.8359375]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 6.0, 22.0, 53.0, 154.0, 570.0, 263920.0, 2880105.0, 594.0, 165.0, 79.0, 19.0, 12.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-171.875, -166.150390625, -160.42578125, -154.701171875, -148.9765625, -143.251953125, -137.52734375, -131.802734375, -126.078125, -120.353515625, -114.62890625, -108.904296875, -103.1796875, -97.455078125, -91.73046875, -86.005859375, -80.28125, -74.556640625, -68.83203125, -63.107421875, -57.3828125, -51.658203125, -45.93359375, -40.208984375, -34.484375, -28.759765625, -23.03515625, -17.310546875, -11.5859375, -5.861328125, -0.13671875, 5.587890625, 11.3125, 17.037109375, 22.76171875, 28.486328125, 34.2109375, 39.935546875, 45.66015625, 51.384765625, 57.109375, 62.833984375, 68.55859375, 74.283203125, 80.0078125, 85.732421875, 91.45703125, 97.181640625, 102.90625, 108.630859375, 114.35546875, 120.080078125, 125.8046875, 131.529296875, 137.25390625, 142.978515625, 148.703125, 154.427734375, 160.15234375, 165.876953125, 171.6015625, 177.326171875, 183.05078125, 188.775390625, 194.5]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 484.0, 534.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.85443878173828, -52.1862678527832, -43.518096923828125, -34.84992599487305, -26.18175506591797, -17.51358413696289, -8.845413208007812, -0.17724227905273438, 8.490928649902344, 17.159099578857422, 25.8272705078125, 34.49544143676758, 43.163612365722656, 51.831783294677734, 60.49995422363281, 69.16812133789062, 77.83629608154297, 86.50447082519531, 95.17263793945312, 103.84080505371094, 112.50897979736328, 121.17715454101562, 129.84532165527344, 138.51348876953125, 147.18167114257812, 155.84983825683594, 164.51800537109375, 173.18618774414062, 181.85435485839844, 190.52252197265625, 199.19070434570312, 207.85887145996094, 216.52700805664062, 225.19517517089844, 233.86334228515625, 242.53152465820312, 251.19969177246094, 259.86785888671875, 268.5360412597656, 277.2041931152344, 285.87237548828125, 294.5405578613281, 303.2087097167969, 311.87689208984375, 320.5450439453125, 329.2132263183594, 337.88140869140625, 346.549560546875, 355.2177429199219, 363.88592529296875, 372.5540771484375, 381.2222595214844, 389.89044189453125, 398.55859375, 407.2267761230469, 415.8949279785156, 424.5631103515625, 433.2312927246094, 441.8994445800781, 450.567626953125, 459.23577880859375, 467.9039611816406, 476.5721435546875, 485.24029541015625, 493.9084777832031]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 6.0, 3.0, 8.0, 7.0, 13.0, 14.0, 12.0, 17.0, 27.0, 23.0, 25.0, 42.0, 27.0, 29.0, 36.0, 43.0, 34.0, 37.0, 37.0, 33.0, 31.0, 44.0, 32.0, 28.0, 47.0, 34.0, 40.0, 26.0, 29.0, 27.0, 29.0, 24.0, 24.0, 18.0, 16.0, 11.0, 14.0, 7.0, 11.0, 13.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 4.0], "bins": [-48.68928909301758, -47.24296951293945, -45.79664993286133, -44.3503303527832, -42.90401077270508, -41.45769119262695, -40.01137161254883, -38.5650520324707, -37.11873245239258, -35.67241287231445, -34.22609329223633, -32.7797737121582, -31.333454132080078, -29.887134552001953, -28.440814971923828, -26.994495391845703, -25.548175811767578, -24.101856231689453, -22.655536651611328, -21.209217071533203, -19.762897491455078, -18.316577911376953, -16.870258331298828, -15.423938751220703, -13.977619171142578, -12.531299591064453, -11.084980010986328, -9.638660430908203, -8.192340850830078, -6.746021270751953, -5.299701690673828, -3.853382110595703, -2.407062530517578, -0.9607429504394531, 0.4855766296386719, 1.9318962097167969, 3.378215789794922, 4.824535369873047, 6.270854949951172, 7.717174530029297, 9.163494110107422, 10.609813690185547, 12.056133270263672, 13.502452850341797, 14.948772430419922, 16.395092010498047, 17.841411590576172, 19.287731170654297, 20.734050750732422, 22.180370330810547, 23.626689910888672, 25.073009490966797, 26.519329071044922, 27.965648651123047, 29.411968231201172, 30.858287811279297, 32.30460739135742, 33.75092697143555, 35.19724655151367, 36.6435661315918, 38.08988571166992, 39.53620529174805, 40.98252487182617, 42.4288444519043, 43.87516403198242]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 7.0, 5.0, 6.0, 6.0, 13.0, 17.0, 12.0, 12.0, 18.0, 19.0, 13.0, 24.0, 14.0, 26.0, 26.0, 36.0, 36.0, 37.0, 36.0, 34.0, 40.0, 42.0, 36.0, 37.0, 40.0, 41.0, 37.0, 50.0, 31.0, 38.0, 33.0, 30.0, 29.0, 19.0, 12.0, 21.0, 14.0, 18.0, 10.0, 5.0, 3.0, 6.0, 1.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.19921875, -5.03662109375, -4.8740234375, -4.71142578125, -4.548828125, -4.38623046875, -4.2236328125, -4.06103515625, -3.8984375, -3.73583984375, -3.5732421875, -3.41064453125, -3.248046875, -3.08544921875, -2.9228515625, -2.76025390625, -2.59765625, -2.43505859375, -2.2724609375, -2.10986328125, -1.947265625, -1.78466796875, -1.6220703125, -1.45947265625, -1.296875, -1.13427734375, -0.9716796875, -0.80908203125, -0.646484375, -0.48388671875, -0.3212890625, -0.15869140625, 0.00390625, 0.16650390625, 0.3291015625, 0.49169921875, 0.654296875, 0.81689453125, 0.9794921875, 1.14208984375, 1.3046875, 1.46728515625, 1.6298828125, 1.79248046875, 1.955078125, 2.11767578125, 2.2802734375, 2.44287109375, 2.60546875, 2.76806640625, 2.9306640625, 3.09326171875, 3.255859375, 3.41845703125, 3.5810546875, 3.74365234375, 3.90625, 4.06884765625, 4.2314453125, 4.39404296875, 4.556640625, 4.71923828125, 4.8818359375, 5.04443359375, 5.20703125]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 5.0, 2.0, 7.0, 3.0, 7.0, 13.0, 15.0, 14.0, 28.0, 18.0, 37.0, 26.0, 43.0, 41.0, 30.0, 53.0, 80.0, 109.0, 164.0, 275.0, 508.0, 1524.0, 5649.0, 43095.0, 749697.0, 2800776.0, 552203.0, 32381.0, 4732.0, 1307.0, 534.0, 246.0, 162.0, 116.0, 80.0, 68.0, 52.0, 45.0, 39.0, 21.0, 18.0, 15.0, 10.0, 11.0, 6.0, 9.0, 2.0, 2.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-12.9375, -12.5260009765625, -12.114501953125, -11.7030029296875, -11.29150390625, -10.8800048828125, -10.468505859375, -10.0570068359375, -9.6455078125, -9.2340087890625, -8.822509765625, -8.4110107421875, -7.99951171875, -7.5880126953125, -7.176513671875, -6.7650146484375, -6.353515625, -5.9420166015625, -5.530517578125, -5.1190185546875, -4.70751953125, -4.2960205078125, -3.884521484375, -3.4730224609375, -3.0615234375, -2.6500244140625, -2.238525390625, -1.8270263671875, -1.41552734375, -1.0040283203125, -0.592529296875, -0.1810302734375, 0.23046875, 0.6419677734375, 1.053466796875, 1.4649658203125, 1.87646484375, 2.2879638671875, 2.699462890625, 3.1109619140625, 3.5224609375, 3.9339599609375, 4.345458984375, 4.7569580078125, 5.16845703125, 5.5799560546875, 5.991455078125, 6.4029541015625, 6.814453125, 7.2259521484375, 7.637451171875, 8.0489501953125, 8.46044921875, 8.8719482421875, 9.283447265625, 9.6949462890625, 10.1064453125, 10.5179443359375, 10.929443359375, 11.3409423828125, 11.75244140625, 12.1639404296875, 12.575439453125, 12.9869384765625, 13.3984375]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 1.0, 6.0, 5.0, 7.0, 13.0, 10.0, 21.0, 15.0, 22.0, 27.0, 20.0, 37.0, 47.0, 62.0, 96.0, 115.0, 138.0, 171.0, 258.0, 284.0, 353.0, 401.0, 356.0, 353.0, 239.0, 213.0, 177.0, 141.0, 94.0, 88.0, 67.0, 50.0, 42.0, 31.0, 28.0, 25.0, 11.0, 7.0, 11.0, 8.0, 5.0, 7.0, 3.0, 2.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0], "bins": [-9.203125, -8.9393310546875, -8.675537109375, -8.4117431640625, -8.14794921875, -7.8841552734375, -7.620361328125, -7.3565673828125, -7.0927734375, -6.8289794921875, -6.565185546875, -6.3013916015625, -6.03759765625, -5.7738037109375, -5.510009765625, -5.2462158203125, -4.982421875, -4.7186279296875, -4.454833984375, -4.1910400390625, -3.92724609375, -3.6634521484375, -3.399658203125, -3.1358642578125, -2.8720703125, -2.6082763671875, -2.344482421875, -2.0806884765625, -1.81689453125, -1.5531005859375, -1.289306640625, -1.0255126953125, -0.76171875, -0.4979248046875, -0.234130859375, 0.0296630859375, 0.29345703125, 0.5572509765625, 0.821044921875, 1.0848388671875, 1.3486328125, 1.6124267578125, 1.876220703125, 2.1400146484375, 2.40380859375, 2.6676025390625, 2.931396484375, 3.1951904296875, 3.458984375, 3.7227783203125, 3.986572265625, 4.2503662109375, 4.51416015625, 4.7779541015625, 5.041748046875, 5.3055419921875, 5.5693359375, 5.8331298828125, 6.096923828125, 6.3607177734375, 6.62451171875, 6.8883056640625, 7.152099609375, 7.4158935546875, 7.6796875]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 6.0, 3.0, 4.0, 4.0, 6.0, 10.0, 9.0, 15.0, 11.0, 21.0, 26.0, 26.0, 38.0, 56.0, 62.0, 85.0, 93.0, 125.0, 145.0, 168.0, 236.0, 323.0, 439.0, 2563.0, 305794.0, 3861144.0, 20282.0, 863.0, 393.0, 295.0, 234.0, 168.0, 131.0, 113.0, 88.0, 65.0, 47.0, 43.0, 28.0, 30.0, 22.0, 18.0, 12.0, 10.0, 13.0, 10.0, 4.0, 5.0, 2.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.1875, -36.83642578125, -35.4853515625, -34.13427734375, -32.783203125, -31.43212890625, -30.0810546875, -28.72998046875, -27.37890625, -26.02783203125, -24.6767578125, -23.32568359375, -21.974609375, -20.62353515625, -19.2724609375, -17.92138671875, -16.5703125, -15.21923828125, -13.8681640625, -12.51708984375, -11.166015625, -9.81494140625, -8.4638671875, -7.11279296875, -5.76171875, -4.41064453125, -3.0595703125, -1.70849609375, -0.357421875, 0.99365234375, 2.3447265625, 3.69580078125, 5.046875, 6.39794921875, 7.7490234375, 9.10009765625, 10.451171875, 11.80224609375, 13.1533203125, 14.50439453125, 15.85546875, 17.20654296875, 18.5576171875, 19.90869140625, 21.259765625, 22.61083984375, 23.9619140625, 25.31298828125, 26.6640625, 28.01513671875, 29.3662109375, 30.71728515625, 32.068359375, 33.41943359375, 34.7705078125, 36.12158203125, 37.47265625, 38.82373046875, 40.1748046875, 41.52587890625, 42.876953125, 44.22802734375, 45.5791015625, 46.93017578125, 48.28125]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 11.0, 60.0, 259.0, 400.0, 230.0, 49.0, 7.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.05471420288086, -30.37342071533203, -25.692127227783203, -21.010835647583008, -16.32954216003418, -11.648248672485352, -6.966957092285156, -2.285663604736328, 2.3956298828125, 7.07692289352417, 11.75821590423584, 16.43950843811035, 21.12080192565918, 25.802095413208008, 30.483386993408203, 35.16468048095703, 39.84597396850586, 44.52726745605469, 49.208560943603516, 53.889854431152344, 58.571144104003906, 63.25244140625, 67.93373107910156, 72.61502075195312, 77.29631805419922, 81.97760772705078, 86.65890502929688, 91.34019470214844, 96.02149200439453, 100.7027816772461, 105.38407897949219, 110.06536865234375, 114.74665832519531, 119.42794799804688, 124.10924530029297, 128.79054260253906, 133.47183227539062, 138.1531219482422, 142.83441162109375, 147.51571655273438, 152.19700622558594, 156.8782958984375, 161.55958557128906, 166.2408905029297, 170.92218017578125, 175.6034698486328, 180.28475952148438, 184.966064453125, 189.6473388671875, 194.32862854003906, 199.00991821289062, 203.69122314453125, 208.3725128173828, 213.05380249023438, 217.73509216308594, 222.4163818359375, 227.09768676757812, 231.7789764404297, 236.46026611328125, 241.14157104492188, 245.82286071777344, 250.504150390625, 255.18544006347656, 259.8667297363281, 264.54803466796875]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 0.0, 7.0, 9.0, 6.0, 7.0, 5.0, 13.0, 16.0, 11.0, 14.0, 13.0, 26.0, 22.0, 28.0, 21.0, 37.0, 30.0, 38.0, 32.0, 44.0, 38.0, 39.0, 47.0, 50.0, 33.0, 40.0, 37.0, 43.0, 34.0, 25.0, 28.0, 25.0, 25.0, 20.0, 22.0, 23.0, 19.0, 23.0, 11.0, 14.0, 8.0, 4.0, 8.0, 7.0, 4.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.797210693359375, -31.757232666015625, -30.717254638671875, -29.677276611328125, -28.637298583984375, -27.597320556640625, -26.557342529296875, -25.517364501953125, -24.477386474609375, -23.437408447265625, -22.397430419921875, -21.357452392578125, -20.317474365234375, -19.277496337890625, -18.237518310546875, -17.197540283203125, -16.157560348510742, -15.117582321166992, -14.077604293823242, -13.037626266479492, -11.997648239135742, -10.957670211791992, -9.917691230773926, -8.877713203430176, -7.837735176086426, -6.797757148742676, -5.757779121398926, -4.717800617218018, -3.6778225898742676, -2.6378445625305176, -1.5978660583496094, -0.5578880310058594, 0.4820899963378906, 1.5220681428909302, 2.5620462894439697, 3.602024555206299, 4.642002582550049, 5.681980609893799, 6.721959114074707, 7.761937141418457, 8.801915168762207, 9.841893196105957, 10.881871223449707, 11.921850204467773, 12.961828231811523, 14.001806259155273, 15.041784286499023, 16.081762313842773, 17.121740341186523, 18.161718368530273, 19.201696395874023, 20.241674423217773, 21.281652450561523, 22.321630477905273, 23.361610412597656, 24.401588439941406, 25.441566467285156, 26.481544494628906, 27.521522521972656, 28.561500549316406, 29.601478576660156, 30.641456604003906, 31.681434631347656, 32.721412658691406, 33.761390686035156]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 4.0, 13.0, 9.0, 8.0, 14.0, 12.0, 12.0, 8.0, 14.0, 26.0, 15.0, 21.0, 15.0, 33.0, 34.0, 37.0, 36.0, 45.0, 47.0, 35.0, 41.0, 49.0, 33.0, 41.0, 40.0, 40.0, 33.0, 36.0, 38.0, 37.0, 23.0, 27.0, 28.0, 17.0, 21.0, 18.0, 5.0, 6.0, 7.0, 5.0, 5.0, 5.0, 4.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-5.6484375, -5.48272705078125, -5.3170166015625, -5.15130615234375, -4.985595703125, -4.81988525390625, -4.6541748046875, -4.48846435546875, -4.32275390625, -4.15704345703125, -3.9913330078125, -3.82562255859375, -3.659912109375, -3.49420166015625, -3.3284912109375, -3.16278076171875, -2.9970703125, -2.83135986328125, -2.6656494140625, -2.49993896484375, -2.334228515625, -2.16851806640625, -2.0028076171875, -1.83709716796875, -1.67138671875, -1.50567626953125, -1.3399658203125, -1.17425537109375, -1.008544921875, -0.84283447265625, -0.6771240234375, -0.51141357421875, -0.345703125, -0.17999267578125, -0.0142822265625, 0.15142822265625, 0.317138671875, 0.48284912109375, 0.6485595703125, 0.81427001953125, 0.97998046875, 1.14569091796875, 1.3114013671875, 1.47711181640625, 1.642822265625, 1.80853271484375, 1.9742431640625, 2.13995361328125, 2.3056640625, 2.47137451171875, 2.6370849609375, 2.80279541015625, 2.968505859375, 3.13421630859375, 3.2999267578125, 3.46563720703125, 3.63134765625, 3.79705810546875, 3.9627685546875, 4.12847900390625, 4.294189453125, 4.45989990234375, 4.6256103515625, 4.79132080078125, 4.95703125]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 6.0, 10.0, 14.0, 16.0, 19.0, 38.0, 61.0, 84.0, 112.0, 191.0, 251.0, 368.0, 558.0, 859.0, 1273.0, 1948.0, 2873.0, 4478.0, 6876.0, 10861.0, 16850.0, 27406.0, 44680.0, 74698.0, 126577.0, 187535.0, 194697.0, 135576.0, 80929.0, 48173.0, 29217.0, 18432.0, 11578.0, 7342.0, 4730.0, 3078.0, 2091.0, 1318.0, 919.0, 609.0, 413.0, 267.0, 189.0, 108.0, 83.0, 44.0, 47.0, 26.0, 21.0, 10.0, 11.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.48046875, -0.4644927978515625, -0.448516845703125, -0.4325408935546875, -0.41656494140625, -0.4005889892578125, -0.384613037109375, -0.3686370849609375, -0.3526611328125, -0.3366851806640625, -0.320709228515625, -0.3047332763671875, -0.28875732421875, -0.2727813720703125, -0.256805419921875, -0.2408294677734375, -0.224853515625, -0.2088775634765625, -0.192901611328125, -0.1769256591796875, -0.16094970703125, -0.1449737548828125, -0.128997802734375, -0.1130218505859375, -0.0970458984375, -0.0810699462890625, -0.065093994140625, -0.0491180419921875, -0.03314208984375, -0.0171661376953125, -0.001190185546875, 0.0147857666015625, 0.03076171875, 0.0467376708984375, 0.062713623046875, 0.0786895751953125, 0.09466552734375, 0.1106414794921875, 0.126617431640625, 0.1425933837890625, 0.1585693359375, 0.1745452880859375, 0.190521240234375, 0.2064971923828125, 0.22247314453125, 0.2384490966796875, 0.254425048828125, 0.2704010009765625, 0.286376953125, 0.3023529052734375, 0.318328857421875, 0.3343048095703125, 0.35028076171875, 0.3662567138671875, 0.382232666015625, 0.3982086181640625, 0.4141845703125, 0.4301605224609375, 0.446136474609375, 0.4621124267578125, 0.47808837890625, 0.4940643310546875, 0.510040283203125, 0.5260162353515625, 0.5419921875]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 4.0, 2.0, 8.0, 8.0, 13.0, 11.0, 17.0, 16.0, 24.0, 23.0, 22.0, 33.0, 23.0, 25.0, 42.0, 39.0, 47.0, 48.0, 35.0, 42.0, 1054.0, 41.0, 54.0, 40.0, 33.0, 45.0, 21.0, 36.0, 22.0, 39.0, 29.0, 27.0, 15.0, 11.0, 24.0, 16.0, 5.0, 9.0, 4.0, 10.0, 6.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.126953125, -3.018341064453125, -2.90972900390625, -2.801116943359375, -2.6925048828125, -2.583892822265625, -2.47528076171875, -2.366668701171875, -2.258056640625, -2.149444580078125, -2.04083251953125, -1.932220458984375, -1.8236083984375, -1.714996337890625, -1.60638427734375, -1.497772216796875, -1.38916015625, -1.280548095703125, -1.17193603515625, -1.063323974609375, -0.9547119140625, -0.846099853515625, -0.73748779296875, -0.628875732421875, -0.520263671875, -0.411651611328125, -0.30303955078125, -0.194427490234375, -0.0858154296875, 0.022796630859375, 0.13140869140625, 0.240020751953125, 0.3486328125, 0.457244873046875, 0.56585693359375, 0.674468994140625, 0.7830810546875, 0.891693115234375, 1.00030517578125, 1.108917236328125, 1.217529296875, 1.326141357421875, 1.43475341796875, 1.543365478515625, 1.6519775390625, 1.760589599609375, 1.86920166015625, 1.977813720703125, 2.08642578125, 2.195037841796875, 2.30364990234375, 2.412261962890625, 2.5208740234375, 2.629486083984375, 2.73809814453125, 2.846710205078125, 2.955322265625, 3.063934326171875, 3.17254638671875, 3.281158447265625, 3.3897705078125, 3.498382568359375, 3.60699462890625, 3.715606689453125, 3.82421875]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 12.0, 9.0, 18.0, 23.0, 33.0, 64.0, 80.0, 124.0, 174.0, 239.0, 422.0, 633.0, 928.0, 1443.0, 2195.0, 3484.0, 5561.0, 8938.0, 14599.0, 24563.0, 41903.0, 71903.0, 121096.0, 185024.0, 1250517.0, 145494.0, 88357.0, 51742.0, 30206.0, 17871.0, 10991.0, 6590.0, 4274.0, 2603.0, 1766.0, 1118.0, 711.0, 486.0, 308.0, 193.0, 158.0, 91.0, 52.0, 46.0, 24.0, 22.0, 18.0, 12.0, 6.0, 5.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.486083984375, -0.4705009460449219, -0.45491790771484375, -0.4393348693847656, -0.4237518310546875, -0.4081687927246094, -0.39258575439453125, -0.3770027160644531, -0.361419677734375, -0.3458366394042969, -0.33025360107421875, -0.3146705627441406, -0.2990875244140625, -0.2835044860839844, -0.26792144775390625, -0.2523384094238281, -0.23675537109375, -0.22117233276367188, -0.20558929443359375, -0.19000625610351562, -0.1744232177734375, -0.15884017944335938, -0.14325714111328125, -0.12767410278320312, -0.112091064453125, -0.09650802612304688, -0.08092498779296875, -0.06534194946289062, -0.0497589111328125, -0.034175872802734375, -0.01859283447265625, -0.003009796142578125, 0.0125732421875, 0.028156280517578125, 0.04373931884765625, 0.059322357177734375, 0.0749053955078125, 0.09048843383789062, 0.10607147216796875, 0.12165451049804688, 0.137237548828125, 0.15282058715820312, 0.16840362548828125, 0.18398666381835938, 0.1995697021484375, 0.21515274047851562, 0.23073577880859375, 0.24631881713867188, 0.26190185546875, 0.2774848937988281, 0.29306793212890625, 0.3086509704589844, 0.3242340087890625, 0.3398170471191406, 0.35540008544921875, 0.3709831237792969, 0.386566162109375, 0.4021492004394531, 0.41773223876953125, 0.4333152770996094, 0.4488983154296875, 0.4644813537597656, 0.48006439208984375, 0.4956474304199219, 0.51123046875]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 1.0, 2.0, 2.0, 4.0, 13.0, 4.0, 9.0, 9.0, 9.0, 12.0, 13.0, 19.0, 23.0, 27.0, 30.0, 24.0, 29.0, 44.0, 36.0, 30.0, 48.0, 51.0, 26.0, 43.0, 45.0, 36.0, 39.0, 50.0, 42.0, 32.0, 38.0, 23.0, 30.0, 23.0, 15.0, 18.0, 23.0, 21.0, 11.0, 12.0, 7.0, 9.0, 7.0, 6.0, 4.0, 2.0, 0.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0007038116455078125, -0.0006829351186752319, -0.0006620585918426514, -0.0006411820650100708, -0.0006203055381774902, -0.0005994290113449097, -0.0005785524845123291, -0.0005576759576797485, -0.000536799430847168, -0.0005159229040145874, -0.0004950463771820068, -0.00047416985034942627, -0.0004532933235168457, -0.00043241679668426514, -0.00041154026985168457, -0.000390663743019104, -0.00036978721618652344, -0.00034891068935394287, -0.0003280341625213623, -0.00030715763568878174, -0.00028628110885620117, -0.0002654045820236206, -0.00024452805519104004, -0.00022365152835845947, -0.0002027750015258789, -0.00018189847469329834, -0.00016102194786071777, -0.0001401454210281372, -0.00011926889419555664, -9.839236736297607e-05, -7.751584053039551e-05, -5.663931369781494e-05, -3.5762786865234375e-05, -1.4886260032653809e-05, 5.990266799926758e-06, 2.6866793632507324e-05, 4.774332046508789e-05, 6.861984729766846e-05, 8.949637413024902e-05, 0.00011037290096282959, 0.00013124942779541016, 0.00015212595462799072, 0.0001730024814605713, 0.00019387900829315186, 0.00021475553512573242, 0.000235632061958313, 0.00025650858879089355, 0.0002773851156234741, 0.0002982616424560547, 0.00031913816928863525, 0.0003400146961212158, 0.0003608912229537964, 0.00038176774978637695, 0.0004026442766189575, 0.0004235208034515381, 0.00044439733028411865, 0.0004652738571166992, 0.0004861503839492798, 0.0005070269107818604, 0.0005279034376144409, 0.0005487799644470215, 0.000569656491279602, 0.0005905330181121826, 0.0006114095449447632, 0.0006322860717773438]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 6.0, 3.0, 9.0, 12.0, 7.0, 10.0, 5.0, 25.0, 21.0, 19.0, 22.0, 35.0, 35.0, 54.0, 60.0, 79.0, 89.0, 116.0, 229.0, 584.0, 1693.0, 559959.0, 482523.0, 1569.0, 527.0, 246.0, 118.0, 103.0, 68.0, 61.0, 46.0, 34.0, 22.0, 34.0, 27.0, 24.0, 13.0, 6.0, 9.0, 13.0, 10.0, 7.0, 6.0, 5.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.01442718505859375, -0.013961553573608398, -0.013495922088623047, -0.013030290603637695, -0.012564659118652344, -0.012099027633666992, -0.01163339614868164, -0.011167764663696289, -0.010702133178710938, -0.010236501693725586, -0.009770870208740234, -0.009305238723754883, -0.008839607238769531, -0.00837397575378418, -0.007908344268798828, -0.0074427127838134766, -0.006977081298828125, -0.0065114498138427734, -0.006045818328857422, -0.00558018684387207, -0.005114555358886719, -0.004648923873901367, -0.004183292388916016, -0.003717660903930664, -0.0032520294189453125, -0.002786397933959961, -0.0023207664489746094, -0.0018551349639892578, -0.0013895034790039062, -0.0009238719940185547, -0.0004582405090332031, 7.3909759521484375e-06, 0.0004730224609375, 0.0009386539459228516, 0.0014042854309082031, 0.0018699169158935547, 0.0023355484008789062, 0.002801179885864258, 0.0032668113708496094, 0.003732442855834961, 0.0041980743408203125, 0.004663705825805664, 0.005129337310791016, 0.005594968795776367, 0.006060600280761719, 0.00652623176574707, 0.006991863250732422, 0.0074574947357177734, 0.007923126220703125, 0.008388757705688477, 0.008854389190673828, 0.00932002067565918, 0.009785652160644531, 0.010251283645629883, 0.010716915130615234, 0.011182546615600586, 0.011648178100585938, 0.012113809585571289, 0.01257944107055664, 0.013045072555541992, 0.013510704040527344, 0.013976335525512695, 0.014441967010498047, 0.014907598495483398, 0.01537322998046875]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 9.0, 7.0, 9.0, 14.0, 20.0, 34.0, 56.0, 61.0, 100.0, 101.0, 115.0, 104.0, 94.0, 96.0, 51.0, 52.0, 37.0, 14.0, 11.0, 6.0, 7.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0005653519183397293, -0.0005511261988431215, -0.0005369004793465137, -0.0005226747016422451, -0.0005084489821456373, -0.0004942232626490295, -0.00047999751404859126, -0.000465771765448153, -0.00045154604595154524, -0.00043732032645493746, -0.0004230945778544992, -0.000408868829254061, -0.0003946431097574532, -0.0003804173902608454, -0.0003661916416604072, -0.00035196589305996895, -0.00033774017356336117, -0.0003235144540667534, -0.00030928870546631515, -0.0002950629568658769, -0.00028083723736926913, -0.00026661151787266135, -0.0002523857692722231, -0.0002381600352237001, -0.0002239343011751771, -0.0002097085671266541, -0.00019548283307813108, -0.00018125709902960807, -0.00016703136498108506, -0.00015280563093256205, -0.00013857989688403904, -0.00012435416283551604, -0.00011012845789082348, -9.590272384230047e-05, -8.167698979377747e-05, -6.745125574525446e-05, -5.322552169673145e-05, -3.899978764820844e-05, -2.477405359968543e-05, -1.0548319551162422e-05, 3.677414497360587e-06, 1.7903148545883596e-05, 3.2128882594406605e-05, 4.6354616642929614e-05, 6.058035069145262e-05, 7.480608473997563e-05, 8.903181878849864e-05, 0.00010325755283702165, 0.00011748328688554466, 0.00013170902093406767, 0.00014593475498259068, 0.00016016048903111368, 0.0001743862230796367, 0.0001886119571281597, 0.0002028376911766827, 0.00021706342522520572, 0.00023128915927372873, 0.00024551490787416697, 0.00025974062737077475, 0.0002739663468673825, 0.00028819209546782076, 0.000302417844068259, 0.0003166435635648668, 0.00033086928306147456, 0.0003450950316619128]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 1.0, 6.0, 8.0, 11.0, 9.0, 5.0, 11.0, 11.0, 19.0, 15.0, 19.0, 24.0, 17.0, 22.0, 23.0, 34.0, 25.0, 39.0, 36.0, 35.0, 36.0, 43.0, 43.0, 35.0, 42.0, 44.0, 46.0, 30.0, 28.0, 39.0, 30.0, 36.0, 22.0, 25.0, 14.0, 16.0, 20.0, 18.0, 14.0, 17.0, 9.0, 14.0, 3.0, 2.0, 8.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004000067710876465, -0.0003871377557516098, -0.0003742687404155731, -0.00036139972507953644, -0.00034853070974349976, -0.0003356616944074631, -0.0003227926790714264, -0.0003099236637353897, -0.00029705464839935303, -0.00028418563306331635, -0.00027131661772727966, -0.000258447602391243, -0.0002455785870552063, -0.00023270957171916962, -0.00021984055638313293, -0.00020697154104709625, -0.00019410252571105957, -0.0001812335103750229, -0.0001683644950389862, -0.00015549547970294952, -0.00014262646436691284, -0.00012975744903087616, -0.00011688843369483948, -0.0001040194183588028, -9.115040302276611e-05, -7.828138768672943e-05, -6.541237235069275e-05, -5.254335701465607e-05, -3.9674341678619385e-05, -2.6805326342582703e-05, -1.393631100654602e-05, -1.0672956705093384e-06, 1.1801719665527344e-05, 2.4670735001564026e-05, 3.753975033760071e-05, 5.040876567363739e-05, 6.327778100967407e-05, 7.614679634571075e-05, 8.901581168174744e-05, 0.00010188482701778412, 0.0001147538423538208, 0.00012762285768985748, 0.00014049187302589417, 0.00015336088836193085, 0.00016622990369796753, 0.0001790989190340042, 0.0001919679343700409, 0.00020483694970607758, 0.00021770596504211426, 0.00023057498037815094, 0.00024344399571418762, 0.0002563130110502243, 0.000269182026386261, 0.00028205104172229767, 0.00029492005705833435, 0.00030778907239437103, 0.0003206580877304077, 0.0003335271030664444, 0.0003463961184024811, 0.00035926513373851776, 0.00037213414907455444, 0.0003850031644105911, 0.0003978721797466278, 0.0004107411950826645, 0.00042361021041870117]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 4.0, 13.0, 9.0, 8.0, 14.0, 12.0, 12.0, 8.0, 14.0, 26.0, 15.0, 21.0, 15.0, 33.0, 34.0, 37.0, 36.0, 45.0, 47.0, 35.0, 41.0, 48.0, 34.0, 41.0, 40.0, 40.0, 33.0, 36.0, 38.0, 37.0, 23.0, 27.0, 28.0, 17.0, 21.0, 18.0, 5.0, 6.0, 7.0, 5.0, 5.0, 5.0, 4.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-5.6484375, -5.48272705078125, -5.3170166015625, -5.15130615234375, -4.985595703125, -4.81988525390625, -4.6541748046875, -4.48846435546875, -4.32275390625, -4.15704345703125, -3.9913330078125, -3.82562255859375, -3.659912109375, -3.49420166015625, -3.3284912109375, -3.16278076171875, -2.9970703125, -2.83135986328125, -2.6656494140625, -2.49993896484375, -2.334228515625, -2.16851806640625, -2.0028076171875, -1.83709716796875, -1.67138671875, -1.50567626953125, -1.3399658203125, -1.17425537109375, -1.008544921875, -0.84283447265625, -0.6771240234375, -0.51141357421875, -0.345703125, -0.17999267578125, -0.0142822265625, 0.15142822265625, 0.317138671875, 0.48284912109375, 0.6485595703125, 0.81427001953125, 0.97998046875, 1.14569091796875, 1.3114013671875, 1.47711181640625, 1.642822265625, 1.80853271484375, 1.9742431640625, 2.13995361328125, 2.3056640625, 2.47137451171875, 2.6370849609375, 2.80279541015625, 2.968505859375, 3.13421630859375, 3.2999267578125, 3.46563720703125, 3.63134765625, 3.79705810546875, 3.9627685546875, 4.12847900390625, 4.294189453125, 4.45989990234375, 4.6256103515625, 4.79132080078125, 4.95703125]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 4.0, 6.0, 12.0, 8.0, 15.0, 17.0, 23.0, 19.0, 25.0, 48.0, 80.0, 135.0, 215.0, 387.0, 715.0, 1444.0, 3205.0, 7331.0, 18776.0, 52372.0, 170212.0, 483277.0, 209400.0, 63085.0, 21987.0, 8513.0, 3645.0, 1678.0, 787.0, 441.0, 233.0, 154.0, 84.0, 58.0, 36.0, 26.0, 26.0, 19.0, 15.0, 8.0, 14.0, 6.0, 5.0, 4.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3125, -4.16162109375, -4.0107421875, -3.85986328125, -3.708984375, -3.55810546875, -3.4072265625, -3.25634765625, -3.10546875, -2.95458984375, -2.8037109375, -2.65283203125, -2.501953125, -2.35107421875, -2.2001953125, -2.04931640625, -1.8984375, -1.74755859375, -1.5966796875, -1.44580078125, -1.294921875, -1.14404296875, -0.9931640625, -0.84228515625, -0.69140625, -0.54052734375, -0.3896484375, -0.23876953125, -0.087890625, 0.06298828125, 0.2138671875, 0.36474609375, 0.515625, 0.66650390625, 0.8173828125, 0.96826171875, 1.119140625, 1.27001953125, 1.4208984375, 1.57177734375, 1.72265625, 1.87353515625, 2.0244140625, 2.17529296875, 2.326171875, 2.47705078125, 2.6279296875, 2.77880859375, 2.9296875, 3.08056640625, 3.2314453125, 3.38232421875, 3.533203125, 3.68408203125, 3.8349609375, 3.98583984375, 4.13671875, 4.28759765625, 4.4384765625, 4.58935546875, 4.740234375, 4.89111328125, 5.0419921875, 5.19287109375, 5.34375]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 2.0, 6.0, 5.0, 4.0, 11.0, 10.0, 12.0, 15.0, 15.0, 17.0, 28.0, 27.0, 18.0, 26.0, 39.0, 46.0, 46.0, 62.0, 73.0, 182.0, 1735.0, 198.0, 82.0, 57.0, 49.0, 37.0, 32.0, 33.0, 29.0, 25.0, 20.0, 18.0, 13.0, 16.0, 18.0, 16.0, 3.0, 3.0, 9.0, 0.0, 2.0, 8.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.8125, -18.19677734375, -17.5810546875, -16.96533203125, -16.349609375, -15.73388671875, -15.1181640625, -14.50244140625, -13.88671875, -13.27099609375, -12.6552734375, -12.03955078125, -11.423828125, -10.80810546875, -10.1923828125, -9.57666015625, -8.9609375, -8.34521484375, -7.7294921875, -7.11376953125, -6.498046875, -5.88232421875, -5.2666015625, -4.65087890625, -4.03515625, -3.41943359375, -2.8037109375, -2.18798828125, -1.572265625, -0.95654296875, -0.3408203125, 0.27490234375, 0.890625, 1.50634765625, 2.1220703125, 2.73779296875, 3.353515625, 3.96923828125, 4.5849609375, 5.20068359375, 5.81640625, 6.43212890625, 7.0478515625, 7.66357421875, 8.279296875, 8.89501953125, 9.5107421875, 10.12646484375, 10.7421875, 11.35791015625, 11.9736328125, 12.58935546875, 13.205078125, 13.82080078125, 14.4365234375, 15.05224609375, 15.66796875, 16.28369140625, 16.8994140625, 17.51513671875, 18.130859375, 18.74658203125, 19.3623046875, 19.97802734375, 20.59375]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 6.0, 1.0, 8.0, 7.0, 5.0, 12.0, 24.0, 21.0, 18.0, 36.0, 43.0, 51.0, 61.0, 104.0, 114.0, 165.0, 203.0, 342.0, 832.0, 13640.0, 3114593.0, 13248.0, 924.0, 378.0, 195.0, 156.0, 116.0, 93.0, 58.0, 46.0, 55.0, 31.0, 23.0, 25.0, 16.0, 22.0, 8.0, 5.0, 5.0, 7.0, 2.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-49.59375, -48.11328125, -46.6328125, -45.15234375, -43.671875, -42.19140625, -40.7109375, -39.23046875, -37.75, -36.26953125, -34.7890625, -33.30859375, -31.828125, -30.34765625, -28.8671875, -27.38671875, -25.90625, -24.42578125, -22.9453125, -21.46484375, -19.984375, -18.50390625, -17.0234375, -15.54296875, -14.0625, -12.58203125, -11.1015625, -9.62109375, -8.140625, -6.66015625, -5.1796875, -3.69921875, -2.21875, -0.73828125, 0.7421875, 2.22265625, 3.703125, 5.18359375, 6.6640625, 8.14453125, 9.625, 11.10546875, 12.5859375, 14.06640625, 15.546875, 17.02734375, 18.5078125, 19.98828125, 21.46875, 22.94921875, 24.4296875, 25.91015625, 27.390625, 28.87109375, 30.3515625, 31.83203125, 33.3125, 34.79296875, 36.2734375, 37.75390625, 39.234375, 40.71484375, 42.1953125, 43.67578125, 45.15625]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [81.0, 938.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.155569076538086, -2.4575119018554688, 7.240545272827148, 16.938602447509766, 26.636659622192383, 36.334716796875, 46.03277587890625, 55.73082733154297, 65.42888641357422, 75.12694549560547, 84.82499694824219, 94.52305603027344, 104.22111511230469, 113.91917419433594, 123.61723327636719, 133.31527709960938, 143.0133514404297, 152.71141052246094, 162.4094696044922, 172.10752868652344, 181.80557250976562, 191.50363159179688, 201.20169067382812, 210.89974975585938, 220.59780883789062, 230.29586791992188, 239.99392700195312, 249.69198608398438, 259.3900451660156, 269.0881042480469, 278.7861633300781, 288.48419189453125, 298.1822509765625, 307.88031005859375, 317.578369140625, 327.27642822265625, 336.9744873046875, 346.67254638671875, 356.37060546875, 366.06866455078125, 375.7667236328125, 385.46478271484375, 395.162841796875, 404.86090087890625, 414.5589599609375, 424.25701904296875, 433.955078125, 443.65313720703125, 453.3511657714844, 463.0492248535156, 472.7472839355469, 482.4453430175781, 492.1434020996094, 501.8414611816406, 511.5395202636719, 521.237548828125, 530.9356079101562, 540.6336669921875, 550.3317260742188, 560.02978515625, 569.7278442382812, 579.4259033203125, 589.1239624023438, 598.822021484375, 608.5200805664062]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 8.0, 7.0, 11.0, 9.0, 10.0, 15.0, 16.0, 19.0, 13.0, 27.0, 29.0, 33.0, 23.0, 28.0, 33.0, 35.0, 40.0, 53.0, 40.0, 40.0, 47.0, 42.0, 48.0, 34.0, 34.0, 39.0, 35.0, 36.0, 29.0, 29.0, 26.0, 14.0, 18.0, 19.0, 16.0, 10.0, 9.0, 10.0, 5.0, 5.0, 0.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-56.240943908691406, -54.67904281616211, -53.11714553833008, -51.55524444580078, -49.99334716796875, -48.43144607543945, -46.86954879760742, -45.307647705078125, -43.745750427246094, -42.1838493347168, -40.621952056884766, -39.06005096435547, -37.49815368652344, -35.93625259399414, -34.37435531616211, -32.81245422363281, -31.25055503845215, -29.688655853271484, -28.12675666809082, -26.564857482910156, -25.002958297729492, -23.441059112548828, -21.87915802001953, -20.3172607421875, -18.755359649658203, -17.19346046447754, -15.631561279296875, -14.069662094116211, -12.507762908935547, -10.945863723754883, -9.383963584899902, -7.822064399719238, -6.260166168212891, -4.698266983032227, -3.1363675594329834, -1.5744681358337402, -0.012568950653076172, 1.549330234527588, 3.11122989654541, 4.673129081726074, 6.235028266906738, 7.796927452087402, 9.358826637268066, 10.920726776123047, 12.482625961303711, 14.044525146484375, 15.606424331665039, 17.168323516845703, 18.730222702026367, 20.29212188720703, 21.854021072387695, 23.41592025756836, 24.977819442749023, 26.539718627929688, 28.101619720458984, 29.663516998291016, 31.225418090820312, 32.78731918334961, 34.34921646118164, 35.91111755371094, 37.47301483154297, 39.034915924072266, 40.5968132019043, 42.158714294433594, 43.720611572265625]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 11.0, 13.0, 5.0, 11.0, 9.0, 5.0, 14.0, 13.0, 17.0, 19.0, 16.0, 19.0, 26.0, 30.0, 33.0, 32.0, 39.0, 35.0, 38.0, 44.0, 43.0, 41.0, 49.0, 44.0, 41.0, 41.0, 26.0, 35.0, 47.0, 33.0, 27.0, 32.0, 23.0, 25.0, 18.0, 11.0, 8.0, 11.0, 7.0, 4.0, 4.0, 0.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.828125, -5.64825439453125, -5.4683837890625, -5.28851318359375, -5.108642578125, -4.92877197265625, -4.7489013671875, -4.56903076171875, -4.38916015625, -4.20928955078125, -4.0294189453125, -3.84954833984375, -3.669677734375, -3.48980712890625, -3.3099365234375, -3.13006591796875, -2.9501953125, -2.77032470703125, -2.5904541015625, -2.41058349609375, -2.230712890625, -2.05084228515625, -1.8709716796875, -1.69110107421875, -1.51123046875, -1.33135986328125, -1.1514892578125, -0.97161865234375, -0.791748046875, -0.61187744140625, -0.4320068359375, -0.25213623046875, -0.072265625, 0.10760498046875, 0.2874755859375, 0.46734619140625, 0.647216796875, 0.82708740234375, 1.0069580078125, 1.18682861328125, 1.36669921875, 1.54656982421875, 1.7264404296875, 1.90631103515625, 2.086181640625, 2.26605224609375, 2.4459228515625, 2.62579345703125, 2.8056640625, 2.98553466796875, 3.1654052734375, 3.34527587890625, 3.525146484375, 3.70501708984375, 3.8848876953125, 4.06475830078125, 4.24462890625, 4.42449951171875, 4.6043701171875, 4.78424072265625, 4.964111328125, 5.14398193359375, 5.3238525390625, 5.50372314453125, 5.68359375]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 4.0, 12.0, 7.0, 6.0, 9.0, 9.0, 12.0, 10.0, 15.0, 18.0, 23.0, 17.0, 26.0, 47.0, 58.0, 77.0, 158.0, 305.0, 866.0, 3585.0, 36785.0, 1591491.0, 2477929.0, 75561.0, 5243.0, 1116.0, 369.0, 137.0, 87.0, 73.0, 47.0, 37.0, 28.0, 23.0, 16.0, 23.0, 8.0, 7.0, 11.0, 7.0, 4.0, 6.0, 4.0, 3.0, 2.0, 1.0, 4.0, 3.0, 0.0, 1.0], "bins": [-20.984375, -20.403076171875, -19.82177734375, -19.240478515625, -18.6591796875, -18.077880859375, -17.49658203125, -16.915283203125, -16.333984375, -15.752685546875, -15.17138671875, -14.590087890625, -14.0087890625, -13.427490234375, -12.84619140625, -12.264892578125, -11.68359375, -11.102294921875, -10.52099609375, -9.939697265625, -9.3583984375, -8.777099609375, -8.19580078125, -7.614501953125, -7.033203125, -6.451904296875, -5.87060546875, -5.289306640625, -4.7080078125, -4.126708984375, -3.54541015625, -2.964111328125, -2.3828125, -1.801513671875, -1.22021484375, -0.638916015625, -0.0576171875, 0.523681640625, 1.10498046875, 1.686279296875, 2.267578125, 2.848876953125, 3.43017578125, 4.011474609375, 4.5927734375, 5.174072265625, 5.75537109375, 6.336669921875, 6.91796875, 7.499267578125, 8.08056640625, 8.661865234375, 9.2431640625, 9.824462890625, 10.40576171875, 10.987060546875, 11.568359375, 12.149658203125, 12.73095703125, 13.312255859375, 13.8935546875, 14.474853515625, 15.05615234375, 15.637451171875, 16.21875]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 6.0, 5.0, 5.0, 16.0, 19.0, 48.0, 53.0, 87.0, 149.0, 229.0, 372.0, 555.0, 637.0, 599.0, 444.0, 293.0, 181.0, 127.0, 81.0, 51.0, 34.0, 27.0, 22.0, 8.0, 17.0, 5.0, 1.0, 2.0, 1.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.921875, -10.4609375, -10.0, -9.5390625, -9.078125, -8.6171875, -8.15625, -7.6953125, -7.234375, -6.7734375, -6.3125, -5.8515625, -5.390625, -4.9296875, -4.46875, -4.0078125, -3.546875, -3.0859375, -2.625, -2.1640625, -1.703125, -1.2421875, -0.78125, -0.3203125, 0.140625, 0.6015625, 1.0625, 1.5234375, 1.984375, 2.4453125, 2.90625, 3.3671875, 3.828125, 4.2890625, 4.75, 5.2109375, 5.671875, 6.1328125, 6.59375, 7.0546875, 7.515625, 7.9765625, 8.4375, 8.8984375, 9.359375, 9.8203125, 10.28125, 10.7421875, 11.203125, 11.6640625, 12.125, 12.5859375, 13.046875, 13.5078125, 13.96875, 14.4296875, 14.890625, 15.3515625, 15.8125, 16.2734375, 16.734375, 17.1953125, 17.65625, 18.1171875, 18.578125]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 5.0, 3.0, 3.0, 10.0, 20.0, 20.0, 39.0, 39.0, 54.0, 102.0, 112.0, 210.0, 239.0, 362.0, 599.0, 4550.0, 4104779.0, 80859.0, 1036.0, 408.0, 280.0, 195.0, 122.0, 78.0, 58.0, 29.0, 30.0, 15.0, 16.0, 8.0, 6.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-88.9375, -86.69775390625, -84.4580078125, -82.21826171875, -79.978515625, -77.73876953125, -75.4990234375, -73.25927734375, -71.01953125, -68.77978515625, -66.5400390625, -64.30029296875, -62.060546875, -59.82080078125, -57.5810546875, -55.34130859375, -53.1015625, -50.86181640625, -48.6220703125, -46.38232421875, -44.142578125, -41.90283203125, -39.6630859375, -37.42333984375, -35.18359375, -32.94384765625, -30.7041015625, -28.46435546875, -26.224609375, -23.98486328125, -21.7451171875, -19.50537109375, -17.265625, -15.02587890625, -12.7861328125, -10.54638671875, -8.306640625, -6.06689453125, -3.8271484375, -1.58740234375, 0.65234375, 2.89208984375, 5.1318359375, 7.37158203125, 9.611328125, 11.85107421875, 14.0908203125, 16.33056640625, 18.5703125, 20.81005859375, 23.0498046875, 25.28955078125, 27.529296875, 29.76904296875, 32.0087890625, 34.24853515625, 36.48828125, 38.72802734375, 40.9677734375, 43.20751953125, 45.447265625, 47.68701171875, 49.9267578125, 52.16650390625, 54.40625]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 45.0, 249.0, 433.0, 236.0, 48.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.79261016845703, -75.8685302734375, -70.94445037841797, -66.02037048339844, -61.096290588378906, -56.172210693359375, -51.24813461303711, -46.32405471801758, -41.39997482299805, -36.475894927978516, -31.551815032958984, -26.627737045288086, -21.703657150268555, -16.779577255249023, -11.855499267578125, -6.931419372558594, -2.0073394775390625, 2.9167399406433105, 7.840819358825684, 12.764898300170898, 17.68897819519043, 22.61305809020996, 27.53713607788086, 32.46121597290039, 37.38529586791992, 42.30937576293945, 47.233455657958984, 52.15753173828125, 57.08161163330078, 62.00569152832031, 66.92977142333984, 71.85385131835938, 76.77792358398438, 81.7020034790039, 86.62608337402344, 91.55016326904297, 96.4742431640625, 101.39832305908203, 106.32240295410156, 111.24647521972656, 116.17056274414062, 121.09464263916016, 126.01872253417969, 130.9427947998047, 135.86688232421875, 140.79095458984375, 145.7150421142578, 150.6391143798828, 155.56320190429688, 160.48727416992188, 165.41136169433594, 170.33543395996094, 175.259521484375, 180.18359375, 185.10768127441406, 190.03175354003906, 194.95582580566406, 199.87989807128906, 204.80398559570312, 209.72805786132812, 214.6521453857422, 219.5762176513672, 224.50030517578125, 229.42437744140625, 234.3484649658203]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 3.0, 3.0, 7.0, 5.0, 6.0, 5.0, 11.0, 7.0, 11.0, 11.0, 17.0, 27.0, 21.0, 29.0, 34.0, 20.0, 31.0, 23.0, 29.0, 36.0, 44.0, 44.0, 34.0, 39.0, 35.0, 41.0, 37.0, 39.0, 40.0, 46.0, 38.0, 37.0, 20.0, 13.0, 23.0, 14.0, 26.0, 18.0, 13.0, 16.0, 8.0, 7.0, 9.0, 4.0, 10.0, 7.0, 3.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0], "bins": [-33.91938781738281, -32.897396087646484, -31.875402450561523, -30.853408813476562, -29.831417083740234, -28.809425354003906, -27.787431716918945, -26.765438079833984, -25.743446350097656, -24.721454620361328, -23.699460983276367, -22.677467346191406, -21.655475616455078, -20.63348388671875, -19.61149024963379, -18.589496612548828, -17.5675048828125, -16.545513153076172, -15.523519515991211, -14.501526832580566, -13.479534149169922, -12.457541465759277, -11.435548782348633, -10.413556098937988, -9.391563415527344, -8.3695707321167, -7.347578048706055, -6.32558536529541, -5.303592681884766, -4.281599998474121, -3.2596073150634766, -2.237614631652832, -1.2156219482421875, -0.19362926483154297, 0.8283634185791016, 1.850356101989746, 2.8723487854003906, 3.894341468811035, 4.91633415222168, 5.938326835632324, 6.960319519042969, 7.982312202453613, 9.004304885864258, 10.026297569274902, 11.048290252685547, 12.070282936096191, 13.092275619506836, 14.11426830291748, 15.136260986328125, 16.158252716064453, 17.180246353149414, 18.202239990234375, 19.224231719970703, 20.24622344970703, 21.268217086791992, 22.290210723876953, 23.31220245361328, 24.33419418334961, 25.35618782043457, 26.37818145751953, 27.40017318725586, 28.422164916992188, 29.44415855407715, 30.46615219116211, 31.488143920898438]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 4.0, 1.0, 5.0, 7.0, 6.0, 7.0, 10.0, 13.0, 8.0, 11.0, 16.0, 10.0, 24.0, 20.0, 27.0, 24.0, 31.0, 22.0, 40.0, 36.0, 51.0, 53.0, 42.0, 40.0, 40.0, 42.0, 43.0, 35.0, 33.0, 33.0, 33.0, 34.0, 33.0, 28.0, 22.0, 21.0, 16.0, 21.0, 23.0, 10.0, 11.0, 3.0, 3.0, 7.0, 4.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.89453125, -5.7261962890625, -5.557861328125, -5.3895263671875, -5.22119140625, -5.0528564453125, -4.884521484375, -4.7161865234375, -4.5478515625, -4.3795166015625, -4.211181640625, -4.0428466796875, -3.87451171875, -3.7061767578125, -3.537841796875, -3.3695068359375, -3.201171875, -3.0328369140625, -2.864501953125, -2.6961669921875, -2.52783203125, -2.3594970703125, -2.191162109375, -2.0228271484375, -1.8544921875, -1.6861572265625, -1.517822265625, -1.3494873046875, -1.18115234375, -1.0128173828125, -0.844482421875, -0.6761474609375, -0.5078125, -0.3394775390625, -0.171142578125, -0.0028076171875, 0.16552734375, 0.3338623046875, 0.502197265625, 0.6705322265625, 0.8388671875, 1.0072021484375, 1.175537109375, 1.3438720703125, 1.51220703125, 1.6805419921875, 1.848876953125, 2.0172119140625, 2.185546875, 2.3538818359375, 2.522216796875, 2.6905517578125, 2.85888671875, 3.0272216796875, 3.195556640625, 3.3638916015625, 3.5322265625, 3.7005615234375, 3.868896484375, 4.0372314453125, 4.20556640625, 4.3739013671875, 4.542236328125, 4.7105712890625, 4.87890625]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 6.0, 2.0, 7.0, 12.0, 16.0, 23.0, 39.0, 50.0, 76.0, 130.0, 199.0, 283.0, 405.0, 623.0, 960.0, 1531.0, 2424.0, 3586.0, 5736.0, 9383.0, 15022.0, 24343.0, 40217.0, 69079.0, 121087.0, 200636.0, 216241.0, 139391.0, 78485.0, 45850.0, 27655.0, 16743.0, 10317.0, 6444.0, 4081.0, 2575.0, 1637.0, 1164.0, 732.0, 484.0, 269.0, 189.0, 151.0, 89.0, 66.0, 49.0, 21.0, 21.0, 15.0, 8.0, 7.0, 7.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.5859375, -0.5676956176757812, -0.5494537353515625, -0.5312118530273438, -0.512969970703125, -0.49472808837890625, -0.4764862060546875, -0.45824432373046875, -0.44000244140625, -0.42176055908203125, -0.4035186767578125, -0.38527679443359375, -0.367034912109375, -0.34879302978515625, -0.3305511474609375, -0.31230926513671875, -0.2940673828125, -0.27582550048828125, -0.2575836181640625, -0.23934173583984375, -0.221099853515625, -0.20285797119140625, -0.1846160888671875, -0.16637420654296875, -0.14813232421875, -0.12989044189453125, -0.1116485595703125, -0.09340667724609375, -0.075164794921875, -0.05692291259765625, -0.0386810302734375, -0.02043914794921875, -0.002197265625, 0.01604461669921875, 0.0342864990234375, 0.05252838134765625, 0.070770263671875, 0.08901214599609375, 0.1072540283203125, 0.12549591064453125, 0.14373779296875, 0.16197967529296875, 0.1802215576171875, 0.19846343994140625, 0.216705322265625, 0.23494720458984375, 0.2531890869140625, 0.27143096923828125, 0.2896728515625, 0.30791473388671875, 0.3261566162109375, 0.34439849853515625, 0.362640380859375, 0.38088226318359375, 0.3991241455078125, 0.41736602783203125, 0.43560791015625, 0.45384979248046875, 0.4720916748046875, 0.49033355712890625, 0.508575439453125, 0.5268173217773438, 0.5450592041015625, 0.5633010864257812, 0.58154296875]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 4.0, 4.0, 4.0, 8.0, 12.0, 7.0, 12.0, 13.0, 20.0, 19.0, 17.0, 28.0, 27.0, 25.0, 35.0, 28.0, 36.0, 40.0, 38.0, 31.0, 40.0, 25.0, 1063.0, 42.0, 44.0, 33.0, 40.0, 33.0, 34.0, 30.0, 26.0, 30.0, 24.0, 25.0, 20.0, 12.0, 18.0, 17.0, 15.0, 6.0, 7.0, 12.0, 4.0, 6.0, 2.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-3.248046875, -3.1468505859375, -3.045654296875, -2.9444580078125, -2.84326171875, -2.7420654296875, -2.640869140625, -2.5396728515625, -2.4384765625, -2.3372802734375, -2.236083984375, -2.1348876953125, -2.03369140625, -1.9324951171875, -1.831298828125, -1.7301025390625, -1.62890625, -1.5277099609375, -1.426513671875, -1.3253173828125, -1.22412109375, -1.1229248046875, -1.021728515625, -0.9205322265625, -0.8193359375, -0.7181396484375, -0.616943359375, -0.5157470703125, -0.41455078125, -0.3133544921875, -0.212158203125, -0.1109619140625, -0.009765625, 0.0914306640625, 0.192626953125, 0.2938232421875, 0.39501953125, 0.4962158203125, 0.597412109375, 0.6986083984375, 0.7998046875, 0.9010009765625, 1.002197265625, 1.1033935546875, 1.20458984375, 1.3057861328125, 1.406982421875, 1.5081787109375, 1.609375, 1.7105712890625, 1.811767578125, 1.9129638671875, 2.01416015625, 2.1153564453125, 2.216552734375, 2.3177490234375, 2.4189453125, 2.5201416015625, 2.621337890625, 2.7225341796875, 2.82373046875, 2.9249267578125, 3.026123046875, 3.1273193359375, 3.228515625]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 2.0, 4.0, 11.0, 9.0, 18.0, 23.0, 26.0, 51.0, 81.0, 121.0, 217.0, 315.0, 481.0, 767.0, 1235.0, 1908.0, 2892.0, 4842.0, 7750.0, 12813.0, 21521.0, 36519.0, 62375.0, 107606.0, 173822.0, 1260170.0, 162675.0, 97938.0, 56980.0, 33286.0, 19756.0, 11762.0, 7239.0, 4324.0, 2836.0, 1756.0, 1077.0, 707.0, 421.0, 287.0, 181.0, 117.0, 90.0, 45.0, 33.0, 19.0, 15.0, 8.0, 1.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.468017578125, -0.4515495300292969, -0.43508148193359375, -0.4186134338378906, -0.4021453857421875, -0.3856773376464844, -0.36920928955078125, -0.3527412414550781, -0.336273193359375, -0.3198051452636719, -0.30333709716796875, -0.2868690490722656, -0.2704010009765625, -0.2539329528808594, -0.23746490478515625, -0.22099685668945312, -0.20452880859375, -0.18806076049804688, -0.17159271240234375, -0.15512466430664062, -0.1386566162109375, -0.12218856811523438, -0.10572052001953125, -0.08925247192382812, -0.072784423828125, -0.056316375732421875, -0.03984832763671875, -0.023380279541015625, -0.0069122314453125, 0.009555816650390625, 0.02602386474609375, 0.042491912841796875, 0.0589599609375, 0.07542800903320312, 0.09189605712890625, 0.10836410522460938, 0.1248321533203125, 0.14130020141601562, 0.15776824951171875, 0.17423629760742188, 0.190704345703125, 0.20717239379882812, 0.22364044189453125, 0.24010848999023438, 0.2565765380859375, 0.2730445861816406, 0.28951263427734375, 0.3059806823730469, 0.32244873046875, 0.3389167785644531, 0.35538482666015625, 0.3718528747558594, 0.3883209228515625, 0.4047889709472656, 0.42125701904296875, 0.4377250671386719, 0.454193115234375, 0.4706611633300781, 0.48712921142578125, 0.5035972595214844, 0.5200653076171875, 0.5365333557128906, 0.5530014038085938, 0.5694694519042969, 0.5859375]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 6.0, 6.0, 6.0, 7.0, 8.0, 18.0, 21.0, 18.0, 26.0, 33.0, 36.0, 44.0, 35.0, 46.0, 61.0, 62.0, 62.0, 56.0, 53.0, 53.0, 61.0, 46.0, 43.0, 41.0, 36.0, 18.0, 22.0, 10.0, 14.0, 13.0, 13.0, 10.0, 11.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008020401000976562, -0.0007718801498413086, -0.0007417201995849609, -0.0007115602493286133, -0.0006814002990722656, -0.000651240348815918, -0.0006210803985595703, -0.0005909204483032227, -0.000560760498046875, -0.0005306005477905273, -0.0005004405975341797, -0.00047028064727783203, -0.0004401206970214844, -0.0004099607467651367, -0.00037980079650878906, -0.0003496408462524414, -0.00031948089599609375, -0.0002893209457397461, -0.00025916099548339844, -0.00022900104522705078, -0.00019884109497070312, -0.00016868114471435547, -0.0001385211944580078, -0.00010836124420166016, -7.82012939453125e-05, -4.8041343688964844e-05, -1.7881393432617188e-05, 1.2278556823730469e-05, 4.2438507080078125e-05, 7.259845733642578e-05, 0.00010275840759277344, 0.0001329183578491211, 0.00016307830810546875, 0.0001932382583618164, 0.00022339820861816406, 0.0002535581588745117, 0.0002837181091308594, 0.00031387805938720703, 0.0003440380096435547, 0.00037419795989990234, 0.00040435791015625, 0.00043451786041259766, 0.0004646778106689453, 0.000494837760925293, 0.0005249977111816406, 0.0005551576614379883, 0.0005853176116943359, 0.0006154775619506836, 0.0006456375122070312, 0.0006757974624633789, 0.0007059574127197266, 0.0007361173629760742, 0.0007662773132324219, 0.0007964372634887695, 0.0008265972137451172, 0.0008567571640014648, 0.0008869171142578125, 0.0009170770645141602, 0.0009472370147705078, 0.0009773969650268555, 0.0010075569152832031, 0.0010377168655395508, 0.0010678768157958984, 0.001098036766052246, 0.0011281967163085938]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 8.0, 10.0, 8.0, 17.0, 12.0, 18.0, 19.0, 20.0, 39.0, 70.0, 81.0, 119.0, 155.0, 501.0, 2367.0, 1040159.0, 3639.0, 603.0, 209.0, 135.0, 87.0, 63.0, 52.0, 27.0, 38.0, 26.0, 21.0, 12.0, 12.0, 9.0, 4.0, 4.0, 7.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.0292205810546875, -0.028462648391723633, -0.027704715728759766, -0.0269467830657959, -0.02618885040283203, -0.025430917739868164, -0.024672985076904297, -0.02391505241394043, -0.023157119750976562, -0.022399187088012695, -0.021641254425048828, -0.02088332176208496, -0.020125389099121094, -0.019367456436157227, -0.01860952377319336, -0.017851591110229492, -0.017093658447265625, -0.016335725784301758, -0.01557779312133789, -0.014819860458374023, -0.014061927795410156, -0.013303995132446289, -0.012546062469482422, -0.011788129806518555, -0.011030197143554688, -0.01027226448059082, -0.009514331817626953, -0.008756399154663086, -0.007998466491699219, -0.0072405338287353516, -0.006482601165771484, -0.005724668502807617, -0.00496673583984375, -0.004208803176879883, -0.0034508705139160156, -0.0026929378509521484, -0.0019350051879882812, -0.001177072525024414, -0.0004191398620605469, 0.0003387928009033203, 0.0010967254638671875, 0.0018546581268310547, 0.002612590789794922, 0.003370523452758789, 0.004128456115722656, 0.0048863887786865234, 0.005644321441650391, 0.006402254104614258, 0.007160186767578125, 0.007918119430541992, 0.00867605209350586, 0.009433984756469727, 0.010191917419433594, 0.010949850082397461, 0.011707782745361328, 0.012465715408325195, 0.013223648071289062, 0.01398158073425293, 0.014739513397216797, 0.015497446060180664, 0.01625537872314453, 0.0170133113861084, 0.017771244049072266, 0.018529176712036133, 0.019287109375]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 109.0, 779.0, 127.0], "bins": [-0.007740622386336327, -0.007616789545863867, -0.007492957171052694, -0.0073691243305802345, -0.007245291955769062, -0.007121459115296602, -0.0069976262748241425, -0.00687379390001297, -0.00674996105954051, -0.00662612821906805, -0.006502295844256878, -0.006378463003784418, -0.006254630628973246, -0.006130797788500786, -0.006006965413689613, -0.0058831325732171535, -0.005759299732744694, -0.005635466892272234, -0.0055116345174610615, -0.005387801676988602, -0.005263969302177429, -0.005140136461704969, -0.00501630362123251, -0.004892471246421337, -0.004768638871610165, -0.004644806031137705, -0.004520973656326532, -0.004397140815854073, -0.0042733084410429, -0.00414947560057044, -0.0040256427600979805, -0.003901810385286808, -0.0037779773119837046, -0.0036541447043418884, -0.0035303120967000723, -0.003406479489058256, -0.0032826466485857964, -0.0031588140409439802, -0.003034981433302164, -0.002911148825660348, -0.002787316218018532, -0.0026634836103767157, -0.0025396510027348995, -0.0024158181622624397, -0.0022919855546206236, -0.0021681529469788074, -0.0020443203393369913, -0.0019204877316951752, -0.0017966548912227154, -0.0016728222835808992, -0.0015489895595237613, -0.0014251569518819451, -0.0013013242278248072, -0.001177491620182991, -0.0010536590125411749, -0.0009298263466916978, -0.0008059936808422208, -0.0006821610149927437, -0.0005583283491432667, -0.00043449574150145054, -0.0003106630756519735, -0.00018683040980249643, -6.29978021606803e-05, 6.083486368879676e-05, 0.0001846675295382738]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 5.0, 7.0, 6.0, 10.0, 5.0, 11.0, 14.0, 11.0, 15.0, 17.0, 20.0, 25.0, 22.0, 27.0, 29.0, 35.0, 28.0, 41.0, 33.0, 47.0, 40.0, 43.0, 50.0, 33.0, 37.0, 52.0, 44.0, 36.0, 29.0, 37.0, 28.0, 29.0, 16.0, 18.0, 19.0, 13.0, 12.0, 12.0, 9.0, 8.0, 7.0, 1.0, 2.0, 5.0, 3.0, 2.0, 5.0, 2.0, 0.0, 4.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.0004610419273376465, -0.00044672563672065735, -0.0004324093461036682, -0.0004180930554866791, -0.00040377676486968994, -0.0003894604742527008, -0.00037514418363571167, -0.00036082789301872253, -0.0003465116024017334, -0.00033219531178474426, -0.0003178790211677551, -0.000303562730550766, -0.00028924643993377686, -0.0002749301493167877, -0.0002606138586997986, -0.00024629756808280945, -0.0002319812774658203, -0.00021766498684883118, -0.00020334869623184204, -0.0001890324056148529, -0.00017471611499786377, -0.00016039982438087463, -0.0001460835337638855, -0.00013176724314689636, -0.00011745095252990723, -0.00010313466191291809, -8.881837129592896e-05, -7.450208067893982e-05, -6.0185790061950684e-05, -4.586949944496155e-05, -3.155320882797241e-05, -1.7236918210983276e-05, -2.9206275939941406e-06, 1.1395663022994995e-05, 2.571195363998413e-05, 4.0028244256973267e-05, 5.43445348739624e-05, 6.866082549095154e-05, 8.297711610794067e-05, 9.729340672492981e-05, 0.00011160969734191895, 0.00012592598795890808, 0.00014024227857589722, 0.00015455856919288635, 0.0001688748598098755, 0.00018319115042686462, 0.00019750744104385376, 0.0002118237316608429, 0.00022614002227783203, 0.00024045631289482117, 0.0002547726035118103, 0.00026908889412879944, 0.0002834051847457886, 0.0002977214753627777, 0.00031203776597976685, 0.000326354056596756, 0.0003406703472137451, 0.00035498663783073425, 0.0003693029284477234, 0.0003836192190647125, 0.00039793550968170166, 0.0004122518002986908, 0.00042656809091567993, 0.00044088438153266907, 0.0004552006721496582]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 4.0, 1.0, 5.0, 7.0, 6.0, 7.0, 10.0, 13.0, 8.0, 11.0, 16.0, 10.0, 24.0, 20.0, 27.0, 24.0, 31.0, 22.0, 40.0, 36.0, 51.0, 53.0, 42.0, 40.0, 40.0, 42.0, 43.0, 35.0, 33.0, 33.0, 33.0, 34.0, 33.0, 28.0, 22.0, 21.0, 16.0, 21.0, 23.0, 10.0, 11.0, 3.0, 3.0, 7.0, 4.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.89453125, -5.7261962890625, -5.557861328125, -5.3895263671875, -5.22119140625, -5.0528564453125, -4.884521484375, -4.7161865234375, -4.5478515625, -4.3795166015625, -4.211181640625, -4.0428466796875, -3.87451171875, -3.7061767578125, -3.537841796875, -3.3695068359375, -3.201171875, -3.0328369140625, -2.864501953125, -2.6961669921875, -2.52783203125, -2.3594970703125, -2.191162109375, -2.0228271484375, -1.8544921875, -1.6861572265625, -1.517822265625, -1.3494873046875, -1.18115234375, -1.0128173828125, -0.844482421875, -0.6761474609375, -0.5078125, -0.3394775390625, -0.171142578125, -0.0028076171875, 0.16552734375, 0.3338623046875, 0.502197265625, 0.6705322265625, 0.8388671875, 1.0072021484375, 1.175537109375, 1.3438720703125, 1.51220703125, 1.6805419921875, 1.848876953125, 2.0172119140625, 2.185546875, 2.3538818359375, 2.522216796875, 2.6905517578125, 2.85888671875, 3.0272216796875, 3.195556640625, 3.3638916015625, 3.5322265625, 3.7005615234375, 3.868896484375, 4.0372314453125, 4.20556640625, 4.3739013671875, 4.542236328125, 4.7105712890625, 4.87890625]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 2.0, 11.0, 10.0, 5.0, 17.0, 15.0, 23.0, 16.0, 30.0, 42.0, 69.0, 60.0, 77.0, 116.0, 206.0, 299.0, 519.0, 1263.0, 3777.0, 13452.0, 50913.0, 209760.0, 542712.0, 167584.0, 40974.0, 10923.0, 3164.0, 1066.0, 453.0, 299.0, 172.0, 138.0, 103.0, 83.0, 44.0, 40.0, 34.0, 26.0, 22.0, 14.0, 5.0, 5.0, 8.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.671875, -6.4835205078125, -6.295166015625, -6.1068115234375, -5.91845703125, -5.7301025390625, -5.541748046875, -5.3533935546875, -5.1650390625, -4.9766845703125, -4.788330078125, -4.5999755859375, -4.41162109375, -4.2232666015625, -4.034912109375, -3.8465576171875, -3.658203125, -3.4698486328125, -3.281494140625, -3.0931396484375, -2.90478515625, -2.7164306640625, -2.528076171875, -2.3397216796875, -2.1513671875, -1.9630126953125, -1.774658203125, -1.5863037109375, -1.39794921875, -1.2095947265625, -1.021240234375, -0.8328857421875, -0.64453125, -0.4561767578125, -0.267822265625, -0.0794677734375, 0.10888671875, 0.2972412109375, 0.485595703125, 0.6739501953125, 0.8623046875, 1.0506591796875, 1.239013671875, 1.4273681640625, 1.61572265625, 1.8040771484375, 1.992431640625, 2.1807861328125, 2.369140625, 2.5574951171875, 2.745849609375, 2.9342041015625, 3.12255859375, 3.3109130859375, 3.499267578125, 3.6876220703125, 3.8759765625, 4.0643310546875, 4.252685546875, 4.4410400390625, 4.62939453125, 4.8177490234375, 5.006103515625, 5.1944580078125, 5.3828125]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 8.0, 3.0, 5.0, 6.0, 7.0, 8.0, 10.0, 15.0, 11.0, 18.0, 18.0, 29.0, 31.0, 29.0, 37.0, 48.0, 38.0, 51.0, 58.0, 89.0, 1562.0, 439.0, 92.0, 47.0, 45.0, 47.0, 52.0, 38.0, 33.0, 24.0, 21.0, 24.0, 21.0, 16.0, 14.0, 8.0, 13.0, 9.0, 7.0, 7.0, 6.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0], "bins": [-19.125, -18.56201171875, -17.9990234375, -17.43603515625, -16.873046875, -16.31005859375, -15.7470703125, -15.18408203125, -14.62109375, -14.05810546875, -13.4951171875, -12.93212890625, -12.369140625, -11.80615234375, -11.2431640625, -10.68017578125, -10.1171875, -9.55419921875, -8.9912109375, -8.42822265625, -7.865234375, -7.30224609375, -6.7392578125, -6.17626953125, -5.61328125, -5.05029296875, -4.4873046875, -3.92431640625, -3.361328125, -2.79833984375, -2.2353515625, -1.67236328125, -1.109375, -0.54638671875, 0.0166015625, 0.57958984375, 1.142578125, 1.70556640625, 2.2685546875, 2.83154296875, 3.39453125, 3.95751953125, 4.5205078125, 5.08349609375, 5.646484375, 6.20947265625, 6.7724609375, 7.33544921875, 7.8984375, 8.46142578125, 9.0244140625, 9.58740234375, 10.150390625, 10.71337890625, 11.2763671875, 11.83935546875, 12.40234375, 12.96533203125, 13.5283203125, 14.09130859375, 14.654296875, 15.21728515625, 15.7802734375, 16.34326171875, 16.90625]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 2.0, 8.0, 5.0, 5.0, 15.0, 18.0, 28.0, 23.0, 30.0, 45.0, 63.0, 83.0, 141.0, 172.0, 289.0, 484.0, 1492.0, 377140.0, 2761962.0, 2174.0, 578.0, 312.0, 180.0, 118.0, 87.0, 75.0, 41.0, 32.0, 24.0, 18.0, 14.0, 14.0, 10.0, 2.0, 7.0, 3.0, 2.0, 3.0, 1.0, 3.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-48.78125, -47.21142578125, -45.6416015625, -44.07177734375, -42.501953125, -40.93212890625, -39.3623046875, -37.79248046875, -36.22265625, -34.65283203125, -33.0830078125, -31.51318359375, -29.943359375, -28.37353515625, -26.8037109375, -25.23388671875, -23.6640625, -22.09423828125, -20.5244140625, -18.95458984375, -17.384765625, -15.81494140625, -14.2451171875, -12.67529296875, -11.10546875, -9.53564453125, -7.9658203125, -6.39599609375, -4.826171875, -3.25634765625, -1.6865234375, -0.11669921875, 1.453125, 3.02294921875, 4.5927734375, 6.16259765625, 7.732421875, 9.30224609375, 10.8720703125, 12.44189453125, 14.01171875, 15.58154296875, 17.1513671875, 18.72119140625, 20.291015625, 21.86083984375, 23.4306640625, 25.00048828125, 26.5703125, 28.14013671875, 29.7099609375, 31.27978515625, 32.849609375, 34.41943359375, 35.9892578125, 37.55908203125, 39.12890625, 40.69873046875, 42.2685546875, 43.83837890625, 45.408203125, 46.97802734375, 48.5478515625, 50.11767578125, 51.6875]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 36.0, 152.0, 283.0, 314.0, 162.0, 53.0, 9.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.847450256347656, -52.70371627807617, -51.55998611450195, -50.41625213623047, -49.27252197265625, -48.128787994384766, -46.98505401611328, -45.84132385253906, -44.69758987426758, -43.553855895996094, -42.410125732421875, -41.26639175415039, -40.12266159057617, -38.97892761230469, -37.83519744873047, -36.691463470458984, -35.5477294921875, -34.403995513916016, -33.2602653503418, -32.11653137207031, -30.97279930114746, -29.82906723022461, -28.685335159301758, -27.541603088378906, -26.397872924804688, -25.254140853881836, -24.110408782958984, -22.9666748046875, -21.82294273376465, -20.679210662841797, -19.535478591918945, -18.391746520996094, -17.248014450073242, -16.10428237915039, -14.960549354553223, -13.816817283630371, -12.673084259033203, -11.529352188110352, -10.3856201171875, -9.241887092590332, -8.09815502166748, -6.954422473907471, -5.810689926147461, -4.666957855224609, -3.5232253074645996, -2.37949275970459, -1.2357606887817383, -0.09202766418457031, 1.0517044067382812, 2.195436954498291, 3.3391692638397217, 4.482901573181152, 5.626634120941162, 6.770366668701172, 7.914098739624023, 9.057831764221191, 10.201563835144043, 11.345295906066895, 12.489028930664062, 13.632761001586914, 14.776493072509766, 15.920226097106934, 17.06395721435547, 18.207691192626953, 19.351423263549805]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 5.0, 5.0, 8.0, 12.0, 17.0, 13.0, 19.0, 19.0, 22.0, 18.0, 24.0, 33.0, 20.0, 36.0, 34.0, 38.0, 30.0, 46.0, 31.0, 45.0, 39.0, 26.0, 39.0, 48.0, 28.0, 41.0, 32.0, 22.0, 36.0, 34.0, 29.0, 21.0, 23.0, 16.0, 15.0, 17.0, 14.0, 12.0, 5.0, 7.0, 6.0, 9.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.56498718261719, -41.25544738769531, -39.94590759277344, -38.63636779785156, -37.32682800292969, -36.01728820800781, -34.70774841308594, -33.39820861816406, -32.08866882324219, -30.779129028320312, -29.469589233398438, -28.160049438476562, -26.850509643554688, -25.540969848632812, -24.231428146362305, -22.92188835144043, -21.612346649169922, -20.302806854248047, -18.993267059326172, -17.683727264404297, -16.374187469482422, -15.06464672088623, -13.755105972290039, -12.445566177368164, -11.136026382446289, -9.826486587524414, -8.516946792602539, -7.207406044006348, -5.897866249084473, -4.588326454162598, -3.2787861824035645, -1.9692459106445312, -0.6597061157226562, 0.6498339176177979, 1.959373950958252, 3.268913984298706, 4.57845401763916, 5.887993812561035, 7.197534084320068, 8.507074356079102, 9.816614151000977, 11.126153945922852, 12.435693740844727, 13.745234489440918, 15.054774284362793, 16.364315032958984, 17.67385482788086, 18.983394622802734, 20.29293441772461, 21.602474212646484, 22.91201400756836, 24.221553802490234, 25.53109359741211, 26.840633392333984, 28.150175094604492, 29.459714889526367, 30.769254684448242, 32.07879638671875, 33.388336181640625, 34.6978759765625, 36.007415771484375, 37.31695556640625, 38.626495361328125, 39.93603515625, 41.245574951171875]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 6.0, 6.0, 7.0, 11.0, 4.0, 15.0, 8.0, 17.0, 13.0, 17.0, 16.0, 23.0, 27.0, 25.0, 30.0, 30.0, 39.0, 52.0, 52.0, 37.0, 47.0, 47.0, 37.0, 49.0, 38.0, 35.0, 28.0, 25.0, 33.0, 27.0, 36.0, 33.0, 22.0, 19.0, 22.0, 14.0, 15.0, 10.0, 10.0, 7.0, 3.0, 2.0, 4.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.12890625, -5.951171875, -5.7734375, -5.595703125, -5.41796875, -5.240234375, -5.0625, -4.884765625, -4.70703125, -4.529296875, -4.3515625, -4.173828125, -3.99609375, -3.818359375, -3.640625, -3.462890625, -3.28515625, -3.107421875, -2.9296875, -2.751953125, -2.57421875, -2.396484375, -2.21875, -2.041015625, -1.86328125, -1.685546875, -1.5078125, -1.330078125, -1.15234375, -0.974609375, -0.796875, -0.619140625, -0.44140625, -0.263671875, -0.0859375, 0.091796875, 0.26953125, 0.447265625, 0.625, 0.802734375, 0.98046875, 1.158203125, 1.3359375, 1.513671875, 1.69140625, 1.869140625, 2.046875, 2.224609375, 2.40234375, 2.580078125, 2.7578125, 2.935546875, 3.11328125, 3.291015625, 3.46875, 3.646484375, 3.82421875, 4.001953125, 4.1796875, 4.357421875, 4.53515625, 4.712890625, 4.890625, 5.068359375, 5.24609375]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 4.0, 2.0, 13.0, 5.0, 7.0, 14.0, 14.0, 13.0, 20.0, 16.0, 17.0, 36.0, 41.0, 64.0, 108.0, 177.0, 296.0, 591.0, 1554.0, 9114.0, 359818.0, 3581991.0, 230511.0, 7126.0, 1424.0, 547.0, 270.0, 137.0, 87.0, 79.0, 38.0, 26.0, 24.0, 25.0, 15.0, 17.0, 14.0, 10.0, 10.0, 5.0, 1.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-23.171875, -22.5361328125, -21.900390625, -21.2646484375, -20.62890625, -19.9931640625, -19.357421875, -18.7216796875, -18.0859375, -17.4501953125, -16.814453125, -16.1787109375, -15.54296875, -14.9072265625, -14.271484375, -13.6357421875, -13.0, -12.3642578125, -11.728515625, -11.0927734375, -10.45703125, -9.8212890625, -9.185546875, -8.5498046875, -7.9140625, -7.2783203125, -6.642578125, -6.0068359375, -5.37109375, -4.7353515625, -4.099609375, -3.4638671875, -2.828125, -2.1923828125, -1.556640625, -0.9208984375, -0.28515625, 0.3505859375, 0.986328125, 1.6220703125, 2.2578125, 2.8935546875, 3.529296875, 4.1650390625, 4.80078125, 5.4365234375, 6.072265625, 6.7080078125, 7.34375, 7.9794921875, 8.615234375, 9.2509765625, 9.88671875, 10.5224609375, 11.158203125, 11.7939453125, 12.4296875, 13.0654296875, 13.701171875, 14.3369140625, 14.97265625, 15.6083984375, 16.244140625, 16.8798828125, 17.515625]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 2.0, 1.0, 5.0, 7.0, 4.0, 9.0, 23.0, 22.0, 33.0, 48.0, 54.0, 69.0, 98.0, 159.0, 221.0, 274.0, 368.0, 453.0, 490.0, 480.0, 358.0, 257.0, 172.0, 150.0, 87.0, 58.0, 46.0, 39.0, 25.0, 14.0, 14.0, 8.0, 8.0, 8.0, 7.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.09375, -7.7744140625, -7.455078125, -7.1357421875, -6.81640625, -6.4970703125, -6.177734375, -5.8583984375, -5.5390625, -5.2197265625, -4.900390625, -4.5810546875, -4.26171875, -3.9423828125, -3.623046875, -3.3037109375, -2.984375, -2.6650390625, -2.345703125, -2.0263671875, -1.70703125, -1.3876953125, -1.068359375, -0.7490234375, -0.4296875, -0.1103515625, 0.208984375, 0.5283203125, 0.84765625, 1.1669921875, 1.486328125, 1.8056640625, 2.125, 2.4443359375, 2.763671875, 3.0830078125, 3.40234375, 3.7216796875, 4.041015625, 4.3603515625, 4.6796875, 4.9990234375, 5.318359375, 5.6376953125, 5.95703125, 6.2763671875, 6.595703125, 6.9150390625, 7.234375, 7.5537109375, 7.873046875, 8.1923828125, 8.51171875, 8.8310546875, 9.150390625, 9.4697265625, 9.7890625, 10.1083984375, 10.427734375, 10.7470703125, 11.06640625, 11.3857421875, 11.705078125, 12.0244140625, 12.34375]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 6.0, 0.0, 4.0, 8.0, 12.0, 10.0, 9.0, 21.0, 29.0, 27.0, 56.0, 73.0, 86.0, 127.0, 158.0, 207.0, 297.0, 452.0, 1342.0, 125426.0, 4053592.0, 10208.0, 686.0, 376.0, 272.0, 213.0, 141.0, 107.0, 87.0, 77.0, 53.0, 36.0, 28.0, 10.0, 22.0, 8.0, 5.0, 5.0, 6.0, 3.0, 1.0, 2.0, 2.0, 2.0], "bins": [-73.1875, -71.37158203125, -69.5556640625, -67.73974609375, -65.923828125, -64.10791015625, -62.2919921875, -60.47607421875, -58.66015625, -56.84423828125, -55.0283203125, -53.21240234375, -51.396484375, -49.58056640625, -47.7646484375, -45.94873046875, -44.1328125, -42.31689453125, -40.5009765625, -38.68505859375, -36.869140625, -35.05322265625, -33.2373046875, -31.42138671875, -29.60546875, -27.78955078125, -25.9736328125, -24.15771484375, -22.341796875, -20.52587890625, -18.7099609375, -16.89404296875, -15.078125, -13.26220703125, -11.4462890625, -9.63037109375, -7.814453125, -5.99853515625, -4.1826171875, -2.36669921875, -0.55078125, 1.26513671875, 3.0810546875, 4.89697265625, 6.712890625, 8.52880859375, 10.3447265625, 12.16064453125, 13.9765625, 15.79248046875, 17.6083984375, 19.42431640625, 21.240234375, 23.05615234375, 24.8720703125, 26.68798828125, 28.50390625, 30.31982421875, 32.1357421875, 33.95166015625, 35.767578125, 37.58349609375, 39.3994140625, 41.21533203125, 43.03125]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 21.0, 287.0, 538.0, 158.0, 9.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-101.29597473144531, -95.10132598876953, -88.90668487548828, -82.7120361328125, -76.51739501953125, -70.32274627685547, -64.12809753417969, -57.93345260620117, -51.738807678222656, -45.54416275024414, -39.349517822265625, -33.154869079589844, -26.960224151611328, -20.765579223632812, -14.570930480957031, -8.376285552978516, -2.181640625, 4.013005256652832, 10.207651138305664, 16.402297973632812, 22.596942901611328, 28.791587829589844, 34.986236572265625, 41.18088150024414, 47.375526428222656, 53.57017135620117, 59.76481628417969, 65.95946502685547, 72.15411376953125, 78.3487548828125, 84.54340362548828, 90.73805236816406, 96.93267822265625, 103.12732696533203, 109.32196807861328, 115.51661682128906, 121.71125793457031, 127.9059066772461, 134.10055541992188, 140.29519653320312, 146.48983764648438, 152.68447875976562, 158.87913513183594, 165.0737762451172, 171.26841735839844, 177.46307373046875, 183.65771484375, 189.85235595703125, 196.04701232910156, 202.2416534423828, 208.43630981445312, 214.63095092773438, 220.82559204101562, 227.02023315429688, 233.2148895263672, 239.40953063964844, 245.60418701171875, 251.798828125, 257.99346923828125, 264.1881103515625, 270.3827819824219, 276.5774230957031, 282.7720642089844, 288.9667053222656, 295.1613464355469]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 4.0, 6.0, 11.0, 13.0, 10.0, 18.0, 20.0, 18.0, 24.0, 19.0, 24.0, 26.0, 31.0, 35.0, 38.0, 38.0, 43.0, 40.0, 43.0, 49.0, 30.0, 50.0, 37.0, 46.0, 35.0, 40.0, 31.0, 33.0, 24.0, 22.0, 18.0, 19.0, 24.0, 16.0, 18.0, 9.0, 8.0, 6.0, 3.0, 5.0, 4.0, 2.0, 6.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-34.726531982421875, -33.73191452026367, -32.7372932434082, -31.74267578125, -30.748058319091797, -29.75343894958496, -28.758819580078125, -27.764202117919922, -26.76958465576172, -25.774965286254883, -24.78034782409668, -23.785728454589844, -22.79111099243164, -21.796491622924805, -20.80187225341797, -19.807254791259766, -18.81263542175293, -17.818016052246094, -16.82339859008789, -15.828779220581055, -14.834161758422852, -13.839542388916016, -12.844923973083496, -11.850305557250977, -10.855687141418457, -9.861068725585938, -8.866450309753418, -7.87183141708374, -6.877213001251221, -5.882594585418701, -4.887975692749023, -3.893357276916504, -2.8987388610839844, -1.9041203260421753, -0.9095017910003662, 0.08511686325073242, 1.079735279083252, 2.0743536949157715, 3.068972587585449, 4.063591003417969, 5.058209419250488, 6.052827835083008, 7.047446250915527, 8.042064666748047, 9.036684036254883, 10.031301498413086, 11.025920867919922, 12.020539283752441, 13.015157699584961, 14.00977611541748, 15.00439453125, 15.999013900756836, 16.99363136291504, 17.988250732421875, 18.982868194580078, 19.977487564086914, 20.97210693359375, 21.966726303100586, 22.96134376525879, 23.955963134765625, 24.950580596923828, 25.945199966430664, 26.9398193359375, 27.934436798095703, 28.929054260253906]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 6.0, 5.0, 3.0, 7.0, 6.0, 10.0, 16.0, 9.0, 15.0, 19.0, 20.0, 23.0, 20.0, 31.0, 19.0, 35.0, 35.0, 36.0, 41.0, 50.0, 33.0, 38.0, 38.0, 49.0, 35.0, 43.0, 45.0, 35.0, 24.0, 32.0, 38.0, 24.0, 20.0, 21.0, 26.0, 10.0, 15.0, 14.0, 16.0, 14.0, 10.0, 5.0, 6.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-6.1328125, -5.95965576171875, -5.7864990234375, -5.61334228515625, -5.440185546875, -5.26702880859375, -5.0938720703125, -4.92071533203125, -4.74755859375, -4.57440185546875, -4.4012451171875, -4.22808837890625, -4.054931640625, -3.88177490234375, -3.7086181640625, -3.53546142578125, -3.3623046875, -3.18914794921875, -3.0159912109375, -2.84283447265625, -2.669677734375, -2.49652099609375, -2.3233642578125, -2.15020751953125, -1.97705078125, -1.80389404296875, -1.6307373046875, -1.45758056640625, -1.284423828125, -1.11126708984375, -0.9381103515625, -0.76495361328125, -0.591796875, -0.41864013671875, -0.2454833984375, -0.07232666015625, 0.100830078125, 0.27398681640625, 0.4471435546875, 0.62030029296875, 0.79345703125, 0.96661376953125, 1.1397705078125, 1.31292724609375, 1.486083984375, 1.65924072265625, 1.8323974609375, 2.00555419921875, 2.1787109375, 2.35186767578125, 2.5250244140625, 2.69818115234375, 2.871337890625, 3.04449462890625, 3.2176513671875, 3.39080810546875, 3.56396484375, 3.73712158203125, 3.9102783203125, 4.08343505859375, 4.256591796875, 4.42974853515625, 4.6029052734375, 4.77606201171875, 4.94921875]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 5.0, 7.0, 8.0, 15.0, 16.0, 27.0, 46.0, 81.0, 98.0, 123.0, 172.0, 303.0, 450.0, 720.0, 1045.0, 1570.0, 2194.0, 3379.0, 5055.0, 7269.0, 11238.0, 16657.0, 25841.0, 40891.0, 66023.0, 108450.0, 167551.0, 195767.0, 146191.0, 90668.0, 56039.0, 34482.0, 22161.0, 14610.0, 9650.0, 6549.0, 4415.0, 2851.0, 1937.0, 1296.0, 861.0, 591.0, 401.0, 288.0, 192.0, 145.0, 92.0, 52.0, 25.0, 29.0, 13.0, 11.0, 4.0, 6.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.4951171875, -0.478790283203125, -0.46246337890625, -0.446136474609375, -0.4298095703125, -0.413482666015625, -0.39715576171875, -0.380828857421875, -0.364501953125, -0.348175048828125, -0.33184814453125, -0.315521240234375, -0.2991943359375, -0.282867431640625, -0.26654052734375, -0.250213623046875, -0.23388671875, -0.217559814453125, -0.20123291015625, -0.184906005859375, -0.1685791015625, -0.152252197265625, -0.13592529296875, -0.119598388671875, -0.103271484375, -0.086944580078125, -0.07061767578125, -0.054290771484375, -0.0379638671875, -0.021636962890625, -0.00531005859375, 0.011016845703125, 0.02734375, 0.043670654296875, 0.05999755859375, 0.076324462890625, 0.0926513671875, 0.108978271484375, 0.12530517578125, 0.141632080078125, 0.157958984375, 0.174285888671875, 0.19061279296875, 0.206939697265625, 0.2232666015625, 0.239593505859375, 0.25592041015625, 0.272247314453125, 0.28857421875, 0.304901123046875, 0.32122802734375, 0.337554931640625, 0.3538818359375, 0.370208740234375, 0.38653564453125, 0.402862548828125, 0.419189453125, 0.435516357421875, 0.45184326171875, 0.468170166015625, 0.4844970703125, 0.500823974609375, 0.51715087890625, 0.533477783203125, 0.5498046875]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 6.0, 7.0, 4.0, 14.0, 10.0, 10.0, 14.0, 16.0, 24.0, 14.0, 26.0, 26.0, 32.0, 29.0, 29.0, 35.0, 45.0, 26.0, 49.0, 51.0, 1074.0, 39.0, 39.0, 40.0, 38.0, 35.0, 35.0, 35.0, 26.0, 36.0, 27.0, 17.0, 25.0, 17.0, 13.0, 13.0, 8.0, 9.0, 9.0, 4.0, 2.0, 2.0, 0.0, 5.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0], "bins": [-3.77734375, -3.66290283203125, -3.5484619140625, -3.43402099609375, -3.319580078125, -3.20513916015625, -3.0906982421875, -2.97625732421875, -2.86181640625, -2.74737548828125, -2.6329345703125, -2.51849365234375, -2.404052734375, -2.28961181640625, -2.1751708984375, -2.06072998046875, -1.9462890625, -1.83184814453125, -1.7174072265625, -1.60296630859375, -1.488525390625, -1.37408447265625, -1.2596435546875, -1.14520263671875, -1.03076171875, -0.91632080078125, -0.8018798828125, -0.68743896484375, -0.572998046875, -0.45855712890625, -0.3441162109375, -0.22967529296875, -0.115234375, -0.00079345703125, 0.1136474609375, 0.22808837890625, 0.342529296875, 0.45697021484375, 0.5714111328125, 0.68585205078125, 0.80029296875, 0.91473388671875, 1.0291748046875, 1.14361572265625, 1.258056640625, 1.37249755859375, 1.4869384765625, 1.60137939453125, 1.7158203125, 1.83026123046875, 1.9447021484375, 2.05914306640625, 2.173583984375, 2.28802490234375, 2.4024658203125, 2.51690673828125, 2.63134765625, 2.74578857421875, 2.8602294921875, 2.97467041015625, 3.089111328125, 3.20355224609375, 3.3179931640625, 3.43243408203125, 3.546875]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 4.0, 13.0, 19.0, 18.0, 35.0, 64.0, 112.0, 161.0, 301.0, 500.0, 900.0, 1578.0, 3102.0, 5856.0, 11379.0, 22157.0, 44890.0, 92126.0, 190170.0, 1330968.0, 199497.0, 97557.0, 47276.0, 23627.0, 11595.0, 6236.0, 3156.0, 1663.0, 947.0, 507.0, 288.0, 141.0, 106.0, 67.0, 41.0, 30.0, 14.0, 11.0, 7.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.68017578125, -0.6571502685546875, -0.634124755859375, -0.6110992431640625, -0.58807373046875, -0.5650482177734375, -0.542022705078125, -0.5189971923828125, -0.4959716796875, -0.4729461669921875, -0.449920654296875, -0.4268951416015625, -0.40386962890625, -0.3808441162109375, -0.357818603515625, -0.3347930908203125, -0.311767578125, -0.2887420654296875, -0.265716552734375, -0.2426910400390625, -0.21966552734375, -0.1966400146484375, -0.173614501953125, -0.1505889892578125, -0.1275634765625, -0.1045379638671875, -0.081512451171875, -0.0584869384765625, -0.03546142578125, -0.0124359130859375, 0.010589599609375, 0.0336151123046875, 0.056640625, 0.0796661376953125, 0.102691650390625, 0.1257171630859375, 0.14874267578125, 0.1717681884765625, 0.194793701171875, 0.2178192138671875, 0.2408447265625, 0.2638702392578125, 0.286895751953125, 0.3099212646484375, 0.33294677734375, 0.3559722900390625, 0.378997802734375, 0.4020233154296875, 0.425048828125, 0.4480743408203125, 0.471099853515625, 0.4941253662109375, 0.51715087890625, 0.5401763916015625, 0.563201904296875, 0.5862274169921875, 0.6092529296875, 0.6322784423828125, 0.655303955078125, 0.6783294677734375, 0.70135498046875, 0.7243804931640625, 0.747406005859375, 0.7704315185546875, 0.79345703125]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 10.0, 7.0, 9.0, 8.0, 8.0, 10.0, 21.0, 14.0, 20.0, 26.0, 23.0, 29.0, 34.0, 36.0, 35.0, 39.0, 43.0, 39.0, 41.0, 36.0, 34.0, 33.0, 42.0, 38.0, 31.0, 37.0, 36.0, 41.0, 29.0, 37.0, 28.0, 27.0, 22.0, 16.0, 12.0, 9.0, 7.0, 6.0, 6.0, 6.0, 3.0, 3.0, 1.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0007967948913574219, -0.000772327184677124, -0.0007478594779968262, -0.0007233917713165283, -0.0006989240646362305, -0.0006744563579559326, -0.0006499886512756348, -0.0006255209445953369, -0.0006010532379150391, -0.0005765855312347412, -0.0005521178245544434, -0.0005276501178741455, -0.0005031824111938477, -0.0004787147045135498, -0.00045424699783325195, -0.0004297792911529541, -0.00040531158447265625, -0.0003808438777923584, -0.00035637617111206055, -0.0003319084644317627, -0.00030744075775146484, -0.000282973051071167, -0.00025850534439086914, -0.0002340376377105713, -0.00020956993103027344, -0.00018510222434997559, -0.00016063451766967773, -0.00013616681098937988, -0.00011169910430908203, -8.723139762878418e-05, -6.276369094848633e-05, -3.8295984268188477e-05, -1.3828277587890625e-05, 1.0639429092407227e-05, 3.510713577270508e-05, 5.957484245300293e-05, 8.404254913330078e-05, 0.00010851025581359863, 0.00013297796249389648, 0.00015744566917419434, 0.0001819133758544922, 0.00020638108253479004, 0.0002308487892150879, 0.00025531649589538574, 0.0002797842025756836, 0.00030425190925598145, 0.0003287196159362793, 0.00035318732261657715, 0.000377655029296875, 0.00040212273597717285, 0.0004265904426574707, 0.00045105814933776855, 0.0004755258560180664, 0.0004999935626983643, 0.0005244612693786621, 0.00054892897605896, 0.0005733966827392578, 0.0005978643894195557, 0.0006223320960998535, 0.0006467998027801514, 0.0006712675094604492, 0.0006957352161407471, 0.0007202029228210449, 0.0007446706295013428, 0.0007691383361816406]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 5.0, 1.0, 0.0, 8.0, 5.0, 6.0, 9.0, 6.0, 12.0, 17.0, 24.0, 27.0, 32.0, 43.0, 40.0, 63.0, 52.0, 88.0, 91.0, 136.0, 240.0, 547.0, 1834.0, 943019.0, 100161.0, 1032.0, 379.0, 169.0, 104.0, 71.0, 56.0, 58.0, 46.0, 41.0, 22.0, 26.0, 18.0, 15.0, 8.0, 8.0, 11.0, 8.0, 6.0, 5.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.01885986328125, -0.018266916275024414, -0.017673969268798828, -0.017081022262573242, -0.016488075256347656, -0.01589512825012207, -0.015302181243896484, -0.014709234237670898, -0.014116287231445312, -0.013523340225219727, -0.01293039321899414, -0.012337446212768555, -0.011744499206542969, -0.011151552200317383, -0.010558605194091797, -0.009965658187866211, -0.009372711181640625, -0.008779764175415039, -0.008186817169189453, -0.007593870162963867, -0.007000923156738281, -0.006407976150512695, -0.005815029144287109, -0.0052220821380615234, -0.0046291351318359375, -0.0040361881256103516, -0.0034432411193847656, -0.0028502941131591797, -0.0022573471069335938, -0.0016644001007080078, -0.0010714530944824219, -0.00047850608825683594, 0.00011444091796875, 0.0007073879241943359, 0.0013003349304199219, 0.0018932819366455078, 0.0024862289428710938, 0.0030791759490966797, 0.0036721229553222656, 0.0042650699615478516, 0.0048580169677734375, 0.0054509639739990234, 0.006043910980224609, 0.006636857986450195, 0.007229804992675781, 0.007822751998901367, 0.008415699005126953, 0.009008646011352539, 0.009601593017578125, 0.010194540023803711, 0.010787487030029297, 0.011380434036254883, 0.011973381042480469, 0.012566328048706055, 0.01315927505493164, 0.013752222061157227, 0.014345169067382812, 0.014938116073608398, 0.015531063079833984, 0.01612401008605957, 0.016716957092285156, 0.017309904098510742, 0.017902851104736328, 0.018495798110961914, 0.0190887451171875]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 95.0, 919.0, 2.0, 1.0], "bins": [-0.01591569185256958, -0.015656089410185814, -0.015396486036479473, -0.015136883594095707, -0.01487728115171194, -0.0146176777780056, -0.014358075335621834, -0.014098472893238068, -0.013838869519531727, -0.01357926707714796, -0.01331966370344162, -0.013060061261057854, -0.012800458818674088, -0.012540855444967747, -0.01228125300258398, -0.012021650560200214, -0.011762047186493874, -0.011502444744110107, -0.011242841370403767, -0.01098323892802, -0.010723636485636234, -0.010464033111929893, -0.010204430669546127, -0.009944828227162361, -0.009685225784778595, -0.009425623342394829, -0.009166019968688488, -0.008906417526304722, -0.008646815083920956, -0.008387211710214615, -0.008127609267830849, -0.007868006825447083, -0.007608403917402029, -0.0073488010093569756, -0.007089198566973209, -0.006829595658928156, -0.006569992750883102, -0.006310390308499336, -0.006050787400454283, -0.005791184492409229, -0.005531582050025463, -0.00527197914198041, -0.0050123766995966434, -0.00475277379155159, -0.0044931708835065365, -0.004233567975461483, -0.003973965533077717, -0.0037143626250326633, -0.00345475971698761, -0.0031951570417732, -0.0029355541337281466, -0.0026759514585137367, -0.0024163485504686832, -0.0021567458752542734, -0.0018971432000398636, -0.001637540408410132, -0.001377937733195722, -0.0011183349415659904, -0.0008587322081439197, -0.000599129474721849, -0.0003395266830921173, -7.992389146238565e-05, 0.00017967878375202417, 0.00043928157538175583, 0.0006988843670114875]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 7.0, 5.0, 5.0, 10.0, 15.0, 16.0, 16.0, 19.0, 12.0, 21.0, 32.0, 35.0, 38.0, 48.0, 48.0, 44.0, 50.0, 49.0, 45.0, 33.0, 49.0, 48.0, 46.0, 42.0, 35.0, 31.0, 26.0, 24.0, 24.0, 27.0, 23.0, 19.0, 15.0, 6.0, 13.0, 5.0, 7.0, 6.0, 1.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004761219024658203, -0.00045892875641584396, -0.0004417356103658676, -0.00042454246431589127, -0.0004073493182659149, -0.00039015617221593857, -0.0003729630261659622, -0.00035576988011598587, -0.0003385767340660095, -0.00032138358801603317, -0.0003041904419660568, -0.0002869972959160805, -0.0002698041498661041, -0.0002526110038161278, -0.00023541785776615143, -0.00021822471171617508, -0.00020103156566619873, -0.00018383841961622238, -0.00016664527356624603, -0.00014945212751626968, -0.00013225898146629333, -0.00011506583541631699, -9.787268936634064e-05, -8.067954331636429e-05, -6.348639726638794e-05, -4.629325121641159e-05, -2.9100105166435242e-05, -1.1906959116458893e-05, 5.286186933517456e-06, 2.2479332983493805e-05, 3.9672479033470154e-05, 5.68656250834465e-05, 7.405877113342285e-05, 9.12519171833992e-05, 0.00010844506323337555, 0.0001256382092833519, 0.00014283135533332825, 0.0001600245013833046, 0.00017721764743328094, 0.0001944107934832573, 0.00021160393953323364, 0.00022879708558321, 0.00024599023163318634, 0.0002631833776831627, 0.00028037652373313904, 0.0002975696697831154, 0.00031476281583309174, 0.0003319559618830681, 0.00034914910793304443, 0.0003663422539830208, 0.00038353540003299713, 0.0004007285460829735, 0.00041792169213294983, 0.0004351148381829262, 0.0004523079842329025, 0.0004695011302828789, 0.0004866942763328552, 0.0005038874223828316, 0.0005210805684328079, 0.0005382737144827843, 0.0005554668605327606, 0.000572660006582737, 0.0005898531526327133, 0.0006070462986826897, 0.000624239444732666]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 6.0, 5.0, 3.0, 7.0, 6.0, 10.0, 16.0, 9.0, 15.0, 19.0, 20.0, 23.0, 20.0, 31.0, 19.0, 35.0, 35.0, 36.0, 41.0, 50.0, 33.0, 38.0, 38.0, 49.0, 35.0, 43.0, 45.0, 35.0, 24.0, 32.0, 38.0, 24.0, 20.0, 21.0, 26.0, 10.0, 15.0, 14.0, 16.0, 14.0, 10.0, 5.0, 6.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-6.1328125, -5.95965576171875, -5.7864990234375, -5.61334228515625, -5.440185546875, -5.26702880859375, -5.0938720703125, -4.92071533203125, -4.74755859375, -4.57440185546875, -4.4012451171875, -4.22808837890625, -4.054931640625, -3.88177490234375, -3.7086181640625, -3.53546142578125, -3.3623046875, -3.18914794921875, -3.0159912109375, -2.84283447265625, -2.669677734375, -2.49652099609375, -2.3233642578125, -2.15020751953125, -1.97705078125, -1.80389404296875, -1.6307373046875, -1.45758056640625, -1.284423828125, -1.11126708984375, -0.9381103515625, -0.76495361328125, -0.591796875, -0.41864013671875, -0.2454833984375, -0.07232666015625, 0.100830078125, 0.27398681640625, 0.4471435546875, 0.62030029296875, 0.79345703125, 0.96661376953125, 1.1397705078125, 1.31292724609375, 1.486083984375, 1.65924072265625, 1.8323974609375, 2.00555419921875, 2.1787109375, 2.35186767578125, 2.5250244140625, 2.69818115234375, 2.871337890625, 3.04449462890625, 3.2176513671875, 3.39080810546875, 3.56396484375, 3.73712158203125, 3.9102783203125, 4.08343505859375, 4.256591796875, 4.42974853515625, 4.6029052734375, 4.77606201171875, 4.94921875]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 8.0, 2.0, 7.0, 6.0, 9.0, 21.0, 19.0, 20.0, 30.0, 34.0, 54.0, 69.0, 88.0, 121.0, 184.0, 282.0, 415.0, 783.0, 1482.0, 5519.0, 35733.0, 434855.0, 519125.0, 40004.0, 5923.0, 1587.0, 741.0, 465.0, 265.0, 170.0, 139.0, 83.0, 74.0, 54.0, 43.0, 29.0, 24.0, 26.0, 17.0, 13.0, 11.0, 8.0, 6.0, 2.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-11.171875, -10.8529052734375, -10.533935546875, -10.2149658203125, -9.89599609375, -9.5770263671875, -9.258056640625, -8.9390869140625, -8.6201171875, -8.3011474609375, -7.982177734375, -7.6632080078125, -7.34423828125, -7.0252685546875, -6.706298828125, -6.3873291015625, -6.068359375, -5.7493896484375, -5.430419921875, -5.1114501953125, -4.79248046875, -4.4735107421875, -4.154541015625, -3.8355712890625, -3.5166015625, -3.1976318359375, -2.878662109375, -2.5596923828125, -2.24072265625, -1.9217529296875, -1.602783203125, -1.2838134765625, -0.96484375, -0.6458740234375, -0.326904296875, -0.0079345703125, 0.31103515625, 0.6300048828125, 0.948974609375, 1.2679443359375, 1.5869140625, 1.9058837890625, 2.224853515625, 2.5438232421875, 2.86279296875, 3.1817626953125, 3.500732421875, 3.8197021484375, 4.138671875, 4.4576416015625, 4.776611328125, 5.0955810546875, 5.41455078125, 5.7335205078125, 6.052490234375, 6.3714599609375, 6.6904296875, 7.0093994140625, 7.328369140625, 7.6473388671875, 7.96630859375, 8.2852783203125, 8.604248046875, 8.9232177734375, 9.2421875]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 4.0, 7.0, 3.0, 8.0, 5.0, 4.0, 7.0, 19.0, 20.0, 18.0, 17.0, 26.0, 31.0, 35.0, 48.0, 50.0, 51.0, 52.0, 59.0, 115.0, 1763.0, 230.0, 61.0, 57.0, 53.0, 38.0, 32.0, 30.0, 26.0, 31.0, 25.0, 25.0, 17.0, 16.0, 6.0, 15.0, 14.0, 6.0, 12.0, 6.0, 5.0, 4.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.171875, -16.551513671875, -15.93115234375, -15.310791015625, -14.6904296875, -14.070068359375, -13.44970703125, -12.829345703125, -12.208984375, -11.588623046875, -10.96826171875, -10.347900390625, -9.7275390625, -9.107177734375, -8.48681640625, -7.866455078125, -7.24609375, -6.625732421875, -6.00537109375, -5.385009765625, -4.7646484375, -4.144287109375, -3.52392578125, -2.903564453125, -2.283203125, -1.662841796875, -1.04248046875, -0.422119140625, 0.1982421875, 0.818603515625, 1.43896484375, 2.059326171875, 2.6796875, 3.300048828125, 3.92041015625, 4.540771484375, 5.1611328125, 5.781494140625, 6.40185546875, 7.022216796875, 7.642578125, 8.262939453125, 8.88330078125, 9.503662109375, 10.1240234375, 10.744384765625, 11.36474609375, 11.985107421875, 12.60546875, 13.225830078125, 13.84619140625, 14.466552734375, 15.0869140625, 15.707275390625, 16.32763671875, 16.947998046875, 17.568359375, 18.188720703125, 18.80908203125, 19.429443359375, 20.0498046875, 20.670166015625, 21.29052734375, 21.910888671875, 22.53125]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 7.0, 4.0, 7.0, 11.0, 7.0, 16.0, 14.0, 9.0, 15.0, 20.0, 30.0, 34.0, 31.0, 38.0, 59.0, 72.0, 141.0, 228.0, 401.0, 1218.0, 510603.0, 2630077.0, 1532.0, 415.0, 214.0, 130.0, 91.0, 59.0, 49.0, 36.0, 21.0, 23.0, 19.0, 22.0, 13.0, 8.0, 6.0, 6.0, 7.0, 4.0, 4.0, 3.0, 4.0, 4.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-67.125, -65.2626953125, -63.400390625, -61.5380859375, -59.67578125, -57.8134765625, -55.951171875, -54.0888671875, -52.2265625, -50.3642578125, -48.501953125, -46.6396484375, -44.77734375, -42.9150390625, -41.052734375, -39.1904296875, -37.328125, -35.4658203125, -33.603515625, -31.7412109375, -29.87890625, -28.0166015625, -26.154296875, -24.2919921875, -22.4296875, -20.5673828125, -18.705078125, -16.8427734375, -14.98046875, -13.1181640625, -11.255859375, -9.3935546875, -7.53125, -5.6689453125, -3.806640625, -1.9443359375, -0.08203125, 1.7802734375, 3.642578125, 5.5048828125, 7.3671875, 9.2294921875, 11.091796875, 12.9541015625, 14.81640625, 16.6787109375, 18.541015625, 20.4033203125, 22.265625, 24.1279296875, 25.990234375, 27.8525390625, 29.71484375, 31.5771484375, 33.439453125, 35.3017578125, 37.1640625, 39.0263671875, 40.888671875, 42.7509765625, 44.61328125, 46.4755859375, 48.337890625, 50.2001953125, 52.0625]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 950.0, 65.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.243045806884766, -53.319374084472656, -46.39570617675781, -39.47203826904297, -32.54836654663086, -25.624698638916016, -18.701026916503906, -11.777355194091797, -4.853687286376953, 2.0699825286865234, 8.99365234375, 15.917322158813477, 22.840991973876953, 29.764659881591797, 36.688331604003906, 43.612003326416016, 50.53567123413086, 57.45934295654297, 64.38301086425781, 71.30667877197266, 78.2303466796875, 85.15402221679688, 92.07769012451172, 99.00135803222656, 105.92503356933594, 112.84870147705078, 119.77236938476562, 126.696044921875, 133.61972045898438, 140.5433807373047, 147.46705627441406, 154.39071655273438, 161.31439208984375, 168.23806762695312, 175.16172790527344, 182.0854034423828, 189.00906372070312, 195.9327392578125, 202.85641479492188, 209.78009033203125, 216.70375061035156, 223.62742614746094, 230.55108642578125, 237.47476196289062, 244.3984375, 251.3220977783203, 258.2457580566406, 265.16943359375, 272.0931091308594, 279.01678466796875, 285.9404602050781, 292.8641052246094, 299.78778076171875, 306.7114562988281, 313.6351318359375, 320.5588073730469, 327.48248291015625, 334.4061584472656, 341.329833984375, 348.25347900390625, 355.1771545410156, 362.100830078125, 369.0245056152344, 375.94818115234375, 382.871826171875]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 7.0, 1.0, 5.0, 3.0, 4.0, 3.0, 12.0, 12.0, 10.0, 16.0, 17.0, 24.0, 12.0, 17.0, 29.0, 30.0, 35.0, 33.0, 29.0, 40.0, 38.0, 43.0, 33.0, 29.0, 41.0, 37.0, 52.0, 40.0, 34.0, 28.0, 42.0, 34.0, 24.0, 34.0, 15.0, 20.0, 14.0, 19.0, 12.0, 13.0, 12.0, 7.0, 12.0, 6.0, 4.0, 6.0, 8.0, 5.0, 4.0, 7.0, 1.0, 2.0, 1.0, 1.0], "bins": [-56.04705047607422, -54.48263931274414, -52.91823196411133, -51.35382080078125, -49.78940963745117, -48.22500228881836, -46.66059112548828, -45.09618377685547, -43.53177261352539, -41.96736145019531, -40.4029541015625, -38.83854293823242, -37.274131774902344, -35.70972442626953, -34.14531326293945, -32.580902099609375, -31.01649284362793, -29.452083587646484, -27.887672424316406, -26.32326316833496, -24.758853912353516, -23.194442749023438, -21.630033493041992, -20.065624237060547, -18.50121307373047, -16.936803817749023, -15.372393608093262, -13.8079833984375, -12.243574142456055, -10.679163932800293, -9.114753723144531, -7.550344467163086, -5.985935211181641, -4.421525478363037, -2.8571155071258545, -1.2927055358886719, 0.27170419692993164, 1.8361139297485352, 3.400524139404297, 4.964933395385742, 6.529343605041504, 8.093753814697266, 9.658163070678711, 11.222573280334473, 12.786983489990234, 14.35139274597168, 15.915802955627441, 17.480213165283203, 19.04462242126465, 20.609031677246094, 22.173442840576172, 23.737852096557617, 25.302261352539062, 26.86667251586914, 28.431081771850586, 29.99549102783203, 31.55990219116211, 33.12431335449219, 34.688720703125, 36.25313186645508, 37.817543029785156, 39.38195037841797, 40.94636154174805, 42.510772705078125, 44.07518005371094]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 3.0, 2.0, 6.0, 5.0, 4.0, 9.0, 3.0, 16.0, 4.0, 14.0, 16.0, 24.0, 25.0, 18.0, 27.0, 29.0, 27.0, 28.0, 32.0, 38.0, 37.0, 58.0, 33.0, 41.0, 31.0, 57.0, 47.0, 24.0, 44.0, 30.0, 38.0, 32.0, 21.0, 24.0, 25.0, 17.0, 26.0, 16.0, 14.0, 12.0, 14.0, 12.0, 6.0, 8.0, 7.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.28515625, -6.1005859375, -5.916015625, -5.7314453125, -5.546875, -5.3623046875, -5.177734375, -4.9931640625, -4.80859375, -4.6240234375, -4.439453125, -4.2548828125, -4.0703125, -3.8857421875, -3.701171875, -3.5166015625, -3.33203125, -3.1474609375, -2.962890625, -2.7783203125, -2.59375, -2.4091796875, -2.224609375, -2.0400390625, -1.85546875, -1.6708984375, -1.486328125, -1.3017578125, -1.1171875, -0.9326171875, -0.748046875, -0.5634765625, -0.37890625, -0.1943359375, -0.009765625, 0.1748046875, 0.359375, 0.5439453125, 0.728515625, 0.9130859375, 1.09765625, 1.2822265625, 1.466796875, 1.6513671875, 1.8359375, 2.0205078125, 2.205078125, 2.3896484375, 2.57421875, 2.7587890625, 2.943359375, 3.1279296875, 3.3125, 3.4970703125, 3.681640625, 3.8662109375, 4.05078125, 4.2353515625, 4.419921875, 4.6044921875, 4.7890625, 4.9736328125, 5.158203125, 5.3427734375, 5.52734375]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 5.0, 3.0, 3.0, 7.0, 6.0, 12.0, 11.0, 15.0, 13.0, 26.0, 36.0, 36.0, 61.0, 62.0, 113.0, 155.0, 236.0, 398.0, 681.0, 1322.0, 2836.0, 7349.0, 24037.0, 111546.0, 537527.0, 1490480.0, 1404140.0, 477422.0, 100650.0, 22414.0, 6868.0, 2718.0, 1276.0, 709.0, 351.0, 209.0, 147.0, 110.0, 70.0, 58.0, 44.0, 32.0, 22.0, 13.0, 18.0, 12.0, 10.0, 8.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-7.78125, -7.545166015625, -7.30908203125, -7.072998046875, -6.8369140625, -6.600830078125, -6.36474609375, -6.128662109375, -5.892578125, -5.656494140625, -5.42041015625, -5.184326171875, -4.9482421875, -4.712158203125, -4.47607421875, -4.239990234375, -4.00390625, -3.767822265625, -3.53173828125, -3.295654296875, -3.0595703125, -2.823486328125, -2.58740234375, -2.351318359375, -2.115234375, -1.879150390625, -1.64306640625, -1.406982421875, -1.1708984375, -0.934814453125, -0.69873046875, -0.462646484375, -0.2265625, 0.009521484375, 0.24560546875, 0.481689453125, 0.7177734375, 0.953857421875, 1.18994140625, 1.426025390625, 1.662109375, 1.898193359375, 2.13427734375, 2.370361328125, 2.6064453125, 2.842529296875, 3.07861328125, 3.314697265625, 3.55078125, 3.786865234375, 4.02294921875, 4.259033203125, 4.4951171875, 4.731201171875, 4.96728515625, 5.203369140625, 5.439453125, 5.675537109375, 5.91162109375, 6.147705078125, 6.3837890625, 6.619873046875, 6.85595703125, 7.092041015625, 7.328125]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 5.0, 12.0, 12.0, 17.0, 24.0, 44.0, 56.0, 88.0, 130.0, 171.0, 254.0, 408.0, 488.0, 576.0, 492.0, 355.0, 276.0, 203.0, 134.0, 98.0, 76.0, 44.0, 31.0, 30.0, 12.0, 17.0, 4.0, 7.0, 9.0, 3.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.8671875, -9.4473876953125, -9.027587890625, -8.6077880859375, -8.18798828125, -7.7681884765625, -7.348388671875, -6.9285888671875, -6.5087890625, -6.0889892578125, -5.669189453125, -5.2493896484375, -4.82958984375, -4.4097900390625, -3.989990234375, -3.5701904296875, -3.150390625, -2.7305908203125, -2.310791015625, -1.8909912109375, -1.47119140625, -1.0513916015625, -0.631591796875, -0.2117919921875, 0.2080078125, 0.6278076171875, 1.047607421875, 1.4674072265625, 1.88720703125, 2.3070068359375, 2.726806640625, 3.1466064453125, 3.56640625, 3.9862060546875, 4.406005859375, 4.8258056640625, 5.24560546875, 5.6654052734375, 6.085205078125, 6.5050048828125, 6.9248046875, 7.3446044921875, 7.764404296875, 8.1842041015625, 8.60400390625, 9.0238037109375, 9.443603515625, 9.8634033203125, 10.283203125, 10.7030029296875, 11.122802734375, 11.5426025390625, 11.96240234375, 12.3822021484375, 12.802001953125, 13.2218017578125, 13.6416015625, 14.0614013671875, 14.481201171875, 14.9010009765625, 15.32080078125, 15.7406005859375, 16.160400390625, 16.5802001953125, 17.0]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 2.0, 5.0, 9.0, 11.0, 16.0, 20.0, 26.0, 35.0, 40.0, 78.0, 111.0, 128.0, 158.0, 190.0, 272.0, 374.0, 759.0, 2646.0, 204220.0, 3965287.0, 16852.0, 1336.0, 475.0, 314.0, 242.0, 190.0, 110.0, 90.0, 94.0, 53.0, 48.0, 32.0, 18.0, 16.0, 6.0, 4.0, 9.0, 5.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-60.90625, -59.35595703125, -57.8056640625, -56.25537109375, -54.705078125, -53.15478515625, -51.6044921875, -50.05419921875, -48.50390625, -46.95361328125, -45.4033203125, -43.85302734375, -42.302734375, -40.75244140625, -39.2021484375, -37.65185546875, -36.1015625, -34.55126953125, -33.0009765625, -31.45068359375, -29.900390625, -28.35009765625, -26.7998046875, -25.24951171875, -23.69921875, -22.14892578125, -20.5986328125, -19.04833984375, -17.498046875, -15.94775390625, -14.3974609375, -12.84716796875, -11.296875, -9.74658203125, -8.1962890625, -6.64599609375, -5.095703125, -3.54541015625, -1.9951171875, -0.44482421875, 1.10546875, 2.65576171875, 4.2060546875, 5.75634765625, 7.306640625, 8.85693359375, 10.4072265625, 11.95751953125, 13.5078125, 15.05810546875, 16.6083984375, 18.15869140625, 19.708984375, 21.25927734375, 22.8095703125, 24.35986328125, 25.91015625, 27.46044921875, 29.0107421875, 30.56103515625, 32.111328125, 33.66162109375, 35.2119140625, 36.76220703125, 38.3125]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 5.0, 73.0, 474.0, 418.0, 43.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.217418670654297, -18.67082977294922, -12.124239921569824, -5.57765007019043, 0.9689388275146484, 7.515529632568359, 14.062118530273438, 20.608707427978516, 27.155296325683594, 33.70188522338867, 40.24847412109375, 46.795066833496094, 53.341651916503906, 59.88824462890625, 66.43482971191406, 72.9814224243164, 79.52801513671875, 86.0746078491211, 92.6211929321289, 99.16778564453125, 105.71437072753906, 112.2609634399414, 118.80755615234375, 125.35414123535156, 131.90072631835938, 138.4473114013672, 144.99391174316406, 151.54049682617188, 158.0870819091797, 164.6336669921875, 171.18026733398438, 177.7268524169922, 184.27345275878906, 190.82003784179688, 197.36663818359375, 203.91322326660156, 210.45980834960938, 217.00640869140625, 223.55299377441406, 230.09957885742188, 236.6461639404297, 243.1927490234375, 249.73934936523438, 256.2859191894531, 262.83251953125, 269.3791198730469, 275.9256896972656, 282.4722900390625, 289.0188903808594, 295.56549072265625, 302.112060546875, 308.6586608886719, 315.20526123046875, 321.7518310546875, 328.2984313964844, 334.84503173828125, 341.3916015625, 347.9382019042969, 354.4847717285156, 361.0313720703125, 367.5779724121094, 374.1245422363281, 380.671142578125, 387.21771240234375, 393.7643127441406]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 3.0, 3.0, 4.0, 1.0, 8.0, 12.0, 10.0, 14.0, 16.0, 24.0, 20.0, 22.0, 21.0, 38.0, 35.0, 31.0, 45.0, 34.0, 43.0, 50.0, 45.0, 59.0, 54.0, 33.0, 36.0, 41.0, 49.0, 34.0, 41.0, 25.0, 31.0, 22.0, 30.0, 20.0, 9.0, 8.0, 8.0, 3.0, 4.0, 7.0, 3.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-40.171897888183594, -38.840877532958984, -37.50985336303711, -36.1788330078125, -34.84781265258789, -33.51679229736328, -32.185768127441406, -30.854747772216797, -29.523725509643555, -28.192703247070312, -26.861682891845703, -25.53066062927246, -24.19963836669922, -22.86861801147461, -21.537595748901367, -20.206573486328125, -18.875553131103516, -17.544530868530273, -16.213510513305664, -14.882488250732422, -13.551466941833496, -12.22044563293457, -10.889423370361328, -9.558402061462402, -8.227380752563477, -6.896359443664551, -5.565337657928467, -4.234315872192383, -2.903294563293457, -1.5722732543945312, -0.24125146865844727, 1.0897703170776367, 2.4207916259765625, 3.7518131732940674, 5.082834720611572, 6.413856506347656, 7.744877815246582, 9.075899124145508, 10.40692138671875, 11.737942695617676, 13.068964004516602, 14.399985313415527, 15.731006622314453, 17.062028884887695, 18.393051147460938, 19.724071502685547, 21.05509376525879, 22.38611602783203, 23.71713638305664, 25.048158645629883, 26.379179000854492, 27.710201263427734, 29.041221618652344, 30.372243881225586, 31.703266143798828, 33.03428649902344, 34.36531066894531, 35.69633102416992, 37.0273551940918, 38.358375549316406, 39.689395904541016, 41.020416259765625, 42.3514404296875, 43.68246078491211, 45.01348114013672]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 5.0, 5.0, 11.0, 10.0, 8.0, 20.0, 12.0, 21.0, 17.0, 21.0, 24.0, 29.0, 32.0, 26.0, 39.0, 43.0, 35.0, 47.0, 48.0, 54.0, 51.0, 46.0, 38.0, 45.0, 39.0, 34.0, 28.0, 28.0, 30.0, 32.0, 20.0, 17.0, 25.0, 11.0, 15.0, 11.0, 11.0, 3.0, 6.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.01953125, -5.82403564453125, -5.6285400390625, -5.43304443359375, -5.237548828125, -5.04205322265625, -4.8465576171875, -4.65106201171875, -4.45556640625, -4.26007080078125, -4.0645751953125, -3.86907958984375, -3.673583984375, -3.47808837890625, -3.2825927734375, -3.08709716796875, -2.8916015625, -2.69610595703125, -2.5006103515625, -2.30511474609375, -2.109619140625, -1.91412353515625, -1.7186279296875, -1.52313232421875, -1.32763671875, -1.13214111328125, -0.9366455078125, -0.74114990234375, -0.545654296875, -0.35015869140625, -0.1546630859375, 0.04083251953125, 0.236328125, 0.43182373046875, 0.6273193359375, 0.82281494140625, 1.018310546875, 1.21380615234375, 1.4093017578125, 1.60479736328125, 1.80029296875, 1.99578857421875, 2.1912841796875, 2.38677978515625, 2.582275390625, 2.77777099609375, 2.9732666015625, 3.16876220703125, 3.3642578125, 3.55975341796875, 3.7552490234375, 3.95074462890625, 4.146240234375, 4.34173583984375, 4.5372314453125, 4.73272705078125, 4.92822265625, 5.12371826171875, 5.3192138671875, 5.51470947265625, 5.710205078125, 5.90570068359375, 6.1011962890625, 6.29669189453125, 6.4921875]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 6.0, 3.0, 7.0, 5.0, 11.0, 20.0, 19.0, 45.0, 72.0, 109.0, 166.0, 249.0, 353.0, 549.0, 843.0, 1364.0, 1940.0, 2994.0, 4368.0, 6580.0, 10026.0, 15064.0, 22363.0, 34642.0, 54408.0, 87506.0, 138793.0, 189184.0, 168380.0, 111726.0, 69628.0, 43743.0, 27882.0, 18658.0, 12287.0, 8182.0, 5452.0, 3755.0, 2434.0, 1595.0, 1076.0, 681.0, 523.0, 292.0, 205.0, 126.0, 87.0, 55.0, 33.0, 30.0, 20.0, 9.0, 8.0, 7.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.5361328125, -0.5197677612304688, -0.5034027099609375, -0.48703765869140625, -0.470672607421875, -0.45430755615234375, -0.4379425048828125, -0.42157745361328125, -0.40521240234375, -0.38884735107421875, -0.3724822998046875, -0.35611724853515625, -0.339752197265625, -0.32338714599609375, -0.3070220947265625, -0.29065704345703125, -0.2742919921875, -0.25792694091796875, -0.2415618896484375, -0.22519683837890625, -0.208831787109375, -0.19246673583984375, -0.1761016845703125, -0.15973663330078125, -0.14337158203125, -0.12700653076171875, -0.1106414794921875, -0.09427642822265625, -0.077911376953125, -0.06154632568359375, -0.0451812744140625, -0.02881622314453125, -0.012451171875, 0.00391387939453125, 0.0202789306640625, 0.03664398193359375, 0.053009033203125, 0.06937408447265625, 0.0857391357421875, 0.10210418701171875, 0.11846923828125, 0.13483428955078125, 0.1511993408203125, 0.16756439208984375, 0.183929443359375, 0.20029449462890625, 0.2166595458984375, 0.23302459716796875, 0.2493896484375, 0.26575469970703125, 0.2821197509765625, 0.29848480224609375, 0.314849853515625, 0.33121490478515625, 0.3475799560546875, 0.36394500732421875, 0.38031005859375, 0.39667510986328125, 0.4130401611328125, 0.42940521240234375, 0.445770263671875, 0.46213531494140625, 0.4785003662109375, 0.49486541748046875, 0.51123046875]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 5.0, 6.0, 8.0, 10.0, 16.0, 13.0, 22.0, 26.0, 19.0, 33.0, 32.0, 37.0, 26.0, 28.0, 39.0, 47.0, 44.0, 41.0, 1062.0, 46.0, 53.0, 54.0, 35.0, 32.0, 29.0, 37.0, 35.0, 24.0, 32.0, 28.0, 15.0, 21.0, 15.0, 15.0, 12.0, 8.0, 4.0, 10.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.421875, -4.29437255859375, -4.1668701171875, -4.03936767578125, -3.911865234375, -3.78436279296875, -3.6568603515625, -3.52935791015625, -3.40185546875, -3.27435302734375, -3.1468505859375, -3.01934814453125, -2.891845703125, -2.76434326171875, -2.6368408203125, -2.50933837890625, -2.3818359375, -2.25433349609375, -2.1268310546875, -1.99932861328125, -1.871826171875, -1.74432373046875, -1.6168212890625, -1.48931884765625, -1.36181640625, -1.23431396484375, -1.1068115234375, -0.97930908203125, -0.851806640625, -0.72430419921875, -0.5968017578125, -0.46929931640625, -0.341796875, -0.21429443359375, -0.0867919921875, 0.04071044921875, 0.168212890625, 0.29571533203125, 0.4232177734375, 0.55072021484375, 0.67822265625, 0.80572509765625, 0.9332275390625, 1.06072998046875, 1.188232421875, 1.31573486328125, 1.4432373046875, 1.57073974609375, 1.6982421875, 1.82574462890625, 1.9532470703125, 2.08074951171875, 2.208251953125, 2.33575439453125, 2.4632568359375, 2.59075927734375, 2.71826171875, 2.84576416015625, 2.9732666015625, 3.10076904296875, 3.228271484375, 3.35577392578125, 3.4832763671875, 3.61077880859375, 3.73828125]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 3.0, 7.0, 8.0, 16.0, 14.0, 29.0, 42.0, 51.0, 107.0, 168.0, 239.0, 336.0, 607.0, 975.0, 1519.0, 2583.0, 4406.0, 7475.0, 13250.0, 23727.0, 43006.0, 78803.0, 142402.0, 1269319.0, 212907.0, 131325.0, 72728.0, 39394.0, 22024.0, 12100.0, 7032.0, 4142.0, 2476.0, 1463.0, 844.0, 574.0, 337.0, 245.0, 145.0, 107.0, 71.0, 45.0, 28.0, 16.0, 11.0, 10.0, 8.0, 5.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.55078125, -0.532379150390625, -0.51397705078125, -0.495574951171875, -0.4771728515625, -0.458770751953125, -0.44036865234375, -0.421966552734375, -0.403564453125, -0.385162353515625, -0.36676025390625, -0.348358154296875, -0.3299560546875, -0.311553955078125, -0.29315185546875, -0.274749755859375, -0.25634765625, -0.237945556640625, -0.21954345703125, -0.201141357421875, -0.1827392578125, -0.164337158203125, -0.14593505859375, -0.127532958984375, -0.109130859375, -0.090728759765625, -0.07232666015625, -0.053924560546875, -0.0355224609375, -0.017120361328125, 0.00128173828125, 0.019683837890625, 0.0380859375, 0.056488037109375, 0.07489013671875, 0.093292236328125, 0.1116943359375, 0.130096435546875, 0.14849853515625, 0.166900634765625, 0.185302734375, 0.203704833984375, 0.22210693359375, 0.240509033203125, 0.2589111328125, 0.277313232421875, 0.29571533203125, 0.314117431640625, 0.33251953125, 0.350921630859375, 0.36932373046875, 0.387725830078125, 0.4061279296875, 0.424530029296875, 0.44293212890625, 0.461334228515625, 0.479736328125, 0.498138427734375, 0.51654052734375, 0.534942626953125, 0.5533447265625, 0.571746826171875, 0.59014892578125, 0.608551025390625, 0.626953125]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 3.0, 9.0, 11.0, 14.0, 16.0, 14.0, 25.0, 42.0, 33.0, 55.0, 53.0, 54.0, 50.0, 47.0, 62.0, 58.0, 68.0, 63.0, 51.0, 46.0, 41.0, 36.0, 30.0, 31.0, 22.0, 14.0, 11.0, 13.0, 16.0, 6.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0011959075927734375, -0.0011620298027992249, -0.0011281520128250122, -0.0010942742228507996, -0.001060396432876587, -0.0010265186429023743, -0.0009926408529281616, -0.000958763062953949, -0.0009248852729797363, -0.0008910074830055237, -0.000857129693031311, -0.0008232519030570984, -0.0007893741130828857, -0.0007554963231086731, -0.0007216185331344604, -0.0006877407431602478, -0.0006538629531860352, -0.0006199851632118225, -0.0005861073732376099, -0.0005522295832633972, -0.0005183517932891846, -0.0004844740033149719, -0.0004505962133407593, -0.00041671842336654663, -0.000382840633392334, -0.00034896284341812134, -0.0003150850534439087, -0.00028120726346969604, -0.0002473294734954834, -0.00021345168352127075, -0.0001795738935470581, -0.00014569610357284546, -0.00011181831359863281, -7.794052362442017e-05, -4.406273365020752e-05, -1.0184943675994873e-05, 2.3692846298217773e-05, 5.757063627243042e-05, 9.144842624664307e-05, 0.0001253262162208557, 0.00015920400619506836, 0.000193081796169281, 0.00022695958614349365, 0.0002608373761177063, 0.00029471516609191895, 0.0003285929560661316, 0.00036247074604034424, 0.0003963485360145569, 0.00043022632598876953, 0.0004641041159629822, 0.0004979819059371948, 0.0005318596959114075, 0.0005657374858856201, 0.0005996152758598328, 0.0006334930658340454, 0.0006673708558082581, 0.0007012486457824707, 0.0007351264357566833, 0.000769004225730896, 0.0008028820157051086, 0.0008367598056793213, 0.0008706375956535339, 0.0009045153856277466, 0.0009383931756019592, 0.0009722709655761719]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 11.0, 12.0, 9.0, 14.0, 14.0, 22.0, 38.0, 46.0, 59.0, 74.0, 95.0, 143.0, 265.0, 756.0, 13858.0, 1030183.0, 1765.0, 472.0, 186.0, 120.0, 78.0, 78.0, 66.0, 55.0, 29.0, 25.0, 22.0, 13.0, 13.0, 5.0, 9.0, 8.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.021697998046875, -0.020957231521606445, -0.02021646499633789, -0.019475698471069336, -0.01873493194580078, -0.017994165420532227, -0.017253398895263672, -0.016512632369995117, -0.015771865844726562, -0.015031099319458008, -0.014290332794189453, -0.013549566268920898, -0.012808799743652344, -0.012068033218383789, -0.011327266693115234, -0.01058650016784668, -0.009845733642578125, -0.00910496711730957, -0.008364200592041016, -0.007623434066772461, -0.006882667541503906, -0.0061419010162353516, -0.005401134490966797, -0.004660367965698242, -0.0039196014404296875, -0.003178834915161133, -0.002438068389892578, -0.0016973018646240234, -0.0009565353393554688, -0.00021576881408691406, 0.0005249977111816406, 0.0012657642364501953, 0.00200653076171875, 0.0027472972869873047, 0.0034880638122558594, 0.004228830337524414, 0.004969596862792969, 0.0057103633880615234, 0.006451129913330078, 0.007191896438598633, 0.007932662963867188, 0.008673429489135742, 0.009414196014404297, 0.010154962539672852, 0.010895729064941406, 0.011636495590209961, 0.012377262115478516, 0.01311802864074707, 0.013858795166015625, 0.01459956169128418, 0.015340328216552734, 0.01608109474182129, 0.016821861267089844, 0.0175626277923584, 0.018303394317626953, 0.019044160842895508, 0.019784927368164062, 0.020525693893432617, 0.021266460418701172, 0.022007226943969727, 0.02274799346923828, 0.023488759994506836, 0.02422952651977539, 0.024970293045043945, 0.0257110595703125]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 227.0, 790.0], "bins": [-0.020816965028643608, -0.02048720046877861, -0.020157435908913612, -0.019827671349048615, -0.019497906789183617, -0.01916814222931862, -0.01883837766945362, -0.018508613109588623, -0.018178848549723625, -0.017849083989858627, -0.01751931942999363, -0.01718955487012863, -0.016859790310263634, -0.016530025750398636, -0.016200261190533638, -0.01587049663066864, -0.015540733002126217, -0.015210968442261219, -0.014881203882396221, -0.014551439322531223, -0.014221674762666225, -0.013891910202801228, -0.013562146574258804, -0.013232382014393806, -0.012902617454528809, -0.01257285289466381, -0.012243088334798813, -0.011913323774933815, -0.011583559215068817, -0.01125379465520382, -0.010924030095338821, -0.010594265535473824, -0.010264500044286251, -0.009934735484421253, -0.009604970924556255, -0.009275206364691257, -0.00894544180482626, -0.008615677244961262, -0.008285913616418839, -0.00795614905655384, -0.0076263840310275555, -0.007296619471162558, -0.00696685491129756, -0.006637090817093849, -0.006307326257228851, -0.0059775616973638535, -0.005647797137498856, -0.005318032577633858, -0.00498826801776886, -0.004658503457903862, -0.004328738898038864, -0.003998974338173866, -0.003669210011139512, -0.003339445451274514, -0.00300968112424016, -0.002679916564375162, -0.002350152237340808, -0.00202038767747581, -0.001690623234026134, -0.001360858790576458, -0.0010310942307114601, -0.0007013296708464622, -0.00037156534381210804, -4.1800783947110176e-05, 0.00028796386322937906]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 10.0, 7.0, 4.0, 14.0, 24.0, 17.0, 22.0, 20.0, 40.0, 45.0, 47.0, 51.0, 43.0, 54.0, 70.0, 57.0, 63.0, 48.0, 60.0, 49.0, 45.0, 51.0, 30.0, 29.0, 19.0, 25.0, 17.0, 20.0, 3.0, 8.0, 7.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004590749740600586, -0.0004376135766506195, -0.0004161521792411804, -0.00039469078183174133, -0.00037322938442230225, -0.00035176798701286316, -0.00033030658960342407, -0.000308845192193985, -0.0002873837947845459, -0.0002659223973751068, -0.0002444609999656677, -0.00022299960255622864, -0.00020153820514678955, -0.00018007680773735046, -0.00015861541032791138, -0.0001371540129184723, -0.0001156926155090332, -9.423121809959412e-05, -7.276982069015503e-05, -5.130842328071594e-05, -2.9847025871276855e-05, -8.385628461837769e-06, 1.3075768947601318e-05, 3.4537166357040405e-05, 5.599856376647949e-05, 7.745996117591858e-05, 9.892135858535767e-05, 0.00012038275599479675, 0.00014184415340423584, 0.00016330555081367493, 0.00018476694822311401, 0.0002062283456325531, 0.0002276897430419922, 0.0002491511404514313, 0.00027061253786087036, 0.00029207393527030945, 0.00031353533267974854, 0.0003349967300891876, 0.0003564581274986267, 0.0003779195249080658, 0.0003993809223175049, 0.00042084231972694397, 0.00044230371713638306, 0.00046376511454582214, 0.00048522651195526123, 0.0005066879093647003, 0.0005281493067741394, 0.0005496107041835785, 0.0005710721015930176, 0.0005925334990024567, 0.0006139948964118958, 0.0006354562938213348, 0.0006569176912307739, 0.000678379088640213, 0.0006998404860496521, 0.0007213018834590912, 0.0007427632808685303, 0.0007642246782779694, 0.0007856860756874084, 0.0008071474730968475, 0.0008286088705062866, 0.0008500702679157257, 0.0008715316653251648, 0.0008929930627346039, 0.000914454460144043]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 5.0, 5.0, 11.0, 10.0, 8.0, 20.0, 12.0, 21.0, 17.0, 21.0, 24.0, 29.0, 32.0, 26.0, 39.0, 43.0, 35.0, 47.0, 48.0, 54.0, 51.0, 46.0, 38.0, 45.0, 39.0, 34.0, 28.0, 28.0, 30.0, 32.0, 20.0, 17.0, 25.0, 11.0, 15.0, 11.0, 11.0, 3.0, 6.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.01953125, -5.82403564453125, -5.6285400390625, -5.43304443359375, -5.237548828125, -5.04205322265625, -4.8465576171875, -4.65106201171875, -4.45556640625, -4.26007080078125, -4.0645751953125, -3.86907958984375, -3.673583984375, -3.47808837890625, -3.2825927734375, -3.08709716796875, -2.8916015625, -2.69610595703125, -2.5006103515625, -2.30511474609375, -2.109619140625, -1.91412353515625, -1.7186279296875, -1.52313232421875, -1.32763671875, -1.13214111328125, -0.9366455078125, -0.74114990234375, -0.545654296875, -0.35015869140625, -0.1546630859375, 0.04083251953125, 0.236328125, 0.43182373046875, 0.6273193359375, 0.82281494140625, 1.018310546875, 1.21380615234375, 1.4093017578125, 1.60479736328125, 1.80029296875, 1.99578857421875, 2.1912841796875, 2.38677978515625, 2.582275390625, 2.77777099609375, 2.9732666015625, 3.16876220703125, 3.3642578125, 3.55975341796875, 3.7552490234375, 3.95074462890625, 4.146240234375, 4.34173583984375, 4.5372314453125, 4.73272705078125, 4.92822265625, 5.12371826171875, 5.3192138671875, 5.51470947265625, 5.710205078125, 5.90570068359375, 6.1011962890625, 6.29669189453125, 6.4921875]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 10.0, 11.0, 7.0, 15.0, 10.0, 25.0, 25.0, 38.0, 44.0, 70.0, 105.0, 190.0, 368.0, 802.0, 1977.0, 4806.0, 12859.0, 34891.0, 97591.0, 312379.0, 387456.0, 124891.0, 43690.0, 15955.0, 5900.0, 2381.0, 997.0, 413.0, 237.0, 134.0, 74.0, 45.0, 47.0, 22.0, 27.0, 19.0, 17.0, 9.0, 7.0, 7.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.23046875, -5.0567626953125, -4.883056640625, -4.7093505859375, -4.53564453125, -4.3619384765625, -4.188232421875, -4.0145263671875, -3.8408203125, -3.6671142578125, -3.493408203125, -3.3197021484375, -3.14599609375, -2.9722900390625, -2.798583984375, -2.6248779296875, -2.451171875, -2.2774658203125, -2.103759765625, -1.9300537109375, -1.75634765625, -1.5826416015625, -1.408935546875, -1.2352294921875, -1.0615234375, -0.8878173828125, -0.714111328125, -0.5404052734375, -0.36669921875, -0.1929931640625, -0.019287109375, 0.1544189453125, 0.328125, 0.5018310546875, 0.675537109375, 0.8492431640625, 1.02294921875, 1.1966552734375, 1.370361328125, 1.5440673828125, 1.7177734375, 1.8914794921875, 2.065185546875, 2.2388916015625, 2.41259765625, 2.5863037109375, 2.760009765625, 2.9337158203125, 3.107421875, 3.2811279296875, 3.454833984375, 3.6285400390625, 3.80224609375, 3.9759521484375, 4.149658203125, 4.3233642578125, 4.4970703125, 4.6707763671875, 4.844482421875, 5.0181884765625, 5.19189453125, 5.3656005859375, 5.539306640625, 5.7130126953125, 5.88671875]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 3.0, 5.0, 1.0, 3.0, 5.0, 4.0, 2.0, 8.0, 13.0, 9.0, 9.0, 14.0, 20.0, 29.0, 24.0, 30.0, 21.0, 41.0, 50.0, 39.0, 50.0, 66.0, 161.0, 1514.0, 388.0, 101.0, 54.0, 57.0, 45.0, 31.0, 42.0, 33.0, 34.0, 25.0, 31.0, 20.0, 13.0, 5.0, 12.0, 8.0, 8.0, 6.0, 6.0, 6.0, 6.0, 4.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.234375, -19.63720703125, -19.0400390625, -18.44287109375, -17.845703125, -17.24853515625, -16.6513671875, -16.05419921875, -15.45703125, -14.85986328125, -14.2626953125, -13.66552734375, -13.068359375, -12.47119140625, -11.8740234375, -11.27685546875, -10.6796875, -10.08251953125, -9.4853515625, -8.88818359375, -8.291015625, -7.69384765625, -7.0966796875, -6.49951171875, -5.90234375, -5.30517578125, -4.7080078125, -4.11083984375, -3.513671875, -2.91650390625, -2.3193359375, -1.72216796875, -1.125, -0.52783203125, 0.0693359375, 0.66650390625, 1.263671875, 1.86083984375, 2.4580078125, 3.05517578125, 3.65234375, 4.24951171875, 4.8466796875, 5.44384765625, 6.041015625, 6.63818359375, 7.2353515625, 7.83251953125, 8.4296875, 9.02685546875, 9.6240234375, 10.22119140625, 10.818359375, 11.41552734375, 12.0126953125, 12.60986328125, 13.20703125, 13.80419921875, 14.4013671875, 14.99853515625, 15.595703125, 16.19287109375, 16.7900390625, 17.38720703125, 17.984375]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 6.0, 5.0, 5.0, 12.0, 9.0, 9.0, 11.0, 13.0, 23.0, 17.0, 37.0, 48.0, 48.0, 70.0, 101.0, 125.0, 156.0, 250.0, 392.0, 731.0, 3775.0, 271479.0, 2851934.0, 13818.0, 1160.0, 486.0, 268.0, 171.0, 143.0, 90.0, 61.0, 54.0, 43.0, 37.0, 24.0, 22.0, 15.0, 15.0, 10.0, 6.0, 4.0, 7.0, 7.0, 3.0, 3.0, 2.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.96875, -27.0107421875, -26.052734375, -25.0947265625, -24.13671875, -23.1787109375, -22.220703125, -21.2626953125, -20.3046875, -19.3466796875, -18.388671875, -17.4306640625, -16.47265625, -15.5146484375, -14.556640625, -13.5986328125, -12.640625, -11.6826171875, -10.724609375, -9.7666015625, -8.80859375, -7.8505859375, -6.892578125, -5.9345703125, -4.9765625, -4.0185546875, -3.060546875, -2.1025390625, -1.14453125, -0.1865234375, 0.771484375, 1.7294921875, 2.6875, 3.6455078125, 4.603515625, 5.5615234375, 6.51953125, 7.4775390625, 8.435546875, 9.3935546875, 10.3515625, 11.3095703125, 12.267578125, 13.2255859375, 14.18359375, 15.1416015625, 16.099609375, 17.0576171875, 18.015625, 18.9736328125, 19.931640625, 20.8896484375, 21.84765625, 22.8056640625, 23.763671875, 24.7216796875, 25.6796875, 26.6376953125, 27.595703125, 28.5537109375, 29.51171875, 30.4697265625, 31.427734375, 32.3857421875, 33.34375]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 10.0, 77.0, 307.0, 472.0, 131.0, 17.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.286720275878906, -30.011655807495117, -27.736591339111328, -25.461528778076172, -23.186464309692383, -20.911399841308594, -18.636337280273438, -16.36127281188965, -14.08620834350586, -11.81114387512207, -9.536080360412598, -7.261016368865967, -4.985952377319336, -2.710887908935547, -0.4358243942260742, 1.8392391204833984, 4.1143035888671875, 6.389367580413818, 8.66443157196045, 10.939495086669922, 13.214559555053711, 15.4896240234375, 17.764686584472656, 20.039751052856445, 22.314815521240234, 24.589879989624023, 26.864944458007812, 29.14000701904297, 31.415071487426758, 33.69013595581055, 35.9651985168457, 38.240264892578125, 40.51533508300781, 42.79039764404297, 45.06546401977539, 47.34052658081055, 49.61559295654297, 51.890655517578125, 54.16571807861328, 56.44078063964844, 58.71584701538086, 60.990909576416016, 63.26597595214844, 65.5410385131836, 67.81610107421875, 70.09117126464844, 72.3662338256836, 74.64129638671875, 76.9163589477539, 79.19142150878906, 81.46648406982422, 83.7415542602539, 86.01661682128906, 88.29167938232422, 90.56674194335938, 92.84180450439453, 95.11686706542969, 97.39192962646484, 99.6669921875, 101.94206237792969, 104.21712493896484, 106.4921875, 108.76725006103516, 111.04231262207031, 113.3173828125]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 1.0, 3.0, 4.0, 9.0, 7.0, 7.0, 11.0, 14.0, 10.0, 21.0, 25.0, 17.0, 17.0, 32.0, 31.0, 36.0, 31.0, 35.0, 41.0, 41.0, 34.0, 44.0, 46.0, 50.0, 39.0, 32.0, 29.0, 36.0, 42.0, 37.0, 34.0, 25.0, 24.0, 26.0, 24.0, 15.0, 14.0, 7.0, 11.0, 7.0, 5.0, 5.0, 4.0, 7.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-45.03936004638672, -43.53858947753906, -42.03781509399414, -40.537044525146484, -39.03627014160156, -37.535499572753906, -36.034725189208984, -34.53395462036133, -33.033180236816406, -31.532407760620117, -30.031635284423828, -28.53086280822754, -27.03009033203125, -25.52931785583496, -24.028545379638672, -22.527774810791016, -21.027002334594727, -19.526229858398438, -18.02545738220215, -16.52468490600586, -15.02391242980957, -13.523139953613281, -12.022368431091309, -10.52159595489502, -9.02082347869873, -7.520051002502441, -6.019278526306152, -4.5185065269470215, -3.0177340507507324, -1.5169615745544434, -0.0161895751953125, 1.4845829010009766, 2.9853553771972656, 4.486127853393555, 5.986900329589844, 7.487672328948975, 8.988445281982422, 10.489217758178711, 11.989989280700684, 13.490761756896973, 14.991534233093262, 16.492305755615234, 17.993078231811523, 19.493850708007812, 20.9946231842041, 22.49539566040039, 23.99616813659668, 25.49694061279297, 26.997713088989258, 28.498485565185547, 29.999258041381836, 31.500030517578125, 33.00080108642578, 34.5015754699707, 36.00234603881836, 37.50312042236328, 39.00389099121094, 40.504661560058594, 42.005435943603516, 43.50620651245117, 45.006980895996094, 46.50775146484375, 48.00852584838867, 49.50929641723633, 51.01007080078125]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 1.0, 10.0, 17.0, 9.0, 18.0, 14.0, 16.0, 16.0, 14.0, 33.0, 30.0, 28.0, 37.0, 34.0, 39.0, 41.0, 47.0, 48.0, 42.0, 48.0, 38.0, 59.0, 47.0, 36.0, 36.0, 32.0, 29.0, 32.0, 20.0, 25.0, 19.0, 18.0, 13.0, 15.0, 9.0, 9.0, 3.0, 8.0, 8.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.8203125, -5.61834716796875, -5.4163818359375, -5.21441650390625, -5.012451171875, -4.81048583984375, -4.6085205078125, -4.40655517578125, -4.20458984375, -4.00262451171875, -3.8006591796875, -3.59869384765625, -3.396728515625, -3.19476318359375, -2.9927978515625, -2.79083251953125, -2.5888671875, -2.38690185546875, -2.1849365234375, -1.98297119140625, -1.781005859375, -1.57904052734375, -1.3770751953125, -1.17510986328125, -0.97314453125, -0.77117919921875, -0.5692138671875, -0.36724853515625, -0.165283203125, 0.03668212890625, 0.2386474609375, 0.44061279296875, 0.642578125, 0.84454345703125, 1.0465087890625, 1.24847412109375, 1.450439453125, 1.65240478515625, 1.8543701171875, 2.05633544921875, 2.25830078125, 2.46026611328125, 2.6622314453125, 2.86419677734375, 3.066162109375, 3.26812744140625, 3.4700927734375, 3.67205810546875, 3.8740234375, 4.07598876953125, 4.2779541015625, 4.47991943359375, 4.681884765625, 4.88385009765625, 5.0858154296875, 5.28778076171875, 5.48974609375, 5.69171142578125, 5.8936767578125, 6.09564208984375, 6.297607421875, 6.49957275390625, 6.7015380859375, 6.90350341796875, 7.10546875]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 9.0, 7.0, 8.0, 3.0, 10.0, 10.0, 14.0, 28.0, 16.0, 27.0, 27.0, 35.0, 45.0, 75.0, 104.0, 201.0, 447.0, 1831.0, 19235.0, 1424371.0, 2701715.0, 42228.0, 2582.0, 597.0, 191.0, 120.0, 73.0, 50.0, 48.0, 36.0, 32.0, 23.0, 16.0, 20.0, 12.0, 6.0, 6.0, 8.0, 5.0, 5.0, 5.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.859375, -20.142822265625, -19.42626953125, -18.709716796875, -17.9931640625, -17.276611328125, -16.56005859375, -15.843505859375, -15.126953125, -14.410400390625, -13.69384765625, -12.977294921875, -12.2607421875, -11.544189453125, -10.82763671875, -10.111083984375, -9.39453125, -8.677978515625, -7.96142578125, -7.244873046875, -6.5283203125, -5.811767578125, -5.09521484375, -4.378662109375, -3.662109375, -2.945556640625, -2.22900390625, -1.512451171875, -0.7958984375, -0.079345703125, 0.63720703125, 1.353759765625, 2.0703125, 2.786865234375, 3.50341796875, 4.219970703125, 4.9365234375, 5.653076171875, 6.36962890625, 7.086181640625, 7.802734375, 8.519287109375, 9.23583984375, 9.952392578125, 10.6689453125, 11.385498046875, 12.10205078125, 12.818603515625, 13.53515625, 14.251708984375, 14.96826171875, 15.684814453125, 16.4013671875, 17.117919921875, 17.83447265625, 18.551025390625, 19.267578125, 19.984130859375, 20.70068359375, 21.417236328125, 22.1337890625, 22.850341796875, 23.56689453125, 24.283447265625, 25.0]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 4.0, 8.0, 16.0, 10.0, 14.0, 17.0, 22.0, 25.0, 36.0, 37.0, 59.0, 66.0, 103.0, 112.0, 149.0, 227.0, 280.0, 308.0, 364.0, 388.0, 377.0, 327.0, 214.0, 187.0, 162.0, 120.0, 113.0, 60.0, 59.0, 38.0, 22.0, 30.0, 22.0, 23.0, 12.0, 10.0, 12.0, 9.0, 7.0, 6.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0], "bins": [-8.4921875, -8.2384033203125, -7.984619140625, -7.7308349609375, -7.47705078125, -7.2232666015625, -6.969482421875, -6.7156982421875, -6.4619140625, -6.2081298828125, -5.954345703125, -5.7005615234375, -5.44677734375, -5.1929931640625, -4.939208984375, -4.6854248046875, -4.431640625, -4.1778564453125, -3.924072265625, -3.6702880859375, -3.41650390625, -3.1627197265625, -2.908935546875, -2.6551513671875, -2.4013671875, -2.1475830078125, -1.893798828125, -1.6400146484375, -1.38623046875, -1.1324462890625, -0.878662109375, -0.6248779296875, -0.37109375, -0.1173095703125, 0.136474609375, 0.3902587890625, 0.64404296875, 0.8978271484375, 1.151611328125, 1.4053955078125, 1.6591796875, 1.9129638671875, 2.166748046875, 2.4205322265625, 2.67431640625, 2.9281005859375, 3.181884765625, 3.4356689453125, 3.689453125, 3.9432373046875, 4.197021484375, 4.4508056640625, 4.70458984375, 4.9583740234375, 5.212158203125, 5.4659423828125, 5.7197265625, 5.9735107421875, 6.227294921875, 6.4810791015625, 6.73486328125, 6.9886474609375, 7.242431640625, 7.4962158203125, 7.75]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 8.0, 3.0, 4.0, 15.0, 12.0, 4.0, 17.0, 16.0, 31.0, 33.0, 42.0, 58.0, 56.0, 87.0, 100.0, 121.0, 125.0, 191.0, 278.0, 471.0, 1283.0, 17672.0, 3308557.0, 855005.0, 7594.0, 973.0, 380.0, 245.0, 183.0, 143.0, 131.0, 92.0, 57.0, 60.0, 44.0, 44.0, 27.0, 25.0, 23.0, 15.0, 14.0, 13.0, 8.0, 8.0, 4.0, 6.0, 2.0, 2.0, 3.0, 2.0, 0.0, 3.0], "bins": [-45.28125, -43.98291015625, -42.6845703125, -41.38623046875, -40.087890625, -38.78955078125, -37.4912109375, -36.19287109375, -34.89453125, -33.59619140625, -32.2978515625, -30.99951171875, -29.701171875, -28.40283203125, -27.1044921875, -25.80615234375, -24.5078125, -23.20947265625, -21.9111328125, -20.61279296875, -19.314453125, -18.01611328125, -16.7177734375, -15.41943359375, -14.12109375, -12.82275390625, -11.5244140625, -10.22607421875, -8.927734375, -7.62939453125, -6.3310546875, -5.03271484375, -3.734375, -2.43603515625, -1.1376953125, 0.16064453125, 1.458984375, 2.75732421875, 4.0556640625, 5.35400390625, 6.65234375, 7.95068359375, 9.2490234375, 10.54736328125, 11.845703125, 13.14404296875, 14.4423828125, 15.74072265625, 17.0390625, 18.33740234375, 19.6357421875, 20.93408203125, 22.232421875, 23.53076171875, 24.8291015625, 26.12744140625, 27.42578125, 28.72412109375, 30.0224609375, 31.32080078125, 32.619140625, 33.91748046875, 35.2158203125, 36.51416015625, 37.8125]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 15.0, 165.0, 699.0, 136.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-183.70066833496094, -176.18458557128906, -168.66851806640625, -161.15243530273438, -153.63636779785156, -146.1202850341797, -138.60421752929688, -131.088134765625, -123.57205963134766, -116.05598449707031, -108.53990936279297, -101.02383422851562, -93.50775146484375, -85.99168395996094, -78.47560119628906, -70.95952606201172, -63.443450927734375, -55.92737579345703, -48.41130065917969, -40.89522171020508, -33.379146575927734, -25.86307144165039, -18.34699249267578, -10.830917358398438, -3.3148422241210938, 4.201233863830566, 11.717309951782227, 19.233386993408203, 26.749462127685547, 34.26553726196289, 41.7816162109375, 49.297691345214844, 56.813751220703125, 64.32982635498047, 71.84590148925781, 79.36198425292969, 86.8780517578125, 94.39413452148438, 101.91020965576172, 109.42628479003906, 116.9423599243164, 124.45843505859375, 131.97451782226562, 139.49058532714844, 147.0066680908203, 154.52273559570312, 162.038818359375, 169.55490112304688, 177.0709686279297, 184.58705139160156, 192.10311889648438, 199.61920166015625, 207.13526916503906, 214.65135192871094, 222.16741943359375, 229.68350219726562, 237.1995849609375, 244.71566772460938, 252.2317352294922, 259.747802734375, 267.2638854980469, 274.77996826171875, 282.2960510253906, 289.8121337890625, 297.32818603515625]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 5.0, 7.0, 5.0, 9.0, 2.0, 10.0, 11.0, 12.0, 15.0, 15.0, 21.0, 27.0, 21.0, 20.0, 29.0, 22.0, 30.0, 32.0, 29.0, 26.0, 43.0, 34.0, 34.0, 41.0, 24.0, 20.0, 41.0, 34.0, 28.0, 37.0, 39.0, 26.0, 38.0, 29.0, 30.0, 19.0, 33.0, 20.0, 16.0, 8.0, 10.0, 10.0, 7.0, 4.0, 3.0, 8.0, 8.0, 3.0, 5.0, 5.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0], "bins": [-30.58477783203125, -29.624061584472656, -28.663345336914062, -27.70262908935547, -26.741912841796875, -25.78119659423828, -24.82048225402832, -23.859766006469727, -22.899049758911133, -21.93833351135254, -20.977617263793945, -20.01690101623535, -19.05618667602539, -18.095470428466797, -17.134754180908203, -16.17403793334961, -15.213321685791016, -14.252605438232422, -13.291889190673828, -12.33117389678955, -11.370457649230957, -10.409741401672363, -9.449026107788086, -8.488309860229492, -7.527593612670898, -6.566877365112305, -5.606161594390869, -4.645445823669434, -3.68472957611084, -2.724013328552246, -1.7632975578308105, -0.802581787109375, 0.15813446044921875, 1.1188504695892334, 2.079566478729248, 3.0402824878692627, 4.000998497009277, 4.961714744567871, 5.922430515289307, 6.883146286010742, 7.843862533569336, 8.80457878112793, 9.765295028686523, 10.7260103225708, 11.686726570129395, 12.647442817687988, 13.608158111572266, 14.56887435913086, 15.529590606689453, 16.490306854248047, 17.45102310180664, 18.411739349365234, 19.372455596923828, 20.333171844482422, 21.293886184692383, 22.254602432250977, 23.21531867980957, 24.176034927368164, 25.136751174926758, 26.09746742248535, 27.058181762695312, 28.018898010253906, 28.9796142578125, 29.940330505371094, 30.901046752929688]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 0.0, 5.0, 3.0, 7.0, 6.0, 12.0, 9.0, 15.0, 15.0, 16.0, 18.0, 26.0, 22.0, 23.0, 36.0, 37.0, 35.0, 31.0, 39.0, 35.0, 63.0, 37.0, 44.0, 44.0, 34.0, 38.0, 54.0, 32.0, 31.0, 39.0, 24.0, 22.0, 31.0, 20.0, 22.0, 9.0, 15.0, 11.0, 11.0, 8.0, 10.0, 5.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-6.19140625, -6.0048828125, -5.818359375, -5.6318359375, -5.4453125, -5.2587890625, -5.072265625, -4.8857421875, -4.69921875, -4.5126953125, -4.326171875, -4.1396484375, -3.953125, -3.7666015625, -3.580078125, -3.3935546875, -3.20703125, -3.0205078125, -2.833984375, -2.6474609375, -2.4609375, -2.2744140625, -2.087890625, -1.9013671875, -1.71484375, -1.5283203125, -1.341796875, -1.1552734375, -0.96875, -0.7822265625, -0.595703125, -0.4091796875, -0.22265625, -0.0361328125, 0.150390625, 0.3369140625, 0.5234375, 0.7099609375, 0.896484375, 1.0830078125, 1.26953125, 1.4560546875, 1.642578125, 1.8291015625, 2.015625, 2.2021484375, 2.388671875, 2.5751953125, 2.76171875, 2.9482421875, 3.134765625, 3.3212890625, 3.5078125, 3.6943359375, 3.880859375, 4.0673828125, 4.25390625, 4.4404296875, 4.626953125, 4.8134765625, 5.0, 5.1865234375, 5.373046875, 5.5595703125, 5.74609375]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 12.0, 17.0, 28.0, 33.0, 52.0, 91.0, 112.0, 197.0, 277.0, 415.0, 578.0, 816.0, 1164.0, 1546.0, 2220.0, 3033.0, 4206.0, 5543.0, 7680.0, 10606.0, 14671.0, 20728.0, 28977.0, 40706.0, 58575.0, 84959.0, 119539.0, 147286.0, 138837.0, 104885.0, 73374.0, 50999.0, 35925.0, 25317.0, 18308.0, 12806.0, 9438.0, 6714.0, 4934.0, 3657.0, 2707.0, 1876.0, 1380.0, 1095.0, 748.0, 451.0, 330.0, 252.0, 162.0, 101.0, 82.0, 50.0, 32.0, 17.0, 13.0, 7.0, 3.0, 1.0], "bins": [-0.452880859375, -0.439483642578125, -0.42608642578125, -0.412689208984375, -0.3992919921875, -0.385894775390625, -0.37249755859375, -0.359100341796875, -0.345703125, -0.332305908203125, -0.31890869140625, -0.305511474609375, -0.2921142578125, -0.278717041015625, -0.26531982421875, -0.251922607421875, -0.238525390625, -0.225128173828125, -0.21173095703125, -0.198333740234375, -0.1849365234375, -0.171539306640625, -0.15814208984375, -0.144744873046875, -0.13134765625, -0.117950439453125, -0.10455322265625, -0.091156005859375, -0.0777587890625, -0.064361572265625, -0.05096435546875, -0.037567138671875, -0.024169921875, -0.010772705078125, 0.00262451171875, 0.016021728515625, 0.0294189453125, 0.042816162109375, 0.05621337890625, 0.069610595703125, 0.0830078125, 0.096405029296875, 0.10980224609375, 0.123199462890625, 0.1365966796875, 0.149993896484375, 0.16339111328125, 0.176788330078125, 0.190185546875, 0.203582763671875, 0.21697998046875, 0.230377197265625, 0.2437744140625, 0.257171630859375, 0.27056884765625, 0.283966064453125, 0.29736328125, 0.310760498046875, 0.32415771484375, 0.337554931640625, 0.3509521484375, 0.364349365234375, 0.37774658203125, 0.391143798828125, 0.404541015625]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 3.0, 4.0, 10.0, 11.0, 12.0, 15.0, 23.0, 18.0, 18.0, 33.0, 32.0, 29.0, 46.0, 22.0, 31.0, 40.0, 38.0, 47.0, 40.0, 1062.0, 49.0, 47.0, 42.0, 47.0, 43.0, 22.0, 28.0, 26.0, 19.0, 18.0, 23.0, 20.0, 29.0, 13.0, 8.0, 13.0, 13.0, 5.0, 7.0, 4.0, 4.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.94921875, -3.826812744140625, -3.70440673828125, -3.582000732421875, -3.4595947265625, -3.337188720703125, -3.21478271484375, -3.092376708984375, -2.969970703125, -2.847564697265625, -2.72515869140625, -2.602752685546875, -2.4803466796875, -2.357940673828125, -2.23553466796875, -2.113128662109375, -1.99072265625, -1.868316650390625, -1.74591064453125, -1.623504638671875, -1.5010986328125, -1.378692626953125, -1.25628662109375, -1.133880615234375, -1.011474609375, -0.889068603515625, -0.76666259765625, -0.644256591796875, -0.5218505859375, -0.399444580078125, -0.27703857421875, -0.154632568359375, -0.0322265625, 0.090179443359375, 0.21258544921875, 0.334991455078125, 0.4573974609375, 0.579803466796875, 0.70220947265625, 0.824615478515625, 0.947021484375, 1.069427490234375, 1.19183349609375, 1.314239501953125, 1.4366455078125, 1.559051513671875, 1.68145751953125, 1.803863525390625, 1.92626953125, 2.048675537109375, 2.17108154296875, 2.293487548828125, 2.4158935546875, 2.538299560546875, 2.66070556640625, 2.783111572265625, 2.905517578125, 3.027923583984375, 3.15032958984375, 3.272735595703125, 3.3951416015625, 3.517547607421875, 3.63995361328125, 3.762359619140625, 3.884765625]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 12.0, 9.0, 15.0, 30.0, 37.0, 47.0, 66.0, 125.0, 154.0, 237.0, 345.0, 564.0, 778.0, 1278.0, 2046.0, 3128.0, 4985.0, 7886.0, 12758.0, 20775.0, 34735.0, 58037.0, 98288.0, 158731.0, 1253326.0, 170192.0, 107047.0, 63765.0, 37803.0, 22928.0, 13708.0, 8548.0, 5435.0, 3291.0, 2124.0, 1283.0, 957.0, 540.0, 356.0, 255.0, 174.0, 97.0, 78.0, 52.0, 35.0, 28.0, 13.0, 7.0, 9.0, 10.0, 1.0, 4.0, 3.0, 2.0], "bins": [-0.57958984375, -0.5628318786621094, -0.5460739135742188, -0.5293159484863281, -0.5125579833984375, -0.4958000183105469, -0.47904205322265625, -0.4622840881347656, -0.445526123046875, -0.4287681579589844, -0.41201019287109375, -0.3952522277832031, -0.3784942626953125, -0.3617362976074219, -0.34497833251953125, -0.3282203674316406, -0.31146240234375, -0.2947044372558594, -0.27794647216796875, -0.2611885070800781, -0.2444305419921875, -0.22767257690429688, -0.21091461181640625, -0.19415664672851562, -0.177398681640625, -0.16064071655273438, -0.14388275146484375, -0.12712478637695312, -0.1103668212890625, -0.09360885620117188, -0.07685089111328125, -0.060092926025390625, -0.0433349609375, -0.026576995849609375, -0.00981903076171875, 0.006938934326171875, 0.0236968994140625, 0.040454864501953125, 0.05721282958984375, 0.07397079467773438, 0.090728759765625, 0.10748672485351562, 0.12424468994140625, 0.14100265502929688, 0.1577606201171875, 0.17451858520507812, 0.19127655029296875, 0.20803451538085938, 0.22479248046875, 0.24155044555664062, 0.25830841064453125, 0.2750663757324219, 0.2918243408203125, 0.3085823059082031, 0.32534027099609375, 0.3420982360839844, 0.358856201171875, 0.3756141662597656, 0.39237213134765625, 0.4091300964355469, 0.4258880615234375, 0.4426460266113281, 0.45940399169921875, 0.4761619567871094, 0.492919921875]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 4.0, 7.0, 10.0, 9.0, 7.0, 14.0, 14.0, 14.0, 21.0, 29.0, 29.0, 35.0, 44.0, 32.0, 47.0, 50.0, 39.0, 51.0, 54.0, 43.0, 54.0, 47.0, 63.0, 48.0, 26.0, 39.0, 29.0, 35.0, 24.0, 18.0, 16.0, 13.0, 13.0, 14.0, 6.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0010728836059570312, -0.0010437965393066406, -0.00101470947265625, -0.0009856224060058594, -0.0009565353393554688, -0.0009274482727050781, -0.0008983612060546875, -0.0008692741394042969, -0.0008401870727539062, -0.0008111000061035156, -0.000782012939453125, -0.0007529258728027344, -0.0007238388061523438, -0.0006947517395019531, -0.0006656646728515625, -0.0006365776062011719, -0.0006074905395507812, -0.0005784034729003906, -0.00054931640625, -0.0005202293395996094, -0.0004911422729492188, -0.0004620552062988281, -0.0004329681396484375, -0.0004038810729980469, -0.00037479400634765625, -0.0003457069396972656, -0.000316619873046875, -0.0002875328063964844, -0.00025844573974609375, -0.00022935867309570312, -0.0002002716064453125, -0.00017118453979492188, -0.00014209747314453125, -0.00011301040649414062, -8.392333984375e-05, -5.4836273193359375e-05, -2.574920654296875e-05, 3.337860107421875e-06, 3.24249267578125e-05, 6.151199340820312e-05, 9.059906005859375e-05, 0.00011968612670898438, 0.000148773193359375, 0.00017786026000976562, 0.00020694732666015625, 0.00023603439331054688, 0.0002651214599609375, 0.0002942085266113281, 0.00032329559326171875, 0.0003523826599121094, 0.0003814697265625, 0.0004105567932128906, 0.00043964385986328125, 0.0004687309265136719, 0.0004978179931640625, 0.0005269050598144531, 0.0005559921264648438, 0.0005850791931152344, 0.000614166259765625, 0.0006432533264160156, 0.0006723403930664062, 0.0007014274597167969, 0.0007305145263671875, 0.0007596015930175781, 0.0007886886596679688]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 8.0, 11.0, 6.0, 19.0, 13.0, 24.0, 36.0, 27.0, 48.0, 49.0, 63.0, 90.0, 100.0, 193.0, 322.0, 903.0, 23367.0, 1019852.0, 1913.0, 598.0, 279.0, 138.0, 98.0, 81.0, 59.0, 55.0, 52.0, 29.0, 25.0, 22.0, 20.0, 11.0, 9.0, 6.0, 7.0, 4.0, 5.0, 3.0, 4.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0179595947265625, -0.01732492446899414, -0.01669025421142578, -0.016055583953857422, -0.015420913696289062, -0.014786243438720703, -0.014151573181152344, -0.013516902923583984, -0.012882232666015625, -0.012247562408447266, -0.011612892150878906, -0.010978221893310547, -0.010343551635742188, -0.009708881378173828, -0.009074211120605469, -0.00843954086303711, -0.00780487060546875, -0.007170200347900391, -0.006535530090332031, -0.005900859832763672, -0.0052661895751953125, -0.004631519317626953, -0.003996849060058594, -0.0033621788024902344, -0.002727508544921875, -0.0020928382873535156, -0.0014581680297851562, -0.0008234977722167969, -0.0001888275146484375, 0.0004458427429199219, 0.0010805130004882812, 0.0017151832580566406, 0.002349853515625, 0.0029845237731933594, 0.0036191940307617188, 0.004253864288330078, 0.0048885345458984375, 0.005523204803466797, 0.006157875061035156, 0.006792545318603516, 0.007427215576171875, 0.008061885833740234, 0.008696556091308594, 0.009331226348876953, 0.009965896606445312, 0.010600566864013672, 0.011235237121582031, 0.01186990737915039, 0.01250457763671875, 0.01313924789428711, 0.013773918151855469, 0.014408588409423828, 0.015043258666992188, 0.015677928924560547, 0.016312599182128906, 0.016947269439697266, 0.017581939697265625, 0.018216609954833984, 0.018851280212402344, 0.019485950469970703, 0.020120620727539062, 0.020755290985107422, 0.02138996124267578, 0.02202463150024414, 0.0226593017578125]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 57.0, 693.0, 260.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006889502052217722, -0.006765866186469793, -0.006642230786383152, -0.006518594920635223, -0.006394959520548582, -0.0062713236548006535, -0.006147688254714012, -0.0060240523889660835, -0.005900416523218155, -0.005776780657470226, -0.005653145257383585, -0.005529509391635656, -0.005405873991549015, -0.005282238125801086, -0.005158602725714445, -0.0050349668599665165, -0.004911331459879875, -0.0047876955941319466, -0.004664060194045305, -0.004540424328297377, -0.004416788928210735, -0.004293153062462807, -0.004169517662376165, -0.004045881796628237, -0.0039222463965415955, -0.0037986107636243105, -0.0036749751307070255, -0.0035513394977897406, -0.0034277038648724556, -0.003304067999124527, -0.003180432366207242, -0.003056796733289957, -0.0029331608675420284, -0.0028095252346247435, -0.0026858896017074585, -0.0025622539687901735, -0.0024386183358728886, -0.00231498247012496, -0.002191346837207675, -0.00206771120429039, -0.0019440754549577832, -0.0018204398220404983, -0.0016968040727078915, -0.0015731684397906065, -0.0014495328068733215, -0.0013258971739560366, -0.0012022615410387516, -0.0010786257917061448, -0.0009549901587888598, -0.0008313545258715749, -0.000707718834746629, -0.0005840831436216831, -0.00046044751070439816, -0.0003368118777871132, -0.0002131761866621673, -8.954049553722143e-05, 3.4095137380063534e-05, 0.00015773079940117896, 0.0002813664614222944, 0.0004050021234434098, 0.0005286377854645252, 0.0006522734183818102, 0.0007759091095067561, 0.000899544800631702, 0.001023180433548987]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 9.0, 8.0, 13.0, 10.0, 17.0, 13.0, 21.0, 15.0, 16.0, 20.0, 21.0, 31.0, 30.0, 27.0, 38.0, 31.0, 38.0, 32.0, 37.0, 39.0, 35.0, 38.0, 33.0, 40.0, 51.0, 40.0, 38.0, 35.0, 20.0, 29.0, 30.0, 20.0, 16.0, 18.0, 9.0, 13.0, 17.0, 12.0, 7.0, 10.0, 4.0, 0.0, 4.0, 6.0, 2.0, 3.0, 5.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0004907846450805664, -0.0004763072356581688, -0.0004618298262357712, -0.00044735241681337357, -0.00043287500739097595, -0.00041839759796857834, -0.0004039201885461807, -0.0003894427791237831, -0.0003749653697013855, -0.0003604879602789879, -0.00034601055085659027, -0.00033153314143419266, -0.00031705573201179504, -0.00030257832258939743, -0.0002881009131669998, -0.0002736235037446022, -0.0002591460943222046, -0.000244668684899807, -0.00023019127547740936, -0.00021571386605501175, -0.00020123645663261414, -0.00018675904721021652, -0.0001722816377878189, -0.0001578042283654213, -0.00014332681894302368, -0.00012884940952062607, -0.00011437200009822845, -9.989459067583084e-05, -8.541718125343323e-05, -7.093977183103561e-05, -5.6462362408638e-05, -4.198495298624039e-05, -2.7507543563842773e-05, -1.303013414144516e-05, 1.4472752809524536e-06, 1.5924684703350067e-05, 3.040209412574768e-05, 4.4879503548145294e-05, 5.935691297054291e-05, 7.383432239294052e-05, 8.831173181533813e-05, 0.00010278914123773575, 0.00011726655066013336, 0.00013174396008253098, 0.0001462213695049286, 0.0001606987789273262, 0.00017517618834972382, 0.00018965359777212143, 0.00020413100719451904, 0.00021860841661691666, 0.00023308582603931427, 0.0002475632354617119, 0.0002620406448841095, 0.0002765180543065071, 0.0002909954637289047, 0.00030547287315130234, 0.00031995028257369995, 0.00033442769199609756, 0.0003489051014184952, 0.0003633825108408928, 0.0003778599202632904, 0.000392337329685688, 0.00040681473910808563, 0.00042129214853048325, 0.00043576955795288086]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 0.0, 5.0, 3.0, 7.0, 6.0, 12.0, 9.0, 15.0, 15.0, 16.0, 18.0, 26.0, 22.0, 23.0, 36.0, 37.0, 35.0, 31.0, 39.0, 35.0, 63.0, 37.0, 44.0, 44.0, 34.0, 38.0, 54.0, 32.0, 31.0, 39.0, 24.0, 22.0, 31.0, 20.0, 22.0, 9.0, 15.0, 11.0, 11.0, 8.0, 10.0, 5.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-6.19140625, -6.0048828125, -5.818359375, -5.6318359375, -5.4453125, -5.2587890625, -5.072265625, -4.8857421875, -4.69921875, -4.5126953125, -4.326171875, -4.1396484375, -3.953125, -3.7666015625, -3.580078125, -3.3935546875, -3.20703125, -3.0205078125, -2.833984375, -2.6474609375, -2.4609375, -2.2744140625, -2.087890625, -1.9013671875, -1.71484375, -1.5283203125, -1.341796875, -1.1552734375, -0.96875, -0.7822265625, -0.595703125, -0.4091796875, -0.22265625, -0.0361328125, 0.150390625, 0.3369140625, 0.5234375, 0.7099609375, 0.896484375, 1.0830078125, 1.26953125, 1.4560546875, 1.642578125, 1.8291015625, 2.015625, 2.2021484375, 2.388671875, 2.5751953125, 2.76171875, 2.9482421875, 3.134765625, 3.3212890625, 3.5078125, 3.6943359375, 3.880859375, 4.0673828125, 4.25390625, 4.4404296875, 4.626953125, 4.8134765625, 5.0, 5.1865234375, 5.373046875, 5.5595703125, 5.74609375]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 3.0, 2.0, 3.0, 1.0, 4.0, 7.0, 7.0, 7.0, 13.0, 10.0, 24.0, 16.0, 32.0, 44.0, 57.0, 52.0, 88.0, 134.0, 194.0, 290.0, 468.0, 1219.0, 4925.0, 31563.0, 395424.0, 562150.0, 42524.0, 6208.0, 1503.0, 558.0, 312.0, 193.0, 138.0, 97.0, 68.0, 54.0, 38.0, 29.0, 19.0, 18.0, 17.0, 16.0, 11.0, 10.0, 3.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-12.203125, -11.8341064453125, -11.465087890625, -11.0960693359375, -10.72705078125, -10.3580322265625, -9.989013671875, -9.6199951171875, -9.2509765625, -8.8819580078125, -8.512939453125, -8.1439208984375, -7.77490234375, -7.4058837890625, -7.036865234375, -6.6678466796875, -6.298828125, -5.9298095703125, -5.560791015625, -5.1917724609375, -4.82275390625, -4.4537353515625, -4.084716796875, -3.7156982421875, -3.3466796875, -2.9776611328125, -2.608642578125, -2.2396240234375, -1.87060546875, -1.5015869140625, -1.132568359375, -0.7635498046875, -0.39453125, -0.0255126953125, 0.343505859375, 0.7125244140625, 1.08154296875, 1.4505615234375, 1.819580078125, 2.1885986328125, 2.5576171875, 2.9266357421875, 3.295654296875, 3.6646728515625, 4.03369140625, 4.4027099609375, 4.771728515625, 5.1407470703125, 5.509765625, 5.8787841796875, 6.247802734375, 6.6168212890625, 6.98583984375, 7.3548583984375, 7.723876953125, 8.0928955078125, 8.4619140625, 8.8309326171875, 9.199951171875, 9.5689697265625, 9.93798828125, 10.3070068359375, 10.676025390625, 11.0450439453125, 11.4140625]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 6.0, 8.0, 7.0, 9.0, 21.0, 8.0, 24.0, 33.0, 25.0, 39.0, 40.0, 41.0, 54.0, 45.0, 87.0, 200.0, 1684.0, 220.0, 108.0, 54.0, 40.0, 38.0, 47.0, 33.0, 21.0, 27.0, 31.0, 20.0, 12.0, 14.0, 14.0, 11.0, 11.0, 4.0, 4.0, 2.0, 4.0, 2.0, 3.0, 1.0, 2.0], "bins": [-27.265625, -26.576171875, -25.88671875, -25.197265625, -24.5078125, -23.818359375, -23.12890625, -22.439453125, -21.75, -21.060546875, -20.37109375, -19.681640625, -18.9921875, -18.302734375, -17.61328125, -16.923828125, -16.234375, -15.544921875, -14.85546875, -14.166015625, -13.4765625, -12.787109375, -12.09765625, -11.408203125, -10.71875, -10.029296875, -9.33984375, -8.650390625, -7.9609375, -7.271484375, -6.58203125, -5.892578125, -5.203125, -4.513671875, -3.82421875, -3.134765625, -2.4453125, -1.755859375, -1.06640625, -0.376953125, 0.3125, 1.001953125, 1.69140625, 2.380859375, 3.0703125, 3.759765625, 4.44921875, 5.138671875, 5.828125, 6.517578125, 7.20703125, 7.896484375, 8.5859375, 9.275390625, 9.96484375, 10.654296875, 11.34375, 12.033203125, 12.72265625, 13.412109375, 14.1015625, 14.791015625, 15.48046875, 16.169921875, 16.859375]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 4.0, 1.0, 2.0, 5.0, 7.0, 9.0, 13.0, 16.0, 17.0, 21.0, 19.0, 32.0, 29.0, 43.0, 59.0, 83.0, 109.0, 230.0, 486.0, 1748.0, 91526.0, 3044371.0, 5293.0, 772.0, 272.0, 157.0, 100.0, 72.0, 53.0, 33.0, 35.0, 19.0, 23.0, 12.0, 9.0, 8.0, 9.0, 8.0, 7.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.96875, -36.4013671875, -34.833984375, -33.2666015625, -31.69921875, -30.1318359375, -28.564453125, -26.9970703125, -25.4296875, -23.8623046875, -22.294921875, -20.7275390625, -19.16015625, -17.5927734375, -16.025390625, -14.4580078125, -12.890625, -11.3232421875, -9.755859375, -8.1884765625, -6.62109375, -5.0537109375, -3.486328125, -1.9189453125, -0.3515625, 1.2158203125, 2.783203125, 4.3505859375, 5.91796875, 7.4853515625, 9.052734375, 10.6201171875, 12.1875, 13.7548828125, 15.322265625, 16.8896484375, 18.45703125, 20.0244140625, 21.591796875, 23.1591796875, 24.7265625, 26.2939453125, 27.861328125, 29.4287109375, 30.99609375, 32.5634765625, 34.130859375, 35.6982421875, 37.265625, 38.8330078125, 40.400390625, 41.9677734375, 43.53515625, 45.1025390625, 46.669921875, 48.2373046875, 49.8046875, 51.3720703125, 52.939453125, 54.5068359375, 56.07421875, 57.6416015625, 59.208984375, 60.7763671875, 62.34375]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 83.0, 885.0, 46.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-355.87091064453125, -349.2056884765625, -342.54046630859375, -335.8752746582031, -329.2100524902344, -322.5448303222656, -315.8796081542969, -309.21441650390625, -302.5491943359375, -295.88397216796875, -289.21875, -282.5535583496094, -275.8883361816406, -269.2231140136719, -262.5578918457031, -255.89268493652344, -249.2274627685547, -242.56224060058594, -235.89703369140625, -229.2318115234375, -222.5666046142578, -215.90138244628906, -209.23617553710938, -202.57095336914062, -195.90573120117188, -189.24050903320312, -182.57530212402344, -175.9100799560547, -169.244873046875, -162.57965087890625, -155.9144287109375, -149.2492218017578, -142.5840301513672, -135.91880798339844, -129.25360107421875, -122.58837890625, -115.92317199707031, -109.25794982910156, -102.59273529052734, -95.92752075195312, -89.2623062133789, -82.59709167480469, -75.93187713623047, -69.26666259765625, -62.601444244384766, -55.93622970581055, -49.27101135253906, -42.605796813964844, -35.940582275390625, -29.275367736816406, -22.610151290893555, -15.944934844970703, -9.279720306396484, -2.6145057678222656, 4.050712585449219, 10.715927124023438, 17.381141662597656, 24.046356201171875, 30.711572647094727, 37.37678909301758, 44.0420036315918, 50.707218170166016, 57.3724365234375, 64.03765106201172, 70.70286560058594]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 2.0, 3.0, 3.0, 1.0, 6.0, 2.0, 1.0, 11.0, 5.0, 8.0, 11.0, 7.0, 15.0, 23.0, 13.0, 17.0, 18.0, 14.0, 31.0, 24.0, 20.0, 37.0, 37.0, 21.0, 34.0, 40.0, 36.0, 42.0, 40.0, 40.0, 32.0, 40.0, 36.0, 45.0, 28.0, 28.0, 25.0, 26.0, 20.0, 22.0, 16.0, 13.0, 20.0, 12.0, 13.0, 15.0, 12.0, 10.0, 12.0, 6.0, 5.0, 8.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-44.057552337646484, -42.69801712036133, -41.33848190307617, -39.978946685791016, -38.61941146850586, -37.25988006591797, -35.90034484863281, -34.540809631347656, -33.1812744140625, -31.821739196777344, -30.462203979492188, -29.10266876220703, -27.743135452270508, -26.38360023498535, -25.024065017700195, -23.664531707763672, -22.304994583129883, -20.945459365844727, -19.58592414855957, -18.226390838623047, -16.86685562133789, -15.507320404052734, -14.147785186767578, -12.788250923156738, -11.428715705871582, -10.069180488586426, -8.709646224975586, -7.35011100769043, -5.990576267242432, -4.631041526794434, -3.2715063095092773, -1.9119720458984375, -0.5524368286132812, 0.8070980310440063, 2.166632890701294, 3.526167869567871, 4.885702610015869, 6.245237350463867, 7.604772567749023, 8.964306831359863, 10.32384204864502, 11.683377265930176, 13.042911529541016, 14.402446746826172, 15.761981964111328, 17.121517181396484, 18.48105239868164, 19.840585708618164, 21.20012092590332, 22.559656143188477, 23.919191360473633, 25.278724670410156, 26.638259887695312, 27.99779510498047, 29.357330322265625, 30.71686553955078, 32.07640075683594, 33.435935974121094, 34.79547119140625, 36.155006408691406, 37.51454162597656, 38.87407684326172, 40.233612060546875, 41.593143463134766, 42.95267868041992]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 0.0, 6.0, 6.0, 8.0, 7.0, 11.0, 10.0, 13.0, 16.0, 13.0, 24.0, 25.0, 28.0, 22.0, 35.0, 28.0, 33.0, 42.0, 44.0, 46.0, 43.0, 44.0, 38.0, 45.0, 40.0, 50.0, 47.0, 38.0, 28.0, 34.0, 19.0, 18.0, 34.0, 19.0, 18.0, 13.0, 15.0, 8.0, 11.0, 7.0, 8.0, 7.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.48046875, -6.28314208984375, -6.0858154296875, -5.88848876953125, -5.691162109375, -5.49383544921875, -5.2965087890625, -5.09918212890625, -4.90185546875, -4.70452880859375, -4.5072021484375, -4.30987548828125, -4.112548828125, -3.91522216796875, -3.7178955078125, -3.52056884765625, -3.3232421875, -3.12591552734375, -2.9285888671875, -2.73126220703125, -2.533935546875, -2.33660888671875, -2.1392822265625, -1.94195556640625, -1.74462890625, -1.54730224609375, -1.3499755859375, -1.15264892578125, -0.955322265625, -0.75799560546875, -0.5606689453125, -0.36334228515625, -0.166015625, 0.03131103515625, 0.2286376953125, 0.42596435546875, 0.623291015625, 0.82061767578125, 1.0179443359375, 1.21527099609375, 1.41259765625, 1.60992431640625, 1.8072509765625, 2.00457763671875, 2.201904296875, 2.39923095703125, 2.5965576171875, 2.79388427734375, 2.9912109375, 3.18853759765625, 3.3858642578125, 3.58319091796875, 3.780517578125, 3.97784423828125, 4.1751708984375, 4.37249755859375, 4.56982421875, 4.76715087890625, 4.9644775390625, 5.16180419921875, 5.359130859375, 5.55645751953125, 5.7537841796875, 5.95111083984375, 6.1484375]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 6.0, 3.0, 2.0, 3.0, 4.0, 4.0, 16.0, 10.0, 21.0, 14.0, 16.0, 25.0, 20.0, 37.0, 50.0, 70.0, 102.0, 209.0, 409.0, 1106.0, 5129.0, 48975.0, 1375969.0, 2618251.0, 131993.0, 9046.0, 1639.0, 504.0, 204.0, 116.0, 86.0, 58.0, 33.0, 31.0, 34.0, 25.0, 14.0, 8.0, 15.0, 7.0, 4.0, 9.0, 6.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-17.890625, -17.334228515625, -16.77783203125, -16.221435546875, -15.6650390625, -15.108642578125, -14.55224609375, -13.995849609375, -13.439453125, -12.883056640625, -12.32666015625, -11.770263671875, -11.2138671875, -10.657470703125, -10.10107421875, -9.544677734375, -8.98828125, -8.431884765625, -7.87548828125, -7.319091796875, -6.7626953125, -6.206298828125, -5.64990234375, -5.093505859375, -4.537109375, -3.980712890625, -3.42431640625, -2.867919921875, -2.3115234375, -1.755126953125, -1.19873046875, -0.642333984375, -0.0859375, 0.470458984375, 1.02685546875, 1.583251953125, 2.1396484375, 2.696044921875, 3.25244140625, 3.808837890625, 4.365234375, 4.921630859375, 5.47802734375, 6.034423828125, 6.5908203125, 7.147216796875, 7.70361328125, 8.260009765625, 8.81640625, 9.372802734375, 9.92919921875, 10.485595703125, 11.0419921875, 11.598388671875, 12.15478515625, 12.711181640625, 13.267578125, 13.823974609375, 14.38037109375, 14.936767578125, 15.4931640625, 16.049560546875, 16.60595703125, 17.162353515625, 17.71875]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 6.0, 2.0, 7.0, 9.0, 11.0, 22.0, 20.0, 30.0, 35.0, 58.0, 79.0, 94.0, 146.0, 161.0, 245.0, 309.0, 393.0, 468.0, 459.0, 372.0, 331.0, 244.0, 144.0, 119.0, 91.0, 63.0, 40.0, 35.0, 18.0, 16.0, 19.0, 7.0, 6.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-11.1796875, -10.849609375, -10.51953125, -10.189453125, -9.859375, -9.529296875, -9.19921875, -8.869140625, -8.5390625, -8.208984375, -7.87890625, -7.548828125, -7.21875, -6.888671875, -6.55859375, -6.228515625, -5.8984375, -5.568359375, -5.23828125, -4.908203125, -4.578125, -4.248046875, -3.91796875, -3.587890625, -3.2578125, -2.927734375, -2.59765625, -2.267578125, -1.9375, -1.607421875, -1.27734375, -0.947265625, -0.6171875, -0.287109375, 0.04296875, 0.373046875, 0.703125, 1.033203125, 1.36328125, 1.693359375, 2.0234375, 2.353515625, 2.68359375, 3.013671875, 3.34375, 3.673828125, 4.00390625, 4.333984375, 4.6640625, 4.994140625, 5.32421875, 5.654296875, 5.984375, 6.314453125, 6.64453125, 6.974609375, 7.3046875, 7.634765625, 7.96484375, 8.294921875, 8.625, 8.955078125, 9.28515625, 9.615234375, 9.9453125]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 5.0, 7.0, 9.0, 11.0, 16.0, 23.0, 37.0, 52.0, 64.0, 86.0, 128.0, 174.0, 281.0, 546.0, 1990.0, 33022.0, 3962726.0, 189184.0, 4056.0, 780.0, 365.0, 204.0, 136.0, 95.0, 74.0, 72.0, 36.0, 18.0, 21.0, 22.0, 15.0, 9.0, 5.0, 4.0, 4.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.125, -38.62060546875, -37.1162109375, -35.61181640625, -34.107421875, -32.60302734375, -31.0986328125, -29.59423828125, -28.08984375, -26.58544921875, -25.0810546875, -23.57666015625, -22.072265625, -20.56787109375, -19.0634765625, -17.55908203125, -16.0546875, -14.55029296875, -13.0458984375, -11.54150390625, -10.037109375, -8.53271484375, -7.0283203125, -5.52392578125, -4.01953125, -2.51513671875, -1.0107421875, 0.49365234375, 1.998046875, 3.50244140625, 5.0068359375, 6.51123046875, 8.015625, 9.52001953125, 11.0244140625, 12.52880859375, 14.033203125, 15.53759765625, 17.0419921875, 18.54638671875, 20.05078125, 21.55517578125, 23.0595703125, 24.56396484375, 26.068359375, 27.57275390625, 29.0771484375, 30.58154296875, 32.0859375, 33.59033203125, 35.0947265625, 36.59912109375, 38.103515625, 39.60791015625, 41.1123046875, 42.61669921875, 44.12109375, 45.62548828125, 47.1298828125, 48.63427734375, 50.138671875, 51.64306640625, 53.1474609375, 54.65185546875, 56.15625]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 16.0, 60.0, 187.0, 292.0, 296.0, 114.0, 37.0, 7.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-92.78128814697266, -89.56201934814453, -86.3427505493164, -83.12348937988281, -79.90422058105469, -76.68495178222656, -73.46568298339844, -70.24641418457031, -67.02714538574219, -63.80787658691406, -60.5886116027832, -57.36934280395508, -54.15007781982422, -50.930809020996094, -47.71154022216797, -44.492271423339844, -41.27301025390625, -38.053741455078125, -34.834476470947266, -31.61520767211914, -28.39594078063965, -25.176673889160156, -21.95740509033203, -18.73813819885254, -15.518871307373047, -12.299604415893555, -9.080336570739746, -5.8610687255859375, -2.6418018341064453, 0.5774650573730469, 3.796733856201172, 7.016000747680664, 10.235267639160156, 13.454534530639648, 16.67380142211914, 19.893070220947266, 23.112337112426758, 26.33160400390625, 29.550872802734375, 32.7701416015625, 35.98940658569336, 39.208675384521484, 42.427940368652344, 45.64720916748047, 48.866477966308594, 52.08574295043945, 55.30501174926758, 58.52427673339844, 61.74354553222656, 64.96281433105469, 68.18208312988281, 71.40135192871094, 74.62061309814453, 77.83988189697266, 81.05915069580078, 84.2784194946289, 87.4976806640625, 90.71694946289062, 93.93621826171875, 97.15548706054688, 100.37474822998047, 103.5940170288086, 106.81328582763672, 110.03255462646484, 113.25182342529297]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 3.0, 5.0, 13.0, 9.0, 10.0, 9.0, 23.0, 26.0, 17.0, 11.0, 20.0, 30.0, 34.0, 29.0, 42.0, 36.0, 46.0, 46.0, 33.0, 45.0, 35.0, 48.0, 30.0, 29.0, 44.0, 43.0, 30.0, 26.0, 23.0, 25.0, 22.0, 25.0, 20.0, 19.0, 10.0, 13.0, 10.0, 10.0, 17.0, 16.0, 5.0, 6.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-31.598857879638672, -30.598596572875977, -29.59833526611328, -28.598073959350586, -27.59781265258789, -26.597549438476562, -25.597288131713867, -24.597026824951172, -23.596765518188477, -22.59650421142578, -21.596242904663086, -20.59598159790039, -19.595718383789062, -18.595458984375, -17.595195770263672, -16.594934463500977, -15.594673156738281, -14.594411849975586, -13.59415054321289, -12.593888282775879, -11.593626976013184, -10.593365669250488, -9.593103408813477, -8.592842102050781, -7.592580795288086, -6.592319488525391, -5.592057704925537, -4.591795921325684, -3.5915346145629883, -2.591273307800293, -1.5910115242004395, -0.5907497406005859, 0.40950775146484375, 1.4097692966461182, 2.4100308418273926, 3.410292387008667, 4.410553932189941, 5.410815238952637, 6.41107702255249, 7.411338806152344, 8.411600112915039, 9.411861419677734, 10.41212272644043, 11.412384986877441, 12.412646293640137, 13.412907600402832, 14.413169860839844, 15.413431167602539, 16.413692474365234, 17.41395378112793, 18.414215087890625, 19.41447639465332, 20.414737701416016, 21.415000915527344, 22.41526222229004, 23.415523529052734, 24.41578483581543, 25.416046142578125, 26.41630744934082, 27.416568756103516, 28.416831970214844, 29.417091369628906, 30.417354583740234, 31.41761589050293, 32.417877197265625]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 5.0, 4.0, 4.0, 8.0, 9.0, 9.0, 10.0, 13.0, 17.0, 14.0, 28.0, 27.0, 20.0, 35.0, 42.0, 29.0, 35.0, 43.0, 42.0, 49.0, 46.0, 45.0, 48.0, 37.0, 36.0, 39.0, 34.0, 43.0, 34.0, 26.0, 22.0, 28.0, 19.0, 21.0, 19.0, 16.0, 11.0, 8.0, 11.0, 10.0, 4.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.04296875, -6.8377685546875, -6.632568359375, -6.4273681640625, -6.22216796875, -6.0169677734375, -5.811767578125, -5.6065673828125, -5.4013671875, -5.1961669921875, -4.990966796875, -4.7857666015625, -4.58056640625, -4.3753662109375, -4.170166015625, -3.9649658203125, -3.759765625, -3.5545654296875, -3.349365234375, -3.1441650390625, -2.93896484375, -2.7337646484375, -2.528564453125, -2.3233642578125, -2.1181640625, -1.9129638671875, -1.707763671875, -1.5025634765625, -1.29736328125, -1.0921630859375, -0.886962890625, -0.6817626953125, -0.4765625, -0.2713623046875, -0.066162109375, 0.1390380859375, 0.34423828125, 0.5494384765625, 0.754638671875, 0.9598388671875, 1.1650390625, 1.3702392578125, 1.575439453125, 1.7806396484375, 1.98583984375, 2.1910400390625, 2.396240234375, 2.6014404296875, 2.806640625, 3.0118408203125, 3.217041015625, 3.4222412109375, 3.62744140625, 3.8326416015625, 4.037841796875, 4.2430419921875, 4.4482421875, 4.6534423828125, 4.858642578125, 5.0638427734375, 5.26904296875, 5.4742431640625, 5.679443359375, 5.8846435546875, 6.08984375]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 6.0, 6.0, 6.0, 13.0, 11.0, 25.0, 27.0, 50.0, 69.0, 108.0, 151.0, 222.0, 318.0, 417.0, 674.0, 949.0, 1359.0, 2001.0, 2921.0, 4392.0, 6433.0, 9705.0, 14439.0, 22423.0, 34811.0, 55203.0, 87139.0, 133236.0, 176240.0, 166475.0, 117062.0, 75275.0, 47642.0, 30196.0, 19259.0, 12876.0, 8417.0, 5747.0, 3911.0, 2518.0, 1875.0, 1189.0, 841.0, 599.0, 389.0, 289.0, 201.0, 149.0, 98.0, 63.0, 41.0, 29.0, 29.0, 12.0, 8.0, 9.0, 5.0, 3.0, 5.0, 3.0], "bins": [-0.572265625, -0.554840087890625, -0.53741455078125, -0.519989013671875, -0.5025634765625, -0.485137939453125, -0.46771240234375, -0.450286865234375, -0.432861328125, -0.415435791015625, -0.39801025390625, -0.380584716796875, -0.3631591796875, -0.345733642578125, -0.32830810546875, -0.310882568359375, -0.29345703125, -0.276031494140625, -0.25860595703125, -0.241180419921875, -0.2237548828125, -0.206329345703125, -0.18890380859375, -0.171478271484375, -0.154052734375, -0.136627197265625, -0.11920166015625, -0.101776123046875, -0.0843505859375, -0.066925048828125, -0.04949951171875, -0.032073974609375, -0.0146484375, 0.002777099609375, 0.02020263671875, 0.037628173828125, 0.0550537109375, 0.072479248046875, 0.08990478515625, 0.107330322265625, 0.124755859375, 0.142181396484375, 0.15960693359375, 0.177032470703125, 0.1944580078125, 0.211883544921875, 0.22930908203125, 0.246734619140625, 0.26416015625, 0.281585693359375, 0.29901123046875, 0.316436767578125, 0.3338623046875, 0.351287841796875, 0.36871337890625, 0.386138916015625, 0.403564453125, 0.420989990234375, 0.43841552734375, 0.455841064453125, 0.4732666015625, 0.490692138671875, 0.50811767578125, 0.525543212890625, 0.54296875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 6.0, 3.0, 1.0, 9.0, 7.0, 10.0, 14.0, 16.0, 12.0, 21.0, 23.0, 25.0, 22.0, 29.0, 37.0, 20.0, 30.0, 27.0, 23.0, 39.0, 49.0, 37.0, 1080.0, 42.0, 41.0, 35.0, 22.0, 33.0, 29.0, 33.0, 40.0, 37.0, 29.0, 27.0, 24.0, 20.0, 9.0, 9.0, 14.0, 10.0, 10.0, 8.0, 6.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.779296875, -3.6580810546875, -3.536865234375, -3.4156494140625, -3.29443359375, -3.1732177734375, -3.052001953125, -2.9307861328125, -2.8095703125, -2.6883544921875, -2.567138671875, -2.4459228515625, -2.32470703125, -2.2034912109375, -2.082275390625, -1.9610595703125, -1.83984375, -1.7186279296875, -1.597412109375, -1.4761962890625, -1.35498046875, -1.2337646484375, -1.112548828125, -0.9913330078125, -0.8701171875, -0.7489013671875, -0.627685546875, -0.5064697265625, -0.38525390625, -0.2640380859375, -0.142822265625, -0.0216064453125, 0.099609375, 0.2208251953125, 0.342041015625, 0.4632568359375, 0.58447265625, 0.7056884765625, 0.826904296875, 0.9481201171875, 1.0693359375, 1.1905517578125, 1.311767578125, 1.4329833984375, 1.55419921875, 1.6754150390625, 1.796630859375, 1.9178466796875, 2.0390625, 2.1602783203125, 2.281494140625, 2.4027099609375, 2.52392578125, 2.6451416015625, 2.766357421875, 2.8875732421875, 3.0087890625, 3.1300048828125, 3.251220703125, 3.3724365234375, 3.49365234375, 3.6148681640625, 3.736083984375, 3.8572998046875, 3.978515625]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 3.0, 6.0, 12.0, 21.0, 27.0, 50.0, 56.0, 76.0, 163.0, 205.0, 355.0, 564.0, 853.0, 1448.0, 2268.0, 3542.0, 5965.0, 9399.0, 15617.0, 25884.0, 43767.0, 73892.0, 125072.0, 191820.0, 1251199.0, 139077.0, 83260.0, 49033.0, 28841.0, 17240.0, 10269.0, 6356.0, 4068.0, 2532.0, 1565.0, 956.0, 594.0, 385.0, 260.0, 153.0, 92.0, 61.0, 43.0, 24.0, 30.0, 11.0, 7.0, 5.0, 5.0, 1.0, 2.0, 3.0], "bins": [-0.681640625, -0.6627655029296875, -0.643890380859375, -0.6250152587890625, -0.60614013671875, -0.5872650146484375, -0.568389892578125, -0.5495147705078125, -0.5306396484375, -0.5117645263671875, -0.492889404296875, -0.4740142822265625, -0.45513916015625, -0.4362640380859375, -0.417388916015625, -0.3985137939453125, -0.379638671875, -0.3607635498046875, -0.341888427734375, -0.3230133056640625, -0.30413818359375, -0.2852630615234375, -0.266387939453125, -0.2475128173828125, -0.2286376953125, -0.2097625732421875, -0.190887451171875, -0.1720123291015625, -0.15313720703125, -0.1342620849609375, -0.115386962890625, -0.0965118408203125, -0.07763671875, -0.0587615966796875, -0.039886474609375, -0.0210113525390625, -0.00213623046875, 0.0167388916015625, 0.035614013671875, 0.0544891357421875, 0.0733642578125, 0.0922393798828125, 0.111114501953125, 0.1299896240234375, 0.14886474609375, 0.1677398681640625, 0.186614990234375, 0.2054901123046875, 0.224365234375, 0.2432403564453125, 0.262115478515625, 0.2809906005859375, 0.29986572265625, 0.3187408447265625, 0.337615966796875, 0.3564910888671875, 0.3753662109375, 0.3942413330078125, 0.413116455078125, 0.4319915771484375, 0.45086669921875, 0.4697418212890625, 0.488616943359375, 0.5074920654296875, 0.5263671875]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 6.0, 6.0, 12.0, 8.0, 11.0, 14.0, 21.0, 16.0, 22.0, 27.0, 32.0, 29.0, 34.0, 30.0, 30.0, 32.0, 42.0, 43.0, 45.0, 37.0, 49.0, 46.0, 61.0, 35.0, 32.0, 41.0, 33.0, 20.0, 27.0, 35.0, 19.0, 25.0, 12.0, 14.0, 12.0, 13.0, 5.0, 11.0, 6.0, 2.0, 4.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007462501525878906, -0.0007209628820419312, -0.0006956756114959717, -0.0006703883409500122, -0.0006451010704040527, -0.0006198137998580933, -0.0005945265293121338, -0.0005692392587661743, -0.0005439519882202148, -0.0005186647176742554, -0.0004933774471282959, -0.0004680901765823364, -0.00044280290603637695, -0.0004175156354904175, -0.000392228364944458, -0.00036694109439849854, -0.00034165382385253906, -0.0003163665533065796, -0.0002910792827606201, -0.00026579201221466064, -0.00024050474166870117, -0.0002152174711227417, -0.00018993020057678223, -0.00016464293003082275, -0.00013935565948486328, -0.00011406838893890381, -8.878111839294434e-05, -6.349384784698486e-05, -3.820657730102539e-05, -1.2919306755065918e-05, 1.2367963790893555e-05, 3.765523433685303e-05, 6.29425048828125e-05, 8.822977542877197e-05, 0.00011351704597473145, 0.00013880431652069092, 0.0001640915870666504, 0.00018937885761260986, 0.00021466612815856934, 0.0002399533987045288, 0.0002652406692504883, 0.00029052793979644775, 0.0003158152103424072, 0.0003411024808883667, 0.00036638975143432617, 0.00039167702198028564, 0.0004169642925262451, 0.0004422515630722046, 0.00046753883361816406, 0.0004928261041641235, 0.000518113374710083, 0.0005434006452560425, 0.000568687915802002, 0.0005939751863479614, 0.0006192624568939209, 0.0006445497274398804, 0.0006698369979858398, 0.0006951242685317993, 0.0007204115390777588, 0.0007456988096237183, 0.0007709860801696777, 0.0007962733507156372, 0.0008215606212615967, 0.0008468478918075562, 0.0008721351623535156]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 3.0, 3.0, 4.0, 6.0, 3.0, 4.0, 12.0, 7.0, 16.0, 23.0, 15.0, 24.0, 24.0, 37.0, 39.0, 49.0, 53.0, 84.0, 99.0, 112.0, 183.0, 390.0, 823.0, 5306.0, 1028881.0, 10290.0, 937.0, 344.0, 207.0, 114.0, 81.0, 67.0, 69.0, 51.0, 36.0, 32.0, 29.0, 21.0, 15.0, 17.0, 11.0, 15.0, 8.0, 6.0, 8.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.019073486328125, -0.01852130889892578, -0.017969131469726562, -0.017416954040527344, -0.016864776611328125, -0.016312599182128906, -0.015760421752929688, -0.015208244323730469, -0.01465606689453125, -0.014103889465332031, -0.013551712036132812, -0.012999534606933594, -0.012447357177734375, -0.011895179748535156, -0.011343002319335938, -0.010790824890136719, -0.0102386474609375, -0.009686470031738281, -0.009134292602539062, -0.008582115173339844, -0.008029937744140625, -0.007477760314941406, -0.0069255828857421875, -0.006373405456542969, -0.00582122802734375, -0.005269050598144531, -0.0047168731689453125, -0.004164695739746094, -0.003612518310546875, -0.0030603408813476562, -0.0025081634521484375, -0.0019559860229492188, -0.00140380859375, -0.0008516311645507812, -0.0002994537353515625, 0.00025272369384765625, 0.000804901123046875, 0.0013570785522460938, 0.0019092559814453125, 0.0024614334106445312, 0.00301361083984375, 0.0035657882690429688, 0.0041179656982421875, 0.004670143127441406, 0.005222320556640625, 0.005774497985839844, 0.0063266754150390625, 0.006878852844238281, 0.0074310302734375, 0.007983207702636719, 0.008535385131835938, 0.009087562561035156, 0.009639739990234375, 0.010191917419433594, 0.010744094848632812, 0.011296272277832031, 0.01184844970703125, 0.012400627136230469, 0.012952804565429688, 0.013504981994628906, 0.014057159423828125, 0.014609336853027344, 0.015161514282226562, 0.01571369171142578, 0.016265869140625]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 15.0, 449.0, 536.0, 16.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006688817869871855, -0.006555243860930204, -0.006421669386327267, -0.006288095377385616, -0.006154520902782679, -0.006020946893841028, -0.0058873724192380905, -0.00575379841029644, -0.005620223935693502, -0.005486649926751852, -0.005353075452148914, -0.005219501443207264, -0.005085926968604326, -0.004952352959662676, -0.004818778485059738, -0.004685204476118088, -0.004551630467176437, -0.004418056458234787, -0.004284481983631849, -0.004150907974690199, -0.004017333500087261, -0.003883759258314967, -0.003750185016542673, -0.0036166110076010227, -0.003483036532998085, -0.003349462291225791, -0.003215888049453497, -0.003082313807681203, -0.002948739565908909, -0.002815165324136615, -0.0026815910823643208, -0.0025480170734226704, -0.0024144425988197327, -0.0022808683570474386, -0.0021472941152751446, -0.0020137198735028505, -0.0018801456317305565, -0.0017465713899582624, -0.0016129972646012902, -0.0014794230228289962, -0.0013458487810567021, -0.001212274539284408, -0.001078700297512114, -0.0009451261139474809, -0.0008115518721751869, -0.0006779776304028928, -0.0005444034468382597, -0.00041082920506596565, -0.0002772549632936716, -0.0001436807360732928, -1.0106508852913976e-05, 0.0001234677038155496, 0.00025704194558784366, 0.0003906161873601377, 0.0005241903709247708, 0.0006577646126970649, 0.0007913388544693589, 0.000924913096241653, 0.001058487338013947, 0.0011920614633709192, 0.0013256357051432133, 0.0014592099469155073, 0.0015927841886878014, 0.0017263584304600954, 0.0018599326722323895]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 8.0, 11.0, 9.0, 9.0, 16.0, 14.0, 19.0, 17.0, 25.0, 19.0, 27.0, 31.0, 30.0, 28.0, 28.0, 32.0, 48.0, 30.0, 34.0, 44.0, 39.0, 34.0, 39.0, 28.0, 26.0, 38.0, 32.0, 40.0, 28.0, 24.0, 25.0, 30.0, 20.0, 24.0, 11.0, 13.0, 9.0, 21.0, 5.0, 4.0, 7.0, 4.0, 5.0, 1.0, 5.0, 5.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0004265904426574707, -0.00041273608803749084, -0.000398881733417511, -0.00038502737879753113, -0.00037117302417755127, -0.0003573186695575714, -0.00034346431493759155, -0.0003296099603176117, -0.00031575560569763184, -0.000301901251077652, -0.0002880468964576721, -0.00027419254183769226, -0.0002603381872177124, -0.00024648383259773254, -0.00023262947797775269, -0.00021877512335777283, -0.00020492076873779297, -0.0001910664141178131, -0.00017721205949783325, -0.0001633577048778534, -0.00014950335025787354, -0.00013564899563789368, -0.00012179464101791382, -0.00010794028639793396, -9.40859317779541e-05, -8.023157715797424e-05, -6.637722253799438e-05, -5.2522867918014526e-05, -3.866851329803467e-05, -2.481415867805481e-05, -1.0959804058074951e-05, 2.8945505619049072e-06, 1.6748905181884766e-05, 3.0603259801864624e-05, 4.445761442184448e-05, 5.831196904182434e-05, 7.21663236618042e-05, 8.602067828178406e-05, 9.987503290176392e-05, 0.00011372938752174377, 0.00012758374214172363, 0.0001414380967617035, 0.00015529245138168335, 0.0001691468060016632, 0.00018300116062164307, 0.00019685551524162292, 0.00021070986986160278, 0.00022456422448158264, 0.0002384185791015625, 0.00025227293372154236, 0.0002661272883415222, 0.0002799816429615021, 0.00029383599758148193, 0.0003076903522014618, 0.00032154470682144165, 0.0003353990614414215, 0.00034925341606140137, 0.0003631077706813812, 0.0003769621253013611, 0.00039081647992134094, 0.0004046708345413208, 0.00041852518916130066, 0.0004323795437812805, 0.0004462338984012604, 0.00046008825302124023]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 5.0, 4.0, 4.0, 8.0, 9.0, 9.0, 10.0, 13.0, 17.0, 14.0, 28.0, 27.0, 20.0, 35.0, 42.0, 29.0, 35.0, 43.0, 42.0, 49.0, 46.0, 45.0, 48.0, 37.0, 36.0, 39.0, 34.0, 43.0, 34.0, 26.0, 22.0, 28.0, 19.0, 21.0, 19.0, 16.0, 11.0, 8.0, 11.0, 10.0, 4.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.04296875, -6.8377685546875, -6.632568359375, -6.4273681640625, -6.22216796875, -6.0169677734375, -5.811767578125, -5.6065673828125, -5.4013671875, -5.1961669921875, -4.990966796875, -4.7857666015625, -4.58056640625, -4.3753662109375, -4.170166015625, -3.9649658203125, -3.759765625, -3.5545654296875, -3.349365234375, -3.1441650390625, -2.93896484375, -2.7337646484375, -2.528564453125, -2.3233642578125, -2.1181640625, -1.9129638671875, -1.707763671875, -1.5025634765625, -1.29736328125, -1.0921630859375, -0.886962890625, -0.6817626953125, -0.4765625, -0.2713623046875, -0.066162109375, 0.1390380859375, 0.34423828125, 0.5494384765625, 0.754638671875, 0.9598388671875, 1.1650390625, 1.3702392578125, 1.575439453125, 1.7806396484375, 1.98583984375, 2.1910400390625, 2.396240234375, 2.6014404296875, 2.806640625, 3.0118408203125, 3.217041015625, 3.4222412109375, 3.62744140625, 3.8326416015625, 4.037841796875, 4.2430419921875, 4.4482421875, 4.6534423828125, 4.858642578125, 5.0638427734375, 5.26904296875, 5.4742431640625, 5.679443359375, 5.8846435546875, 6.08984375]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 5.0, 6.0, 7.0, 6.0, 10.0, 12.0, 20.0, 23.0, 24.0, 31.0, 38.0, 63.0, 86.0, 99.0, 163.0, 218.0, 315.0, 405.0, 587.0, 814.0, 2052.0, 11550.0, 134593.0, 847411.0, 41186.0, 5017.0, 1299.0, 685.0, 496.0, 357.0, 251.0, 184.0, 131.0, 90.0, 80.0, 56.0, 51.0, 34.0, 32.0, 18.0, 19.0, 16.0, 3.0, 3.0, 4.0, 5.0, 0.0, 3.0, 4.0, 0.0, 1.0, 0.0, 2.0], "bins": [-17.8125, -17.29296875, -16.7734375, -16.25390625, -15.734375, -15.21484375, -14.6953125, -14.17578125, -13.65625, -13.13671875, -12.6171875, -12.09765625, -11.578125, -11.05859375, -10.5390625, -10.01953125, -9.5, -8.98046875, -8.4609375, -7.94140625, -7.421875, -6.90234375, -6.3828125, -5.86328125, -5.34375, -4.82421875, -4.3046875, -3.78515625, -3.265625, -2.74609375, -2.2265625, -1.70703125, -1.1875, -0.66796875, -0.1484375, 0.37109375, 0.890625, 1.41015625, 1.9296875, 2.44921875, 2.96875, 3.48828125, 4.0078125, 4.52734375, 5.046875, 5.56640625, 6.0859375, 6.60546875, 7.125, 7.64453125, 8.1640625, 8.68359375, 9.203125, 9.72265625, 10.2421875, 10.76171875, 11.28125, 11.80078125, 12.3203125, 12.83984375, 13.359375, 13.87890625, 14.3984375, 14.91796875, 15.4375]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 0.0, 5.0, 5.0, 6.0, 11.0, 11.0, 21.0, 14.0, 16.0, 21.0, 23.0, 35.0, 41.0, 38.0, 52.0, 64.0, 55.0, 108.0, 1775.0, 276.0, 82.0, 54.0, 59.0, 44.0, 45.0, 28.0, 37.0, 18.0, 23.0, 18.0, 15.0, 14.0, 15.0, 6.0, 4.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.1875, -20.4990234375, -19.810546875, -19.1220703125, -18.43359375, -17.7451171875, -17.056640625, -16.3681640625, -15.6796875, -14.9912109375, -14.302734375, -13.6142578125, -12.92578125, -12.2373046875, -11.548828125, -10.8603515625, -10.171875, -9.4833984375, -8.794921875, -8.1064453125, -7.41796875, -6.7294921875, -6.041015625, -5.3525390625, -4.6640625, -3.9755859375, -3.287109375, -2.5986328125, -1.91015625, -1.2216796875, -0.533203125, 0.1552734375, 0.84375, 1.5322265625, 2.220703125, 2.9091796875, 3.59765625, 4.2861328125, 4.974609375, 5.6630859375, 6.3515625, 7.0400390625, 7.728515625, 8.4169921875, 9.10546875, 9.7939453125, 10.482421875, 11.1708984375, 11.859375, 12.5478515625, 13.236328125, 13.9248046875, 14.61328125, 15.3017578125, 15.990234375, 16.6787109375, 17.3671875, 18.0556640625, 18.744140625, 19.4326171875, 20.12109375, 20.8095703125, 21.498046875, 22.1865234375, 22.875]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 4.0, 4.0, 4.0, 11.0, 11.0, 14.0, 19.0, 21.0, 19.0, 24.0, 48.0, 45.0, 60.0, 97.0, 173.0, 327.0, 1183.0, 506041.0, 2635281.0, 1349.0, 378.0, 185.0, 89.0, 79.0, 46.0, 38.0, 28.0, 30.0, 16.0, 16.0, 17.0, 10.0, 13.0, 4.0, 7.0, 6.0, 2.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-63.59375, -61.6689453125, -59.744140625, -57.8193359375, -55.89453125, -53.9697265625, -52.044921875, -50.1201171875, -48.1953125, -46.2705078125, -44.345703125, -42.4208984375, -40.49609375, -38.5712890625, -36.646484375, -34.7216796875, -32.796875, -30.8720703125, -28.947265625, -27.0224609375, -25.09765625, -23.1728515625, -21.248046875, -19.3232421875, -17.3984375, -15.4736328125, -13.548828125, -11.6240234375, -9.69921875, -7.7744140625, -5.849609375, -3.9248046875, -2.0, -0.0751953125, 1.849609375, 3.7744140625, 5.69921875, 7.6240234375, 9.548828125, 11.4736328125, 13.3984375, 15.3232421875, 17.248046875, 19.1728515625, 21.09765625, 23.0224609375, 24.947265625, 26.8720703125, 28.796875, 30.7216796875, 32.646484375, 34.5712890625, 36.49609375, 38.4208984375, 40.345703125, 42.2705078125, 44.1953125, 46.1201171875, 48.044921875, 49.9697265625, 51.89453125, 53.8193359375, 55.744140625, 57.6689453125, 59.59375]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 7.0, 13.0, 41.0, 51.0, 78.0, 124.0, 132.0, 141.0, 117.0, 116.0, 78.0, 56.0, 30.0, 15.0, 10.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.933711528778076, -4.448376655578613, -3.9630415439605713, -3.4777066707611084, -2.9923715591430664, -2.5070366859436035, -2.0217018127441406, -1.5363667011260986, -1.0510318279266357, -0.5656968355178833, -0.08036190271377563, 0.40497303009033203, 0.8903080224990845, 1.375643014907837, 1.8609778881072998, 2.346312999725342, 2.8316478729248047, 3.3169827461242676, 3.8023178577423096, 4.287652969360352, 4.7729878425598145, 5.258322715759277, 5.74365758895874, 6.228992462158203, 6.714327812194824, 7.199662685394287, 7.68499755859375, 8.170332908630371, 8.655667304992676, 9.141002655029297, 9.626337051391602, 10.111672401428223, 10.597006797790527, 11.082342147827148, 11.567676544189453, 12.053011894226074, 12.538346290588379, 13.023681640625, 13.509016036987305, 13.994351387023926, 14.479686737060547, 14.965022087097168, 15.450356483459473, 15.935691833496094, 16.4210262298584, 16.906360626220703, 17.39169692993164, 17.877031326293945, 18.36236572265625, 18.847700119018555, 19.333036422729492, 19.818370819091797, 20.3037052154541, 20.789039611816406, 21.274375915527344, 21.75971031188965, 22.245046615600586, 22.73038101196289, 23.215717315673828, 23.701051712036133, 24.186386108398438, 24.671722412109375, 25.15705680847168, 25.642391204833984, 26.12772560119629]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 3.0, 6.0, 3.0, 6.0, 11.0, 7.0, 15.0, 6.0, 10.0, 23.0, 23.0, 35.0, 29.0, 38.0, 34.0, 43.0, 49.0, 40.0, 47.0, 52.0, 56.0, 55.0, 43.0, 37.0, 35.0, 41.0, 32.0, 30.0, 28.0, 20.0, 32.0, 25.0, 13.0, 18.0, 18.0, 5.0, 10.0, 6.0, 5.0, 7.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-56.025821685791016, -54.40349578857422, -52.78116989135742, -51.158843994140625, -49.53651428222656, -47.914188385009766, -46.29186248779297, -44.66953659057617, -43.047210693359375, -41.42488479614258, -39.80255889892578, -38.18022918701172, -36.55790328979492, -34.935577392578125, -33.31325149536133, -31.69092559814453, -30.06859588623047, -28.446269989013672, -26.823942184448242, -25.201616287231445, -23.579288482666016, -21.95696258544922, -20.334636688232422, -18.712310791015625, -17.089982986450195, -15.467656135559082, -13.845329284667969, -12.223003387451172, -10.600676536560059, -8.978349685668945, -7.356023788452148, -5.733696937561035, -4.111366271972656, -2.489039659500122, -0.8667130470275879, 0.7556133270263672, 2.3779401779174805, 4.000267028808594, 5.622592926025391, 7.244919776916504, 8.867246627807617, 10.48957347869873, 12.111900329589844, 13.73422622680664, 15.356553077697754, 16.978879928588867, 18.601205825805664, 20.223533630371094, 21.84585952758789, 23.468185424804688, 25.090513229370117, 26.712839126586914, 28.335166931152344, 29.95749282836914, 31.579818725585938, 33.202144622802734, 34.82447052001953, 36.44679641723633, 38.069122314453125, 39.69145202636719, 41.313777923583984, 42.93610382080078, 44.55842971801758, 46.180755615234375, 47.80308532714844]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 3.0, 7.0, 12.0, 11.0, 13.0, 11.0, 18.0, 17.0, 33.0, 25.0, 39.0, 38.0, 33.0, 30.0, 36.0, 50.0, 36.0, 49.0, 57.0, 48.0, 50.0, 42.0, 39.0, 31.0, 32.0, 37.0, 34.0, 29.0, 23.0, 25.0, 19.0, 15.0, 16.0, 13.0, 3.0, 10.0, 6.0, 4.0, 0.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.53515625, -7.3167724609375, -7.098388671875, -6.8800048828125, -6.66162109375, -6.4432373046875, -6.224853515625, -6.0064697265625, -5.7880859375, -5.5697021484375, -5.351318359375, -5.1329345703125, -4.91455078125, -4.6961669921875, -4.477783203125, -4.2593994140625, -4.041015625, -3.8226318359375, -3.604248046875, -3.3858642578125, -3.16748046875, -2.9490966796875, -2.730712890625, -2.5123291015625, -2.2939453125, -2.0755615234375, -1.857177734375, -1.6387939453125, -1.42041015625, -1.2020263671875, -0.983642578125, -0.7652587890625, -0.546875, -0.3284912109375, -0.110107421875, 0.1082763671875, 0.32666015625, 0.5450439453125, 0.763427734375, 0.9818115234375, 1.2001953125, 1.4185791015625, 1.636962890625, 1.8553466796875, 2.07373046875, 2.2921142578125, 2.510498046875, 2.7288818359375, 2.947265625, 3.1656494140625, 3.384033203125, 3.6024169921875, 3.82080078125, 4.0391845703125, 4.257568359375, 4.4759521484375, 4.6943359375, 4.9127197265625, 5.131103515625, 5.3494873046875, 5.56787109375, 5.7862548828125, 6.004638671875, 6.2230224609375, 6.44140625]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 4.0, 3.0, 7.0, 6.0, 13.0, 12.0, 14.0, 24.0, 34.0, 39.0, 58.0, 61.0, 75.0, 108.0, 136.0, 194.0, 288.0, 532.0, 1025.0, 2370.0, 6900.0, 30609.0, 293822.0, 2299723.0, 1406027.0, 126112.0, 17491.0, 4749.0, 1719.0, 739.0, 430.0, 265.0, 172.0, 119.0, 92.0, 85.0, 59.0, 38.0, 35.0, 33.0, 16.0, 11.0, 12.0, 11.0, 6.0, 4.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-14.0, -13.586181640625, -13.17236328125, -12.758544921875, -12.3447265625, -11.930908203125, -11.51708984375, -11.103271484375, -10.689453125, -10.275634765625, -9.86181640625, -9.447998046875, -9.0341796875, -8.620361328125, -8.20654296875, -7.792724609375, -7.37890625, -6.965087890625, -6.55126953125, -6.137451171875, -5.7236328125, -5.309814453125, -4.89599609375, -4.482177734375, -4.068359375, -3.654541015625, -3.24072265625, -2.826904296875, -2.4130859375, -1.999267578125, -1.58544921875, -1.171630859375, -0.7578125, -0.343994140625, 0.06982421875, 0.483642578125, 0.8974609375, 1.311279296875, 1.72509765625, 2.138916015625, 2.552734375, 2.966552734375, 3.38037109375, 3.794189453125, 4.2080078125, 4.621826171875, 5.03564453125, 5.449462890625, 5.86328125, 6.277099609375, 6.69091796875, 7.104736328125, 7.5185546875, 7.932373046875, 8.34619140625, 8.760009765625, 9.173828125, 9.587646484375, 10.00146484375, 10.415283203125, 10.8291015625, 11.242919921875, 11.65673828125, 12.070556640625, 12.484375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 3.0, 2.0, 3.0, 2.0, 7.0, 4.0, 13.0, 14.0, 19.0, 21.0, 23.0, 25.0, 56.0, 53.0, 81.0, 98.0, 159.0, 178.0, 218.0, 317.0, 437.0, 480.0, 427.0, 379.0, 287.0, 207.0, 136.0, 108.0, 83.0, 68.0, 59.0, 36.0, 16.0, 16.0, 10.0, 10.0, 6.0, 8.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-11.171875, -10.860107421875, -10.54833984375, -10.236572265625, -9.9248046875, -9.613037109375, -9.30126953125, -8.989501953125, -8.677734375, -8.365966796875, -8.05419921875, -7.742431640625, -7.4306640625, -7.118896484375, -6.80712890625, -6.495361328125, -6.18359375, -5.871826171875, -5.56005859375, -5.248291015625, -4.9365234375, -4.624755859375, -4.31298828125, -4.001220703125, -3.689453125, -3.377685546875, -3.06591796875, -2.754150390625, -2.4423828125, -2.130615234375, -1.81884765625, -1.507080078125, -1.1953125, -0.883544921875, -0.57177734375, -0.260009765625, 0.0517578125, 0.363525390625, 0.67529296875, 0.987060546875, 1.298828125, 1.610595703125, 1.92236328125, 2.234130859375, 2.5458984375, 2.857666015625, 3.16943359375, 3.481201171875, 3.79296875, 4.104736328125, 4.41650390625, 4.728271484375, 5.0400390625, 5.351806640625, 5.66357421875, 5.975341796875, 6.287109375, 6.598876953125, 6.91064453125, 7.222412109375, 7.5341796875, 7.845947265625, 8.15771484375, 8.469482421875, 8.78125]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 12.0, 13.0, 16.0, 29.0, 43.0, 61.0, 84.0, 145.0, 293.0, 580.0, 1675.0, 15432.0, 3140506.0, 1023633.0, 9202.0, 1350.0, 503.0, 256.0, 146.0, 84.0, 67.0, 53.0, 28.0, 26.0, 11.0, 14.0, 8.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.0, -37.4345703125, -35.869140625, -34.3037109375, -32.73828125, -31.1728515625, -29.607421875, -28.0419921875, -26.4765625, -24.9111328125, -23.345703125, -21.7802734375, -20.21484375, -18.6494140625, -17.083984375, -15.5185546875, -13.953125, -12.3876953125, -10.822265625, -9.2568359375, -7.69140625, -6.1259765625, -4.560546875, -2.9951171875, -1.4296875, 0.1357421875, 1.701171875, 3.2666015625, 4.83203125, 6.3974609375, 7.962890625, 9.5283203125, 11.09375, 12.6591796875, 14.224609375, 15.7900390625, 17.35546875, 18.9208984375, 20.486328125, 22.0517578125, 23.6171875, 25.1826171875, 26.748046875, 28.3134765625, 29.87890625, 31.4443359375, 33.009765625, 34.5751953125, 36.140625, 37.7060546875, 39.271484375, 40.8369140625, 42.40234375, 43.9677734375, 45.533203125, 47.0986328125, 48.6640625, 50.2294921875, 51.794921875, 53.3603515625, 54.92578125, 56.4912109375, 58.056640625, 59.6220703125, 61.1875]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 15.0, 512.0, 478.0, 12.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-129.40203857421875, -117.6756591796875, -105.94928741455078, -94.22290802001953, -82.49653625488281, -70.77015686035156, -59.04377746582031, -47.317405700683594, -35.591026306152344, -23.86465072631836, -12.138273239135742, -0.411895751953125, 11.31447982788086, 23.040855407714844, 34.767234802246094, 46.49360656738281, 58.21998596191406, 69.94636535644531, 81.67273712158203, 93.39911651611328, 105.12548828125, 116.85186767578125, 128.5782470703125, 140.30462646484375, 152.031005859375, 163.75738525390625, 175.4837646484375, 187.21014404296875, 198.93650817871094, 210.6628875732422, 222.38926696777344, 234.11563110351562, 245.84201049804688, 257.5683898925781, 269.2947692871094, 281.0211486816406, 292.7475280761719, 304.473876953125, 316.20025634765625, 327.9266357421875, 339.65301513671875, 351.37939453125, 363.10577392578125, 374.8321533203125, 386.55853271484375, 398.284912109375, 410.01129150390625, 421.7376403808594, 433.46405029296875, 445.1904296875, 456.91680908203125, 468.6431884765625, 480.36956787109375, 492.095947265625, 503.82232666015625, 515.5487060546875, 527.2750244140625, 539.0014038085938, 550.727783203125, 562.4541625976562, 574.1805419921875, 585.9069213867188, 597.63330078125, 609.3596801757812, 621.0860595703125]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 6.0, 4.0, 2.0, 3.0, 8.0, 7.0, 12.0, 15.0, 21.0, 21.0, 24.0, 26.0, 30.0, 32.0, 24.0, 28.0, 27.0, 35.0, 26.0, 35.0, 36.0, 38.0, 37.0, 49.0, 46.0, 26.0, 33.0, 40.0, 32.0, 41.0, 35.0, 22.0, 27.0, 18.0, 24.0, 14.0, 16.0, 17.0, 10.0, 12.0, 8.0, 8.0, 4.0, 5.0, 2.0, 8.0, 1.0, 4.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-36.10009765625, -34.93724822998047, -33.77439498901367, -32.61154556274414, -31.448692321777344, -30.28584098815918, -29.122989654541016, -27.960140228271484, -26.797286987304688, -25.634435653686523, -24.47158432006836, -23.308732986450195, -22.14588165283203, -20.983030319213867, -19.820178985595703, -18.657329559326172, -17.494478225708008, -16.331626892089844, -15.16877555847168, -14.005924224853516, -12.843072891235352, -11.680221557617188, -10.51737117767334, -9.354519844055176, -8.191668510437012, -7.028817176818848, -5.865965843200684, -4.703114986419678, -3.5402636528015137, -2.3774123191833496, -1.2145614624023438, -0.05171012878417969, 1.1111412048339844, 2.2739925384521484, 3.4368436336517334, 4.599694728851318, 5.762546062469482, 6.9253973960876465, 8.088248252868652, 9.251099586486816, 10.41395092010498, 11.576802253723145, 12.739653587341309, 13.902503967285156, 15.06535530090332, 16.228206634521484, 17.39105796813965, 18.553909301757812, 19.716760635375977, 20.87961196899414, 22.042463302612305, 23.20531463623047, 24.368165969848633, 25.531017303466797, 26.693866729736328, 27.856719970703125, 29.019569396972656, 30.18242073059082, 31.345272064208984, 32.508121490478516, 33.67097473144531, 34.833824157714844, 35.99667739868164, 37.15952682495117, 38.32238006591797]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 5.0, 3.0, 6.0, 8.0, 9.0, 20.0, 18.0, 16.0, 18.0, 17.0, 24.0, 30.0, 30.0, 39.0, 49.0, 40.0, 40.0, 43.0, 42.0, 43.0, 36.0, 39.0, 49.0, 34.0, 37.0, 56.0, 32.0, 41.0, 24.0, 23.0, 33.0, 22.0, 20.0, 12.0, 14.0, 11.0, 6.0, 6.0, 3.0, 7.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.6640625, -7.4324951171875, -7.200927734375, -6.9693603515625, -6.73779296875, -6.5062255859375, -6.274658203125, -6.0430908203125, -5.8115234375, -5.5799560546875, -5.348388671875, -5.1168212890625, -4.88525390625, -4.6536865234375, -4.422119140625, -4.1905517578125, -3.958984375, -3.7274169921875, -3.495849609375, -3.2642822265625, -3.03271484375, -2.8011474609375, -2.569580078125, -2.3380126953125, -2.1064453125, -1.8748779296875, -1.643310546875, -1.4117431640625, -1.18017578125, -0.9486083984375, -0.717041015625, -0.4854736328125, -0.25390625, -0.0223388671875, 0.209228515625, 0.4407958984375, 0.67236328125, 0.9039306640625, 1.135498046875, 1.3670654296875, 1.5986328125, 1.8302001953125, 2.061767578125, 2.2933349609375, 2.52490234375, 2.7564697265625, 2.988037109375, 3.2196044921875, 3.451171875, 3.6827392578125, 3.914306640625, 4.1458740234375, 4.37744140625, 4.6090087890625, 4.840576171875, 5.0721435546875, 5.3037109375, 5.5352783203125, 5.766845703125, 5.9984130859375, 6.22998046875, 6.4615478515625, 6.693115234375, 6.9246826171875, 7.15625]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 7.0, 10.0, 19.0, 25.0, 26.0, 37.0, 52.0, 105.0, 135.0, 197.0, 295.0, 407.0, 619.0, 882.0, 1364.0, 1994.0, 2966.0, 4699.0, 7520.0, 11294.0, 17994.0, 28771.0, 47393.0, 78995.0, 133304.0, 200243.0, 193507.0, 123574.0, 73225.0, 43855.0, 27245.0, 16941.0, 10664.0, 6805.0, 4395.0, 2999.0, 2061.0, 1277.0, 912.0, 577.0, 364.0, 271.0, 170.0, 116.0, 82.0, 60.0, 35.0, 21.0, 19.0, 15.0, 7.0, 3.0, 4.0, 0.0, 2.0, 3.0, 2.0, 1.0], "bins": [-0.671875, -0.6508331298828125, -0.629791259765625, -0.6087493896484375, -0.58770751953125, -0.5666656494140625, -0.545623779296875, -0.5245819091796875, -0.5035400390625, -0.4824981689453125, -0.461456298828125, -0.4404144287109375, -0.41937255859375, -0.3983306884765625, -0.377288818359375, -0.3562469482421875, -0.335205078125, -0.3141632080078125, -0.293121337890625, -0.2720794677734375, -0.25103759765625, -0.2299957275390625, -0.208953857421875, -0.1879119873046875, -0.1668701171875, -0.1458282470703125, -0.124786376953125, -0.1037445068359375, -0.08270263671875, -0.0616607666015625, -0.040618896484375, -0.0195770263671875, 0.00146484375, 0.0225067138671875, 0.043548583984375, 0.0645904541015625, 0.08563232421875, 0.1066741943359375, 0.127716064453125, 0.1487579345703125, 0.1697998046875, 0.1908416748046875, 0.211883544921875, 0.2329254150390625, 0.25396728515625, 0.2750091552734375, 0.296051025390625, 0.3170928955078125, 0.338134765625, 0.3591766357421875, 0.380218505859375, 0.4012603759765625, 0.42230224609375, 0.4433441162109375, 0.464385986328125, 0.4854278564453125, 0.5064697265625, 0.5275115966796875, 0.548553466796875, 0.5695953369140625, 0.59063720703125, 0.6116790771484375, 0.632720947265625, 0.6537628173828125, 0.6748046875]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 6.0, 2.0, 4.0, 4.0, 6.0, 4.0, 4.0, 10.0, 14.0, 11.0, 17.0, 22.0, 35.0, 31.0, 28.0, 26.0, 32.0, 49.0, 38.0, 33.0, 36.0, 40.0, 40.0, 1068.0, 50.0, 36.0, 40.0, 31.0, 38.0, 33.0, 27.0, 32.0, 27.0, 20.0, 35.0, 23.0, 15.0, 6.0, 13.0, 12.0, 9.0, 5.0, 4.0, 4.0, 2.0, 6.0, 0.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.296875, -4.15460205078125, -4.0123291015625, -3.87005615234375, -3.727783203125, -3.58551025390625, -3.4432373046875, -3.30096435546875, -3.15869140625, -3.01641845703125, -2.8741455078125, -2.73187255859375, -2.589599609375, -2.44732666015625, -2.3050537109375, -2.16278076171875, -2.0205078125, -1.87823486328125, -1.7359619140625, -1.59368896484375, -1.451416015625, -1.30914306640625, -1.1668701171875, -1.02459716796875, -0.88232421875, -0.74005126953125, -0.5977783203125, -0.45550537109375, -0.313232421875, -0.17095947265625, -0.0286865234375, 0.11358642578125, 0.255859375, 0.39813232421875, 0.5404052734375, 0.68267822265625, 0.824951171875, 0.96722412109375, 1.1094970703125, 1.25177001953125, 1.39404296875, 1.53631591796875, 1.6785888671875, 1.82086181640625, 1.963134765625, 2.10540771484375, 2.2476806640625, 2.38995361328125, 2.5322265625, 2.67449951171875, 2.8167724609375, 2.95904541015625, 3.101318359375, 3.24359130859375, 3.3858642578125, 3.52813720703125, 3.67041015625, 3.81268310546875, 3.9549560546875, 4.09722900390625, 4.239501953125, 4.38177490234375, 4.5240478515625, 4.66632080078125, 4.80859375]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 8.0, 19.0, 16.0, 12.0, 39.0, 49.0, 88.0, 112.0, 168.0, 237.0, 353.0, 531.0, 909.0, 1341.0, 2133.0, 3189.0, 5141.0, 8188.0, 13521.0, 22660.0, 37485.0, 63404.0, 106117.0, 170390.0, 1257293.0, 159492.0, 97709.0, 58154.0, 34558.0, 20418.0, 12533.0, 7539.0, 4721.0, 2978.0, 1947.0, 1299.0, 813.0, 554.0, 346.0, 225.0, 161.0, 100.0, 67.0, 36.0, 24.0, 21.0, 10.0, 10.0, 5.0, 7.0, 6.0, 3.0, 1.0, 2.0], "bins": [-0.68115234375, -0.6613616943359375, -0.641571044921875, -0.6217803955078125, -0.60198974609375, -0.5821990966796875, -0.562408447265625, -0.5426177978515625, -0.5228271484375, -0.5030364990234375, -0.483245849609375, -0.4634552001953125, -0.44366455078125, -0.4238739013671875, -0.404083251953125, -0.3842926025390625, -0.364501953125, -0.3447113037109375, -0.324920654296875, -0.3051300048828125, -0.28533935546875, -0.2655487060546875, -0.245758056640625, -0.2259674072265625, -0.2061767578125, -0.1863861083984375, -0.166595458984375, -0.1468048095703125, -0.12701416015625, -0.1072235107421875, -0.087432861328125, -0.0676422119140625, -0.0478515625, -0.0280609130859375, -0.008270263671875, 0.0115203857421875, 0.03131103515625, 0.0511016845703125, 0.070892333984375, 0.0906829833984375, 0.1104736328125, 0.1302642822265625, 0.150054931640625, 0.1698455810546875, 0.18963623046875, 0.2094268798828125, 0.229217529296875, 0.2490081787109375, 0.268798828125, 0.2885894775390625, 0.308380126953125, 0.3281707763671875, 0.34796142578125, 0.3677520751953125, 0.387542724609375, 0.4073333740234375, 0.4271240234375, 0.4469146728515625, 0.466705322265625, 0.4864959716796875, 0.50628662109375, 0.5260772705078125, 0.545867919921875, 0.5656585693359375, 0.58544921875]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 7.0, 7.0, 11.0, 3.0, 17.0, 16.0, 25.0, 22.0, 32.0, 21.0, 34.0, 32.0, 29.0, 30.0, 46.0, 44.0, 47.0, 42.0, 49.0, 44.0, 43.0, 50.0, 30.0, 42.0, 40.0, 29.0, 28.0, 26.0, 22.0, 23.0, 19.0, 21.0, 14.0, 15.0, 11.0, 5.0, 7.0, 4.0, 3.0, 5.0, 4.0, 4.0, 0.0, 4.0], "bins": [-0.0010967254638671875, -0.0010683909058570862, -0.0010400563478469849, -0.0010117217898368835, -0.0009833872318267822, -0.0009550526738166809, -0.0009267181158065796, -0.0008983835577964783, -0.000870048999786377, -0.0008417144417762756, -0.0008133798837661743, -0.000785045325756073, -0.0007567107677459717, -0.0007283762097358704, -0.000700041651725769, -0.0006717070937156677, -0.0006433725357055664, -0.0006150379776954651, -0.0005867034196853638, -0.0005583688616752625, -0.0005300343036651611, -0.0005016997456550598, -0.0004733651876449585, -0.0004450306296348572, -0.00041669607162475586, -0.00038836151361465454, -0.0003600269556045532, -0.0003316923975944519, -0.0003033578395843506, -0.00027502328157424927, -0.00024668872356414795, -0.00021835416555404663, -0.0001900196075439453, -0.000161685049533844, -0.00013335049152374268, -0.00010501593351364136, -7.668137550354004e-05, -4.834681749343872e-05, -2.0012259483337402e-05, 8.322298526763916e-06, 3.6656856536865234e-05, 6.499141454696655e-05, 9.332597255706787e-05, 0.00012166053056716919, 0.0001499950885772705, 0.00017832964658737183, 0.00020666420459747314, 0.00023499876260757446, 0.0002633333206176758, 0.0002916678786277771, 0.0003200024366378784, 0.00034833699464797974, 0.00037667155265808105, 0.0004050061106681824, 0.0004333406686782837, 0.000461675226688385, 0.0004900097846984863, 0.0005183443427085876, 0.000546678900718689, 0.0005750134587287903, 0.0006033480167388916, 0.0006316825747489929, 0.0006600171327590942, 0.0006883516907691956, 0.0007166862487792969]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 7.0, 6.0, 4.0, 8.0, 6.0, 5.0, 9.0, 16.0, 25.0, 20.0, 28.0, 43.0, 46.0, 49.0, 52.0, 69.0, 87.0, 122.0, 205.0, 342.0, 634.0, 2062.0, 950619.0, 91590.0, 1057.0, 484.0, 277.0, 147.0, 105.0, 77.0, 63.0, 66.0, 43.0, 47.0, 33.0, 29.0, 15.0, 15.0, 16.0, 15.0, 3.0, 3.0, 12.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01543426513671875, -0.014835476875305176, -0.014236688613891602, -0.013637900352478027, -0.013039112091064453, -0.012440323829650879, -0.011841535568237305, -0.01124274730682373, -0.010643959045410156, -0.010045170783996582, -0.009446382522583008, -0.008847594261169434, -0.00824880599975586, -0.007650017738342285, -0.007051229476928711, -0.006452441215515137, -0.0058536529541015625, -0.005254864692687988, -0.004656076431274414, -0.00405728816986084, -0.0034584999084472656, -0.0028597116470336914, -0.002260923385620117, -0.001662135124206543, -0.0010633468627929688, -0.00046455860137939453, 0.0001342296600341797, 0.0007330179214477539, 0.0013318061828613281, 0.0019305944442749023, 0.0025293827056884766, 0.0031281709671020508, 0.003726959228515625, 0.004325747489929199, 0.0049245357513427734, 0.005523324012756348, 0.006122112274169922, 0.006720900535583496, 0.00731968879699707, 0.007918477058410645, 0.008517265319824219, 0.009116053581237793, 0.009714841842651367, 0.010313630104064941, 0.010912418365478516, 0.01151120662689209, 0.012109994888305664, 0.012708783149719238, 0.013307571411132812, 0.013906359672546387, 0.014505147933959961, 0.015103936195373535, 0.01570272445678711, 0.016301512718200684, 0.016900300979614258, 0.017499089241027832, 0.018097877502441406, 0.01869666576385498, 0.019295454025268555, 0.01989424228668213, 0.020493030548095703, 0.021091818809509277, 0.02169060707092285, 0.022289395332336426, 0.02288818359375]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 88.0, 731.0, 193.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004407996311783791, -0.004264035262167454, -0.004120074212551117, -0.003976112697273493, -0.003832151647657156, -0.003688190598040819, -0.0035442295484244823, -0.0034002684988081455, -0.003256307216361165, -0.0031123461667448282, -0.0029683848842978477, -0.002824423834681511, -0.002680462785065174, -0.0025365015026181936, -0.002392540453001857, -0.0022485791705548763, -0.0021046181209385395, -0.0019606570713222027, -0.0018166957888752222, -0.0016727347392588854, -0.0015287735732272267, -0.001384812407195568, -0.0012408513575792313, -0.0010968901915475726, -0.000952929025515914, -0.0008089678594842553, -0.0006650067516602576, -0.0005210456438362598, -0.0003770844778046012, -0.00023312331177294254, -8.916220394894481e-05, 5.479890387505293e-05, 0.00019876006990671158, 0.00034272120683453977, 0.00048668234376236796, 0.0006306434515863657, 0.0007746046176180243, 0.000918565783649683, 0.0010625268332660198, 0.0012064879992976785, 0.0013504491653293371, 0.0014944103313609958, 0.0016383714973926544, 0.0017823325470089912, 0.0019262937130406499, 0.0020702548790723085, 0.0022142159286886454, 0.002358177211135626, 0.0025021382607519627, 0.0026460993103682995, 0.00279006059281528, 0.0029340216424316168, 0.0030779829248785973, 0.003221943974494934, 0.003365905024111271, 0.0035098660737276077, 0.003653827356174588, 0.003797788405790925, 0.0039417496882379055, 0.004085710737854242, 0.004229671787470579, 0.004373633302748203, 0.00451759435236454, 0.004661555401980877, 0.004805516451597214]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 7.0, 2.0, 4.0, 4.0, 5.0, 6.0, 7.0, 10.0, 12.0, 22.0, 29.0, 20.0, 28.0, 30.0, 33.0, 35.0, 35.0, 31.0, 45.0, 27.0, 50.0, 42.0, 34.0, 47.0, 44.0, 37.0, 49.0, 37.0, 37.0, 34.0, 22.0, 25.0, 18.0, 20.0, 20.0, 19.0, 9.0, 17.0, 15.0, 4.0, 9.0, 7.0, 8.0, 10.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005339384078979492, -0.0005162619054317474, -0.0004985854029655457, -0.00048090890049934387, -0.0004632323980331421, -0.0004455558955669403, -0.0004278793931007385, -0.00041020289063453674, -0.00039252638816833496, -0.0003748498857021332, -0.0003571733832359314, -0.0003394968807697296, -0.00032182037830352783, -0.00030414387583732605, -0.00028646737337112427, -0.0002687908709049225, -0.0002511143684387207, -0.00023343786597251892, -0.00021576136350631714, -0.00019808486104011536, -0.00018040835857391357, -0.0001627318561077118, -0.00014505535364151, -0.00012737885117530823, -0.00010970234870910645, -9.202584624290466e-05, -7.434934377670288e-05, -5.66728413105011e-05, -3.8996338844299316e-05, -2.1319836378097534e-05, -3.643333911895752e-06, 1.403316855430603e-05, 3.170967102050781e-05, 4.9386173486709595e-05, 6.706267595291138e-05, 8.473917841911316e-05, 0.00010241568088531494, 0.00012009218335151672, 0.0001377686858177185, 0.0001554451882839203, 0.00017312169075012207, 0.00019079819321632385, 0.00020847469568252563, 0.00022615119814872742, 0.0002438277006149292, 0.000261504203081131, 0.00027918070554733276, 0.00029685720801353455, 0.00031453371047973633, 0.0003322102129459381, 0.0003498867154121399, 0.0003675632178783417, 0.00038523972034454346, 0.00040291622281074524, 0.000420592725276947, 0.0004382692277431488, 0.0004559457302093506, 0.00047362223267555237, 0.0004912987351417542, 0.0005089752376079559, 0.0005266517400741577, 0.0005443282425403595, 0.0005620047450065613, 0.0005796812474727631, 0.0005973577499389648]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 5.0, 3.0, 6.0, 8.0, 9.0, 20.0, 18.0, 16.0, 18.0, 17.0, 24.0, 30.0, 30.0, 39.0, 49.0, 40.0, 40.0, 43.0, 42.0, 43.0, 36.0, 39.0, 49.0, 34.0, 37.0, 56.0, 32.0, 41.0, 24.0, 23.0, 33.0, 22.0, 20.0, 12.0, 14.0, 11.0, 6.0, 6.0, 3.0, 7.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.6640625, -7.4324951171875, -7.200927734375, -6.9693603515625, -6.73779296875, -6.5062255859375, -6.274658203125, -6.0430908203125, -5.8115234375, -5.5799560546875, -5.348388671875, -5.1168212890625, -4.88525390625, -4.6536865234375, -4.422119140625, -4.1905517578125, -3.958984375, -3.7274169921875, -3.495849609375, -3.2642822265625, -3.03271484375, -2.8011474609375, -2.569580078125, -2.3380126953125, -2.1064453125, -1.8748779296875, -1.643310546875, -1.4117431640625, -1.18017578125, -0.9486083984375, -0.717041015625, -0.4854736328125, -0.25390625, -0.0223388671875, 0.209228515625, 0.4407958984375, 0.67236328125, 0.9039306640625, 1.135498046875, 1.3670654296875, 1.5986328125, 1.8302001953125, 2.061767578125, 2.2933349609375, 2.52490234375, 2.7564697265625, 2.988037109375, 3.2196044921875, 3.451171875, 3.6827392578125, 3.914306640625, 4.1458740234375, 4.37744140625, 4.6090087890625, 4.840576171875, 5.0721435546875, 5.3037109375, 5.5352783203125, 5.766845703125, 5.9984130859375, 6.22998046875, 6.4615478515625, 6.693115234375, 6.9246826171875, 7.15625]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 3.0, 5.0, 8.0, 11.0, 13.0, 22.0, 30.0, 43.0, 44.0, 83.0, 106.0, 138.0, 179.0, 352.0, 621.0, 1194.0, 2522.0, 6056.0, 17609.0, 64429.0, 316120.0, 494536.0, 103586.0, 25748.0, 8253.0, 3356.0, 1503.0, 739.0, 450.0, 251.0, 173.0, 109.0, 73.0, 54.0, 33.0, 34.0, 26.0, 12.0, 13.0, 8.0, 7.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.953125, -9.6529541015625, -9.352783203125, -9.0526123046875, -8.75244140625, -8.4522705078125, -8.152099609375, -7.8519287109375, -7.5517578125, -7.2515869140625, -6.951416015625, -6.6512451171875, -6.35107421875, -6.0509033203125, -5.750732421875, -5.4505615234375, -5.150390625, -4.8502197265625, -4.550048828125, -4.2498779296875, -3.94970703125, -3.6495361328125, -3.349365234375, -3.0491943359375, -2.7490234375, -2.4488525390625, -2.148681640625, -1.8485107421875, -1.54833984375, -1.2481689453125, -0.947998046875, -0.6478271484375, -0.34765625, -0.0474853515625, 0.252685546875, 0.5528564453125, 0.85302734375, 1.1531982421875, 1.453369140625, 1.7535400390625, 2.0537109375, 2.3538818359375, 2.654052734375, 2.9542236328125, 3.25439453125, 3.5545654296875, 3.854736328125, 4.1549072265625, 4.455078125, 4.7552490234375, 5.055419921875, 5.3555908203125, 5.65576171875, 5.9559326171875, 6.256103515625, 6.5562744140625, 6.8564453125, 7.1566162109375, 7.456787109375, 7.7569580078125, 8.05712890625, 8.3572998046875, 8.657470703125, 8.9576416015625, 9.2578125]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 4.0, 5.0, 7.0, 16.0, 6.0, 13.0, 19.0, 19.0, 22.0, 32.0, 46.0, 32.0, 34.0, 37.0, 61.0, 88.0, 133.0, 273.0, 1544.0, 177.0, 85.0, 68.0, 54.0, 42.0, 45.0, 33.0, 29.0, 21.0, 25.0, 16.0, 14.0, 18.0, 9.0, 5.0, 5.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.8125, -21.11328125, -20.4140625, -19.71484375, -19.015625, -18.31640625, -17.6171875, -16.91796875, -16.21875, -15.51953125, -14.8203125, -14.12109375, -13.421875, -12.72265625, -12.0234375, -11.32421875, -10.625, -9.92578125, -9.2265625, -8.52734375, -7.828125, -7.12890625, -6.4296875, -5.73046875, -5.03125, -4.33203125, -3.6328125, -2.93359375, -2.234375, -1.53515625, -0.8359375, -0.13671875, 0.5625, 1.26171875, 1.9609375, 2.66015625, 3.359375, 4.05859375, 4.7578125, 5.45703125, 6.15625, 6.85546875, 7.5546875, 8.25390625, 8.953125, 9.65234375, 10.3515625, 11.05078125, 11.75, 12.44921875, 13.1484375, 13.84765625, 14.546875, 15.24609375, 15.9453125, 16.64453125, 17.34375, 18.04296875, 18.7421875, 19.44140625, 20.140625, 20.83984375, 21.5390625, 22.23828125, 22.9375]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 4.0, 1.0, 3.0, 8.0, 12.0, 13.0, 11.0, 17.0, 19.0, 31.0, 57.0, 61.0, 84.0, 111.0, 160.0, 258.0, 350.0, 865.0, 4560.0, 80326.0, 2936071.0, 114961.0, 5567.0, 929.0, 354.0, 227.0, 179.0, 118.0, 82.0, 76.0, 50.0, 30.0, 22.0, 26.0, 15.0, 10.0, 11.0, 8.0, 7.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 3.0], "bins": [-31.90625, -31.033203125, -30.16015625, -29.287109375, -28.4140625, -27.541015625, -26.66796875, -25.794921875, -24.921875, -24.048828125, -23.17578125, -22.302734375, -21.4296875, -20.556640625, -19.68359375, -18.810546875, -17.9375, -17.064453125, -16.19140625, -15.318359375, -14.4453125, -13.572265625, -12.69921875, -11.826171875, -10.953125, -10.080078125, -9.20703125, -8.333984375, -7.4609375, -6.587890625, -5.71484375, -4.841796875, -3.96875, -3.095703125, -2.22265625, -1.349609375, -0.4765625, 0.396484375, 1.26953125, 2.142578125, 3.015625, 3.888671875, 4.76171875, 5.634765625, 6.5078125, 7.380859375, 8.25390625, 9.126953125, 10.0, 10.873046875, 11.74609375, 12.619140625, 13.4921875, 14.365234375, 15.23828125, 16.111328125, 16.984375, 17.857421875, 18.73046875, 19.603515625, 20.4765625, 21.349609375, 22.22265625, 23.095703125, 23.96875]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 6.0, 72.0, 585.0, 338.0, 18.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-157.70968627929688, -153.94027709960938, -150.17088317871094, -146.40147399902344, -142.63206481933594, -138.8626708984375, -135.09326171875, -131.3238525390625, -127.55445861816406, -123.7850570678711, -120.0156478881836, -116.24624633789062, -112.47684478759766, -108.70744323730469, -104.93803405761719, -101.16863250732422, -97.39922332763672, -93.62982177734375, -89.86041259765625, -86.09101104736328, -82.32160949707031, -78.55220031738281, -74.78279876708984, -71.01339721679688, -67.24398803710938, -63.47458267211914, -59.70518112182617, -55.93577575683594, -52.16637420654297, -48.396968841552734, -44.6275634765625, -40.85816192626953, -37.088768005371094, -33.31936264038086, -29.54996109008789, -25.780555725097656, -22.011152267456055, -18.241748809814453, -14.472343444824219, -10.702939987182617, -6.933536529541016, -3.164132595062256, 0.6052713394165039, 4.374675750732422, 8.144079208374023, 11.913482666015625, 15.68288803100586, 19.45229148864746, 23.221694946289062, 26.991098403930664, 30.760501861572266, 34.5299072265625, 38.29930877685547, 42.0687141418457, 45.83811950683594, 49.607521057128906, 53.37692642211914, 57.146331787109375, 60.915733337402344, 64.68513488769531, 68.45454406738281, 72.22394561767578, 75.99334716796875, 79.76275634765625, 83.53215789794922]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 2.0, 9.0, 8.0, 12.0, 8.0, 17.0, 13.0, 13.0, 21.0, 17.0, 32.0, 23.0, 23.0, 39.0, 40.0, 33.0, 37.0, 43.0, 40.0, 40.0, 43.0, 48.0, 43.0, 48.0, 38.0, 50.0, 30.0, 27.0, 24.0, 27.0, 24.0, 24.0, 18.0, 16.0, 8.0, 15.0, 15.0, 11.0, 6.0, 4.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-49.8905029296875, -48.491939544677734, -47.0933723449707, -45.69480895996094, -44.296241760253906, -42.89767837524414, -41.499114990234375, -40.100547790527344, -38.70198059082031, -37.30341720581055, -35.904850006103516, -34.50628662109375, -33.10771942138672, -31.709156036376953, -30.310590744018555, -28.912025451660156, -27.51346206665039, -26.114896774291992, -24.716331481933594, -23.317768096923828, -21.919200897216797, -20.52063751220703, -19.122072219848633, -17.723506927490234, -16.324941635131836, -14.926376342773438, -13.527811050415039, -12.129246711730957, -10.730681419372559, -9.33211612701416, -7.933551788330078, -6.53498649597168, -5.136421203613281, -3.737856149673462, -2.3392910957336426, -0.9407262802124023, 0.4578390121459961, 1.8564043045043945, 3.2549686431884766, 4.653533935546875, 6.052099227905273, 7.450664520263672, 8.84922981262207, 10.247794151306152, 11.64635944366455, 13.04492473602295, 14.443489074707031, 15.84205436706543, 17.240619659423828, 18.639184951782227, 20.037750244140625, 21.43631362915039, 22.834880828857422, 24.233444213867188, 25.632009506225586, 27.030574798583984, 28.429140090942383, 29.82770538330078, 31.22627067565918, 32.62483596801758, 34.023399353027344, 35.421966552734375, 36.82052993774414, 38.219093322753906, 39.61766052246094]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 4.0, 4.0, 7.0, 12.0, 15.0, 22.0, 22.0, 22.0, 19.0, 23.0, 18.0, 42.0, 43.0, 46.0, 37.0, 28.0, 44.0, 41.0, 50.0, 38.0, 31.0, 57.0, 50.0, 48.0, 39.0, 40.0, 32.0, 34.0, 33.0, 19.0, 15.0, 14.0, 19.0, 10.0, 4.0, 9.0, 1.0, 5.0, 4.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.91796875, -7.67626953125, -7.4345703125, -7.19287109375, -6.951171875, -6.70947265625, -6.4677734375, -6.22607421875, -5.984375, -5.74267578125, -5.5009765625, -5.25927734375, -5.017578125, -4.77587890625, -4.5341796875, -4.29248046875, -4.05078125, -3.80908203125, -3.5673828125, -3.32568359375, -3.083984375, -2.84228515625, -2.6005859375, -2.35888671875, -2.1171875, -1.87548828125, -1.6337890625, -1.39208984375, -1.150390625, -0.90869140625, -0.6669921875, -0.42529296875, -0.18359375, 0.05810546875, 0.2998046875, 0.54150390625, 0.783203125, 1.02490234375, 1.2666015625, 1.50830078125, 1.75, 1.99169921875, 2.2333984375, 2.47509765625, 2.716796875, 2.95849609375, 3.2001953125, 3.44189453125, 3.68359375, 3.92529296875, 4.1669921875, 4.40869140625, 4.650390625, 4.89208984375, 5.1337890625, 5.37548828125, 5.6171875, 5.85888671875, 6.1005859375, 6.34228515625, 6.583984375, 6.82568359375, 7.0673828125, 7.30908203125, 7.55078125]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 3.0, 6.0, 5.0, 10.0, 6.0, 16.0, 18.0, 12.0, 24.0, 25.0, 19.0, 39.0, 42.0, 77.0, 145.0, 293.0, 866.0, 2906.0, 12999.0, 111628.0, 2105783.0, 1849469.0, 94260.0, 11640.0, 2549.0, 757.0, 271.0, 115.0, 60.0, 43.0, 40.0, 25.0, 28.0, 14.0, 20.0, 13.0, 9.0, 6.0, 8.0, 12.0, 6.0, 3.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.28125, -17.69091796875, -17.1005859375, -16.51025390625, -15.919921875, -15.32958984375, -14.7392578125, -14.14892578125, -13.55859375, -12.96826171875, -12.3779296875, -11.78759765625, -11.197265625, -10.60693359375, -10.0166015625, -9.42626953125, -8.8359375, -8.24560546875, -7.6552734375, -7.06494140625, -6.474609375, -5.88427734375, -5.2939453125, -4.70361328125, -4.11328125, -3.52294921875, -2.9326171875, -2.34228515625, -1.751953125, -1.16162109375, -0.5712890625, 0.01904296875, 0.609375, 1.19970703125, 1.7900390625, 2.38037109375, 2.970703125, 3.56103515625, 4.1513671875, 4.74169921875, 5.33203125, 5.92236328125, 6.5126953125, 7.10302734375, 7.693359375, 8.28369140625, 8.8740234375, 9.46435546875, 10.0546875, 10.64501953125, 11.2353515625, 11.82568359375, 12.416015625, 13.00634765625, 13.5966796875, 14.18701171875, 14.77734375, 15.36767578125, 15.9580078125, 16.54833984375, 17.138671875, 17.72900390625, 18.3193359375, 18.90966796875, 19.5]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 4.0, 5.0, 4.0, 12.0, 12.0, 17.0, 23.0, 27.0, 37.0, 79.0, 100.0, 167.0, 266.0, 393.0, 600.0, 656.0, 527.0, 373.0, 224.0, 157.0, 127.0, 67.0, 55.0, 33.0, 30.0, 20.0, 18.0, 4.0, 10.0, 7.0, 5.0, 7.0, 6.0, 5.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.0078125, -13.5885009765625, -13.169189453125, -12.7498779296875, -12.33056640625, -11.9112548828125, -11.491943359375, -11.0726318359375, -10.6533203125, -10.2340087890625, -9.814697265625, -9.3953857421875, -8.97607421875, -8.5567626953125, -8.137451171875, -7.7181396484375, -7.298828125, -6.8795166015625, -6.460205078125, -6.0408935546875, -5.62158203125, -5.2022705078125, -4.782958984375, -4.3636474609375, -3.9443359375, -3.5250244140625, -3.105712890625, -2.6864013671875, -2.26708984375, -1.8477783203125, -1.428466796875, -1.0091552734375, -0.58984375, -0.1705322265625, 0.248779296875, 0.6680908203125, 1.08740234375, 1.5067138671875, 1.926025390625, 2.3453369140625, 2.7646484375, 3.1839599609375, 3.603271484375, 4.0225830078125, 4.44189453125, 4.8612060546875, 5.280517578125, 5.6998291015625, 6.119140625, 6.5384521484375, 6.957763671875, 7.3770751953125, 7.79638671875, 8.2156982421875, 8.635009765625, 9.0543212890625, 9.4736328125, 9.8929443359375, 10.312255859375, 10.7315673828125, 11.15087890625, 11.5701904296875, 11.989501953125, 12.4088134765625, 12.828125]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 7.0, 8.0, 7.0, 12.0, 24.0, 21.0, 33.0, 42.0, 58.0, 85.0, 136.0, 247.0, 405.0, 918.0, 2215.0, 7172.0, 33685.0, 310369.0, 3374457.0, 410631.0, 40740.0, 8456.0, 2538.0, 962.0, 452.0, 234.0, 132.0, 84.0, 41.0, 34.0, 23.0, 20.0, 6.0, 2.0, 6.0, 6.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-25.296875, -24.585205078125, -23.87353515625, -23.161865234375, -22.4501953125, -21.738525390625, -21.02685546875, -20.315185546875, -19.603515625, -18.891845703125, -18.18017578125, -17.468505859375, -16.7568359375, -16.045166015625, -15.33349609375, -14.621826171875, -13.91015625, -13.198486328125, -12.48681640625, -11.775146484375, -11.0634765625, -10.351806640625, -9.64013671875, -8.928466796875, -8.216796875, -7.505126953125, -6.79345703125, -6.081787109375, -5.3701171875, -4.658447265625, -3.94677734375, -3.235107421875, -2.5234375, -1.811767578125, -1.10009765625, -0.388427734375, 0.3232421875, 1.034912109375, 1.74658203125, 2.458251953125, 3.169921875, 3.881591796875, 4.59326171875, 5.304931640625, 6.0166015625, 6.728271484375, 7.43994140625, 8.151611328125, 8.86328125, 9.574951171875, 10.28662109375, 10.998291015625, 11.7099609375, 12.421630859375, 13.13330078125, 13.844970703125, 14.556640625, 15.268310546875, 15.97998046875, 16.691650390625, 17.4033203125, 18.114990234375, 18.82666015625, 19.538330078125, 20.25]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 16.0, 91.0, 294.0, 367.0, 189.0, 40.0, 11.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-88.59024047851562, -84.20030975341797, -79.81037902832031, -75.42044830322266, -71.030517578125, -66.64057922363281, -62.250648498535156, -57.8607177734375, -53.470787048339844, -49.08085632324219, -44.69092559814453, -40.30099105834961, -35.91106033325195, -31.521129608154297, -27.131196975708008, -22.74126434326172, -18.351333618164062, -13.96140193939209, -9.571470260620117, -5.1815385818481445, -0.7916069030761719, 3.5983238220214844, 7.988256454467773, 12.378189086914062, 16.76811981201172, 21.158050537109375, 25.547983169555664, 29.937915802001953, 34.32784652709961, 38.717777252197266, 43.10771179199219, 47.497642517089844, 51.88758850097656, 56.27751922607422, 60.667449951171875, 65.05738067626953, 69.44731140136719, 73.83724975585938, 78.22718048095703, 82.61711120605469, 87.00704193115234, 91.39697265625, 95.78690338134766, 100.17683410644531, 104.5667724609375, 108.95669555664062, 113.34663391113281, 117.73656463623047, 122.12649536132812, 126.51642608642578, 130.90635681152344, 135.29629516601562, 139.68621826171875, 144.07615661621094, 148.46607971191406, 152.85601806640625, 157.24594116210938, 161.63587951660156, 166.0258026123047, 170.41574096679688, 174.8056640625, 179.1956024169922, 183.5855255126953, 187.9754638671875, 192.3654022216797]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 6.0, 10.0, 4.0, 9.0, 7.0, 15.0, 13.0, 16.0, 18.0, 15.0, 18.0, 23.0, 26.0, 34.0, 30.0, 38.0, 31.0, 43.0, 37.0, 46.0, 40.0, 35.0, 41.0, 52.0, 50.0, 28.0, 39.0, 34.0, 32.0, 24.0, 30.0, 25.0, 21.0, 18.0, 12.0, 10.0, 19.0, 9.0, 11.0, 8.0, 4.0, 2.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-35.079254150390625, -33.92224884033203, -32.76523971557617, -31.608232498168945, -30.45122528076172, -29.294219970703125, -28.1372127532959, -26.980205535888672, -25.823198318481445, -24.66619110107422, -23.509183883666992, -22.352176666259766, -21.195171356201172, -20.038162231445312, -18.88115692138672, -17.724149703979492, -16.567142486572266, -15.410135269165039, -14.253128051757812, -13.096121788024902, -11.939114570617676, -10.78210735321045, -9.625101089477539, -8.468093872070312, -7.311086654663086, -6.154079437255859, -4.997072696685791, -3.8400657176971436, -2.683058738708496, -1.5260515213012695, -0.36904478073120117, 0.7879619598388672, 1.9449691772460938, 3.101976156234741, 4.258983135223389, 5.415989875793457, 6.572997093200684, 7.73000431060791, 8.88701057434082, 10.044017791748047, 11.201025009155273, 12.3580322265625, 13.515039443969727, 14.672045707702637, 15.829052925109863, 16.986061096191406, 18.14306640625, 19.300073623657227, 20.457080841064453, 21.61408805847168, 22.771095275878906, 23.928102493286133, 25.08510971069336, 26.242115020751953, 27.39912223815918, 28.556129455566406, 29.713136672973633, 30.87014389038086, 32.02714920043945, 33.18415832519531, 34.341163635253906, 35.498172760009766, 36.65517807006836, 37.81218719482422, 38.96919250488281]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 9.0, 2.0, 7.0, 3.0, 14.0, 12.0, 16.0, 11.0, 15.0, 24.0, 24.0, 34.0, 40.0, 33.0, 32.0, 49.0, 39.0, 44.0, 49.0, 45.0, 39.0, 45.0, 32.0, 54.0, 32.0, 26.0, 45.0, 46.0, 30.0, 28.0, 26.0, 25.0, 20.0, 10.0, 6.0, 6.0, 9.0, 9.0, 3.0, 2.0, 6.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.8046875, -7.5531005859375, -7.301513671875, -7.0499267578125, -6.79833984375, -6.5467529296875, -6.295166015625, -6.0435791015625, -5.7919921875, -5.5404052734375, -5.288818359375, -5.0372314453125, -4.78564453125, -4.5340576171875, -4.282470703125, -4.0308837890625, -3.779296875, -3.5277099609375, -3.276123046875, -3.0245361328125, -2.77294921875, -2.5213623046875, -2.269775390625, -2.0181884765625, -1.7666015625, -1.5150146484375, -1.263427734375, -1.0118408203125, -0.76025390625, -0.5086669921875, -0.257080078125, -0.0054931640625, 0.24609375, 0.4976806640625, 0.749267578125, 1.0008544921875, 1.25244140625, 1.5040283203125, 1.755615234375, 2.0072021484375, 2.2587890625, 2.5103759765625, 2.761962890625, 3.0135498046875, 3.26513671875, 3.5167236328125, 3.768310546875, 4.0198974609375, 4.271484375, 4.5230712890625, 4.774658203125, 5.0262451171875, 5.27783203125, 5.5294189453125, 5.781005859375, 6.0325927734375, 6.2841796875, 6.5357666015625, 6.787353515625, 7.0389404296875, 7.29052734375, 7.5421142578125, 7.793701171875, 8.0452880859375, 8.296875]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 9.0, 10.0, 18.0, 18.0, 31.0, 53.0, 87.0, 102.0, 192.0, 254.0, 412.0, 627.0, 931.0, 1484.0, 2405.0, 3830.0, 5969.0, 9411.0, 15562.0, 25661.0, 43924.0, 76041.0, 130836.0, 199645.0, 202822.0, 134601.0, 78547.0, 45539.0, 26874.0, 15972.0, 9816.0, 6091.0, 3954.0, 2441.0, 1571.0, 995.0, 613.0, 391.0, 280.0, 167.0, 118.0, 84.0, 54.0, 34.0, 36.0, 17.0, 7.0, 8.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0], "bins": [-0.8056640625, -0.7819900512695312, -0.7583160400390625, -0.7346420288085938, -0.710968017578125, -0.6872940063476562, -0.6636199951171875, -0.6399459838867188, -0.61627197265625, -0.5925979614257812, -0.5689239501953125, -0.5452499389648438, -0.521575927734375, -0.49790191650390625, -0.4742279052734375, -0.45055389404296875, -0.4268798828125, -0.40320587158203125, -0.3795318603515625, -0.35585784912109375, -0.332183837890625, -0.30850982666015625, -0.2848358154296875, -0.26116180419921875, -0.23748779296875, -0.21381378173828125, -0.1901397705078125, -0.16646575927734375, -0.142791748046875, -0.11911773681640625, -0.0954437255859375, -0.07176971435546875, -0.048095703125, -0.02442169189453125, -0.0007476806640625, 0.02292633056640625, 0.046600341796875, 0.07027435302734375, 0.0939483642578125, 0.11762237548828125, 0.14129638671875, 0.16497039794921875, 0.1886444091796875, 0.21231842041015625, 0.235992431640625, 0.25966644287109375, 0.2833404541015625, 0.30701446533203125, 0.3306884765625, 0.35436248779296875, 0.3780364990234375, 0.40171051025390625, 0.425384521484375, 0.44905853271484375, 0.4727325439453125, 0.49640655517578125, 0.52008056640625, 0.5437545776367188, 0.5674285888671875, 0.5911026000976562, 0.614776611328125, 0.6384506225585938, 0.6621246337890625, 0.6857986450195312, 0.70947265625]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 4.0, 8.0, 7.0, 8.0, 9.0, 18.0, 25.0, 21.0, 33.0, 30.0, 37.0, 38.0, 39.0, 38.0, 42.0, 74.0, 41.0, 1068.0, 54.0, 53.0, 28.0, 50.0, 45.0, 35.0, 48.0, 28.0, 27.0, 24.0, 20.0, 11.0, 16.0, 11.0, 8.0, 11.0, 5.0, 3.0, 6.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.31640625, -5.1357421875, -4.955078125, -4.7744140625, -4.59375, -4.4130859375, -4.232421875, -4.0517578125, -3.87109375, -3.6904296875, -3.509765625, -3.3291015625, -3.1484375, -2.9677734375, -2.787109375, -2.6064453125, -2.42578125, -2.2451171875, -2.064453125, -1.8837890625, -1.703125, -1.5224609375, -1.341796875, -1.1611328125, -0.98046875, -0.7998046875, -0.619140625, -0.4384765625, -0.2578125, -0.0771484375, 0.103515625, 0.2841796875, 0.46484375, 0.6455078125, 0.826171875, 1.0068359375, 1.1875, 1.3681640625, 1.548828125, 1.7294921875, 1.91015625, 2.0908203125, 2.271484375, 2.4521484375, 2.6328125, 2.8134765625, 2.994140625, 3.1748046875, 3.35546875, 3.5361328125, 3.716796875, 3.8974609375, 4.078125, 4.2587890625, 4.439453125, 4.6201171875, 4.80078125, 4.9814453125, 5.162109375, 5.3427734375, 5.5234375, 5.7041015625, 5.884765625, 6.0654296875, 6.24609375]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 6.0, 4.0, 9.0, 11.0, 19.0, 28.0, 42.0, 42.0, 84.0, 144.0, 159.0, 282.0, 427.0, 681.0, 985.0, 1633.0, 2487.0, 4037.0, 6288.0, 10548.0, 17382.0, 28603.0, 49567.0, 84730.0, 141314.0, 1247991.0, 190043.0, 125317.0, 74819.0, 43731.0, 25583.0, 15416.0, 9201.0, 5768.0, 3642.0, 2207.0, 1353.0, 888.0, 590.0, 383.0, 229.0, 159.0, 102.0, 69.0, 36.0, 37.0, 24.0, 15.0, 8.0, 7.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.70849609375, -0.68695068359375, -0.6654052734375, -0.64385986328125, -0.622314453125, -0.60076904296875, -0.5792236328125, -0.55767822265625, -0.5361328125, -0.51458740234375, -0.4930419921875, -0.47149658203125, -0.449951171875, -0.42840576171875, -0.4068603515625, -0.38531494140625, -0.36376953125, -0.34222412109375, -0.3206787109375, -0.29913330078125, -0.277587890625, -0.25604248046875, -0.2344970703125, -0.21295166015625, -0.19140625, -0.16986083984375, -0.1483154296875, -0.12677001953125, -0.105224609375, -0.08367919921875, -0.0621337890625, -0.04058837890625, -0.01904296875, 0.00250244140625, 0.0240478515625, 0.04559326171875, 0.067138671875, 0.08868408203125, 0.1102294921875, 0.13177490234375, 0.1533203125, 0.17486572265625, 0.1964111328125, 0.21795654296875, 0.239501953125, 0.26104736328125, 0.2825927734375, 0.30413818359375, 0.32568359375, 0.34722900390625, 0.3687744140625, 0.39031982421875, 0.411865234375, 0.43341064453125, 0.4549560546875, 0.47650146484375, 0.498046875, 0.51959228515625, 0.5411376953125, 0.56268310546875, 0.584228515625, 0.60577392578125, 0.6273193359375, 0.64886474609375, 0.67041015625]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 5.0, 11.0, 4.0, 8.0, 16.0, 22.0, 28.0, 33.0, 24.0, 34.0, 35.0, 31.0, 34.0, 59.0, 48.0, 54.0, 45.0, 43.0, 44.0, 39.0, 46.0, 49.0, 44.0, 45.0, 33.0, 27.0, 21.0, 33.0, 18.0, 12.0, 14.0, 15.0, 11.0, 4.0, 2.0, 4.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009636878967285156, -0.0009290501475334167, -0.0008944123983383179, -0.000859774649143219, -0.0008251368999481201, -0.0007904991507530212, -0.0007558614015579224, -0.0007212236523628235, -0.0006865859031677246, -0.0006519481539726257, -0.0006173104047775269, -0.000582672655582428, -0.0005480349063873291, -0.0005133971571922302, -0.00047875940799713135, -0.00044412165880203247, -0.0004094839096069336, -0.0003748461604118347, -0.00034020841121673584, -0.00030557066202163696, -0.0002709329128265381, -0.0002362951636314392, -0.00020165741443634033, -0.00016701966524124146, -0.00013238191604614258, -9.77441668510437e-05, -6.310641765594482e-05, -2.8468668460845947e-05, 6.16908073425293e-06, 4.080682992935181e-05, 7.544457912445068e-05, 0.00011008232831954956, 0.00014472007751464844, 0.00017935782670974731, 0.0002139955759048462, 0.00024863332509994507, 0.00028327107429504395, 0.0003179088234901428, 0.0003525465726852417, 0.0003871843218803406, 0.00042182207107543945, 0.00045645982027053833, 0.0004910975694656372, 0.0005257353186607361, 0.000560373067855835, 0.0005950108170509338, 0.0006296485662460327, 0.0006642863154411316, 0.0006989240646362305, 0.0007335618138313293, 0.0007681995630264282, 0.0008028373122215271, 0.000837475061416626, 0.0008721128106117249, 0.0009067505598068237, 0.0009413883090019226, 0.0009760260581970215, 0.0010106638073921204, 0.0010453015565872192, 0.0010799393057823181, 0.001114577054977417, 0.0011492148041725159, 0.0011838525533676147, 0.0012184903025627136, 0.0012531280517578125]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 6.0, 2.0, 6.0, 7.0, 10.0, 16.0, 18.0, 19.0, 31.0, 49.0, 48.0, 50.0, 69.0, 86.0, 103.0, 136.0, 224.0, 387.0, 805.0, 4934.0, 1032919.0, 6672.0, 797.0, 363.0, 206.0, 144.0, 93.0, 74.0, 55.0, 61.0, 43.0, 27.0, 24.0, 20.0, 13.0, 14.0, 10.0, 5.0, 3.0, 5.0, 1.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0252685546875, -0.024557113647460938, -0.023845672607421875, -0.023134231567382812, -0.02242279052734375, -0.021711349487304688, -0.020999908447265625, -0.020288467407226562, -0.0195770263671875, -0.018865585327148438, -0.018154144287109375, -0.017442703247070312, -0.01673126220703125, -0.016019821166992188, -0.015308380126953125, -0.014596939086914062, -0.013885498046875, -0.013174057006835938, -0.012462615966796875, -0.011751174926757812, -0.01103973388671875, -0.010328292846679688, -0.009616851806640625, -0.008905410766601562, -0.0081939697265625, -0.0074825286865234375, -0.006771087646484375, -0.0060596466064453125, -0.00534820556640625, -0.0046367645263671875, -0.003925323486328125, -0.0032138824462890625, -0.00250244140625, -0.0017910003662109375, -0.001079559326171875, -0.0003681182861328125, 0.00034332275390625, 0.0010547637939453125, 0.001766204833984375, 0.0024776458740234375, 0.0031890869140625, 0.0039005279541015625, 0.004611968994140625, 0.0053234100341796875, 0.00603485107421875, 0.0067462921142578125, 0.007457733154296875, 0.008169174194335938, 0.008880615234375, 0.009592056274414062, 0.010303497314453125, 0.011014938354492188, 0.01172637939453125, 0.012437820434570312, 0.013149261474609375, 0.013860702514648438, 0.0145721435546875, 0.015283584594726562, 0.015995025634765625, 0.016706466674804688, 0.01741790771484375, 0.018129348754882812, 0.018840789794921875, 0.019552230834960938, 0.020263671875]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 24.0, 148.0, 428.0, 327.0, 80.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0034617597702890635, -0.003382748458534479, -0.003303737146779895, -0.003224725602194667, -0.0031457142904400826, -0.0030667029786854982, -0.002987691666930914, -0.0029086803551763296, -0.0028296690434217453, -0.002750657731667161, -0.0026716464199125767, -0.0025926348753273487, -0.0025136235635727644, -0.00243461225181818, -0.0023556009400635958, -0.0022765896283090115, -0.0021975780837237835, -0.002118566771969199, -0.002039555460214615, -0.001960543915629387, -0.0018815326038748026, -0.0018025212921202183, -0.001723509980365634, -0.0016444986686110497, -0.0015654872404411435, -0.0014864759286865592, -0.001407464500516653, -0.0013284531887620687, -0.0012494418770074844, -0.0011704304488375783, -0.001091419137082994, -0.0010124077089130878, -0.0009333962807431817, -0.0008543849107809365, -0.0007753735408186913, -0.0006963622290641069, -0.0006173508591018617, -0.0005383394891396165, -0.0004593281482812017, -0.00038031680742278695, -0.0003013054374605417, -0.00022229408205021173, -0.00014328272663988173, -6.427137122955173e-05, 1.4739984180778265e-05, 9.375135414302349e-05, 0.00017276269500143826, 0.00025177403585985303, 0.00033078540582209826, 0.0004097967757843435, 0.0004888081457465887, 0.000567819457501173, 0.0006468308274634182, 0.0007258421974256635, 0.0008048535091802478, 0.000883864879142493, 0.0009628762491047382, 0.0010418875608593225, 0.0011208989890292287, 0.001199910300783813, 0.0012789217289537191, 0.0013579330407083035, 0.0014369443524628878, 0.001515955664217472, 0.0015949670923873782]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 7.0, 8.0, 10.0, 10.0, 5.0, 13.0, 16.0, 17.0, 25.0, 20.0, 26.0, 31.0, 23.0, 33.0, 42.0, 39.0, 36.0, 29.0, 35.0, 34.0, 43.0, 47.0, 40.0, 36.0, 34.0, 41.0, 39.0, 43.0, 20.0, 31.0, 20.0, 23.0, 22.0, 16.0, 15.0, 12.0, 6.0, 11.0, 4.0, 12.0, 8.0, 2.0, 6.0, 1.0, 5.0, 0.0, 6.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.0005627870559692383, -0.0005448721349239349, -0.0005269572138786316, -0.0005090422928333282, -0.0004911273717880249, -0.00047321245074272156, -0.0004552975296974182, -0.00043738260865211487, -0.0004194676876068115, -0.0004015527665615082, -0.00038363784551620483, -0.0003657229244709015, -0.00034780800342559814, -0.0003298930823802948, -0.00031197816133499146, -0.0002940632402896881, -0.00027614831924438477, -0.0002582333981990814, -0.00024031847715377808, -0.00022240355610847473, -0.0002044886350631714, -0.00018657371401786804, -0.0001686587929725647, -0.00015074387192726135, -0.000132828950881958, -0.00011491402983665466, -9.699910879135132e-05, -7.908418774604797e-05, -6.116926670074463e-05, -4.3254345655441284e-05, -2.533942461013794e-05, -7.424503564834595e-06, 1.049041748046875e-05, 2.8405338525772095e-05, 4.632025957107544e-05, 6.423518061637878e-05, 8.215010166168213e-05, 0.00010006502270698547, 0.00011797994375228882, 0.00013589486479759216, 0.0001538097858428955, 0.00017172470688819885, 0.0001896396279335022, 0.00020755454897880554, 0.0002254694700241089, 0.00024338439106941223, 0.0002612993121147156, 0.0002792142331600189, 0.00029712915420532227, 0.0003150440752506256, 0.00033295899629592896, 0.0003508739173412323, 0.00036878883838653564, 0.000386703759431839, 0.00040461868047714233, 0.0004225336015224457, 0.000440448522567749, 0.00045836344361305237, 0.0004762783646583557, 0.0004941932857036591, 0.0005121082067489624, 0.0005300231277942657, 0.0005479380488395691, 0.0005658529698848724, 0.0005837678909301758]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 9.0, 2.0, 7.0, 3.0, 14.0, 12.0, 16.0, 11.0, 15.0, 24.0, 24.0, 34.0, 40.0, 33.0, 32.0, 49.0, 39.0, 44.0, 49.0, 45.0, 39.0, 45.0, 32.0, 54.0, 32.0, 26.0, 45.0, 46.0, 30.0, 28.0, 26.0, 25.0, 20.0, 10.0, 6.0, 6.0, 9.0, 9.0, 3.0, 2.0, 6.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.8046875, -7.5531005859375, -7.301513671875, -7.0499267578125, -6.79833984375, -6.5467529296875, -6.295166015625, -6.0435791015625, -5.7919921875, -5.5404052734375, -5.288818359375, -5.0372314453125, -4.78564453125, -4.5340576171875, -4.282470703125, -4.0308837890625, -3.779296875, -3.5277099609375, -3.276123046875, -3.0245361328125, -2.77294921875, -2.5213623046875, -2.269775390625, -2.0181884765625, -1.7666015625, -1.5150146484375, -1.263427734375, -1.0118408203125, -0.76025390625, -0.5086669921875, -0.257080078125, -0.0054931640625, 0.24609375, 0.4976806640625, 0.749267578125, 1.0008544921875, 1.25244140625, 1.5040283203125, 1.755615234375, 2.0072021484375, 2.2587890625, 2.5103759765625, 2.761962890625, 3.0135498046875, 3.26513671875, 3.5167236328125, 3.768310546875, 4.0198974609375, 4.271484375, 4.5230712890625, 4.774658203125, 5.0262451171875, 5.27783203125, 5.5294189453125, 5.781005859375, 6.0325927734375, 6.2841796875, 6.5357666015625, 6.787353515625, 7.0389404296875, 7.29052734375, 7.5421142578125, 7.793701171875, 8.0452880859375, 8.296875]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 7.0, 4.0, 9.0, 10.0, 19.0, 22.0, 35.0, 45.0, 44.0, 72.0, 119.0, 178.0, 222.0, 344.0, 507.0, 880.0, 1507.0, 2918.0, 6700.0, 18689.0, 62004.0, 225254.0, 455645.0, 191636.0, 53152.0, 16169.0, 5828.0, 2744.0, 1423.0, 811.0, 499.0, 326.0, 203.0, 146.0, 92.0, 85.0, 52.0, 44.0, 40.0, 18.0, 15.0, 13.0, 13.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-10.0, -9.700927734375, -9.40185546875, -9.102783203125, -8.8037109375, -8.504638671875, -8.20556640625, -7.906494140625, -7.607421875, -7.308349609375, -7.00927734375, -6.710205078125, -6.4111328125, -6.112060546875, -5.81298828125, -5.513916015625, -5.21484375, -4.915771484375, -4.61669921875, -4.317626953125, -4.0185546875, -3.719482421875, -3.42041015625, -3.121337890625, -2.822265625, -2.523193359375, -2.22412109375, -1.925048828125, -1.6259765625, -1.326904296875, -1.02783203125, -0.728759765625, -0.4296875, -0.130615234375, 0.16845703125, 0.467529296875, 0.7666015625, 1.065673828125, 1.36474609375, 1.663818359375, 1.962890625, 2.261962890625, 2.56103515625, 2.860107421875, 3.1591796875, 3.458251953125, 3.75732421875, 4.056396484375, 4.35546875, 4.654541015625, 4.95361328125, 5.252685546875, 5.5517578125, 5.850830078125, 6.14990234375, 6.448974609375, 6.748046875, 7.047119140625, 7.34619140625, 7.645263671875, 7.9443359375, 8.243408203125, 8.54248046875, 8.841552734375, 9.140625]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 5.0, 13.0, 12.0, 16.0, 20.0, 30.0, 25.0, 36.0, 32.0, 43.0, 69.0, 93.0, 102.0, 180.0, 1403.0, 330.0, 163.0, 96.0, 64.0, 55.0, 52.0, 44.0, 34.0, 26.0, 32.0, 22.0, 12.0, 9.0, 15.0, 5.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.65625, -25.870849609375, -25.08544921875, -24.300048828125, -23.5146484375, -22.729248046875, -21.94384765625, -21.158447265625, -20.373046875, -19.587646484375, -18.80224609375, -18.016845703125, -17.2314453125, -16.446044921875, -15.66064453125, -14.875244140625, -14.08984375, -13.304443359375, -12.51904296875, -11.733642578125, -10.9482421875, -10.162841796875, -9.37744140625, -8.592041015625, -7.806640625, -7.021240234375, -6.23583984375, -5.450439453125, -4.6650390625, -3.879638671875, -3.09423828125, -2.308837890625, -1.5234375, -0.738037109375, 0.04736328125, 0.832763671875, 1.6181640625, 2.403564453125, 3.18896484375, 3.974365234375, 4.759765625, 5.545166015625, 6.33056640625, 7.115966796875, 7.9013671875, 8.686767578125, 9.47216796875, 10.257568359375, 11.04296875, 11.828369140625, 12.61376953125, 13.399169921875, 14.1845703125, 14.969970703125, 15.75537109375, 16.540771484375, 17.326171875, 18.111572265625, 18.89697265625, 19.682373046875, 20.4677734375, 21.253173828125, 22.03857421875, 22.823974609375, 23.609375]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 7.0, 1.0, 5.0, 4.0, 13.0, 12.0, 22.0, 30.0, 37.0, 42.0, 66.0, 85.0, 116.0, 219.0, 318.0, 501.0, 1463.0, 13647.0, 2380830.0, 737415.0, 8247.0, 1215.0, 496.0, 287.0, 172.0, 122.0, 107.0, 52.0, 42.0, 35.0, 27.0, 20.0, 15.0, 5.0, 8.0, 5.0, 10.0, 2.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-43.15625, -41.92041015625, -40.6845703125, -39.44873046875, -38.212890625, -36.97705078125, -35.7412109375, -34.50537109375, -33.26953125, -32.03369140625, -30.7978515625, -29.56201171875, -28.326171875, -27.09033203125, -25.8544921875, -24.61865234375, -23.3828125, -22.14697265625, -20.9111328125, -19.67529296875, -18.439453125, -17.20361328125, -15.9677734375, -14.73193359375, -13.49609375, -12.26025390625, -11.0244140625, -9.78857421875, -8.552734375, -7.31689453125, -6.0810546875, -4.84521484375, -3.609375, -2.37353515625, -1.1376953125, 0.09814453125, 1.333984375, 2.56982421875, 3.8056640625, 5.04150390625, 6.27734375, 7.51318359375, 8.7490234375, 9.98486328125, 11.220703125, 12.45654296875, 13.6923828125, 14.92822265625, 16.1640625, 17.39990234375, 18.6357421875, 19.87158203125, 21.107421875, 22.34326171875, 23.5791015625, 24.81494140625, 26.05078125, 27.28662109375, 28.5224609375, 29.75830078125, 30.994140625, 32.22998046875, 33.4658203125, 34.70166015625, 35.9375]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 16.0, 198.0, 608.0, 176.0, 17.0, 3.0, 1.0, 1.0], "bins": [-243.40211486816406, -239.23875427246094, -235.07540893554688, -230.91204833984375, -226.74868774414062, -222.58534240722656, -218.42198181152344, -214.25863647460938, -210.09527587890625, -205.93191528320312, -201.76856994628906, -197.60520935058594, -193.44186401367188, -189.27850341796875, -185.11514282226562, -180.95179748535156, -176.78843688964844, -172.6250762939453, -168.46173095703125, -164.29837036132812, -160.135009765625, -155.97166442871094, -151.8083038330078, -147.64495849609375, -143.48159790039062, -139.3182373046875, -135.15489196777344, -130.9915313720703, -126.82817840576172, -122.66482543945312, -118.50146484375, -114.3381118774414, -110.17474365234375, -106.01139068603516, -101.84803771972656, -97.68467712402344, -93.52132415771484, -89.35797119140625, -85.19461059570312, -81.03125762939453, -76.86790466308594, -72.70455169677734, -68.54119873046875, -64.37783813476562, -60.21448516845703, -56.05113220214844, -51.88777542114258, -47.72441864013672, -43.561065673828125, -39.39771270751953, -35.23435592651367, -31.071001052856445, -26.90764617919922, -22.744291305541992, -18.580936431884766, -14.417581558227539, -10.254226684570312, -6.090871810913086, -1.9275169372558594, 2.235837936401367, 6.399192810058594, 10.56254768371582, 14.725902557373047, 18.889257431030273, 23.0526123046875]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 5.0, 1.0, 3.0, 4.0, 5.0, 15.0, 9.0, 15.0, 8.0, 13.0, 15.0, 14.0, 31.0, 30.0, 26.0, 36.0, 30.0, 41.0, 38.0, 40.0, 29.0, 47.0, 49.0, 35.0, 47.0, 40.0, 38.0, 34.0, 33.0, 43.0, 22.0, 22.0, 30.0, 31.0, 26.0, 28.0, 11.0, 14.0, 7.0, 8.0, 10.0, 3.0, 8.0, 4.0, 2.0, 3.0, 3.0, 3.0, 3.0, 1.0], "bins": [-54.48598098754883, -53.09469223022461, -51.703399658203125, -50.312110900878906, -48.92081832885742, -47.5295295715332, -46.13823699951172, -44.7469482421875, -43.35565948486328, -41.96437072753906, -40.57307815551758, -39.18178939819336, -37.790496826171875, -36.399208068847656, -35.00791931152344, -33.61662673950195, -32.22533416748047, -30.834043502807617, -29.442752838134766, -28.051464080810547, -26.660171508789062, -25.268882751464844, -23.877592086791992, -22.48630142211914, -21.09501075744629, -19.703720092773438, -18.312429428100586, -16.921138763427734, -15.5298490524292, -14.138558387756348, -12.747268676757812, -11.355978012084961, -9.964691162109375, -8.573400497436523, -7.18211030960083, -5.790820121765137, -4.399529457092285, -3.0082387924194336, -1.6169490814208984, -0.22565841674804688, 1.1656322479248047, 2.556922674179077, 3.9482131004333496, 5.339503288269043, 6.7307939529418945, 8.122084617614746, 9.513374328613281, 10.904664993286133, 12.295955657958984, 13.687246322631836, 15.078536987304688, 16.469825744628906, 17.86111831665039, 19.25240707397461, 20.64369773864746, 22.034988403320312, 23.426279067993164, 24.817569732666016, 26.208860397338867, 27.60015106201172, 28.991439819335938, 30.382732391357422, 31.77402114868164, 33.165313720703125, 34.556602478027344]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 5.0, 10.0, 4.0, 10.0, 5.0, 11.0, 13.0, 18.0, 20.0, 24.0, 25.0, 35.0, 31.0, 37.0, 50.0, 44.0, 40.0, 43.0, 46.0, 45.0, 39.0, 39.0, 42.0, 39.0, 48.0, 29.0, 44.0, 30.0, 34.0, 26.0, 23.0, 21.0, 13.0, 11.0, 13.0, 9.0, 12.0, 6.0, 4.0, 4.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.4296875, -7.17236328125, -6.9150390625, -6.65771484375, -6.400390625, -6.14306640625, -5.8857421875, -5.62841796875, -5.37109375, -5.11376953125, -4.8564453125, -4.59912109375, -4.341796875, -4.08447265625, -3.8271484375, -3.56982421875, -3.3125, -3.05517578125, -2.7978515625, -2.54052734375, -2.283203125, -2.02587890625, -1.7685546875, -1.51123046875, -1.25390625, -0.99658203125, -0.7392578125, -0.48193359375, -0.224609375, 0.03271484375, 0.2900390625, 0.54736328125, 0.8046875, 1.06201171875, 1.3193359375, 1.57666015625, 1.833984375, 2.09130859375, 2.3486328125, 2.60595703125, 2.86328125, 3.12060546875, 3.3779296875, 3.63525390625, 3.892578125, 4.14990234375, 4.4072265625, 4.66455078125, 4.921875, 5.17919921875, 5.4365234375, 5.69384765625, 5.951171875, 6.20849609375, 6.4658203125, 6.72314453125, 6.98046875, 7.23779296875, 7.4951171875, 7.75244140625, 8.009765625, 8.26708984375, 8.5244140625, 8.78173828125, 9.0390625]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 4.0, 2.0, 3.0, 3.0, 4.0, 2.0, 7.0, 9.0, 13.0, 20.0, 17.0, 14.0, 34.0, 31.0, 40.0, 60.0, 70.0, 98.0, 111.0, 174.0, 245.0, 291.0, 382.0, 587.0, 166237.0, 4023295.0, 784.0, 382.0, 346.0, 259.0, 169.0, 146.0, 110.0, 72.0, 52.0, 48.0, 40.0, 26.0, 24.0, 23.0, 8.0, 8.0, 12.0, 9.0, 7.0, 3.0, 4.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-153.625, -148.6875, -143.75, -138.8125, -133.875, -128.9375, -124.0, -119.0625, -114.125, -109.1875, -104.25, -99.3125, -94.375, -89.4375, -84.5, -79.5625, -74.625, -69.6875, -64.75, -59.8125, -54.875, -49.9375, -45.0, -40.0625, -35.125, -30.1875, -25.25, -20.3125, -15.375, -10.4375, -5.5, -0.5625, 4.375, 9.3125, 14.25, 19.1875, 24.125, 29.0625, 34.0, 38.9375, 43.875, 48.8125, 53.75, 58.6875, 63.625, 68.5625, 73.5, 78.4375, 83.375, 88.3125, 93.25, 98.1875, 103.125, 108.0625, 113.0, 117.9375, 122.875, 127.8125, 132.75, 137.6875, 142.625, 147.5625, 152.5, 157.4375, 162.375]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 5.0, 6.0, 7.0, 9.0, 17.0, 25.0, 30.0, 33.0, 39.0, 60.0, 72.0, 131.0, 122.0, 258.0, 393.0, 538.0, 629.0, 563.0, 350.0, 228.0, 143.0, 106.0, 82.0, 62.0, 40.0, 34.0, 26.0, 20.0, 11.0, 9.0, 9.0, 6.0, 3.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-13.1171875, -12.7139892578125, -12.310791015625, -11.9075927734375, -11.50439453125, -11.1011962890625, -10.697998046875, -10.2947998046875, -9.8916015625, -9.4884033203125, -9.085205078125, -8.6820068359375, -8.27880859375, -7.8756103515625, -7.472412109375, -7.0692138671875, -6.666015625, -6.2628173828125, -5.859619140625, -5.4564208984375, -5.05322265625, -4.6500244140625, -4.246826171875, -3.8436279296875, -3.4404296875, -3.0372314453125, -2.634033203125, -2.2308349609375, -1.82763671875, -1.4244384765625, -1.021240234375, -0.6180419921875, -0.21484375, 0.1883544921875, 0.591552734375, 0.9947509765625, 1.39794921875, 1.8011474609375, 2.204345703125, 2.6075439453125, 3.0107421875, 3.4139404296875, 3.817138671875, 4.2203369140625, 4.62353515625, 5.0267333984375, 5.429931640625, 5.8331298828125, 6.236328125, 6.6395263671875, 7.042724609375, 7.4459228515625, 7.84912109375, 8.2523193359375, 8.655517578125, 9.0587158203125, 9.4619140625, 9.8651123046875, 10.268310546875, 10.6715087890625, 11.07470703125, 11.4779052734375, 11.881103515625, 12.2843017578125, 12.6875]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 6.0, 3.0, 5.0, 8.0, 11.0, 17.0, 20.0, 16.0, 29.0, 29.0, 27.0, 37.0, 50.0, 67.0, 91.0, 232.0, 2046.0, 2411832.0, 1777216.0, 1916.0, 225.0, 84.0, 59.0, 53.0, 45.0, 40.0, 19.0, 22.0, 18.0, 13.0, 6.0, 12.0, 5.0, 3.0, 2.0, 6.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-99.875, -97.0205078125, -94.166015625, -91.3115234375, -88.45703125, -85.6025390625, -82.748046875, -79.8935546875, -77.0390625, -74.1845703125, -71.330078125, -68.4755859375, -65.62109375, -62.7666015625, -59.912109375, -57.0576171875, -54.203125, -51.3486328125, -48.494140625, -45.6396484375, -42.78515625, -39.9306640625, -37.076171875, -34.2216796875, -31.3671875, -28.5126953125, -25.658203125, -22.8037109375, -19.94921875, -17.0947265625, -14.240234375, -11.3857421875, -8.53125, -5.6767578125, -2.822265625, 0.0322265625, 2.88671875, 5.7412109375, 8.595703125, 11.4501953125, 14.3046875, 17.1591796875, 20.013671875, 22.8681640625, 25.72265625, 28.5771484375, 31.431640625, 34.2861328125, 37.140625, 39.9951171875, 42.849609375, 45.7041015625, 48.55859375, 51.4130859375, 54.267578125, 57.1220703125, 59.9765625, 62.8310546875, 65.685546875, 68.5400390625, 71.39453125, 74.2490234375, 77.103515625, 79.9580078125, 82.8125]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 33.0, 392.0, 504.0, 83.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-134.08602905273438, -126.7131118774414, -119.34020233154297, -111.96728515625, -104.59436798095703, -97.22145080566406, -89.84854125976562, -82.47562408447266, -75.10270690917969, -67.72978973388672, -60.356876373291016, -52.98396301269531, -45.611045837402344, -38.23813247680664, -30.865219116210938, -23.49230194091797, -16.11939239501953, -8.746477127075195, -1.3735628128051758, 5.999351501464844, 13.37226676940918, 20.745182037353516, 28.11809539794922, 35.49101257324219, 42.86392593383789, 50.236839294433594, 57.60975646972656, 64.982666015625, 72.35558319091797, 79.72850036621094, 87.10140991210938, 94.47433471679688, 101.84724426269531, 109.22016143798828, 116.59307098388672, 123.96598815917969, 131.33889770507812, 138.71182250976562, 146.08473205566406, 153.4576416015625, 160.83056640625, 168.20347595214844, 175.57640075683594, 182.94931030273438, 190.3222198486328, 197.6951446533203, 205.06805419921875, 212.44097900390625, 219.81387329101562, 227.18678283691406, 234.55970764160156, 241.9326171875, 249.30552673339844, 256.6784362792969, 264.0513610839844, 271.4242858886719, 278.7972106933594, 286.1701354980469, 293.54302978515625, 300.91595458984375, 308.28887939453125, 315.6617736816406, 323.0346984863281, 330.4076232910156, 337.780517578125]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 7.0, 9.0, 5.0, 8.0, 17.0, 13.0, 17.0, 13.0, 16.0, 28.0, 24.0, 42.0, 35.0, 36.0, 36.0, 40.0, 39.0, 46.0, 48.0, 53.0, 49.0, 41.0, 46.0, 38.0, 34.0, 37.0, 28.0, 32.0, 23.0, 23.0, 20.0, 17.0, 23.0, 16.0, 9.0, 6.0, 7.0, 8.0, 1.0, 6.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.98048400878906, -37.61699676513672, -36.25350570678711, -34.890018463134766, -33.52653121948242, -32.16304016113281, -30.79955291748047, -29.436065673828125, -28.07257652282715, -26.709087371826172, -25.345600128173828, -23.98211097717285, -22.618621826171875, -21.25513458251953, -19.891645431518555, -18.528156280517578, -17.164669036865234, -15.801180839538574, -14.437692642211914, -13.074203491210938, -11.710715293884277, -10.347227096557617, -8.98373794555664, -7.6202497482299805, -6.25676155090332, -4.89327335357666, -3.529784679412842, -2.1662960052490234, -0.8028078079223633, 0.5606803894042969, 1.9241695404052734, 3.2876577377319336, 4.651145935058594, 6.014634132385254, 7.378122806549072, 8.74161148071289, 10.10509967803955, 11.468587875366211, 12.832077026367188, 14.195565223693848, 15.559053421020508, 16.922542572021484, 18.286029815673828, 19.649518966674805, 21.01300811767578, 22.376495361328125, 23.7399845123291, 25.103473663330078, 26.466960906982422, 27.8304500579834, 29.193937301635742, 30.55742645263672, 31.920913696289062, 33.284400939941406, 34.647891998291016, 36.01137924194336, 37.37487030029297, 38.73835754394531, 40.10184860229492, 41.465335845947266, 42.82882308959961, 44.19231414794922, 45.55580139160156, 46.919288635253906, 48.28277587890625]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 7.0, 6.0, 3.0, 5.0, 8.0, 12.0, 6.0, 14.0, 22.0, 18.0, 27.0, 31.0, 35.0, 36.0, 34.0, 44.0, 48.0, 46.0, 49.0, 52.0, 41.0, 34.0, 50.0, 40.0, 38.0, 44.0, 30.0, 41.0, 23.0, 27.0, 22.0, 16.0, 11.0, 26.0, 15.0, 13.0, 4.0, 7.0, 10.0, 6.0, 5.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.94140625, -7.68121337890625, -7.4210205078125, -7.16082763671875, -6.900634765625, -6.64044189453125, -6.3802490234375, -6.12005615234375, -5.85986328125, -5.59967041015625, -5.3394775390625, -5.07928466796875, -4.819091796875, -4.55889892578125, -4.2987060546875, -4.03851318359375, -3.7783203125, -3.51812744140625, -3.2579345703125, -2.99774169921875, -2.737548828125, -2.47735595703125, -2.2171630859375, -1.95697021484375, -1.69677734375, -1.43658447265625, -1.1763916015625, -0.91619873046875, -0.656005859375, -0.39581298828125, -0.1356201171875, 0.12457275390625, 0.384765625, 0.64495849609375, 0.9051513671875, 1.16534423828125, 1.425537109375, 1.68572998046875, 1.9459228515625, 2.20611572265625, 2.46630859375, 2.72650146484375, 2.9866943359375, 3.24688720703125, 3.507080078125, 3.76727294921875, 4.0274658203125, 4.28765869140625, 4.5478515625, 4.80804443359375, 5.0682373046875, 5.32843017578125, 5.588623046875, 5.84881591796875, 6.1090087890625, 6.36920166015625, 6.62939453125, 6.88958740234375, 7.1497802734375, 7.40997314453125, 7.670166015625, 7.93035888671875, 8.1905517578125, 8.45074462890625, 8.7109375]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 4.0, 10.0, 12.0, 16.0, 35.0, 37.0, 72.0, 90.0, 141.0, 210.0, 342.0, 428.0, 700.0, 1056.0, 1606.0, 2456.0, 3698.0, 5653.0, 9179.0, 14766.0, 24435.0, 41606.0, 72484.0, 129644.0, 208341.0, 212316.0, 133092.0, 76012.0, 42703.0, 25162.0, 15388.0, 9613.0, 5983.0, 3774.0, 2528.0, 1672.0, 1088.0, 698.0, 523.0, 320.0, 215.0, 159.0, 100.0, 72.0, 47.0, 23.0, 18.0, 17.0, 10.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.8251953125, -0.8009490966796875, -0.776702880859375, -0.7524566650390625, -0.72821044921875, -0.7039642333984375, -0.679718017578125, -0.6554718017578125, -0.6312255859375, -0.6069793701171875, -0.582733154296875, -0.5584869384765625, -0.53424072265625, -0.5099945068359375, -0.485748291015625, -0.4615020751953125, -0.437255859375, -0.4130096435546875, -0.388763427734375, -0.3645172119140625, -0.34027099609375, -0.3160247802734375, -0.291778564453125, -0.2675323486328125, -0.2432861328125, -0.2190399169921875, -0.194793701171875, -0.1705474853515625, -0.14630126953125, -0.1220550537109375, -0.097808837890625, -0.0735626220703125, -0.04931640625, -0.0250701904296875, -0.000823974609375, 0.0234222412109375, 0.04766845703125, 0.0719146728515625, 0.096160888671875, 0.1204071044921875, 0.1446533203125, 0.1688995361328125, 0.193145751953125, 0.2173919677734375, 0.24163818359375, 0.2658843994140625, 0.290130615234375, 0.3143768310546875, 0.338623046875, 0.3628692626953125, 0.387115478515625, 0.4113616943359375, 0.43560791015625, 0.4598541259765625, 0.484100341796875, 0.5083465576171875, 0.5325927734375, 0.5568389892578125, 0.581085205078125, 0.6053314208984375, 0.62957763671875, 0.6538238525390625, 0.678070068359375, 0.7023162841796875, 0.7265625]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 2.0, 3.0, 5.0, 7.0, 6.0, 11.0, 9.0, 11.0, 8.0, 11.0, 15.0, 24.0, 14.0, 24.0, 22.0, 30.0, 27.0, 31.0, 45.0, 33.0, 34.0, 40.0, 26.0, 29.0, 1071.0, 39.0, 47.0, 30.0, 32.0, 35.0, 37.0, 29.0, 28.0, 20.0, 29.0, 24.0, 11.0, 25.0, 15.0, 16.0, 13.0, 9.0, 11.0, 11.0, 9.0, 6.0, 7.0, 4.0, 2.0, 3.0, 3.0, 0.0, 2.0], "bins": [-4.82421875, -4.68798828125, -4.5517578125, -4.41552734375, -4.279296875, -4.14306640625, -4.0068359375, -3.87060546875, -3.734375, -3.59814453125, -3.4619140625, -3.32568359375, -3.189453125, -3.05322265625, -2.9169921875, -2.78076171875, -2.64453125, -2.50830078125, -2.3720703125, -2.23583984375, -2.099609375, -1.96337890625, -1.8271484375, -1.69091796875, -1.5546875, -1.41845703125, -1.2822265625, -1.14599609375, -1.009765625, -0.87353515625, -0.7373046875, -0.60107421875, -0.46484375, -0.32861328125, -0.1923828125, -0.05615234375, 0.080078125, 0.21630859375, 0.3525390625, 0.48876953125, 0.625, 0.76123046875, 0.8974609375, 1.03369140625, 1.169921875, 1.30615234375, 1.4423828125, 1.57861328125, 1.71484375, 1.85107421875, 1.9873046875, 2.12353515625, 2.259765625, 2.39599609375, 2.5322265625, 2.66845703125, 2.8046875, 2.94091796875, 3.0771484375, 3.21337890625, 3.349609375, 3.48583984375, 3.6220703125, 3.75830078125, 3.89453125]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 6.0, 3.0, 2.0, 9.0, 10.0, 11.0, 17.0, 48.0, 47.0, 110.0, 112.0, 221.0, 315.0, 452.0, 691.0, 1006.0, 1656.0, 2439.0, 4083.0, 6415.0, 10082.0, 16782.0, 27664.0, 47712.0, 82428.0, 141334.0, 1255083.0, 194280.0, 125124.0, 72614.0, 42074.0, 24739.0, 14867.0, 9015.0, 5542.0, 3581.0, 2336.0, 1487.0, 963.0, 593.0, 411.0, 278.0, 146.0, 102.0, 91.0, 57.0, 34.0, 22.0, 15.0, 13.0, 7.0, 4.0, 4.0, 4.0, 3.0], "bins": [-0.7802734375, -0.7585296630859375, -0.736785888671875, -0.7150421142578125, -0.69329833984375, -0.6715545654296875, -0.649810791015625, -0.6280670166015625, -0.6063232421875, -0.5845794677734375, -0.562835693359375, -0.5410919189453125, -0.51934814453125, -0.4976043701171875, -0.475860595703125, -0.4541168212890625, -0.432373046875, -0.4106292724609375, -0.388885498046875, -0.3671417236328125, -0.34539794921875, -0.3236541748046875, -0.301910400390625, -0.2801666259765625, -0.2584228515625, -0.2366790771484375, -0.214935302734375, -0.1931915283203125, -0.17144775390625, -0.1497039794921875, -0.127960205078125, -0.1062164306640625, -0.08447265625, -0.0627288818359375, -0.040985107421875, -0.0192413330078125, 0.00250244140625, 0.0242462158203125, 0.045989990234375, 0.0677337646484375, 0.0894775390625, 0.1112213134765625, 0.132965087890625, 0.1547088623046875, 0.17645263671875, 0.1981964111328125, 0.219940185546875, 0.2416839599609375, 0.263427734375, 0.2851715087890625, 0.306915283203125, 0.3286590576171875, 0.35040283203125, 0.3721466064453125, 0.393890380859375, 0.4156341552734375, 0.4373779296875, 0.4591217041015625, 0.480865478515625, 0.5026092529296875, 0.52435302734375, 0.5460968017578125, 0.567840576171875, 0.5895843505859375, 0.611328125]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 8.0, 8.0, 14.0, 11.0, 13.0, 8.0, 19.0, 22.0, 26.0, 33.0, 33.0, 34.0, 36.0, 37.0, 47.0, 56.0, 43.0, 50.0, 55.0, 44.0, 55.0, 54.0, 40.0, 38.0, 38.0, 27.0, 17.0, 33.0, 20.0, 14.0, 18.0, 13.0, 6.0, 9.0, 7.0, 3.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0010242462158203125, -0.000991523265838623, -0.0009588003158569336, -0.0009260773658752441, -0.0008933544158935547, -0.0008606314659118652, -0.0008279085159301758, -0.0007951855659484863, -0.0007624626159667969, -0.0007297396659851074, -0.000697016716003418, -0.0006642937660217285, -0.0006315708160400391, -0.0005988478660583496, -0.0005661249160766602, -0.0005334019660949707, -0.0005006790161132812, -0.0004679560661315918, -0.00043523311614990234, -0.0004025101661682129, -0.00036978721618652344, -0.000337064266204834, -0.00030434131622314453, -0.0002716183662414551, -0.00023889541625976562, -0.00020617246627807617, -0.00017344951629638672, -0.00014072656631469727, -0.00010800361633300781, -7.528066635131836e-05, -4.2557716369628906e-05, -9.834766387939453e-06, 2.288818359375e-05, 5.561113357543945e-05, 8.83340835571289e-05, 0.00012105703353881836, 0.0001537799835205078, 0.00018650293350219727, 0.00021922588348388672, 0.00025194883346557617, 0.0002846717834472656, 0.0003173947334289551, 0.00035011768341064453, 0.000382840633392334, 0.00041556358337402344, 0.0004482865333557129, 0.00048100948333740234, 0.0005137324333190918, 0.0005464553833007812, 0.0005791783332824707, 0.0006119012832641602, 0.0006446242332458496, 0.0006773471832275391, 0.0007100701332092285, 0.000742793083190918, 0.0007755160331726074, 0.0008082389831542969, 0.0008409619331359863, 0.0008736848831176758, 0.0009064078330993652, 0.0009391307830810547, 0.0009718537330627441, 0.0010045766830444336, 0.001037299633026123, 0.0010700225830078125]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 5.0, 1.0, 6.0, 7.0, 7.0, 3.0, 10.0, 11.0, 15.0, 17.0, 29.0, 36.0, 39.0, 41.0, 58.0, 82.0, 93.0, 141.0, 185.0, 288.0, 481.0, 711.0, 1864.0, 840070.0, 201347.0, 1167.0, 580.0, 384.0, 222.0, 143.0, 109.0, 94.0, 71.0, 56.0, 38.0, 36.0, 24.0, 21.0, 14.0, 17.0, 12.0, 11.0, 3.0, 7.0, 0.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0196533203125, -0.01905512809753418, -0.01845693588256836, -0.01785874366760254, -0.01726055145263672, -0.0166623592376709, -0.016064167022705078, -0.015465974807739258, -0.014867782592773438, -0.014269590377807617, -0.013671398162841797, -0.013073205947875977, -0.012475013732910156, -0.011876821517944336, -0.011278629302978516, -0.010680437088012695, -0.010082244873046875, -0.009484052658081055, -0.008885860443115234, -0.008287668228149414, -0.007689476013183594, -0.0070912837982177734, -0.006493091583251953, -0.005894899368286133, -0.0052967071533203125, -0.004698514938354492, -0.004100322723388672, -0.0035021305084228516, -0.0029039382934570312, -0.002305746078491211, -0.0017075538635253906, -0.0011093616485595703, -0.00051116943359375, 8.702278137207031e-05, 0.0006852149963378906, 0.001283407211303711, 0.0018815994262695312, 0.0024797916412353516, 0.003077983856201172, 0.003676176071166992, 0.0042743682861328125, 0.004872560501098633, 0.005470752716064453, 0.0060689449310302734, 0.006667137145996094, 0.007265329360961914, 0.007863521575927734, 0.008461713790893555, 0.009059906005859375, 0.009658098220825195, 0.010256290435791016, 0.010854482650756836, 0.011452674865722656, 0.012050867080688477, 0.012649059295654297, 0.013247251510620117, 0.013845443725585938, 0.014443635940551758, 0.015041828155517578, 0.0156400203704834, 0.01623821258544922, 0.01683640480041504, 0.01743459701538086, 0.01803278923034668, 0.0186309814453125]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 20.0, 270.0, 623.0, 98.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0049111791886389256, -0.004797704517841339, -0.00468423031270504, -0.0045707556419074535, -0.004457281436771154, -0.004343806765973568, -0.004230332560837269, -0.004116857890039682, -0.004003383684903383, -0.0038899092469364405, -0.0037764348089694977, -0.003662960371002555, -0.003549485933035612, -0.0034360114950686693, -0.0033225370571017265, -0.00320906238630414, -0.0030955879483371973, -0.0029821135103702545, -0.0028686390724033117, -0.002755164634436369, -0.002641690196469426, -0.0025282157585024834, -0.002414741087704897, -0.002301266882568598, -0.0021877922117710114, -0.0020743177738040686, -0.0019608433358371258, -0.001847368897870183, -0.0017338944599032402, -0.0016204200219362974, -0.0015069454675540328, -0.00139347102958709, -0.001279996708035469, -0.0011665222700685263, -0.0010530478321015835, -0.0009395733359269798, -0.000826098897960037, -0.0007126244599930942, -0.0005991499638184905, -0.0004856755258515477, -0.00037220108788460493, -0.00025872664991766214, -0.0001452521828468889, -3.1777715776115656e-05, 8.169672219082713e-05, 0.00019517116015776992, 0.0003086456563323736, 0.0004221200942993164, 0.0005355945322662592, 0.000649068970233202, 0.0007625434082001448, 0.0008760179043747485, 0.0009894922841340303, 0.0011029667221009731, 0.0012164412764832377, 0.0013299157144501805, 0.0014433901524171233, 0.001556864590384066, 0.001670339028351009, 0.0017838135827332735, 0.0018972880207002163, 0.002010762458667159, 0.002124236896634102, 0.0022377113346010447, 0.0023511857725679874]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 4.0, 2.0, 3.0, 7.0, 7.0, 2.0, 7.0, 9.0, 13.0, 14.0, 14.0, 12.0, 12.0, 24.0, 19.0, 27.0, 23.0, 26.0, 20.0, 33.0, 40.0, 35.0, 44.0, 36.0, 49.0, 42.0, 45.0, 39.0, 33.0, 43.0, 36.0, 40.0, 31.0, 27.0, 32.0, 30.0, 17.0, 15.0, 25.0, 13.0, 12.0, 11.0, 8.0, 8.0, 6.0, 4.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005233883857727051, -0.0005053617060184479, -0.0004873350262641907, -0.00046930834650993347, -0.00045128166675567627, -0.00043325498700141907, -0.00041522830724716187, -0.00039720162749290466, -0.00037917494773864746, -0.00036114826798439026, -0.00034312158823013306, -0.00032509490847587585, -0.00030706822872161865, -0.00028904154896736145, -0.00027101486921310425, -0.00025298818945884705, -0.00023496150970458984, -0.00021693482995033264, -0.00019890815019607544, -0.00018088147044181824, -0.00016285479068756104, -0.00014482811093330383, -0.00012680143117904663, -0.00010877475142478943, -9.074807167053223e-05, -7.272139191627502e-05, -5.469471216201782e-05, -3.666803240776062e-05, -1.8641352653503418e-05, -6.146728992462158e-07, 1.7412006855010986e-05, 3.543868660926819e-05, 5.346536636352539e-05, 7.149204611778259e-05, 8.95187258720398e-05, 0.000107545405626297, 0.0001255720853805542, 0.0001435987651348114, 0.0001616254448890686, 0.0001796521246433258, 0.000197678804397583, 0.0002157054841518402, 0.0002337321639060974, 0.0002517588436603546, 0.0002697855234146118, 0.000287812203168869, 0.0003058388829231262, 0.0003238655626773834, 0.0003418922424316406, 0.00035991892218589783, 0.00037794560194015503, 0.00039597228169441223, 0.00041399896144866943, 0.00043202564120292664, 0.00045005232095718384, 0.00046807900071144104, 0.00048610568046569824, 0.0005041323602199554, 0.0005221590399742126, 0.0005401857197284698, 0.000558212399482727, 0.0005762390792369843, 0.0005942657589912415, 0.0006122924387454987, 0.0006303191184997559]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 7.0, 6.0, 3.0, 5.0, 8.0, 12.0, 6.0, 14.0, 22.0, 18.0, 27.0, 31.0, 35.0, 36.0, 34.0, 44.0, 48.0, 46.0, 49.0, 52.0, 41.0, 34.0, 50.0, 40.0, 38.0, 44.0, 30.0, 41.0, 23.0, 27.0, 22.0, 16.0, 11.0, 26.0, 15.0, 13.0, 4.0, 7.0, 10.0, 6.0, 5.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.94140625, -7.68121337890625, -7.4210205078125, -7.16082763671875, -6.900634765625, -6.64044189453125, -6.3802490234375, -6.12005615234375, -5.85986328125, -5.59967041015625, -5.3394775390625, -5.07928466796875, -4.819091796875, -4.55889892578125, -4.2987060546875, -4.03851318359375, -3.7783203125, -3.51812744140625, -3.2579345703125, -2.99774169921875, -2.737548828125, -2.47735595703125, -2.2171630859375, -1.95697021484375, -1.69677734375, -1.43658447265625, -1.1763916015625, -0.91619873046875, -0.656005859375, -0.39581298828125, -0.1356201171875, 0.12457275390625, 0.384765625, 0.64495849609375, 0.9051513671875, 1.16534423828125, 1.425537109375, 1.68572998046875, 1.9459228515625, 2.20611572265625, 2.46630859375, 2.72650146484375, 2.9866943359375, 3.24688720703125, 3.507080078125, 3.76727294921875, 4.0274658203125, 4.28765869140625, 4.5478515625, 4.80804443359375, 5.0682373046875, 5.32843017578125, 5.588623046875, 5.84881591796875, 6.1090087890625, 6.36920166015625, 6.62939453125, 6.88958740234375, 7.1497802734375, 7.40997314453125, 7.670166015625, 7.93035888671875, 8.1905517578125, 8.45074462890625, 8.7109375]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 5.0, 4.0, 7.0, 15.0, 23.0, 30.0, 24.0, 53.0, 80.0, 87.0, 122.0, 154.0, 218.0, 293.0, 391.0, 475.0, 617.0, 881.0, 1180.0, 1862.0, 4205.0, 16726.0, 96749.0, 490130.0, 352513.0, 61352.0, 11073.0, 3342.0, 1661.0, 1079.0, 783.0, 591.0, 457.0, 328.0, 276.0, 198.0, 147.0, 108.0, 88.0, 68.0, 61.0, 30.0, 21.0, 18.0, 9.0, 9.0, 10.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-13.09375, -12.6954345703125, -12.297119140625, -11.8988037109375, -11.50048828125, -11.1021728515625, -10.703857421875, -10.3055419921875, -9.9072265625, -9.5089111328125, -9.110595703125, -8.7122802734375, -8.31396484375, -7.9156494140625, -7.517333984375, -7.1190185546875, -6.720703125, -6.3223876953125, -5.924072265625, -5.5257568359375, -5.12744140625, -4.7291259765625, -4.330810546875, -3.9324951171875, -3.5341796875, -3.1358642578125, -2.737548828125, -2.3392333984375, -1.94091796875, -1.5426025390625, -1.144287109375, -0.7459716796875, -0.34765625, 0.0506591796875, 0.448974609375, 0.8472900390625, 1.24560546875, 1.6439208984375, 2.042236328125, 2.4405517578125, 2.8388671875, 3.2371826171875, 3.635498046875, 4.0338134765625, 4.43212890625, 4.8304443359375, 5.228759765625, 5.6270751953125, 6.025390625, 6.4237060546875, 6.822021484375, 7.2203369140625, 7.61865234375, 8.0169677734375, 8.415283203125, 8.8135986328125, 9.2119140625, 9.6102294921875, 10.008544921875, 10.4068603515625, 10.80517578125, 11.2034912109375, 11.601806640625, 12.0001220703125, 12.3984375]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 0.0, 2.0, 5.0, 9.0, 14.0, 10.0, 18.0, 11.0, 25.0, 30.0, 36.0, 49.0, 51.0, 56.0, 73.0, 103.0, 233.0, 1592.0, 223.0, 104.0, 70.0, 68.0, 69.0, 35.0, 39.0, 24.0, 29.0, 17.0, 11.0, 10.0, 2.0, 6.0, 6.0, 4.0, 7.0, 4.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.59375, -21.852294921875, -21.11083984375, -20.369384765625, -19.6279296875, -18.886474609375, -18.14501953125, -17.403564453125, -16.662109375, -15.920654296875, -15.17919921875, -14.437744140625, -13.6962890625, -12.954833984375, -12.21337890625, -11.471923828125, -10.73046875, -9.989013671875, -9.24755859375, -8.506103515625, -7.7646484375, -7.023193359375, -6.28173828125, -5.540283203125, -4.798828125, -4.057373046875, -3.31591796875, -2.574462890625, -1.8330078125, -1.091552734375, -0.35009765625, 0.391357421875, 1.1328125, 1.874267578125, 2.61572265625, 3.357177734375, 4.0986328125, 4.840087890625, 5.58154296875, 6.322998046875, 7.064453125, 7.805908203125, 8.54736328125, 9.288818359375, 10.0302734375, 10.771728515625, 11.51318359375, 12.254638671875, 12.99609375, 13.737548828125, 14.47900390625, 15.220458984375, 15.9619140625, 16.703369140625, 17.44482421875, 18.186279296875, 18.927734375, 19.669189453125, 20.41064453125, 21.152099609375, 21.8935546875, 22.635009765625, 23.37646484375, 24.117919921875, 24.859375]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 4.0, 5.0, 8.0, 9.0, 15.0, 22.0, 16.0, 24.0, 41.0, 52.0, 83.0, 124.0, 259.0, 429.0, 1056.0, 11580.0, 3125621.0, 4525.0, 871.0, 350.0, 193.0, 137.0, 72.0, 52.0, 41.0, 31.0, 20.0, 22.0, 9.0, 11.0, 7.0, 8.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-89.625, -87.22900390625, -84.8330078125, -82.43701171875, -80.041015625, -77.64501953125, -75.2490234375, -72.85302734375, -70.45703125, -68.06103515625, -65.6650390625, -63.26904296875, -60.873046875, -58.47705078125, -56.0810546875, -53.68505859375, -51.2890625, -48.89306640625, -46.4970703125, -44.10107421875, -41.705078125, -39.30908203125, -36.9130859375, -34.51708984375, -32.12109375, -29.72509765625, -27.3291015625, -24.93310546875, -22.537109375, -20.14111328125, -17.7451171875, -15.34912109375, -12.953125, -10.55712890625, -8.1611328125, -5.76513671875, -3.369140625, -0.97314453125, 1.4228515625, 3.81884765625, 6.21484375, 8.61083984375, 11.0068359375, 13.40283203125, 15.798828125, 18.19482421875, 20.5908203125, 22.98681640625, 25.3828125, 27.77880859375, 30.1748046875, 32.57080078125, 34.966796875, 37.36279296875, 39.7587890625, 42.15478515625, 44.55078125, 46.94677734375, 49.3427734375, 51.73876953125, 54.134765625, 56.53076171875, 58.9267578125, 61.32275390625, 63.71875]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 227.0, 685.0, 96.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-249.56735229492188, -243.38369750976562, -237.20005798339844, -231.0164031982422, -224.83274841308594, -218.64910888671875, -212.4654541015625, -206.28179931640625, -200.09815979003906, -193.9145050048828, -187.73086547851562, -181.54721069335938, -175.36355590820312, -169.17991638183594, -162.9962615966797, -156.8126220703125, -150.62896728515625, -144.4453125, -138.2616729736328, -132.07801818847656, -125.89437103271484, -119.71072387695312, -113.52706909179688, -107.34342193603516, -101.15975952148438, -94.97611236572266, -88.7924575805664, -82.60881042480469, -76.42516326904297, -70.24151611328125, -64.057861328125, -57.87421417236328, -51.69056701660156, -45.50691604614258, -39.32326889038086, -33.139617919921875, -26.955968856811523, -20.772319793701172, -14.588668823242188, -8.405021667480469, -2.2213706970214844, 3.9622788429260254, 10.145928382873535, 16.329578399658203, 22.513227462768555, 28.696876525878906, 34.88052749633789, 41.06417465209961, 47.247825622558594, 53.43147659301758, 59.6151237487793, 65.79877471923828, 71.982421875, 78.16607666015625, 84.34972381591797, 90.53337097167969, 96.71702575683594, 102.90067291259766, 109.0843276977539, 115.26797485351562, 121.45162200927734, 127.63526916503906, 133.8189239501953, 140.0025634765625, 146.18621826171875]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 4.0, 2.0, 3.0, 5.0, 2.0, 4.0, 7.0, 5.0, 8.0, 11.0, 8.0, 9.0, 16.0, 15.0, 23.0, 16.0, 12.0, 21.0, 12.0, 25.0, 21.0, 35.0, 28.0, 30.0, 38.0, 30.0, 35.0, 28.0, 51.0, 31.0, 35.0, 42.0, 38.0, 30.0, 29.0, 31.0, 26.0, 31.0, 33.0, 25.0, 20.0, 16.0, 16.0, 19.0, 16.0, 9.0, 10.0, 13.0, 6.0, 12.0, 3.0, 2.0, 5.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-48.26645278930664, -46.85055160522461, -45.43465042114258, -44.01874923706055, -42.60284423828125, -41.18694305419922, -39.77104187011719, -38.355140686035156, -36.939239501953125, -35.523338317871094, -34.10743713378906, -32.69153594970703, -31.275632858276367, -29.859731674194336, -28.443828582763672, -27.02792739868164, -25.61202621459961, -24.196125030517578, -22.780223846435547, -21.364320755004883, -19.94841957092285, -18.53251838684082, -17.116615295410156, -15.700714111328125, -14.284812927246094, -12.868911743164062, -11.453009605407715, -10.037107467651367, -8.621206283569336, -7.2053046226501465, -5.789402961730957, -4.373500823974609, -2.9575958251953125, -1.541694164276123, -0.1257925033569336, 1.2901091575622559, 2.7060108184814453, 4.121912479400635, 5.537814140319824, 6.953716278076172, 8.369617462158203, 9.785518646240234, 11.201420783996582, 12.61732292175293, 14.033224105834961, 15.449125289916992, 16.865028381347656, 18.280929565429688, 19.69683074951172, 21.11273193359375, 22.52863311767578, 23.944536209106445, 25.360437393188477, 26.776338577270508, 28.192241668701172, 29.608142852783203, 31.024044036865234, 32.439945220947266, 33.8558464050293, 35.27174758911133, 36.687652587890625, 38.103553771972656, 39.51945495605469, 40.93535614013672, 42.35125732421875]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 6.0, 2.0, 1.0, 5.0, 7.0, 6.0, 11.0, 14.0, 11.0, 22.0, 13.0, 24.0, 27.0, 30.0, 31.0, 33.0, 39.0, 46.0, 40.0, 42.0, 41.0, 43.0, 45.0, 39.0, 39.0, 34.0, 37.0, 38.0, 39.0, 36.0, 32.0, 24.0, 20.0, 19.0, 14.0, 17.0, 14.0, 9.0, 15.0, 9.0, 8.0, 6.0, 8.0, 4.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.32421875, -7.07635498046875, -6.8284912109375, -6.58062744140625, -6.332763671875, -6.08489990234375, -5.8370361328125, -5.58917236328125, -5.34130859375, -5.09344482421875, -4.8455810546875, -4.59771728515625, -4.349853515625, -4.10198974609375, -3.8541259765625, -3.60626220703125, -3.3583984375, -3.11053466796875, -2.8626708984375, -2.61480712890625, -2.366943359375, -2.11907958984375, -1.8712158203125, -1.62335205078125, -1.37548828125, -1.12762451171875, -0.8797607421875, -0.63189697265625, -0.384033203125, -0.13616943359375, 0.1116943359375, 0.35955810546875, 0.607421875, 0.85528564453125, 1.1031494140625, 1.35101318359375, 1.598876953125, 1.84674072265625, 2.0946044921875, 2.34246826171875, 2.59033203125, 2.83819580078125, 3.0860595703125, 3.33392333984375, 3.581787109375, 3.82965087890625, 4.0775146484375, 4.32537841796875, 4.5732421875, 4.82110595703125, 5.0689697265625, 5.31683349609375, 5.564697265625, 5.81256103515625, 6.0604248046875, 6.30828857421875, 6.55615234375, 6.80401611328125, 7.0518798828125, 7.29974365234375, 7.547607421875, 7.79547119140625, 8.0433349609375, 8.29119873046875, 8.5390625]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 4.0, 2.0, 5.0, 6.0, 7.0, 5.0, 11.0, 15.0, 15.0, 23.0, 32.0, 31.0, 53.0, 60.0, 70.0, 90.0, 119.0, 168.0, 241.0, 447.0, 861.0, 1774.0, 4389.0, 15151.0, 101627.0, 1050248.0, 2508625.0, 451182.0, 43436.0, 9220.0, 3169.0, 1326.0, 650.0, 379.0, 210.0, 166.0, 102.0, 77.0, 60.0, 58.0, 39.0, 36.0, 28.0, 24.0, 11.0, 14.0, 10.0, 7.0, 1.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-17.734375, -17.217529296875, -16.70068359375, -16.183837890625, -15.6669921875, -15.150146484375, -14.63330078125, -14.116455078125, -13.599609375, -13.082763671875, -12.56591796875, -12.049072265625, -11.5322265625, -11.015380859375, -10.49853515625, -9.981689453125, -9.46484375, -8.947998046875, -8.43115234375, -7.914306640625, -7.3974609375, -6.880615234375, -6.36376953125, -5.846923828125, -5.330078125, -4.813232421875, -4.29638671875, -3.779541015625, -3.2626953125, -2.745849609375, -2.22900390625, -1.712158203125, -1.1953125, -0.678466796875, -0.16162109375, 0.355224609375, 0.8720703125, 1.388916015625, 1.90576171875, 2.422607421875, 2.939453125, 3.456298828125, 3.97314453125, 4.489990234375, 5.0068359375, 5.523681640625, 6.04052734375, 6.557373046875, 7.07421875, 7.591064453125, 8.10791015625, 8.624755859375, 9.1416015625, 9.658447265625, 10.17529296875, 10.692138671875, 11.208984375, 11.725830078125, 12.24267578125, 12.759521484375, 13.2763671875, 13.793212890625, 14.31005859375, 14.826904296875, 15.34375]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 5.0, 2.0, 4.0, 5.0, 8.0, 13.0, 8.0, 18.0, 31.0, 62.0, 73.0, 102.0, 140.0, 207.0, 281.0, 484.0, 636.0, 555.0, 452.0, 263.0, 184.0, 165.0, 103.0, 83.0, 57.0, 45.0, 25.0, 17.0, 22.0, 9.0, 6.0, 6.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.6328125, -13.1248779296875, -12.616943359375, -12.1090087890625, -11.60107421875, -11.0931396484375, -10.585205078125, -10.0772705078125, -9.5693359375, -9.0614013671875, -8.553466796875, -8.0455322265625, -7.53759765625, -7.0296630859375, -6.521728515625, -6.0137939453125, -5.505859375, -4.9979248046875, -4.489990234375, -3.9820556640625, -3.47412109375, -2.9661865234375, -2.458251953125, -1.9503173828125, -1.4423828125, -0.9344482421875, -0.426513671875, 0.0814208984375, 0.58935546875, 1.0972900390625, 1.605224609375, 2.1131591796875, 2.62109375, 3.1290283203125, 3.636962890625, 4.1448974609375, 4.65283203125, 5.1607666015625, 5.668701171875, 6.1766357421875, 6.6845703125, 7.1925048828125, 7.700439453125, 8.2083740234375, 8.71630859375, 9.2242431640625, 9.732177734375, 10.2401123046875, 10.748046875, 11.2559814453125, 11.763916015625, 12.2718505859375, 12.77978515625, 13.2877197265625, 13.795654296875, 14.3035888671875, 14.8115234375, 15.3194580078125, 15.827392578125, 16.3353271484375, 16.84326171875, 17.3511962890625, 17.859130859375, 18.3670654296875, 18.875]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 3.0, 4.0, 5.0, 3.0, 15.0, 19.0, 17.0, 29.0, 46.0, 80.0, 118.0, 238.0, 391.0, 926.0, 2733.0, 16693.0, 728260.0, 3385834.0, 51971.0, 4533.0, 1254.0, 494.0, 255.0, 126.0, 67.0, 50.0, 45.0, 22.0, 16.0, 15.0, 9.0, 2.0, 2.0, 3.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.15625, -32.98583984375, -31.8154296875, -30.64501953125, -29.474609375, -28.30419921875, -27.1337890625, -25.96337890625, -24.79296875, -23.62255859375, -22.4521484375, -21.28173828125, -20.111328125, -18.94091796875, -17.7705078125, -16.60009765625, -15.4296875, -14.25927734375, -13.0888671875, -11.91845703125, -10.748046875, -9.57763671875, -8.4072265625, -7.23681640625, -6.06640625, -4.89599609375, -3.7255859375, -2.55517578125, -1.384765625, -0.21435546875, 0.9560546875, 2.12646484375, 3.296875, 4.46728515625, 5.6376953125, 6.80810546875, 7.978515625, 9.14892578125, 10.3193359375, 11.48974609375, 12.66015625, 13.83056640625, 15.0009765625, 16.17138671875, 17.341796875, 18.51220703125, 19.6826171875, 20.85302734375, 22.0234375, 23.19384765625, 24.3642578125, 25.53466796875, 26.705078125, 27.87548828125, 29.0458984375, 30.21630859375, 31.38671875, 32.55712890625, 33.7275390625, 34.89794921875, 36.068359375, 37.23876953125, 38.4091796875, 39.57958984375, 40.75]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 986.0, 26.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-819.9397583007812, -786.6697387695312, -753.399658203125, -720.129638671875, -686.8595581054688, -653.5895385742188, -620.3194580078125, -587.0494384765625, -553.7794189453125, -520.5093994140625, -487.23931884765625, -453.96929931640625, -420.69921875, -387.42919921875, -354.1591491699219, -320.88909912109375, -287.6190185546875, -254.34896850585938, -221.07891845703125, -187.8088836669922, -154.53883361816406, -121.26878356933594, -87.99874877929688, -54.72869873046875, -21.458648681640625, 11.811397552490234, 45.081443786621094, 78.35148620605469, 111.62153625488281, 144.89158630371094, 178.16162109375, 211.43167114257812, 244.7017822265625, 277.9718322753906, 311.24188232421875, 344.51190185546875, 377.781982421875, 411.052001953125, 444.3220520019531, 477.59210205078125, 510.8621520996094, 544.1322021484375, 577.4022216796875, 610.6723022460938, 643.9423217773438, 677.21240234375, 710.482421875, 743.75244140625, 777.0225219726562, 810.2925415039062, 843.5626220703125, 876.8326416015625, 910.1027221679688, 943.3727416992188, 976.642822265625, 1009.912841796875, 1043.182861328125, 1076.452880859375, 1109.722900390625, 1142.9930419921875, 1176.2630615234375, 1209.5330810546875, 1242.8031005859375, 1276.0732421875, 1309.34326171875]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 5.0, 8.0, 9.0, 6.0, 4.0, 5.0, 15.0, 22.0, 27.0, 30.0, 24.0, 29.0, 36.0, 35.0, 31.0, 39.0, 45.0, 42.0, 50.0, 55.0, 63.0, 53.0, 42.0, 36.0, 45.0, 44.0, 36.0, 33.0, 19.0, 17.0, 18.0, 15.0, 17.0, 14.0, 14.0, 5.0, 3.0, 7.0, 1.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-76.0504150390625, -73.94217681884766, -71.83394622802734, -69.7257080078125, -67.61747741699219, -65.50923919677734, -63.401004791259766, -61.29277038574219, -59.18453598022461, -57.07630157470703, -54.96806716918945, -52.859832763671875, -50.75159454345703, -48.64336395263672, -46.535125732421875, -44.4268913269043, -42.31865692138672, -40.21042251586914, -38.10218811035156, -35.993953704833984, -33.885719299316406, -31.777482986450195, -29.669246673583984, -27.561012268066406, -25.452777862548828, -23.34454345703125, -21.236309051513672, -19.12807273864746, -17.019838333129883, -14.911603927612305, -12.80336856842041, -10.695133209228516, -8.586898803710938, -6.478663921356201, -4.370429039001465, -2.2621941566467285, -0.1539592742919922, 1.954275131225586, 4.0625104904174805, 6.170745849609375, 8.278980255126953, 10.387214660644531, 12.495450019836426, 14.60368537902832, 16.7119197845459, 18.820154190063477, 20.928390502929688, 23.036624908447266, 25.144859313964844, 27.253093719482422, 29.361328125, 31.46956443786621, 33.577796936035156, 35.68603515625, 37.79426956176758, 39.902503967285156, 42.010738372802734, 44.11897277832031, 46.22720718383789, 48.33544158935547, 50.44367980957031, 52.551910400390625, 54.66014862060547, 56.76838302612305, 58.876617431640625]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 4.0, 3.0, 2.0, 2.0, 9.0, 6.0, 9.0, 9.0, 16.0, 11.0, 10.0, 21.0, 21.0, 18.0, 17.0, 21.0, 31.0, 29.0, 27.0, 29.0, 32.0, 30.0, 36.0, 35.0, 31.0, 45.0, 30.0, 50.0, 33.0, 35.0, 38.0, 38.0, 21.0, 35.0, 18.0, 25.0, 32.0, 16.0, 15.0, 18.0, 13.0, 16.0, 18.0, 14.0, 10.0, 5.0, 6.0, 8.0, 4.0, 3.0, 5.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-4.8984375, -4.730712890625, -4.56298828125, -4.395263671875, -4.2275390625, -4.059814453125, -3.89208984375, -3.724365234375, -3.556640625, -3.388916015625, -3.22119140625, -3.053466796875, -2.8857421875, -2.718017578125, -2.55029296875, -2.382568359375, -2.21484375, -2.047119140625, -1.87939453125, -1.711669921875, -1.5439453125, -1.376220703125, -1.20849609375, -1.040771484375, -0.873046875, -0.705322265625, -0.53759765625, -0.369873046875, -0.2021484375, -0.034423828125, 0.13330078125, 0.301025390625, 0.46875, 0.636474609375, 0.80419921875, 0.971923828125, 1.1396484375, 1.307373046875, 1.47509765625, 1.642822265625, 1.810546875, 1.978271484375, 2.14599609375, 2.313720703125, 2.4814453125, 2.649169921875, 2.81689453125, 2.984619140625, 3.15234375, 3.320068359375, 3.48779296875, 3.655517578125, 3.8232421875, 3.990966796875, 4.15869140625, 4.326416015625, 4.494140625, 4.661865234375, 4.82958984375, 4.997314453125, 5.1650390625, 5.332763671875, 5.50048828125, 5.668212890625, 5.8359375]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 6.0, 2.0, 8.0, 13.0, 18.0, 34.0, 42.0, 57.0, 90.0, 107.0, 191.0, 291.0, 399.0, 535.0, 813.0, 1200.0, 1626.0, 2418.0, 3537.0, 5406.0, 7946.0, 12506.0, 19971.0, 33191.0, 57144.0, 100796.0, 168897.0, 214623.0, 168668.0, 100758.0, 56480.0, 33286.0, 19963.0, 12711.0, 8151.0, 5364.0, 3493.0, 2442.0, 1616.0, 1126.0, 838.0, 550.0, 390.0, 272.0, 189.0, 131.0, 96.0, 59.0, 46.0, 19.0, 14.0, 13.0, 9.0, 8.0, 2.0, 3.0, 2.0, 1.0, 2.0], "bins": [-0.57177734375, -0.5541839599609375, -0.536590576171875, -0.5189971923828125, -0.50140380859375, -0.4838104248046875, -0.466217041015625, -0.4486236572265625, -0.4310302734375, -0.4134368896484375, -0.395843505859375, -0.3782501220703125, -0.36065673828125, -0.3430633544921875, -0.325469970703125, -0.3078765869140625, -0.290283203125, -0.2726898193359375, -0.255096435546875, -0.2375030517578125, -0.21990966796875, -0.2023162841796875, -0.184722900390625, -0.1671295166015625, -0.1495361328125, -0.1319427490234375, -0.114349365234375, -0.0967559814453125, -0.07916259765625, -0.0615692138671875, -0.043975830078125, -0.0263824462890625, -0.0087890625, 0.0088043212890625, 0.026397705078125, 0.0439910888671875, 0.06158447265625, 0.0791778564453125, 0.096771240234375, 0.1143646240234375, 0.1319580078125, 0.1495513916015625, 0.167144775390625, 0.1847381591796875, 0.20233154296875, 0.2199249267578125, 0.237518310546875, 0.2551116943359375, 0.272705078125, 0.2902984619140625, 0.307891845703125, 0.3254852294921875, 0.34307861328125, 0.3606719970703125, 0.378265380859375, 0.3958587646484375, 0.4134521484375, 0.4310455322265625, 0.448638916015625, 0.4662322998046875, 0.48382568359375, 0.5014190673828125, 0.519012451171875, 0.5366058349609375, 0.55419921875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 1.0, 4.0, 9.0, 9.0, 9.0, 17.0, 12.0, 23.0, 21.0, 28.0, 35.0, 21.0, 31.0, 36.0, 37.0, 36.0, 35.0, 40.0, 40.0, 1056.0, 46.0, 46.0, 39.0, 50.0, 37.0, 33.0, 31.0, 38.0, 28.0, 36.0, 23.0, 16.0, 16.0, 17.0, 17.0, 13.0, 12.0, 10.0, 2.0, 7.0, 5.0, 2.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.00390625, -3.87774658203125, -3.7515869140625, -3.62542724609375, -3.499267578125, -3.37310791015625, -3.2469482421875, -3.12078857421875, -2.99462890625, -2.86846923828125, -2.7423095703125, -2.61614990234375, -2.489990234375, -2.36383056640625, -2.2376708984375, -2.11151123046875, -1.9853515625, -1.85919189453125, -1.7330322265625, -1.60687255859375, -1.480712890625, -1.35455322265625, -1.2283935546875, -1.10223388671875, -0.97607421875, -0.84991455078125, -0.7237548828125, -0.59759521484375, -0.471435546875, -0.34527587890625, -0.2191162109375, -0.09295654296875, 0.033203125, 0.15936279296875, 0.2855224609375, 0.41168212890625, 0.537841796875, 0.66400146484375, 0.7901611328125, 0.91632080078125, 1.04248046875, 1.16864013671875, 1.2947998046875, 1.42095947265625, 1.547119140625, 1.67327880859375, 1.7994384765625, 1.92559814453125, 2.0517578125, 2.17791748046875, 2.3040771484375, 2.43023681640625, 2.556396484375, 2.68255615234375, 2.8087158203125, 2.93487548828125, 3.06103515625, 3.18719482421875, 3.3133544921875, 3.43951416015625, 3.565673828125, 3.69183349609375, 3.8179931640625, 3.94415283203125, 4.0703125]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 6.0, 4.0, 6.0, 11.0, 16.0, 22.0, 41.0, 39.0, 56.0, 102.0, 150.0, 241.0, 355.0, 553.0, 902.0, 1196.0, 1941.0, 2870.0, 4335.0, 6430.0, 9900.0, 15164.0, 23760.0, 37534.0, 59815.0, 95813.0, 147567.0, 1233076.0, 161768.0, 108090.0, 67375.0, 42077.0, 26836.0, 16991.0, 11069.0, 7236.0, 4751.0, 3104.0, 2018.0, 1323.0, 846.0, 604.0, 390.0, 288.0, 162.0, 121.0, 69.0, 47.0, 35.0, 15.0, 8.0, 10.0, 1.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.421142578125, -0.4064369201660156, -0.39173126220703125, -0.3770256042480469, -0.3623199462890625, -0.3476142883300781, -0.33290863037109375, -0.3182029724121094, -0.303497314453125, -0.2887916564941406, -0.27408599853515625, -0.2593803405761719, -0.2446746826171875, -0.22996902465820312, -0.21526336669921875, -0.20055770874023438, -0.18585205078125, -0.17114639282226562, -0.15644073486328125, -0.14173507690429688, -0.1270294189453125, -0.11232376098632812, -0.09761810302734375, -0.08291244506835938, -0.068206787109375, -0.053501129150390625, -0.03879547119140625, -0.024089813232421875, -0.0093841552734375, 0.005321502685546875, 0.02002716064453125, 0.034732818603515625, 0.0494384765625, 0.06414413452148438, 0.07884979248046875, 0.09355545043945312, 0.1082611083984375, 0.12296676635742188, 0.13767242431640625, 0.15237808227539062, 0.167083740234375, 0.18178939819335938, 0.19649505615234375, 0.21120071411132812, 0.2259063720703125, 0.24061203002929688, 0.25531768798828125, 0.2700233459472656, 0.28472900390625, 0.2994346618652344, 0.31414031982421875, 0.3288459777832031, 0.3435516357421875, 0.3582572937011719, 0.37296295166015625, 0.3876686096191406, 0.402374267578125, 0.4170799255371094, 0.43178558349609375, 0.4464912414550781, 0.4611968994140625, 0.4759025573730469, 0.49060821533203125, 0.5053138732910156, 0.52001953125]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 2.0, 1.0, 8.0, 4.0, 6.0, 8.0, 14.0, 16.0, 22.0, 25.0, 22.0, 28.0, 21.0, 27.0, 27.0, 26.0, 52.0, 44.0, 37.0, 25.0, 52.0, 39.0, 43.0, 55.0, 37.0, 48.0, 47.0, 34.0, 31.0, 28.0, 31.0, 27.0, 29.0, 16.0, 13.0, 19.0, 12.0, 6.0, 3.0, 2.0, 4.0, 1.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0008096694946289062, -0.000783674418926239, -0.0007576793432235718, -0.0007316842675209045, -0.0007056891918182373, -0.0006796941161155701, -0.0006536990404129028, -0.0006277039647102356, -0.0006017088890075684, -0.0005757138133049011, -0.0005497187376022339, -0.0005237236618995667, -0.0004977285861968994, -0.0004717335104942322, -0.00044573843479156494, -0.0004197433590888977, -0.00039374828338623047, -0.00036775320768356323, -0.000341758131980896, -0.00031576305627822876, -0.0002897679805755615, -0.0002637729048728943, -0.00023777782917022705, -0.00021178275346755981, -0.00018578767776489258, -0.00015979260206222534, -0.0001337975263595581, -0.00010780245065689087, -8.180737495422363e-05, -5.5812299251556396e-05, -2.981722354888916e-05, -3.822147846221924e-06, 2.2172927856445312e-05, 4.816800355911255e-05, 7.416307926177979e-05, 0.00010015815496444702, 0.00012615323066711426, 0.0001521483063697815, 0.00017814338207244873, 0.00020413845777511597, 0.0002301335334777832, 0.00025612860918045044, 0.0002821236848831177, 0.0003081187605857849, 0.00033411383628845215, 0.0003601089119911194, 0.0003861039876937866, 0.00041209906339645386, 0.0004380941390991211, 0.00046408921480178833, 0.0004900842905044556, 0.0005160793662071228, 0.00054207444190979, 0.0005680695176124573, 0.0005940645933151245, 0.0006200596690177917, 0.000646054744720459, 0.0006720498204231262, 0.0006980448961257935, 0.0007240399718284607, 0.0007500350475311279, 0.0007760301232337952, 0.0008020251989364624, 0.0008280202746391296, 0.0008540153503417969]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 1.0, 2.0, 0.0, 4.0, 3.0, 5.0, 4.0, 6.0, 6.0, 9.0, 11.0, 11.0, 32.0, 31.0, 45.0, 42.0, 62.0, 61.0, 110.0, 105.0, 149.0, 244.0, 353.0, 545.0, 960.0, 14901.0, 1019902.0, 8397.0, 896.0, 464.0, 320.0, 218.0, 135.0, 99.0, 102.0, 58.0, 53.0, 51.0, 34.0, 41.0, 17.0, 17.0, 8.0, 6.0, 8.0, 13.0, 9.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0178375244140625, -0.017334461212158203, -0.016831398010253906, -0.01632833480834961, -0.015825271606445312, -0.015322208404541016, -0.014819145202636719, -0.014316082000732422, -0.013813018798828125, -0.013309955596923828, -0.012806892395019531, -0.012303829193115234, -0.011800765991210938, -0.01129770278930664, -0.010794639587402344, -0.010291576385498047, -0.00978851318359375, -0.009285449981689453, -0.008782386779785156, -0.00827932357788086, -0.0077762603759765625, -0.007273197174072266, -0.006770133972167969, -0.006267070770263672, -0.005764007568359375, -0.005260944366455078, -0.004757881164550781, -0.004254817962646484, -0.0037517547607421875, -0.0032486915588378906, -0.0027456283569335938, -0.002242565155029297, -0.001739501953125, -0.0012364387512207031, -0.0007333755493164062, -0.00023031234741210938, 0.0002727508544921875, 0.0007758140563964844, 0.0012788772583007812, 0.0017819404602050781, 0.002285003662109375, 0.002788066864013672, 0.0032911300659179688, 0.0037941932678222656, 0.0042972564697265625, 0.004800319671630859, 0.005303382873535156, 0.005806446075439453, 0.00630950927734375, 0.006812572479248047, 0.007315635681152344, 0.00781869888305664, 0.008321762084960938, 0.008824825286865234, 0.009327888488769531, 0.009830951690673828, 0.010334014892578125, 0.010837078094482422, 0.011340141296386719, 0.011843204498291016, 0.012346267700195312, 0.01284933090209961, 0.013352394104003906, 0.013855457305908203, 0.0143585205078125]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 6.0, 49.0, 180.0, 356.0, 287.0, 99.0, 24.0, 7.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00146421417593956, -0.0014116031816229224, -0.001358992070890963, -0.0013063810765743256, -0.0012537699658423662, -0.0012011589715257287, -0.0011485479772090912, -0.0010959368664771318, -0.0010433258721604943, -0.0009907148778438568, -0.0009381037671118975, -0.00088549277279526, -0.0008328817202709615, -0.0007802706677466631, -0.0007276596734300256, -0.0006750486209057271, -0.0006224375683814287, -0.0005698265158571303, -0.0005172154633328319, -0.00046460446901619434, -0.0004119934164918959, -0.0003593823639675975, -0.0003067713405471295, -0.00025416031712666154, -0.0002015492646023631, -0.0001489382266299799, -9.632718865759671e-05, -4.3716150685213506e-05, 8.894887287169695e-06, 6.150593981146812e-05, 0.0001141169632319361, 0.00016672798665240407, 0.00021933915559202433, 0.00027195020811632276, 0.00032456123153679073, 0.0003771722549572587, 0.00042978330748155713, 0.00048239436000585556, 0.0005350053543224931, 0.0005876164068467915, 0.0006402274593710899, 0.0006928385118953884, 0.0007454495644196868, 0.0007980605587363243, 0.0008506716112606227, 0.0009032826637849212, 0.0009558936581015587, 0.001008504768833518, 0.0010611157631501555, 0.001113726757466793, 0.0011663378681987524, 0.00121894886251539, 0.0012715598568320274, 0.0013241709675639868, 0.0013767819618806243, 0.0014293929561972618, 0.0014820040669292212, 0.0015346150612458587, 0.001587226171977818, 0.0016398371662944555, 0.0016924482770264149, 0.0017450592713430524, 0.00179767026565969, 0.0018502813763916492, 0.0019028923707082868]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 7.0, 2.0, 3.0, 6.0, 6.0, 7.0, 11.0, 10.0, 5.0, 12.0, 12.0, 12.0, 16.0, 14.0, 26.0, 19.0, 32.0, 39.0, 30.0, 39.0, 29.0, 35.0, 28.0, 41.0, 42.0, 40.0, 40.0, 34.0, 42.0, 27.0, 34.0, 32.0, 30.0, 31.0, 28.0, 17.0, 19.0, 19.0, 13.0, 9.0, 17.0, 12.0, 17.0, 13.0, 11.0, 5.0, 9.0, 5.0, 6.0, 6.0, 6.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.00045561790466308594, -0.0004416732117533684, -0.0004277285188436508, -0.00041378382593393326, -0.0003998391330242157, -0.00038589444011449814, -0.0003719497472047806, -0.000358005054295063, -0.00034406036138534546, -0.0003301156684756279, -0.00031617097556591034, -0.0003022262826561928, -0.0002882815897464752, -0.00027433689683675766, -0.0002603922039270401, -0.00024644751101732254, -0.00023250281810760498, -0.00021855812519788742, -0.00020461343228816986, -0.0001906687393784523, -0.00017672404646873474, -0.00016277935355901718, -0.00014883466064929962, -0.00013488996773958206, -0.0001209452748298645, -0.00010700058192014694, -9.305588901042938e-05, -7.911119610071182e-05, -6.516650319099426e-05, -5.12218102812767e-05, -3.727711737155914e-05, -2.3332424461841583e-05, -9.387731552124023e-06, 4.556961357593536e-06, 1.8501654267311096e-05, 3.2446347177028656e-05, 4.6391040086746216e-05, 6.0335732996463776e-05, 7.428042590618134e-05, 8.82251188158989e-05, 0.00010216981172561646, 0.00011611450463533401, 0.00013005919754505157, 0.00014400389045476913, 0.0001579485833644867, 0.00017189327627420425, 0.00018583796918392181, 0.00019978266209363937, 0.00021372735500335693, 0.0002276720479130745, 0.00024161674082279205, 0.0002555614337325096, 0.00026950612664222717, 0.00028345081955194473, 0.0002973955124616623, 0.00031134020537137985, 0.0003252848982810974, 0.00033922959119081497, 0.00035317428410053253, 0.0003671189770102501, 0.00038106366991996765, 0.0003950083628296852, 0.00040895305573940277, 0.00042289774864912033, 0.0004368424415588379]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 4.0, 3.0, 2.0, 2.0, 9.0, 6.0, 9.0, 9.0, 16.0, 11.0, 10.0, 21.0, 21.0, 18.0, 17.0, 21.0, 31.0, 29.0, 27.0, 29.0, 32.0, 30.0, 36.0, 35.0, 30.0, 46.0, 30.0, 50.0, 33.0, 35.0, 38.0, 38.0, 21.0, 35.0, 18.0, 25.0, 32.0, 16.0, 15.0, 18.0, 13.0, 16.0, 18.0, 14.0, 10.0, 5.0, 6.0, 8.0, 4.0, 3.0, 5.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-4.8984375, -4.730712890625, -4.56298828125, -4.395263671875, -4.2275390625, -4.059814453125, -3.89208984375, -3.724365234375, -3.556640625, -3.388916015625, -3.22119140625, -3.053466796875, -2.8857421875, -2.718017578125, -2.55029296875, -2.382568359375, -2.21484375, -2.047119140625, -1.87939453125, -1.711669921875, -1.5439453125, -1.376220703125, -1.20849609375, -1.040771484375, -0.873046875, -0.705322265625, -0.53759765625, -0.369873046875, -0.2021484375, -0.034423828125, 0.13330078125, 0.301025390625, 0.46875, 0.636474609375, 0.80419921875, 0.971923828125, 1.1396484375, 1.307373046875, 1.47509765625, 1.642822265625, 1.810546875, 1.978271484375, 2.14599609375, 2.313720703125, 2.4814453125, 2.649169921875, 2.81689453125, 2.984619140625, 3.15234375, 3.320068359375, 3.48779296875, 3.655517578125, 3.8232421875, 3.990966796875, 4.15869140625, 4.326416015625, 4.494140625, 4.661865234375, 4.82958984375, 4.997314453125, 5.1650390625, 5.332763671875, 5.50048828125, 5.668212890625, 5.8359375]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 10.0, 8.0, 13.0, 25.0, 30.0, 50.0, 44.0, 59.0, 93.0, 103.0, 160.0, 219.0, 319.0, 447.0, 638.0, 889.0, 1273.0, 1952.0, 3963.0, 8860.0, 34265.0, 249362.0, 619529.0, 94930.0, 17292.0, 5784.0, 2844.0, 1688.0, 1066.0, 743.0, 511.0, 392.0, 263.0, 192.0, 164.0, 119.0, 69.0, 53.0, 27.0, 28.0, 23.0, 20.0, 13.0, 4.0, 2.0, 5.0, 6.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.765625, -14.30810546875, -13.8505859375, -13.39306640625, -12.935546875, -12.47802734375, -12.0205078125, -11.56298828125, -11.10546875, -10.64794921875, -10.1904296875, -9.73291015625, -9.275390625, -8.81787109375, -8.3603515625, -7.90283203125, -7.4453125, -6.98779296875, -6.5302734375, -6.07275390625, -5.615234375, -5.15771484375, -4.7001953125, -4.24267578125, -3.78515625, -3.32763671875, -2.8701171875, -2.41259765625, -1.955078125, -1.49755859375, -1.0400390625, -0.58251953125, -0.125, 0.33251953125, 0.7900390625, 1.24755859375, 1.705078125, 2.16259765625, 2.6201171875, 3.07763671875, 3.53515625, 3.99267578125, 4.4501953125, 4.90771484375, 5.365234375, 5.82275390625, 6.2802734375, 6.73779296875, 7.1953125, 7.65283203125, 8.1103515625, 8.56787109375, 9.025390625, 9.48291015625, 9.9404296875, 10.39794921875, 10.85546875, 11.31298828125, 11.7705078125, 12.22802734375, 12.685546875, 13.14306640625, 13.6005859375, 14.05810546875, 14.515625]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 5.0, 2.0, 4.0, 5.0, 8.0, 19.0, 15.0, 15.0, 19.0, 24.0, 32.0, 34.0, 41.0, 33.0, 36.0, 48.0, 65.0, 74.0, 211.0, 1580.0, 273.0, 99.0, 60.0, 58.0, 39.0, 39.0, 30.0, 32.0, 31.0, 23.0, 22.0, 12.0, 13.0, 8.0, 4.0, 10.0, 8.0, 4.0, 5.0, 5.0, 1.0, 3.0, 3.0, 3.0, 1.0, 2.0], "bins": [-18.8125, -18.312255859375, -17.81201171875, -17.311767578125, -16.8115234375, -16.311279296875, -15.81103515625, -15.310791015625, -14.810546875, -14.310302734375, -13.81005859375, -13.309814453125, -12.8095703125, -12.309326171875, -11.80908203125, -11.308837890625, -10.80859375, -10.308349609375, -9.80810546875, -9.307861328125, -8.8076171875, -8.307373046875, -7.80712890625, -7.306884765625, -6.806640625, -6.306396484375, -5.80615234375, -5.305908203125, -4.8056640625, -4.305419921875, -3.80517578125, -3.304931640625, -2.8046875, -2.304443359375, -1.80419921875, -1.303955078125, -0.8037109375, -0.303466796875, 0.19677734375, 0.697021484375, 1.197265625, 1.697509765625, 2.19775390625, 2.697998046875, 3.1982421875, 3.698486328125, 4.19873046875, 4.698974609375, 5.19921875, 5.699462890625, 6.19970703125, 6.699951171875, 7.2001953125, 7.700439453125, 8.20068359375, 8.700927734375, 9.201171875, 9.701416015625, 10.20166015625, 10.701904296875, 11.2021484375, 11.702392578125, 12.20263671875, 12.702880859375, 13.203125]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 1.0, 7.0, 4.0, 9.0, 10.0, 12.0, 10.0, 16.0, 20.0, 27.0, 37.0, 43.0, 47.0, 60.0, 51.0, 96.0, 111.0, 158.0, 298.0, 444.0, 961.0, 3870.0, 2621136.0, 513280.0, 2826.0, 773.0, 411.0, 243.0, 173.0, 122.0, 80.0, 69.0, 50.0, 49.0, 33.0, 34.0, 32.0, 17.0, 21.0, 14.0, 9.0, 6.0, 5.0, 7.0, 6.0, 5.0, 5.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-36.75, -35.56201171875, -34.3740234375, -33.18603515625, -31.998046875, -30.81005859375, -29.6220703125, -28.43408203125, -27.24609375, -26.05810546875, -24.8701171875, -23.68212890625, -22.494140625, -21.30615234375, -20.1181640625, -18.93017578125, -17.7421875, -16.55419921875, -15.3662109375, -14.17822265625, -12.990234375, -11.80224609375, -10.6142578125, -9.42626953125, -8.23828125, -7.05029296875, -5.8623046875, -4.67431640625, -3.486328125, -2.29833984375, -1.1103515625, 0.07763671875, 1.265625, 2.45361328125, 3.6416015625, 4.82958984375, 6.017578125, 7.20556640625, 8.3935546875, 9.58154296875, 10.76953125, 11.95751953125, 13.1455078125, 14.33349609375, 15.521484375, 16.70947265625, 17.8974609375, 19.08544921875, 20.2734375, 21.46142578125, 22.6494140625, 23.83740234375, 25.025390625, 26.21337890625, 27.4013671875, 28.58935546875, 29.77734375, 30.96533203125, 32.1533203125, 33.34130859375, 34.529296875, 35.71728515625, 36.9052734375, 38.09326171875, 39.28125]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 16.0, 30.0, 95.0, 201.0, 248.0, 226.0, 119.0, 52.0, 21.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.09284591674805, -37.27388000488281, -35.45491027832031, -33.63594436645508, -31.816974639892578, -29.998008728027344, -28.179040908813477, -26.36007308959961, -24.541105270385742, -22.722137451171875, -20.903169631958008, -19.08420181274414, -17.265235900878906, -15.446267127990723, -13.627300262451172, -11.808332443237305, -9.989364624023438, -8.17039680480957, -6.351429462432861, -4.532462120056152, -2.713494300842285, -0.894526481628418, 0.9244403839111328, 2.743408203125, 4.562376022338867, 6.381343841552734, 8.200311660766602, 10.019278526306152, 11.83824634552002, 13.657214164733887, 15.476181030273438, 17.295148849487305, 19.114120483398438, 20.933088302612305, 22.752056121826172, 24.571022033691406, 26.389991760253906, 28.20895767211914, 30.027925491333008, 31.846893310546875, 33.665863037109375, 35.48482894897461, 37.30379867553711, 39.122764587402344, 40.941734313964844, 42.76070022583008, 44.57966613769531, 46.39863586425781, 48.21760177612305, 50.03656768798828, 51.85553741455078, 53.674503326416016, 55.493473052978516, 57.31243896484375, 59.13140869140625, 60.950374603271484, 62.76934051513672, 64.58831024169922, 66.40727233886719, 68.22624206542969, 70.04521179199219, 71.86418151855469, 73.68314361572266, 75.50211334228516, 77.32108306884766]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 2.0, 4.0, 5.0, 8.0, 6.0, 11.0, 17.0, 16.0, 18.0, 22.0, 30.0, 37.0, 20.0, 41.0, 32.0, 39.0, 44.0, 42.0, 39.0, 38.0, 43.0, 41.0, 46.0, 44.0, 32.0, 35.0, 33.0, 25.0, 35.0, 25.0, 25.0, 26.0, 24.0, 15.0, 13.0, 15.0, 10.0, 9.0, 8.0, 9.0, 5.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-38.49690246582031, -37.16041564941406, -35.82392501831055, -34.48743438720703, -33.15094757080078, -31.8144588470459, -30.477970123291016, -29.141481399536133, -27.80499267578125, -26.468503952026367, -25.132015228271484, -23.7955265045166, -22.45903778076172, -21.122549057006836, -19.786060333251953, -18.44957160949707, -17.113082885742188, -15.776594161987305, -14.440105438232422, -13.103616714477539, -11.767127990722656, -10.430639266967773, -9.09415054321289, -7.757661819458008, -6.421173095703125, -5.084684371948242, -3.7481956481933594, -2.4117069244384766, -1.0752182006835938, 0.26127052307128906, 1.5977592468261719, 2.9342479705810547, 4.2707366943359375, 5.60722541809082, 6.943714141845703, 8.280202865600586, 9.616691589355469, 10.953180313110352, 12.289669036865234, 13.626157760620117, 14.962646484375, 16.299135208129883, 17.635623931884766, 18.97211265563965, 20.30860137939453, 21.645090103149414, 22.981578826904297, 24.31806755065918, 25.654556274414062, 26.991044998168945, 28.327533721923828, 29.66402244567871, 31.000511169433594, 32.336997985839844, 33.67348861694336, 35.009979248046875, 36.346466064453125, 37.682952880859375, 39.01944351196289, 40.355934143066406, 41.692420959472656, 43.028907775878906, 44.36539840698242, 45.70188903808594, 47.03837585449219]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 6.0, 2.0, 2.0, 3.0, 9.0, 3.0, 8.0, 11.0, 5.0, 16.0, 18.0, 22.0, 14.0, 13.0, 29.0, 33.0, 29.0, 29.0, 32.0, 28.0, 42.0, 44.0, 31.0, 39.0, 31.0, 32.0, 36.0, 46.0, 35.0, 32.0, 44.0, 35.0, 23.0, 25.0, 26.0, 22.0, 30.0, 17.0, 19.0, 13.0, 11.0, 11.0, 13.0, 10.0, 6.0, 5.0, 5.0, 6.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-5.5390625, -5.35601806640625, -5.1729736328125, -4.98992919921875, -4.806884765625, -4.62384033203125, -4.4407958984375, -4.25775146484375, -4.07470703125, -3.89166259765625, -3.7086181640625, -3.52557373046875, -3.342529296875, -3.15948486328125, -2.9764404296875, -2.79339599609375, -2.6103515625, -2.42730712890625, -2.2442626953125, -2.06121826171875, -1.878173828125, -1.69512939453125, -1.5120849609375, -1.32904052734375, -1.14599609375, -0.96295166015625, -0.7799072265625, -0.59686279296875, -0.413818359375, -0.23077392578125, -0.0477294921875, 0.13531494140625, 0.318359375, 0.50140380859375, 0.6844482421875, 0.86749267578125, 1.050537109375, 1.23358154296875, 1.4166259765625, 1.59967041015625, 1.78271484375, 1.96575927734375, 2.1488037109375, 2.33184814453125, 2.514892578125, 2.69793701171875, 2.8809814453125, 3.06402587890625, 3.2470703125, 3.43011474609375, 3.6131591796875, 3.79620361328125, 3.979248046875, 4.16229248046875, 4.3453369140625, 4.52838134765625, 4.71142578125, 4.89447021484375, 5.0775146484375, 5.26055908203125, 5.443603515625, 5.62664794921875, 5.8096923828125, 5.99273681640625, 6.17578125]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 3.0, 5.0, 6.0, 10.0, 6.0, 9.0, 7.0, 16.0, 23.0, 33.0, 46.0, 78.0, 103.0, 165.0, 233.0, 318.0, 520.0, 815.0, 1303.0, 2274.0, 3978.0, 7751.0, 18477.0, 69066.0, 377028.0, 1564930.0, 1636646.0, 403626.0, 69714.0, 19130.0, 7941.0, 3983.0, 2271.0, 1368.0, 845.0, 515.0, 364.0, 221.0, 137.0, 95.0, 71.0, 42.0, 37.0, 23.0, 12.0, 12.0, 13.0, 5.0, 2.0, 6.0, 7.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.109375, -8.805908203125, -8.50244140625, -8.198974609375, -7.8955078125, -7.592041015625, -7.28857421875, -6.985107421875, -6.681640625, -6.378173828125, -6.07470703125, -5.771240234375, -5.4677734375, -5.164306640625, -4.86083984375, -4.557373046875, -4.25390625, -3.950439453125, -3.64697265625, -3.343505859375, -3.0400390625, -2.736572265625, -2.43310546875, -2.129638671875, -1.826171875, -1.522705078125, -1.21923828125, -0.915771484375, -0.6123046875, -0.308837890625, -0.00537109375, 0.298095703125, 0.6015625, 0.905029296875, 1.20849609375, 1.511962890625, 1.8154296875, 2.118896484375, 2.42236328125, 2.725830078125, 3.029296875, 3.332763671875, 3.63623046875, 3.939697265625, 4.2431640625, 4.546630859375, 4.85009765625, 5.153564453125, 5.45703125, 5.760498046875, 6.06396484375, 6.367431640625, 6.6708984375, 6.974365234375, 7.27783203125, 7.581298828125, 7.884765625, 8.188232421875, 8.49169921875, 8.795166015625, 9.0986328125, 9.402099609375, 9.70556640625, 10.009033203125, 10.3125]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 5.0, 9.0, 17.0, 20.0, 46.0, 72.0, 115.0, 190.0, 285.0, 445.0, 653.0, 759.0, 614.0, 310.0, 228.0, 116.0, 88.0, 40.0, 25.0, 16.0, 10.0, 7.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.0, -18.4443359375, -17.888671875, -17.3330078125, -16.77734375, -16.2216796875, -15.666015625, -15.1103515625, -14.5546875, -13.9990234375, -13.443359375, -12.8876953125, -12.33203125, -11.7763671875, -11.220703125, -10.6650390625, -10.109375, -9.5537109375, -8.998046875, -8.4423828125, -7.88671875, -7.3310546875, -6.775390625, -6.2197265625, -5.6640625, -5.1083984375, -4.552734375, -3.9970703125, -3.44140625, -2.8857421875, -2.330078125, -1.7744140625, -1.21875, -0.6630859375, -0.107421875, 0.4482421875, 1.00390625, 1.5595703125, 2.115234375, 2.6708984375, 3.2265625, 3.7822265625, 4.337890625, 4.8935546875, 5.44921875, 6.0048828125, 6.560546875, 7.1162109375, 7.671875, 8.2275390625, 8.783203125, 9.3388671875, 9.89453125, 10.4501953125, 11.005859375, 11.5615234375, 12.1171875, 12.6728515625, 13.228515625, 13.7841796875, 14.33984375, 14.8955078125, 15.451171875, 16.0068359375, 16.5625]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 4.0, 6.0, 8.0, 5.0, 3.0, 12.0, 31.0, 43.0, 52.0, 120.0, 216.0, 421.0, 1041.0, 2872.0, 45406.0, 4064720.0, 73989.0, 3177.0, 1035.0, 496.0, 269.0, 139.0, 82.0, 56.0, 19.0, 21.0, 16.0, 7.0, 7.0, 2.0, 3.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.3125, -33.1103515625, -31.908203125, -30.7060546875, -29.50390625, -28.3017578125, -27.099609375, -25.8974609375, -24.6953125, -23.4931640625, -22.291015625, -21.0888671875, -19.88671875, -18.6845703125, -17.482421875, -16.2802734375, -15.078125, -13.8759765625, -12.673828125, -11.4716796875, -10.26953125, -9.0673828125, -7.865234375, -6.6630859375, -5.4609375, -4.2587890625, -3.056640625, -1.8544921875, -0.65234375, 0.5498046875, 1.751953125, 2.9541015625, 4.15625, 5.3583984375, 6.560546875, 7.7626953125, 8.96484375, 10.1669921875, 11.369140625, 12.5712890625, 13.7734375, 14.9755859375, 16.177734375, 17.3798828125, 18.58203125, 19.7841796875, 20.986328125, 22.1884765625, 23.390625, 24.5927734375, 25.794921875, 26.9970703125, 28.19921875, 29.4013671875, 30.603515625, 31.8056640625, 33.0078125, 34.2099609375, 35.412109375, 36.6142578125, 37.81640625, 39.0185546875, 40.220703125, 41.4228515625, 42.625]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 127.0, 685.0, 184.0, 15.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-102.14366149902344, -94.04507446289062, -85.94648742675781, -77.847900390625, -69.74931335449219, -61.65072250366211, -53.55213165283203, -45.45354461669922, -37.354957580566406, -29.256370544433594, -21.15778160095215, -13.059192657470703, -4.960605621337891, 3.137981414794922, 11.236572265625, 19.335159301757812, 27.433746337890625, 35.53233337402344, 43.63092041015625, 51.72951126098633, 59.82809829711914, 67.92668151855469, 76.02527618408203, 84.12386322021484, 92.22245025634766, 100.32103729248047, 108.41962432861328, 116.51821899414062, 124.61680603027344, 132.71539306640625, 140.81398010253906, 148.91256713867188, 157.01116943359375, 165.10975646972656, 173.20834350585938, 181.3069305419922, 189.405517578125, 197.5041046142578, 205.60269165039062, 213.7012939453125, 221.79986572265625, 229.89845275878906, 237.99703979492188, 246.0956268310547, 254.1942138671875, 262.2928161621094, 270.3913879394531, 278.489990234375, 286.58856201171875, 294.6871643066406, 302.7857360839844, 310.88433837890625, 318.98291015625, 327.0815124511719, 335.1800842285156, 343.2786865234375, 351.3772888183594, 359.47589111328125, 367.574462890625, 375.6730651855469, 383.7716369628906, 391.8702392578125, 399.96881103515625, 408.0674133300781, 416.1659851074219]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 6.0, 9.0, 11.0, 11.0, 14.0, 15.0, 12.0, 31.0, 16.0, 21.0, 27.0, 33.0, 25.0, 31.0, 32.0, 30.0, 45.0, 37.0, 42.0, 47.0, 32.0, 41.0, 42.0, 41.0, 40.0, 50.0, 39.0, 26.0, 33.0, 29.0, 24.0, 20.0, 12.0, 19.0, 13.0, 13.0, 9.0, 4.0, 0.0, 7.0, 7.0, 4.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-46.37642288208008, -45.011905670166016, -43.64738464355469, -42.282867431640625, -40.9183464050293, -39.553829193115234, -38.189308166503906, -36.824790954589844, -35.46027374267578, -34.09575653076172, -32.73123550415039, -31.366718292236328, -30.002197265625, -28.637680053710938, -27.273160934448242, -25.908641815185547, -24.54412078857422, -23.179601669311523, -21.815082550048828, -20.450565338134766, -19.086044311523438, -17.721527099609375, -16.35700798034668, -14.992488861083984, -13.627969741821289, -12.263450622558594, -10.898931503295898, -9.53441333770752, -8.169894218444824, -6.805375099182129, -5.44085693359375, -4.076337814331055, -2.711822509765625, -1.3473036289215088, 0.017215251922607422, 1.3817338943481445, 2.74625301361084, 4.110772132873535, 5.475290298461914, 6.839809417724609, 8.204328536987305, 9.56884765625, 10.933366775512695, 12.297884941101074, 13.66240406036377, 15.026923179626465, 16.391441345214844, 17.75596046447754, 19.120479583740234, 20.48499870300293, 21.849517822265625, 23.214035034179688, 24.578556060791016, 25.943073272705078, 27.307592391967773, 28.67211151123047, 30.036630630493164, 31.40114974975586, 32.76566696166992, 34.13018798828125, 35.49470520019531, 36.85922622680664, 38.2237434387207, 39.58826446533203, 40.952781677246094]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 9.0, 5.0, 8.0, 16.0, 19.0, 18.0, 24.0, 20.0, 21.0, 26.0, 19.0, 21.0, 35.0, 48.0, 28.0, 35.0, 46.0, 37.0, 37.0, 49.0, 41.0, 41.0, 32.0, 43.0, 33.0, 28.0, 24.0, 36.0, 34.0, 20.0, 23.0, 18.0, 15.0, 11.0, 21.0, 8.0, 8.0, 12.0, 7.0, 6.0, 4.0, 7.0, 5.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.45703125, -4.30645751953125, -4.1558837890625, -4.00531005859375, -3.854736328125, -3.70416259765625, -3.5535888671875, -3.40301513671875, -3.25244140625, -3.10186767578125, -2.9512939453125, -2.80072021484375, -2.650146484375, -2.49957275390625, -2.3489990234375, -2.19842529296875, -2.0478515625, -1.89727783203125, -1.7467041015625, -1.59613037109375, -1.445556640625, -1.29498291015625, -1.1444091796875, -0.99383544921875, -0.84326171875, -0.69268798828125, -0.5421142578125, -0.39154052734375, -0.240966796875, -0.09039306640625, 0.0601806640625, 0.21075439453125, 0.361328125, 0.51190185546875, 0.6624755859375, 0.81304931640625, 0.963623046875, 1.11419677734375, 1.2647705078125, 1.41534423828125, 1.56591796875, 1.71649169921875, 1.8670654296875, 2.01763916015625, 2.168212890625, 2.31878662109375, 2.4693603515625, 2.61993408203125, 2.7705078125, 2.92108154296875, 3.0716552734375, 3.22222900390625, 3.372802734375, 3.52337646484375, 3.6739501953125, 3.82452392578125, 3.97509765625, 4.12567138671875, 4.2762451171875, 4.42681884765625, 4.577392578125, 4.72796630859375, 4.8785400390625, 5.02911376953125, 5.1796875]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 6.0, 13.0, 17.0, 15.0, 31.0, 63.0, 106.0, 146.0, 253.0, 337.0, 545.0, 856.0, 1364.0, 2086.0, 3346.0, 5249.0, 8575.0, 14142.0, 23637.0, 40717.0, 72734.0, 131740.0, 212279.0, 215195.0, 135471.0, 75383.0, 41795.0, 24385.0, 14592.0, 8742.0, 5373.0, 3317.0, 2194.0, 1419.0, 886.0, 546.0, 340.0, 256.0, 139.0, 93.0, 62.0, 37.0, 29.0, 10.0, 13.0, 6.0, 6.0, 2.0, 3.0, 1.0, 4.0, 1.0, 1.0], "bins": [-0.533203125, -0.5175323486328125, -0.501861572265625, -0.4861907958984375, -0.47052001953125, -0.4548492431640625, -0.439178466796875, -0.4235076904296875, -0.4078369140625, -0.3921661376953125, -0.376495361328125, -0.3608245849609375, -0.34515380859375, -0.3294830322265625, -0.313812255859375, -0.2981414794921875, -0.282470703125, -0.2667999267578125, -0.251129150390625, -0.2354583740234375, -0.21978759765625, -0.2041168212890625, -0.188446044921875, -0.1727752685546875, -0.1571044921875, -0.1414337158203125, -0.125762939453125, -0.1100921630859375, -0.09442138671875, -0.0787506103515625, -0.063079833984375, -0.0474090576171875, -0.03173828125, -0.0160675048828125, -0.000396728515625, 0.0152740478515625, 0.03094482421875, 0.0466156005859375, 0.062286376953125, 0.0779571533203125, 0.0936279296875, 0.1092987060546875, 0.124969482421875, 0.1406402587890625, 0.15631103515625, 0.1719818115234375, 0.187652587890625, 0.2033233642578125, 0.218994140625, 0.2346649169921875, 0.250335693359375, 0.2660064697265625, 0.28167724609375, 0.2973480224609375, 0.313018798828125, 0.3286895751953125, 0.3443603515625, 0.3600311279296875, 0.375701904296875, 0.3913726806640625, 0.40704345703125, 0.4227142333984375, 0.438385009765625, 0.4540557861328125, 0.4697265625]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 1.0, 6.0, 3.0, 5.0, 13.0, 12.0, 9.0, 15.0, 18.0, 21.0, 15.0, 14.0, 28.0, 27.0, 34.0, 35.0, 28.0, 34.0, 49.0, 53.0, 37.0, 30.0, 1060.0, 37.0, 47.0, 33.0, 31.0, 34.0, 30.0, 27.0, 27.0, 32.0, 32.0, 29.0, 27.0, 16.0, 17.0, 7.0, 10.0, 11.0, 10.0, 7.0, 4.0, 2.0, 6.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.23828125, -3.141387939453125, -3.04449462890625, -2.947601318359375, -2.8507080078125, -2.753814697265625, -2.65692138671875, -2.560028076171875, -2.463134765625, -2.366241455078125, -2.26934814453125, -2.172454833984375, -2.0755615234375, -1.978668212890625, -1.88177490234375, -1.784881591796875, -1.68798828125, -1.591094970703125, -1.49420166015625, -1.397308349609375, -1.3004150390625, -1.203521728515625, -1.10662841796875, -1.009735107421875, -0.912841796875, -0.815948486328125, -0.71905517578125, -0.622161865234375, -0.5252685546875, -0.428375244140625, -0.33148193359375, -0.234588623046875, -0.1376953125, -0.040802001953125, 0.05609130859375, 0.152984619140625, 0.2498779296875, 0.346771240234375, 0.44366455078125, 0.540557861328125, 0.637451171875, 0.734344482421875, 0.83123779296875, 0.928131103515625, 1.0250244140625, 1.121917724609375, 1.21881103515625, 1.315704345703125, 1.41259765625, 1.509490966796875, 1.60638427734375, 1.703277587890625, 1.8001708984375, 1.897064208984375, 1.99395751953125, 2.090850830078125, 2.187744140625, 2.284637451171875, 2.38153076171875, 2.478424072265625, 2.5753173828125, 2.672210693359375, 2.76910400390625, 2.865997314453125, 2.962890625]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 1.0, 7.0, 4.0, 13.0, 14.0, 19.0, 29.0, 37.0, 80.0, 110.0, 179.0, 279.0, 404.0, 680.0, 1087.0, 1679.0, 2767.0, 4301.0, 7041.0, 11547.0, 19188.0, 32221.0, 55565.0, 94799.0, 153088.0, 1249802.0, 176717.0, 116355.0, 68956.0, 40129.0, 23628.0, 14076.0, 8317.0, 5288.0, 3197.0, 2087.0, 1262.0, 809.0, 504.0, 318.0, 195.0, 124.0, 85.0, 51.0, 31.0, 27.0, 16.0, 9.0, 14.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.416015625, -0.402008056640625, -0.38800048828125, -0.373992919921875, -0.3599853515625, -0.345977783203125, -0.33197021484375, -0.317962646484375, -0.303955078125, -0.289947509765625, -0.27593994140625, -0.261932373046875, -0.2479248046875, -0.233917236328125, -0.21990966796875, -0.205902099609375, -0.19189453125, -0.177886962890625, -0.16387939453125, -0.149871826171875, -0.1358642578125, -0.121856689453125, -0.10784912109375, -0.093841552734375, -0.079833984375, -0.065826416015625, -0.05181884765625, -0.037811279296875, -0.0238037109375, -0.009796142578125, 0.00421142578125, 0.018218994140625, 0.0322265625, 0.046234130859375, 0.06024169921875, 0.074249267578125, 0.0882568359375, 0.102264404296875, 0.11627197265625, 0.130279541015625, 0.144287109375, 0.158294677734375, 0.17230224609375, 0.186309814453125, 0.2003173828125, 0.214324951171875, 0.22833251953125, 0.242340087890625, 0.25634765625, 0.270355224609375, 0.28436279296875, 0.298370361328125, 0.3123779296875, 0.326385498046875, 0.34039306640625, 0.354400634765625, 0.368408203125, 0.382415771484375, 0.39642333984375, 0.410430908203125, 0.4244384765625, 0.438446044921875, 0.45245361328125, 0.466461181640625, 0.48046875]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 0.0, 4.0, 5.0, 6.0, 8.0, 12.0, 12.0, 8.0, 9.0, 14.0, 15.0, 25.0, 22.0, 22.0, 32.0, 23.0, 30.0, 26.0, 32.0, 27.0, 39.0, 41.0, 46.0, 47.0, 37.0, 35.0, 40.0, 38.0, 30.0, 34.0, 28.0, 40.0, 23.0, 29.0, 16.0, 20.0, 18.0, 22.0, 17.0, 8.0, 13.0, 7.0, 12.0, 5.0, 1.0, 4.0, 8.0, 6.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0006117820739746094, -0.000591181218624115, -0.0005705803632736206, -0.0005499795079231262, -0.0005293786525726318, -0.0005087777972221375, -0.00048817694187164307, -0.0004675760865211487, -0.0004469752311706543, -0.0004263743758201599, -0.00040577352046966553, -0.00038517266511917114, -0.00036457180976867676, -0.0003439709544181824, -0.000323370099067688, -0.0003027692437171936, -0.0002821683883666992, -0.00026156753301620483, -0.00024096667766571045, -0.00022036582231521606, -0.00019976496696472168, -0.0001791641116142273, -0.0001585632562637329, -0.00013796240091323853, -0.00011736154556274414, -9.676069021224976e-05, -7.615983486175537e-05, -5.5558979511260986e-05, -3.49581241607666e-05, -1.4357268810272217e-05, 6.243586540222168e-06, 2.6844441890716553e-05, 4.744529724121094e-05, 6.804615259170532e-05, 8.864700794219971e-05, 0.00010924786329269409, 0.00012984871864318848, 0.00015044957399368286, 0.00017105042934417725, 0.00019165128469467163, 0.00021225214004516602, 0.0002328529953956604, 0.0002534538507461548, 0.00027405470609664917, 0.00029465556144714355, 0.00031525641679763794, 0.0003358572721481323, 0.0003564581274986267, 0.0003770589828491211, 0.0003976598381996155, 0.00041826069355010986, 0.00043886154890060425, 0.00045946240425109863, 0.000480063259601593, 0.0005006641149520874, 0.0005212649703025818, 0.0005418658256530762, 0.0005624666810035706, 0.0005830675363540649, 0.0006036683917045593, 0.0006242692470550537, 0.0006448701024055481, 0.0006654709577560425, 0.0006860718131065369, 0.0007066726684570312]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 9.0, 13.0, 9.0, 5.0, 12.0, 22.0, 27.0, 28.0, 24.0, 36.0, 61.0, 66.0, 72.0, 100.0, 121.0, 170.0, 240.0, 286.0, 404.0, 653.0, 1248.0, 331028.0, 709962.0, 1541.0, 717.0, 455.0, 294.0, 199.0, 162.0, 100.0, 91.0, 72.0, 67.0, 61.0, 30.0, 41.0, 26.0, 25.0, 27.0, 11.0, 7.0, 12.0, 5.0, 8.0, 1.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0132904052734375, -0.012888550758361816, -0.012486696243286133, -0.01208484172821045, -0.011682987213134766, -0.011281132698059082, -0.010879278182983398, -0.010477423667907715, -0.010075569152832031, -0.009673714637756348, -0.009271860122680664, -0.00887000560760498, -0.008468151092529297, -0.008066296577453613, -0.00766444206237793, -0.007262587547302246, -0.0068607330322265625, -0.006458878517150879, -0.006057024002075195, -0.005655169486999512, -0.005253314971923828, -0.0048514604568481445, -0.004449605941772461, -0.004047751426696777, -0.0036458969116210938, -0.00324404239654541, -0.0028421878814697266, -0.002440333366394043, -0.0020384788513183594, -0.0016366243362426758, -0.0012347698211669922, -0.0008329153060913086, -0.000431060791015625, -2.9206275939941406e-05, 0.0003726482391357422, 0.0007745027542114258, 0.0011763572692871094, 0.001578211784362793, 0.0019800662994384766, 0.00238192081451416, 0.0027837753295898438, 0.0031856298446655273, 0.003587484359741211, 0.0039893388748168945, 0.004391193389892578, 0.004793047904968262, 0.005194902420043945, 0.005596756935119629, 0.0059986114501953125, 0.006400465965270996, 0.00680232048034668, 0.007204174995422363, 0.007606029510498047, 0.00800788402557373, 0.008409738540649414, 0.008811593055725098, 0.009213447570800781, 0.009615302085876465, 0.010017156600952148, 0.010419011116027832, 0.010820865631103516, 0.0112227201461792, 0.011624574661254883, 0.012026429176330566, 0.01242828369140625]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 8.0, 134.0, 670.0, 197.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0037641318049281836, -0.0036833547055721283, -0.003602577606216073, -0.0035218005068600178, -0.0034410234075039625, -0.0033602463081479073, -0.0032794689759612083, -0.003198691876605153, -0.003117914777249098, -0.0030371376778930426, -0.0029563605785369873, -0.002875583479180932, -0.002794806379824877, -0.002714029047638178, -0.0026332521811127663, -0.0025524748489260674, -0.0024716979824006557, -0.0023909208830446005, -0.0023101437836885452, -0.00222936668433249, -0.0021485895849764347, -0.002067812252789736, -0.001987035386264324, -0.0019062580540776253, -0.00182548095472157, -0.0017447038553655148, -0.0016639267560094595, -0.0015831496566534042, -0.0015023724408820271, -0.0014215953415259719, -0.0013408182421699166, -0.0012600410263985395, -0.0011792639270424843, -0.001098486827686429, -0.0010177097283303738, -0.0009369325707666576, -0.0008561554132029414, -0.0007753783138468862, -0.0006946012144908309, -0.0006138240569271147, -0.0005330469575710595, -0.00045226982911117375, -0.00037149270065128803, -0.00029071560129523277, -0.00020993847283534706, -0.00012916134437546134, -4.838424501940608e-05, 3.239291254431009e-05, 0.00011317001190036535, 0.00019394714036025107, 0.0002747242688201368, 0.00035550136817619205, 0.00043627849663607776, 0.0005170556250959635, 0.0005978327244520187, 0.0006786098820157349, 0.0007593869813717902, 0.0008401640807278454, 0.0009209412382915616, 0.0010017183376476169, 0.0010824954370036721, 0.0011632726527750492, 0.0012440497521311045, 0.0013248268514871597, 0.001405603950843215]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 6.0, 9.0, 15.0, 12.0, 7.0, 16.0, 19.0, 19.0, 15.0, 22.0, 33.0, 28.0, 30.0, 21.0, 36.0, 30.0, 43.0, 28.0, 51.0, 34.0, 35.0, 45.0, 45.0, 30.0, 28.0, 38.0, 30.0, 26.0, 24.0, 24.0, 32.0, 23.0, 20.0, 18.0, 11.0, 13.0, 18.0, 8.0, 9.0, 7.0, 5.0, 8.0, 6.0, 5.0, 3.0, 3.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0], "bins": [-0.00042617321014404297, -0.0004127919673919678, -0.0003994107246398926, -0.0003860294818878174, -0.0003726482391357422, -0.000359266996383667, -0.0003458857536315918, -0.0003325045108795166, -0.0003191232681274414, -0.0003057420253753662, -0.000292360782623291, -0.0002789795398712158, -0.0002655982971191406, -0.00025221705436706543, -0.00023883581161499023, -0.00022545456886291504, -0.00021207332611083984, -0.00019869208335876465, -0.00018531084060668945, -0.00017192959785461426, -0.00015854835510253906, -0.00014516711235046387, -0.00013178586959838867, -0.00011840462684631348, -0.00010502338409423828, -9.164214134216309e-05, -7.826089859008789e-05, -6.48796558380127e-05, -5.14984130859375e-05, -3.8117170333862305e-05, -2.473592758178711e-05, -1.1354684829711914e-05, 2.0265579223632812e-06, 1.5407800674438477e-05, 2.8789043426513672e-05, 4.217028617858887e-05, 5.555152893066406e-05, 6.893277168273926e-05, 8.231401443481445e-05, 9.569525718688965e-05, 0.00010907649993896484, 0.00012245774269104004, 0.00013583898544311523, 0.00014922022819519043, 0.00016260147094726562, 0.00017598271369934082, 0.00018936395645141602, 0.0002027451992034912, 0.0002161264419555664, 0.0002295076847076416, 0.0002428889274597168, 0.000256270170211792, 0.0002696514129638672, 0.0002830326557159424, 0.0002964138984680176, 0.0003097951412200928, 0.00032317638397216797, 0.00033655762672424316, 0.00034993886947631836, 0.00036332011222839355, 0.00037670135498046875, 0.00039008259773254395, 0.00040346384048461914, 0.00041684508323669434, 0.00043022632598876953]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 9.0, 5.0, 8.0, 16.0, 18.0, 19.0, 24.0, 20.0, 21.0, 26.0, 19.0, 21.0, 35.0, 48.0, 28.0, 35.0, 46.0, 37.0, 37.0, 49.0, 41.0, 41.0, 32.0, 43.0, 33.0, 28.0, 24.0, 36.0, 34.0, 20.0, 23.0, 18.0, 15.0, 11.0, 21.0, 8.0, 8.0, 12.0, 7.0, 6.0, 4.0, 7.0, 5.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.45703125, -4.30645751953125, -4.1558837890625, -4.00531005859375, -3.854736328125, -3.70416259765625, -3.5535888671875, -3.40301513671875, -3.25244140625, -3.10186767578125, -2.9512939453125, -2.80072021484375, -2.650146484375, -2.49957275390625, -2.3489990234375, -2.19842529296875, -2.0478515625, -1.89727783203125, -1.7467041015625, -1.59613037109375, -1.445556640625, -1.29498291015625, -1.1444091796875, -0.99383544921875, -0.84326171875, -0.69268798828125, -0.5421142578125, -0.39154052734375, -0.240966796875, -0.09039306640625, 0.0601806640625, 0.21075439453125, 0.361328125, 0.51190185546875, 0.6624755859375, 0.81304931640625, 0.963623046875, 1.11419677734375, 1.2647705078125, 1.41534423828125, 1.56591796875, 1.71649169921875, 1.8670654296875, 2.01763916015625, 2.168212890625, 2.31878662109375, 2.4693603515625, 2.61993408203125, 2.7705078125, 2.92108154296875, 3.0716552734375, 3.22222900390625, 3.372802734375, 3.52337646484375, 3.6739501953125, 3.82452392578125, 3.97509765625, 4.12567138671875, 4.2762451171875, 4.42681884765625, 4.577392578125, 4.72796630859375, 4.8785400390625, 5.02911376953125, 5.1796875]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 6.0, 11.0, 11.0, 9.0, 23.0, 28.0, 29.0, 55.0, 76.0, 103.0, 148.0, 182.0, 249.0, 366.0, 572.0, 908.0, 1645.0, 3428.0, 8828.0, 26830.0, 102751.0, 492011.0, 313820.0, 65042.0, 18642.0, 6332.0, 2665.0, 1347.0, 744.0, 495.0, 352.0, 260.0, 146.0, 102.0, 73.0, 70.0, 48.0, 31.0, 34.0, 22.0, 17.0, 13.0, 5.0, 10.0, 6.0, 6.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4296875, -8.1563720703125, -7.883056640625, -7.6097412109375, -7.33642578125, -7.0631103515625, -6.789794921875, -6.5164794921875, -6.2431640625, -5.9698486328125, -5.696533203125, -5.4232177734375, -5.14990234375, -4.8765869140625, -4.603271484375, -4.3299560546875, -4.056640625, -3.7833251953125, -3.510009765625, -3.2366943359375, -2.96337890625, -2.6900634765625, -2.416748046875, -2.1434326171875, -1.8701171875, -1.5968017578125, -1.323486328125, -1.0501708984375, -0.77685546875, -0.5035400390625, -0.230224609375, 0.0430908203125, 0.31640625, 0.5897216796875, 0.863037109375, 1.1363525390625, 1.40966796875, 1.6829833984375, 1.956298828125, 2.2296142578125, 2.5029296875, 2.7762451171875, 3.049560546875, 3.3228759765625, 3.59619140625, 3.8695068359375, 4.142822265625, 4.4161376953125, 4.689453125, 4.9627685546875, 5.236083984375, 5.5093994140625, 5.78271484375, 6.0560302734375, 6.329345703125, 6.6026611328125, 6.8759765625, 7.1492919921875, 7.422607421875, 7.6959228515625, 7.96923828125, 8.2425537109375, 8.515869140625, 8.7891845703125, 9.0625]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 1.0, 9.0, 2.0, 6.0, 6.0, 10.0, 9.0, 7.0, 14.0, 22.0, 20.0, 28.0, 33.0, 41.0, 36.0, 63.0, 76.0, 107.0, 314.0, 1675.0, 167.0, 82.0, 56.0, 42.0, 36.0, 37.0, 26.0, 32.0, 21.0, 19.0, 9.0, 11.0, 5.0, 8.0, 9.0, 1.0, 3.0, 6.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-17.65625, -17.1822509765625, -16.708251953125, -16.2342529296875, -15.76025390625, -15.2862548828125, -14.812255859375, -14.3382568359375, -13.8642578125, -13.3902587890625, -12.916259765625, -12.4422607421875, -11.96826171875, -11.4942626953125, -11.020263671875, -10.5462646484375, -10.072265625, -9.5982666015625, -9.124267578125, -8.6502685546875, -8.17626953125, -7.7022705078125, -7.228271484375, -6.7542724609375, -6.2802734375, -5.8062744140625, -5.332275390625, -4.8582763671875, -4.38427734375, -3.9102783203125, -3.436279296875, -2.9622802734375, -2.48828125, -2.0142822265625, -1.540283203125, -1.0662841796875, -0.59228515625, -0.1182861328125, 0.355712890625, 0.8297119140625, 1.3037109375, 1.7777099609375, 2.251708984375, 2.7257080078125, 3.19970703125, 3.6737060546875, 4.147705078125, 4.6217041015625, 5.095703125, 5.5697021484375, 6.043701171875, 6.5177001953125, 6.99169921875, 7.4656982421875, 7.939697265625, 8.4136962890625, 8.8876953125, 9.3616943359375, 9.835693359375, 10.3096923828125, 10.78369140625, 11.2576904296875, 11.731689453125, 12.2056884765625, 12.6796875]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 5.0, 5.0, 6.0, 7.0, 9.0, 10.0, 14.0, 17.0, 37.0, 43.0, 60.0, 88.0, 145.0, 271.0, 562.0, 1892.0, 2973403.0, 166625.0, 1335.0, 487.0, 235.0, 149.0, 87.0, 49.0, 38.0, 30.0, 25.0, 13.0, 18.0, 9.0, 8.0, 6.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-35.0625, -33.7080078125, -32.353515625, -30.9990234375, -29.64453125, -28.2900390625, -26.935546875, -25.5810546875, -24.2265625, -22.8720703125, -21.517578125, -20.1630859375, -18.80859375, -17.4541015625, -16.099609375, -14.7451171875, -13.390625, -12.0361328125, -10.681640625, -9.3271484375, -7.97265625, -6.6181640625, -5.263671875, -3.9091796875, -2.5546875, -1.2001953125, 0.154296875, 1.5087890625, 2.86328125, 4.2177734375, 5.572265625, 6.9267578125, 8.28125, 9.6357421875, 10.990234375, 12.3447265625, 13.69921875, 15.0537109375, 16.408203125, 17.7626953125, 19.1171875, 20.4716796875, 21.826171875, 23.1806640625, 24.53515625, 25.8896484375, 27.244140625, 28.5986328125, 29.953125, 31.3076171875, 32.662109375, 34.0166015625, 35.37109375, 36.7255859375, 38.080078125, 39.4345703125, 40.7890625, 42.1435546875, 43.498046875, 44.8525390625, 46.20703125, 47.5615234375, 48.916015625, 50.2705078125, 51.625]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 12.0, 122.0, 505.0, 336.0, 38.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.957307815551758, -20.62201690673828, -18.286727905273438, -15.951436996459961, -13.616146087646484, -11.280855178833008, -8.945565223693848, -6.6102752685546875, -4.274984359741211, -1.9396939277648926, 0.3955965042114258, 2.730886936187744, 5.0661773681640625, 7.401468276977539, 9.7367582321167, 12.07204818725586, 14.407339096069336, 16.742630004882812, 19.077919006347656, 21.413209915161133, 23.74850082397461, 26.083791732788086, 28.419082641601562, 30.754371643066406, 33.08966064453125, 35.424949645996094, 37.7602424621582, 40.09553146362305, 42.430824279785156, 44.76611328125, 47.101402282714844, 49.43669128417969, 51.77198791503906, 54.107276916503906, 56.442569732666016, 58.77785873413086, 61.11315155029297, 63.44844055175781, 65.78372955322266, 68.1190185546875, 70.45431518554688, 72.78960418701172, 75.12489318847656, 77.46018981933594, 79.79547882080078, 82.13076782226562, 84.46605682373047, 86.80134582519531, 89.13663482666016, 91.471923828125, 93.80721282958984, 96.14250946044922, 98.47779846191406, 100.8130874633789, 103.14837646484375, 105.4836654663086, 107.81895446777344, 110.15424346923828, 112.48953247070312, 114.8248291015625, 117.16011810302734, 119.49540710449219, 121.83069610595703, 124.16598510742188, 126.50128173828125]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 0.0, 1.0, 6.0, 6.0, 7.0, 7.0, 11.0, 12.0, 15.0, 21.0, 12.0, 21.0, 26.0, 26.0, 25.0, 36.0, 40.0, 42.0, 38.0, 34.0, 40.0, 35.0, 41.0, 50.0, 33.0, 40.0, 36.0, 39.0, 41.0, 48.0, 32.0, 26.0, 15.0, 24.0, 19.0, 17.0, 16.0, 9.0, 11.0, 12.0, 6.0, 8.0, 4.0, 6.0, 5.0, 1.0, 1.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.542922973632812, -25.697681427001953, -24.85243797302246, -24.0071964263916, -23.16195297241211, -22.31671142578125, -21.47146987915039, -20.62622833251953, -19.78098487854004, -18.93574333190918, -18.090499877929688, -17.245258331298828, -16.40001678466797, -15.554773330688477, -14.709531784057617, -13.864289283752441, -13.019046783447266, -12.17380428314209, -11.328561782836914, -10.483320236206055, -9.638077735900879, -8.792835235595703, -7.9475932121276855, -7.102351188659668, -6.257108688354492, -5.411866188049316, -4.566624164581299, -3.721381902694702, -2.8761396408081055, -2.0308971405029297, -1.185655117034912, -0.34041309356689453, 0.5048313140869141, 1.3500735759735107, 2.1953158378601074, 3.040558099746704, 3.885800361633301, 4.731042861938477, 5.576284885406494, 6.421526908874512, 7.2667694091796875, 8.112011909484863, 8.957254409790039, 9.802495956420898, 10.647738456726074, 11.49298095703125, 12.33822250366211, 13.183465003967285, 14.028707504272461, 14.873950004577637, 15.719192504882812, 16.564434051513672, 17.40967559814453, 18.254919052124023, 19.100160598754883, 19.945404052734375, 20.790645599365234, 21.635887145996094, 22.481130599975586, 23.326372146606445, 24.171615600585938, 25.016857147216797, 25.862098693847656, 26.707340240478516, 27.552583694458008]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 9.0, 10.0, 11.0, 12.0, 15.0, 14.0, 14.0, 21.0, 30.0, 29.0, 32.0, 35.0, 44.0, 44.0, 38.0, 44.0, 46.0, 48.0, 54.0, 45.0, 47.0, 38.0, 45.0, 38.0, 35.0, 34.0, 18.0, 31.0, 21.0, 21.0, 11.0, 14.0, 13.0, 6.0, 8.0, 8.0, 9.0, 9.0, 6.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.24609375, -6.05279541015625, -5.8594970703125, -5.66619873046875, -5.472900390625, -5.27960205078125, -5.0863037109375, -4.89300537109375, -4.69970703125, -4.50640869140625, -4.3131103515625, -4.11981201171875, -3.926513671875, -3.73321533203125, -3.5399169921875, -3.34661865234375, -3.1533203125, -2.96002197265625, -2.7667236328125, -2.57342529296875, -2.380126953125, -2.18682861328125, -1.9935302734375, -1.80023193359375, -1.60693359375, -1.41363525390625, -1.2203369140625, -1.02703857421875, -0.833740234375, -0.64044189453125, -0.4471435546875, -0.25384521484375, -0.060546875, 0.13275146484375, 0.3260498046875, 0.51934814453125, 0.712646484375, 0.90594482421875, 1.0992431640625, 1.29254150390625, 1.48583984375, 1.67913818359375, 1.8724365234375, 2.06573486328125, 2.259033203125, 2.45233154296875, 2.6456298828125, 2.83892822265625, 3.0322265625, 3.22552490234375, 3.4188232421875, 3.61212158203125, 3.805419921875, 3.99871826171875, 4.1920166015625, 4.38531494140625, 4.57861328125, 4.77191162109375, 4.9652099609375, 5.15850830078125, 5.351806640625, 5.54510498046875, 5.7384033203125, 5.93170166015625, 6.125]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 5.0, 5.0, 3.0, 6.0, 9.0, 3.0, 13.0, 7.0, 7.0, 21.0, 17.0, 32.0, 25.0, 29.0, 51.0, 55.0, 77.0, 86.0, 150.0, 215.0, 245.0, 313.0, 520.0, 824.0, 1715.0, 6862.0, 132786.0, 3692684.0, 341746.0, 10666.0, 2168.0, 944.0, 518.0, 330.0, 274.0, 194.0, 160.0, 110.0, 72.0, 73.0, 63.0, 39.0, 28.0, 28.0, 18.0, 17.0, 12.0, 15.0, 14.0, 7.0, 7.0, 12.0, 5.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-30.90625, -29.92822265625, -28.9501953125, -27.97216796875, -26.994140625, -26.01611328125, -25.0380859375, -24.06005859375, -23.08203125, -22.10400390625, -21.1259765625, -20.14794921875, -19.169921875, -18.19189453125, -17.2138671875, -16.23583984375, -15.2578125, -14.27978515625, -13.3017578125, -12.32373046875, -11.345703125, -10.36767578125, -9.3896484375, -8.41162109375, -7.43359375, -6.45556640625, -5.4775390625, -4.49951171875, -3.521484375, -2.54345703125, -1.5654296875, -0.58740234375, 0.390625, 1.36865234375, 2.3466796875, 3.32470703125, 4.302734375, 5.28076171875, 6.2587890625, 7.23681640625, 8.21484375, 9.19287109375, 10.1708984375, 11.14892578125, 12.126953125, 13.10498046875, 14.0830078125, 15.06103515625, 16.0390625, 17.01708984375, 17.9951171875, 18.97314453125, 19.951171875, 20.92919921875, 21.9072265625, 22.88525390625, 23.86328125, 24.84130859375, 25.8193359375, 26.79736328125, 27.775390625, 28.75341796875, 29.7314453125, 30.70947265625, 31.6875]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 6.0, 4.0, 5.0, 21.0, 29.0, 45.0, 55.0, 92.0, 150.0, 232.0, 407.0, 602.0, 704.0, 595.0, 399.0, 266.0, 188.0, 90.0, 64.0, 49.0, 23.0, 10.0, 12.0, 6.0, 9.0, 6.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.2890625, -10.8458251953125, -10.402587890625, -9.9593505859375, -9.51611328125, -9.0728759765625, -8.629638671875, -8.1864013671875, -7.7431640625, -7.2999267578125, -6.856689453125, -6.4134521484375, -5.97021484375, -5.5269775390625, -5.083740234375, -4.6405029296875, -4.197265625, -3.7540283203125, -3.310791015625, -2.8675537109375, -2.42431640625, -1.9810791015625, -1.537841796875, -1.0946044921875, -0.6513671875, -0.2081298828125, 0.235107421875, 0.6783447265625, 1.12158203125, 1.5648193359375, 2.008056640625, 2.4512939453125, 2.89453125, 3.3377685546875, 3.781005859375, 4.2242431640625, 4.66748046875, 5.1107177734375, 5.553955078125, 5.9971923828125, 6.4404296875, 6.8836669921875, 7.326904296875, 7.7701416015625, 8.21337890625, 8.6566162109375, 9.099853515625, 9.5430908203125, 9.986328125, 10.4295654296875, 10.872802734375, 11.3160400390625, 11.75927734375, 12.2025146484375, 12.645751953125, 13.0889892578125, 13.5322265625, 13.9754638671875, 14.418701171875, 14.8619384765625, 15.30517578125, 15.7484130859375, 16.191650390625, 16.6348876953125, 17.078125]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 7.0, 11.0, 23.0, 45.0, 86.0, 223.0, 635.0, 1965.0, 9766.0, 145141.0, 3623746.0, 391716.0, 16775.0, 2804.0, 805.0, 322.0, 124.0, 42.0, 17.0, 11.0, 8.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.109375, -18.417724609375, -17.72607421875, -17.034423828125, -16.3427734375, -15.651123046875, -14.95947265625, -14.267822265625, -13.576171875, -12.884521484375, -12.19287109375, -11.501220703125, -10.8095703125, -10.117919921875, -9.42626953125, -8.734619140625, -8.04296875, -7.351318359375, -6.65966796875, -5.968017578125, -5.2763671875, -4.584716796875, -3.89306640625, -3.201416015625, -2.509765625, -1.818115234375, -1.12646484375, -0.434814453125, 0.2568359375, 0.948486328125, 1.64013671875, 2.331787109375, 3.0234375, 3.715087890625, 4.40673828125, 5.098388671875, 5.7900390625, 6.481689453125, 7.17333984375, 7.864990234375, 8.556640625, 9.248291015625, 9.93994140625, 10.631591796875, 11.3232421875, 12.014892578125, 12.70654296875, 13.398193359375, 14.08984375, 14.781494140625, 15.47314453125, 16.164794921875, 16.8564453125, 17.548095703125, 18.23974609375, 18.931396484375, 19.623046875, 20.314697265625, 21.00634765625, 21.697998046875, 22.3896484375, 23.081298828125, 23.77294921875, 24.464599609375, 25.15625]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 4.0, 5.0, 9.0, 11.0, 23.0, 37.0, 65.0, 95.0, 137.0, 150.0, 126.0, 114.0, 99.0, 49.0, 40.0, 19.0, 18.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.819419860839844, -53.592628479003906, -50.3658332824707, -47.1390380859375, -43.91224670410156, -40.685455322265625, -37.45866012573242, -34.23186492919922, -31.00507354736328, -27.77828025817871, -24.55148696899414, -21.32469367980957, -18.097900390625, -14.87110710144043, -11.64431381225586, -8.417520523071289, -5.190727233886719, -1.9639339447021484, 1.2628593444824219, 4.489652633666992, 7.7164459228515625, 10.943239212036133, 14.170032501220703, 17.396825790405273, 20.623619079589844, 23.850412368774414, 27.077205657958984, 30.303998947143555, 33.530792236328125, 36.75758361816406, 39.984378814697266, 43.21117401123047, 46.43797302246094, 49.664764404296875, 52.89155960083008, 56.11835479736328, 59.34514617919922, 62.571937561035156, 65.79873657226562, 69.02552795410156, 72.2523193359375, 75.47911071777344, 78.70590209960938, 81.93270111083984, 85.15949249267578, 88.38628387451172, 91.61308288574219, 94.83987426757812, 98.06666564941406, 101.29345703125, 104.52024841308594, 107.7470474243164, 110.97383880615234, 114.20063018798828, 117.42742919921875, 120.65422058105469, 123.88101196289062, 127.10780334472656, 130.3345947265625, 133.56138610839844, 136.78817749023438, 140.01498413085938, 143.2417755126953, 146.46856689453125, 149.6953582763672]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 3.0, 5.0, 6.0, 6.0, 8.0, 10.0, 9.0, 13.0, 19.0, 23.0, 10.0, 21.0, 22.0, 29.0, 36.0, 24.0, 34.0, 40.0, 36.0, 26.0, 32.0, 42.0, 41.0, 31.0, 50.0, 41.0, 47.0, 35.0, 40.0, 22.0, 28.0, 27.0, 18.0, 21.0, 23.0, 22.0, 16.0, 16.0, 13.0, 15.0, 8.0, 10.0, 4.0, 5.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-35.016841888427734, -33.92645263671875, -32.836063385009766, -31.745676040649414, -30.65528678894043, -29.564897537231445, -28.474510192871094, -27.38412094116211, -26.293731689453125, -25.20334243774414, -24.112953186035156, -23.022565841674805, -21.93217658996582, -20.841787338256836, -19.751399993896484, -18.6610107421875, -17.570621490478516, -16.48023223876953, -15.389843940734863, -14.299455642700195, -13.209066390991211, -12.118677139282227, -11.028288841247559, -9.93790054321289, -8.847511291503906, -7.75712251663208, -6.666733741760254, -5.576344966888428, -4.485956192016602, -3.3955674171447754, -2.305178642272949, -1.214789867401123, -0.12439727783203125, 0.9659914970397949, 2.056380271911621, 3.1467690467834473, 4.237157821655273, 5.3275465965271, 6.417935371398926, 7.508324146270752, 8.598712921142578, 9.689102172851562, 10.77949047088623, 11.869878768920898, 12.960268020629883, 14.050657272338867, 15.141045570373535, 16.231433868408203, 17.321823120117188, 18.412212371826172, 19.502601623535156, 20.592988967895508, 21.683378219604492, 22.773767471313477, 23.864154815673828, 24.954544067382812, 26.044933319091797, 27.13532257080078, 28.225711822509766, 29.316099166870117, 30.4064884185791, 31.496877670288086, 32.58726501464844, 33.67765426635742, 34.768043518066406]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 6.0, 2.0, 1.0, 5.0, 9.0, 6.0, 10.0, 12.0, 11.0, 15.0, 19.0, 16.0, 18.0, 23.0, 23.0, 30.0, 37.0, 35.0, 34.0, 31.0, 37.0, 30.0, 39.0, 41.0, 42.0, 40.0, 43.0, 51.0, 33.0, 43.0, 39.0, 22.0, 16.0, 21.0, 18.0, 19.0, 32.0, 20.0, 20.0, 13.0, 8.0, 8.0, 6.0, 4.0, 6.0, 1.0, 1.0, 3.0, 4.0, 1.0, 4.0, 3.0, 0.0, 0.0, 1.0], "bins": [-60.0625, -58.23974609375, -56.4169921875, -54.59423828125, -52.771484375, -50.94873046875, -49.1259765625, -47.30322265625, -45.48046875, -43.65771484375, -41.8349609375, -40.01220703125, -38.189453125, -36.36669921875, -34.5439453125, -32.72119140625, -30.8984375, -29.07568359375, -27.2529296875, -25.43017578125, -23.607421875, -21.78466796875, -19.9619140625, -18.13916015625, -16.31640625, -14.49365234375, -12.6708984375, -10.84814453125, -9.025390625, -7.20263671875, -5.3798828125, -3.55712890625, -1.734375, 0.08837890625, 1.9111328125, 3.73388671875, 5.556640625, 7.37939453125, 9.2021484375, 11.02490234375, 12.84765625, 14.67041015625, 16.4931640625, 18.31591796875, 20.138671875, 21.96142578125, 23.7841796875, 25.60693359375, 27.4296875, 29.25244140625, 31.0751953125, 32.89794921875, 34.720703125, 36.54345703125, 38.3662109375, 40.18896484375, 42.01171875, 43.83447265625, 45.6572265625, 47.47998046875, 49.302734375, 51.12548828125, 52.9482421875, 54.77099609375, 56.59375]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 7.0, 12.0, 31.0, 27.0, 35.0, 65.0, 93.0, 137.0, 218.0, 367.0, 596.0, 915.0, 1336.0, 2105.0, 3322.0, 5090.0, 8217.0, 12919.0, 20458.0, 33609.0, 56847.0, 96251.0, 157506.0, 205577.0, 172254.0, 107436.0, 63651.0, 37613.0, 22689.0, 14325.0, 9029.0, 5733.0, 3569.0, 2307.0, 1534.0, 943.0, 618.0, 397.0, 267.0, 174.0, 104.0, 60.0, 37.0, 37.0, 22.0, 10.0, 3.0, 6.0, 2.0, 2.0, 1.0, 4.0, 0.0, 2.0], "bins": [-6.04296875, -5.8631591796875, -5.683349609375, -5.5035400390625, -5.32373046875, -5.1439208984375, -4.964111328125, -4.7843017578125, -4.6044921875, -4.4246826171875, -4.244873046875, -4.0650634765625, -3.88525390625, -3.7054443359375, -3.525634765625, -3.3458251953125, -3.166015625, -2.9862060546875, -2.806396484375, -2.6265869140625, -2.44677734375, -2.2669677734375, -2.087158203125, -1.9073486328125, -1.7275390625, -1.5477294921875, -1.367919921875, -1.1881103515625, -1.00830078125, -0.8284912109375, -0.648681640625, -0.4688720703125, -0.2890625, -0.1092529296875, 0.070556640625, 0.2503662109375, 0.43017578125, 0.6099853515625, 0.789794921875, 0.9696044921875, 1.1494140625, 1.3292236328125, 1.509033203125, 1.6888427734375, 1.86865234375, 2.0484619140625, 2.228271484375, 2.4080810546875, 2.587890625, 2.7677001953125, 2.947509765625, 3.1273193359375, 3.30712890625, 3.4869384765625, 3.666748046875, 3.8465576171875, 4.0263671875, 4.2061767578125, 4.385986328125, 4.5657958984375, 4.74560546875, 4.9254150390625, 5.105224609375, 5.2850341796875, 5.46484375]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 4.0, 4.0, 1.0, 5.0, 5.0, 8.0, 6.0, 7.0, 12.0, 14.0, 11.0, 20.0, 21.0, 27.0, 13.0, 23.0, 28.0, 29.0, 30.0, 36.0, 33.0, 35.0, 22.0, 42.0, 27.0, 43.0, 1059.0, 32.0, 31.0, 35.0, 35.0, 26.0, 36.0, 31.0, 23.0, 19.0, 25.0, 29.0, 19.0, 14.0, 18.0, 10.0, 15.0, 7.0, 11.0, 8.0, 8.0, 5.0, 7.0, 6.0, 6.0, 2.0, 5.0, 1.0, 7.0, 3.0, 0.0, 1.0], "bins": [-32.0625, -31.06494140625, -30.0673828125, -29.06982421875, -28.072265625, -27.07470703125, -26.0771484375, -25.07958984375, -24.08203125, -23.08447265625, -22.0869140625, -21.08935546875, -20.091796875, -19.09423828125, -18.0966796875, -17.09912109375, -16.1015625, -15.10400390625, -14.1064453125, -13.10888671875, -12.111328125, -11.11376953125, -10.1162109375, -9.11865234375, -8.12109375, -7.12353515625, -6.1259765625, -5.12841796875, -4.130859375, -3.13330078125, -2.1357421875, -1.13818359375, -0.140625, 0.85693359375, 1.8544921875, 2.85205078125, 3.849609375, 4.84716796875, 5.8447265625, 6.84228515625, 7.83984375, 8.83740234375, 9.8349609375, 10.83251953125, 11.830078125, 12.82763671875, 13.8251953125, 14.82275390625, 15.8203125, 16.81787109375, 17.8154296875, 18.81298828125, 19.810546875, 20.80810546875, 21.8056640625, 22.80322265625, 23.80078125, 24.79833984375, 25.7958984375, 26.79345703125, 27.791015625, 28.78857421875, 29.7861328125, 30.78369140625, 31.78125]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 8.0, 14.0, 25.0, 19.0, 25.0, 54.0, 62.0, 130.0, 174.0, 289.0, 386.0, 568.0, 895.0, 1474.0, 2358.0, 3586.0, 5713.0, 9029.0, 14768.0, 24520.0, 41524.0, 70349.0, 119311.0, 180736.0, 1247542.0, 148143.0, 91218.0, 53036.0, 31560.0, 18801.0, 11556.0, 7054.0, 4486.0, 2821.0, 1734.0, 1103.0, 766.0, 459.0, 265.0, 185.0, 132.0, 86.0, 51.0, 39.0, 31.0, 21.0, 10.0, 8.0, 3.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-5.18359375, -5.01763916015625, -4.8516845703125, -4.68572998046875, -4.519775390625, -4.35382080078125, -4.1878662109375, -4.02191162109375, -3.85595703125, -3.69000244140625, -3.5240478515625, -3.35809326171875, -3.192138671875, -3.02618408203125, -2.8602294921875, -2.69427490234375, -2.5283203125, -2.36236572265625, -2.1964111328125, -2.03045654296875, -1.864501953125, -1.69854736328125, -1.5325927734375, -1.36663818359375, -1.20068359375, -1.03472900390625, -0.8687744140625, -0.70281982421875, -0.536865234375, -0.37091064453125, -0.2049560546875, -0.03900146484375, 0.126953125, 0.29290771484375, 0.4588623046875, 0.62481689453125, 0.790771484375, 0.95672607421875, 1.1226806640625, 1.28863525390625, 1.45458984375, 1.62054443359375, 1.7864990234375, 1.95245361328125, 2.118408203125, 2.28436279296875, 2.4503173828125, 2.61627197265625, 2.7822265625, 2.94818115234375, 3.1141357421875, 3.28009033203125, 3.446044921875, 3.61199951171875, 3.7779541015625, 3.94390869140625, 4.10986328125, 4.27581787109375, 4.4417724609375, 4.60772705078125, 4.773681640625, 4.93963623046875, 5.1055908203125, 5.27154541015625, 5.4375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 4.0, 1.0, 1.0, 3.0, 5.0, 6.0, 8.0, 9.0, 13.0, 7.0, 11.0, 12.0, 19.0, 27.0, 19.0, 26.0, 26.0, 30.0, 38.0, 42.0, 32.0, 36.0, 43.0, 45.0, 40.0, 42.0, 45.0, 40.0, 43.0, 36.0, 40.0, 33.0, 24.0, 29.0, 28.0, 15.0, 16.0, 21.0, 20.0, 17.0, 12.0, 15.0, 14.0, 9.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007678985595703125, -0.007404625415802002, -0.007130265235900879, -0.006855905055999756, -0.006581544876098633, -0.00630718469619751, -0.006032824516296387, -0.005758464336395264, -0.005484104156494141, -0.005209743976593018, -0.0049353837966918945, -0.0046610236167907715, -0.0043866634368896484, -0.004112303256988525, -0.0038379430770874023, -0.0035635828971862793, -0.0032892227172851562, -0.003014862537384033, -0.00274050235748291, -0.002466142177581787, -0.002191781997680664, -0.001917421817779541, -0.001643061637878418, -0.001368701457977295, -0.0010943412780761719, -0.0008199810981750488, -0.0005456209182739258, -0.00027126073837280273, 3.0994415283203125e-06, 0.00027745962142944336, 0.0005518198013305664, 0.0008261799812316895, 0.0011005401611328125, 0.0013749003410339355, 0.0016492605209350586, 0.0019236207008361816, 0.0021979808807373047, 0.0024723410606384277, 0.0027467012405395508, 0.003021061420440674, 0.003295421600341797, 0.00356978178024292, 0.003844141960144043, 0.004118502140045166, 0.004392862319946289, 0.004667222499847412, 0.004941582679748535, 0.005215942859649658, 0.005490303039550781, 0.005764663219451904, 0.006039023399353027, 0.00631338357925415, 0.0065877437591552734, 0.0068621039390563965, 0.0071364641189575195, 0.007410824298858643, 0.007685184478759766, 0.007959544658660889, 0.008233904838562012, 0.008508265018463135, 0.008782625198364258, 0.00905698537826538, 0.009331345558166504, 0.009605705738067627, 0.00988006591796875]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 7.0, 3.0, 3.0, 5.0, 9.0, 12.0, 18.0, 23.0, 33.0, 41.0, 57.0, 76.0, 109.0, 128.0, 174.0, 185.0, 252.0, 340.0, 484.0, 816.0, 1506.0, 3471.0, 10537.0, 36949.0, 128195.0, 306971.0, 333607.0, 155956.0, 46331.0, 13299.0, 4252.0, 1800.0, 852.0, 526.0, 365.0, 298.0, 201.0, 152.0, 127.0, 114.0, 61.0, 52.0, 38.0, 32.0, 24.0, 19.0, 14.0, 16.0, 5.0, 8.0, 5.0, 4.0, 2.0, 0.0, 3.0], "bins": [-0.06134033203125, -0.059592247009277344, -0.05784416198730469, -0.05609607696533203, -0.054347991943359375, -0.05259990692138672, -0.05085182189941406, -0.049103736877441406, -0.04735565185546875, -0.045607566833496094, -0.04385948181152344, -0.04211139678955078, -0.040363311767578125, -0.03861522674560547, -0.03686714172363281, -0.035119056701660156, -0.0333709716796875, -0.031622886657714844, -0.029874801635742188, -0.02812671661376953, -0.026378631591796875, -0.02463054656982422, -0.022882461547851562, -0.021134376525878906, -0.01938629150390625, -0.017638206481933594, -0.015890121459960938, -0.014142036437988281, -0.012393951416015625, -0.010645866394042969, -0.008897781372070312, -0.007149696350097656, -0.005401611328125, -0.0036535263061523438, -0.0019054412841796875, -0.00015735626220703125, 0.001590728759765625, 0.0033388137817382812, 0.0050868988037109375, 0.006834983825683594, 0.00858306884765625, 0.010331153869628906, 0.012079238891601562, 0.013827323913574219, 0.015575408935546875, 0.01732349395751953, 0.019071578979492188, 0.020819664001464844, 0.0225677490234375, 0.024315834045410156, 0.026063919067382812, 0.02781200408935547, 0.029560089111328125, 0.03130817413330078, 0.03305625915527344, 0.034804344177246094, 0.03655242919921875, 0.038300514221191406, 0.04004859924316406, 0.04179668426513672, 0.043544769287109375, 0.04529285430908203, 0.04704093933105469, 0.048789024353027344, 0.050537109375]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 6.0, 22.0, 56.0, 82.0, 126.0, 163.0, 138.0, 147.0, 98.0, 76.0, 45.0, 28.0, 9.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02146703563630581, -0.020934611558914185, -0.02040218561887741, -0.019869761541485786, -0.019337337464094162, -0.018804913386702538, -0.018272487446665764, -0.01774006336927414, -0.017207639291882515, -0.01667521521449089, -0.016142789274454117, -0.015610365197062492, -0.015077941119670868, -0.014545516110956669, -0.01401309110224247, -0.013480667024850845, -0.012948242016136646, -0.012415817007422447, -0.011883392930030823, -0.011350967921316624, -0.010818543843925, -0.0102861188352108, -0.009753694757819176, -0.009221269749104977, -0.008688844740390778, -0.008156419731676579, -0.007623995654284954, -0.007091570645570755, -0.0065591465681791306, -0.0060267215594649315, -0.00549429701641202, -0.004961872473359108, -0.0044294483959674835, -0.0038970238529145718, -0.00336459930986166, -0.0028321745339781046, -0.002299749990925193, -0.001767325447872281, -0.0012349006719887257, -0.0007024761289358139, -0.00017005158588290215, 0.0003623730153776705, 0.0008947976166382432, 0.0014272222761064768, 0.0019596468191593885, 0.0024920713622123003, 0.0030244961380958557, 0.0035569206811487675, 0.004089345224201679, 0.004621769767254591, 0.005154194310307503, 0.005686619319021702, 0.006219043396413326, 0.006751468405127525, 0.007283892948180437, 0.007816317491233349, 0.008348742499947548, 0.008881167508661747, 0.009413591586053371, 0.00994601659476757, 0.010478440672159195, 0.011010865680873394, 0.011543290689587593, 0.012075714766979218, 0.012608138844370842]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 6.0, 6.0, 6.0, 10.0, 12.0, 7.0, 23.0, 17.0, 21.0, 36.0, 19.0, 33.0, 42.0, 45.0, 41.0, 50.0, 54.0, 43.0, 52.0, 52.0, 39.0, 39.0, 49.0, 33.0, 40.0, 37.0, 26.0, 29.0, 25.0, 16.0, 15.0, 20.0, 18.0, 8.0, 8.0, 8.0, 5.0, 9.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0055408477783203125, -0.005342938005924225, -0.005145028233528137, -0.0049471184611320496, -0.004749208688735962, -0.004551298916339874, -0.004353389143943787, -0.004155479371547699, -0.003957569599151611, -0.0037596598267555237, -0.003561750054359436, -0.0033638402819633484, -0.0031659305095672607, -0.002968020737171173, -0.0027701109647750854, -0.002572201192378998, -0.00237429141998291, -0.0021763816475868225, -0.001978471875190735, -0.0017805621027946472, -0.0015826523303985596, -0.001384742558002472, -0.0011868327856063843, -0.0009889230132102966, -0.000791013240814209, -0.0005931034684181213, -0.0003951936960220337, -0.00019728392362594604, 6.258487701416016e-07, 0.00019853562116622925, 0.0003964453935623169, 0.0005943551659584045, 0.0007922649383544922, 0.0009901747107505798, 0.0011880844831466675, 0.0013859942555427551, 0.0015839040279388428, 0.0017818138003349304, 0.001979723572731018, 0.0021776333451271057, 0.0023755431175231934, 0.002573452889919281, 0.0027713626623153687, 0.0029692724347114563, 0.003167182207107544, 0.0033650919795036316, 0.0035630017518997192, 0.003760911524295807, 0.0039588212966918945, 0.004156731069087982, 0.00435464084148407, 0.0045525506138801575, 0.004750460386276245, 0.004948370158672333, 0.00514627993106842, 0.005344189703464508, 0.005542099475860596, 0.005740009248256683, 0.005937919020652771, 0.006135828793048859, 0.006333738565444946, 0.006531648337841034, 0.006729558110237122, 0.006927467882633209, 0.007125377655029297]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 6.0, 2.0, 1.0, 5.0, 8.0, 7.0, 10.0, 12.0, 11.0, 14.0, 20.0, 16.0, 18.0, 23.0, 23.0, 29.0, 38.0, 35.0, 34.0, 31.0, 37.0, 30.0, 39.0, 41.0, 42.0, 40.0, 43.0, 51.0, 33.0, 43.0, 39.0, 22.0, 16.0, 21.0, 18.0, 19.0, 31.0, 21.0, 20.0, 12.0, 9.0, 8.0, 6.0, 5.0, 5.0, 1.0, 1.0, 3.0, 4.0, 1.0, 4.0, 3.0, 0.0, 0.0, 1.0], "bins": [-60.09375, -58.2705078125, -56.447265625, -54.6240234375, -52.80078125, -50.9775390625, -49.154296875, -47.3310546875, -45.5078125, -43.6845703125, -41.861328125, -40.0380859375, -38.21484375, -36.3916015625, -34.568359375, -32.7451171875, -30.921875, -29.0986328125, -27.275390625, -25.4521484375, -23.62890625, -21.8056640625, -19.982421875, -18.1591796875, -16.3359375, -14.5126953125, -12.689453125, -10.8662109375, -9.04296875, -7.2197265625, -5.396484375, -3.5732421875, -1.75, 0.0732421875, 1.896484375, 3.7197265625, 5.54296875, 7.3662109375, 9.189453125, 11.0126953125, 12.8359375, 14.6591796875, 16.482421875, 18.3056640625, 20.12890625, 21.9521484375, 23.775390625, 25.5986328125, 27.421875, 29.2451171875, 31.068359375, 32.8916015625, 34.71484375, 36.5380859375, 38.361328125, 40.1845703125, 42.0078125, 43.8310546875, 45.654296875, 47.4775390625, 49.30078125, 51.1240234375, 52.947265625, 54.7705078125, 56.59375]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 4.0, 4.0, 2.0, 7.0, 9.0, 7.0, 14.0, 18.0, 21.0, 18.0, 33.0, 32.0, 59.0, 73.0, 120.0, 176.0, 273.0, 395.0, 684.0, 1206.0, 2172.0, 4205.0, 9348.0, 26569.0, 107841.0, 461784.0, 327587.0, 71016.0, 19456.0, 7250.0, 3542.0, 1843.0, 1054.0, 591.0, 364.0, 226.0, 156.0, 113.0, 82.0, 43.0, 50.0, 28.0, 18.0, 16.0, 14.0, 7.0, 9.0, 5.0, 6.0, 7.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-14.4765625, -14.022216796875, -13.56787109375, -13.113525390625, -12.6591796875, -12.204833984375, -11.75048828125, -11.296142578125, -10.841796875, -10.387451171875, -9.93310546875, -9.478759765625, -9.0244140625, -8.570068359375, -8.11572265625, -7.661376953125, -7.20703125, -6.752685546875, -6.29833984375, -5.843994140625, -5.3896484375, -4.935302734375, -4.48095703125, -4.026611328125, -3.572265625, -3.117919921875, -2.66357421875, -2.209228515625, -1.7548828125, -1.300537109375, -0.84619140625, -0.391845703125, 0.0625, 0.516845703125, 0.97119140625, 1.425537109375, 1.8798828125, 2.334228515625, 2.78857421875, 3.242919921875, 3.697265625, 4.151611328125, 4.60595703125, 5.060302734375, 5.5146484375, 5.968994140625, 6.42333984375, 6.877685546875, 7.33203125, 7.786376953125, 8.24072265625, 8.695068359375, 9.1494140625, 9.603759765625, 10.05810546875, 10.512451171875, 10.966796875, 11.421142578125, 11.87548828125, 12.329833984375, 12.7841796875, 13.238525390625, 13.69287109375, 14.147216796875, 14.6015625]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 2.0, 5.0, 10.0, 9.0, 5.0, 20.0, 10.0, 23.0, 28.0, 24.0, 37.0, 29.0, 31.0, 38.0, 52.0, 56.0, 109.0, 2040.0, 66.0, 51.0, 64.0, 36.0, 59.0, 42.0, 38.0, 24.0, 25.0, 29.0, 21.0, 18.0, 15.0, 10.0, 6.0, 4.0, 3.0, 5.0, 4.0, 0.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-103.9375, -100.8134765625, -97.689453125, -94.5654296875, -91.44140625, -88.3173828125, -85.193359375, -82.0693359375, -78.9453125, -75.8212890625, -72.697265625, -69.5732421875, -66.44921875, -63.3251953125, -60.201171875, -57.0771484375, -53.953125, -50.8291015625, -47.705078125, -44.5810546875, -41.45703125, -38.3330078125, -35.208984375, -32.0849609375, -28.9609375, -25.8369140625, -22.712890625, -19.5888671875, -16.46484375, -13.3408203125, -10.216796875, -7.0927734375, -3.96875, -0.8447265625, 2.279296875, 5.4033203125, 8.52734375, 11.6513671875, 14.775390625, 17.8994140625, 21.0234375, 24.1474609375, 27.271484375, 30.3955078125, 33.51953125, 36.6435546875, 39.767578125, 42.8916015625, 46.015625, 49.1396484375, 52.263671875, 55.3876953125, 58.51171875, 61.6357421875, 64.759765625, 67.8837890625, 71.0078125, 74.1318359375, 77.255859375, 80.3798828125, 83.50390625, 86.6279296875, 89.751953125, 92.8759765625, 96.0]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 3.0, 6.0, 4.0, 2.0, 7.0, 20.0, 12.0, 23.0, 34.0, 43.0, 48.0, 80.0, 89.0, 117.0, 189.0, 245.0, 389.0, 625.0, 1119.0, 2559.0, 10288.0, 77448.0, 2741784.0, 274330.0, 27490.0, 4761.0, 1616.0, 826.0, 476.0, 302.0, 203.0, 144.0, 111.0, 74.0, 54.0, 49.0, 30.0, 31.0, 13.0, 19.0, 12.0, 4.0, 10.0, 4.0, 4.0, 3.0, 1.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-20.578125, -19.93017578125, -19.2822265625, -18.63427734375, -17.986328125, -17.33837890625, -16.6904296875, -16.04248046875, -15.39453125, -14.74658203125, -14.0986328125, -13.45068359375, -12.802734375, -12.15478515625, -11.5068359375, -10.85888671875, -10.2109375, -9.56298828125, -8.9150390625, -8.26708984375, -7.619140625, -6.97119140625, -6.3232421875, -5.67529296875, -5.02734375, -4.37939453125, -3.7314453125, -3.08349609375, -2.435546875, -1.78759765625, -1.1396484375, -0.49169921875, 0.15625, 0.80419921875, 1.4521484375, 2.10009765625, 2.748046875, 3.39599609375, 4.0439453125, 4.69189453125, 5.33984375, 5.98779296875, 6.6357421875, 7.28369140625, 7.931640625, 8.57958984375, 9.2275390625, 9.87548828125, 10.5234375, 11.17138671875, 11.8193359375, 12.46728515625, 13.115234375, 13.76318359375, 14.4111328125, 15.05908203125, 15.70703125, 16.35498046875, 17.0029296875, 17.65087890625, 18.298828125, 18.94677734375, 19.5947265625, 20.24267578125, 20.890625]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 1.0, 4.0, 8.0, 15.0, 46.0, 171.0, 283.0, 264.0, 118.0, 42.0, 17.0, 11.0, 10.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-155.50149536132812, -146.27305603027344, -137.0446319580078, -127.81619262695312, -118.58776092529297, -109.35932922363281, -100.13088989257812, -90.90245819091797, -81.67402648925781, -72.44559478759766, -63.217159271240234, -53.98872375488281, -44.760292053222656, -35.5318603515625, -26.303424835205078, -17.074989318847656, -7.8465576171875, 1.381875991821289, 10.610309600830078, 19.838743209838867, 29.067176818847656, 38.29560852050781, 47.524044036865234, 56.752479553222656, 65.98091125488281, 75.20934295654297, 84.43777465820312, 93.66621398925781, 102.89464569091797, 112.12307739257812, 121.35151672363281, 130.5799560546875, 139.80838012695312, 149.0368194580078, 158.26524353027344, 167.49368286132812, 176.72210693359375, 185.95054626464844, 195.17898559570312, 204.40740966796875, 213.63584899902344, 222.86428833007812, 232.09271240234375, 241.32115173339844, 250.54959106445312, 259.77801513671875, 269.0064392089844, 278.2348937988281, 287.46331787109375, 296.6917419433594, 305.9201965332031, 315.14862060546875, 324.3770446777344, 333.60546875, 342.83392333984375, 352.0623474121094, 361.290771484375, 370.5191955566406, 379.7476501464844, 388.97607421875, 398.2044982910156, 407.43292236328125, 416.661376953125, 425.8898010253906, 435.1182556152344]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 5.0, 2.0, 3.0, 3.0, 11.0, 7.0, 3.0, 11.0, 22.0, 18.0, 19.0, 17.0, 19.0, 27.0, 38.0, 43.0, 41.0, 40.0, 43.0, 51.0, 55.0, 51.0, 48.0, 42.0, 41.0, 43.0, 50.0, 37.0, 31.0, 37.0, 21.0, 19.0, 18.0, 20.0, 17.0, 13.0, 6.0, 8.0, 8.0, 5.0, 6.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-107.80606079101562, -103.87979125976562, -99.9535140991211, -96.0272445678711, -92.10096740722656, -88.17469787597656, -84.24842071533203, -80.32215118408203, -76.3958740234375, -72.4696044921875, -68.54332733154297, -64.61705780029297, -60.69078063964844, -56.76451110839844, -52.838233947753906, -48.911964416503906, -44.98569107055664, -41.059417724609375, -37.13314437866211, -33.206871032714844, -29.280597686767578, -25.354326248168945, -21.42805290222168, -17.501779556274414, -13.575506210327148, -9.649232864379883, -5.722959995269775, -1.796687126159668, 2.1295862197875977, 6.055858612060547, 9.982131958007812, 13.908405303955078, 17.834678649902344, 21.76095199584961, 25.687225341796875, 29.61349868774414, 33.539772033691406, 37.466041564941406, 41.39231872558594, 45.31858825683594, 49.24486541748047, 53.171138763427734, 57.097412109375, 61.023685455322266, 64.94995880126953, 68.87622833251953, 72.80250549316406, 76.72877502441406, 80.65504455566406, 84.58131408691406, 88.5075912475586, 92.4338607788086, 96.36013793945312, 100.28640747070312, 104.21268463134766, 108.13895416259766, 112.06523132324219, 115.99150085449219, 119.91777801513672, 123.84404754638672, 127.77032470703125, 131.69659423828125, 135.62286376953125, 139.5491485595703, 143.4754180908203]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 6.0, 6.0, 5.0, 16.0, 18.0, 27.0, 30.0, 35.0, 33.0, 57.0, 99.0, 107.0, 116.0, 135.0, 167.0, 203.0, 228.0, 302.0, 316.0, 455.0, 633.0, 805.0, 1040416.0, 964.0, 720.0, 502.0, 380.0, 326.0, 252.0, 240.0, 205.0, 164.0, 127.0, 106.0, 79.0, 58.0, 40.0, 45.0, 33.0, 23.0, 21.0, 21.0, 10.0, 7.0, 3.0, 10.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-36.14198303222656, -35.03799057006836, -33.933998107910156, -32.83000564575195, -31.72601318359375, -30.622020721435547, -29.518030166625977, -28.414037704467773, -27.31004524230957, -26.206052780151367, -25.102060317993164, -23.99806785583496, -22.89407730102539, -21.790084838867188, -20.686092376708984, -19.58209991455078, -18.478107452392578, -17.374114990234375, -16.270122528076172, -15.166131019592285, -14.062138557434082, -12.958146095275879, -11.854154586791992, -10.750162124633789, -9.646169662475586, -8.542177200317383, -7.438185214996338, -6.334193229675293, -5.23020076751709, -4.126208305358887, -3.022216320037842, -1.9182243347167969, -0.8142318725585938, 0.2897603511810303, 1.3937525749206543, 2.4977447986602783, 3.6017370223999023, 4.7057294845581055, 5.80972146987915, 6.913713455200195, 8.017705917358398, 9.121698379516602, 10.225690841674805, 11.329682350158691, 12.433674812316895, 13.537667274475098, 14.641658782958984, 15.745651245117188, 16.84964370727539, 17.953636169433594, 19.057628631591797, 20.16162109375, 21.265613555908203, 22.369606018066406, 23.473596572875977, 24.57758903503418, 25.681581497192383, 26.785573959350586, 27.88956642150879, 28.993558883666992, 30.097549438476562, 31.201541900634766, 32.30553436279297, 33.40952682495117, 34.513519287109375]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 7.0, 7.0, 15.0, 14.0, 14.0, 15.0, 43.0, 234.0, 51462512.0, 149.0, 50.0, 24.0, 6.0, 6.0, 5.0, 3.0, 6.0, 6.0, 7.0, 7.0, 6.0, 6.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6494.2607421875, -6239.2412109375, -5984.22119140625, -5729.20166015625, -5474.18212890625, -5219.162109375, -4964.142578125, -4709.123046875, -4454.103515625, -4199.083984375, -3944.064208984375, -3689.04443359375, -3434.02490234375, -3179.005126953125, -2923.9853515625, -2668.9658203125, -2413.94580078125, -2158.926025390625, -1903.906494140625, -1648.88671875, -1393.8670654296875, -1138.847412109375, -883.82763671875, -628.8079833984375, -373.788330078125, -118.76864624023438, 136.25103759765625, 391.270751953125, 646.2904052734375, 901.31005859375, 1156.329833984375, 1411.3494873046875, 1666.369140625, 1921.3887939453125, 2176.408447265625, 2431.42822265625, 2686.44775390625, 2941.467529296875, 3196.4873046875, 3451.5068359375, 3706.526611328125, 3961.54638671875, 4216.56591796875, 4471.5859375, 4726.60546875, 4981.625, 5236.64453125, 5491.66455078125, 5746.68408203125, 6001.70361328125, 6256.7236328125, 6511.7431640625, 6766.7626953125, 7021.7822265625, 7276.80224609375, 7531.82177734375, 7786.841796875, 8041.861328125, 8296.880859375, 8551.900390625, 8806.9208984375, 9061.9404296875, 9316.9599609375, 9571.9794921875, 9826.9990234375]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 0.0, 5.0, 5.0, 7.0, 15.0, 17.0, 33.0, 47.0, 60.0, 103.0, 151.0, 186.0, 339.0, 451.0, 737.0, 1118.0, 1816.0, 2772.0, 4551.0, 7430.0, 12409.0, 20750.0, 35590.0, 62010.0, 110063.0, 198096.0, 349615.0, 599872.0, 3684176.0, 504189.0, 301755.0, 169073.0, 94009.0, 53341.0, 30287.0, 17976.0, 10692.0, 6629.0, 3990.0, 2549.0, 1569.0, 1001.0, 675.0, 420.0, 303.0, 205.0, 132.0, 70.0, 49.0, 27.0, 27.0, 13.0, 20.0, 11.0, 7.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.337890625, -2.265655517578125, -2.19342041015625, -2.121185302734375, -2.0489501953125, -1.976715087890625, -1.90447998046875, -1.832244873046875, -1.760009765625, -1.687774658203125, -1.61553955078125, -1.543304443359375, -1.4710693359375, -1.398834228515625, -1.32659912109375, -1.254364013671875, -1.18212890625, -1.109893798828125, -1.03765869140625, -0.965423583984375, -0.8931884765625, -0.820953369140625, -0.74871826171875, -0.676483154296875, -0.604248046875, -0.532012939453125, -0.45977783203125, -0.387542724609375, -0.3153076171875, -0.243072509765625, -0.17083740234375, -0.098602294921875, -0.0263671875, 0.045867919921875, 0.11810302734375, 0.190338134765625, 0.2625732421875, 0.334808349609375, 0.40704345703125, 0.479278564453125, 0.551513671875, 0.623748779296875, 0.69598388671875, 0.768218994140625, 0.8404541015625, 0.912689208984375, 0.98492431640625, 1.057159423828125, 1.12939453125, 1.201629638671875, 1.27386474609375, 1.346099853515625, 1.4183349609375, 1.490570068359375, 1.56280517578125, 1.635040283203125, 1.707275390625, 1.779510498046875, 1.85174560546875, 1.923980712890625, 1.9962158203125, 2.068450927734375, 2.14068603515625, 2.212921142578125, 2.28515625]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 3.0, 3.0, 7.0, 3.0, 10.0, 19.0, 6.0, 7.0, 12.0, 22.0, 33.0, 17.0, 19.0, 27.0, 31.0, 29.0, 40.0, 33.0, 46.0, 38.0, 42.0, 88.0, 832.0, 213.0, 43.0, 33.0, 36.0, 33.0, 34.0, 32.0, 28.0, 16.0, 21.0, 32.0, 27.0, 22.0, 22.0, 13.0, 12.0, 11.0, 6.0, 11.0, 1.0, 2.0, 5.0, 5.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.328125, -12.9208984375, -12.513671875, -12.1064453125, -11.69921875, -11.2919921875, -10.884765625, -10.4775390625, -10.0703125, -9.6630859375, -9.255859375, -8.8486328125, -8.44140625, -8.0341796875, -7.626953125, -7.2197265625, -6.8125, -6.4052734375, -5.998046875, -5.5908203125, -5.18359375, -4.7763671875, -4.369140625, -3.9619140625, -3.5546875, -3.1474609375, -2.740234375, -2.3330078125, -1.92578125, -1.5185546875, -1.111328125, -0.7041015625, -0.296875, 0.1103515625, 0.517578125, 0.9248046875, 1.33203125, 1.7392578125, 2.146484375, 2.5537109375, 2.9609375, 3.3681640625, 3.775390625, 4.1826171875, 4.58984375, 4.9970703125, 5.404296875, 5.8115234375, 6.21875, 6.6259765625, 7.033203125, 7.4404296875, 7.84765625, 8.2548828125, 8.662109375, 9.0693359375, 9.4765625, 9.8837890625, 10.291015625, 10.6982421875, 11.10546875, 11.5126953125, 11.919921875, 12.3271484375, 12.734375]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 6.0, 1.0, 6.0, 11.0, 19.0, 34.0, 48.0, 68.0, 126.0, 153.0, 216.0, 352.0, 476.0, 752.0, 1114.0, 1630.0, 2460.0, 3701.0, 5660.0, 8442.0, 12475.0, 19033.0, 28912.0, 44903.0, 70424.0, 112093.0, 178745.0, 278647.0, 421329.0, 3070529.0, 986878.0, 368777.0, 243832.0, 155544.0, 97109.0, 61648.0, 39517.0, 25564.0, 16661.0, 11104.0, 7246.0, 5140.0, 3372.0, 2160.0, 1429.0, 1004.0, 680.0, 495.0, 311.0, 218.0, 125.0, 87.0, 60.0, 43.0, 33.0, 19.0, 8.0, 9.0, 6.0, 2.0, 3.0], "bins": [-1.8525390625, -1.796142578125, -1.73974609375, -1.683349609375, -1.626953125, -1.570556640625, -1.51416015625, -1.457763671875, -1.4013671875, -1.344970703125, -1.28857421875, -1.232177734375, -1.17578125, -1.119384765625, -1.06298828125, -1.006591796875, -0.9501953125, -0.893798828125, -0.83740234375, -0.781005859375, -0.724609375, -0.668212890625, -0.61181640625, -0.555419921875, -0.4990234375, -0.442626953125, -0.38623046875, -0.329833984375, -0.2734375, -0.217041015625, -0.16064453125, -0.104248046875, -0.0478515625, 0.008544921875, 0.06494140625, 0.121337890625, 0.177734375, 0.234130859375, 0.29052734375, 0.346923828125, 0.4033203125, 0.459716796875, 0.51611328125, 0.572509765625, 0.62890625, 0.685302734375, 0.74169921875, 0.798095703125, 0.8544921875, 0.910888671875, 0.96728515625, 1.023681640625, 1.080078125, 1.136474609375, 1.19287109375, 1.249267578125, 1.3056640625, 1.362060546875, 1.41845703125, 1.474853515625, 1.53125, 1.587646484375, 1.64404296875, 1.700439453125, 1.7568359375]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 1.0, 1.0, 5.0, 7.0, 6.0, 7.0, 16.0, 9.0, 16.0, 17.0, 18.0, 18.0, 26.0, 23.0, 24.0, 18.0, 23.0, 36.0, 34.0, 34.0, 37.0, 50.0, 135.0, 800.0, 209.0, 38.0, 35.0, 47.0, 27.0, 33.0, 28.0, 35.0, 26.0, 18.0, 23.0, 22.0, 22.0, 14.0, 20.0, 7.0, 17.0, 12.0, 9.0, 4.0, 7.0, 6.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-9.34375, -9.057861328125, -8.77197265625, -8.486083984375, -8.2001953125, -7.914306640625, -7.62841796875, -7.342529296875, -7.056640625, -6.770751953125, -6.48486328125, -6.198974609375, -5.9130859375, -5.627197265625, -5.34130859375, -5.055419921875, -4.76953125, -4.483642578125, -4.19775390625, -3.911865234375, -3.6259765625, -3.340087890625, -3.05419921875, -2.768310546875, -2.482421875, -2.196533203125, -1.91064453125, -1.624755859375, -1.3388671875, -1.052978515625, -0.76708984375, -0.481201171875, -0.1953125, 0.090576171875, 0.37646484375, 0.662353515625, 0.9482421875, 1.234130859375, 1.52001953125, 1.805908203125, 2.091796875, 2.377685546875, 2.66357421875, 2.949462890625, 3.2353515625, 3.521240234375, 3.80712890625, 4.093017578125, 4.37890625, 4.664794921875, 4.95068359375, 5.236572265625, 5.5224609375, 5.808349609375, 6.09423828125, 6.380126953125, 6.666015625, 6.951904296875, 7.23779296875, 7.523681640625, 7.8095703125, 8.095458984375, 8.38134765625, 8.667236328125, 8.953125]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 5.0, 4.0, 4.0, 4.0, 5.0, 8.0, 9.0, 18.0, 20.0, 10.0, 21.0, 38.0, 38.0, 81.0, 68.0, 119.0, 169.0, 197.0, 283.0, 427.0, 598.0, 808.0, 1206.0, 1833.0, 2902.0, 5337.0, 11094.0, 24666.0, 59230.0, 167166.0, 5748728.0, 159598.0, 57789.0, 23941.0, 10818.0, 5363.0, 3023.0, 1769.0, 1100.0, 790.0, 570.0, 371.0, 326.0, 239.0, 153.0, 126.0, 94.0, 69.0, 64.0, 38.0, 22.0, 15.0, 21.0, 2.0, 9.0, 12.0, 10.0, 9.0, 7.0, 4.0, 2.0, 1.0, 2.0], "bins": [-6.53125, -6.32379150390625, -6.1163330078125, -5.90887451171875, -5.701416015625, -5.49395751953125, -5.2864990234375, -5.07904052734375, -4.87158203125, -4.66412353515625, -4.4566650390625, -4.24920654296875, -4.041748046875, -3.83428955078125, -3.6268310546875, -3.41937255859375, -3.2119140625, -3.00445556640625, -2.7969970703125, -2.58953857421875, -2.382080078125, -2.17462158203125, -1.9671630859375, -1.75970458984375, -1.55224609375, -1.34478759765625, -1.1373291015625, -0.92987060546875, -0.722412109375, -0.51495361328125, -0.3074951171875, -0.10003662109375, 0.107421875, 0.31488037109375, 0.5223388671875, 0.72979736328125, 0.937255859375, 1.14471435546875, 1.3521728515625, 1.55963134765625, 1.76708984375, 1.97454833984375, 2.1820068359375, 2.38946533203125, 2.596923828125, 2.80438232421875, 3.0118408203125, 3.21929931640625, 3.4267578125, 3.63421630859375, 3.8416748046875, 4.04913330078125, 4.256591796875, 4.46405029296875, 4.6715087890625, 4.87896728515625, 5.08642578125, 5.29388427734375, 5.5013427734375, 5.70880126953125, 5.916259765625, 6.12371826171875, 6.3311767578125, 6.53863525390625, 6.74609375]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 1.0, 6.0, 10.0, 7.0, 13.0, 8.0, 11.0, 10.0, 17.0, 20.0, 25.0, 20.0, 30.0, 29.0, 36.0, 29.0, 38.0, 30.0, 45.0, 29.0, 54.0, 133.0, 708.0, 264.0, 50.0, 40.0, 43.0, 31.0, 27.0, 38.0, 27.0, 30.0, 21.0, 25.0, 18.0, 15.0, 16.0, 11.0, 17.0, 10.0, 8.0, 5.0, 4.0, 4.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-7.2265625, -7.01220703125, -6.7978515625, -6.58349609375, -6.369140625, -6.15478515625, -5.9404296875, -5.72607421875, -5.51171875, -5.29736328125, -5.0830078125, -4.86865234375, -4.654296875, -4.43994140625, -4.2255859375, -4.01123046875, -3.796875, -3.58251953125, -3.3681640625, -3.15380859375, -2.939453125, -2.72509765625, -2.5107421875, -2.29638671875, -2.08203125, -1.86767578125, -1.6533203125, -1.43896484375, -1.224609375, -1.01025390625, -0.7958984375, -0.58154296875, -0.3671875, -0.15283203125, 0.0615234375, 0.27587890625, 0.490234375, 0.70458984375, 0.9189453125, 1.13330078125, 1.34765625, 1.56201171875, 1.7763671875, 1.99072265625, 2.205078125, 2.41943359375, 2.6337890625, 2.84814453125, 3.0625, 3.27685546875, 3.4912109375, 3.70556640625, 3.919921875, 4.13427734375, 4.3486328125, 4.56298828125, 4.77734375, 4.99169921875, 5.2060546875, 5.42041015625, 5.634765625, 5.84912109375, 6.0634765625, 6.27783203125, 6.4921875]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 6.0, 1.0, 6.0, 10.0, 14.0, 28.0, 46.0, 92.0, 130.0, 187.0, 195.0, 112.0, 82.0, 53.0, 23.0, 8.0, 10.0, 1.0, 5.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.500179290771484, -21.858583450317383, -21.21698570251465, -20.575389862060547, -19.933792114257812, -19.29219627380371, -18.650598526000977, -18.009002685546875, -17.36740493774414, -16.72580909729004, -16.084211349487305, -15.442614555358887, -14.801017761230469, -14.159421920776367, -13.51782512664795, -12.876228332519531, -12.23463249206543, -11.593035697937012, -10.951438903808594, -10.309842109680176, -9.668245315551758, -9.026649475097656, -8.385052680969238, -7.74345588684082, -7.101859092712402, -6.460262298583984, -5.818665504455566, -5.177069187164307, -4.535472393035889, -3.8938755989074707, -3.252279043197632, -2.610682487487793, -1.9690837860107422, -1.3274871110916138, -0.6858904361724854, -0.044293761253356934, 0.5973029136657715, 1.2388997077941895, 1.8804962635040283, 2.522092819213867, 3.163689613342285, 3.805286407470703, 4.446883201599121, 5.088479518890381, 5.730076313018799, 6.371673107147217, 7.013269424438477, 7.6548662185668945, 8.296463012695312, 8.93805980682373, 9.579656600952148, 10.221253395080566, 10.862850189208984, 11.504446029663086, 12.146042823791504, 12.787639617919922, 13.42923641204834, 14.070833206176758, 14.712430000305176, 15.354026794433594, 15.995622634887695, 16.63722038269043, 17.27881622314453, 17.920413970947266, 18.562009811401367]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 4.0, 6.0, 4.0, 6.0, 12.0, 8.0, 11.0, 11.0, 10.0, 17.0, 27.0, 14.0, 29.0, 22.0, 19.0, 23.0, 29.0, 27.0, 25.0, 38.0, 42.0, 27.0, 29.0, 34.0, 48.0, 33.0, 30.0, 30.0, 38.0, 38.0, 32.0, 26.0, 36.0, 16.0, 28.0, 29.0, 18.0, 18.0, 20.0, 17.0, 18.0, 6.0, 8.0, 13.0, 8.0, 6.0, 5.0, 4.0, 3.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.744325637817383, -8.459771156311035, -8.175216674804688, -7.89066219329834, -7.606107711791992, -7.3215532302856445, -7.036999225616455, -6.752444744110107, -6.46789026260376, -6.183335781097412, -5.8987812995910645, -5.614226818084717, -5.329672813415527, -5.04511833190918, -4.760563850402832, -4.476009368896484, -4.191454887390137, -3.906900405883789, -3.6223459243774414, -3.337791681289673, -3.053237199783325, -2.7686827182769775, -2.484128475189209, -2.1995739936828613, -1.9150195121765137, -1.630465030670166, -1.345910668373108, -1.0613563060760498, -0.7768018245697021, -0.4922473430633545, -0.2076929807662964, 0.07686138153076172, 0.3614158630371094, 0.6459702849388123, 0.9305247068405151, 1.2150790691375732, 1.499633550643921, 1.7841880321502686, 2.068742275238037, 2.3532967567443848, 2.6378512382507324, 2.92240571975708, 3.2069602012634277, 3.4915144443511963, 3.776068925857544, 4.0606231689453125, 4.34517765045166, 4.629732131958008, 4.9142866134643555, 5.198841094970703, 5.483395576477051, 5.767950057983398, 6.052504539489746, 6.337059020996094, 6.621613025665283, 6.906167507171631, 7.1907219886779785, 7.475276470184326, 7.759830951690674, 8.044384956359863, 8.328939437866211, 8.613493919372559, 8.898048400878906, 9.182602882385254, 9.467157363891602]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 1.0, 3.0, 2.0, 10.0, 13.0, 16.0, 22.0, 36.0, 46.0, 80.0, 131.0, 195.0, 365.0, 585.0, 1125.0, 2206.0, 5200.0, 14904.0, 89357.0, 4009739.0, 50063.0, 11454.0, 4247.0, 1976.0, 1020.0, 573.0, 316.0, 191.0, 131.0, 65.0, 67.0, 33.0, 31.0, 20.0, 21.0, 14.0, 5.0, 5.0, 7.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.471435546875, -0.4535560607910156, -0.43567657470703125, -0.4177970886230469, -0.3999176025390625, -0.3820381164550781, -0.36415863037109375, -0.3462791442871094, -0.328399658203125, -0.3105201721191406, -0.29264068603515625, -0.2747611999511719, -0.2568817138671875, -0.23900222778320312, -0.22112274169921875, -0.20324325561523438, -0.18536376953125, -0.16748428344726562, -0.14960479736328125, -0.13172531127929688, -0.1138458251953125, -0.09596633911132812, -0.07808685302734375, -0.060207366943359375, -0.042327880859375, -0.024448394775390625, -0.00656890869140625, 0.011310577392578125, 0.0291900634765625, 0.047069549560546875, 0.06494903564453125, 0.08282852172851562, 0.1007080078125, 0.11858749389648438, 0.13646697998046875, 0.15434646606445312, 0.1722259521484375, 0.19010543823242188, 0.20798492431640625, 0.22586441040039062, 0.243743896484375, 0.2616233825683594, 0.27950286865234375, 0.2973823547363281, 0.3152618408203125, 0.3331413269042969, 0.35102081298828125, 0.3689002990722656, 0.38677978515625, 0.4046592712402344, 0.42253875732421875, 0.4404182434082031, 0.4582977294921875, 0.4761772155761719, 0.49405670166015625, 0.5119361877441406, 0.529815673828125, 0.5476951599121094, 0.5655746459960938, 0.5834541320800781, 0.6013336181640625, 0.6192131042480469, 0.6370925903320312, 0.6549720764160156, 0.6728515625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 4.0, 5.0, 8.0, 7.0, 7.0, 15.0, 10.0, 8.0, 16.0, 27.0, 772.0, 13.0, 8.0, 15.0, 14.0, 12.0, 12.0, 11.0, 2.0, 5.0, 4.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.07940673828125, -0.07672309875488281, -0.07403945922851562, -0.07135581970214844, -0.06867218017578125, -0.06598854064941406, -0.06330490112304688, -0.06062126159667969, -0.0579376220703125, -0.05525398254394531, -0.052570343017578125, -0.04988670349121094, -0.04720306396484375, -0.04451942443847656, -0.041835784912109375, -0.03915214538574219, -0.036468505859375, -0.03378486633300781, -0.031101226806640625, -0.028417587280273438, -0.02573394775390625, -0.023050308227539062, -0.020366668701171875, -0.017683029174804688, -0.0149993896484375, -0.012315750122070312, -0.009632110595703125, -0.0069484710693359375, -0.00426483154296875, -0.0015811920166015625, 0.001102447509765625, 0.0037860870361328125, 0.0064697265625, 0.009153366088867188, 0.011837005615234375, 0.014520645141601562, 0.01720428466796875, 0.019887924194335938, 0.022571563720703125, 0.025255203247070312, 0.0279388427734375, 0.030622482299804688, 0.033306121826171875, 0.03598976135253906, 0.03867340087890625, 0.04135704040527344, 0.044040679931640625, 0.04672431945800781, 0.049407958984375, 0.05209159851074219, 0.054775238037109375, 0.05745887756347656, 0.06014251708984375, 0.06282615661621094, 0.06550979614257812, 0.06819343566894531, 0.0708770751953125, 0.07356071472167969, 0.07624435424804688, 0.07892799377441406, 0.08161163330078125, 0.08429527282714844, 0.08697891235351562, 0.08966255187988281, 0.09234619140625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 6.0, 3.0, 4.0, 8.0, 15.0, 10.0, 7.0, 19.0, 37.0, 48.0, 112.0, 175.0, 374.0, 846.0, 1947.0, 4743.0, 12497.0, 41561.0, 204650.0, 3098632.0, 704492.0, 86848.0, 23075.0, 8182.0, 3271.0, 1353.0, 609.0, 327.0, 166.0, 101.0, 47.0, 31.0, 26.0, 11.0, 7.0, 7.0, 5.0, 7.0, 2.0, 2.0, 5.0, 5.0, 3.0, 6.0, 3.0, 3.0], "bins": [-0.452880859375, -0.4408836364746094, -0.42888641357421875, -0.4168891906738281, -0.4048919677734375, -0.3928947448730469, -0.38089752197265625, -0.3689002990722656, -0.356903076171875, -0.3449058532714844, -0.33290863037109375, -0.3209114074707031, -0.3089141845703125, -0.2969169616699219, -0.28491973876953125, -0.2729225158691406, -0.26092529296875, -0.24892807006835938, -0.23693084716796875, -0.22493362426757812, -0.2129364013671875, -0.20093917846679688, -0.18894195556640625, -0.17694473266601562, -0.164947509765625, -0.15295028686523438, -0.14095306396484375, -0.12895584106445312, -0.1169586181640625, -0.10496139526367188, -0.09296417236328125, -0.08096694946289062, -0.0689697265625, -0.056972503662109375, -0.04497528076171875, -0.032978057861328125, -0.0209808349609375, -0.008983612060546875, 0.00301361083984375, 0.015010833740234375, 0.027008056640625, 0.039005279541015625, 0.05100250244140625, 0.06299972534179688, 0.0749969482421875, 0.08699417114257812, 0.09899139404296875, 0.11098861694335938, 0.12298583984375, 0.13498306274414062, 0.14698028564453125, 0.15897750854492188, 0.1709747314453125, 0.18297195434570312, 0.19496917724609375, 0.20696640014648438, 0.218963623046875, 0.23096084594726562, 0.24295806884765625, 0.2549552917480469, 0.2669525146484375, 0.2789497375488281, 0.29094696044921875, 0.3029441833496094, 0.31494140625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 4.0, 5.0, 8.0, 4.0, 11.0, 4.0, 10.0, 15.0, 21.0, 32.0, 31.0, 46.0, 64.0, 81.0, 114.0, 187.0, 311.0, 586.0, 1024.0, 576.0, 265.0, 182.0, 128.0, 77.0, 57.0, 42.0, 39.0, 29.0, 25.0, 10.0, 16.0, 9.0, 10.0, 10.0, 10.0, 2.0, 2.0, 3.0, 6.0, 2.0, 6.0, 3.0, 3.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.090087890625, -0.08702945709228516, -0.08397102355957031, -0.08091259002685547, -0.07785415649414062, -0.07479572296142578, -0.07173728942871094, -0.0686788558959961, -0.06562042236328125, -0.0625619888305664, -0.05950355529785156, -0.05644512176513672, -0.053386688232421875, -0.05032825469970703, -0.04726982116699219, -0.044211387634277344, -0.0411529541015625, -0.038094520568847656, -0.03503608703613281, -0.03197765350341797, -0.028919219970703125, -0.02586078643798828, -0.022802352905273438, -0.019743919372558594, -0.01668548583984375, -0.013627052307128906, -0.010568618774414062, -0.007510185241699219, -0.004451751708984375, -0.0013933181762695312, 0.0016651153564453125, 0.004723548889160156, 0.007781982421875, 0.010840415954589844, 0.013898849487304688, 0.01695728302001953, 0.020015716552734375, 0.02307415008544922, 0.026132583618164062, 0.029191017150878906, 0.03224945068359375, 0.035307884216308594, 0.03836631774902344, 0.04142475128173828, 0.044483184814453125, 0.04754161834716797, 0.05060005187988281, 0.053658485412597656, 0.0567169189453125, 0.059775352478027344, 0.06283378601074219, 0.06589221954345703, 0.06895065307617188, 0.07200908660888672, 0.07506752014160156, 0.0781259536743164, 0.08118438720703125, 0.0842428207397461, 0.08730125427246094, 0.09035968780517578, 0.09341812133789062, 0.09647655487060547, 0.09953498840332031, 0.10259342193603516, 0.10565185546875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 11.0, 38.0, 60.0, 179.0, 287.0, 261.0, 99.0, 37.0, 20.0, 6.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8512928485870361, -1.8008859157562256, -1.7504788637161255, -1.700071930885315, -1.6496648788452148, -1.5992579460144043, -1.5488510131835938, -1.4984440803527832, -1.448037028312683, -1.3976300954818726, -1.3472230434417725, -1.296816110610962, -1.2464091777801514, -1.1960021257400513, -1.1455951929092407, -1.0951881408691406, -1.04478120803833, -0.9943742156028748, -0.9439672231674194, -0.8935602903366089, -0.8431532979011536, -0.7927463054656982, -0.7423393726348877, -0.6919323801994324, -0.641525387763977, -0.5911183953285217, -0.5407114028930664, -0.49030447006225586, -0.43989747762680054, -0.3894904851913452, -0.3390835225582123, -0.28867655992507935, -0.23826956748962402, -0.1878625899553299, -0.13745561242103577, -0.08704863488674164, -0.03664165735244751, 0.013765335083007812, 0.06417229771614075, 0.11457926034927368, 0.164986252784729, 0.21539323031902313, 0.26580020785331726, 0.3162071704864502, 0.3666141629219055, 0.41702115535736084, 0.4674281179904938, 0.5178350806236267, 0.568242073059082, 0.6186490654945374, 0.6690560579299927, 0.7194629907608032, 0.7698699831962585, 0.8202769756317139, 0.8706839084625244, 0.9210909008979797, 0.9714978933334351, 1.0219048261642456, 1.0723118782043457, 1.1227188110351562, 1.1731257438659668, 1.223532795906067, 1.2739397287368774, 1.3243467807769775, 1.374753713607788]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 8.0, 7.0, 11.0, 12.0, 18.0, 30.0, 25.0, 40.0, 53.0, 70.0, 72.0, 72.0, 74.0, 95.0, 75.0, 57.0, 61.0, 52.0, 44.0, 36.0, 21.0, 23.0, 20.0, 9.0, 9.0, 4.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.0255264043807983, -1.0026744604110718, -0.9798226356506348, -0.9569706916809082, -0.9341188073158264, -0.9112669229507446, -0.8884149789810181, -0.8655630946159363, -0.8427112102508545, -0.8198593258857727, -0.7970074415206909, -0.7741554975509644, -0.7513036131858826, -0.7284517288208008, -0.7055997848510742, -0.6827479004859924, -0.6598960161209106, -0.6370441317558289, -0.6141922473907471, -0.5913403034210205, -0.5684884190559387, -0.5456365346908569, -0.5227845907211304, -0.4999327063560486, -0.4770808219909668, -0.454228937625885, -0.43137702345848083, -0.40852510929107666, -0.3856732249259949, -0.3628213405609131, -0.3399694263935089, -0.31711751222610474, -0.2942655682563782, -0.2714136838912964, -0.2485617697238922, -0.22570987045764923, -0.20285797119140625, -0.18000607192516327, -0.1571541726589203, -0.1343022733926773, -0.11145037412643433, -0.08859847486019135, -0.06574657559394836, -0.04289467632770538, -0.020042777061462402, 0.0028091222047805786, 0.02566102147102356, 0.04851292073726654, 0.07136482000350952, 0.0942167192697525, 0.11706861853599548, 0.13992051780223846, 0.16277241706848145, 0.18562431633472443, 0.2084762156009674, 0.2313281148672104, 0.25418001413345337, 0.27703189849853516, 0.29988381266593933, 0.3227357268333435, 0.3455876111984253, 0.3684394955635071, 0.39129140973091125, 0.41414332389831543, 0.4369952082633972]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 5.0, 5.0, 14.0, 10.0, 14.0, 34.0, 43.0, 59.0, 123.0, 162.0, 242.0, 385.0, 618.0, 898.0, 1563.0, 2560.0, 4411.0, 8317.0, 17779.0, 44948.0, 772837.0, 140738.0, 26099.0, 11948.0, 6219.0, 3303.0, 1968.0, 1190.0, 721.0, 437.0, 318.0, 191.0, 116.0, 86.0, 65.0, 52.0, 25.0, 19.0, 10.0, 14.0, 7.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35595703125, -0.3443794250488281, -0.33280181884765625, -0.3212242126464844, -0.3096466064453125, -0.2980690002441406, -0.28649139404296875, -0.2749137878417969, -0.263336181640625, -0.2517585754394531, -0.24018096923828125, -0.22860336303710938, -0.2170257568359375, -0.20544815063476562, -0.19387054443359375, -0.18229293823242188, -0.17071533203125, -0.15913772583007812, -0.14756011962890625, -0.13598251342773438, -0.1244049072265625, -0.11282730102539062, -0.10124969482421875, -0.08967208862304688, -0.078094482421875, -0.06651687622070312, -0.05493927001953125, -0.043361663818359375, -0.0317840576171875, -0.020206451416015625, -0.00862884521484375, 0.002948760986328125, 0.0145263671875, 0.026103973388671875, 0.03768157958984375, 0.049259185791015625, 0.0608367919921875, 0.07241439819335938, 0.08399200439453125, 0.09556961059570312, 0.107147216796875, 0.11872482299804688, 0.13030242919921875, 0.14188003540039062, 0.1534576416015625, 0.16503524780273438, 0.17661285400390625, 0.18819046020507812, 0.19976806640625, 0.21134567260742188, 0.22292327880859375, 0.23450088500976562, 0.2460784912109375, 0.2576560974121094, 0.26923370361328125, 0.2808113098144531, 0.292388916015625, 0.3039665222167969, 0.31554412841796875, 0.3271217346191406, 0.3386993408203125, 0.3502769470214844, 0.36185455322265625, 0.3734321594238281, 0.385009765625]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 4.0, 6.0, 6.0, 6.0, 13.0, 7.0, 19.0, 30.0, 87.0, 228.0, 297.0, 152.0, 49.0, 6.0, 15.0, 7.0, 15.0, 9.0, 4.0, 3.0, 6.0, 5.0, 3.0, 2.0, 2.0, 0.0, 4.0, 1.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0693359375, -0.06704330444335938, -0.06475067138671875, -0.062458038330078125, -0.0601654052734375, -0.057872772216796875, -0.05558013916015625, -0.053287506103515625, -0.050994873046875, -0.048702239990234375, -0.04640960693359375, -0.044116973876953125, -0.0418243408203125, -0.039531707763671875, -0.03723907470703125, -0.034946441650390625, -0.03265380859375, -0.030361175537109375, -0.02806854248046875, -0.025775909423828125, -0.0234832763671875, -0.021190643310546875, -0.01889801025390625, -0.016605377197265625, -0.014312744140625, -0.012020111083984375, -0.00972747802734375, -0.007434844970703125, -0.0051422119140625, -0.002849578857421875, -0.00055694580078125, 0.001735687255859375, 0.0040283203125, 0.006320953369140625, 0.00861358642578125, 0.010906219482421875, 0.0131988525390625, 0.015491485595703125, 0.01778411865234375, 0.020076751708984375, 0.022369384765625, 0.024662017822265625, 0.02695465087890625, 0.029247283935546875, 0.0315399169921875, 0.033832550048828125, 0.03612518310546875, 0.038417816162109375, 0.04071044921875, 0.043003082275390625, 0.04529571533203125, 0.047588348388671875, 0.0498809814453125, 0.052173614501953125, 0.05446624755859375, 0.056758880615234375, 0.059051513671875, 0.061344146728515625, 0.06363677978515625, 0.06592941284179688, 0.0682220458984375, 0.07051467895507812, 0.07280731201171875, 0.07509994506835938, 0.077392578125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 9.0, 9.0, 18.0, 27.0, 41.0, 64.0, 96.0, 152.0, 242.0, 402.0, 676.0, 1235.0, 2133.0, 4081.0, 7828.0, 15211.0, 31106.0, 66597.0, 144195.0, 292262.0, 253453.0, 120212.0, 55004.0, 26137.0, 12862.0, 6518.0, 3378.0, 1944.0, 1048.0, 606.0, 392.0, 214.0, 138.0, 92.0, 57.0, 32.0, 18.0, 15.0, 19.0, 11.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2120361328125, -0.2053852081298828, -0.19873428344726562, -0.19208335876464844, -0.18543243408203125, -0.17878150939941406, -0.17213058471679688, -0.1654796600341797, -0.1588287353515625, -0.1521778106689453, -0.14552688598632812, -0.13887596130371094, -0.13222503662109375, -0.12557411193847656, -0.11892318725585938, -0.11227226257324219, -0.105621337890625, -0.09897041320800781, -0.09231948852539062, -0.08566856384277344, -0.07901763916015625, -0.07236671447753906, -0.06571578979492188, -0.05906486511230469, -0.0524139404296875, -0.04576301574707031, -0.039112091064453125, -0.03246116638183594, -0.02581024169921875, -0.019159317016601562, -0.012508392333984375, -0.0058574676513671875, 0.00079345703125, 0.0074443817138671875, 0.014095306396484375, 0.020746231079101562, 0.02739715576171875, 0.03404808044433594, 0.040699005126953125, 0.04734992980957031, 0.0540008544921875, 0.06065177917480469, 0.06730270385742188, 0.07395362854003906, 0.08060455322265625, 0.08725547790527344, 0.09390640258789062, 0.10055732727050781, 0.107208251953125, 0.11385917663574219, 0.12051010131835938, 0.12716102600097656, 0.13381195068359375, 0.14046287536621094, 0.14711380004882812, 0.1537647247314453, 0.1604156494140625, 0.1670665740966797, 0.17371749877929688, 0.18036842346191406, 0.18701934814453125, 0.19367027282714844, 0.20032119750976562, 0.2069721221923828, 0.213623046875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 7.0, 3.0, 11.0, 3.0, 11.0, 11.0, 15.0, 13.0, 22.0, 16.0, 25.0, 25.0, 29.0, 22.0, 24.0, 25.0, 30.0, 31.0, 34.0, 38.0, 45.0, 49.0, 25.0, 44.0, 36.0, 48.0, 29.0, 26.0, 39.0, 40.0, 33.0, 32.0, 31.0, 24.0, 22.0, 22.0, 16.0, 11.0, 5.0, 6.0, 12.0, 1.0, 3.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.240478515625, -0.2324676513671875, -0.224456787109375, -0.2164459228515625, -0.20843505859375, -0.2004241943359375, -0.192413330078125, -0.1844024658203125, -0.1763916015625, -0.1683807373046875, -0.160369873046875, -0.1523590087890625, -0.14434814453125, -0.1363372802734375, -0.128326416015625, -0.1203155517578125, -0.1123046875, -0.1042938232421875, -0.096282958984375, -0.0882720947265625, -0.08026123046875, -0.0722503662109375, -0.064239501953125, -0.0562286376953125, -0.0482177734375, -0.0402069091796875, -0.032196044921875, -0.0241851806640625, -0.01617431640625, -0.0081634521484375, -0.000152587890625, 0.0078582763671875, 0.015869140625, 0.0238800048828125, 0.031890869140625, 0.0399017333984375, 0.04791259765625, 0.0559234619140625, 0.063934326171875, 0.0719451904296875, 0.0799560546875, 0.0879669189453125, 0.095977783203125, 0.1039886474609375, 0.11199951171875, 0.1200103759765625, 0.128021240234375, 0.1360321044921875, 0.14404296875, 0.1520538330078125, 0.160064697265625, 0.1680755615234375, 0.17608642578125, 0.1840972900390625, 0.192108154296875, 0.2001190185546875, 0.2081298828125, 0.2161407470703125, 0.224151611328125, 0.2321624755859375, 0.24017333984375, 0.2481842041015625, 0.256195068359375, 0.2642059326171875, 0.272216796875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 6.0, 4.0, 4.0, 11.0, 11.0, 27.0, 42.0, 50.0, 116.0, 186.0, 434.0, 1195.0, 4870.0, 49527.0, 917051.0, 67141.0, 5572.0, 1346.0, 501.0, 199.0, 110.0, 50.0, 39.0, 21.0, 15.0, 10.0, 7.0, 4.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4033203125, -0.389190673828125, -0.37506103515625, -0.360931396484375, -0.3468017578125, -0.332672119140625, -0.31854248046875, -0.304412841796875, -0.290283203125, -0.276153564453125, -0.26202392578125, -0.247894287109375, -0.2337646484375, -0.219635009765625, -0.20550537109375, -0.191375732421875, -0.17724609375, -0.163116455078125, -0.14898681640625, -0.134857177734375, -0.1207275390625, -0.106597900390625, -0.09246826171875, -0.078338623046875, -0.064208984375, -0.050079345703125, -0.03594970703125, -0.021820068359375, -0.0076904296875, 0.006439208984375, 0.02056884765625, 0.034698486328125, 0.048828125, 0.062957763671875, 0.07708740234375, 0.091217041015625, 0.1053466796875, 0.119476318359375, 0.13360595703125, 0.147735595703125, 0.161865234375, 0.175994873046875, 0.19012451171875, 0.204254150390625, 0.2183837890625, 0.232513427734375, 0.24664306640625, 0.260772705078125, 0.27490234375, 0.289031982421875, 0.30316162109375, 0.317291259765625, 0.3314208984375, 0.345550537109375, 0.35968017578125, 0.373809814453125, 0.387939453125, 0.402069091796875, 0.41619873046875, 0.430328369140625, 0.4444580078125, 0.458587646484375, 0.47271728515625, 0.486846923828125, 0.5009765625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 3.0, 2.0, 8.0, 7.0, 9.0, 9.0, 15.0, 21.0, 26.0, 36.0, 59.0, 65.0, 95.0, 77.0, 104.0, 125.0, 95.0, 69.0, 48.0, 34.0, 32.0, 12.0, 24.0, 11.0, 1.0, 7.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5391578674316406e-05, -2.4498440325260162e-05, -2.360530197620392e-05, -2.2712163627147675e-05, -2.181902527809143e-05, -2.0925886929035187e-05, -2.0032748579978943e-05, -1.91396102309227e-05, -1.8246471881866455e-05, -1.735333353281021e-05, -1.6460195183753967e-05, -1.5567056834697723e-05, -1.467391848564148e-05, -1.3780780136585236e-05, -1.2887641787528992e-05, -1.1994503438472748e-05, -1.1101365089416504e-05, -1.020822674036026e-05, -9.315088391304016e-06, -8.421950042247772e-06, -7.528811693191528e-06, -6.6356733441352844e-06, -5.7425349950790405e-06, -4.849396646022797e-06, -3.956258296966553e-06, -3.063119947910309e-06, -2.169981598854065e-06, -1.276843249797821e-06, -3.8370490074157715e-07, 5.094334483146667e-07, 1.4025717973709106e-06, 2.2957101464271545e-06, 3.1888484954833984e-06, 4.081986844539642e-06, 4.975125193595886e-06, 5.86826354265213e-06, 6.761401891708374e-06, 7.654540240764618e-06, 8.547678589820862e-06, 9.440816938877106e-06, 1.033395528793335e-05, 1.1227093636989594e-05, 1.2120231986045837e-05, 1.3013370335102081e-05, 1.3906508684158325e-05, 1.4799647033214569e-05, 1.5692785382270813e-05, 1.6585923731327057e-05, 1.74790620803833e-05, 1.8372200429439545e-05, 1.926533877849579e-05, 2.0158477127552032e-05, 2.1051615476608276e-05, 2.194475382566452e-05, 2.2837892174720764e-05, 2.3731030523777008e-05, 2.4624168872833252e-05, 2.5517307221889496e-05, 2.641044557094574e-05, 2.7303583920001984e-05, 2.8196722269058228e-05, 2.908986061811447e-05, 2.9982998967170715e-05, 3.087613731622696e-05, 3.17692756652832e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 4.0, 12.0, 11.0, 14.0, 29.0, 43.0, 61.0, 94.0, 184.0, 356.0, 815.0, 2037.0, 6514.0, 28963.0, 204637.0, 665232.0, 113338.0, 18630.0, 4754.0, 1527.0, 628.0, 285.0, 159.0, 88.0, 52.0, 21.0, 27.0, 14.0, 7.0, 6.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23583984375, -0.22877120971679688, -0.22170257568359375, -0.21463394165039062, -0.2075653076171875, -0.20049667358398438, -0.19342803955078125, -0.18635940551757812, -0.179290771484375, -0.17222213745117188, -0.16515350341796875, -0.15808486938476562, -0.1510162353515625, -0.14394760131835938, -0.13687896728515625, -0.12981033325195312, -0.12274169921875, -0.11567306518554688, -0.10860443115234375, -0.10153579711914062, -0.0944671630859375, -0.08739852905273438, -0.08032989501953125, -0.07326126098632812, -0.066192626953125, -0.059123992919921875, -0.05205535888671875, -0.044986724853515625, -0.0379180908203125, -0.030849456787109375, -0.02378082275390625, -0.016712188720703125, -0.0096435546875, -0.002574920654296875, 0.00449371337890625, 0.011562347412109375, 0.0186309814453125, 0.025699615478515625, 0.03276824951171875, 0.039836883544921875, 0.046905517578125, 0.053974151611328125, 0.06104278564453125, 0.06811141967773438, 0.0751800537109375, 0.08224868774414062, 0.08931732177734375, 0.09638595581054688, 0.10345458984375, 0.11052322387695312, 0.11759185791015625, 0.12466049194335938, 0.1317291259765625, 0.13879776000976562, 0.14586639404296875, 0.15293502807617188, 0.160003662109375, 0.16707229614257812, 0.17414093017578125, 0.18120956420898438, 0.1882781982421875, 0.19534683227539062, 0.20241546630859375, 0.20948410034179688, 0.216552734375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 11.0, 6.0, 15.0, 17.0, 26.0, 43.0, 65.0, 96.0, 96.0, 119.0, 92.0, 100.0, 87.0, 74.0, 43.0, 37.0, 21.0, 22.0, 12.0, 5.0, 7.0, 3.0, 1.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1651611328125, -0.1580371856689453, -0.15091323852539062, -0.14378929138183594, -0.13666534423828125, -0.12954139709472656, -0.12241744995117188, -0.11529350280761719, -0.1081695556640625, -0.10104560852050781, -0.09392166137695312, -0.08679771423339844, -0.07967376708984375, -0.07254981994628906, -0.06542587280273438, -0.05830192565917969, -0.051177978515625, -0.04405403137207031, -0.036930084228515625, -0.029806137084960938, -0.02268218994140625, -0.015558242797851562, -0.008434295654296875, -0.0013103485107421875, 0.0058135986328125, 0.012937545776367188, 0.020061492919921875, 0.027185440063476562, 0.03430938720703125, 0.04143333435058594, 0.048557281494140625, 0.05568122863769531, 0.06280517578125, 0.06992912292480469, 0.07705307006835938, 0.08417701721191406, 0.09130096435546875, 0.09842491149902344, 0.10554885864257812, 0.11267280578613281, 0.1197967529296875, 0.1269207000732422, 0.13404464721679688, 0.14116859436035156, 0.14829254150390625, 0.15541648864746094, 0.16254043579101562, 0.1696643829345703, 0.176788330078125, 0.1839122772216797, 0.19103622436523438, 0.19816017150878906, 0.20528411865234375, 0.21240806579589844, 0.21953201293945312, 0.2266559600830078, 0.2337799072265625, 0.2409038543701172, 0.24802780151367188, 0.25515174865722656, 0.26227569580078125, 0.26939964294433594, 0.2765235900878906, 0.2836475372314453, 0.290771484375]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 4.0, 10.0, 16.0, 28.0, 44.0, 94.0, 182.0, 248.0, 169.0, 96.0, 35.0, 27.0, 14.0, 16.0, 9.0, 5.0, 0.0, 1.0, 1.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.034984111785889, -3.91035532951355, -3.78572678565979, -3.661098003387451, -3.5364692211151123, -3.4118406772613525, -3.2872118949890137, -3.162583351135254, -3.037954568862915, -2.913325786590576, -2.7886972427368164, -2.6640684604644775, -2.5394396781921387, -2.414811134338379, -2.29018235206604, -2.165553569793701, -2.0409250259399414, -1.916296362876892, -1.7916675806045532, -1.667038917541504, -1.5424102544784546, -1.4177815914154053, -1.2931528091430664, -1.168524146080017, -1.0438952445983887, -0.9192665219306946, -0.7946378588676453, -0.6700091361999512, -0.5453804731369019, -0.42075175046920776, -0.29612302780151367, -0.17149436473846436, -0.04686570167541504, 0.07776299864053726, 0.20239169895648956, 0.32702040672302246, 0.45164909958839417, 0.5762777924537659, 0.70090651512146, 0.8255351781845093, 0.9501639008522034, 1.0747926235198975, 1.1994212865829468, 1.324049949645996, 1.448678731918335, 1.5733073949813843, 1.6979360580444336, 1.8225648403167725, 1.9471935033798218, 2.071822166442871, 2.19645094871521, 2.321079730987549, 2.4457082748413086, 2.5703370571136475, 2.6949658393859863, 2.819594383239746, 2.944223165512085, 3.068851947784424, 3.1934804916381836, 3.3181092739105225, 3.4427380561828613, 3.567366600036621, 3.69199538230896, 3.816624164581299, 3.9412527084350586]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 2.0, 4.0, 2.0, 2.0, 5.0, 6.0, 13.0, 9.0, 34.0, 51.0, 92.0, 108.0, 188.0, 154.0, 135.0, 74.0, 46.0, 15.0, 19.0, 12.0, 7.0, 4.0, 11.0, 3.0, 5.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.95341682434082, -6.748269557952881, -6.543121814727783, -6.337974548339844, -6.132827281951904, -5.927680015563965, -5.722532272338867, -5.517385005950928, -5.312237739562988, -5.107090473175049, -4.901942729949951, -4.696795463562012, -4.491648197174072, -4.286500930786133, -4.081353187561035, -3.8762059211730957, -3.671058416366577, -3.4659109115600586, -3.260763645172119, -3.0556161403656006, -2.850468873977661, -2.6453213691711426, -2.440174102783203, -2.2350265979766846, -2.029879093170166, -1.824731707572937, -1.619584321975708, -1.4144368171691895, -1.20928955078125, -1.0041420459747314, -0.7989946603775024, -0.5938472747802734, -0.388700008392334, -0.1835526078939438, 0.02159479260444641, 0.2267422080039978, 0.4318895936012268, 0.6370370388031006, 0.8421844244003296, 1.0473318099975586, 1.2524791955947876, 1.4576265811920166, 1.6627739667892456, 1.8679213523864746, 2.073068857192993, 2.2782163619995117, 2.483363628387451, 2.6885108947753906, 2.893658399581909, 3.0988059043884277, 3.303953170776367, 3.5091006755828857, 3.714247941970825, 3.9193954467773438, 4.124542713165283, 4.329689979553223, 4.53483772277832, 4.73998498916626, 4.945132732391357, 5.150279998779297, 5.355427265167236, 5.560574531555176, 5.765722274780273, 5.970869541168213, 6.176016807556152]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 8.0, 7.0, 7.0, 6.0, 12.0, 10.0, 17.0, 23.0, 36.0, 58.0, 76.0, 100.0, 167.0, 267.0, 462.0, 952.0, 1997.0, 5326.0, 22631.0, 837696.0, 3284164.0, 28422.0, 6800.0, 2479.0, 1165.0, 558.0, 315.0, 181.0, 119.0, 70.0, 40.0, 25.0, 20.0, 18.0, 17.0, 12.0, 7.0, 7.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.28125, -1.24468994140625, -1.2081298828125, -1.17156982421875, -1.135009765625, -1.09844970703125, -1.0618896484375, -1.02532958984375, -0.98876953125, -0.95220947265625, -0.9156494140625, -0.87908935546875, -0.842529296875, -0.80596923828125, -0.7694091796875, -0.73284912109375, -0.6962890625, -0.65972900390625, -0.6231689453125, -0.58660888671875, -0.550048828125, -0.51348876953125, -0.4769287109375, -0.44036865234375, -0.40380859375, -0.36724853515625, -0.3306884765625, -0.29412841796875, -0.257568359375, -0.22100830078125, -0.1844482421875, -0.14788818359375, -0.111328125, -0.07476806640625, -0.0382080078125, -0.00164794921875, 0.034912109375, 0.07147216796875, 0.1080322265625, 0.14459228515625, 0.18115234375, 0.21771240234375, 0.2542724609375, 0.29083251953125, 0.327392578125, 0.36395263671875, 0.4005126953125, 0.43707275390625, 0.4736328125, 0.51019287109375, 0.5467529296875, 0.58331298828125, 0.619873046875, 0.65643310546875, 0.6929931640625, 0.72955322265625, 0.76611328125, 0.80267333984375, 0.8392333984375, 0.87579345703125, 0.912353515625, 0.94891357421875, 0.9854736328125, 1.02203369140625, 1.05859375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 2.0, 2.0, 3.0, 2.0, 4.0, 11.0, 9.0, 14.0, 15.0, 38.0, 71.0, 161.0, 265.0, 201.0, 76.0, 40.0, 8.0, 13.0, 11.0, 13.0, 9.0, 14.0, 8.0, 5.0, 0.0, 4.0, 3.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09912109375, -0.09635162353515625, -0.0935821533203125, -0.09081268310546875, -0.088043212890625, -0.08527374267578125, -0.0825042724609375, -0.07973480224609375, -0.07696533203125, -0.07419586181640625, -0.0714263916015625, -0.06865692138671875, -0.065887451171875, -0.06311798095703125, -0.0603485107421875, -0.05757904052734375, -0.0548095703125, -0.05204010009765625, -0.0492706298828125, -0.04650115966796875, -0.043731689453125, -0.04096221923828125, -0.0381927490234375, -0.03542327880859375, -0.03265380859375, -0.02988433837890625, -0.0271148681640625, -0.02434539794921875, -0.021575927734375, -0.01880645751953125, -0.0160369873046875, -0.01326751708984375, -0.010498046875, -0.00772857666015625, -0.0049591064453125, -0.00218963623046875, 0.000579833984375, 0.00334930419921875, 0.0061187744140625, 0.00888824462890625, 0.01165771484375, 0.01442718505859375, 0.0171966552734375, 0.01996612548828125, 0.022735595703125, 0.02550506591796875, 0.0282745361328125, 0.03104400634765625, 0.0338134765625, 0.03658294677734375, 0.0393524169921875, 0.04212188720703125, 0.044891357421875, 0.04766082763671875, 0.0504302978515625, 0.05319976806640625, 0.05596923828125, 0.05873870849609375, 0.0615081787109375, 0.06427764892578125, 0.067047119140625, 0.06981658935546875, 0.0725860595703125, 0.07535552978515625, 0.078125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 3.0, 10.0, 7.0, 16.0, 25.0, 30.0, 47.0, 50.0, 94.0, 122.0, 196.0, 258.0, 439.0, 773.0, 1405.0, 2666.0, 5872.0, 15188.0, 51371.0, 431457.0, 3457657.0, 173807.0, 32579.0, 10825.0, 4407.0, 2067.0, 1127.0, 583.0, 407.0, 239.0, 176.0, 127.0, 65.0, 49.0, 37.0, 22.0, 16.0, 17.0, 15.0, 6.0, 12.0, 7.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.70654296875, -0.6859664916992188, -0.6653900146484375, -0.6448135375976562, -0.624237060546875, -0.6036605834960938, -0.5830841064453125, -0.5625076293945312, -0.54193115234375, -0.5213546752929688, -0.5007781982421875, -0.48020172119140625, -0.459625244140625, -0.43904876708984375, -0.4184722900390625, -0.39789581298828125, -0.3773193359375, -0.35674285888671875, -0.3361663818359375, -0.31558990478515625, -0.295013427734375, -0.27443695068359375, -0.2538604736328125, -0.23328399658203125, -0.21270751953125, -0.19213104248046875, -0.1715545654296875, -0.15097808837890625, -0.130401611328125, -0.10982513427734375, -0.0892486572265625, -0.06867218017578125, -0.048095703125, -0.02751922607421875, -0.0069427490234375, 0.01363372802734375, 0.034210205078125, 0.05478668212890625, 0.0753631591796875, 0.09593963623046875, 0.11651611328125, 0.13709259033203125, 0.1576690673828125, 0.17824554443359375, 0.198822021484375, 0.21939849853515625, 0.2399749755859375, 0.26055145263671875, 0.2811279296875, 0.30170440673828125, 0.3222808837890625, 0.34285736083984375, 0.363433837890625, 0.38401031494140625, 0.4045867919921875, 0.42516326904296875, 0.44573974609375, 0.46631622314453125, 0.4868927001953125, 0.5074691772460938, 0.528045654296875, 0.5486221313476562, 0.5691986083984375, 0.5897750854492188, 0.6103515625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 8.0, 9.0, 11.0, 17.0, 19.0, 26.0, 38.0, 76.0, 133.0, 383.0, 1554.0, 1252.0, 289.0, 98.0, 56.0, 39.0, 18.0, 15.0, 12.0, 6.0, 4.0, 1.0, 4.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1258544921875, -0.12134742736816406, -0.11684036254882812, -0.11233329772949219, -0.10782623291015625, -0.10331916809082031, -0.09881210327148438, -0.09430503845214844, -0.0897979736328125, -0.08529090881347656, -0.08078384399414062, -0.07627677917480469, -0.07176971435546875, -0.06726264953613281, -0.06275558471679688, -0.05824851989746094, -0.053741455078125, -0.04923439025878906, -0.044727325439453125, -0.04022026062011719, -0.03571319580078125, -0.031206130981445312, -0.026699066162109375, -0.022192001342773438, -0.0176849365234375, -0.013177871704101562, -0.008670806884765625, -0.0041637420654296875, 0.00034332275390625, 0.0048503875732421875, 0.009357452392578125, 0.013864517211914062, 0.01837158203125, 0.022878646850585938, 0.027385711669921875, 0.03189277648925781, 0.03639984130859375, 0.04090690612792969, 0.045413970947265625, 0.04992103576660156, 0.0544281005859375, 0.05893516540527344, 0.06344223022460938, 0.06794929504394531, 0.07245635986328125, 0.07696342468261719, 0.08147048950195312, 0.08597755432128906, 0.090484619140625, 0.09499168395996094, 0.09949874877929688, 0.10400581359863281, 0.10851287841796875, 0.11301994323730469, 0.11752700805664062, 0.12203407287597656, 0.1265411376953125, 0.13104820251464844, 0.13555526733398438, 0.1400623321533203, 0.14456939697265625, 0.1490764617919922, 0.15358352661132812, 0.15809059143066406, 0.16259765625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 13.0, 25.0, 75.0, 182.0, 413.0, 187.0, 60.0, 25.0, 11.0, 8.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9056450724601746, -0.863746166229248, -0.8218472599983215, -0.779948353767395, -0.7380494475364685, -0.696150541305542, -0.6542516350746155, -0.612352728843689, -0.5704538226127625, -0.5285549163818359, -0.4866560101509094, -0.4447571039199829, -0.4028581976890564, -0.3609592914581299, -0.31906038522720337, -0.27716147899627686, -0.23526257276535034, -0.19336366653442383, -0.15146476030349731, -0.1095658540725708, -0.06766694784164429, -0.025768041610717773, 0.01613086462020874, 0.058029770851135254, 0.09992867708206177, 0.14182758331298828, 0.1837264895439148, 0.2256253957748413, 0.2675243020057678, 0.30942320823669434, 0.35132211446762085, 0.39322102069854736, 0.4351198673248291, 0.4770187735557556, 0.5189176797866821, 0.5608165860176086, 0.6027154922485352, 0.6446143984794617, 0.6865133047103882, 0.7284122109413147, 0.7703111171722412, 0.8122100234031677, 0.8541089296340942, 0.8960078358650208, 0.9379067420959473, 0.9798056483268738, 1.0217045545578003, 1.063603401184082, 1.1055023670196533, 1.1474013328552246, 1.1893001794815063, 1.231199026107788, 1.2730979919433594, 1.3149969577789307, 1.3568958044052124, 1.3987946510314941, 1.4406936168670654, 1.4825925827026367, 1.5244914293289185, 1.5663902759552002, 1.6082892417907715, 1.6501882076263428, 1.6920870542526245, 1.7339859008789062, 1.7758848667144775]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 7.0, 3.0, 4.0, 5.0, 5.0, 8.0, 9.0, 15.0, 19.0, 60.0, 61.0, 97.0, 132.0, 158.0, 129.0, 117.0, 76.0, 41.0, 22.0, 17.0, 11.0, 5.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7039206027984619, -0.6778228878974915, -0.651725172996521, -0.6256273984909058, -0.5995296835899353, -0.5734319686889648, -0.5473342537879944, -0.5212365388870239, -0.49513882398605347, -0.469041109085083, -0.44294336438179016, -0.4168456494808197, -0.39074793457984924, -0.3646501898765564, -0.33855247497558594, -0.3124547600746155, -0.28635701537132263, -0.2602593004703522, -0.23416157066822052, -0.20806384086608887, -0.1819661259651184, -0.15586839616298676, -0.1297706663608551, -0.10367295145988464, -0.07757522165775299, -0.051477499306201935, -0.02537977322936058, 0.0007179528474807739, 0.02681567519903183, 0.052913397550582886, 0.07901112735271454, 0.105108842253685, 0.13120657205581665, 0.1573043018579483, 0.18340201675891876, 0.20949974656105042, 0.23559746146202087, 0.2616952061653137, 0.2877929210662842, 0.31389063596725464, 0.3399883508682251, 0.36608606576919556, 0.3921838104724884, 0.41828152537345886, 0.4443792402744293, 0.47047698497772217, 0.4965746998786926, 0.5226724147796631, 0.5487701892852783, 0.5748679041862488, 0.6009656190872192, 0.6270633935928345, 0.6531611084938049, 0.6792588233947754, 0.7053565382957458, 0.7314542531967163, 0.7575519680976868, 0.7836496829986572, 0.8097473978996277, 0.8358451128005981, 0.8619428873062134, 0.8880406022071838, 0.9141383171081543, 0.9402360320091248, 0.9663337469100952]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 5.0, 5.0, 3.0, 11.0, 6.0, 12.0, 9.0, 15.0, 17.0, 29.0, 41.0, 41.0, 61.0, 141.0, 328.0, 1015.0, 3292.0, 13277.0, 106301.0, 855139.0, 55545.0, 9392.0, 2502.0, 772.0, 245.0, 118.0, 43.0, 40.0, 31.0, 22.0, 15.0, 13.0, 17.0, 10.0, 5.0, 10.0, 3.0, 6.0, 9.0, 3.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.7685546875, -0.7440643310546875, -0.719573974609375, -0.6950836181640625, -0.67059326171875, -0.6461029052734375, -0.621612548828125, -0.5971221923828125, -0.5726318359375, -0.5481414794921875, -0.523651123046875, -0.4991607666015625, -0.47467041015625, -0.4501800537109375, -0.425689697265625, -0.4011993408203125, -0.376708984375, -0.3522186279296875, -0.327728271484375, -0.3032379150390625, -0.27874755859375, -0.2542572021484375, -0.229766845703125, -0.2052764892578125, -0.1807861328125, -0.1562957763671875, -0.131805419921875, -0.1073150634765625, -0.08282470703125, -0.0583343505859375, -0.033843994140625, -0.0093536376953125, 0.01513671875, 0.0396270751953125, 0.064117431640625, 0.0886077880859375, 0.11309814453125, 0.1375885009765625, 0.162078857421875, 0.1865692138671875, 0.2110595703125, 0.2355499267578125, 0.260040283203125, 0.2845306396484375, 0.30902099609375, 0.3335113525390625, 0.358001708984375, 0.3824920654296875, 0.406982421875, 0.4314727783203125, 0.455963134765625, 0.4804534912109375, 0.50494384765625, 0.5294342041015625, 0.553924560546875, 0.5784149169921875, 0.6029052734375, 0.6273956298828125, 0.651885986328125, 0.6763763427734375, 0.70086669921875, 0.7253570556640625, 0.749847412109375, 0.7743377685546875, 0.798828125]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 3.0, 8.0, 12.0, 9.0, 15.0, 25.0, 64.0, 109.0, 208.0, 217.0, 170.0, 72.0, 28.0, 14.0, 12.0, 13.0, 7.0, 6.0, 9.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.12939453125, -0.1267085075378418, -0.1240224838256836, -0.12133646011352539, -0.11865043640136719, -0.11596441268920898, -0.11327838897705078, -0.11059236526489258, -0.10790634155273438, -0.10522031784057617, -0.10253429412841797, -0.09984827041625977, -0.09716224670410156, -0.09447622299194336, -0.09179019927978516, -0.08910417556762695, -0.08641815185546875, -0.08373212814331055, -0.08104610443115234, -0.07836008071899414, -0.07567405700683594, -0.07298803329467773, -0.07030200958251953, -0.06761598587036133, -0.06492996215820312, -0.06224393844604492, -0.05955791473388672, -0.056871891021728516, -0.05418586730957031, -0.05149984359741211, -0.048813819885253906, -0.0461277961730957, -0.0434417724609375, -0.0407557487487793, -0.038069725036621094, -0.03538370132446289, -0.03269767761230469, -0.030011653900146484, -0.02732563018798828, -0.024639606475830078, -0.021953582763671875, -0.019267559051513672, -0.01658153533935547, -0.013895511627197266, -0.011209487915039062, -0.00852346420288086, -0.005837440490722656, -0.003151416778564453, -0.00046539306640625, 0.002220630645751953, 0.004906654357910156, 0.007592678070068359, 0.010278701782226562, 0.012964725494384766, 0.01565074920654297, 0.018336772918701172, 0.021022796630859375, 0.023708820343017578, 0.02639484405517578, 0.029080867767333984, 0.03176689147949219, 0.03445291519165039, 0.037138938903808594, 0.0398249626159668, 0.042510986328125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 6.0, 11.0, 30.0, 302.0, 5241.0, 162276.0, 838488.0, 40226.0, 1793.0, 124.0, 23.0, 11.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.1064453125, -1.0751113891601562, -1.0437774658203125, -1.0124435424804688, -0.981109619140625, -0.9497756958007812, -0.9184417724609375, -0.8871078491210938, -0.85577392578125, -0.8244400024414062, -0.7931060791015625, -0.7617721557617188, -0.730438232421875, -0.6991043090820312, -0.6677703857421875, -0.6364364624023438, -0.6051025390625, -0.5737686157226562, -0.5424346923828125, -0.5111007690429688, -0.479766845703125, -0.44843292236328125, -0.4170989990234375, -0.38576507568359375, -0.35443115234375, -0.32309722900390625, -0.2917633056640625, -0.26042938232421875, -0.229095458984375, -0.19776153564453125, -0.1664276123046875, -0.13509368896484375, -0.103759765625, -0.07242584228515625, -0.0410919189453125, -0.00975799560546875, 0.021575927734375, 0.05290985107421875, 0.0842437744140625, 0.11557769775390625, 0.14691162109375, 0.17824554443359375, 0.2095794677734375, 0.24091339111328125, 0.272247314453125, 0.30358123779296875, 0.3349151611328125, 0.36624908447265625, 0.3975830078125, 0.42891693115234375, 0.4602508544921875, 0.49158477783203125, 0.522918701171875, 0.5542526245117188, 0.5855865478515625, 0.6169204711914062, 0.64825439453125, 0.6795883178710938, 0.7109222412109375, 0.7422561645507812, 0.773590087890625, 0.8049240112304688, 0.8362579345703125, 0.8675918579101562, 0.89892578125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 4.0, 10.0, 3.0, 5.0, 11.0, 10.0, 10.0, 17.0, 14.0, 15.0, 21.0, 23.0, 20.0, 37.0, 26.0, 43.0, 37.0, 28.0, 32.0, 25.0, 40.0, 41.0, 23.0, 31.0, 49.0, 38.0, 42.0, 34.0, 34.0, 30.0, 26.0, 23.0, 24.0, 29.0, 22.0, 19.0, 11.0, 18.0, 13.0, 13.0, 11.0, 5.0, 9.0, 8.0, 4.0, 6.0, 1.0, 2.0, 5.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.1458740234375, -0.14107131958007812, -0.13626861572265625, -0.13146591186523438, -0.1266632080078125, -0.12186050415039062, -0.11705780029296875, -0.11225509643554688, -0.107452392578125, -0.10264968872070312, -0.09784698486328125, -0.09304428100585938, -0.0882415771484375, -0.08343887329101562, -0.07863616943359375, -0.07383346557617188, -0.06903076171875, -0.06422805786132812, -0.05942535400390625, -0.054622650146484375, -0.0498199462890625, -0.045017242431640625, -0.04021453857421875, -0.035411834716796875, -0.030609130859375, -0.025806427001953125, -0.02100372314453125, -0.016201019287109375, -0.0113983154296875, -0.006595611572265625, -0.00179290771484375, 0.003009796142578125, 0.0078125, 0.012615203857421875, 0.01741790771484375, 0.022220611572265625, 0.0270233154296875, 0.031826019287109375, 0.03662872314453125, 0.041431427001953125, 0.046234130859375, 0.051036834716796875, 0.05583953857421875, 0.060642242431640625, 0.0654449462890625, 0.07024765014648438, 0.07505035400390625, 0.07985305786132812, 0.08465576171875, 0.08945846557617188, 0.09426116943359375, 0.09906387329101562, 0.1038665771484375, 0.10866928100585938, 0.11347198486328125, 0.11827468872070312, 0.123077392578125, 0.12788009643554688, 0.13268280029296875, 0.13748550415039062, 0.1422882080078125, 0.14709091186523438, 0.15189361572265625, 0.15669631958007812, 0.1614990234375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 2.0, 5.0, 6.0, 25.0, 77.0, 374.0, 6651.0, 1039295.0, 1811.0, 203.0, 58.0, 17.0, 10.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.14453125, -4.016357421875, -3.88818359375, -3.760009765625, -3.6318359375, -3.503662109375, -3.37548828125, -3.247314453125, -3.119140625, -2.990966796875, -2.86279296875, -2.734619140625, -2.6064453125, -2.478271484375, -2.35009765625, -2.221923828125, -2.09375, -1.965576171875, -1.83740234375, -1.709228515625, -1.5810546875, -1.452880859375, -1.32470703125, -1.196533203125, -1.068359375, -0.940185546875, -0.81201171875, -0.683837890625, -0.5556640625, -0.427490234375, -0.29931640625, -0.171142578125, -0.04296875, 0.085205078125, 0.21337890625, 0.341552734375, 0.4697265625, 0.597900390625, 0.72607421875, 0.854248046875, 0.982421875, 1.110595703125, 1.23876953125, 1.366943359375, 1.4951171875, 1.623291015625, 1.75146484375, 1.879638671875, 2.0078125, 2.135986328125, 2.26416015625, 2.392333984375, 2.5205078125, 2.648681640625, 2.77685546875, 2.905029296875, 3.033203125, 3.161376953125, 3.28955078125, 3.417724609375, 3.5458984375, 3.674072265625, 3.80224609375, 3.930419921875, 4.05859375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 5.0, 1.0, 2.0, 3.0, 7.0, 7.0, 7.0, 11.0, 17.0, 14.0, 27.0, 57.0, 64.0, 111.0, 151.0, 146.0, 120.0, 118.0, 47.0, 28.0, 21.0, 11.0, 7.0, 5.0, 6.0, 2.0, 3.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.08427619934082e-05, -4.916638135910034e-05, -4.749000072479248e-05, -4.581362009048462e-05, -4.413723945617676e-05, -4.2460858821868896e-05, -4.0784478187561035e-05, -3.9108097553253174e-05, -3.743171691894531e-05, -3.575533628463745e-05, -3.407895565032959e-05, -3.240257501602173e-05, -3.072619438171387e-05, -2.9049813747406006e-05, -2.7373433113098145e-05, -2.5697052478790283e-05, -2.4020671844482422e-05, -2.234429121017456e-05, -2.06679105758667e-05, -1.8991529941558838e-05, -1.7315149307250977e-05, -1.5638768672943115e-05, -1.3962388038635254e-05, -1.2286007404327393e-05, -1.0609626770019531e-05, -8.93324613571167e-06, -7.256865501403809e-06, -5.580484867095947e-06, -3.904104232788086e-06, -2.2277235984802246e-06, -5.513429641723633e-07, 1.125037670135498e-06, 2.8014183044433594e-06, 4.477798938751221e-06, 6.154179573059082e-06, 7.830560207366943e-06, 9.506940841674805e-06, 1.1183321475982666e-05, 1.2859702110290527e-05, 1.4536082744598389e-05, 1.621246337890625e-05, 1.788884401321411e-05, 1.9565224647521973e-05, 2.1241605281829834e-05, 2.2917985916137695e-05, 2.4594366550445557e-05, 2.6270747184753418e-05, 2.794712781906128e-05, 2.962350845336914e-05, 3.1299889087677e-05, 3.297626972198486e-05, 3.4652650356292725e-05, 3.6329030990600586e-05, 3.800541162490845e-05, 3.968179225921631e-05, 4.135817289352417e-05, 4.303455352783203e-05, 4.471093416213989e-05, 4.6387314796447754e-05, 4.8063695430755615e-05, 4.9740076065063477e-05, 5.141645669937134e-05, 5.30928373336792e-05, 5.476921796798706e-05, 5.644559860229492e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 8.0, 9.0, 5.0, 10.0, 12.0, 35.0, 32.0, 45.0, 55.0, 91.0, 193.0, 519.0, 1555.0, 6451.0, 140829.0, 866526.0, 27196.0, 3392.0, 971.0, 310.0, 134.0, 60.0, 40.0, 28.0, 17.0, 20.0, 9.0, 5.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.02734375, -1.0030517578125, -0.978759765625, -0.9544677734375, -0.93017578125, -0.9058837890625, -0.881591796875, -0.8572998046875, -0.8330078125, -0.8087158203125, -0.784423828125, -0.7601318359375, -0.73583984375, -0.7115478515625, -0.687255859375, -0.6629638671875, -0.638671875, -0.6143798828125, -0.590087890625, -0.5657958984375, -0.54150390625, -0.5172119140625, -0.492919921875, -0.4686279296875, -0.4443359375, -0.4200439453125, -0.395751953125, -0.3714599609375, -0.34716796875, -0.3228759765625, -0.298583984375, -0.2742919921875, -0.25, -0.2257080078125, -0.201416015625, -0.1771240234375, -0.15283203125, -0.1285400390625, -0.104248046875, -0.0799560546875, -0.0556640625, -0.0313720703125, -0.007080078125, 0.0172119140625, 0.04150390625, 0.0657958984375, 0.090087890625, 0.1143798828125, 0.138671875, 0.1629638671875, 0.187255859375, 0.2115478515625, 0.23583984375, 0.2601318359375, 0.284423828125, 0.3087158203125, 0.3330078125, 0.3572998046875, 0.381591796875, 0.4058837890625, 0.43017578125, 0.4544677734375, 0.478759765625, 0.5030517578125, 0.52734375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 0.0, 4.0, 3.0, 6.0, 14.0, 40.0, 78.0, 140.0, 206.0, 210.0, 157.0, 68.0, 45.0, 13.0, 6.0, 3.0, 1.0, 6.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.646484375, -0.6321449279785156, -0.6178054809570312, -0.6034660339355469, -0.5891265869140625, -0.5747871398925781, -0.5604476928710938, -0.5461082458496094, -0.531768798828125, -0.5174293518066406, -0.5030899047851562, -0.4887504577636719, -0.4744110107421875, -0.4600715637207031, -0.44573211669921875, -0.4313926696777344, -0.41705322265625, -0.4027137756347656, -0.38837432861328125, -0.3740348815917969, -0.3596954345703125, -0.3453559875488281, -0.33101654052734375, -0.3166770935058594, -0.302337646484375, -0.2879981994628906, -0.27365875244140625, -0.2593193054199219, -0.2449798583984375, -0.23064041137695312, -0.21630096435546875, -0.20196151733398438, -0.1876220703125, -0.17328262329101562, -0.15894317626953125, -0.14460372924804688, -0.1302642822265625, -0.11592483520507812, -0.10158538818359375, -0.08724594116210938, -0.072906494140625, -0.058567047119140625, -0.04422760009765625, -0.029888153076171875, -0.0155487060546875, -0.001209259033203125, 0.01313018798828125, 0.027469635009765625, 0.04180908203125, 0.056148529052734375, 0.07048797607421875, 0.08482742309570312, 0.0991668701171875, 0.11350631713867188, 0.12784576416015625, 0.14218521118164062, 0.156524658203125, 0.17086410522460938, 0.18520355224609375, 0.19954299926757812, 0.2138824462890625, 0.22822189331054688, 0.24256134033203125, 0.2569007873535156, 0.271240234375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 1.0, 3.0, 7.0, 11.0, 24.0, 36.0, 56.0, 120.0, 202.0, 239.0, 129.0, 82.0, 45.0, 18.0, 18.0, 2.0, 5.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0226855278015137, -2.9417564868927, -2.8608274459838867, -2.7798984050750732, -2.6989693641662598, -2.6180405616760254, -2.537111520767212, -2.4561824798583984, -2.375253438949585, -2.2943243980407715, -2.213395357131958, -2.1324663162231445, -2.05153751373291, -1.9706083536148071, -1.8896794319152832, -1.8087503910064697, -1.7278213500976562, -1.6468923091888428, -1.5659632682800293, -1.4850343465805054, -1.404105305671692, -1.3231762647628784, -1.2422473430633545, -1.161318302154541, -1.0803892612457275, -0.9994602203369141, -0.9185312390327454, -0.8376022577285767, -0.7566732168197632, -0.6757441759109497, -0.594815194606781, -0.5138862133026123, -0.43295741081237793, -0.35202839970588684, -0.27109938859939575, -0.19017037749290466, -0.10924136638641357, -0.028312355279922485, 0.052616655826568604, 0.1335456371307373, 0.21447467803955078, 0.29540368914604187, 0.37633270025253296, 0.45726171135902405, 0.5381907224655151, 0.6191197633743286, 0.7000487446784973, 0.780977725982666, 0.8619067668914795, 0.942835807800293, 1.0237648487091064, 1.1046937704086304, 1.1856228113174438, 1.2665518522262573, 1.3474807739257812, 1.4284098148345947, 1.5093388557434082, 1.5902678966522217, 1.6711969375610352, 1.752125859260559, 1.8330549001693726, 1.913983941078186, 1.99491286277771, 2.0758419036865234, 2.156770944595337]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 3.0, 6.0, 3.0, 7.0, 10.0, 10.0, 17.0, 23.0, 26.0, 36.0, 40.0, 56.0, 73.0, 73.0, 72.0, 95.0, 75.0, 99.0, 77.0, 48.0, 29.0, 23.0, 19.0, 18.0, 17.0, 13.0, 10.0, 4.0, 4.0, 6.0, 4.0, 2.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8004040718078613, -1.7375088930130005, -1.6746137142181396, -1.6117184162139893, -1.5488232374191284, -1.4859280586242676, -1.4230327606201172, -1.3601375818252563, -1.2972424030303955, -1.2343472242355347, -1.1714520454406738, -1.1085567474365234, -1.0456615686416626, -0.9827663898468018, -0.9198711514472961, -0.8569759130477905, -0.7940807342529297, -0.7311855554580688, -0.6682903170585632, -0.6053950786590576, -0.5424998998641968, -0.47960469126701355, -0.4167094826698303, -0.3538142740726471, -0.29091906547546387, -0.22802385687828064, -0.1651286482810974, -0.10223343968391418, -0.03933823108673096, 0.02355697751045227, 0.0864521861076355, 0.14934739470481873, 0.21224236488342285, 0.2751375734806061, 0.3380327820777893, 0.40092799067497253, 0.46382319927215576, 0.5267183780670166, 0.5896136164665222, 0.6525088548660278, 0.7154040336608887, 0.7782992124557495, 0.8411944508552551, 0.9040896892547607, 0.9669848680496216, 1.0298800468444824, 1.0927753448486328, 1.1556705236434937, 1.2185657024383545, 1.2814608812332153, 1.3443560600280762, 1.4072513580322266, 1.4701465368270874, 1.5330417156219482, 1.5959370136260986, 1.6588321924209595, 1.7217273712158203, 1.7846225500106812, 1.847517728805542, 1.9104130268096924, 1.9733082056045532, 2.036203384399414, 2.0990986824035645, 2.1619937419891357, 2.224889039993286]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 9.0, 4.0, 5.0, 8.0, 19.0, 18.0, 19.0, 32.0, 62.0, 70.0, 95.0, 140.0, 167.0, 301.0, 339.0, 524.0, 819.0, 1352.0, 2369.0, 4819.0, 11131.0, 37935.0, 494380.0, 3547679.0, 63188.0, 15351.0, 6145.0, 2984.0, 1532.0, 883.0, 580.0, 393.0, 275.0, 181.0, 118.0, 108.0, 68.0, 49.0, 35.0, 27.0, 23.0, 21.0, 13.0, 3.0, 3.0, 2.0, 5.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.86669921875, -0.8397445678710938, -0.8127899169921875, -0.7858352661132812, -0.758880615234375, -0.7319259643554688, -0.7049713134765625, -0.6780166625976562, -0.65106201171875, -0.6241073608398438, -0.5971527099609375, -0.5701980590820312, -0.543243408203125, -0.5162887573242188, -0.4893341064453125, -0.46237945556640625, -0.4354248046875, -0.40847015380859375, -0.3815155029296875, -0.35456085205078125, -0.327606201171875, -0.30065155029296875, -0.2736968994140625, -0.24674224853515625, -0.21978759765625, -0.19283294677734375, -0.1658782958984375, -0.13892364501953125, -0.111968994140625, -0.08501434326171875, -0.0580596923828125, -0.03110504150390625, -0.004150390625, 0.02280426025390625, 0.0497589111328125, 0.07671356201171875, 0.103668212890625, 0.13062286376953125, 0.1575775146484375, 0.18453216552734375, 0.21148681640625, 0.23844146728515625, 0.2653961181640625, 0.29235076904296875, 0.319305419921875, 0.34626007080078125, 0.3732147216796875, 0.40016937255859375, 0.4271240234375, 0.45407867431640625, 0.4810333251953125, 0.5079879760742188, 0.534942626953125, 0.5618972778320312, 0.5888519287109375, 0.6158065795898438, 0.64276123046875, 0.6697158813476562, 0.6966705322265625, 0.7236251831054688, 0.750579833984375, 0.7775344848632812, 0.8044891357421875, 0.8314437866210938, 0.8583984375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 5.0, 4.0, 1.0, 3.0, 4.0, 4.0, 3.0, 5.0, 5.0, 6.0, 12.0, 12.0, 17.0, 22.0, 24.0, 40.0, 50.0, 57.0, 66.0, 79.0, 76.0, 94.0, 74.0, 69.0, 55.0, 36.0, 43.0, 30.0, 24.0, 22.0, 12.0, 10.0, 6.0, 6.0, 4.0, 3.0, 6.0, 1.0, 2.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.034820556640625, -0.033695220947265625, -0.03256988525390625, -0.031444549560546875, -0.0303192138671875, -0.029193878173828125, -0.02806854248046875, -0.026943206787109375, -0.02581787109375, -0.024692535400390625, -0.02356719970703125, -0.022441864013671875, -0.0213165283203125, -0.020191192626953125, -0.01906585693359375, -0.017940521240234375, -0.016815185546875, -0.015689849853515625, -0.01456451416015625, -0.013439178466796875, -0.0123138427734375, -0.011188507080078125, -0.01006317138671875, -0.008937835693359375, -0.0078125, -0.006687164306640625, -0.00556182861328125, -0.004436492919921875, -0.0033111572265625, -0.002185821533203125, -0.00106048583984375, 6.4849853515625e-05, 0.001190185546875, 0.002315521240234375, 0.00344085693359375, 0.004566192626953125, 0.0056915283203125, 0.006816864013671875, 0.00794219970703125, 0.009067535400390625, 0.01019287109375, 0.011318206787109375, 0.01244354248046875, 0.013568878173828125, 0.0146942138671875, 0.015819549560546875, 0.01694488525390625, 0.018070220947265625, 0.019195556640625, 0.020320892333984375, 0.02144622802734375, 0.022571563720703125, 0.0236968994140625, 0.024822235107421875, 0.02594757080078125, 0.027072906494140625, 0.0281982421875, 0.029323577880859375, 0.03044891357421875, 0.031574249267578125, 0.0326995849609375, 0.033824920654296875, 0.03495025634765625, 0.036075592041015625, 0.037200927734375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 8.0, 3.0, 4.0, 7.0, 7.0, 5.0, 13.0, 12.0, 17.0, 27.0, 44.0, 44.0, 79.0, 171.0, 717.0, 8899.0, 3118398.0, 1058296.0, 6508.0, 576.0, 156.0, 61.0, 60.0, 33.0, 25.0, 19.0, 11.0, 18.0, 9.0, 13.0, 6.0, 6.0, 6.0, 6.0, 4.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.28515625, -2.217864990234375, -2.15057373046875, -2.083282470703125, -2.0159912109375, -1.948699951171875, -1.88140869140625, -1.814117431640625, -1.746826171875, -1.679534912109375, -1.61224365234375, -1.544952392578125, -1.4776611328125, -1.410369873046875, -1.34307861328125, -1.275787353515625, -1.20849609375, -1.141204833984375, -1.07391357421875, -1.006622314453125, -0.9393310546875, -0.872039794921875, -0.80474853515625, -0.737457275390625, -0.670166015625, -0.602874755859375, -0.53558349609375, -0.468292236328125, -0.4010009765625, -0.333709716796875, -0.26641845703125, -0.199127197265625, -0.1318359375, -0.064544677734375, 0.00274658203125, 0.070037841796875, 0.1373291015625, 0.204620361328125, 0.27191162109375, 0.339202880859375, 0.406494140625, 0.473785400390625, 0.54107666015625, 0.608367919921875, 0.6756591796875, 0.742950439453125, 0.81024169921875, 0.877532958984375, 0.94482421875, 1.012115478515625, 1.07940673828125, 1.146697998046875, 1.2139892578125, 1.281280517578125, 1.34857177734375, 1.415863037109375, 1.483154296875, 1.550445556640625, 1.61773681640625, 1.685028076171875, 1.7523193359375, 1.819610595703125, 1.88690185546875, 1.954193115234375, 2.021484375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 1.0, 4.0, 6.0, 8.0, 3.0, 8.0, 5.0, 7.0, 4.0, 15.0, 19.0, 14.0, 20.0, 32.0, 40.0, 44.0, 57.0, 98.0, 188.0, 383.0, 939.0, 1094.0, 439.0, 227.0, 127.0, 80.0, 53.0, 33.0, 31.0, 19.0, 20.0, 9.0, 6.0, 7.0, 7.0, 1.0, 5.0, 5.0, 4.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0787353515625, -0.07642364501953125, -0.0741119384765625, -0.07180023193359375, -0.069488525390625, -0.06717681884765625, -0.0648651123046875, -0.06255340576171875, -0.06024169921875, -0.05792999267578125, -0.0556182861328125, -0.05330657958984375, -0.050994873046875, -0.04868316650390625, -0.0463714599609375, -0.04405975341796875, -0.041748046875, -0.03943634033203125, -0.0371246337890625, -0.03481292724609375, -0.032501220703125, -0.03018951416015625, -0.0278778076171875, -0.02556610107421875, -0.02325439453125, -0.02094268798828125, -0.0186309814453125, -0.01631927490234375, -0.014007568359375, -0.01169586181640625, -0.0093841552734375, -0.00707244873046875, -0.0047607421875, -0.00244903564453125, -0.0001373291015625, 0.00217437744140625, 0.004486083984375, 0.00679779052734375, 0.0091094970703125, 0.01142120361328125, 0.01373291015625, 0.01604461669921875, 0.0183563232421875, 0.02066802978515625, 0.022979736328125, 0.02529144287109375, 0.0276031494140625, 0.02991485595703125, 0.0322265625, 0.03453826904296875, 0.0368499755859375, 0.03916168212890625, 0.041473388671875, 0.04378509521484375, 0.0460968017578125, 0.04840850830078125, 0.05072021484375, 0.05303192138671875, 0.0553436279296875, 0.05765533447265625, 0.059967041015625, 0.06227874755859375, 0.0645904541015625, 0.06690216064453125, 0.0692138671875]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 4.0, 6.0, 54.0, 347.0, 513.0, 75.0, 12.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.071073532104492, -4.980628967285156, -4.89018440246582, -4.799739837646484, -4.709295272827148, -4.6188507080078125, -4.528406143188477, -4.437961578369141, -4.3475165367126465, -4.2570719718933105, -4.166627407073975, -4.076182842254639, -3.9857380390167236, -3.8952934741973877, -3.8048489093780518, -3.714404344558716, -3.623960018157959, -3.533515453338623, -3.443070888519287, -3.352626323699951, -3.262181520462036, -3.1717369556427, -3.0812923908233643, -2.9908478260040283, -2.9004030227661133, -2.8099584579467773, -2.7195138931274414, -2.6290693283081055, -2.5386245250701904, -2.4481799602508545, -2.3577353954315186, -2.2672908306121826, -2.176846504211426, -2.08640193939209, -1.9959572553634644, -1.9055126905441284, -1.8150681257247925, -1.724623441696167, -1.634178876876831, -1.5437343120574951, -1.4532896280288696, -1.3628450632095337, -1.2724003791809082, -1.1819558143615723, -1.0915112495422363, -1.0010666847229004, -0.9106220006942749, -0.820177435874939, -0.7297328114509583, -0.6392881870269775, -0.5488436222076416, -0.4583989977836609, -0.36795440316200256, -0.27750980854034424, -0.18706518411636353, -0.09662061929702759, -0.006175994873046875, 0.08426860719919205, 0.17471320927143097, 0.2651578187942505, 0.3556024134159088, 0.44604700803756714, 0.5364916324615479, 0.6269361972808838, 0.7173808217048645]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 2.0, 11.0, 16.0, 22.0, 35.0, 49.0, 88.0, 129.0, 150.0, 130.0, 123.0, 109.0, 49.0, 34.0, 27.0, 15.0, 7.0, 6.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.3025095462799072, -1.275489330291748, -1.2484691143035889, -1.2214488983154297, -1.19442880153656, -1.1674085855484009, -1.1403883695602417, -1.1133681535720825, -1.0863479375839233, -1.0593277215957642, -1.032307505607605, -1.0052872896194458, -0.9782671332359314, -0.951246976852417, -0.9242267608642578, -0.8972065448760986, -0.8701863288879395, -0.8431661128997803, -0.8161459565162659, -0.7891257405281067, -0.7621055245399475, -0.7350853681564331, -0.7080651521682739, -0.6810449361801147, -0.6540247797966003, -0.6270045638084412, -0.5999844074249268, -0.5729641914367676, -0.5459439754486084, -0.5189237594604492, -0.4919036030769348, -0.46488338708877563, -0.43786317110061646, -0.41084298491477966, -0.3838227689266205, -0.3568025827407837, -0.3297823667526245, -0.3027621805667877, -0.2757419943809509, -0.24872177839279175, -0.22170157730579376, -0.19468137621879578, -0.1676611751317978, -0.1406409740447998, -0.11362078040838242, -0.08660058677196503, -0.05958038568496704, -0.032560184597969055, -0.005539983510971069, 0.021480215713381767, 0.048500414937734604, 0.07552061229944229, 0.10254081338644028, 0.12956100702285767, 0.15658120810985565, 0.18360140919685364, 0.21062161028385162, 0.2376418113708496, 0.2646619975566864, 0.2916822135448456, 0.3187023997306824, 0.34572261571884155, 0.37274280190467834, 0.39976298809051514, 0.4267832040786743]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 4.0, 2.0, 4.0, 4.0, 14.0, 8.0, 11.0, 15.0, 24.0, 24.0, 30.0, 35.0, 47.0, 51.0, 59.0, 79.0, 886.0, 1037506.0, 9322.0, 98.0, 63.0, 51.0, 43.0, 37.0, 30.0, 20.0, 22.0, 17.0, 13.0, 12.0, 10.0, 6.0, 6.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.748046875, -3.639923095703125, -3.53179931640625, -3.423675537109375, -3.3155517578125, -3.207427978515625, -3.09930419921875, -2.991180419921875, -2.883056640625, -2.774932861328125, -2.66680908203125, -2.558685302734375, -2.4505615234375, -2.342437744140625, -2.23431396484375, -2.126190185546875, -2.01806640625, -1.909942626953125, -1.80181884765625, -1.693695068359375, -1.5855712890625, -1.477447509765625, -1.36932373046875, -1.261199951171875, -1.153076171875, -1.044952392578125, -0.93682861328125, -0.828704833984375, -0.7205810546875, -0.612457275390625, -0.50433349609375, -0.396209716796875, -0.2880859375, -0.179962158203125, -0.07183837890625, 0.036285400390625, 0.1444091796875, 0.252532958984375, 0.36065673828125, 0.468780517578125, 0.576904296875, 0.685028076171875, 0.79315185546875, 0.901275634765625, 1.0093994140625, 1.117523193359375, 1.22564697265625, 1.333770751953125, 1.44189453125, 1.550018310546875, 1.65814208984375, 1.766265869140625, 1.8743896484375, 1.982513427734375, 2.09063720703125, 2.198760986328125, 2.306884765625, 2.415008544921875, 2.52313232421875, 2.631256103515625, 2.7393798828125, 2.847503662109375, 2.95562744140625, 3.063751220703125, 3.171875]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 24.0, 123.0, 340.0, 359.0, 133.0, 23.0, 8.0, 2.0, 3.0], "bins": [-0.33984375, -0.3339824676513672, -0.3281211853027344, -0.32225990295410156, -0.31639862060546875, -0.31053733825683594, -0.3046760559082031, -0.2988147735595703, -0.2929534912109375, -0.2870922088623047, -0.2812309265136719, -0.27536964416503906, -0.26950836181640625, -0.26364707946777344, -0.2577857971191406, -0.2519245147705078, -0.246063232421875, -0.2402019500732422, -0.23434066772460938, -0.22847938537597656, -0.22261810302734375, -0.21675682067871094, -0.21089553833007812, -0.2050342559814453, -0.1991729736328125, -0.1933116912841797, -0.18745040893554688, -0.18158912658691406, -0.17572784423828125, -0.16986656188964844, -0.16400527954101562, -0.1581439971923828, -0.15228271484375, -0.1464214324951172, -0.14056015014648438, -0.13469886779785156, -0.12883758544921875, -0.12297630310058594, -0.11711502075195312, -0.11125373840332031, -0.1053924560546875, -0.09953117370605469, -0.09366989135742188, -0.08780860900878906, -0.08194732666015625, -0.07608604431152344, -0.07022476196289062, -0.06436347961425781, -0.058502197265625, -0.05264091491699219, -0.046779632568359375, -0.04091835021972656, -0.03505706787109375, -0.029195785522460938, -0.023334503173828125, -0.017473220825195312, -0.0116119384765625, -0.0057506561279296875, 0.000110626220703125, 0.0059719085693359375, 0.01183319091796875, 0.017694473266601562, 0.023555755615234375, 0.029417037963867188, 0.0352783203125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 6.0, 2.0, 6.0, 8.0, 11.0, 13.0, 21.0, 22.0, 26.0, 39.0, 68.0, 128.0, 231.0, 435.0, 1011.0, 2544.0, 7786.0, 30936.0, 175558.0, 594974.0, 188241.0, 33422.0, 8176.0, 2683.0, 1088.0, 501.0, 242.0, 132.0, 90.0, 50.0, 31.0, 18.0, 15.0, 12.0, 11.0, 7.0, 6.0, 5.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.62841796875, -0.6078262329101562, -0.5872344970703125, -0.5666427612304688, -0.546051025390625, -0.5254592895507812, -0.5048675537109375, -0.48427581787109375, -0.46368408203125, -0.44309234619140625, -0.4225006103515625, -0.40190887451171875, -0.381317138671875, -0.36072540283203125, -0.3401336669921875, -0.31954193115234375, -0.2989501953125, -0.27835845947265625, -0.2577667236328125, -0.23717498779296875, -0.216583251953125, -0.19599151611328125, -0.1753997802734375, -0.15480804443359375, -0.13421630859375, -0.11362457275390625, -0.0930328369140625, -0.07244110107421875, -0.051849365234375, -0.03125762939453125, -0.0106658935546875, 0.00992584228515625, 0.030517578125, 0.05110931396484375, 0.0717010498046875, 0.09229278564453125, 0.112884521484375, 0.13347625732421875, 0.1540679931640625, 0.17465972900390625, 0.19525146484375, 0.21584320068359375, 0.2364349365234375, 0.25702667236328125, 0.277618408203125, 0.29821014404296875, 0.3188018798828125, 0.33939361572265625, 0.3599853515625, 0.38057708740234375, 0.4011688232421875, 0.42176055908203125, 0.442352294921875, 0.46294403076171875, 0.4835357666015625, 0.5041275024414062, 0.52471923828125, 0.5453109741210938, 0.5659027099609375, 0.5864944458007812, 0.607086181640625, 0.6276779174804688, 0.6482696533203125, 0.6688613891601562, 0.689453125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 2.0, 1.0, 2.0, 3.0, 6.0, 6.0, 14.0, 15.0, 12.0, 17.0, 32.0, 31.0, 38.0, 45.0, 44.0, 47.0, 61.0, 68.0, 72.0, 72.0, 64.0, 60.0, 49.0, 36.0, 40.0, 31.0, 24.0, 28.0, 20.0, 23.0, 10.0, 9.0, 6.0, 8.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.287841796875, -0.2778053283691406, -0.26776885986328125, -0.2577323913574219, -0.2476959228515625, -0.23765945434570312, -0.22762298583984375, -0.21758651733398438, -0.207550048828125, -0.19751358032226562, -0.18747711181640625, -0.17744064331054688, -0.1674041748046875, -0.15736770629882812, -0.14733123779296875, -0.13729476928710938, -0.12725830078125, -0.11722183227539062, -0.10718536376953125, -0.09714889526367188, -0.0871124267578125, -0.07707595825195312, -0.06703948974609375, -0.057003021240234375, -0.046966552734375, -0.036930084228515625, -0.02689361572265625, -0.016857147216796875, -0.0068206787109375, 0.003215789794921875, 0.01325225830078125, 0.023288726806640625, 0.0333251953125, 0.043361663818359375, 0.05339813232421875, 0.06343460083007812, 0.0734710693359375, 0.08350753784179688, 0.09354400634765625, 0.10358047485351562, 0.113616943359375, 0.12365341186523438, 0.13368988037109375, 0.14372634887695312, 0.1537628173828125, 0.16379928588867188, 0.17383575439453125, 0.18387222290039062, 0.19390869140625, 0.20394515991210938, 0.21398162841796875, 0.22401809692382812, 0.2340545654296875, 0.24409103393554688, 0.25412750244140625, 0.2641639709472656, 0.274200439453125, 0.2842369079589844, 0.29427337646484375, 0.3043098449707031, 0.3143463134765625, 0.3243827819824219, 0.33441925048828125, 0.3444557189941406, 0.3544921875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 2.0, 8.0, 8.0, 9.0, 6.0, 14.0, 20.0, 38.0, 52.0, 69.0, 106.0, 177.0, 299.0, 604.0, 1497.0, 4374.0, 19280.0, 200484.0, 748537.0, 58997.0, 9308.0, 2562.0, 1000.0, 457.0, 249.0, 141.0, 90.0, 59.0, 28.0, 27.0, 12.0, 13.0, 8.0, 4.0, 4.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.98779296875, -0.9597930908203125, -0.931793212890625, -0.9037933349609375, -0.87579345703125, -0.8477935791015625, -0.819793701171875, -0.7917938232421875, -0.7637939453125, -0.7357940673828125, -0.707794189453125, -0.6797943115234375, -0.65179443359375, -0.6237945556640625, -0.595794677734375, -0.5677947998046875, -0.539794921875, -0.5117950439453125, -0.483795166015625, -0.4557952880859375, -0.42779541015625, -0.3997955322265625, -0.371795654296875, -0.3437957763671875, -0.3157958984375, -0.2877960205078125, -0.259796142578125, -0.2317962646484375, -0.20379638671875, -0.1757965087890625, -0.147796630859375, -0.1197967529296875, -0.091796875, -0.0637969970703125, -0.035797119140625, -0.0077972412109375, 0.02020263671875, 0.0482025146484375, 0.076202392578125, 0.1042022705078125, 0.1322021484375, 0.1602020263671875, 0.188201904296875, 0.2162017822265625, 0.24420166015625, 0.2722015380859375, 0.300201416015625, 0.3282012939453125, 0.356201171875, 0.3842010498046875, 0.412200927734375, 0.4402008056640625, 0.46820068359375, 0.4962005615234375, 0.524200439453125, 0.5522003173828125, 0.5802001953125, 0.6082000732421875, 0.636199951171875, 0.6641998291015625, 0.69219970703125, 0.7201995849609375, 0.748199462890625, 0.7761993408203125, 0.80419921875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 7.0, 12.0, 20.0, 27.0, 59.0, 94.0, 172.0, 228.0, 170.0, 86.0, 52.0, 26.0, 11.0, 11.0, 7.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010102987289428711, -9.67392697930336e-05, -9.244866669178009e-05, -8.815806359052658e-05, -8.386746048927307e-05, -7.957685738801956e-05, -7.528625428676605e-05, -7.099565118551254e-05, -6.670504808425903e-05, -6.241444498300552e-05, -5.8123841881752014e-05, -5.3833238780498505e-05, -4.9542635679244995e-05, -4.5252032577991486e-05, -4.0961429476737976e-05, -3.6670826375484467e-05, -3.238022327423096e-05, -2.8089620172977448e-05, -2.3799017071723938e-05, -1.950841397047043e-05, -1.5217810869216919e-05, -1.092720776796341e-05, -6.6366046667099e-06, -2.3460015654563904e-06, 1.944601535797119e-06, 6.235204637050629e-06, 1.0525807738304138e-05, 1.4816410839557648e-05, 1.9107013940811157e-05, 2.3397617042064667e-05, 2.7688220143318176e-05, 3.1978823244571686e-05, 3.6269426345825195e-05, 4.0560029447078705e-05, 4.4850632548332214e-05, 4.9141235649585724e-05, 5.3431838750839233e-05, 5.772244185209274e-05, 6.201304495334625e-05, 6.630364805459976e-05, 7.059425115585327e-05, 7.488485425710678e-05, 7.917545735836029e-05, 8.34660604596138e-05, 8.775666356086731e-05, 9.204726666212082e-05, 9.633786976337433e-05, 0.00010062847286462784, 0.00010491907596588135, 0.00010920967906713486, 0.00011350028216838837, 0.00011779088526964188, 0.00012208148837089539, 0.0001263720914721489, 0.0001306626945734024, 0.00013495329767465591, 0.00013924390077590942, 0.00014353450387716293, 0.00014782510697841644, 0.00015211571007966995, 0.00015640631318092346, 0.00016069691628217697, 0.00016498751938343048, 0.000169278122484684, 0.0001735687255859375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 5.0, 1.0, 5.0, 9.0, 13.0, 29.0, 28.0, 62.0, 125.0, 210.0, 463.0, 1078.0, 2978.0, 11327.0, 116902.0, 870843.0, 34773.0, 6304.0, 1969.0, 720.0, 319.0, 161.0, 83.0, 52.0, 33.0, 22.0, 13.0, 10.0, 7.0, 1.0, 4.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.400390625, -1.35833740234375, -1.3162841796875, -1.27423095703125, -1.232177734375, -1.19012451171875, -1.1480712890625, -1.10601806640625, -1.06396484375, -1.02191162109375, -0.9798583984375, -0.93780517578125, -0.895751953125, -0.85369873046875, -0.8116455078125, -0.76959228515625, -0.7275390625, -0.68548583984375, -0.6434326171875, -0.60137939453125, -0.559326171875, -0.51727294921875, -0.4752197265625, -0.43316650390625, -0.39111328125, -0.34906005859375, -0.3070068359375, -0.26495361328125, -0.222900390625, -0.18084716796875, -0.1387939453125, -0.09674072265625, -0.0546875, -0.01263427734375, 0.0294189453125, 0.07147216796875, 0.113525390625, 0.15557861328125, 0.1976318359375, 0.23968505859375, 0.28173828125, 0.32379150390625, 0.3658447265625, 0.40789794921875, 0.449951171875, 0.49200439453125, 0.5340576171875, 0.57611083984375, 0.6181640625, 0.66021728515625, 0.7022705078125, 0.74432373046875, 0.786376953125, 0.82843017578125, 0.8704833984375, 0.91253662109375, 0.95458984375, 0.99664306640625, 1.0386962890625, 1.08074951171875, 1.122802734375, 1.16485595703125, 1.2069091796875, 1.24896240234375, 1.291015625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 8.0, 6.0, 9.0, 9.0, 18.0, 14.0, 28.0, 57.0, 62.0, 144.0, 186.0, 162.0, 113.0, 73.0, 41.0, 16.0, 16.0, 5.0, 3.0, 11.0, 8.0, 6.0, 3.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.428466796875, -0.41534423828125, -0.4022216796875, -0.38909912109375, -0.3759765625, -0.36285400390625, -0.3497314453125, -0.33660888671875, -0.323486328125, -0.31036376953125, -0.2972412109375, -0.28411865234375, -0.27099609375, -0.25787353515625, -0.2447509765625, -0.23162841796875, -0.218505859375, -0.20538330078125, -0.1922607421875, -0.17913818359375, -0.166015625, -0.15289306640625, -0.1397705078125, -0.12664794921875, -0.113525390625, -0.10040283203125, -0.0872802734375, -0.07415771484375, -0.06103515625, -0.04791259765625, -0.0347900390625, -0.02166748046875, -0.008544921875, 0.00457763671875, 0.0177001953125, 0.03082275390625, 0.0439453125, 0.05706787109375, 0.0701904296875, 0.08331298828125, 0.096435546875, 0.10955810546875, 0.1226806640625, 0.13580322265625, 0.14892578125, 0.16204833984375, 0.1751708984375, 0.18829345703125, 0.201416015625, 0.21453857421875, 0.2276611328125, 0.24078369140625, 0.25390625, 0.26702880859375, 0.2801513671875, 0.29327392578125, 0.306396484375, 0.31951904296875, 0.3326416015625, 0.34576416015625, 0.35888671875, 0.37200927734375, 0.3851318359375, 0.39825439453125, 0.411376953125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 10.0, 46.0, 339.0, 433.0, 119.0, 34.0, 17.0, 5.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-15.462682723999023, -15.133832931518555, -14.80498218536377, -14.4761323928833, -14.147282600402832, -13.818431854248047, -13.489582061767578, -13.16073226928711, -12.83188247680664, -12.503032684326172, -12.174181938171387, -11.845332145690918, -11.51648235321045, -11.187631607055664, -10.858781814575195, -10.529932022094727, -10.201081275939941, -9.872231483459473, -9.543380737304688, -9.214530944824219, -8.88568115234375, -8.556831359863281, -8.227980613708496, -7.899130821228027, -7.5702805519104, -7.241430282592773, -6.912580490112305, -6.583730220794678, -6.254879951477051, -5.926030158996582, -5.597179889678955, -5.268329620361328, -4.939480781555176, -4.610630512237549, -4.28178071975708, -3.952930450439453, -3.6240804195404053, -3.2952303886413574, -2.9663801193237305, -2.6375300884246826, -2.3086800575256348, -1.979830026626587, -1.6509798765182495, -1.322129726409912, -0.9932796955108643, -0.6644296646118164, -0.335579514503479, -0.0067293643951416016, 0.32212066650390625, 0.6509707570075989, 0.9798208475112915, 1.308670997619629, 1.6375210285186768, 1.9663710594177246, 2.2952213287353516, 2.6240713596343994, 2.9529213905334473, 3.281771421432495, 3.610621452331543, 3.93947172164917, 4.268321990966797, 4.597171783447266, 4.926022052764893, 5.2548723220825195, 5.583722114562988]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 4.0, 5.0, 8.0, 18.0, 21.0, 26.0, 40.0, 45.0, 75.0, 63.0, 79.0, 89.0, 88.0, 100.0, 75.0, 71.0, 69.0, 40.0, 29.0, 23.0, 12.0, 9.0, 6.0, 6.0, 5.0, 4.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.749948501586914, -4.652196407318115, -4.554444789886475, -4.456692695617676, -4.358941078186035, -4.261188983917236, -4.163437366485596, -4.065685272216797, -3.967933416366577, -3.8701815605163574, -3.7724297046661377, -3.674677848815918, -3.576925754547119, -3.4791738986968994, -3.3814220428466797, -3.28367018699646, -3.1859183311462402, -3.0881664752960205, -2.990414619445801, -2.892662763595581, -2.7949109077453613, -2.6971588134765625, -2.5994069576263428, -2.501655101776123, -2.4039032459259033, -2.3061513900756836, -2.208399534225464, -2.110647678375244, -2.0128955841064453, -1.9151438474655151, -1.8173918724060059, -1.7196400165557861, -1.6218880414962769, -1.5241361856460571, -1.4263842105865479, -1.3286323547363281, -1.2308804988861084, -1.1331286430358887, -1.035376787185669, -0.9376248121261597, -0.8398729562759399, -0.7421211004257202, -0.6443691849708557, -0.5466172695159912, -0.4488654136657715, -0.35111352801322937, -0.25336164236068726, -0.15560972690582275, -0.05785787105560303, 0.03989401459693909, 0.1376459002494812, 0.23539778590202332, 0.33314967155456543, 0.43090155720710754, 0.5286534428596497, 0.6264053583145142, 0.7241572141647339, 0.8219090700149536, 0.9196609854698181, 1.0174129009246826, 1.1151647567749023, 1.212916612625122, 1.3106684684753418, 1.408420443534851, 1.5061722993850708]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 7.0, 8.0, 10.0, 15.0, 24.0, 22.0, 25.0, 46.0, 51.0, 62.0, 76.0, 120.0, 195.0, 15365.0, 4177298.0, 852.0, 78.0, 25.0, 9.0, 3.0, 0.0, 1.0], "bins": [-14.9765625, -14.71044921875, -14.4443359375, -14.17822265625, -13.912109375, -13.64599609375, -13.3798828125, -13.11376953125, -12.84765625, -12.58154296875, -12.3154296875, -12.04931640625, -11.783203125, -11.51708984375, -11.2509765625, -10.98486328125, -10.71875, -10.45263671875, -10.1865234375, -9.92041015625, -9.654296875, -9.38818359375, -9.1220703125, -8.85595703125, -8.58984375, -8.32373046875, -8.0576171875, -7.79150390625, -7.525390625, -7.25927734375, -6.9931640625, -6.72705078125, -6.4609375, -6.19482421875, -5.9287109375, -5.66259765625, -5.396484375, -5.13037109375, -4.8642578125, -4.59814453125, -4.33203125, -4.06591796875, -3.7998046875, -3.53369140625, -3.267578125, -3.00146484375, -2.7353515625, -2.46923828125, -2.203125, -1.93701171875, -1.6708984375, -1.40478515625, -1.138671875, -0.87255859375, -0.6064453125, -0.34033203125, -0.07421875, 0.19189453125, 0.4580078125, 0.72412109375, 0.990234375, 1.25634765625, 1.5224609375, 1.78857421875, 2.0546875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 8.0, 15.0, 71.0, 131.0, 254.0, 273.0, 180.0, 56.0, 22.0, 7.0, 4.0, 0.0, 1.0], "bins": [-0.373779296875, -0.3671083450317383, -0.36043739318847656, -0.35376644134521484, -0.3470954895019531, -0.3404245376586914, -0.3337535858154297, -0.32708263397216797, -0.32041168212890625, -0.31374073028564453, -0.3070697784423828, -0.3003988265991211, -0.2937278747558594, -0.28705692291259766, -0.28038597106933594, -0.2737150192260742, -0.2670440673828125, -0.2603731155395508, -0.25370216369628906, -0.24703121185302734, -0.24036026000976562, -0.2336893081665039, -0.2270183563232422, -0.22034740447998047, -0.21367645263671875, -0.20700550079345703, -0.2003345489501953, -0.1936635971069336, -0.18699264526367188, -0.18032169342041016, -0.17365074157714844, -0.16697978973388672, -0.160308837890625, -0.15363788604736328, -0.14696693420410156, -0.14029598236083984, -0.13362503051757812, -0.1269540786743164, -0.12028312683105469, -0.11361217498779297, -0.10694122314453125, -0.10027027130126953, -0.09359931945800781, -0.0869283676147461, -0.08025741577148438, -0.07358646392822266, -0.06691551208496094, -0.06024456024169922, -0.0535736083984375, -0.04690265655517578, -0.04023170471191406, -0.033560752868652344, -0.026889801025390625, -0.020218849182128906, -0.013547897338867188, -0.006876945495605469, -0.00020599365234375, 0.006464958190917969, 0.013135910034179688, 0.019806861877441406, 0.026477813720703125, 0.033148765563964844, 0.03981971740722656, 0.04649066925048828, 0.05316162109375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 0.0, 2.0, 2.0, 6.0, 11.0, 17.0, 32.0, 39.0, 52.0, 63.0, 69.0, 95.0, 113.0, 131.0, 237.0, 439.0, 18962.0, 4171537.0, 1611.0, 281.0, 155.0, 98.0, 100.0, 76.0, 55.0, 41.0, 20.0, 11.0, 6.0, 5.0, 4.0, 5.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-14.359375, -13.98388671875, -13.6083984375, -13.23291015625, -12.857421875, -12.48193359375, -12.1064453125, -11.73095703125, -11.35546875, -10.97998046875, -10.6044921875, -10.22900390625, -9.853515625, -9.47802734375, -9.1025390625, -8.72705078125, -8.3515625, -7.97607421875, -7.6005859375, -7.22509765625, -6.849609375, -6.47412109375, -6.0986328125, -5.72314453125, -5.34765625, -4.97216796875, -4.5966796875, -4.22119140625, -3.845703125, -3.47021484375, -3.0947265625, -2.71923828125, -2.34375, -1.96826171875, -1.5927734375, -1.21728515625, -0.841796875, -0.46630859375, -0.0908203125, 0.28466796875, 0.66015625, 1.03564453125, 1.4111328125, 1.78662109375, 2.162109375, 2.53759765625, 2.9130859375, 3.28857421875, 3.6640625, 4.03955078125, 4.4150390625, 4.79052734375, 5.166015625, 5.54150390625, 5.9169921875, 6.29248046875, 6.66796875, 7.04345703125, 7.4189453125, 7.79443359375, 8.169921875, 8.54541015625, 8.9208984375, 9.29638671875, 9.671875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 19.0, 138.0, 3531.0, 312.0, 55.0, 20.0, 12.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.041015625, -2.004322052001953, -1.9676284790039062, -1.9309349060058594, -1.8942413330078125, -1.8575477600097656, -1.8208541870117188, -1.7841606140136719, -1.747467041015625, -1.7107734680175781, -1.6740798950195312, -1.6373863220214844, -1.6006927490234375, -1.5639991760253906, -1.5273056030273438, -1.4906120300292969, -1.45391845703125, -1.4172248840332031, -1.3805313110351562, -1.3438377380371094, -1.3071441650390625, -1.2704505920410156, -1.2337570190429688, -1.1970634460449219, -1.160369873046875, -1.1236763000488281, -1.0869827270507812, -1.0502891540527344, -1.0135955810546875, -0.9769020080566406, -0.9402084350585938, -0.9035148620605469, -0.8668212890625, -0.8301277160644531, -0.7934341430664062, -0.7567405700683594, -0.7200469970703125, -0.6833534240722656, -0.6466598510742188, -0.6099662780761719, -0.573272705078125, -0.5365791320800781, -0.49988555908203125, -0.4631919860839844, -0.4264984130859375, -0.3898048400878906, -0.35311126708984375, -0.3164176940917969, -0.27972412109375, -0.24303054809570312, -0.20633697509765625, -0.16964340209960938, -0.1329498291015625, -0.09625625610351562, -0.05956268310546875, -0.022869110107421875, 0.013824462890625, 0.050518035888671875, 0.08721160888671875, 0.12390518188476562, 0.1605987548828125, 0.19729232788085938, 0.23398590087890625, 0.2706794738769531, 0.307373046875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 6.0, 13.0, 81.0, 684.0, 182.0, 32.0, 8.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-33.15644454956055, -32.51461410522461, -31.872785568237305, -31.230955123901367, -30.589126586914062, -29.947296142578125, -29.305465698242188, -28.66363525390625, -28.021806716918945, -27.379976272583008, -26.738147735595703, -26.096317291259766, -25.454486846923828, -24.812658309936523, -24.170827865600586, -23.52899932861328, -22.887168884277344, -22.245338439941406, -21.6035099029541, -20.961679458618164, -20.31985092163086, -19.678020477294922, -19.036190032958984, -18.394359588623047, -17.752531051635742, -17.110700607299805, -16.4688720703125, -15.827041625976562, -15.185212135314941, -14.54338264465332, -13.901552200317383, -13.259722709655762, -12.617891311645508, -11.976061820983887, -11.334232330322266, -10.692401885986328, -10.050572395324707, -9.408742904663086, -8.766912460327148, -8.125082969665527, -7.4832539558410645, -6.841423988342285, -6.199594497680664, -5.557765007019043, -4.915935039520264, -4.274105072021484, -3.6322755813598633, -2.990445613861084, -2.348616123199463, -1.7067863941192627, -1.0649566650390625, -0.4231269359588623, 0.2187027931213379, 0.8605325222015381, 1.5023622512817383, 2.1441922187805176, 2.7860217094421387, 3.427851438522339, 4.069681167602539, 4.71151065826416, 5.3533406257629395, 5.995170593261719, 6.63700008392334, 7.278830051422119, 7.92065954208374]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 5.0, 14.0, 37.0, 55.0, 87.0, 140.0, 154.0, 156.0, 128.0, 89.0, 70.0, 36.0, 17.0, 8.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.329023361206055, -7.0994415283203125, -6.869859218597412, -6.64027738571167, -6.4106950759887695, -6.181113243103027, -5.951531410217285, -5.721949100494385, -5.492366790771484, -5.262784957885742, -5.033202648162842, -4.8036208152771, -4.574038505554199, -4.344456672668457, -4.114874839782715, -3.8852925300598145, -3.6557106971740723, -3.426128625869751, -3.1965465545654297, -2.9669647216796875, -2.737382411956787, -2.507800579071045, -2.2782185077667236, -2.0486364364624023, -1.819054365158081, -1.5894722938537598, -1.3598902225494385, -1.1303082704544067, -0.9007261991500854, -0.6711441278457642, -0.4415621757507324, -0.21198010444641113, 0.017601490020751953, 0.24718353152275085, 0.47676557302474976, 0.7063475847244263, 0.9359296560287476, 1.1655117273330688, 1.3950936794281006, 1.6246757507324219, 1.8542578220367432, 2.0838398933410645, 2.3134219646453857, 2.543004035949707, 2.772585868835449, 3.0021681785583496, 3.231750011444092, 3.461332082748413, 3.6909141540527344, 3.9204962253570557, 4.150078296661377, 4.379660129547119, 4.6092424392700195, 4.838824272155762, 5.068406105041504, 5.297988414764404, 5.527570724487305, 5.757152557373047, 5.986734867095947, 6.2163166999816895, 6.44589900970459, 6.675480842590332, 6.905062675476074, 7.134644985198975, 7.364226818084717]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 4.0, 7.0, 5.0, 4.0, 10.0, 17.0, 18.0, 23.0, 32.0, 43.0, 66.0, 112.0, 175.0, 320.0, 702.0, 1960.0, 8496.0, 90637.0, 871364.0, 64366.0, 6993.0, 1735.0, 659.0, 321.0, 175.0, 96.0, 41.0, 56.0, 35.0, 21.0, 15.0, 11.0, 10.0, 7.0, 7.0, 5.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8515625, -3.72906494140625, -3.6065673828125, -3.48406982421875, -3.361572265625, -3.23907470703125, -3.1165771484375, -2.99407958984375, -2.87158203125, -2.74908447265625, -2.6265869140625, -2.50408935546875, -2.381591796875, -2.25909423828125, -2.1365966796875, -2.01409912109375, -1.8916015625, -1.76910400390625, -1.6466064453125, -1.52410888671875, -1.401611328125, -1.27911376953125, -1.1566162109375, -1.03411865234375, -0.91162109375, -0.78912353515625, -0.6666259765625, -0.54412841796875, -0.421630859375, -0.29913330078125, -0.1766357421875, -0.05413818359375, 0.068359375, 0.19085693359375, 0.3133544921875, 0.43585205078125, 0.558349609375, 0.68084716796875, 0.8033447265625, 0.92584228515625, 1.04833984375, 1.17083740234375, 1.2933349609375, 1.41583251953125, 1.538330078125, 1.66082763671875, 1.7833251953125, 1.90582275390625, 2.0283203125, 2.15081787109375, 2.2733154296875, 2.39581298828125, 2.518310546875, 2.64080810546875, 2.7633056640625, 2.88580322265625, 3.00830078125, 3.13079833984375, 3.2532958984375, 3.37579345703125, 3.498291015625, 3.62078857421875, 3.7432861328125, 3.86578369140625, 3.98828125]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 5.0, 26.0, 41.0, 76.0, 120.0, 135.0, 176.0, 139.0, 111.0, 76.0, 48.0, 26.0, 11.0, 7.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.54443359375, -0.5331954956054688, -0.5219573974609375, -0.5107192993164062, -0.499481201171875, -0.48824310302734375, -0.4770050048828125, -0.46576690673828125, -0.45452880859375, -0.44329071044921875, -0.4320526123046875, -0.42081451416015625, -0.409576416015625, -0.39833831787109375, -0.3871002197265625, -0.37586212158203125, -0.3646240234375, -0.35338592529296875, -0.3421478271484375, -0.33090972900390625, -0.319671630859375, -0.30843353271484375, -0.2971954345703125, -0.28595733642578125, -0.27471923828125, -0.26348114013671875, -0.2522430419921875, -0.24100494384765625, -0.229766845703125, -0.21852874755859375, -0.2072906494140625, -0.19605255126953125, -0.184814453125, -0.17357635498046875, -0.1623382568359375, -0.15110015869140625, -0.139862060546875, -0.12862396240234375, -0.1173858642578125, -0.10614776611328125, -0.09490966796875, -0.08367156982421875, -0.0724334716796875, -0.06119537353515625, -0.049957275390625, -0.03871917724609375, -0.0274810791015625, -0.01624298095703125, -0.0050048828125, 0.00623321533203125, 0.0174713134765625, 0.02870941162109375, 0.039947509765625, 0.05118560791015625, 0.0624237060546875, 0.07366180419921875, 0.08489990234375, 0.09613800048828125, 0.1073760986328125, 0.11861419677734375, 0.129852294921875, 0.14109039306640625, 0.1523284912109375, 0.16356658935546875, 0.1748046875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 2.0, 10.0, 5.0, 11.0, 17.0, 17.0, 17.0, 20.0, 46.0, 68.0, 75.0, 117.0, 208.0, 338.0, 570.0, 1069.0, 2170.0, 5422.0, 15607.0, 58172.0, 386696.0, 480571.0, 68676.0, 17600.0, 6050.0, 2340.0, 1127.0, 547.0, 331.0, 201.0, 131.0, 110.0, 69.0, 48.0, 38.0, 15.0, 15.0, 9.0, 9.0, 8.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.052734375, -1.0152130126953125, -0.977691650390625, -0.9401702880859375, -0.90264892578125, -0.8651275634765625, -0.827606201171875, -0.7900848388671875, -0.7525634765625, -0.7150421142578125, -0.677520751953125, -0.6399993896484375, -0.60247802734375, -0.5649566650390625, -0.527435302734375, -0.4899139404296875, -0.452392578125, -0.4148712158203125, -0.377349853515625, -0.3398284912109375, -0.30230712890625, -0.2647857666015625, -0.227264404296875, -0.1897430419921875, -0.1522216796875, -0.1147003173828125, -0.077178955078125, -0.0396575927734375, -0.00213623046875, 0.0353851318359375, 0.072906494140625, 0.1104278564453125, 0.14794921875, 0.1854705810546875, 0.222991943359375, 0.2605133056640625, 0.29803466796875, 0.3355560302734375, 0.373077392578125, 0.4105987548828125, 0.4481201171875, 0.4856414794921875, 0.523162841796875, 0.5606842041015625, 0.59820556640625, 0.6357269287109375, 0.673248291015625, 0.7107696533203125, 0.748291015625, 0.7858123779296875, 0.823333740234375, 0.8608551025390625, 0.89837646484375, 0.9358978271484375, 0.973419189453125, 1.0109405517578125, 1.0484619140625, 1.0859832763671875, 1.123504638671875, 1.1610260009765625, 1.19854736328125, 1.2360687255859375, 1.273590087890625, 1.3111114501953125, 1.3486328125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 3.0, 1.0, 4.0, 3.0, 6.0, 8.0, 8.0, 11.0, 9.0, 14.0, 21.0, 15.0, 23.0, 31.0, 29.0, 35.0, 33.0, 58.0, 35.0, 58.0, 66.0, 49.0, 67.0, 48.0, 49.0, 52.0, 35.0, 42.0, 33.0, 26.0, 25.0, 15.0, 17.0, 16.0, 14.0, 11.0, 10.0, 4.0, 6.0, 5.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.54296875, -0.5246810913085938, -0.5063934326171875, -0.48810577392578125, -0.469818115234375, -0.45153045654296875, -0.4332427978515625, -0.41495513916015625, -0.39666748046875, -0.37837982177734375, -0.3600921630859375, -0.34180450439453125, -0.323516845703125, -0.30522918701171875, -0.2869415283203125, -0.26865386962890625, -0.2503662109375, -0.23207855224609375, -0.2137908935546875, -0.19550323486328125, -0.177215576171875, -0.15892791748046875, -0.1406402587890625, -0.12235260009765625, -0.10406494140625, -0.08577728271484375, -0.0674896240234375, -0.04920196533203125, -0.030914306640625, -0.01262664794921875, 0.0056610107421875, 0.02394866943359375, 0.042236328125, 0.06052398681640625, 0.0788116455078125, 0.09709930419921875, 0.115386962890625, 0.13367462158203125, 0.1519622802734375, 0.17024993896484375, 0.18853759765625, 0.20682525634765625, 0.2251129150390625, 0.24340057373046875, 0.261688232421875, 0.27997589111328125, 0.2982635498046875, 0.31655120849609375, 0.3348388671875, 0.35312652587890625, 0.3714141845703125, 0.38970184326171875, 0.407989501953125, 0.42627716064453125, 0.4445648193359375, 0.46285247802734375, 0.48114013671875, 0.49942779541015625, 0.5177154541015625, 0.5360031127929688, 0.554290771484375, 0.5725784301757812, 0.5908660888671875, 0.6091537475585938, 0.62744140625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 7.0, 5.0, 10.0, 21.0, 37.0, 64.0, 129.0, 263.0, 815.0, 3510.0, 61918.0, 966887.0, 12346.0, 1660.0, 485.0, 186.0, 89.0, 46.0, 33.0, 18.0, 9.0, 6.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.732421875, -2.615020751953125, -2.49761962890625, -2.380218505859375, -2.2628173828125, -2.145416259765625, -2.02801513671875, -1.910614013671875, -1.793212890625, -1.675811767578125, -1.55841064453125, -1.441009521484375, -1.3236083984375, -1.206207275390625, -1.08880615234375, -0.971405029296875, -0.85400390625, -0.736602783203125, -0.61920166015625, -0.501800537109375, -0.3843994140625, -0.266998291015625, -0.14959716796875, -0.032196044921875, 0.085205078125, 0.202606201171875, 0.32000732421875, 0.437408447265625, 0.5548095703125, 0.672210693359375, 0.78961181640625, 0.907012939453125, 1.0244140625, 1.141815185546875, 1.25921630859375, 1.376617431640625, 1.4940185546875, 1.611419677734375, 1.72882080078125, 1.846221923828125, 1.963623046875, 2.081024169921875, 2.19842529296875, 2.315826416015625, 2.4332275390625, 2.550628662109375, 2.66802978515625, 2.785430908203125, 2.90283203125, 3.020233154296875, 3.13763427734375, 3.255035400390625, 3.3724365234375, 3.489837646484375, 3.60723876953125, 3.724639892578125, 3.842041015625, 3.959442138671875, 4.07684326171875, 4.194244384765625, 4.3116455078125, 4.429046630859375, 4.54644775390625, 4.663848876953125, 4.78125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 2.0, 1.0, 3.0, 5.0, 9.0, 11.0, 12.0, 16.0, 24.0, 38.0, 96.0, 195.0, 275.0, 143.0, 69.0, 28.0, 25.0, 15.0, 9.0, 6.0, 6.0, 8.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0002455711364746094, -0.0002386048436164856, -0.00023163855075836182, -0.00022467225790023804, -0.00021770596504211426, -0.00021073967218399048, -0.0002037733793258667, -0.00019680708646774292, -0.00018984079360961914, -0.00018287450075149536, -0.00017590820789337158, -0.0001689419150352478, -0.00016197562217712402, -0.00015500932931900024, -0.00014804303646087646, -0.00014107674360275269, -0.0001341104507446289, -0.00012714415788650513, -0.00012017786502838135, -0.00011321157217025757, -0.00010624527931213379, -9.927898645401001e-05, -9.231269359588623e-05, -8.534640073776245e-05, -7.838010787963867e-05, -7.141381502151489e-05, -6.444752216339111e-05, -5.7481229305267334e-05, -5.0514936447143555e-05, -4.3548643589019775e-05, -3.6582350730895996e-05, -2.9616057872772217e-05, -2.2649765014648438e-05, -1.5683472156524658e-05, -8.717179298400879e-06, -1.7508864402770996e-06, 5.21540641784668e-06, 1.2181699275970459e-05, 1.9147992134094238e-05, 2.6114284992218018e-05, 3.30805778503418e-05, 4.0046870708465576e-05, 4.7013163566589355e-05, 5.3979456424713135e-05, 6.0945749282836914e-05, 6.79120421409607e-05, 7.487833499908447e-05, 8.184462785720825e-05, 8.881092071533203e-05, 9.577721357345581e-05, 0.00010274350643157959, 0.00010970979928970337, 0.00011667609214782715, 0.00012364238500595093, 0.0001306086778640747, 0.00013757497072219849, 0.00014454126358032227, 0.00015150755643844604, 0.00015847384929656982, 0.0001654401421546936, 0.00017240643501281738, 0.00017937272787094116, 0.00018633902072906494, 0.00019330531358718872, 0.0002002716064453125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 5.0, 6.0, 3.0, 3.0, 3.0, 7.0, 20.0, 16.0, 43.0, 49.0, 110.0, 219.0, 464.0, 1179.0, 4166.0, 32690.0, 927278.0, 73329.0, 6336.0, 1509.0, 560.0, 236.0, 120.0, 66.0, 55.0, 33.0, 16.0, 17.0, 8.0, 3.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.884765625, -1.813995361328125, -1.74322509765625, -1.672454833984375, -1.6016845703125, -1.530914306640625, -1.46014404296875, -1.389373779296875, -1.318603515625, -1.247833251953125, -1.17706298828125, -1.106292724609375, -1.0355224609375, -0.964752197265625, -0.89398193359375, -0.823211669921875, -0.75244140625, -0.681671142578125, -0.61090087890625, -0.540130615234375, -0.4693603515625, -0.398590087890625, -0.32781982421875, -0.257049560546875, -0.186279296875, -0.115509033203125, -0.04473876953125, 0.026031494140625, 0.0968017578125, 0.167572021484375, 0.23834228515625, 0.309112548828125, 0.3798828125, 0.450653076171875, 0.52142333984375, 0.592193603515625, 0.6629638671875, 0.733734130859375, 0.80450439453125, 0.875274658203125, 0.946044921875, 1.016815185546875, 1.08758544921875, 1.158355712890625, 1.2291259765625, 1.299896240234375, 1.37066650390625, 1.441436767578125, 1.51220703125, 1.582977294921875, 1.65374755859375, 1.724517822265625, 1.7952880859375, 1.866058349609375, 1.93682861328125, 2.007598876953125, 2.078369140625, 2.149139404296875, 2.21990966796875, 2.290679931640625, 2.3614501953125, 2.432220458984375, 2.50299072265625, 2.573760986328125, 2.64453125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 4.0, 3.0, 12.0, 10.0, 17.0, 36.0, 48.0, 86.0, 162.0, 246.0, 162.0, 90.0, 63.0, 26.0, 19.0, 7.0, 5.0, 2.0, 4.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6123046875, -0.5873031616210938, -0.5623016357421875, -0.5373001098632812, -0.512298583984375, -0.48729705810546875, -0.4622955322265625, -0.43729400634765625, -0.41229248046875, -0.38729095458984375, -0.3622894287109375, -0.33728790283203125, -0.312286376953125, -0.28728485107421875, -0.2622833251953125, -0.23728179931640625, -0.2122802734375, -0.18727874755859375, -0.1622772216796875, -0.13727569580078125, -0.112274169921875, -0.08727264404296875, -0.0622711181640625, -0.03726959228515625, -0.01226806640625, 0.01273345947265625, 0.0377349853515625, 0.06273651123046875, 0.087738037109375, 0.11273956298828125, 0.1377410888671875, 0.16274261474609375, 0.187744140625, 0.21274566650390625, 0.2377471923828125, 0.26274871826171875, 0.287750244140625, 0.31275177001953125, 0.3377532958984375, 0.36275482177734375, 0.38775634765625, 0.41275787353515625, 0.4377593994140625, 0.46276092529296875, 0.487762451171875, 0.5127639770507812, 0.5377655029296875, 0.5627670288085938, 0.5877685546875, 0.6127700805664062, 0.6377716064453125, 0.6627731323242188, 0.687774658203125, 0.7127761840820312, 0.7377777099609375, 0.7627792358398438, 0.78778076171875, 0.8127822875976562, 0.8377838134765625, 0.8627853393554688, 0.887786865234375, 0.9127883911132812, 0.9377899169921875, 0.9627914428710938, 0.98779296875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 3.0, 14.0, 40.0, 88.0, 237.0, 312.0, 185.0, 74.0, 31.0, 11.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.502788543701172, -9.141368865966797, -8.779949188232422, -8.418529510498047, -8.057108879089355, -7.6956892013549805, -7.3342695236206055, -6.9728498458862305, -6.611429691314697, -6.250010013580322, -5.888589859008789, -5.527170181274414, -5.165750503540039, -4.804330348968506, -4.442910671234131, -4.081490516662598, -3.7200708389282227, -3.3586509227752686, -2.9972310066223145, -2.6358113288879395, -2.2743914127349854, -1.9129714965820312, -1.5515518188476562, -1.1901319026947021, -0.828711986541748, -0.4672921299934387, -0.1058722734451294, 0.25554752349853516, 0.6169674396514893, 0.9783873558044434, 1.3398070335388184, 1.7012269496917725, 2.06264591217041, 2.4240658283233643, 2.7854857444763184, 3.1469054222106934, 3.5083253383636475, 3.8697452545166016, 4.231164932250977, 4.592584609985352, 4.954004764556885, 5.31542444229126, 5.676844596862793, 6.038264274597168, 6.399683952331543, 6.761104106903076, 7.122523784637451, 7.483943939208984, 7.845363616943359, 8.206783294677734, 8.56820297241211, 8.929622650146484, 9.291043281555176, 9.65246295928955, 10.013882637023926, 10.3753023147583, 10.736722946166992, 11.098142623901367, 11.459562301635742, 11.820981979370117, 12.182402610778809, 12.543822288513184, 12.905241966247559, 13.266661643981934, 13.628081321716309]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 1.0, 5.0, 3.0, 7.0, 10.0, 4.0, 12.0, 19.0, 26.0, 27.0, 37.0, 42.0, 37.0, 43.0, 58.0, 48.0, 55.0, 61.0, 57.0, 68.0, 74.0, 51.0, 46.0, 46.0, 30.0, 26.0, 25.0, 24.0, 16.0, 14.0, 12.0, 5.0, 5.0, 0.0, 1.0, 4.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.100205421447754, -3.9622089862823486, -3.8242127895355225, -3.686216354370117, -3.548220157623291, -3.4102237224578857, -3.2722272872924805, -3.1342310905456543, -2.996234655380249, -2.8582382202148438, -2.7202420234680176, -2.5822455883026123, -2.444249153137207, -2.306252956390381, -2.1682565212249756, -2.0302600860595703, -1.8922638893127441, -1.7542675733566284, -1.6162712574005127, -1.4782748222351074, -1.3402785062789917, -1.202282190322876, -1.0642857551574707, -0.926289439201355, -0.7882931232452393, -0.6502968072891235, -0.512300431728363, -0.3743040859699249, -0.23630774021148682, -0.0983114242553711, 0.039684951305389404, 0.1776813268661499, 0.3156776428222656, 0.45367398858070374, 0.5916703343391418, 0.7296667098999023, 0.8676630258560181, 1.0056593418121338, 1.143655776977539, 1.2816520929336548, 1.4196484088897705, 1.5576447248458862, 1.695641040802002, 1.8336374759674072, 1.971633791923523, 2.1096301078796387, 2.247626543045044, 2.385622978210449, 2.5236191749572754, 2.6616156101226807, 2.799611806869507, 2.937608242034912, 3.0756044387817383, 3.2136008739471436, 3.351597309112549, 3.489593505859375, 3.6275899410247803, 3.7655863761901855, 3.9035825729370117, 4.041578769683838, 4.179575443267822, 4.317571640014648, 4.455567836761475, 4.593564510345459, 4.731560707092285]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 1.0, 4.0, 2.0, 3.0, 6.0, 5.0, 4.0, 4.0, 6.0, 6.0, 8.0, 9.0, 9.0, 7.0, 13.0, 9.0, 14.0, 15.0, 15.0, 13.0, 17.0, 23.0, 26.0, 40.0, 49.0, 61.0, 89.0, 115.0, 150.0, 228.0, 382.0, 690.0, 1710.0, 4731.0, 15412.0, 70290.0, 3976290.0, 93945.0, 19909.0, 6327.0, 2148.0, 819.0, 344.0, 144.0, 86.0, 47.0, 37.0, 14.0, 6.0, 5.0, 2.0], "bins": [-5.7421875, -5.6263275146484375, -5.510467529296875, -5.3946075439453125, -5.27874755859375, -5.1628875732421875, -5.047027587890625, -4.9311676025390625, -4.8153076171875, -4.6994476318359375, -4.583587646484375, -4.4677276611328125, -4.35186767578125, -4.2360076904296875, -4.120147705078125, -4.0042877197265625, -3.888427734375, -3.7725677490234375, -3.656707763671875, -3.5408477783203125, -3.42498779296875, -3.3091278076171875, -3.193267822265625, -3.0774078369140625, -2.9615478515625, -2.8456878662109375, -2.729827880859375, -2.6139678955078125, -2.49810791015625, -2.3822479248046875, -2.266387939453125, -2.1505279541015625, -2.03466796875, -1.9188079833984375, -1.802947998046875, -1.6870880126953125, -1.57122802734375, -1.4553680419921875, -1.339508056640625, -1.2236480712890625, -1.1077880859375, -0.9919281005859375, -0.876068115234375, -0.7602081298828125, -0.64434814453125, -0.5284881591796875, -0.412628173828125, -0.2967681884765625, -0.180908203125, -0.0650482177734375, 0.050811767578125, 0.1666717529296875, 0.28253173828125, 0.3983917236328125, 0.514251708984375, 0.6301116943359375, 0.7459716796875, 0.8618316650390625, 0.977691650390625, 1.0935516357421875, 1.20941162109375, 1.3252716064453125, 1.441131591796875, 1.5569915771484375, 1.6728515625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 4.0, 3.0, 16.0, 23.0, 46.0, 76.0, 93.0, 117.0, 167.0, 150.0, 111.0, 78.0, 51.0, 32.0, 22.0, 10.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0], "bins": [-0.5498046875, -0.5389633178710938, -0.5281219482421875, -0.5172805786132812, -0.506439208984375, -0.49559783935546875, -0.4847564697265625, -0.47391510009765625, -0.46307373046875, -0.45223236083984375, -0.4413909912109375, -0.43054962158203125, -0.419708251953125, -0.40886688232421875, -0.3980255126953125, -0.38718414306640625, -0.3763427734375, -0.36550140380859375, -0.3546600341796875, -0.34381866455078125, -0.332977294921875, -0.32213592529296875, -0.3112945556640625, -0.30045318603515625, -0.28961181640625, -0.27877044677734375, -0.2679290771484375, -0.25708770751953125, -0.246246337890625, -0.23540496826171875, -0.2245635986328125, -0.21372222900390625, -0.202880859375, -0.19203948974609375, -0.1811981201171875, -0.17035675048828125, -0.159515380859375, -0.14867401123046875, -0.1378326416015625, -0.12699127197265625, -0.11614990234375, -0.10530853271484375, -0.0944671630859375, -0.08362579345703125, -0.072784423828125, -0.06194305419921875, -0.0511016845703125, -0.04026031494140625, -0.0294189453125, -0.01857757568359375, -0.0077362060546875, 0.00310516357421875, 0.013946533203125, 0.02478790283203125, 0.0356292724609375, 0.04647064208984375, 0.05731201171875, 0.06815338134765625, 0.0789947509765625, 0.08983612060546875, 0.100677490234375, 0.11151885986328125, 0.1223602294921875, 0.13320159912109375, 0.14404296875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 3.0, 4.0, 11.0, 9.0, 15.0, 18.0, 33.0, 50.0, 82.0, 128.0, 240.0, 348.0, 685.0, 1792.0, 10430.0, 4011231.0, 161637.0, 5327.0, 1180.0, 512.0, 243.0, 121.0, 70.0, 45.0, 29.0, 15.0, 15.0, 3.0, 2.0, 2.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-9.0859375, -8.86358642578125, -8.6412353515625, -8.41888427734375, -8.196533203125, -7.97418212890625, -7.7518310546875, -7.52947998046875, -7.30712890625, -7.08477783203125, -6.8624267578125, -6.64007568359375, -6.417724609375, -6.19537353515625, -5.9730224609375, -5.75067138671875, -5.5283203125, -5.30596923828125, -5.0836181640625, -4.86126708984375, -4.638916015625, -4.41656494140625, -4.1942138671875, -3.97186279296875, -3.74951171875, -3.52716064453125, -3.3048095703125, -3.08245849609375, -2.860107421875, -2.63775634765625, -2.4154052734375, -2.19305419921875, -1.970703125, -1.74835205078125, -1.5260009765625, -1.30364990234375, -1.081298828125, -0.85894775390625, -0.6365966796875, -0.41424560546875, -0.19189453125, 0.03045654296875, 0.2528076171875, 0.47515869140625, 0.697509765625, 0.91986083984375, 1.1422119140625, 1.36456298828125, 1.5869140625, 1.80926513671875, 2.0316162109375, 2.25396728515625, 2.476318359375, 2.69866943359375, 2.9210205078125, 3.14337158203125, 3.36572265625, 3.58807373046875, 3.8104248046875, 4.03277587890625, 4.255126953125, 4.47747802734375, 4.6998291015625, 4.92218017578125, 5.14453125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 4.0, 8.0, 16.0, 24.0, 39.0, 59.0, 249.0, 3140.0, 350.0, 73.0, 43.0, 34.0, 16.0, 8.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.255859375, -1.2270889282226562, -1.1983184814453125, -1.1695480346679688, -1.140777587890625, -1.1120071411132812, -1.0832366943359375, -1.0544662475585938, -1.02569580078125, -0.9969253540039062, -0.9681549072265625, -0.9393844604492188, -0.910614013671875, -0.8818435668945312, -0.8530731201171875, -0.8243026733398438, -0.7955322265625, -0.7667617797851562, -0.7379913330078125, -0.7092208862304688, -0.680450439453125, -0.6516799926757812, -0.6229095458984375, -0.5941390991210938, -0.56536865234375, -0.5365982055664062, -0.5078277587890625, -0.47905731201171875, -0.450286865234375, -0.42151641845703125, -0.3927459716796875, -0.36397552490234375, -0.335205078125, -0.30643463134765625, -0.2776641845703125, -0.24889373779296875, -0.220123291015625, -0.19135284423828125, -0.1625823974609375, -0.13381195068359375, -0.10504150390625, -0.07627105712890625, -0.0475006103515625, -0.01873016357421875, 0.010040283203125, 0.03881072998046875, 0.0675811767578125, 0.09635162353515625, 0.1251220703125, 0.15389251708984375, 0.1826629638671875, 0.21143341064453125, 0.240203857421875, 0.26897430419921875, 0.2977447509765625, 0.32651519775390625, 0.35528564453125, 0.38405609130859375, 0.4128265380859375, 0.44159698486328125, 0.470367431640625, 0.49913787841796875, 0.5279083251953125, 0.5566787719726562, 0.58544921875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 4.0, 2.0, 7.0, 7.0, 20.0, 30.0, 48.0, 124.0, 283.0, 297.0, 94.0, 43.0, 18.0, 12.0, 9.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.011326789855957, -7.8253173828125, -7.639307498931885, -7.453298091888428, -7.2672882080078125, -7.0812788009643555, -6.895269393920898, -6.709259510040283, -6.523249626159668, -6.337240219116211, -6.151230335235596, -5.965220928192139, -5.779211044311523, -5.593201637268066, -5.407192230224609, -5.221182346343994, -5.035172939300537, -4.84916353225708, -4.663153648376465, -4.477144241333008, -4.291134357452393, -4.1051249504089355, -3.9191153049468994, -3.7331056594848633, -3.547096014022827, -3.361086368560791, -3.175076723098755, -2.9890670776367188, -2.8030576705932617, -2.6170477867126465, -2.4310383796691895, -2.2450287342071533, -2.059018611907959, -1.8730089664459229, -1.6869993209838867, -1.5009897947311401, -1.314980149269104, -1.1289705038070679, -0.9429609775543213, -0.7569513320922852, -0.570941686630249, -0.3849320709705353, -0.19892245531082153, -0.012912869453430176, 0.17309677600860596, 0.3591064214706421, 0.5451159477233887, 0.7311255931854248, 0.9171352386474609, 1.103144884109497, 1.2891545295715332, 1.4751640558242798, 1.661173701286316, 1.847183346748352, 2.0331928730010986, 2.2192025184631348, 2.405212163925171, 2.591221809387207, 2.777231454849243, 2.9632411003112793, 3.1492505073547363, 3.3352603912353516, 3.5212697982788086, 3.7072794437408447, 3.893289089202881]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 7.0, 9.0, 17.0, 31.0, 30.0, 41.0, 69.0, 85.0, 90.0, 81.0, 99.0, 105.0, 77.0, 70.0, 67.0, 50.0, 36.0, 23.0, 11.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.377947807312012, -4.254711627960205, -4.131475448608398, -4.008239269256592, -3.885003089904785, -3.7617669105529785, -3.6385304927825928, -3.515294313430786, -3.3920581340789795, -3.268821954727173, -3.145585775375366, -3.0223495960235596, -2.899113178253174, -2.775876998901367, -2.6526408195495605, -2.529404640197754, -2.4061684608459473, -2.2829322814941406, -2.159696102142334, -2.0364599227905273, -1.9132236242294312, -1.7899874448776245, -1.6667511463165283, -1.5435149669647217, -1.420278787612915, -1.2970426082611084, -1.1738064289093018, -1.0505701303482056, -0.9273339509963989, -0.8040977716445923, -0.6808615326881409, -0.5576252937316895, -0.4343891143798828, -0.3111529052257538, -0.18791669607162476, -0.06468048691749573, 0.0585557222366333, 0.18179190158843994, 0.30502814054489136, 0.4282643795013428, 0.5515005588531494, 0.674736738204956, 0.7979729771614075, 0.9212092161178589, 1.0444453954696655, 1.1676815748214722, 1.2909178733825684, 1.414154052734375, 1.5373902320861816, 1.6606264114379883, 1.783862590789795, 1.9070988893508911, 2.030334949493408, 2.153571128845215, 2.2768075466156006, 2.4000437259674072, 2.523279905319214, 2.6465160846710205, 2.769752264022827, 2.892988443374634, 3.0162248611450195, 3.139461040496826, 3.262697219848633, 3.3859333992004395, 3.509169578552246]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 6.0, 3.0, 7.0, 4.0, 6.0, 10.0, 14.0, 17.0, 22.0, 48.0, 52.0, 68.0, 100.0, 174.0, 275.0, 531.0, 1101.0, 2818.0, 9604.0, 50258.0, 657427.0, 287179.0, 28368.0, 6452.0, 2100.0, 854.0, 426.0, 210.0, 139.0, 83.0, 61.0, 40.0, 23.0, 21.0, 10.0, 20.0, 6.0, 5.0, 6.0, 5.0, 1.0, 1.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7109375, -2.623046875, -2.53515625, -2.447265625, -2.359375, -2.271484375, -2.18359375, -2.095703125, -2.0078125, -1.919921875, -1.83203125, -1.744140625, -1.65625, -1.568359375, -1.48046875, -1.392578125, -1.3046875, -1.216796875, -1.12890625, -1.041015625, -0.953125, -0.865234375, -0.77734375, -0.689453125, -0.6015625, -0.513671875, -0.42578125, -0.337890625, -0.25, -0.162109375, -0.07421875, 0.013671875, 0.1015625, 0.189453125, 0.27734375, 0.365234375, 0.453125, 0.541015625, 0.62890625, 0.716796875, 0.8046875, 0.892578125, 0.98046875, 1.068359375, 1.15625, 1.244140625, 1.33203125, 1.419921875, 1.5078125, 1.595703125, 1.68359375, 1.771484375, 1.859375, 1.947265625, 2.03515625, 2.123046875, 2.2109375, 2.298828125, 2.38671875, 2.474609375, 2.5625, 2.650390625, 2.73828125, 2.826171875, 2.9140625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 6.0, 7.0, 10.0, 25.0, 33.0, 49.0, 68.0, 112.0, 118.0, 114.0, 116.0, 93.0, 81.0, 75.0, 35.0, 25.0, 14.0, 15.0, 4.0, 5.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52734375, -0.514678955078125, -0.50201416015625, -0.489349365234375, -0.4766845703125, -0.464019775390625, -0.45135498046875, -0.438690185546875, -0.426025390625, -0.413360595703125, -0.40069580078125, -0.388031005859375, -0.3753662109375, -0.362701416015625, -0.35003662109375, -0.337371826171875, -0.32470703125, -0.312042236328125, -0.29937744140625, -0.286712646484375, -0.2740478515625, -0.261383056640625, -0.24871826171875, -0.236053466796875, -0.223388671875, -0.210723876953125, -0.19805908203125, -0.185394287109375, -0.1727294921875, -0.160064697265625, -0.14739990234375, -0.134735107421875, -0.1220703125, -0.109405517578125, -0.09674072265625, -0.084075927734375, -0.0714111328125, -0.058746337890625, -0.04608154296875, -0.033416748046875, -0.020751953125, -0.008087158203125, 0.00457763671875, 0.017242431640625, 0.0299072265625, 0.042572021484375, 0.05523681640625, 0.067901611328125, 0.08056640625, 0.093231201171875, 0.10589599609375, 0.118560791015625, 0.1312255859375, 0.143890380859375, 0.15655517578125, 0.169219970703125, 0.181884765625, 0.194549560546875, 0.20721435546875, 0.219879150390625, 0.2325439453125, 0.245208740234375, 0.25787353515625, 0.270538330078125, 0.283203125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 5.0, 7.0, 4.0, 10.0, 11.0, 11.0, 17.0, 18.0, 41.0, 46.0, 85.0, 114.0, 164.0, 275.0, 413.0, 640.0, 1137.0, 2181.0, 4389.0, 9579.0, 25054.0, 82195.0, 422187.0, 381829.0, 76182.0, 23572.0, 9117.0, 4093.0, 2161.0, 1171.0, 699.0, 417.0, 232.0, 129.0, 113.0, 83.0, 39.0, 38.0, 30.0, 20.0, 13.0, 13.0, 7.0, 5.0, 5.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0732421875, -1.03619384765625, -0.9991455078125, -0.96209716796875, -0.925048828125, -0.88800048828125, -0.8509521484375, -0.81390380859375, -0.77685546875, -0.73980712890625, -0.7027587890625, -0.66571044921875, -0.628662109375, -0.59161376953125, -0.5545654296875, -0.51751708984375, -0.48046875, -0.44342041015625, -0.4063720703125, -0.36932373046875, -0.332275390625, -0.29522705078125, -0.2581787109375, -0.22113037109375, -0.18408203125, -0.14703369140625, -0.1099853515625, -0.07293701171875, -0.035888671875, 0.00115966796875, 0.0382080078125, 0.07525634765625, 0.1123046875, 0.14935302734375, 0.1864013671875, 0.22344970703125, 0.260498046875, 0.29754638671875, 0.3345947265625, 0.37164306640625, 0.40869140625, 0.44573974609375, 0.4827880859375, 0.51983642578125, 0.556884765625, 0.59393310546875, 0.6309814453125, 0.66802978515625, 0.705078125, 0.74212646484375, 0.7791748046875, 0.81622314453125, 0.853271484375, 0.89031982421875, 0.9273681640625, 0.96441650390625, 1.00146484375, 1.03851318359375, 1.0755615234375, 1.11260986328125, 1.149658203125, 1.18670654296875, 1.2237548828125, 1.26080322265625, 1.2978515625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 4.0, 9.0, 9.0, 14.0, 6.0, 16.0, 15.0, 23.0, 27.0, 19.0, 22.0, 37.0, 42.0, 45.0, 56.0, 54.0, 57.0, 53.0, 49.0, 52.0, 57.0, 49.0, 42.0, 42.0, 30.0, 27.0, 30.0, 27.0, 10.0, 16.0, 14.0, 14.0, 7.0, 6.0, 3.0, 8.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8232421875, -0.7955551147460938, -0.7678680419921875, -0.7401809692382812, -0.712493896484375, -0.6848068237304688, -0.6571197509765625, -0.6294326782226562, -0.60174560546875, -0.5740585327148438, -0.5463714599609375, -0.5186843872070312, -0.490997314453125, -0.46331024169921875, -0.4356231689453125, -0.40793609619140625, -0.3802490234375, -0.35256195068359375, -0.3248748779296875, -0.29718780517578125, -0.269500732421875, -0.24181365966796875, -0.2141265869140625, -0.18643951416015625, -0.15875244140625, -0.13106536865234375, -0.1033782958984375, -0.07569122314453125, -0.048004150390625, -0.02031707763671875, 0.0073699951171875, 0.03505706787109375, 0.062744140625, 0.09043121337890625, 0.1181182861328125, 0.14580535888671875, 0.173492431640625, 0.20117950439453125, 0.2288665771484375, 0.25655364990234375, 0.28424072265625, 0.31192779541015625, 0.3396148681640625, 0.36730194091796875, 0.394989013671875, 0.42267608642578125, 0.4503631591796875, 0.47805023193359375, 0.5057373046875, 0.5334243774414062, 0.5611114501953125, 0.5887985229492188, 0.616485595703125, 0.6441726684570312, 0.6718597412109375, 0.6995468139648438, 0.72723388671875, 0.7549209594726562, 0.7826080322265625, 0.8102951049804688, 0.837982177734375, 0.8656692504882812, 0.8933563232421875, 0.9210433959960938, 0.94873046875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 3.0, 4.0, 10.0, 6.0, 13.0, 17.0, 23.0, 28.0, 62.0, 117.0, 292.0, 839.0, 3374.0, 46763.0, 986752.0, 7817.0, 1556.0, 484.0, 187.0, 74.0, 45.0, 22.0, 18.0, 13.0, 8.0, 8.0, 6.0, 5.0, 4.0, 4.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.052734375, -2.94464111328125, -2.8365478515625, -2.72845458984375, -2.620361328125, -2.51226806640625, -2.4041748046875, -2.29608154296875, -2.18798828125, -2.07989501953125, -1.9718017578125, -1.86370849609375, -1.755615234375, -1.64752197265625, -1.5394287109375, -1.43133544921875, -1.3232421875, -1.21514892578125, -1.1070556640625, -0.99896240234375, -0.890869140625, -0.78277587890625, -0.6746826171875, -0.56658935546875, -0.45849609375, -0.35040283203125, -0.2423095703125, -0.13421630859375, -0.026123046875, 0.08197021484375, 0.1900634765625, 0.29815673828125, 0.40625, 0.51434326171875, 0.6224365234375, 0.73052978515625, 0.838623046875, 0.94671630859375, 1.0548095703125, 1.16290283203125, 1.27099609375, 1.37908935546875, 1.4871826171875, 1.59527587890625, 1.703369140625, 1.81146240234375, 1.9195556640625, 2.02764892578125, 2.1357421875, 2.24383544921875, 2.3519287109375, 2.46002197265625, 2.568115234375, 2.67620849609375, 2.7843017578125, 2.89239501953125, 3.00048828125, 3.10858154296875, 3.2166748046875, 3.32476806640625, 3.432861328125, 3.54095458984375, 3.6490478515625, 3.75714111328125, 3.865234375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 4.0, 2.0, 18.0, 22.0, 30.0, 77.0, 183.0, 271.0, 202.0, 96.0, 51.0, 18.0, 14.0, 3.0, 5.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020194053649902344, -0.00019627436995506287, -0.0001906082034111023, -0.00018494203686714172, -0.00017927587032318115, -0.00017360970377922058, -0.00016794353723526, -0.00016227737069129944, -0.00015661120414733887, -0.0001509450376033783, -0.00014527887105941772, -0.00013961270451545715, -0.00013394653797149658, -0.000128280371427536, -0.00012261420488357544, -0.00011694803833961487, -0.0001112818717956543, -0.00010561570525169373, -9.994953870773315e-05, -9.428337216377258e-05, -8.861720561981201e-05, -8.295103907585144e-05, -7.728487253189087e-05, -7.16187059879303e-05, -6.595253944396973e-05, -6.0286372900009155e-05, -5.4620206356048584e-05, -4.895403981208801e-05, -4.328787326812744e-05, -3.762170672416687e-05, -3.19555401802063e-05, -2.6289373636245728e-05, -2.0623207092285156e-05, -1.4957040548324585e-05, -9.290874004364014e-06, -3.6247074604034424e-06, 2.041459083557129e-06, 7.7076256275177e-06, 1.3373792171478271e-05, 1.9039958715438843e-05, 2.4706125259399414e-05, 3.0372291803359985e-05, 3.603845834732056e-05, 4.170462489128113e-05, 4.73707914352417e-05, 5.303695797920227e-05, 5.870312452316284e-05, 6.436929106712341e-05, 7.003545761108398e-05, 7.570162415504456e-05, 8.136779069900513e-05, 8.70339572429657e-05, 9.270012378692627e-05, 9.836629033088684e-05, 0.00010403245687484741, 0.00010969862341880798, 0.00011536478996276855, 0.00012103095650672913, 0.0001266971230506897, 0.00013236328959465027, 0.00013802945613861084, 0.0001436956226825714, 0.00014936178922653198, 0.00015502795577049255, 0.00016069412231445312]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 4.0, 5.0, 7.0, 7.0, 9.0, 4.0, 13.0, 8.0, 10.0, 13.0, 21.0, 31.0, 44.0, 80.0, 118.0, 163.0, 217.0, 334.0, 534.0, 947.0, 1406.0, 2347.0, 4453.0, 14238.0, 890400.0, 116586.0, 7847.0, 3492.0, 1847.0, 1179.0, 777.0, 478.0, 293.0, 186.0, 127.0, 91.0, 60.0, 57.0, 39.0, 24.0, 11.0, 9.0, 11.0, 6.0, 5.0, 1.0, 4.0, 5.0, 0.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0], "bins": [-1.8037109375, -1.7487335205078125, -1.693756103515625, -1.6387786865234375, -1.58380126953125, -1.5288238525390625, -1.473846435546875, -1.4188690185546875, -1.3638916015625, -1.3089141845703125, -1.253936767578125, -1.1989593505859375, -1.14398193359375, -1.0890045166015625, -1.034027099609375, -0.9790496826171875, -0.924072265625, -0.8690948486328125, -0.814117431640625, -0.7591400146484375, -0.70416259765625, -0.6491851806640625, -0.594207763671875, -0.5392303466796875, -0.4842529296875, -0.4292755126953125, -0.374298095703125, -0.3193206787109375, -0.26434326171875, -0.2093658447265625, -0.154388427734375, -0.0994110107421875, -0.04443359375, 0.0105438232421875, 0.065521240234375, 0.1204986572265625, 0.17547607421875, 0.2304534912109375, 0.285430908203125, 0.3404083251953125, 0.3953857421875, 0.4503631591796875, 0.505340576171875, 0.5603179931640625, 0.61529541015625, 0.6702728271484375, 0.725250244140625, 0.7802276611328125, 0.835205078125, 0.8901824951171875, 0.945159912109375, 1.0001373291015625, 1.05511474609375, 1.1100921630859375, 1.165069580078125, 1.2200469970703125, 1.2750244140625, 1.3300018310546875, 1.384979248046875, 1.4399566650390625, 1.49493408203125, 1.5499114990234375, 1.604888916015625, 1.6598663330078125, 1.71484375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 6.0, 12.0, 72.0, 318.0, 405.0, 110.0, 33.0, 14.0, 4.0, 2.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.3271484375, -1.285858154296875, -1.24456787109375, -1.203277587890625, -1.1619873046875, -1.120697021484375, -1.07940673828125, -1.038116455078125, -0.996826171875, -0.955535888671875, -0.91424560546875, -0.872955322265625, -0.8316650390625, -0.790374755859375, -0.74908447265625, -0.707794189453125, -0.66650390625, -0.625213623046875, -0.58392333984375, -0.542633056640625, -0.5013427734375, -0.460052490234375, -0.41876220703125, -0.377471923828125, -0.336181640625, -0.294891357421875, -0.25360107421875, -0.212310791015625, -0.1710205078125, -0.129730224609375, -0.08843994140625, -0.047149658203125, -0.005859375, 0.035430908203125, 0.07672119140625, 0.118011474609375, 0.1593017578125, 0.200592041015625, 0.24188232421875, 0.283172607421875, 0.324462890625, 0.365753173828125, 0.40704345703125, 0.448333740234375, 0.4896240234375, 0.530914306640625, 0.57220458984375, 0.613494873046875, 0.65478515625, 0.696075439453125, 0.73736572265625, 0.778656005859375, 0.8199462890625, 0.861236572265625, 0.90252685546875, 0.943817138671875, 0.985107421875, 1.026397705078125, 1.06768798828125, 1.108978271484375, 1.1502685546875, 1.191558837890625, 1.23284912109375, 1.274139404296875, 1.3154296875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 8.0, 22.0, 140.0, 446.0, 281.0, 79.0, 20.0, 8.0, 6.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-32.675392150878906, -31.83068084716797, -30.98596954345703, -30.141258239746094, -29.296545028686523, -28.451833724975586, -27.60712242126465, -26.76241111755371, -25.917699813842773, -25.072988510131836, -24.2282772064209, -23.383563995361328, -22.53885269165039, -21.694141387939453, -20.849430084228516, -20.004718780517578, -19.16000747680664, -18.315296173095703, -17.470584869384766, -16.625873565673828, -15.781161308288574, -14.93644905090332, -14.091737747192383, -13.247026443481445, -12.402313232421875, -11.557601928710938, -10.712889671325684, -9.868178367614746, -9.023467063903809, -8.178754806518555, -7.334043502807617, -6.48933219909668, -5.644620895385742, -4.7999091148376465, -3.955197811126709, -3.1104860305786133, -2.2657744884490967, -1.42106294631958, -0.5763511657714844, 0.2683601379394531, 1.1130719184875488, 1.9577834606170654, 2.802495002746582, 3.6472067832946777, 4.491918563842773, 5.336629867553711, 6.181341648101807, 7.026052951812744, 7.87076473236084, 8.715476036071777, 9.560188293457031, 10.404899597167969, 11.249610900878906, 12.094322204589844, 12.939034461975098, 13.783745765686035, 14.628458023071289, 15.473169326782227, 16.317880630493164, 17.162593841552734, 18.007305145263672, 18.85201644897461, 19.696727752685547, 20.541439056396484, 21.386150360107422]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 8.0, 10.0, 5.0, 19.0, 10.0, 15.0, 20.0, 28.0, 35.0, 33.0, 31.0, 52.0, 39.0, 45.0, 49.0, 49.0, 68.0, 62.0, 48.0, 56.0, 46.0, 40.0, 47.0, 40.0, 26.0, 23.0, 27.0, 16.0, 9.0, 17.0, 11.0, 5.0, 6.0, 1.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-7.471404075622559, -7.274046421051025, -7.076688766479492, -6.879331111907959, -6.681973457336426, -6.484615802764893, -6.287258148193359, -6.089900016784668, -5.892542839050293, -5.69518518447876, -5.497827529907227, -5.300469875335693, -5.10311222076416, -4.905754566192627, -4.708396911621094, -4.511038780212402, -4.313681125640869, -4.116323471069336, -3.9189658164978027, -3.7216081619262695, -3.5242505073547363, -3.326892852783203, -3.129534959793091, -2.9321773052215576, -2.7348196506500244, -2.537461996078491, -2.340104341506958, -2.1427464485168457, -1.945388913154602, -1.7480312585830688, -1.550673484802246, -1.353315830230713, -1.1559576988220215, -0.9586000442504883, -0.7612423300743103, -0.5638846158981323, -0.3665269613265991, -0.16916930675506592, 0.028188467025756836, 0.22554612159729004, 0.42290377616882324, 0.6202614307403564, 0.8176191449165344, 1.0149768590927124, 1.2123345136642456, 1.4096921682357788, 1.6070499420166016, 1.8044075965881348, 2.001765251159668, 2.199122905731201, 2.3964805603027344, 2.5938382148742676, 2.791195869445801, 2.988553524017334, 3.1859114170074463, 3.3832690715789795, 3.5806267261505127, 3.777984380722046, 3.975342035293579, 4.172699928283691, 4.370057582855225, 4.567415237426758, 4.764772891998291, 4.962130546569824, 5.159488201141357]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 6.0, 3.0, 1.0, 4.0, 3.0, 8.0, 7.0, 6.0, 10.0, 12.0, 16.0, 22.0, 17.0, 23.0, 28.0, 20.0, 35.0, 38.0, 40.0, 53.0, 65.0, 82.0, 75.0, 108.0, 221.0, 392.0, 801.0, 1526.0, 3250.0, 7705.0, 21864.0, 219297.0, 3882714.0, 35389.0, 11179.0, 4662.0, 2120.0, 1059.0, 572.0, 342.0, 197.0, 99.0, 68.0, 57.0, 42.0, 15.0, 14.0, 6.0, 3.0, 4.0], "bins": [-4.69921875, -4.5974273681640625, -4.495635986328125, -4.3938446044921875, -4.29205322265625, -4.1902618408203125, -4.088470458984375, -3.9866790771484375, -3.8848876953125, -3.7830963134765625, -3.681304931640625, -3.5795135498046875, -3.47772216796875, -3.3759307861328125, -3.274139404296875, -3.1723480224609375, -3.070556640625, -2.9687652587890625, -2.866973876953125, -2.7651824951171875, -2.66339111328125, -2.5615997314453125, -2.459808349609375, -2.3580169677734375, -2.2562255859375, -2.1544342041015625, -2.052642822265625, -1.9508514404296875, -1.84906005859375, -1.7472686767578125, -1.645477294921875, -1.5436859130859375, -1.44189453125, -1.3401031494140625, -1.238311767578125, -1.1365203857421875, -1.03472900390625, -0.9329376220703125, -0.831146240234375, -0.7293548583984375, -0.6275634765625, -0.5257720947265625, -0.423980712890625, -0.3221893310546875, -0.22039794921875, -0.1186065673828125, -0.016815185546875, 0.0849761962890625, 0.186767578125, 0.2885589599609375, 0.390350341796875, 0.4921417236328125, 0.59393310546875, 0.6957244873046875, 0.797515869140625, 0.8993072509765625, 1.0010986328125, 1.1028900146484375, 1.204681396484375, 1.3064727783203125, 1.40826416015625, 1.5100555419921875, 1.611846923828125, 1.7136383056640625, 1.8154296875]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 2.0, 6.0, 11.0, 13.0, 16.0, 37.0, 62.0, 63.0, 88.0, 101.0, 104.0, 98.0, 106.0, 80.0, 65.0, 51.0, 40.0, 19.0, 15.0, 12.0, 6.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0], "bins": [-0.5537109375, -0.5414009094238281, -0.5290908813476562, -0.5167808532714844, -0.5044708251953125, -0.4921607971191406, -0.47985076904296875, -0.4675407409667969, -0.455230712890625, -0.4429206848144531, -0.43061065673828125, -0.4183006286621094, -0.4059906005859375, -0.3936805725097656, -0.38137054443359375, -0.3690605163574219, -0.35675048828125, -0.3444404602050781, -0.33213043212890625, -0.3198204040527344, -0.3075103759765625, -0.2952003479003906, -0.28289031982421875, -0.2705802917480469, -0.258270263671875, -0.24596023559570312, -0.23365020751953125, -0.22134017944335938, -0.2090301513671875, -0.19672012329101562, -0.18441009521484375, -0.17210006713867188, -0.1597900390625, -0.14748001098632812, -0.13516998291015625, -0.12285995483398438, -0.1105499267578125, -0.09823989868164062, -0.08592987060546875, -0.07361984252929688, -0.061309814453125, -0.048999786376953125, -0.03668975830078125, -0.024379730224609375, -0.0120697021484375, 0.000240325927734375, 0.01255035400390625, 0.024860382080078125, 0.03717041015625, 0.049480438232421875, 0.06179046630859375, 0.07410049438476562, 0.0864105224609375, 0.09872055053710938, 0.11103057861328125, 0.12334060668945312, 0.135650634765625, 0.14796066284179688, 0.16027069091796875, 0.17258071899414062, 0.1848907470703125, 0.19720077514648438, 0.20951080322265625, 0.22182083129882812, 0.234130859375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 5.0, 4.0, 12.0, 8.0, 17.0, 20.0, 14.0, 22.0, 34.0, 39.0, 48.0, 74.0, 86.0, 114.0, 197.0, 435.0, 1266.0, 9870.0, 3975982.0, 198989.0, 5268.0, 941.0, 330.0, 180.0, 84.0, 58.0, 50.0, 36.0, 28.0, 17.0, 8.0, 9.0, 11.0, 8.0, 9.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.81640625, -6.62640380859375, -6.4364013671875, -6.24639892578125, -6.056396484375, -5.86639404296875, -5.6763916015625, -5.48638916015625, -5.29638671875, -5.10638427734375, -4.9163818359375, -4.72637939453125, -4.536376953125, -4.34637451171875, -4.1563720703125, -3.96636962890625, -3.7763671875, -3.58636474609375, -3.3963623046875, -3.20635986328125, -3.016357421875, -2.82635498046875, -2.6363525390625, -2.44635009765625, -2.25634765625, -2.06634521484375, -1.8763427734375, -1.68634033203125, -1.496337890625, -1.30633544921875, -1.1163330078125, -0.92633056640625, -0.736328125, -0.54632568359375, -0.3563232421875, -0.16632080078125, 0.023681640625, 0.21368408203125, 0.4036865234375, 0.59368896484375, 0.78369140625, 0.97369384765625, 1.1636962890625, 1.35369873046875, 1.543701171875, 1.73370361328125, 1.9237060546875, 2.11370849609375, 2.3037109375, 2.49371337890625, 2.6837158203125, 2.87371826171875, 3.063720703125, 3.25372314453125, 3.4437255859375, 3.63372802734375, 3.82373046875, 4.01373291015625, 4.2037353515625, 4.39373779296875, 4.583740234375, 4.77374267578125, 4.9637451171875, 5.15374755859375, 5.34375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 8.0, 8.0, 23.0, 34.0, 105.0, 961.0, 2752.0, 114.0, 45.0, 20.0, 8.0, 6.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.0703125, -2.02978515625, -1.9892578125, -1.94873046875, -1.908203125, -1.86767578125, -1.8271484375, -1.78662109375, -1.74609375, -1.70556640625, -1.6650390625, -1.62451171875, -1.583984375, -1.54345703125, -1.5029296875, -1.46240234375, -1.421875, -1.38134765625, -1.3408203125, -1.30029296875, -1.259765625, -1.21923828125, -1.1787109375, -1.13818359375, -1.09765625, -1.05712890625, -1.0166015625, -0.97607421875, -0.935546875, -0.89501953125, -0.8544921875, -0.81396484375, -0.7734375, -0.73291015625, -0.6923828125, -0.65185546875, -0.611328125, -0.57080078125, -0.5302734375, -0.48974609375, -0.44921875, -0.40869140625, -0.3681640625, -0.32763671875, -0.287109375, -0.24658203125, -0.2060546875, -0.16552734375, -0.125, -0.08447265625, -0.0439453125, -0.00341796875, 0.037109375, 0.07763671875, 0.1181640625, 0.15869140625, 0.19921875, 0.23974609375, 0.2802734375, 0.32080078125, 0.361328125, 0.40185546875, 0.4423828125, 0.48291015625, 0.5234375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 11.0, 28.0, 104.0, 397.0, 319.0, 99.0, 25.0, 13.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.226717948913574, -12.961729049682617, -12.696741104125977, -12.431753158569336, -12.166764259338379, -11.901775360107422, -11.636787414550781, -11.37179946899414, -11.106810569763184, -10.841821670532227, -10.576833724975586, -10.311845779418945, -10.046856880187988, -9.781867980957031, -9.51688003540039, -9.25189208984375, -8.986903190612793, -8.721914291381836, -8.456926345825195, -8.191938400268555, -7.926949501037598, -7.661961078643799, -7.39697265625, -7.131984233856201, -6.866995811462402, -6.6020073890686035, -6.337018966674805, -6.072030544281006, -5.807042121887207, -5.542053699493408, -5.277065277099609, -5.0120768547058105, -4.747088432312012, -4.482100009918213, -4.217111587524414, -3.9521231651306152, -3.6871347427368164, -3.4221463203430176, -3.1571578979492188, -2.89216947555542, -2.6271812915802, -2.3621928691864014, -2.0972044467926025, -1.8322160243988037, -1.5672276020050049, -1.302239179611206, -1.0372507572174072, -0.7722623348236084, -0.5072739124298096, -0.24228549003601074, 0.022702932357788086, 0.2876913547515869, 0.5526797771453857, 0.8176681995391846, 1.0826566219329834, 1.3476450443267822, 1.612633466720581, 1.8776218891143799, 2.1426103115081787, 2.4075987339019775, 2.6725871562957764, 2.937575578689575, 3.202564001083374, 3.467552423477173, 3.7325408458709717]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 10.0, 8.0, 11.0, 17.0, 33.0, 42.0, 66.0, 72.0, 92.0, 76.0, 88.0, 105.0, 86.0, 74.0, 67.0, 41.0, 51.0, 22.0, 15.0, 7.0, 5.0, 3.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8538014888763428, -2.760843276977539, -2.6678850650787354, -2.5749268531799316, -2.481968879699707, -2.3890106678009033, -2.2960524559020996, -2.203094244003296, -2.110136032104492, -2.0171778202056885, -1.9242196083068848, -1.8312615156173706, -1.738303303718567, -1.6453450918197632, -1.552386999130249, -1.4594287872314453, -1.3664705753326416, -1.273512363433838, -1.1805541515350342, -1.08759605884552, -0.9946378469467163, -0.9016796350479126, -0.8087214827537537, -0.7157633304595947, -0.622805118560791, -0.5298469066619873, -0.43688875436782837, -0.34393057227134705, -0.2509723901748657, -0.1580142080783844, -0.06505602598190308, 0.02790212631225586, 0.12086057662963867, 0.21381875872612, 0.3067769408226013, 0.39973512291908264, 0.49269330501556396, 0.5856515169143677, 0.6786096692085266, 0.7715678215026855, 0.8645260334014893, 0.957484245300293, 1.0504424571990967, 1.1434005498886108, 1.2363587617874146, 1.3293169736862183, 1.4222750663757324, 1.5152332782745361, 1.6081914901733398, 1.7011497020721436, 1.7941079139709473, 1.8870660066604614, 1.9800242185592651, 2.0729823112487793, 2.165940523147583, 2.2588987350463867, 2.3518569469451904, 2.444815158843994, 2.537773370742798, 2.6307315826416016, 2.723689556121826, 2.81664776802063, 2.9096059799194336, 3.0025641918182373, 3.095522403717041]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 8.0, 6.0, 6.0, 19.0, 24.0, 37.0, 55.0, 77.0, 105.0, 221.0, 360.0, 728.0, 1361.0, 4106.0, 18088.0, 224511.0, 744646.0, 43105.0, 6971.0, 2180.0, 877.0, 425.0, 203.0, 134.0, 99.0, 51.0, 41.0, 25.0, 12.0, 18.0, 9.0, 12.0, 6.0, 4.0, 5.0, 3.0, 6.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.03125, -2.900634765625, -2.77001953125, -2.639404296875, -2.5087890625, -2.378173828125, -2.24755859375, -2.116943359375, -1.986328125, -1.855712890625, -1.72509765625, -1.594482421875, -1.4638671875, -1.333251953125, -1.20263671875, -1.072021484375, -0.94140625, -0.810791015625, -0.68017578125, -0.549560546875, -0.4189453125, -0.288330078125, -0.15771484375, -0.027099609375, 0.103515625, 0.234130859375, 0.36474609375, 0.495361328125, 0.6259765625, 0.756591796875, 0.88720703125, 1.017822265625, 1.1484375, 1.279052734375, 1.40966796875, 1.540283203125, 1.6708984375, 1.801513671875, 1.93212890625, 2.062744140625, 2.193359375, 2.323974609375, 2.45458984375, 2.585205078125, 2.7158203125, 2.846435546875, 2.97705078125, 3.107666015625, 3.23828125, 3.368896484375, 3.49951171875, 3.630126953125, 3.7607421875, 3.891357421875, 4.02197265625, 4.152587890625, 4.283203125, 4.413818359375, 4.54443359375, 4.675048828125, 4.8056640625, 4.936279296875, 5.06689453125, 5.197509765625, 5.328125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 11.0, 13.0, 20.0, 30.0, 37.0, 62.0, 74.0, 72.0, 80.0, 111.0, 97.0, 78.0, 75.0, 67.0, 63.0, 42.0, 21.0, 12.0, 13.0, 11.0, 2.0, 5.0, 1.0, 2.0, 0.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.552734375, -0.5398445129394531, -0.5269546508789062, -0.5140647888183594, -0.5011749267578125, -0.4882850646972656, -0.47539520263671875, -0.4625053405761719, -0.449615478515625, -0.4367256164550781, -0.42383575439453125, -0.4109458923339844, -0.3980560302734375, -0.3851661682128906, -0.37227630615234375, -0.3593864440917969, -0.34649658203125, -0.3336067199707031, -0.32071685791015625, -0.3078269958496094, -0.2949371337890625, -0.2820472717285156, -0.26915740966796875, -0.2562675476074219, -0.243377685546875, -0.23048782348632812, -0.21759796142578125, -0.20470809936523438, -0.1918182373046875, -0.17892837524414062, -0.16603851318359375, -0.15314865112304688, -0.1402587890625, -0.12736892700195312, -0.11447906494140625, -0.10158920288085938, -0.0886993408203125, -0.07580947875976562, -0.06291961669921875, -0.050029754638671875, -0.037139892578125, -0.024250030517578125, -0.01136016845703125, 0.001529693603515625, 0.0144195556640625, 0.027309417724609375, 0.04019927978515625, 0.053089141845703125, 0.06597900390625, 0.07886886596679688, 0.09175872802734375, 0.10464859008789062, 0.1175384521484375, 0.13042831420898438, 0.14331817626953125, 0.15620803833007812, 0.169097900390625, 0.18198776245117188, 0.19487762451171875, 0.20776748657226562, 0.2206573486328125, 0.23354721069335938, 0.24643707275390625, 0.2593269348144531, 0.272216796875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 4.0, 5.0, 7.0, 22.0, 19.0, 33.0, 36.0, 67.0, 134.0, 196.0, 347.0, 714.0, 1431.0, 3496.0, 10711.0, 50826.0, 557245.0, 371414.0, 37609.0, 8541.0, 2975.0, 1322.0, 621.0, 334.0, 165.0, 106.0, 53.0, 39.0, 33.0, 17.0, 15.0, 3.0, 9.0, 6.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.650390625, -2.567352294921875, -2.48431396484375, -2.401275634765625, -2.3182373046875, -2.235198974609375, -2.15216064453125, -2.069122314453125, -1.986083984375, -1.903045654296875, -1.82000732421875, -1.736968994140625, -1.6539306640625, -1.570892333984375, -1.48785400390625, -1.404815673828125, -1.32177734375, -1.238739013671875, -1.15570068359375, -1.072662353515625, -0.9896240234375, -0.906585693359375, -0.82354736328125, -0.740509033203125, -0.657470703125, -0.574432373046875, -0.49139404296875, -0.408355712890625, -0.3253173828125, -0.242279052734375, -0.15924072265625, -0.076202392578125, 0.0068359375, 0.089874267578125, 0.17291259765625, 0.255950927734375, 0.3389892578125, 0.422027587890625, 0.50506591796875, 0.588104248046875, 0.671142578125, 0.754180908203125, 0.83721923828125, 0.920257568359375, 1.0032958984375, 1.086334228515625, 1.16937255859375, 1.252410888671875, 1.33544921875, 1.418487548828125, 1.50152587890625, 1.584564208984375, 1.6676025390625, 1.750640869140625, 1.83367919921875, 1.916717529296875, 1.999755859375, 2.082794189453125, 2.16583251953125, 2.248870849609375, 2.3319091796875, 2.414947509765625, 2.49798583984375, 2.581024169921875, 2.6640625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 4.0, 5.0, 3.0, 3.0, 11.0, 11.0, 12.0, 14.0, 30.0, 28.0, 56.0, 54.0, 61.0, 75.0, 73.0, 76.0, 95.0, 69.0, 77.0, 50.0, 47.0, 34.0, 27.0, 23.0, 22.0, 16.0, 6.0, 7.0, 6.0, 0.0, 0.0, 4.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.0546875, -2.0016326904296875, -1.948577880859375, -1.8955230712890625, -1.84246826171875, -1.7894134521484375, -1.736358642578125, -1.6833038330078125, -1.6302490234375, -1.5771942138671875, -1.524139404296875, -1.4710845947265625, -1.41802978515625, -1.3649749755859375, -1.311920166015625, -1.2588653564453125, -1.205810546875, -1.1527557373046875, -1.099700927734375, -1.0466461181640625, -0.99359130859375, -0.9405364990234375, -0.887481689453125, -0.8344268798828125, -0.7813720703125, -0.7283172607421875, -0.675262451171875, -0.6222076416015625, -0.56915283203125, -0.5160980224609375, -0.463043212890625, -0.4099884033203125, -0.35693359375, -0.3038787841796875, -0.250823974609375, -0.1977691650390625, -0.14471435546875, -0.0916595458984375, -0.038604736328125, 0.0144500732421875, 0.0675048828125, 0.1205596923828125, 0.173614501953125, 0.2266693115234375, 0.27972412109375, 0.3327789306640625, 0.385833740234375, 0.4388885498046875, 0.491943359375, 0.5449981689453125, 0.598052978515625, 0.6511077880859375, 0.70416259765625, 0.7572174072265625, 0.810272216796875, 0.8633270263671875, 0.9163818359375, 0.9694366455078125, 1.022491455078125, 1.0755462646484375, 1.12860107421875, 1.1816558837890625, 1.234710693359375, 1.2877655029296875, 1.3408203125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 6.0, 3.0, 9.0, 5.0, 5.0, 17.0, 26.0, 33.0, 40.0, 57.0, 99.0, 222.0, 519.0, 1493.0, 6759.0, 75777.0, 910371.0, 45830.0, 5121.0, 1224.0, 436.0, 207.0, 106.0, 68.0, 31.0, 24.0, 30.0, 14.0, 11.0, 5.0, 3.0, 2.0, 4.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2890625, -1.2466888427734375, -1.204315185546875, -1.1619415283203125, -1.11956787109375, -1.0771942138671875, -1.034820556640625, -0.9924468994140625, -0.9500732421875, -0.9076995849609375, -0.865325927734375, -0.8229522705078125, -0.78057861328125, -0.7382049560546875, -0.695831298828125, -0.6534576416015625, -0.611083984375, -0.5687103271484375, -0.526336669921875, -0.4839630126953125, -0.44158935546875, -0.3992156982421875, -0.356842041015625, -0.3144683837890625, -0.2720947265625, -0.2297210693359375, -0.187347412109375, -0.1449737548828125, -0.10260009765625, -0.0602264404296875, -0.017852783203125, 0.0245208740234375, 0.06689453125, 0.1092681884765625, 0.151641845703125, 0.1940155029296875, 0.23638916015625, 0.2787628173828125, 0.321136474609375, 0.3635101318359375, 0.4058837890625, 0.4482574462890625, 0.490631103515625, 0.5330047607421875, 0.57537841796875, 0.6177520751953125, 0.660125732421875, 0.7024993896484375, 0.744873046875, 0.7872467041015625, 0.829620361328125, 0.8719940185546875, 0.91436767578125, 0.9567413330078125, 0.999114990234375, 1.0414886474609375, 1.0838623046875, 1.1262359619140625, 1.168609619140625, 1.2109832763671875, 1.25335693359375, 1.2957305908203125, 1.338104248046875, 1.3804779052734375, 1.4228515625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 5.0, 5.0, 4.0, 8.0, 7.0, 27.0, 29.0, 52.0, 128.0, 227.0, 218.0, 128.0, 65.0, 39.0, 22.0, 10.0, 12.0, 5.0, 3.0, 3.0, 6.0, 1.0, 0.0, 1.0, 4.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00028896331787109375, -0.00028209760785102844, -0.00027523189783096313, -0.00026836618781089783, -0.0002615004777908325, -0.0002546347677707672, -0.0002477690577507019, -0.0002409033477306366, -0.0002340376377105713, -0.00022717192769050598, -0.00022030621767044067, -0.00021344050765037537, -0.00020657479763031006, -0.00019970908761024475, -0.00019284337759017944, -0.00018597766757011414, -0.00017911195755004883, -0.00017224624752998352, -0.0001653805375099182, -0.0001585148274898529, -0.0001516491174697876, -0.0001447834074497223, -0.00013791769742965698, -0.00013105198740959167, -0.00012418627738952637, -0.00011732056736946106, -0.00011045485734939575, -0.00010358914732933044, -9.672343730926514e-05, -8.985772728919983e-05, -8.299201726913452e-05, -7.612630724906921e-05, -6.92605972290039e-05, -6.23948872089386e-05, -5.552917718887329e-05, -4.8663467168807983e-05, -4.1797757148742676e-05, -3.493204712867737e-05, -2.806633710861206e-05, -2.1200627088546753e-05, -1.4334917068481445e-05, -7.469207048416138e-06, -6.034970283508301e-07, 6.2622129917144775e-06, 1.3127923011779785e-05, 1.9993633031845093e-05, 2.68593430519104e-05, 3.372505307197571e-05, 4.0590763092041016e-05, 4.745647311210632e-05, 5.432218313217163e-05, 6.118789315223694e-05, 6.805360317230225e-05, 7.491931319236755e-05, 8.178502321243286e-05, 8.865073323249817e-05, 9.551644325256348e-05, 0.00010238215327262878, 0.00010924786329269409, 0.0001161135733127594, 0.0001229792833328247, 0.00012984499335289001, 0.00013671070337295532, 0.00014357641339302063, 0.00015044212341308594]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 6.0, 3.0, 14.0, 20.0, 20.0, 44.0, 55.0, 92.0, 135.0, 250.0, 497.0, 969.0, 2216.0, 6218.0, 24411.0, 336534.0, 625741.0, 37940.0, 8163.0, 2749.0, 1182.0, 559.0, 277.0, 159.0, 94.0, 69.0, 47.0, 29.0, 20.0, 11.0, 9.0, 7.0, 5.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.826171875, -0.800445556640625, -0.77471923828125, -0.748992919921875, -0.7232666015625, -0.697540283203125, -0.67181396484375, -0.646087646484375, -0.620361328125, -0.594635009765625, -0.56890869140625, -0.543182373046875, -0.5174560546875, -0.491729736328125, -0.46600341796875, -0.440277099609375, -0.41455078125, -0.388824462890625, -0.36309814453125, -0.337371826171875, -0.3116455078125, -0.285919189453125, -0.26019287109375, -0.234466552734375, -0.208740234375, -0.183013916015625, -0.15728759765625, -0.131561279296875, -0.1058349609375, -0.080108642578125, -0.05438232421875, -0.028656005859375, -0.0029296875, 0.022796630859375, 0.04852294921875, 0.074249267578125, 0.0999755859375, 0.125701904296875, 0.15142822265625, 0.177154541015625, 0.202880859375, 0.228607177734375, 0.25433349609375, 0.280059814453125, 0.3057861328125, 0.331512451171875, 0.35723876953125, 0.382965087890625, 0.40869140625, 0.434417724609375, 0.46014404296875, 0.485870361328125, 0.5115966796875, 0.537322998046875, 0.56304931640625, 0.588775634765625, 0.614501953125, 0.640228271484375, 0.66595458984375, 0.691680908203125, 0.7174072265625, 0.743133544921875, 0.76885986328125, 0.794586181640625, 0.8203125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 5.0, 1.0, 2.0, 1.0, 1.0, 3.0, 7.0, 8.0, 9.0, 11.0, 24.0, 26.0, 52.0, 105.0, 138.0, 147.0, 139.0, 113.0, 81.0, 36.0, 28.0, 27.0, 13.0, 7.0, 9.0, 7.0, 4.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.429931640625, -0.4138526916503906, -0.39777374267578125, -0.3816947937011719, -0.3656158447265625, -0.3495368957519531, -0.33345794677734375, -0.3173789978027344, -0.301300048828125, -0.2852210998535156, -0.26914215087890625, -0.2530632019042969, -0.2369842529296875, -0.22090530395507812, -0.20482635498046875, -0.18874740600585938, -0.17266845703125, -0.15658950805664062, -0.14051055908203125, -0.12443161010742188, -0.1083526611328125, -0.09227371215820312, -0.07619476318359375, -0.060115814208984375, -0.044036865234375, -0.027957916259765625, -0.01187896728515625, 0.004199981689453125, 0.0202789306640625, 0.036357879638671875, 0.05243682861328125, 0.06851577758789062, 0.0845947265625, 0.10067367553710938, 0.11675262451171875, 0.13283157348632812, 0.1489105224609375, 0.16498947143554688, 0.18106842041015625, 0.19714736938476562, 0.213226318359375, 0.22930526733398438, 0.24538421630859375, 0.2614631652832031, 0.2775421142578125, 0.2936210632324219, 0.30970001220703125, 0.3257789611816406, 0.34185791015625, 0.3579368591308594, 0.37401580810546875, 0.3900947570800781, 0.4061737060546875, 0.4222526550292969, 0.43833160400390625, 0.4544105529785156, 0.470489501953125, 0.4865684509277344, 0.5026473999023438, 0.5187263488769531, 0.5348052978515625, 0.5508842468261719, 0.5669631958007812, 0.5830421447753906, 0.59912109375]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 6.0, 9.0, 13.0, 16.0, 27.0, 55.0, 117.0, 199.0, 244.0, 144.0, 88.0, 30.0, 27.0, 9.0, 13.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.304840087890625, -21.831836700439453, -21.35883331298828, -20.885831832885742, -20.41282844543457, -19.9398250579834, -19.466821670532227, -18.993820190429688, -18.520816802978516, -18.047813415527344, -17.574810028076172, -17.101808547973633, -16.62880516052246, -16.15580177307129, -15.682798385620117, -15.209795951843262, -14.73679256439209, -14.263789176940918, -13.790786743164062, -13.31778335571289, -12.844780921936035, -12.371777534484863, -11.898775100708008, -11.425771713256836, -10.952768325805664, -10.479764938354492, -10.006762504577637, -9.533759117126465, -9.06075668334961, -8.587753295898438, -8.114749908447266, -7.64174747467041, -7.1687445640563965, -6.695741653442383, -6.222738742828369, -5.7497358322143555, -5.276732444763184, -4.803730010986328, -4.330726623535156, -3.8577237129211426, -3.384720802307129, -2.9117178916931152, -2.4387149810791016, -1.9657118320465088, -1.4927089214324951, -1.0197060108184814, -0.5467028617858887, -0.073699951171875, 0.39930295944213867, 0.8723059296607971, 1.3453088998794556, 1.8183119297027588, 2.2913148403167725, 2.764317750930786, 3.237320899963379, 3.7103238105773926, 4.183326721191406, 4.65632963180542, 5.129332542419434, 5.6023359298706055, 6.075338363647461, 6.548341751098633, 7.0213446617126465, 7.49434757232666, 7.967350482940674]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 0.0, 8.0, 5.0, 8.0, 11.0, 14.0, 12.0, 9.0, 16.0, 25.0, 21.0, 16.0, 25.0, 33.0, 39.0, 49.0, 39.0, 56.0, 58.0, 44.0, 43.0, 46.0, 37.0, 43.0, 43.0, 44.0, 33.0, 36.0, 24.0, 21.0, 21.0, 24.0, 17.0, 15.0, 10.0, 9.0, 5.0, 11.0, 5.0, 7.0, 5.0, 6.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.693523406982422, -6.486822605133057, -6.280121803283691, -6.073421478271484, -5.866720676422119, -5.660019874572754, -5.453319072723389, -5.246618270874023, -5.039917945861816, -4.833217144012451, -4.626516342163086, -4.419816017150879, -4.213115215301514, -4.006414413452148, -3.799713611602783, -3.593012809753418, -3.3863120079040527, -3.1796112060546875, -2.9729106426239014, -2.766209840774536, -2.55950927734375, -2.3528084754943848, -2.1461076736450195, -1.9394069910049438, -1.7327063083648682, -1.5260056257247925, -1.3193049430847168, -1.1126041412353516, -0.9059034585952759, -0.6992027759552002, -0.49250197410583496, -0.2858012914657593, -0.0791006088256836, 0.12760010361671448, 0.33430081605911255, 0.541001558303833, 0.7477022409439087, 0.9544029235839844, 1.1611037254333496, 1.3678044080734253, 1.574505090713501, 1.7812057733535767, 1.9879064559936523, 2.1946072578430176, 2.401308059692383, 2.608008623123169, 2.814709424972534, 3.0214099884033203, 3.2281107902526855, 3.434811592102051, 3.641512155532837, 3.848212957382202, 4.054913520812988, 4.2616143226623535, 4.468315124511719, 4.675015926361084, 4.881716728210449, 5.0884175300598145, 5.29511833190918, 5.501818656921387, 5.708519458770752, 5.915220260620117, 6.121921062469482, 6.328621864318848, 6.535322189331055]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 4.0, 0.0, 7.0, 4.0, 8.0, 8.0, 11.0, 9.0, 15.0, 10.0, 27.0, 9.0, 24.0, 30.0, 16.0, 37.0, 29.0, 52.0, 67.0, 65.0, 80.0, 107.0, 159.0, 167.0, 287.0, 495.0, 1020.0, 2244.0, 5341.0, 14472.0, 47369.0, 3199365.0, 856167.0, 43284.0, 13549.0, 5231.0, 2198.0, 1087.0, 520.0, 305.0, 178.0, 94.0, 49.0, 28.0, 24.0, 12.0, 10.0, 8.0, 3.0, 2.0], "bins": [-4.203125, -4.111663818359375, -4.02020263671875, -3.928741455078125, -3.8372802734375, -3.745819091796875, -3.65435791015625, -3.562896728515625, -3.471435546875, -3.379974365234375, -3.28851318359375, -3.197052001953125, -3.1055908203125, -3.014129638671875, -2.92266845703125, -2.831207275390625, -2.73974609375, -2.648284912109375, -2.55682373046875, -2.465362548828125, -2.3739013671875, -2.282440185546875, -2.19097900390625, -2.099517822265625, -2.008056640625, -1.916595458984375, -1.82513427734375, -1.733673095703125, -1.6422119140625, -1.550750732421875, -1.45928955078125, -1.367828369140625, -1.2763671875, -1.184906005859375, -1.09344482421875, -1.001983642578125, -0.9105224609375, -0.819061279296875, -0.72760009765625, -0.636138916015625, -0.544677734375, -0.453216552734375, -0.36175537109375, -0.270294189453125, -0.1788330078125, -0.087371826171875, 0.00408935546875, 0.095550537109375, 0.18701171875, 0.278472900390625, 0.36993408203125, 0.461395263671875, 0.5528564453125, 0.644317626953125, 0.73577880859375, 0.827239990234375, 0.918701171875, 1.010162353515625, 1.10162353515625, 1.193084716796875, 1.2845458984375, 1.376007080078125, 1.46746826171875, 1.558929443359375, 1.650390625]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 5.0, 12.0, 16.0, 19.0, 51.0, 47.0, 52.0, 65.0, 68.0, 88.0, 95.0, 93.0, 73.0, 87.0, 57.0, 50.0, 41.0, 24.0, 20.0, 9.0, 12.0, 7.0, 7.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.56591796875, -0.5532703399658203, -0.5406227111816406, -0.5279750823974609, -0.5153274536132812, -0.5026798248291016, -0.4900321960449219, -0.4773845672607422, -0.4647369384765625, -0.4520893096923828, -0.4394416809082031, -0.42679405212402344, -0.41414642333984375, -0.40149879455566406, -0.3888511657714844, -0.3762035369873047, -0.363555908203125, -0.3509082794189453, -0.3382606506347656, -0.32561302185058594, -0.31296539306640625, -0.30031776428222656, -0.2876701354980469, -0.2750225067138672, -0.2623748779296875, -0.2497272491455078, -0.23707962036132812, -0.22443199157714844, -0.21178436279296875, -0.19913673400878906, -0.18648910522460938, -0.1738414764404297, -0.16119384765625, -0.1485462188720703, -0.13589859008789062, -0.12325096130371094, -0.11060333251953125, -0.09795570373535156, -0.08530807495117188, -0.07266044616699219, -0.0600128173828125, -0.04736518859863281, -0.034717559814453125, -0.022069931030273438, -0.00942230224609375, 0.0032253265380859375, 0.015872955322265625, 0.028520584106445312, 0.041168212890625, 0.05381584167480469, 0.06646347045898438, 0.07911109924316406, 0.09175872802734375, 0.10440635681152344, 0.11705398559570312, 0.1297016143798828, 0.1423492431640625, 0.1549968719482422, 0.16764450073242188, 0.18029212951660156, 0.19293975830078125, 0.20558738708496094, 0.21823501586914062, 0.2308826446533203, 0.2435302734375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 4.0, 2.0, 5.0, 3.0, 2.0, 8.0, 6.0, 11.0, 23.0, 23.0, 36.0, 49.0, 79.0, 99.0, 168.0, 240.0, 404.0, 702.0, 1157.0, 2233.0, 4828.0, 12857.0, 76150.0, 4006659.0, 67435.0, 11844.0, 4470.0, 2107.0, 1081.0, 565.0, 371.0, 229.0, 137.0, 98.0, 72.0, 36.0, 27.0, 17.0, 14.0, 13.0, 4.0, 5.0, 11.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-5.01171875, -4.857421875, -4.703125, -4.548828125, -4.39453125, -4.240234375, -4.0859375, -3.931640625, -3.77734375, -3.623046875, -3.46875, -3.314453125, -3.16015625, -3.005859375, -2.8515625, -2.697265625, -2.54296875, -2.388671875, -2.234375, -2.080078125, -1.92578125, -1.771484375, -1.6171875, -1.462890625, -1.30859375, -1.154296875, -1.0, -0.845703125, -0.69140625, -0.537109375, -0.3828125, -0.228515625, -0.07421875, 0.080078125, 0.234375, 0.388671875, 0.54296875, 0.697265625, 0.8515625, 1.005859375, 1.16015625, 1.314453125, 1.46875, 1.623046875, 1.77734375, 1.931640625, 2.0859375, 2.240234375, 2.39453125, 2.548828125, 2.703125, 2.857421875, 3.01171875, 3.166015625, 3.3203125, 3.474609375, 3.62890625, 3.783203125, 3.9375, 4.091796875, 4.24609375, 4.400390625, 4.5546875, 4.708984375, 4.86328125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 4.0, 8.0, 10.0, 5.0, 4.0, 22.0, 39.0, 68.0, 124.0, 1306.0, 2198.0, 149.0, 60.0, 33.0, 8.0, 12.0, 5.0, 3.0, 7.0, 6.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.099609375, -2.041351318359375, -1.98309326171875, -1.924835205078125, -1.8665771484375, -1.808319091796875, -1.75006103515625, -1.691802978515625, -1.633544921875, -1.575286865234375, -1.51702880859375, -1.458770751953125, -1.4005126953125, -1.342254638671875, -1.28399658203125, -1.225738525390625, -1.16748046875, -1.109222412109375, -1.05096435546875, -0.992706298828125, -0.9344482421875, -0.876190185546875, -0.81793212890625, -0.759674072265625, -0.701416015625, -0.643157958984375, -0.58489990234375, -0.526641845703125, -0.4683837890625, -0.410125732421875, -0.35186767578125, -0.293609619140625, -0.2353515625, -0.177093505859375, -0.11883544921875, -0.060577392578125, -0.0023193359375, 0.055938720703125, 0.11419677734375, 0.172454833984375, 0.230712890625, 0.288970947265625, 0.34722900390625, 0.405487060546875, 0.4637451171875, 0.522003173828125, 0.58026123046875, 0.638519287109375, 0.69677734375, 0.755035400390625, 0.81329345703125, 0.871551513671875, 0.9298095703125, 0.988067626953125, 1.04632568359375, 1.104583740234375, 1.162841796875, 1.221099853515625, 1.27935791015625, 1.337615966796875, 1.3958740234375, 1.454132080078125, 1.51239013671875, 1.570648193359375, 1.62890625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 6.0, 12.0, 27.0, 89.0, 435.0, 343.0, 68.0, 16.0, 8.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-28.378494262695312, -27.760772705078125, -27.14305305480957, -26.525331497192383, -25.907611846923828, -25.28989028930664, -24.672168731689453, -24.0544490814209, -23.43672752380371, -22.819005966186523, -22.20128631591797, -21.58356475830078, -20.965845108032227, -20.34812355041504, -19.730403900146484, -19.112682342529297, -18.49496078491211, -17.877239227294922, -17.259519577026367, -16.64179801940918, -16.024078369140625, -15.406356811523438, -14.788636207580566, -14.170915603637695, -13.55319595336914, -12.93547534942627, -12.317754745483398, -11.700033187866211, -11.08231258392334, -10.464591979980469, -9.846871376037598, -9.229150772094727, -8.611428260803223, -7.993707656860352, -7.375986576080322, -6.758265972137451, -6.140544891357422, -5.522824287414551, -4.90510368347168, -4.28738260269165, -3.6696619987487793, -3.051941156387329, -2.434220314025879, -1.8164997100830078, -1.1987788677215576, -0.5810580253601074, 0.03666257858276367, 0.654383659362793, 1.272104263305664, 1.8898251056671143, 2.5075459480285645, 3.1252665519714355, 3.7429873943328857, 4.360708236694336, 4.978428840637207, 5.596149921417236, 6.213870525360107, 6.8315911293029785, 7.449312210083008, 8.067032814025879, 8.68475341796875, 9.302474975585938, 9.920194625854492, 10.53791618347168, 11.15563678741455]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 9.0, 2.0, 18.0, 20.0, 33.0, 41.0, 85.0, 93.0, 105.0, 123.0, 111.0, 110.0, 73.0, 66.0, 47.0, 30.0, 15.0, 13.0, 10.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.202716827392578, -6.986385822296143, -6.770055294036865, -6.55372428894043, -6.337393760681152, -6.121062755584717, -5.904731750488281, -5.688401222229004, -5.472070217132568, -5.255739212036133, -5.0394086837768555, -4.82307767868042, -4.606746673583984, -4.390416145324707, -4.1740851402282715, -3.957754373550415, -3.7414236068725586, -3.525092840194702, -3.3087620735168457, -3.09243106842041, -2.8761003017425537, -2.6597695350646973, -2.4434385299682617, -2.2271077632904053, -2.010776996612549, -1.7944462299346924, -1.5781153440475464, -1.3617844581604004, -1.145453691482544, -0.9291229248046875, -0.7127920389175415, -0.4964611530303955, -0.28013038635253906, -0.06379956007003784, 0.15253126621246338, 0.3688620924949646, 0.5851929187774658, 0.8015236854553223, 1.0178545713424683, 1.2341854572296143, 1.4505162239074707, 1.6668469905853271, 1.8831778764724731, 2.099508762359619, 2.3158395290374756, 2.532170295715332, 2.7485013008117676, 2.964832067489624, 3.1811628341674805, 3.397493600845337, 3.6138243675231934, 3.830155372619629, 4.046485900878906, 4.262816905975342, 4.479147911071777, 4.695478439331055, 4.91180944442749, 5.128140449523926, 5.344470977783203, 5.560801982879639, 5.777132987976074, 5.993463516235352, 6.209794521331787, 6.426125526428223, 6.6424560546875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 6.0, 8.0, 7.0, 11.0, 15.0, 20.0, 32.0, 56.0, 79.0, 125.0, 183.0, 370.0, 769.0, 2216.0, 10553.0, 134396.0, 828552.0, 61342.0, 6778.0, 1663.0, 665.0, 276.0, 149.0, 93.0, 69.0, 29.0, 31.0, 19.0, 13.0, 8.0, 3.0, 6.0, 1.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.76953125, -3.6265869140625, -3.483642578125, -3.3406982421875, -3.19775390625, -3.0548095703125, -2.911865234375, -2.7689208984375, -2.6259765625, -2.4830322265625, -2.340087890625, -2.1971435546875, -2.05419921875, -1.9112548828125, -1.768310546875, -1.6253662109375, -1.482421875, -1.3394775390625, -1.196533203125, -1.0535888671875, -0.91064453125, -0.7677001953125, -0.624755859375, -0.4818115234375, -0.3388671875, -0.1959228515625, -0.052978515625, 0.0899658203125, 0.23291015625, 0.3758544921875, 0.518798828125, 0.6617431640625, 0.8046875, 0.9476318359375, 1.090576171875, 1.2335205078125, 1.37646484375, 1.5194091796875, 1.662353515625, 1.8052978515625, 1.9482421875, 2.0911865234375, 2.234130859375, 2.3770751953125, 2.52001953125, 2.6629638671875, 2.805908203125, 2.9488525390625, 3.091796875, 3.2347412109375, 3.377685546875, 3.5206298828125, 3.66357421875, 3.8065185546875, 3.949462890625, 4.0924072265625, 4.2353515625, 4.3782958984375, 4.521240234375, 4.6641845703125, 4.80712890625, 4.9500732421875, 5.093017578125, 5.2359619140625, 5.37890625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 11.0, 23.0, 37.0, 61.0, 92.0, 92.0, 103.0, 118.0, 111.0, 91.0, 91.0, 59.0, 44.0, 32.0, 14.0, 7.0, 9.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.79150390625, -0.7737846374511719, -0.7560653686523438, -0.7383460998535156, -0.7206268310546875, -0.7029075622558594, -0.6851882934570312, -0.6674690246582031, -0.649749755859375, -0.6320304870605469, -0.6143112182617188, -0.5965919494628906, -0.5788726806640625, -0.5611534118652344, -0.5434341430664062, -0.5257148742675781, -0.50799560546875, -0.4902763366699219, -0.47255706787109375, -0.4548377990722656, -0.4371185302734375, -0.4193992614746094, -0.40167999267578125, -0.3839607238769531, -0.366241455078125, -0.3485221862792969, -0.33080291748046875, -0.3130836486816406, -0.2953643798828125, -0.2776451110839844, -0.25992584228515625, -0.24220657348632812, -0.2244873046875, -0.20676803588867188, -0.18904876708984375, -0.17132949829101562, -0.1536102294921875, -0.13589096069335938, -0.11817169189453125, -0.10045242309570312, -0.082733154296875, -0.06501388549804688, -0.04729461669921875, -0.029575347900390625, -0.0118560791015625, 0.005863189697265625, 0.02358245849609375, 0.041301727294921875, 0.05902099609375, 0.07674026489257812, 0.09445953369140625, 0.11217880249023438, 0.1298980712890625, 0.14761734008789062, 0.16533660888671875, 0.18305587768554688, 0.200775146484375, 0.21849441528320312, 0.23621368408203125, 0.2539329528808594, 0.2716522216796875, 0.2893714904785156, 0.30709075927734375, 0.3248100280761719, 0.342529296875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 7.0, 10.0, 17.0, 8.0, 8.0, 23.0, 33.0, 34.0, 52.0, 67.0, 93.0, 161.0, 212.0, 324.0, 570.0, 924.0, 1722.0, 3127.0, 6167.0, 13445.0, 31025.0, 79355.0, 244842.0, 423402.0, 148603.0, 52287.0, 21480.0, 9897.0, 4780.0, 2393.0, 1329.0, 762.0, 458.0, 305.0, 193.0, 145.0, 84.0, 53.0, 40.0, 34.0, 18.0, 15.0, 18.0, 3.0, 7.0, 8.0, 4.0, 3.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.0224609375, -0.9907989501953125, -0.959136962890625, -0.9274749755859375, -0.89581298828125, -0.8641510009765625, -0.832489013671875, -0.8008270263671875, -0.7691650390625, -0.7375030517578125, -0.705841064453125, -0.6741790771484375, -0.64251708984375, -0.6108551025390625, -0.579193115234375, -0.5475311279296875, -0.515869140625, -0.4842071533203125, -0.452545166015625, -0.4208831787109375, -0.38922119140625, -0.3575592041015625, -0.325897216796875, -0.2942352294921875, -0.2625732421875, -0.2309112548828125, -0.199249267578125, -0.1675872802734375, -0.13592529296875, -0.1042633056640625, -0.072601318359375, -0.0409393310546875, -0.00927734375, 0.0223846435546875, 0.054046630859375, 0.0857086181640625, 0.11737060546875, 0.1490325927734375, 0.180694580078125, 0.2123565673828125, 0.2440185546875, 0.2756805419921875, 0.307342529296875, 0.3390045166015625, 0.37066650390625, 0.4023284912109375, 0.433990478515625, 0.4656524658203125, 0.497314453125, 0.5289764404296875, 0.560638427734375, 0.5923004150390625, 0.62396240234375, 0.6556243896484375, 0.687286376953125, 0.7189483642578125, 0.7506103515625, 0.7822723388671875, 0.813934326171875, 0.8455963134765625, 0.87725830078125, 0.9089202880859375, 0.940582275390625, 0.9722442626953125, 1.00390625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 4.0, 1.0, 4.0, 6.0, 5.0, 6.0, 5.0, 12.0, 11.0, 20.0, 16.0, 18.0, 24.0, 45.0, 23.0, 43.0, 40.0, 32.0, 48.0, 46.0, 54.0, 62.0, 58.0, 43.0, 48.0, 49.0, 39.0, 35.0, 37.0, 26.0, 30.0, 25.0, 22.0, 14.0, 8.0, 12.0, 11.0, 7.0, 6.0, 4.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.150390625, -1.1157379150390625, -1.081085205078125, -1.0464324951171875, -1.01177978515625, -0.9771270751953125, -0.942474365234375, -0.9078216552734375, -0.8731689453125, -0.8385162353515625, -0.803863525390625, -0.7692108154296875, -0.73455810546875, -0.6999053955078125, -0.665252685546875, -0.6305999755859375, -0.595947265625, -0.5612945556640625, -0.526641845703125, -0.4919891357421875, -0.45733642578125, -0.4226837158203125, -0.388031005859375, -0.3533782958984375, -0.3187255859375, -0.2840728759765625, -0.249420166015625, -0.2147674560546875, -0.18011474609375, -0.1454620361328125, -0.110809326171875, -0.0761566162109375, -0.04150390625, -0.0068511962890625, 0.027801513671875, 0.0624542236328125, 0.09710693359375, 0.1317596435546875, 0.166412353515625, 0.2010650634765625, 0.2357177734375, 0.2703704833984375, 0.305023193359375, 0.3396759033203125, 0.37432861328125, 0.4089813232421875, 0.443634033203125, 0.4782867431640625, 0.512939453125, 0.5475921630859375, 0.582244873046875, 0.6168975830078125, 0.65155029296875, 0.6862030029296875, 0.720855712890625, 0.7555084228515625, 0.7901611328125, 0.8248138427734375, 0.859466552734375, 0.8941192626953125, 0.92877197265625, 0.9634246826171875, 0.998077392578125, 1.0327301025390625, 1.0673828125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 4.0, 0.0, 9.0, 6.0, 7.0, 12.0, 8.0, 17.0, 24.0, 34.0, 49.0, 66.0, 109.0, 152.0, 233.0, 356.0, 601.0, 1038.0, 1856.0, 3809.0, 8621.0, 24794.0, 110719.0, 618502.0, 217349.0, 38094.0, 11808.0, 4764.0, 2266.0, 1246.0, 692.0, 437.0, 270.0, 178.0, 145.0, 82.0, 63.0, 42.0, 25.0, 17.0, 15.0, 10.0, 7.0, 9.0, 8.0, 1.0, 3.0, 1.0, 3.0, 1.0, 3.0, 1.0], "bins": [-0.83349609375, -0.8101272583007812, -0.7867584228515625, -0.7633895874023438, -0.740020751953125, -0.7166519165039062, -0.6932830810546875, -0.6699142456054688, -0.64654541015625, -0.6231765747070312, -0.5998077392578125, -0.5764389038085938, -0.553070068359375, -0.5297012329101562, -0.5063323974609375, -0.48296356201171875, -0.4595947265625, -0.43622589111328125, -0.4128570556640625, -0.38948822021484375, -0.366119384765625, -0.34275054931640625, -0.3193817138671875, -0.29601287841796875, -0.27264404296875, -0.24927520751953125, -0.2259063720703125, -0.20253753662109375, -0.179168701171875, -0.15579986572265625, -0.1324310302734375, -0.10906219482421875, -0.085693359375, -0.06232452392578125, -0.0389556884765625, -0.01558685302734375, 0.007781982421875, 0.03115081787109375, 0.0545196533203125, 0.07788848876953125, 0.10125732421875, 0.12462615966796875, 0.1479949951171875, 0.17136383056640625, 0.194732666015625, 0.21810150146484375, 0.2414703369140625, 0.26483917236328125, 0.2882080078125, 0.31157684326171875, 0.3349456787109375, 0.35831451416015625, 0.381683349609375, 0.40505218505859375, 0.4284210205078125, 0.45178985595703125, 0.47515869140625, 0.49852752685546875, 0.5218963623046875, 0.5452651977539062, 0.568634033203125, 0.5920028686523438, 0.6153717041015625, 0.6387405395507812, 0.662109375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 5.0, 4.0, 9.0, 6.0, 8.0, 11.0, 14.0, 23.0, 31.0, 27.0, 49.0, 90.0, 88.0, 126.0, 131.0, 100.0, 65.0, 52.0, 44.0, 26.0, 19.0, 16.0, 16.0, 8.0, 7.0, 2.0, 3.0, 7.0, 5.0, 0.0, 2.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011175870895385742, -0.00010744575411081314, -0.00010313279926776886, -9.881984442472458e-05, -9.45068895816803e-05, -9.019393473863602e-05, -8.588097989559174e-05, -8.156802505254745e-05, -7.725507020950317e-05, -7.294211536645889e-05, -6.862916052341461e-05, -6.431620568037033e-05, -6.000325083732605e-05, -5.569029599428177e-05, -5.137734115123749e-05, -4.706438630819321e-05, -4.2751431465148926e-05, -3.8438476622104645e-05, -3.4125521779060364e-05, -2.9812566936016083e-05, -2.5499612092971802e-05, -2.118665724992752e-05, -1.687370240688324e-05, -1.2560747563838959e-05, -8.247792720794678e-06, -3.934837877750397e-06, 3.781169652938843e-07, 4.691071808338165e-06, 9.004026651382446e-06, 1.3316981494426727e-05, 1.7629936337471008e-05, 2.194289118051529e-05, 2.625584602355957e-05, 3.056880086660385e-05, 3.488175570964813e-05, 3.919471055269241e-05, 4.3507665395736694e-05, 4.7820620238780975e-05, 5.2133575081825256e-05, 5.644652992486954e-05, 6.075948476791382e-05, 6.50724396109581e-05, 6.938539445400238e-05, 7.369834929704666e-05, 7.801130414009094e-05, 8.232425898313522e-05, 8.66372138261795e-05, 9.095016866922379e-05, 9.526312351226807e-05, 9.957607835531235e-05, 0.00010388903319835663, 0.00010820198804140091, 0.00011251494288444519, 0.00011682789772748947, 0.00012114085257053375, 0.00012545380741357803, 0.00012976676225662231, 0.0001340797170996666, 0.00013839267194271088, 0.00014270562678575516, 0.00014701858162879944, 0.00015133153647184372, 0.000155644491314888, 0.00015995744615793228, 0.00016427040100097656]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 5.0, 5.0, 5.0, 11.0, 9.0, 17.0, 24.0, 29.0, 48.0, 73.0, 114.0, 158.0, 267.0, 423.0, 676.0, 1258.0, 2597.0, 5594.0, 14567.0, 49572.0, 299681.0, 548479.0, 88109.0, 21721.0, 7752.0, 3369.0, 1722.0, 886.0, 484.0, 320.0, 193.0, 140.0, 71.0, 54.0, 25.0, 29.0, 21.0, 19.0, 11.0, 7.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.64404296875, -0.6233901977539062, -0.6027374267578125, -0.5820846557617188, -0.561431884765625, -0.5407791137695312, -0.5201263427734375, -0.49947357177734375, -0.47882080078125, -0.45816802978515625, -0.4375152587890625, -0.41686248779296875, -0.396209716796875, -0.37555694580078125, -0.3549041748046875, -0.33425140380859375, -0.3135986328125, -0.29294586181640625, -0.2722930908203125, -0.25164031982421875, -0.230987548828125, -0.21033477783203125, -0.1896820068359375, -0.16902923583984375, -0.14837646484375, -0.12772369384765625, -0.1070709228515625, -0.08641815185546875, -0.065765380859375, -0.04511260986328125, -0.0244598388671875, -0.00380706787109375, 0.016845703125, 0.03749847412109375, 0.0581512451171875, 0.07880401611328125, 0.099456787109375, 0.12010955810546875, 0.1407623291015625, 0.16141510009765625, 0.18206787109375, 0.20272064208984375, 0.2233734130859375, 0.24402618408203125, 0.264678955078125, 0.28533172607421875, 0.3059844970703125, 0.32663726806640625, 0.3472900390625, 0.36794281005859375, 0.3885955810546875, 0.40924835205078125, 0.429901123046875, 0.45055389404296875, 0.4712066650390625, 0.49185943603515625, 0.51251220703125, 0.5331649780273438, 0.5538177490234375, 0.5744705200195312, 0.595123291015625, 0.6157760620117188, 0.6364288330078125, 0.6570816040039062, 0.677734375]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 3.0, 2.0, 4.0, 7.0, 14.0, 8.0, 15.0, 33.0, 32.0, 44.0, 57.0, 86.0, 102.0, 117.0, 105.0, 113.0, 75.0, 49.0, 36.0, 29.0, 24.0, 16.0, 8.0, 8.0, 10.0, 2.0, 1.0, 2.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51171875, -0.49456024169921875, -0.4774017333984375, -0.46024322509765625, -0.443084716796875, -0.42592620849609375, -0.4087677001953125, -0.39160919189453125, -0.37445068359375, -0.35729217529296875, -0.3401336669921875, -0.32297515869140625, -0.305816650390625, -0.28865814208984375, -0.2714996337890625, -0.25434112548828125, -0.2371826171875, -0.22002410888671875, -0.2028656005859375, -0.18570709228515625, -0.168548583984375, -0.15139007568359375, -0.1342315673828125, -0.11707305908203125, -0.09991455078125, -0.08275604248046875, -0.0655975341796875, -0.04843902587890625, -0.031280517578125, -0.01412200927734375, 0.0030364990234375, 0.02019500732421875, 0.037353515625, 0.05451202392578125, 0.0716705322265625, 0.08882904052734375, 0.105987548828125, 0.12314605712890625, 0.1403045654296875, 0.15746307373046875, 0.17462158203125, 0.19178009033203125, 0.2089385986328125, 0.22609710693359375, 0.243255615234375, 0.26041412353515625, 0.2775726318359375, 0.29473114013671875, 0.3118896484375, 0.32904815673828125, 0.3462066650390625, 0.36336517333984375, 0.380523681640625, 0.39768218994140625, 0.4148406982421875, 0.43199920654296875, 0.44915771484375, 0.46631622314453125, 0.4834747314453125, 0.5006332397460938, 0.517791748046875, 0.5349502563476562, 0.5521087646484375, 0.5692672729492188, 0.58642578125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 2.0, 4.0, 4.0, 7.0, 12.0, 23.0, 23.0, 44.0, 71.0, 85.0, 132.0, 129.0, 113.0, 86.0, 82.0, 46.0, 44.0, 32.0, 12.0, 18.0, 12.0, 8.0, 3.0, 3.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-8.693008422851562, -8.44550895690918, -8.198009490966797, -7.950510025024414, -7.703010559082031, -7.455511093139648, -7.208011627197266, -6.960512161254883, -6.7130126953125, -6.465513229370117, -6.218013763427734, -5.970514297485352, -5.723014831542969, -5.475515365600586, -5.228015899658203, -4.98051643371582, -4.733017444610596, -4.485517978668213, -4.23801851272583, -3.9905190467834473, -3.7430195808410645, -3.4955201148986816, -3.248020887374878, -3.000521421432495, -2.7530219554901123, -2.5055224895477295, -2.2580230236053467, -2.010523796081543, -1.7630242109298706, -1.5155247449874878, -1.2680253982543945, -1.0205259323120117, -0.7730264663696289, -0.5255270004272461, -0.27802759408950806, -0.03052818775177002, 0.2169712781906128, 0.4644707441329956, 0.7119700908660889, 0.9594695568084717, 1.2069690227508545, 1.4544684886932373, 1.7019679546356201, 1.9494673013687134, 2.1969666481018066, 2.4444661140441895, 2.6919655799865723, 2.939465045928955, 3.186964511871338, 3.4344639778137207, 3.6819634437561035, 3.9294629096984863, 4.176962375640869, 4.424461841583252, 4.671960830688477, 4.919460296630859, 5.166959762573242, 5.414459228515625, 5.661958694458008, 5.909458160400391, 6.156957626342773, 6.404457092285156, 6.651956558227539, 6.899456024169922, 7.146955490112305]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 7.0, 7.0, 2.0, 9.0, 14.0, 12.0, 14.0, 19.0, 19.0, 15.0, 32.0, 26.0, 24.0, 32.0, 34.0, 41.0, 35.0, 42.0, 54.0, 53.0, 58.0, 43.0, 38.0, 36.0, 38.0, 44.0, 31.0, 35.0, 22.0, 27.0, 20.0, 23.0, 20.0, 11.0, 10.0, 14.0, 11.0, 6.0, 6.0, 9.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-7.06458044052124, -6.861997604370117, -6.659415245056152, -6.456832408905029, -6.254249572753906, -6.051667213439941, -5.849084377288818, -5.646501541137695, -5.4439191818237305, -5.241336345672607, -5.038753986358643, -4.8361711502075195, -4.633588790893555, -4.431005954742432, -4.228423118591309, -4.025840759277344, -3.8232579231262207, -3.6206753253936768, -3.418092727661133, -3.2155098915100098, -3.012927293777466, -2.810344696044922, -2.607761859893799, -2.405179262161255, -2.202596664428711, -2.000014066696167, -1.7974313497543335, -1.5948486328125, -1.392266035079956, -1.189683437347412, -0.9871007204055786, -0.7845180034637451, -0.581934928894043, -0.37935227155685425, -0.17676961421966553, 0.025813043117523193, 0.22839570045471191, 0.43097829818725586, 0.6335610151290894, 0.8361437320709229, 1.0387263298034668, 1.2413089275360107, 1.4438916444778442, 1.6464743614196777, 1.8490569591522217, 2.0516395568847656, 2.2542223930358887, 2.4568049907684326, 2.6593875885009766, 2.8619701862335205, 3.0645527839660645, 3.2671356201171875, 3.4697182178497314, 3.6723008155822754, 3.8748836517333984, 4.077466011047363, 4.280048847198486, 4.482631683349609, 4.685214042663574, 4.887796878814697, 5.09037971496582, 5.292962074279785, 5.495544910430908, 5.698127746582031, 5.900710105895996]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 5.0, 9.0, 12.0, 8.0, 13.0, 7.0, 23.0, 13.0, 30.0, 46.0, 51.0, 81.0, 107.0, 192.0, 480.0, 1601.0, 7207.0, 103930.0, 4061533.0, 14689.0, 2761.0, 817.0, 310.0, 146.0, 90.0, 53.0, 27.0, 15.0, 11.0, 4.0, 7.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.37890625, -7.208038330078125, -7.03717041015625, -6.866302490234375, -6.6954345703125, -6.524566650390625, -6.35369873046875, -6.182830810546875, -6.011962890625, -5.841094970703125, -5.67022705078125, -5.499359130859375, -5.3284912109375, -5.157623291015625, -4.98675537109375, -4.815887451171875, -4.64501953125, -4.474151611328125, -4.30328369140625, -4.132415771484375, -3.9615478515625, -3.790679931640625, -3.61981201171875, -3.448944091796875, -3.278076171875, -3.107208251953125, -2.93634033203125, -2.765472412109375, -2.5946044921875, -2.423736572265625, -2.25286865234375, -2.082000732421875, -1.9111328125, -1.740264892578125, -1.56939697265625, -1.398529052734375, -1.2276611328125, -1.056793212890625, -0.88592529296875, -0.715057373046875, -0.544189453125, -0.373321533203125, -0.20245361328125, -0.031585693359375, 0.1392822265625, 0.310150146484375, 0.48101806640625, 0.651885986328125, 0.82275390625, 0.993621826171875, 1.16448974609375, 1.335357666015625, 1.5062255859375, 1.677093505859375, 1.84796142578125, 2.018829345703125, 2.189697265625, 2.360565185546875, 2.53143310546875, 2.702301025390625, 2.8731689453125, 3.044036865234375, 3.21490478515625, 3.385772705078125, 3.556640625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 10.0, 10.0, 19.0, 25.0, 34.0, 56.0, 71.0, 85.0, 90.0, 99.0, 90.0, 86.0, 98.0, 73.0, 47.0, 42.0, 34.0, 18.0, 5.0, 5.0, 4.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.73876953125, -0.7215843200683594, -0.7043991088867188, -0.6872138977050781, -0.6700286865234375, -0.6528434753417969, -0.6356582641601562, -0.6184730529785156, -0.601287841796875, -0.5841026306152344, -0.5669174194335938, -0.5497322082519531, -0.5325469970703125, -0.5153617858886719, -0.49817657470703125, -0.4809913635253906, -0.46380615234375, -0.4466209411621094, -0.42943572998046875, -0.4122505187988281, -0.3950653076171875, -0.3778800964355469, -0.36069488525390625, -0.3435096740722656, -0.326324462890625, -0.3091392517089844, -0.29195404052734375, -0.2747688293457031, -0.2575836181640625, -0.24039840698242188, -0.22321319580078125, -0.20602798461914062, -0.1888427734375, -0.17165756225585938, -0.15447235107421875, -0.13728713989257812, -0.1201019287109375, -0.10291671752929688, -0.08573150634765625, -0.06854629516601562, -0.051361083984375, -0.034175872802734375, -0.01699066162109375, 0.000194549560546875, 0.0173797607421875, 0.034564971923828125, 0.05175018310546875, 0.06893539428710938, 0.08612060546875, 0.10330581665039062, 0.12049102783203125, 0.13767623901367188, 0.1548614501953125, 0.17204666137695312, 0.18923187255859375, 0.20641708374023438, 0.223602294921875, 0.24078750610351562, 0.25797271728515625, 0.2751579284667969, 0.2923431396484375, 0.3095283508300781, 0.32671356201171875, 0.3438987731933594, 0.361083984375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 8.0, 6.0, 5.0, 9.0, 11.0, 4.0, 17.0, 28.0, 17.0, 32.0, 37.0, 44.0, 49.0, 113.0, 223.0, 538.0, 1502.0, 5442.0, 37614.0, 4065077.0, 72334.0, 7915.0, 1980.0, 623.0, 264.0, 121.0, 73.0, 44.0, 27.0, 33.0, 25.0, 26.0, 7.0, 5.0, 10.0, 9.0, 4.0, 6.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.416015625, -3.296600341796875, -3.17718505859375, -3.057769775390625, -2.9383544921875, -2.818939208984375, -2.69952392578125, -2.580108642578125, -2.460693359375, -2.341278076171875, -2.22186279296875, -2.102447509765625, -1.9830322265625, -1.863616943359375, -1.74420166015625, -1.624786376953125, -1.50537109375, -1.385955810546875, -1.26654052734375, -1.147125244140625, -1.0277099609375, -0.908294677734375, -0.78887939453125, -0.669464111328125, -0.550048828125, -0.430633544921875, -0.31121826171875, -0.191802978515625, -0.0723876953125, 0.047027587890625, 0.16644287109375, 0.285858154296875, 0.4052734375, 0.524688720703125, 0.64410400390625, 0.763519287109375, 0.8829345703125, 1.002349853515625, 1.12176513671875, 1.241180419921875, 1.360595703125, 1.480010986328125, 1.59942626953125, 1.718841552734375, 1.8382568359375, 1.957672119140625, 2.07708740234375, 2.196502685546875, 2.31591796875, 2.435333251953125, 2.55474853515625, 2.674163818359375, 2.7935791015625, 2.912994384765625, 3.03240966796875, 3.151824951171875, 3.271240234375, 3.390655517578125, 3.51007080078125, 3.629486083984375, 3.7489013671875, 3.868316650390625, 3.98773193359375, 4.107147216796875, 4.2265625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 4.0, 6.0, 9.0, 6.0, 23.0, 40.0, 89.0, 359.0, 3048.0, 312.0, 85.0, 37.0, 22.0, 8.0, 11.0, 10.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.5244140625, -1.492279052734375, -1.46014404296875, -1.428009033203125, -1.3958740234375, -1.363739013671875, -1.33160400390625, -1.299468994140625, -1.267333984375, -1.235198974609375, -1.20306396484375, -1.170928955078125, -1.1387939453125, -1.106658935546875, -1.07452392578125, -1.042388916015625, -1.01025390625, -0.978118896484375, -0.94598388671875, -0.913848876953125, -0.8817138671875, -0.849578857421875, -0.81744384765625, -0.785308837890625, -0.753173828125, -0.721038818359375, -0.68890380859375, -0.656768798828125, -0.6246337890625, -0.592498779296875, -0.56036376953125, -0.528228759765625, -0.49609375, -0.463958740234375, -0.43182373046875, -0.399688720703125, -0.3675537109375, -0.335418701171875, -0.30328369140625, -0.271148681640625, -0.239013671875, -0.206878662109375, -0.17474365234375, -0.142608642578125, -0.1104736328125, -0.078338623046875, -0.04620361328125, -0.014068603515625, 0.01806640625, 0.050201416015625, 0.08233642578125, 0.114471435546875, 0.1466064453125, 0.178741455078125, 0.21087646484375, 0.243011474609375, 0.275146484375, 0.307281494140625, 0.33941650390625, 0.371551513671875, 0.4036865234375, 0.435821533203125, 0.46795654296875, 0.500091552734375, 0.5322265625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 5.0, 10.0, 19.0, 54.0, 169.0, 338.0, 233.0, 98.0, 42.0, 15.0, 8.0, 7.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.128536224365234, -5.928487777709961, -5.7284393310546875, -5.528390884399414, -5.328342437744141, -5.128293991088867, -4.928245544433594, -4.72819709777832, -4.528148651123047, -4.328100204467773, -4.1280517578125, -3.9280033111572266, -3.727954864501953, -3.5279064178466797, -3.3278579711914062, -3.127809524536133, -2.9277610778808594, -2.727712631225586, -2.5276641845703125, -2.327615737915039, -2.1275672912597656, -1.9275188446044922, -1.7274703979492188, -1.5274219512939453, -1.3273735046386719, -1.1273250579833984, -0.927276611328125, -0.7272281646728516, -0.5271797180175781, -0.3271312713623047, -0.12708282470703125, 0.07296562194824219, 0.2730135917663574, 0.47306203842163086, 0.6731104850769043, 0.8731589317321777, 1.0732073783874512, 1.2732558250427246, 1.473304271697998, 1.6733527183532715, 1.873401165008545, 2.0734496116638184, 2.273498058319092, 2.4735465049743652, 2.6735949516296387, 2.873643398284912, 3.0736918449401855, 3.273740291595459, 3.4737887382507324, 3.673837184906006, 3.8738856315612793, 4.073934078216553, 4.273982524871826, 4.4740309715271, 4.674079418182373, 4.8741278648376465, 5.07417631149292, 5.274224758148193, 5.474273204803467, 5.67432165145874, 5.874370098114014, 6.074418544769287, 6.2744669914245605, 6.474515438079834, 6.674563884735107]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 7.0, 10.0, 17.0, 12.0, 24.0, 35.0, 37.0, 55.0, 66.0, 73.0, 86.0, 106.0, 87.0, 86.0, 66.0, 64.0, 44.0, 48.0, 26.0, 20.0, 19.0, 8.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3855605125427246, -3.293560266494751, -3.2015600204467773, -3.1095597743988037, -3.01755952835083, -2.9255592823028564, -2.833559036254883, -2.7415590286254883, -2.6495585441589355, -2.557558298110962, -2.4655580520629883, -2.3735578060150146, -2.281557559967041, -2.1895573139190674, -2.0975570678710938, -2.005557060241699, -1.9135568141937256, -1.821556568145752, -1.7295563220977783, -1.6375560760498047, -1.545555830001831, -1.4535555839538574, -1.3615554571151733, -1.2695552110671997, -1.177554965019226, -1.0855547189712524, -0.9935544729232788, -0.90155428647995, -0.8095540404319763, -0.7175537943840027, -0.6255536079406738, -0.5335533618927002, -0.44155287742614746, -0.34955263137817383, -0.2575524151325226, -0.16555219888687134, -0.0735519528388977, 0.018448293209075928, 0.11044847965240479, 0.20244872570037842, 0.29444897174835205, 0.3864492177963257, 0.47844943404197693, 0.5704496502876282, 0.6624498963356018, 0.7544501423835754, 0.8464503288269043, 0.9384505748748779, 1.0304508209228516, 1.1224510669708252, 1.2144513130187988, 1.3064515590667725, 1.398451805114746, 1.4904520511627197, 1.5824521780014038, 1.6744524240493774, 1.766452670097351, 1.8584529161453247, 1.9504531621932983, 2.0424532890319824, 2.134453535079956, 2.2264537811279297, 2.3184540271759033, 2.410454273223877, 2.5024545192718506]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 6.0, 7.0, 5.0, 4.0, 10.0, 17.0, 22.0, 19.0, 24.0, 53.0, 66.0, 81.0, 144.0, 213.0, 349.0, 645.0, 1689.0, 5877.0, 31375.0, 312370.0, 625507.0, 56514.0, 9208.0, 2305.0, 874.0, 426.0, 246.0, 147.0, 107.0, 76.0, 35.0, 41.0, 22.0, 17.0, 12.0, 12.0, 6.0, 11.0, 3.0, 4.0, 5.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.162109375, -3.057220458984375, -2.95233154296875, -2.847442626953125, -2.7425537109375, -2.637664794921875, -2.53277587890625, -2.427886962890625, -2.322998046875, -2.218109130859375, -2.11322021484375, -2.008331298828125, -1.9034423828125, -1.798553466796875, -1.69366455078125, -1.588775634765625, -1.48388671875, -1.378997802734375, -1.27410888671875, -1.169219970703125, -1.0643310546875, -0.959442138671875, -0.85455322265625, -0.749664306640625, -0.644775390625, -0.539886474609375, -0.43499755859375, -0.330108642578125, -0.2252197265625, -0.120330810546875, -0.01544189453125, 0.089447021484375, 0.1943359375, 0.299224853515625, 0.40411376953125, 0.509002685546875, 0.6138916015625, 0.718780517578125, 0.82366943359375, 0.928558349609375, 1.033447265625, 1.138336181640625, 1.24322509765625, 1.348114013671875, 1.4530029296875, 1.557891845703125, 1.66278076171875, 1.767669677734375, 1.87255859375, 1.977447509765625, 2.08233642578125, 2.187225341796875, 2.2921142578125, 2.397003173828125, 2.50189208984375, 2.606781005859375, 2.711669921875, 2.816558837890625, 2.92144775390625, 3.026336669921875, 3.1312255859375, 3.236114501953125, 3.34100341796875, 3.445892333984375, 3.55078125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 9.0, 13.0, 15.0, 24.0, 44.0, 66.0, 68.0, 85.0, 92.0, 117.0, 110.0, 76.0, 83.0, 71.0, 55.0, 33.0, 20.0, 9.0, 8.0, 2.0, 1.0, 5.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.763671875, -0.7457542419433594, -0.7278366088867188, -0.7099189758300781, -0.6920013427734375, -0.6740837097167969, -0.6561660766601562, -0.6382484436035156, -0.620330810546875, -0.6024131774902344, -0.5844955444335938, -0.5665779113769531, -0.5486602783203125, -0.5307426452636719, -0.5128250122070312, -0.4949073791503906, -0.47698974609375, -0.4590721130371094, -0.44115447998046875, -0.4232368469238281, -0.4053192138671875, -0.3874015808105469, -0.36948394775390625, -0.3515663146972656, -0.333648681640625, -0.3157310485839844, -0.29781341552734375, -0.2798957824707031, -0.2619781494140625, -0.24406051635742188, -0.22614288330078125, -0.20822525024414062, -0.1903076171875, -0.17238998413085938, -0.15447235107421875, -0.13655471801757812, -0.1186370849609375, -0.10071945190429688, -0.08280181884765625, -0.06488418579101562, -0.046966552734375, -0.029048919677734375, -0.01113128662109375, 0.006786346435546875, 0.0247039794921875, 0.042621612548828125, 0.06053924560546875, 0.07845687866210938, 0.09637451171875, 0.11429214477539062, 0.13220977783203125, 0.15012741088867188, 0.1680450439453125, 0.18596267700195312, 0.20388031005859375, 0.22179794311523438, 0.239715576171875, 0.2576332092285156, 0.27555084228515625, 0.2934684753417969, 0.3113861083984375, 0.3293037414550781, 0.34722137451171875, 0.3651390075683594, 0.383056640625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 6.0, 8.0, 14.0, 13.0, 21.0, 23.0, 35.0, 34.0, 63.0, 86.0, 129.0, 182.0, 272.0, 427.0, 688.0, 1063.0, 1836.0, 3225.0, 5861.0, 11150.0, 22766.0, 49828.0, 116340.0, 303129.0, 312464.0, 119149.0, 50632.0, 23547.0, 11446.0, 6037.0, 3204.0, 1808.0, 1092.0, 662.0, 444.0, 266.0, 191.0, 124.0, 75.0, 60.0, 46.0, 31.0, 21.0, 14.0, 19.0, 6.0, 10.0, 6.0, 0.0, 6.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.845703125, -0.8184356689453125, -0.791168212890625, -0.7639007568359375, -0.73663330078125, -0.7093658447265625, -0.682098388671875, -0.6548309326171875, -0.6275634765625, -0.6002960205078125, -0.573028564453125, -0.5457611083984375, -0.51849365234375, -0.4912261962890625, -0.463958740234375, -0.4366912841796875, -0.409423828125, -0.3821563720703125, -0.354888916015625, -0.3276214599609375, -0.30035400390625, -0.2730865478515625, -0.245819091796875, -0.2185516357421875, -0.1912841796875, -0.1640167236328125, -0.136749267578125, -0.1094818115234375, -0.08221435546875, -0.0549468994140625, -0.027679443359375, -0.0004119873046875, 0.02685546875, 0.0541229248046875, 0.081390380859375, 0.1086578369140625, 0.13592529296875, 0.1631927490234375, 0.190460205078125, 0.2177276611328125, 0.2449951171875, 0.2722625732421875, 0.299530029296875, 0.3267974853515625, 0.35406494140625, 0.3813323974609375, 0.408599853515625, 0.4358673095703125, 0.463134765625, 0.4904022216796875, 0.517669677734375, 0.5449371337890625, 0.57220458984375, 0.5994720458984375, 0.626739501953125, 0.6540069580078125, 0.6812744140625, 0.7085418701171875, 0.735809326171875, 0.7630767822265625, 0.79034423828125, 0.8176116943359375, 0.844879150390625, 0.8721466064453125, 0.8994140625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 2.0, 7.0, 9.0, 9.0, 10.0, 12.0, 10.0, 24.0, 21.0, 17.0, 23.0, 20.0, 38.0, 37.0, 43.0, 37.0, 46.0, 43.0, 49.0, 55.0, 55.0, 26.0, 36.0, 40.0, 40.0, 35.0, 40.0, 31.0, 24.0, 21.0, 25.0, 22.0, 13.0, 15.0, 12.0, 16.0, 9.0, 8.0, 6.0, 6.0, 4.0, 3.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0107421875, -0.9776763916015625, -0.944610595703125, -0.9115447998046875, -0.87847900390625, -0.8454132080078125, -0.812347412109375, -0.7792816162109375, -0.7462158203125, -0.7131500244140625, -0.680084228515625, -0.6470184326171875, -0.61395263671875, -0.5808868408203125, -0.547821044921875, -0.5147552490234375, -0.481689453125, -0.4486236572265625, -0.415557861328125, -0.3824920654296875, -0.34942626953125, -0.3163604736328125, -0.283294677734375, -0.2502288818359375, -0.2171630859375, -0.1840972900390625, -0.151031494140625, -0.1179656982421875, -0.08489990234375, -0.0518341064453125, -0.018768310546875, 0.0142974853515625, 0.04736328125, 0.0804290771484375, 0.113494873046875, 0.1465606689453125, 0.17962646484375, 0.2126922607421875, 0.245758056640625, 0.2788238525390625, 0.3118896484375, 0.3449554443359375, 0.378021240234375, 0.4110870361328125, 0.44415283203125, 0.4772186279296875, 0.510284423828125, 0.5433502197265625, 0.576416015625, 0.6094818115234375, 0.642547607421875, 0.6756134033203125, 0.70867919921875, 0.7417449951171875, 0.774810791015625, 0.8078765869140625, 0.8409423828125, 0.8740081787109375, 0.907073974609375, 0.9401397705078125, 0.97320556640625, 1.0062713623046875, 1.039337158203125, 1.0724029541015625, 1.10546875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 1.0, 3.0, 8.0, 6.0, 20.0, 23.0, 23.0, 41.0, 101.0, 181.0, 360.0, 704.0, 1668.0, 4539.0, 15526.0, 79376.0, 641951.0, 256505.0, 34178.0, 8388.0, 2781.0, 1117.0, 474.0, 240.0, 145.0, 80.0, 45.0, 26.0, 16.0, 9.0, 7.0, 9.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7451171875, -0.7182769775390625, -0.691436767578125, -0.6645965576171875, -0.63775634765625, -0.6109161376953125, -0.584075927734375, -0.5572357177734375, -0.5303955078125, -0.5035552978515625, -0.476715087890625, -0.4498748779296875, -0.42303466796875, -0.3961944580078125, -0.369354248046875, -0.3425140380859375, -0.315673828125, -0.2888336181640625, -0.261993408203125, -0.2351531982421875, -0.20831298828125, -0.1814727783203125, -0.154632568359375, -0.1277923583984375, -0.1009521484375, -0.0741119384765625, -0.047271728515625, -0.0204315185546875, 0.00640869140625, 0.0332489013671875, 0.060089111328125, 0.0869293212890625, 0.11376953125, 0.1406097412109375, 0.167449951171875, 0.1942901611328125, 0.22113037109375, 0.2479705810546875, 0.274810791015625, 0.3016510009765625, 0.3284912109375, 0.3553314208984375, 0.382171630859375, 0.4090118408203125, 0.43585205078125, 0.4626922607421875, 0.489532470703125, 0.5163726806640625, 0.543212890625, 0.5700531005859375, 0.596893310546875, 0.6237335205078125, 0.65057373046875, 0.6774139404296875, 0.704254150390625, 0.7310943603515625, 0.7579345703125, 0.7847747802734375, 0.811614990234375, 0.8384552001953125, 0.86529541015625, 0.8921356201171875, 0.918975830078125, 0.9458160400390625, 0.97265625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 5.0, 3.0, 7.0, 8.0, 15.0, 18.0, 20.0, 17.0, 34.0, 64.0, 69.0, 127.0, 139.0, 132.0, 106.0, 60.0, 52.0, 32.0, 22.0, 22.0, 12.0, 4.0, 16.0, 8.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014793872833251953, -0.00014299340546131134, -0.00013804808259010315, -0.00013310275971889496, -0.00012815743684768677, -0.00012321211397647858, -0.00011826679110527039, -0.0001133214682340622, -0.000108376145362854, -0.00010343082249164581, -9.848549962043762e-05, -9.354017674922943e-05, -8.859485387802124e-05, -8.364953100681305e-05, -7.870420813560486e-05, -7.375888526439667e-05, -6.881356239318848e-05, -6.386823952198029e-05, -5.8922916650772095e-05, -5.3977593779563904e-05, -4.903227090835571e-05, -4.408694803714752e-05, -3.914162516593933e-05, -3.419630229473114e-05, -2.925097942352295e-05, -2.4305656552314758e-05, -1.9360333681106567e-05, -1.4415010809898376e-05, -9.469687938690186e-06, -4.524365067481995e-06, 4.209578037261963e-07, 5.366280674934387e-06, 1.0311603546142578e-05, 1.5256926417350769e-05, 2.020224928855896e-05, 2.514757215976715e-05, 3.0092895030975342e-05, 3.503821790218353e-05, 3.9983540773391724e-05, 4.4928863644599915e-05, 4.9874186515808105e-05, 5.4819509387016296e-05, 5.976483225822449e-05, 6.471015512943268e-05, 6.965547800064087e-05, 7.460080087184906e-05, 7.954612374305725e-05, 8.449144661426544e-05, 8.943676948547363e-05, 9.438209235668182e-05, 9.932741522789001e-05, 0.0001042727380990982, 0.0001092180609703064, 0.00011416338384151459, 0.00011910870671272278, 0.00012405402958393097, 0.00012899935245513916, 0.00013394467532634735, 0.00013888999819755554, 0.00014383532106876373, 0.00014878064393997192, 0.00015372596681118011, 0.0001586712896823883, 0.0001636166125535965, 0.0001685619354248047]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 4.0, 5.0, 8.0, 9.0, 9.0, 19.0, 39.0, 43.0, 92.0, 117.0, 224.0, 372.0, 674.0, 1238.0, 2521.0, 5536.0, 13901.0, 42966.0, 185693.0, 544056.0, 183238.0, 42866.0, 13846.0, 5515.0, 2544.0, 1277.0, 682.0, 408.0, 228.0, 164.0, 90.0, 60.0, 39.0, 19.0, 19.0, 7.0, 14.0, 5.0, 6.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53515625, -0.5181655883789062, -0.5011749267578125, -0.48418426513671875, -0.467193603515625, -0.45020294189453125, -0.4332122802734375, -0.41622161865234375, -0.39923095703125, -0.38224029541015625, -0.3652496337890625, -0.34825897216796875, -0.331268310546875, -0.31427764892578125, -0.2972869873046875, -0.28029632568359375, -0.2633056640625, -0.24631500244140625, -0.2293243408203125, -0.21233367919921875, -0.195343017578125, -0.17835235595703125, -0.1613616943359375, -0.14437103271484375, -0.12738037109375, -0.11038970947265625, -0.0933990478515625, -0.07640838623046875, -0.059417724609375, -0.04242706298828125, -0.0254364013671875, -0.00844573974609375, 0.008544921875, 0.02553558349609375, 0.0425262451171875, 0.05951690673828125, 0.076507568359375, 0.09349822998046875, 0.1104888916015625, 0.12747955322265625, 0.14447021484375, 0.16146087646484375, 0.1784515380859375, 0.19544219970703125, 0.212432861328125, 0.22942352294921875, 0.2464141845703125, 0.26340484619140625, 0.2803955078125, 0.29738616943359375, 0.3143768310546875, 0.33136749267578125, 0.348358154296875, 0.36534881591796875, 0.3823394775390625, 0.39933013916015625, 0.41632080078125, 0.43331146240234375, 0.4503021240234375, 0.46729278564453125, 0.484283447265625, 0.5012741088867188, 0.5182647705078125, 0.5352554321289062, 0.55224609375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 6.0, 8.0, 8.0, 5.0, 13.0, 19.0, 32.0, 37.0, 41.0, 50.0, 67.0, 61.0, 55.0, 78.0, 77.0, 72.0, 69.0, 63.0, 58.0, 39.0, 29.0, 32.0, 19.0, 13.0, 10.0, 8.0, 10.0, 6.0, 3.0, 2.0, 5.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.455078125, -0.4417533874511719, -0.42842864990234375, -0.4151039123535156, -0.4017791748046875, -0.3884544372558594, -0.37512969970703125, -0.3618049621582031, -0.348480224609375, -0.3351554870605469, -0.32183074951171875, -0.3085060119628906, -0.2951812744140625, -0.2818565368652344, -0.26853179931640625, -0.2552070617675781, -0.24188232421875, -0.22855758666992188, -0.21523284912109375, -0.20190811157226562, -0.1885833740234375, -0.17525863647460938, -0.16193389892578125, -0.14860916137695312, -0.135284423828125, -0.12195968627929688, -0.10863494873046875, -0.09531021118164062, -0.0819854736328125, -0.06866073608398438, -0.05533599853515625, -0.042011260986328125, -0.0286865234375, -0.015361785888671875, -0.00203704833984375, 0.011287689208984375, 0.0246124267578125, 0.037937164306640625, 0.05126190185546875, 0.06458663940429688, 0.077911376953125, 0.09123611450195312, 0.10456085205078125, 0.11788558959960938, 0.1312103271484375, 0.14453506469726562, 0.15785980224609375, 0.17118453979492188, 0.18450927734375, 0.19783401489257812, 0.21115875244140625, 0.22448348999023438, 0.2378082275390625, 0.2511329650878906, 0.26445770263671875, 0.2777824401855469, 0.291107177734375, 0.3044319152832031, 0.31775665283203125, 0.3310813903808594, 0.3444061279296875, 0.3577308654785156, 0.37105560302734375, 0.3843803405761719, 0.397705078125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 15.0, 25.0, 33.0, 90.0, 136.0, 204.0, 173.0, 139.0, 66.0, 36.0, 25.0, 22.0, 11.0, 7.0, 8.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.752629280090332, -14.381635665893555, -14.010642051696777, -13.6396484375, -13.268655776977539, -12.897662162780762, -12.526668548583984, -12.155674934387207, -11.78468132019043, -11.413687705993652, -11.042694091796875, -10.671700477600098, -10.30070686340332, -9.92971420288086, -9.558720588684082, -9.187726974487305, -8.816733360290527, -8.44573974609375, -8.074746131896973, -7.7037529945373535, -7.332759380340576, -6.961765766143799, -6.59077262878418, -6.219779014587402, -5.848785400390625, -5.477791786193848, -5.10679817199707, -4.735805034637451, -4.364811420440674, -3.9938178062438965, -3.6228244304656982, -3.2518310546875, -2.8808374404907227, -2.5098438262939453, -2.138850450515747, -1.7678569555282593, -1.3968634605407715, -1.0258699655532837, -0.6548764705657959, -0.28388309478759766, 0.08711051940917969, 0.4581040143966675, 0.8290975093841553, 1.200091004371643, 1.5710844993591309, 1.9420779943466187, 2.3130714893341064, 2.6840648651123047, 3.055058479309082, 3.4260520935058594, 3.7970454692840576, 4.168038845062256, 4.539032459259033, 4.9100260734558105, 5.28101921081543, 5.652012825012207, 6.023006439208984, 6.394000053405762, 6.764993667602539, 7.135986804962158, 7.5069804191589355, 7.877974033355713, 8.248967170715332, 8.61996078491211, 8.990954399108887]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 7.0, 5.0, 5.0, 5.0, 10.0, 10.0, 17.0, 14.0, 15.0, 20.0, 29.0, 27.0, 26.0, 24.0, 34.0, 44.0, 40.0, 28.0, 42.0, 29.0, 47.0, 44.0, 42.0, 49.0, 32.0, 48.0, 45.0, 32.0, 27.0, 38.0, 16.0, 23.0, 16.0, 18.0, 17.0, 10.0, 16.0, 8.0, 10.0, 6.0, 6.0, 5.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-5.950320243835449, -5.77004337310791, -5.589766979217529, -5.40949010848999, -5.229213714599609, -5.04893684387207, -4.868659973144531, -4.688383102416992, -4.508106708526611, -4.327829837799072, -4.147553443908691, -3.9672765731811523, -3.7869999408721924, -3.6067233085632324, -3.4264464378356934, -3.2461698055267334, -3.0658931732177734, -2.8856165409088135, -2.7053399085998535, -2.5250630378723145, -2.3447864055633545, -2.1645097732543945, -1.984233021736145, -1.8039562702178955, -1.6236796379089355, -1.4434030055999756, -1.263126254081726, -1.0828495025634766, -0.9025728702545166, -0.7222961783409119, -0.5420194864273071, -0.3617427349090576, -0.18146562576293945, -0.0011889338493347168, 0.17908775806427002, 0.35936444997787476, 0.5396411418914795, 0.7199178338050842, 0.900194525718689, 1.0804712772369385, 1.2607479095458984, 1.4410245418548584, 1.621301293373108, 1.8015780448913574, 1.9818546772003174, 2.1621313095092773, 2.3424081802368164, 2.5226848125457764, 2.7029614448547363, 2.8832380771636963, 3.0635147094726562, 3.2437915802001953, 3.4240682125091553, 3.6043448448181152, 3.7846217155456543, 3.9648983478546143, 4.145174980163574, 4.325451850891113, 4.505728244781494, 4.686005115509033, 4.866281509399414, 5.046558380126953, 5.226835250854492, 5.407112121582031, 5.587388515472412]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 6.0, 5.0, 2.0, 4.0, 7.0, 9.0, 9.0, 17.0, 11.0, 15.0, 27.0, 39.0, 34.0, 44.0, 73.0, 64.0, 141.0, 188.0, 342.0, 674.0, 1644.0, 4846.0, 18872.0, 259417.0, 3868037.0, 28492.0, 6849.0, 2342.0, 884.0, 475.0, 278.0, 156.0, 88.0, 59.0, 56.0, 20.0, 16.0, 10.0, 13.0, 5.0, 5.0, 2.0, 1.0, 3.0, 2.0], "bins": [-5.296875, -5.174072265625, -5.05126953125, -4.928466796875, -4.8056640625, -4.682861328125, -4.56005859375, -4.437255859375, -4.314453125, -4.191650390625, -4.06884765625, -3.946044921875, -3.8232421875, -3.700439453125, -3.57763671875, -3.454833984375, -3.33203125, -3.209228515625, -3.08642578125, -2.963623046875, -2.8408203125, -2.718017578125, -2.59521484375, -2.472412109375, -2.349609375, -2.226806640625, -2.10400390625, -1.981201171875, -1.8583984375, -1.735595703125, -1.61279296875, -1.489990234375, -1.3671875, -1.244384765625, -1.12158203125, -0.998779296875, -0.8759765625, -0.753173828125, -0.63037109375, -0.507568359375, -0.384765625, -0.261962890625, -0.13916015625, -0.016357421875, 0.1064453125, 0.229248046875, 0.35205078125, 0.474853515625, 0.59765625, 0.720458984375, 0.84326171875, 0.966064453125, 1.0888671875, 1.211669921875, 1.33447265625, 1.457275390625, 1.580078125, 1.702880859375, 1.82568359375, 1.948486328125, 2.0712890625, 2.194091796875, 2.31689453125, 2.439697265625, 2.5625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 5.0, 13.0, 10.0, 32.0, 27.0, 46.0, 36.0, 70.0, 73.0, 79.0, 89.0, 83.0, 89.0, 86.0, 67.0, 42.0, 56.0, 41.0, 27.0, 13.0, 10.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.7412109375, -0.7236061096191406, -0.7060012817382812, -0.6883964538574219, -0.6707916259765625, -0.6531867980957031, -0.6355819702148438, -0.6179771423339844, -0.600372314453125, -0.5827674865722656, -0.5651626586914062, -0.5475578308105469, -0.5299530029296875, -0.5123481750488281, -0.49474334716796875, -0.4771385192871094, -0.45953369140625, -0.4419288635253906, -0.42432403564453125, -0.4067192077636719, -0.3891143798828125, -0.3715095520019531, -0.35390472412109375, -0.3362998962402344, -0.318695068359375, -0.3010902404785156, -0.28348541259765625, -0.2658805847167969, -0.2482757568359375, -0.23067092895507812, -0.21306610107421875, -0.19546127319335938, -0.1778564453125, -0.16025161743164062, -0.14264678955078125, -0.12504196166992188, -0.1074371337890625, -0.08983230590820312, -0.07222747802734375, -0.054622650146484375, -0.037017822265625, -0.019412994384765625, -0.00180816650390625, 0.015796661376953125, 0.0334014892578125, 0.051006317138671875, 0.06861114501953125, 0.08621597290039062, 0.10382080078125, 0.12142562866210938, 0.13903045654296875, 0.15663528442382812, 0.1742401123046875, 0.19184494018554688, 0.20944976806640625, 0.22705459594726562, 0.244659423828125, 0.2622642517089844, 0.27986907958984375, 0.2974739074707031, 0.3150787353515625, 0.3326835632324219, 0.35028839111328125, 0.3678932189941406, 0.385498046875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 6.0, 4.0, 10.0, 10.0, 9.0, 11.0, 25.0, 33.0, 44.0, 61.0, 104.0, 116.0, 203.0, 341.0, 605.0, 1211.0, 2715.0, 7472.0, 32750.0, 3576928.0, 536627.0, 23961.0, 6190.0, 2291.0, 1119.0, 534.0, 300.0, 182.0, 135.0, 82.0, 68.0, 40.0, 28.0, 22.0, 17.0, 13.0, 4.0, 3.0, 3.0, 4.0, 5.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.45703125, -3.3551025390625, -3.253173828125, -3.1512451171875, -3.04931640625, -2.9473876953125, -2.845458984375, -2.7435302734375, -2.6416015625, -2.5396728515625, -2.437744140625, -2.3358154296875, -2.23388671875, -2.1319580078125, -2.030029296875, -1.9281005859375, -1.826171875, -1.7242431640625, -1.622314453125, -1.5203857421875, -1.41845703125, -1.3165283203125, -1.214599609375, -1.1126708984375, -1.0107421875, -0.9088134765625, -0.806884765625, -0.7049560546875, -0.60302734375, -0.5010986328125, -0.399169921875, -0.2972412109375, -0.1953125, -0.0933837890625, 0.008544921875, 0.1104736328125, 0.21240234375, 0.3143310546875, 0.416259765625, 0.5181884765625, 0.6201171875, 0.7220458984375, 0.823974609375, 0.9259033203125, 1.02783203125, 1.1297607421875, 1.231689453125, 1.3336181640625, 1.435546875, 1.5374755859375, 1.639404296875, 1.7413330078125, 1.84326171875, 1.9451904296875, 2.047119140625, 2.1490478515625, 2.2509765625, 2.3529052734375, 2.454833984375, 2.5567626953125, 2.65869140625, 2.7606201171875, 2.862548828125, 2.9644775390625, 3.06640625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 6.0, 8.0, 10.0, 33.0, 67.0, 158.0, 1187.0, 2360.0, 132.0, 53.0, 23.0, 13.0, 7.0, 6.0, 5.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8369140625, -1.782958984375, -1.72900390625, -1.675048828125, -1.62109375, -1.567138671875, -1.51318359375, -1.459228515625, -1.4052734375, -1.351318359375, -1.29736328125, -1.243408203125, -1.189453125, -1.135498046875, -1.08154296875, -1.027587890625, -0.9736328125, -0.919677734375, -0.86572265625, -0.811767578125, -0.7578125, -0.703857421875, -0.64990234375, -0.595947265625, -0.5419921875, -0.488037109375, -0.43408203125, -0.380126953125, -0.326171875, -0.272216796875, -0.21826171875, -0.164306640625, -0.1103515625, -0.056396484375, -0.00244140625, 0.051513671875, 0.10546875, 0.159423828125, 0.21337890625, 0.267333984375, 0.3212890625, 0.375244140625, 0.42919921875, 0.483154296875, 0.537109375, 0.591064453125, 0.64501953125, 0.698974609375, 0.7529296875, 0.806884765625, 0.86083984375, 0.914794921875, 0.96875, 1.022705078125, 1.07666015625, 1.130615234375, 1.1845703125, 1.238525390625, 1.29248046875, 1.346435546875, 1.400390625, 1.454345703125, 1.50830078125, 1.562255859375, 1.6162109375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 4.0, 0.0, 0.0, 2.0, 3.0, 5.0, 6.0, 3.0, 9.0, 14.0, 11.0, 30.0, 66.0, 129.0, 216.0, 203.0, 137.0, 64.0, 47.0, 21.0, 15.0, 13.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.6247148513793945, -5.416622161865234, -5.208528995513916, -5.000436305999756, -4.792343616485596, -4.584250450134277, -4.376157760620117, -4.168065071105957, -3.959972381591797, -3.7518794536590576, -3.5437867641448975, -3.335693836212158, -3.127601146697998, -2.919508218765259, -2.7114152908325195, -2.5033226013183594, -2.29522967338562, -2.087136745452881, -1.8790440559387207, -1.6709511280059814, -1.4628584384918213, -1.254765510559082, -1.0466727018356323, -0.8385798931121826, -0.6304870843887329, -0.4223942756652832, -0.2143014371395111, -0.006208598613739014, 0.2018842101097107, 0.4099770784378052, 0.6180698871612549, 0.8261626958847046, 1.0342555046081543, 1.242348313331604, 1.4504411220550537, 1.658534049987793, 1.8666267395019531, 2.0747196674346924, 2.2828125953674316, 2.490905284881592, 2.698997974395752, 2.907090902328491, 3.1151835918426514, 3.3232765197753906, 3.531369209289551, 3.73946213722229, 3.9475550651550293, 4.1556477546691895, 4.363740921020508, 4.571833610534668, 4.779926776885986, 4.9880194664001465, 5.196112155914307, 5.404205322265625, 5.612298011779785, 5.820390701293945, 6.0284833908081055, 6.236576080322266, 6.444669246673584, 6.652761936187744, 6.860854625701904, 7.068947792053223, 7.277040481567383, 7.485133171081543, 7.693225860595703]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 3.0, 4.0, 11.0, 8.0, 17.0, 12.0, 18.0, 28.0, 24.0, 30.0, 46.0, 46.0, 45.0, 65.0, 50.0, 62.0, 52.0, 64.0, 61.0, 62.0, 42.0, 52.0, 40.0, 40.0, 33.0, 25.0, 18.0, 13.0, 7.0, 10.0, 5.0, 3.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4255776405334473, -3.315368890762329, -3.205160140991211, -3.0949513912200928, -2.9847426414489746, -2.8745336532592773, -2.7643251419067383, -2.654116153717041, -2.543907403945923, -2.4336986541748047, -2.3234899044036865, -2.2132811546325684, -2.10307240486145, -1.9928635358810425, -1.8826547861099243, -1.7724459171295166, -1.662237286567688, -1.5520285367965698, -1.4418197870254517, -1.331610918045044, -1.2214021682739258, -1.1111934185028076, -1.0009846687316895, -0.8907758593559265, -0.7805671095848083, -0.6703583598136902, -0.5601495504379272, -0.4499408006668091, -0.33973202109336853, -0.22952324151992798, -0.11931449174880981, -0.009105682373046875, 0.10110306739807129, 0.21131184697151184, 0.3215206265449524, 0.43172937631607056, 0.5419381856918335, 0.6521469354629517, 0.7623556852340698, 0.8725644946098328, 0.9827732443809509, 1.0929820537567139, 1.203190803527832, 1.3133995532989502, 1.4236083030700684, 1.5338170528411865, 1.6440258026123047, 1.7542346715927124, 1.8644434213638306, 1.9746521711349487, 2.0848610401153564, 2.1950697898864746, 2.3052785396575928, 2.415487289428711, 2.525696039199829, 2.6359047889709473, 2.7461135387420654, 2.8563222885131836, 2.9665310382843018, 3.07673978805542, 3.186948537826538, 3.2971572875976562, 3.4073662757873535, 3.5175750255584717, 3.62778377532959]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 1.0, 5.0, 6.0, 5.0, 9.0, 18.0, 24.0, 37.0, 80.0, 141.0, 387.0, 1149.0, 6001.0, 94680.0, 910295.0, 31086.0, 3240.0, 844.0, 284.0, 121.0, 58.0, 38.0, 17.0, 12.0, 8.0, 7.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.87109375, -4.6861572265625, -4.501220703125, -4.3162841796875, -4.13134765625, -3.9464111328125, -3.761474609375, -3.5765380859375, -3.3916015625, -3.2066650390625, -3.021728515625, -2.8367919921875, -2.65185546875, -2.4669189453125, -2.281982421875, -2.0970458984375, -1.912109375, -1.7271728515625, -1.542236328125, -1.3572998046875, -1.17236328125, -0.9874267578125, -0.802490234375, -0.6175537109375, -0.4326171875, -0.2476806640625, -0.062744140625, 0.1221923828125, 0.30712890625, 0.4920654296875, 0.677001953125, 0.8619384765625, 1.046875, 1.2318115234375, 1.416748046875, 1.6016845703125, 1.78662109375, 1.9715576171875, 2.156494140625, 2.3414306640625, 2.5263671875, 2.7113037109375, 2.896240234375, 3.0811767578125, 3.26611328125, 3.4510498046875, 3.635986328125, 3.8209228515625, 4.005859375, 4.1907958984375, 4.375732421875, 4.5606689453125, 4.74560546875, 4.9305419921875, 5.115478515625, 5.3004150390625, 5.4853515625, 5.6702880859375, 5.855224609375, 6.0401611328125, 6.22509765625, 6.4100341796875, 6.594970703125, 6.7799072265625, 6.96484375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 2.0, 7.0, 15.0, 12.0, 24.0, 21.0, 28.0, 42.0, 66.0, 53.0, 66.0, 84.0, 68.0, 84.0, 64.0, 79.0, 67.0, 55.0, 46.0, 42.0, 22.0, 19.0, 13.0, 11.0, 3.0, 6.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.671875, -0.6554794311523438, -0.6390838623046875, -0.6226882934570312, -0.606292724609375, -0.5898971557617188, -0.5735015869140625, -0.5571060180664062, -0.54071044921875, -0.5243148803710938, -0.5079193115234375, -0.49152374267578125, -0.475128173828125, -0.45873260498046875, -0.4423370361328125, -0.42594146728515625, -0.4095458984375, -0.39315032958984375, -0.3767547607421875, -0.36035919189453125, -0.343963623046875, -0.32756805419921875, -0.3111724853515625, -0.29477691650390625, -0.27838134765625, -0.26198577880859375, -0.2455902099609375, -0.22919464111328125, -0.212799072265625, -0.19640350341796875, -0.1800079345703125, -0.16361236572265625, -0.147216796875, -0.13082122802734375, -0.1144256591796875, -0.09803009033203125, -0.081634521484375, -0.06523895263671875, -0.0488433837890625, -0.03244781494140625, -0.01605224609375, 0.00034332275390625, 0.0167388916015625, 0.03313446044921875, 0.049530029296875, 0.06592559814453125, 0.0823211669921875, 0.09871673583984375, 0.1151123046875, 0.13150787353515625, 0.1479034423828125, 0.16429901123046875, 0.180694580078125, 0.19709014892578125, 0.2134857177734375, 0.22988128662109375, 0.24627685546875, 0.26267242431640625, 0.2790679931640625, 0.29546356201171875, 0.311859130859375, 0.32825469970703125, 0.3446502685546875, 0.36104583740234375, 0.37744140625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 4.0, 4.0, 9.0, 11.0, 23.0, 29.0, 35.0, 50.0, 90.0, 182.0, 301.0, 616.0, 1348.0, 3304.0, 10237.0, 41457.0, 278056.0, 607692.0, 79602.0, 16609.0, 5097.0, 1898.0, 897.0, 420.0, 221.0, 129.0, 77.0, 41.0, 29.0, 21.0, 19.0, 16.0, 11.0, 8.0, 0.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.001953125, -1.9416351318359375, -1.881317138671875, -1.8209991455078125, -1.76068115234375, -1.7003631591796875, -1.640045166015625, -1.5797271728515625, -1.5194091796875, -1.4590911865234375, -1.398773193359375, -1.3384552001953125, -1.27813720703125, -1.2178192138671875, -1.157501220703125, -1.0971832275390625, -1.036865234375, -0.9765472412109375, -0.916229248046875, -0.8559112548828125, -0.79559326171875, -0.7352752685546875, -0.674957275390625, -0.6146392822265625, -0.5543212890625, -0.4940032958984375, -0.433685302734375, -0.3733673095703125, -0.31304931640625, -0.2527313232421875, -0.192413330078125, -0.1320953369140625, -0.07177734375, -0.0114593505859375, 0.048858642578125, 0.1091766357421875, 0.16949462890625, 0.2298126220703125, 0.290130615234375, 0.3504486083984375, 0.4107666015625, 0.4710845947265625, 0.531402587890625, 0.5917205810546875, 0.65203857421875, 0.7123565673828125, 0.772674560546875, 0.8329925537109375, 0.893310546875, 0.9536285400390625, 1.013946533203125, 1.0742645263671875, 1.13458251953125, 1.1949005126953125, 1.255218505859375, 1.3155364990234375, 1.3758544921875, 1.4361724853515625, 1.496490478515625, 1.5568084716796875, 1.61712646484375, 1.6774444580078125, 1.737762451171875, 1.7980804443359375, 1.8583984375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 7.0, 3.0, 8.0, 9.0, 14.0, 15.0, 24.0, 20.0, 25.0, 33.0, 31.0, 36.0, 48.0, 53.0, 59.0, 58.0, 50.0, 56.0, 58.0, 54.0, 64.0, 46.0, 37.0, 39.0, 34.0, 30.0, 21.0, 20.0, 18.0, 9.0, 6.0, 7.0, 6.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.779296875, -1.7281646728515625, -1.677032470703125, -1.6259002685546875, -1.57476806640625, -1.5236358642578125, -1.472503662109375, -1.4213714599609375, -1.3702392578125, -1.3191070556640625, -1.267974853515625, -1.2168426513671875, -1.16571044921875, -1.1145782470703125, -1.063446044921875, -1.0123138427734375, -0.961181640625, -0.9100494384765625, -0.858917236328125, -0.8077850341796875, -0.75665283203125, -0.7055206298828125, -0.654388427734375, -0.6032562255859375, -0.5521240234375, -0.5009918212890625, -0.449859619140625, -0.3987274169921875, -0.34759521484375, -0.2964630126953125, -0.245330810546875, -0.1941986083984375, -0.14306640625, -0.0919342041015625, -0.040802001953125, 0.0103302001953125, 0.06146240234375, 0.1125946044921875, 0.163726806640625, 0.2148590087890625, 0.2659912109375, 0.3171234130859375, 0.368255615234375, 0.4193878173828125, 0.47052001953125, 0.5216522216796875, 0.572784423828125, 0.6239166259765625, 0.675048828125, 0.7261810302734375, 0.777313232421875, 0.8284454345703125, 0.87957763671875, 0.9307098388671875, 0.981842041015625, 1.0329742431640625, 1.0841064453125, 1.1352386474609375, 1.186370849609375, 1.2375030517578125, 1.28863525390625, 1.3397674560546875, 1.390899658203125, 1.4420318603515625, 1.4931640625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 3.0, 5.0, 15.0, 23.0, 37.0, 73.0, 116.0, 281.0, 666.0, 1940.0, 7360.0, 123238.0, 892546.0, 17006.0, 3424.0, 1032.0, 383.0, 189.0, 92.0, 39.0, 39.0, 19.0, 5.0, 8.0, 4.0, 6.0, 5.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9716796875, -1.9085235595703125, -1.845367431640625, -1.7822113037109375, -1.71905517578125, -1.6558990478515625, -1.592742919921875, -1.5295867919921875, -1.4664306640625, -1.4032745361328125, -1.340118408203125, -1.2769622802734375, -1.21380615234375, -1.1506500244140625, -1.087493896484375, -1.0243377685546875, -0.961181640625, -0.8980255126953125, -0.834869384765625, -0.7717132568359375, -0.70855712890625, -0.6454010009765625, -0.582244873046875, -0.5190887451171875, -0.4559326171875, -0.3927764892578125, -0.329620361328125, -0.2664642333984375, -0.20330810546875, -0.1401519775390625, -0.076995849609375, -0.0138397216796875, 0.04931640625, 0.1124725341796875, 0.175628662109375, 0.2387847900390625, 0.30194091796875, 0.3650970458984375, 0.428253173828125, 0.4914093017578125, 0.5545654296875, 0.6177215576171875, 0.680877685546875, 0.7440338134765625, 0.80718994140625, 0.8703460693359375, 0.933502197265625, 0.9966583251953125, 1.059814453125, 1.1229705810546875, 1.186126708984375, 1.2492828369140625, 1.31243896484375, 1.3755950927734375, 1.438751220703125, 1.5019073486328125, 1.5650634765625, 1.6282196044921875, 1.691375732421875, 1.7545318603515625, 1.81768798828125, 1.8808441162109375, 1.944000244140625, 2.0071563720703125, 2.0703125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 6.0, 2.0, 2.0, 6.0, 14.0, 21.0, 40.0, 81.0, 183.0, 305.0, 183.0, 77.0, 31.0, 29.0, 10.0, 6.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002956390380859375, -0.0002868063747882843, -0.0002779737114906311, -0.0002691410481929779, -0.0002603083848953247, -0.0002514757215976715, -0.0002426430583000183, -0.0002338103950023651, -0.00022497773170471191, -0.00021614506840705872, -0.00020731240510940552, -0.00019847974181175232, -0.00018964707851409912, -0.00018081441521644592, -0.00017198175191879272, -0.00016314908862113953, -0.00015431642532348633, -0.00014548376202583313, -0.00013665109872817993, -0.00012781843543052673, -0.00011898577213287354, -0.00011015310883522034, -0.00010132044553756714, -9.248778223991394e-05, -8.365511894226074e-05, -7.482245564460754e-05, -6.598979234695435e-05, -5.715712904930115e-05, -4.832446575164795e-05, -3.949180245399475e-05, -3.065913915634155e-05, -2.1826475858688354e-05, -1.2993812561035156e-05, -4.161149263381958e-06, 4.67151403427124e-06, 1.3504177331924438e-05, 2.2336840629577637e-05, 3.1169503927230835e-05, 4.000216722488403e-05, 4.883483052253723e-05, 5.766749382019043e-05, 6.650015711784363e-05, 7.533282041549683e-05, 8.416548371315002e-05, 9.299814701080322e-05, 0.00010183081030845642, 0.00011066347360610962, 0.00011949613690376282, 0.00012832880020141602, 0.00013716146349906921, 0.0001459941267967224, 0.0001548267900943756, 0.0001636594533920288, 0.000172492116689682, 0.0001813247799873352, 0.0001901574432849884, 0.0001989901065826416, 0.0002078227698802948, 0.000216655433177948, 0.0002254880964756012, 0.0002343207597732544, 0.0002431534230709076, 0.0002519860863685608, 0.000260818749666214, 0.0002696514129638672]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 7.0, 14.0, 23.0, 37.0, 82.0, 159.0, 357.0, 1169.0, 5142.0, 74453.0, 941923.0, 21026.0, 2904.0, 741.0, 256.0, 105.0, 65.0, 50.0, 16.0, 13.0, 4.0, 4.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.671875, -1.610687255859375, -1.54949951171875, -1.488311767578125, -1.4271240234375, -1.365936279296875, -1.30474853515625, -1.243560791015625, -1.182373046875, -1.121185302734375, -1.05999755859375, -0.998809814453125, -0.9376220703125, -0.876434326171875, -0.81524658203125, -0.754058837890625, -0.69287109375, -0.631683349609375, -0.57049560546875, -0.509307861328125, -0.4481201171875, -0.386932373046875, -0.32574462890625, -0.264556884765625, -0.203369140625, -0.142181396484375, -0.08099365234375, -0.019805908203125, 0.0413818359375, 0.102569580078125, 0.16375732421875, 0.224945068359375, 0.2861328125, 0.347320556640625, 0.40850830078125, 0.469696044921875, 0.5308837890625, 0.592071533203125, 0.65325927734375, 0.714447021484375, 0.775634765625, 0.836822509765625, 0.89801025390625, 0.959197998046875, 1.0203857421875, 1.081573486328125, 1.14276123046875, 1.203948974609375, 1.26513671875, 1.326324462890625, 1.38751220703125, 1.448699951171875, 1.5098876953125, 1.571075439453125, 1.63226318359375, 1.693450927734375, 1.754638671875, 1.815826416015625, 1.87701416015625, 1.938201904296875, 1.9993896484375, 2.060577392578125, 2.12176513671875, 2.182952880859375, 2.244140625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 2.0, 8.0, 29.0, 35.0, 97.0, 232.0, 250.0, 191.0, 92.0, 34.0, 18.0, 4.0, 7.0, 4.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2734375, -1.2316131591796875, -1.189788818359375, -1.1479644775390625, -1.10614013671875, -1.0643157958984375, -1.022491455078125, -0.9806671142578125, -0.9388427734375, -0.8970184326171875, -0.855194091796875, -0.8133697509765625, -0.77154541015625, -0.7297210693359375, -0.687896728515625, -0.6460723876953125, -0.604248046875, -0.5624237060546875, -0.520599365234375, -0.4787750244140625, -0.43695068359375, -0.3951263427734375, -0.353302001953125, -0.3114776611328125, -0.2696533203125, -0.2278289794921875, -0.186004638671875, -0.1441802978515625, -0.10235595703125, -0.0605316162109375, -0.018707275390625, 0.0231170654296875, 0.06494140625, 0.1067657470703125, 0.148590087890625, 0.1904144287109375, 0.23223876953125, 0.2740631103515625, 0.315887451171875, 0.3577117919921875, 0.3995361328125, 0.4413604736328125, 0.483184814453125, 0.5250091552734375, 0.56683349609375, 0.6086578369140625, 0.650482177734375, 0.6923065185546875, 0.734130859375, 0.7759552001953125, 0.817779541015625, 0.8596038818359375, 0.90142822265625, 0.9432525634765625, 0.985076904296875, 1.0269012451171875, 1.0687255859375, 1.1105499267578125, 1.152374267578125, 1.1941986083984375, 1.23602294921875, 1.2778472900390625, 1.319671630859375, 1.3614959716796875, 1.4033203125]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 3.0, 13.0, 9.0, 16.0, 32.0, 65.0, 120.0, 203.0, 171.0, 149.0, 92.0, 59.0, 31.0, 16.0, 15.0, 7.0, 4.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.01144027709961, -13.585338592529297, -13.1592378616333, -12.733136177062988, -12.307035446166992, -11.88093376159668, -11.454833030700684, -11.028731346130371, -10.602630615234375, -10.176528930664062, -9.750428199768066, -9.324326515197754, -8.898225784301758, -8.472124099731445, -8.04602336883545, -7.619921684265137, -7.193820476531982, -6.767719268798828, -6.341618061065674, -5.9155168533325195, -5.489415645599365, -5.063314437866211, -4.637212753295898, -4.211112022399902, -3.785010576248169, -3.3589093685150146, -2.9328081607818604, -2.506706714630127, -2.0806055068969727, -1.6545042991638184, -1.228403091430664, -0.8023018836975098, -0.37620067596435547, 0.049900561571121216, 0.4760017991065979, 0.902103066444397, 1.3282042741775513, 1.7543056011199951, 2.1804068088531494, 2.6065080165863037, 3.032609224319458, 3.4587104320526123, 3.8848116397857666, 4.3109130859375, 4.737014293670654, 5.163115501403809, 5.589216709136963, 6.015317916870117, 6.4414191246032715, 6.867520332336426, 7.29362154006958, 7.719722747802734, 8.145824432373047, 8.571925163269043, 8.998026847839355, 9.424127578735352, 9.850229263305664, 10.276330947875977, 10.702431678771973, 11.128533363342285, 11.554634094238281, 11.980735778808594, 12.40683650970459, 12.832938194274902, 13.259038925170898]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 4.0, 4.0, 1.0, 4.0, 8.0, 7.0, 10.0, 5.0, 4.0, 12.0, 13.0, 13.0, 15.0, 31.0, 22.0, 13.0, 21.0, 23.0, 35.0, 27.0, 29.0, 28.0, 37.0, 49.0, 39.0, 36.0, 44.0, 36.0, 39.0, 40.0, 31.0, 33.0, 38.0, 28.0, 18.0, 27.0, 29.0, 24.0, 15.0, 18.0, 15.0, 13.0, 15.0, 7.0, 7.0, 8.0, 5.0, 12.0, 3.0, 4.0, 6.0, 3.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-5.615253448486328, -5.432126522064209, -5.24899959564209, -5.065873146057129, -4.88274621963501, -4.699619293212891, -4.5164923667907715, -4.333365440368652, -4.150238990783691, -3.9671120643615723, -3.7839853763580322, -3.600858449935913, -3.417731761932373, -3.234604835510254, -3.0514779090881348, -2.8683512210845947, -2.6852242946624756, -2.5020973682403564, -2.3189706802368164, -2.1358437538146973, -1.9527170658111572, -1.769590139389038, -1.5864633321762085, -1.403336524963379, -1.2202097177505493, -1.0370829105377197, -0.8539561033248901, -0.6708292365074158, -0.4877024292945862, -0.3045756220817566, -0.12144875526428223, 0.06167805194854736, 0.24480485916137695, 0.42793166637420654, 0.6110584735870361, 0.7941853404045105, 0.9773121476173401, 1.1604390144348145, 1.343565821647644, 1.5266926288604736, 1.7098194360733032, 1.8929462432861328, 2.076073169708252, 2.259199857711792, 2.442326784133911, 2.625453472137451, 2.8085803985595703, 2.9917073249816895, 3.1748340129852295, 3.3579609394073486, 3.5410876274108887, 3.724214553833008, 3.907341241836548, 4.090467929840088, 4.273594856262207, 4.456721782684326, 4.639848709106445, 4.8229756355285645, 5.006102561950684, 5.1892290115356445, 5.372355937957764, 5.555482864379883, 5.738609790802002, 5.921736717224121, 6.104863166809082]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 0.0, 6.0, 3.0, 8.0, 8.0, 13.0, 12.0, 11.0, 26.0, 33.0, 32.0, 78.0, 135.0, 239.0, 506.0, 1278.0, 5041.0, 37569.0, 4116264.0, 26457.0, 4130.0, 1335.0, 523.0, 264.0, 127.0, 78.0, 28.0, 22.0, 20.0, 19.0, 6.0, 1.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 4.0], "bins": [-7.82421875, -7.64410400390625, -7.4639892578125, -7.28387451171875, -7.103759765625, -6.92364501953125, -6.7435302734375, -6.56341552734375, -6.38330078125, -6.20318603515625, -6.0230712890625, -5.84295654296875, -5.662841796875, -5.48272705078125, -5.3026123046875, -5.12249755859375, -4.9423828125, -4.76226806640625, -4.5821533203125, -4.40203857421875, -4.221923828125, -4.04180908203125, -3.8616943359375, -3.68157958984375, -3.50146484375, -3.32135009765625, -3.1412353515625, -2.96112060546875, -2.781005859375, -2.60089111328125, -2.4207763671875, -2.24066162109375, -2.060546875, -1.88043212890625, -1.7003173828125, -1.52020263671875, -1.340087890625, -1.15997314453125, -0.9798583984375, -0.79974365234375, -0.61962890625, -0.43951416015625, -0.2593994140625, -0.07928466796875, 0.100830078125, 0.28094482421875, 0.4610595703125, 0.64117431640625, 0.8212890625, 1.00140380859375, 1.1815185546875, 1.36163330078125, 1.541748046875, 1.72186279296875, 1.9019775390625, 2.08209228515625, 2.26220703125, 2.44232177734375, 2.6224365234375, 2.80255126953125, 2.982666015625, 3.16278076171875, 3.3428955078125, 3.52301025390625, 3.703125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 5.0, 11.0, 15.0, 13.0, 18.0, 25.0, 27.0, 44.0, 47.0, 60.0, 61.0, 61.0, 64.0, 71.0, 72.0, 60.0, 66.0, 62.0, 35.0, 48.0, 35.0, 30.0, 21.0, 12.0, 17.0, 8.0, 3.0, 2.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.6875, -0.6705131530761719, -0.6535263061523438, -0.6365394592285156, -0.6195526123046875, -0.6025657653808594, -0.5855789184570312, -0.5685920715332031, -0.551605224609375, -0.5346183776855469, -0.5176315307617188, -0.5006446838378906, -0.4836578369140625, -0.4666709899902344, -0.44968414306640625, -0.4326972961425781, -0.41571044921875, -0.3987236022949219, -0.38173675537109375, -0.3647499084472656, -0.3477630615234375, -0.3307762145996094, -0.31378936767578125, -0.2968025207519531, -0.279815673828125, -0.2628288269042969, -0.24584197998046875, -0.22885513305664062, -0.2118682861328125, -0.19488143920898438, -0.17789459228515625, -0.16090774536132812, -0.1439208984375, -0.12693405151367188, -0.10994720458984375, -0.09296035766601562, -0.0759735107421875, -0.058986663818359375, -0.04199981689453125, -0.025012969970703125, -0.008026123046875, 0.008960723876953125, 0.02594757080078125, 0.042934417724609375, 0.0599212646484375, 0.07690811157226562, 0.09389495849609375, 0.11088180541992188, 0.12786865234375, 0.14485549926757812, 0.16184234619140625, 0.17882919311523438, 0.1958160400390625, 0.21280288696289062, 0.22978973388671875, 0.24677658081054688, 0.263763427734375, 0.2807502746582031, 0.29773712158203125, 0.3147239685058594, 0.3317108154296875, 0.3486976623535156, 0.36568450927734375, 0.3826713562011719, 0.399658203125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 5.0, 5.0, 5.0, 11.0, 15.0, 17.0, 26.0, 35.0, 39.0, 40.0, 78.0, 111.0, 143.0, 170.0, 231.0, 340.0, 499.0, 785.0, 1723.0, 5084.0, 23702.0, 3773154.0, 363063.0, 17477.0, 3864.0, 1357.0, 654.0, 480.0, 359.0, 213.0, 151.0, 129.0, 86.0, 59.0, 40.0, 45.0, 22.0, 10.0, 11.0, 13.0, 7.0, 8.0, 4.0, 12.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.88671875, -3.75677490234375, -3.6268310546875, -3.49688720703125, -3.366943359375, -3.23699951171875, -3.1070556640625, -2.97711181640625, -2.84716796875, -2.71722412109375, -2.5872802734375, -2.45733642578125, -2.327392578125, -2.19744873046875, -2.0675048828125, -1.93756103515625, -1.8076171875, -1.67767333984375, -1.5477294921875, -1.41778564453125, -1.287841796875, -1.15789794921875, -1.0279541015625, -0.89801025390625, -0.76806640625, -0.63812255859375, -0.5081787109375, -0.37823486328125, -0.248291015625, -0.11834716796875, 0.0115966796875, 0.14154052734375, 0.271484375, 0.40142822265625, 0.5313720703125, 0.66131591796875, 0.791259765625, 0.92120361328125, 1.0511474609375, 1.18109130859375, 1.31103515625, 1.44097900390625, 1.5709228515625, 1.70086669921875, 1.830810546875, 1.96075439453125, 2.0906982421875, 2.22064208984375, 2.3505859375, 2.48052978515625, 2.6104736328125, 2.74041748046875, 2.870361328125, 3.00030517578125, 3.1302490234375, 3.26019287109375, 3.39013671875, 3.52008056640625, 3.6500244140625, 3.77996826171875, 3.909912109375, 4.03985595703125, 4.1697998046875, 4.29974365234375, 4.4296875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 7.0, 9.0, 12.0, 16.0, 32.0, 108.0, 891.0, 2789.0, 111.0, 45.0, 25.0, 11.0, 11.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.677734375, -1.6199951171875, -1.562255859375, -1.5045166015625, -1.44677734375, -1.3890380859375, -1.331298828125, -1.2735595703125, -1.2158203125, -1.1580810546875, -1.100341796875, -1.0426025390625, -0.98486328125, -0.9271240234375, -0.869384765625, -0.8116455078125, -0.75390625, -0.6961669921875, -0.638427734375, -0.5806884765625, -0.52294921875, -0.4652099609375, -0.407470703125, -0.3497314453125, -0.2919921875, -0.2342529296875, -0.176513671875, -0.1187744140625, -0.06103515625, -0.0032958984375, 0.054443359375, 0.1121826171875, 0.169921875, 0.2276611328125, 0.285400390625, 0.3431396484375, 0.40087890625, 0.4586181640625, 0.516357421875, 0.5740966796875, 0.6318359375, 0.6895751953125, 0.747314453125, 0.8050537109375, 0.86279296875, 0.9205322265625, 0.978271484375, 1.0360107421875, 1.09375, 1.1514892578125, 1.209228515625, 1.2669677734375, 1.32470703125, 1.3824462890625, 1.440185546875, 1.4979248046875, 1.5556640625, 1.6134033203125, 1.671142578125, 1.7288818359375, 1.78662109375, 1.8443603515625, 1.902099609375, 1.9598388671875, 2.017578125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 6.0, 6.0, 15.0, 24.0, 82.0, 303.0, 367.0, 135.0, 35.0, 12.0, 7.0, 6.0, 6.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.798945426940918, -14.46423053741455, -14.1295166015625, -13.794801712036133, -13.460087776184082, -13.125372886657715, -12.790658950805664, -12.455944061279297, -12.12122917175293, -11.786514282226562, -11.451800346374512, -11.117085456848145, -10.782371520996094, -10.447656631469727, -10.11294174194336, -9.778227806091309, -9.443513870239258, -9.10879898071289, -8.77408504486084, -8.439370155334473, -8.104656219482422, -7.769941329956055, -7.435226917266846, -7.100512504577637, -6.7657976150512695, -6.4310832023620605, -6.096368789672852, -5.761653900146484, -5.426939487457275, -5.092225074768066, -4.757510662078857, -4.422796249389648, -4.088080883026123, -3.753366470336914, -3.418651819229126, -3.083937406539917, -2.749222755432129, -2.41450834274292, -2.079793930053711, -1.7450792789459229, -1.4103648662567139, -1.0756503343582153, -0.7409358620643616, -0.4062213897705078, -0.07150685787200928, 0.26320767402648926, 0.5979220867156982, 0.9326367378234863, 1.2673511505126953, 1.6020656824111938, 1.9367802143096924, 2.2714946269989014, 2.6062092781066895, 2.9409236907958984, 3.2756381034851074, 3.6103527545928955, 3.9450671672821045, 4.279781818389893, 4.614496231079102, 4.9492106437683105, 5.2839250564575195, 5.618639945983887, 5.9533538818359375, 6.288068771362305, 6.622783184051514]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 17.0, 32.0, 56.0, 70.0, 78.0, 101.0, 123.0, 105.0, 118.0, 86.0, 60.0, 46.0, 34.0, 28.0, 19.0, 11.0, 4.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.492469787597656, -6.327296733856201, -6.162123680114746, -5.996950626373291, -5.831777572631836, -5.666604518890381, -5.501431465148926, -5.336258411407471, -5.171085357666016, -5.0059123039245605, -4.8407392501831055, -4.67556619644165, -4.510393142700195, -4.34522008895874, -4.180047035217285, -4.01487398147583, -3.849700689315796, -3.684527635574341, -3.5193545818328857, -3.3541815280914307, -3.1890084743499756, -3.0238354206085205, -2.8586621284484863, -2.6934890747070312, -2.528316020965576, -2.363142967224121, -2.197969913482666, -2.032796859741211, -1.8676238059997559, -1.7024507522583008, -1.5372775793075562, -1.372104525566101, -1.2069315910339355, -1.0417585372924805, -0.8765854835510254, -0.7114123702049255, -0.5462393164634705, -0.3810662627220154, -0.21589314937591553, -0.05072009563446045, 0.11445295810699463, 0.2796260118484497, 0.4447990953922272, 0.6099721789360046, 0.7751452326774597, 0.9403182864189148, 1.1054913997650146, 1.2706644535064697, 1.4358375072479248, 1.6010105609893799, 1.766183614730835, 1.93135666847229, 2.096529722213745, 2.2617027759552, 2.4268760681152344, 2.5920491218566895, 2.7572221755981445, 2.9223952293395996, 3.0875682830810547, 3.2527413368225098, 3.417914390563965, 3.58308744430542, 3.748260498046875, 3.91343355178833, 4.078606605529785]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 6.0, 3.0, 7.0, 17.0, 17.0, 32.0, 41.0, 62.0, 119.0, 187.0, 330.0, 741.0, 1967.0, 6210.0, 27856.0, 228988.0, 690210.0, 73359.0, 12685.0, 3448.0, 1159.0, 445.0, 253.0, 136.0, 91.0, 59.0, 33.0, 27.0, 12.0, 5.0, 7.0, 8.0, 5.0, 6.0, 5.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.984375, -2.888885498046875, -2.79339599609375, -2.697906494140625, -2.6024169921875, -2.506927490234375, -2.41143798828125, -2.315948486328125, -2.220458984375, -2.124969482421875, -2.02947998046875, -1.933990478515625, -1.8385009765625, -1.743011474609375, -1.64752197265625, -1.552032470703125, -1.45654296875, -1.361053466796875, -1.26556396484375, -1.170074462890625, -1.0745849609375, -0.979095458984375, -0.88360595703125, -0.788116455078125, -0.692626953125, -0.597137451171875, -0.50164794921875, -0.406158447265625, -0.3106689453125, -0.215179443359375, -0.11968994140625, -0.024200439453125, 0.0712890625, 0.166778564453125, 0.26226806640625, 0.357757568359375, 0.4532470703125, 0.548736572265625, 0.64422607421875, 0.739715576171875, 0.835205078125, 0.930694580078125, 1.02618408203125, 1.121673583984375, 1.2171630859375, 1.312652587890625, 1.40814208984375, 1.503631591796875, 1.59912109375, 1.694610595703125, 1.79010009765625, 1.885589599609375, 1.9810791015625, 2.076568603515625, 2.17205810546875, 2.267547607421875, 2.363037109375, 2.458526611328125, 2.55401611328125, 2.649505615234375, 2.7449951171875, 2.840484619140625, 2.93597412109375, 3.031463623046875, 3.126953125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 6.0, 6.0, 8.0, 15.0, 10.0, 23.0, 20.0, 45.0, 45.0, 56.0, 59.0, 76.0, 69.0, 92.0, 73.0, 87.0, 64.0, 56.0, 53.0, 42.0, 22.0, 28.0, 19.0, 12.0, 9.0, 6.0, 5.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.85205078125, -0.8320808410644531, -0.8121109008789062, -0.7921409606933594, -0.7721710205078125, -0.7522010803222656, -0.7322311401367188, -0.7122611999511719, -0.692291259765625, -0.6723213195800781, -0.6523513793945312, -0.6323814392089844, -0.6124114990234375, -0.5924415588378906, -0.5724716186523438, -0.5525016784667969, -0.53253173828125, -0.5125617980957031, -0.49259185791015625, -0.4726219177246094, -0.4526519775390625, -0.4326820373535156, -0.41271209716796875, -0.3927421569824219, -0.372772216796875, -0.3528022766113281, -0.33283233642578125, -0.3128623962402344, -0.2928924560546875, -0.2729225158691406, -0.25295257568359375, -0.23298263549804688, -0.2130126953125, -0.19304275512695312, -0.17307281494140625, -0.15310287475585938, -0.1331329345703125, -0.11316299438476562, -0.09319305419921875, -0.07322311401367188, -0.053253173828125, -0.033283233642578125, -0.01331329345703125, 0.006656646728515625, 0.0266265869140625, 0.046596527099609375, 0.06656646728515625, 0.08653640747070312, 0.10650634765625, 0.12647628784179688, 0.14644622802734375, 0.16641616821289062, 0.1863861083984375, 0.20635604858398438, 0.22632598876953125, 0.24629592895507812, 0.266265869140625, 0.2862358093261719, 0.30620574951171875, 0.3261756896972656, 0.3461456298828125, 0.3661155700683594, 0.38608551025390625, 0.4060554504394531, 0.426025390625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 4.0, 2.0, 2.0, 4.0, 6.0, 4.0, 8.0, 6.0, 14.0, 20.0, 22.0, 39.0, 52.0, 76.0, 98.0, 126.0, 214.0, 384.0, 656.0, 1172.0, 2376.0, 4935.0, 10916.0, 25491.0, 68823.0, 228590.0, 473461.0, 147477.0, 48372.0, 18713.0, 8237.0, 3863.0, 1872.0, 1008.0, 534.0, 313.0, 199.0, 135.0, 104.0, 70.0, 42.0, 25.0, 21.0, 20.0, 15.0, 13.0, 9.0, 5.0, 7.0, 5.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-1.2880859375, -1.2505645751953125, -1.213043212890625, -1.1755218505859375, -1.13800048828125, -1.1004791259765625, -1.062957763671875, -1.0254364013671875, -0.9879150390625, -0.9503936767578125, -0.912872314453125, -0.8753509521484375, -0.83782958984375, -0.8003082275390625, -0.762786865234375, -0.7252655029296875, -0.687744140625, -0.6502227783203125, -0.612701416015625, -0.5751800537109375, -0.53765869140625, -0.5001373291015625, -0.462615966796875, -0.4250946044921875, -0.3875732421875, -0.3500518798828125, -0.312530517578125, -0.2750091552734375, -0.23748779296875, -0.1999664306640625, -0.162445068359375, -0.1249237060546875, -0.08740234375, -0.0498809814453125, -0.012359619140625, 0.0251617431640625, 0.06268310546875, 0.1002044677734375, 0.137725830078125, 0.1752471923828125, 0.2127685546875, 0.2502899169921875, 0.287811279296875, 0.3253326416015625, 0.36285400390625, 0.4003753662109375, 0.437896728515625, 0.4754180908203125, 0.512939453125, 0.5504608154296875, 0.587982177734375, 0.6255035400390625, 0.66302490234375, 0.7005462646484375, 0.738067626953125, 0.7755889892578125, 0.8131103515625, 0.8506317138671875, 0.888153076171875, 0.9256744384765625, 0.96319580078125, 1.0007171630859375, 1.038238525390625, 1.0757598876953125, 1.11328125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 0.0, 3.0, 2.0, 6.0, 7.0, 14.0, 11.0, 10.0, 18.0, 7.0, 27.0, 25.0, 32.0, 41.0, 48.0, 39.0, 51.0, 47.0, 32.0, 41.0, 59.0, 50.0, 52.0, 39.0, 46.0, 38.0, 40.0, 41.0, 24.0, 38.0, 22.0, 17.0, 17.0, 19.0, 9.0, 9.0, 7.0, 2.0, 7.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.572265625, -1.52178955078125, -1.4713134765625, -1.42083740234375, -1.370361328125, -1.31988525390625, -1.2694091796875, -1.21893310546875, -1.16845703125, -1.11798095703125, -1.0675048828125, -1.01702880859375, -0.966552734375, -0.91607666015625, -0.8656005859375, -0.81512451171875, -0.7646484375, -0.71417236328125, -0.6636962890625, -0.61322021484375, -0.562744140625, -0.51226806640625, -0.4617919921875, -0.41131591796875, -0.36083984375, -0.31036376953125, -0.2598876953125, -0.20941162109375, -0.158935546875, -0.10845947265625, -0.0579833984375, -0.00750732421875, 0.04296875, 0.09344482421875, 0.1439208984375, 0.19439697265625, 0.244873046875, 0.29534912109375, 0.3458251953125, 0.39630126953125, 0.44677734375, 0.49725341796875, 0.5477294921875, 0.59820556640625, 0.648681640625, 0.69915771484375, 0.7496337890625, 0.80010986328125, 0.8505859375, 0.90106201171875, 0.9515380859375, 1.00201416015625, 1.052490234375, 1.10296630859375, 1.1534423828125, 1.20391845703125, 1.25439453125, 1.30487060546875, 1.3553466796875, 1.40582275390625, 1.456298828125, 1.50677490234375, 1.5572509765625, 1.60772705078125, 1.658203125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 4.0, 2.0, 0.0, 1.0, 2.0, 3.0, 6.0, 6.0, 12.0, 19.0, 22.0, 52.0, 90.0, 161.0, 370.0, 705.0, 1698.0, 5166.0, 22675.0, 255177.0, 696371.0, 52435.0, 9080.0, 2587.0, 984.0, 427.0, 246.0, 103.0, 64.0, 33.0, 22.0, 15.0, 10.0, 6.0, 1.0, 2.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.037109375, -1.0084686279296875, -0.979827880859375, -0.9511871337890625, -0.92254638671875, -0.8939056396484375, -0.865264892578125, -0.8366241455078125, -0.8079833984375, -0.7793426513671875, -0.750701904296875, -0.7220611572265625, -0.69342041015625, -0.6647796630859375, -0.636138916015625, -0.6074981689453125, -0.578857421875, -0.5502166748046875, -0.521575927734375, -0.4929351806640625, -0.46429443359375, -0.4356536865234375, -0.407012939453125, -0.3783721923828125, -0.3497314453125, -0.3210906982421875, -0.292449951171875, -0.2638092041015625, -0.23516845703125, -0.2065277099609375, -0.177886962890625, -0.1492462158203125, -0.12060546875, -0.0919647216796875, -0.063323974609375, -0.0346832275390625, -0.00604248046875, 0.0225982666015625, 0.051239013671875, 0.0798797607421875, 0.1085205078125, 0.1371612548828125, 0.165802001953125, 0.1944427490234375, 0.22308349609375, 0.2517242431640625, 0.280364990234375, 0.3090057373046875, 0.337646484375, 0.3662872314453125, 0.394927978515625, 0.4235687255859375, 0.45220947265625, 0.4808502197265625, 0.509490966796875, 0.5381317138671875, 0.5667724609375, 0.5954132080078125, 0.624053955078125, 0.6526947021484375, 0.68133544921875, 0.7099761962890625, 0.738616943359375, 0.7672576904296875, 0.7958984375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 7.0, 20.0, 52.0, 88.0, 362.0, 334.0, 75.0, 29.0, 7.0, 6.0, 9.0, 6.0, 3.0, 2.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003361701965332031, -0.0003208667039871216, -0.00030556321144104004, -0.0002902597188949585, -0.00027495622634887695, -0.0002596527338027954, -0.00024434924125671387, -0.00022904574871063232, -0.00021374225616455078, -0.00019843876361846924, -0.0001831352710723877, -0.00016783177852630615, -0.0001525282859802246, -0.00013722479343414307, -0.00012192130088806152, -0.00010661780834197998, -9.131431579589844e-05, -7.60108232498169e-05, -6.070733070373535e-05, -4.540383815765381e-05, -3.0100345611572266e-05, -1.4796853065490723e-05, 5.066394805908203e-07, 1.5810132026672363e-05, 3.1113624572753906e-05, 4.641711711883545e-05, 6.172060966491699e-05, 7.702410221099854e-05, 9.232759475708008e-05, 0.00010763108730316162, 0.00012293457984924316, 0.0001382380723953247, 0.00015354156494140625, 0.0001688450574874878, 0.00018414855003356934, 0.00019945204257965088, 0.00021475553512573242, 0.00023005902767181396, 0.0002453625202178955, 0.00026066601276397705, 0.0002759695053100586, 0.00029127299785614014, 0.0003065764904022217, 0.0003218799829483032, 0.00033718347549438477, 0.0003524869680404663, 0.00036779046058654785, 0.0003830939531326294, 0.00039839744567871094, 0.0004137009382247925, 0.000429004430770874, 0.00044430792331695557, 0.0004596114158630371, 0.00047491490840911865, 0.0004902184009552002, 0.0005055218935012817, 0.0005208253860473633, 0.0005361288785934448, 0.0005514323711395264, 0.0005667358636856079, 0.0005820393562316895, 0.000597342848777771, 0.0006126463413238525, 0.0006279498338699341, 0.0006432533264160156]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 3.0, 3.0, 14.0, 17.0, 31.0, 51.0, 55.0, 87.0, 158.0, 350.0, 684.0, 1868.0, 6061.0, 36254.0, 691687.0, 286008.0, 18615.0, 3946.0, 1415.0, 583.0, 255.0, 136.0, 82.0, 49.0, 47.0, 31.0, 24.0, 13.0, 8.0, 6.0, 5.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.78125, -0.7470550537109375, -0.712860107421875, -0.6786651611328125, -0.64447021484375, -0.6102752685546875, -0.576080322265625, -0.5418853759765625, -0.5076904296875, -0.4734954833984375, -0.439300537109375, -0.4051055908203125, -0.37091064453125, -0.3367156982421875, -0.302520751953125, -0.2683258056640625, -0.234130859375, -0.1999359130859375, -0.165740966796875, -0.1315460205078125, -0.09735107421875, -0.0631561279296875, -0.028961181640625, 0.0052337646484375, 0.0394287109375, 0.0736236572265625, 0.107818603515625, 0.1420135498046875, 0.17620849609375, 0.2104034423828125, 0.244598388671875, 0.2787933349609375, 0.31298828125, 0.3471832275390625, 0.381378173828125, 0.4155731201171875, 0.44976806640625, 0.4839630126953125, 0.518157958984375, 0.5523529052734375, 0.5865478515625, 0.6207427978515625, 0.654937744140625, 0.6891326904296875, 0.72332763671875, 0.7575225830078125, 0.791717529296875, 0.8259124755859375, 0.860107421875, 0.8943023681640625, 0.928497314453125, 0.9626922607421875, 0.99688720703125, 1.0310821533203125, 1.065277099609375, 1.0994720458984375, 1.1336669921875, 1.1678619384765625, 1.202056884765625, 1.2362518310546875, 1.27044677734375, 1.3046417236328125, 1.338836669921875, 1.3730316162109375, 1.4072265625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 6.0, 12.0, 11.0, 13.0, 23.0, 43.0, 56.0, 85.0, 119.0, 140.0, 140.0, 114.0, 69.0, 63.0, 35.0, 24.0, 19.0, 6.0, 10.0, 7.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53662109375, -0.5140762329101562, -0.4915313720703125, -0.46898651123046875, -0.446441650390625, -0.42389678955078125, -0.4013519287109375, -0.37880706787109375, -0.35626220703125, -0.33371734619140625, -0.3111724853515625, -0.28862762451171875, -0.266082763671875, -0.24353790283203125, -0.2209930419921875, -0.19844818115234375, -0.1759033203125, -0.15335845947265625, -0.1308135986328125, -0.10826873779296875, -0.085723876953125, -0.06317901611328125, -0.0406341552734375, -0.01808929443359375, 0.00445556640625, 0.02700042724609375, 0.0495452880859375, 0.07209014892578125, 0.094635009765625, 0.11717987060546875, 0.1397247314453125, 0.16226959228515625, 0.184814453125, 0.20735931396484375, 0.2299041748046875, 0.25244903564453125, 0.274993896484375, 0.29753875732421875, 0.3200836181640625, 0.34262847900390625, 0.36517333984375, 0.38771820068359375, 0.4102630615234375, 0.43280792236328125, 0.455352783203125, 0.47789764404296875, 0.5004425048828125, 0.5229873657226562, 0.5455322265625, 0.5680770874023438, 0.5906219482421875, 0.6131668090820312, 0.635711669921875, 0.6582565307617188, 0.6808013916015625, 0.7033462524414062, 0.72589111328125, 0.7484359741210938, 0.7709808349609375, 0.7935256958007812, 0.816070556640625, 0.8386154174804688, 0.8611602783203125, 0.8837051391601562, 0.90625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 15.0, 38.0, 139.0, 325.0, 329.0, 112.0, 35.0, 7.0, 8.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.15423583984375, -19.311105728149414, -18.467975616455078, -17.624845504760742, -16.781715393066406, -15.93858528137207, -15.095455169677734, -14.252325057983398, -13.409194946289062, -12.566064834594727, -11.72293472290039, -10.879804611206055, -10.036674499511719, -9.193544387817383, -8.350414276123047, -7.507283687591553, -6.664153099060059, -5.821022987365723, -4.977892875671387, -4.134762763977051, -3.2916324138641357, -2.4485020637512207, -1.6053719520568848, -0.7622418403625488, 0.08088827133178711, 0.9240184426307678, 1.7671486139297485, 2.610278844833374, 3.45340895652771, 4.296539306640625, 5.139669418334961, 5.982799530029297, 6.825929641723633, 7.669059753417969, 8.512189865112305, 9.35531997680664, 10.198450088500977, 11.041580200195312, 11.884710311889648, 12.727840423583984, 13.57097053527832, 14.414100646972656, 15.257230758666992, 16.100360870361328, 16.943490982055664, 17.78662109375, 18.629751205444336, 19.472881317138672, 20.31601333618164, 21.159143447875977, 22.002273559570312, 22.84540367126465, 23.688533782958984, 24.53166389465332, 25.374794006347656, 26.217924118041992, 27.061054229736328, 27.904184341430664, 28.747314453125, 29.590444564819336, 30.433574676513672, 31.276704788208008, 32.119834899902344, 32.96296691894531, 33.806095123291016]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 4.0, 15.0, 19.0, 8.0, 19.0, 10.0, 16.0, 17.0, 24.0, 15.0, 21.0, 24.0, 39.0, 43.0, 31.0, 39.0, 47.0, 59.0, 48.0, 35.0, 29.0, 42.0, 43.0, 40.0, 41.0, 31.0, 25.0, 37.0, 27.0, 22.0, 21.0, 14.0, 17.0, 17.0, 14.0, 8.0, 7.0, 6.0, 8.0, 4.0, 5.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.675537109375, -5.465715408325195, -5.255893230438232, -5.046071529388428, -4.836249828338623, -4.62642765045166, -4.4166059494018555, -4.206784248352051, -3.996962308883667, -3.787140369415283, -3.5773186683654785, -3.3674967288970947, -3.157674789428711, -2.9478530883789062, -2.7380311489105225, -2.5282092094421387, -2.318387508392334, -2.10856556892395, -1.8987438678741455, -1.6889219284057617, -1.4791001081466675, -1.2692782878875732, -1.0594563484191895, -0.8496345281600952, -0.639812707901001, -0.42999085783958435, -0.22016900777816772, -0.010347127914428711, 0.19947469234466553, 0.40929651260375977, 0.6191184520721436, 0.8289402723312378, 1.0387616157531738, 1.248583436012268, 1.4584052562713623, 1.668227195739746, 1.8780490159988403, 2.0878708362579346, 2.2976927757263184, 2.507514476776123, 2.717336416244507, 2.9271583557128906, 3.1369800567626953, 3.346801996231079, 3.556623935699463, 3.7664456367492676, 3.9762675762176514, 4.186089515686035, 4.39591121673584, 4.6057329177856445, 4.815555095672607, 5.025376796722412, 5.235198497772217, 5.44502067565918, 5.654842376708984, 5.864664077758789, 6.074485778808594, 6.284307479858398, 6.494129657745361, 6.703951358795166, 6.913773059844971, 7.123595237731934, 7.333416938781738, 7.543238639831543, 7.753060817718506]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 7.0, 3.0, 6.0, 9.0, 7.0, 12.0, 18.0, 15.0, 23.0, 36.0, 46.0, 83.0, 118.0, 190.0, 389.0, 713.0, 1787.0, 6537.0, 47092.0, 4102204.0, 26999.0, 4943.0, 1624.0, 661.0, 332.0, 177.0, 101.0, 63.0, 31.0, 17.0, 11.0, 13.0, 10.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.40625, -9.184326171875, -8.96240234375, -8.740478515625, -8.5185546875, -8.296630859375, -8.07470703125, -7.852783203125, -7.630859375, -7.408935546875, -7.18701171875, -6.965087890625, -6.7431640625, -6.521240234375, -6.29931640625, -6.077392578125, -5.85546875, -5.633544921875, -5.41162109375, -5.189697265625, -4.9677734375, -4.745849609375, -4.52392578125, -4.302001953125, -4.080078125, -3.858154296875, -3.63623046875, -3.414306640625, -3.1923828125, -2.970458984375, -2.74853515625, -2.526611328125, -2.3046875, -2.082763671875, -1.86083984375, -1.638916015625, -1.4169921875, -1.195068359375, -0.97314453125, -0.751220703125, -0.529296875, -0.307373046875, -0.08544921875, 0.136474609375, 0.3583984375, 0.580322265625, 0.80224609375, 1.024169921875, 1.24609375, 1.468017578125, 1.68994140625, 1.911865234375, 2.1337890625, 2.355712890625, 2.57763671875, 2.799560546875, 3.021484375, 3.243408203125, 3.46533203125, 3.687255859375, 3.9091796875, 4.131103515625, 4.35302734375, 4.574951171875, 4.796875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 7.0, 7.0, 10.0, 13.0, 16.0, 21.0, 32.0, 29.0, 35.0, 43.0, 55.0, 62.0, 55.0, 59.0, 68.0, 61.0, 69.0, 57.0, 49.0, 43.0, 49.0, 42.0, 35.0, 25.0, 18.0, 13.0, 9.0, 12.0, 3.0, 3.0, 7.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.7412109375, -0.72308349609375, -0.7049560546875, -0.68682861328125, -0.668701171875, -0.65057373046875, -0.6324462890625, -0.61431884765625, -0.59619140625, -0.57806396484375, -0.5599365234375, -0.54180908203125, -0.523681640625, -0.50555419921875, -0.4874267578125, -0.46929931640625, -0.451171875, -0.43304443359375, -0.4149169921875, -0.39678955078125, -0.378662109375, -0.36053466796875, -0.3424072265625, -0.32427978515625, -0.30615234375, -0.28802490234375, -0.2698974609375, -0.25177001953125, -0.233642578125, -0.21551513671875, -0.1973876953125, -0.17926025390625, -0.1611328125, -0.14300537109375, -0.1248779296875, -0.10675048828125, -0.088623046875, -0.07049560546875, -0.0523681640625, -0.03424072265625, -0.01611328125, 0.00201416015625, 0.0201416015625, 0.03826904296875, 0.056396484375, 0.07452392578125, 0.0926513671875, 0.11077880859375, 0.12890625, 0.14703369140625, 0.1651611328125, 0.18328857421875, 0.201416015625, 0.21954345703125, 0.2376708984375, 0.25579833984375, 0.27392578125, 0.29205322265625, 0.3101806640625, 0.32830810546875, 0.346435546875, 0.36456298828125, 0.3826904296875, 0.40081787109375, 0.4189453125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 2.0, 2.0, 4.0, 7.0, 1.0, 2.0, 5.0, 7.0, 7.0, 8.0, 16.0, 17.0, 29.0, 15.0, 29.0, 38.0, 35.0, 58.0, 76.0, 62.0, 113.0, 130.0, 153.0, 236.0, 403.0, 828.0, 2065.0, 6495.0, 30111.0, 3994692.0, 138101.0, 13738.0, 3645.0, 1317.0, 594.0, 320.0, 193.0, 150.0, 124.0, 81.0, 65.0, 54.0, 48.0, 45.0, 33.0, 30.0, 26.0, 23.0, 16.0, 14.0, 6.0, 8.0, 3.0, 7.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.66015625, -4.5179443359375, -4.375732421875, -4.2335205078125, -4.09130859375, -3.9490966796875, -3.806884765625, -3.6646728515625, -3.5224609375, -3.3802490234375, -3.238037109375, -3.0958251953125, -2.95361328125, -2.8114013671875, -2.669189453125, -2.5269775390625, -2.384765625, -2.2425537109375, -2.100341796875, -1.9581298828125, -1.81591796875, -1.6737060546875, -1.531494140625, -1.3892822265625, -1.2470703125, -1.1048583984375, -0.962646484375, -0.8204345703125, -0.67822265625, -0.5360107421875, -0.393798828125, -0.2515869140625, -0.109375, 0.0328369140625, 0.175048828125, 0.3172607421875, 0.45947265625, 0.6016845703125, 0.743896484375, 0.8861083984375, 1.0283203125, 1.1705322265625, 1.312744140625, 1.4549560546875, 1.59716796875, 1.7393798828125, 1.881591796875, 2.0238037109375, 2.166015625, 2.3082275390625, 2.450439453125, 2.5926513671875, 2.73486328125, 2.8770751953125, 3.019287109375, 3.1614990234375, 3.3037109375, 3.4459228515625, 3.588134765625, 3.7303466796875, 3.87255859375, 4.0147705078125, 4.156982421875, 4.2991943359375, 4.44140625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 14.0, 15.0, 24.0, 69.0, 2852.0, 974.0, 65.0, 29.0, 11.0, 13.0, 3.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.224609375, -2.14508056640625, -2.0655517578125, -1.98602294921875, -1.906494140625, -1.82696533203125, -1.7474365234375, -1.66790771484375, -1.58837890625, -1.50885009765625, -1.4293212890625, -1.34979248046875, -1.270263671875, -1.19073486328125, -1.1112060546875, -1.03167724609375, -0.9521484375, -0.87261962890625, -0.7930908203125, -0.71356201171875, -0.634033203125, -0.55450439453125, -0.4749755859375, -0.39544677734375, -0.31591796875, -0.23638916015625, -0.1568603515625, -0.07733154296875, 0.002197265625, 0.08172607421875, 0.1612548828125, 0.24078369140625, 0.3203125, 0.39984130859375, 0.4793701171875, 0.55889892578125, 0.638427734375, 0.71795654296875, 0.7974853515625, 0.87701416015625, 0.95654296875, 1.03607177734375, 1.1156005859375, 1.19512939453125, 1.274658203125, 1.35418701171875, 1.4337158203125, 1.51324462890625, 1.5927734375, 1.67230224609375, 1.7518310546875, 1.83135986328125, 1.910888671875, 1.99041748046875, 2.0699462890625, 2.14947509765625, 2.22900390625, 2.30853271484375, 2.3880615234375, 2.46759033203125, 2.547119140625, 2.62664794921875, 2.7061767578125, 2.78570556640625, 2.865234375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 4.0, 11.0, 13.0, 62.0, 415.0, 384.0, 77.0, 19.0, 7.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.472673416137695, -14.973182678222656, -14.473692893981934, -13.974202156066895, -13.474712371826172, -12.975221633911133, -12.475730895996094, -11.976241111755371, -11.476751327514648, -10.97726058959961, -10.477770805358887, -9.978280067443848, -9.478790283203125, -8.979299545288086, -8.479808807373047, -7.980319023132324, -7.480828285217285, -6.981338024139404, -6.481847763061523, -5.982357025146484, -5.482867240905762, -4.983376502990723, -4.483886241912842, -3.984395980834961, -3.48490571975708, -2.985415458679199, -2.4859251976013184, -1.9864346981048584, -1.4869444370269775, -0.9874541759490967, -0.4879636764526367, 0.01152658462524414, 0.511016845703125, 1.0105071067810059, 1.5099974870681763, 2.0094878673553467, 2.5089781284332275, 3.0084683895111084, 3.5079588890075684, 4.007449150085449, 4.50693941116333, 5.006429672241211, 5.505919933319092, 6.005410194396973, 6.504900932312012, 7.004390716552734, 7.503881454467773, 8.003372192382812, 8.502861976623535, 9.002352714538574, 9.501842498779297, 10.001333236694336, 10.500823020935059, 11.000313758850098, 11.49980354309082, 11.99929428100586, 12.498785018920898, 12.998275756835938, 13.49776554107666, 13.9972562789917, 14.496746063232422, 14.996236801147461, 15.4957275390625, 15.995217323303223, 16.494707107543945]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 13.0, 10.0, 24.0, 40.0, 60.0, 74.0, 85.0, 112.0, 106.0, 138.0, 103.0, 73.0, 56.0, 34.0, 30.0, 19.0, 11.0, 6.0, 0.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.909114837646484, -6.7165069580078125, -6.523898601531982, -6.3312907218933105, -6.1386823654174805, -5.946074485778809, -5.753466606140137, -5.560858249664307, -5.368250370025635, -5.175642490386963, -4.983034133911133, -4.790426254272461, -4.597817897796631, -4.405210018157959, -4.212601661682129, -4.019993782043457, -3.827385663986206, -3.634777545928955, -3.442169427871704, -3.249561309814453, -3.0569534301757812, -2.8643453121185303, -2.6717371940612793, -2.4791293144226074, -2.2865209579467773, -2.0939128398895264, -1.901304841041565, -1.708696722984314, -1.5160887241363525, -1.3234806060791016, -1.1308724880218506, -0.9382644891738892, -0.7456564903259277, -0.5530484318733215, -0.36044034361839294, -0.16783225536346436, 0.024775803089141846, 0.21738386154174805, 0.409991979598999, 0.6025999784469604, 0.7952080965042114, 0.9878161549568176, 1.1804242134094238, 1.3730323314666748, 1.5656404495239258, 1.7582484483718872, 1.9508565664291382, 2.1434645652770996, 2.3360726833343506, 2.5286808013916016, 2.7212889194488525, 2.9138970375061035, 3.1065049171447754, 3.2991130352020264, 3.4917211532592773, 3.684329032897949, 3.8769373893737793, 4.069545269012451, 4.262153625488281, 4.454761505126953, 4.647369861602783, 4.839977741241455, 5.032586097717285, 5.225193977355957, 5.417801856994629]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 7.0, 5.0, 6.0, 4.0, 11.0, 10.0, 18.0, 29.0, 33.0, 67.0, 98.0, 153.0, 301.0, 573.0, 1422.0, 4013.0, 16637.0, 102568.0, 709216.0, 179468.0, 24794.0, 5812.0, 1766.0, 742.0, 325.0, 200.0, 100.0, 57.0, 32.0, 33.0, 16.0, 11.0, 12.0, 6.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.935546875, -2.82928466796875, -2.7230224609375, -2.61676025390625, -2.510498046875, -2.40423583984375, -2.2979736328125, -2.19171142578125, -2.08544921875, -1.97918701171875, -1.8729248046875, -1.76666259765625, -1.660400390625, -1.55413818359375, -1.4478759765625, -1.34161376953125, -1.2353515625, -1.12908935546875, -1.0228271484375, -0.91656494140625, -0.810302734375, -0.70404052734375, -0.5977783203125, -0.49151611328125, -0.38525390625, -0.27899169921875, -0.1727294921875, -0.06646728515625, 0.039794921875, 0.14605712890625, 0.2523193359375, 0.35858154296875, 0.46484375, 0.57110595703125, 0.6773681640625, 0.78363037109375, 0.889892578125, 0.99615478515625, 1.1024169921875, 1.20867919921875, 1.31494140625, 1.42120361328125, 1.5274658203125, 1.63372802734375, 1.739990234375, 1.84625244140625, 1.9525146484375, 2.05877685546875, 2.1650390625, 2.27130126953125, 2.3775634765625, 2.48382568359375, 2.590087890625, 2.69635009765625, 2.8026123046875, 2.90887451171875, 3.01513671875, 3.12139892578125, 3.2276611328125, 3.33392333984375, 3.440185546875, 3.54644775390625, 3.6527099609375, 3.75897216796875, 3.865234375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 6.0, 5.0, 13.0, 24.0, 16.0, 21.0, 39.0, 30.0, 40.0, 46.0, 60.0, 53.0, 74.0, 84.0, 75.0, 64.0, 65.0, 61.0, 53.0, 44.0, 29.0, 28.0, 20.0, 12.0, 16.0, 5.0, 9.0, 4.0, 2.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.8427734375, -0.8220901489257812, -0.8014068603515625, -0.7807235717773438, -0.760040283203125, -0.7393569946289062, -0.7186737060546875, -0.6979904174804688, -0.67730712890625, -0.6566238403320312, -0.6359405517578125, -0.6152572631835938, -0.594573974609375, -0.5738906860351562, -0.5532073974609375, -0.5325241088867188, -0.5118408203125, -0.49115753173828125, -0.4704742431640625, -0.44979095458984375, -0.429107666015625, -0.40842437744140625, -0.3877410888671875, -0.36705780029296875, -0.34637451171875, -0.32569122314453125, -0.3050079345703125, -0.28432464599609375, -0.263641357421875, -0.24295806884765625, -0.2222747802734375, -0.20159149169921875, -0.180908203125, -0.16022491455078125, -0.1395416259765625, -0.11885833740234375, -0.098175048828125, -0.07749176025390625, -0.0568084716796875, -0.03612518310546875, -0.01544189453125, 0.00524139404296875, 0.0259246826171875, 0.04660797119140625, 0.067291259765625, 0.08797454833984375, 0.1086578369140625, 0.12934112548828125, 0.1500244140625, 0.17070770263671875, 0.1913909912109375, 0.21207427978515625, 0.232757568359375, 0.25344085693359375, 0.2741241455078125, 0.29480743408203125, 0.31549072265625, 0.33617401123046875, 0.3568572998046875, 0.37754058837890625, 0.398223876953125, 0.41890716552734375, 0.4395904541015625, 0.46027374267578125, 0.48095703125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 6.0, 5.0, 5.0, 9.0, 10.0, 16.0, 16.0, 39.0, 47.0, 52.0, 82.0, 110.0, 198.0, 273.0, 440.0, 663.0, 1109.0, 1838.0, 3332.0, 6492.0, 12614.0, 26604.0, 61349.0, 161705.0, 393926.0, 226838.0, 82040.0, 34450.0, 15997.0, 8051.0, 4208.0, 2394.0, 1323.0, 826.0, 506.0, 338.0, 203.0, 137.0, 86.0, 64.0, 47.0, 33.0, 19.0, 17.0, 9.0, 6.0, 6.0, 4.0, 6.0, 8.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.04296875, -1.0100250244140625, -0.977081298828125, -0.9441375732421875, -0.91119384765625, -0.8782501220703125, -0.845306396484375, -0.8123626708984375, -0.7794189453125, -0.7464752197265625, -0.713531494140625, -0.6805877685546875, -0.64764404296875, -0.6147003173828125, -0.581756591796875, -0.5488128662109375, -0.515869140625, -0.4829254150390625, -0.449981689453125, -0.4170379638671875, -0.38409423828125, -0.3511505126953125, -0.318206787109375, -0.2852630615234375, -0.2523193359375, -0.2193756103515625, -0.186431884765625, -0.1534881591796875, -0.12054443359375, -0.0876007080078125, -0.054656982421875, -0.0217132568359375, 0.01123046875, 0.0441741943359375, 0.077117919921875, 0.1100616455078125, 0.14300537109375, 0.1759490966796875, 0.208892822265625, 0.2418365478515625, 0.2747802734375, 0.3077239990234375, 0.340667724609375, 0.3736114501953125, 0.40655517578125, 0.4394989013671875, 0.472442626953125, 0.5053863525390625, 0.538330078125, 0.5712738037109375, 0.604217529296875, 0.6371612548828125, 0.67010498046875, 0.7030487060546875, 0.735992431640625, 0.7689361572265625, 0.8018798828125, 0.8348236083984375, 0.867767333984375, 0.9007110595703125, 0.93365478515625, 0.9665985107421875, 0.999542236328125, 1.0324859619140625, 1.0654296875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 6.0, 4.0, 7.0, 13.0, 14.0, 13.0, 15.0, 26.0, 28.0, 18.0, 23.0, 28.0, 45.0, 45.0, 46.0, 45.0, 44.0, 39.0, 53.0, 61.0, 42.0, 43.0, 39.0, 46.0, 42.0, 31.0, 26.0, 25.0, 15.0, 22.0, 16.0, 16.0, 13.0, 13.0, 11.0, 7.0, 6.0, 7.0, 2.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9189453125, -1.8578033447265625, -1.796661376953125, -1.7355194091796875, -1.67437744140625, -1.6132354736328125, -1.552093505859375, -1.4909515380859375, -1.4298095703125, -1.3686676025390625, -1.307525634765625, -1.2463836669921875, -1.18524169921875, -1.1240997314453125, -1.062957763671875, -1.0018157958984375, -0.940673828125, -0.8795318603515625, -0.818389892578125, -0.7572479248046875, -0.69610595703125, -0.6349639892578125, -0.573822021484375, -0.5126800537109375, -0.4515380859375, -0.3903961181640625, -0.329254150390625, -0.2681121826171875, -0.20697021484375, -0.1458282470703125, -0.084686279296875, -0.0235443115234375, 0.03759765625, 0.0987396240234375, 0.159881591796875, 0.2210235595703125, 0.28216552734375, 0.3433074951171875, 0.404449462890625, 0.4655914306640625, 0.5267333984375, 0.5878753662109375, 0.649017333984375, 0.7101593017578125, 0.77130126953125, 0.8324432373046875, 0.893585205078125, 0.9547271728515625, 1.015869140625, 1.0770111083984375, 1.138153076171875, 1.1992950439453125, 1.26043701171875, 1.3215789794921875, 1.382720947265625, 1.4438629150390625, 1.5050048828125, 1.5661468505859375, 1.627288818359375, 1.6884307861328125, 1.74957275390625, 1.8107147216796875, 1.871856689453125, 1.9329986572265625, 1.994140625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 6.0, 11.0, 15.0, 12.0, 21.0, 44.0, 70.0, 130.0, 279.0, 562.0, 1400.0, 5085.0, 26108.0, 289807.0, 657764.0, 54906.0, 8559.0, 2220.0, 811.0, 350.0, 165.0, 101.0, 52.0, 37.0, 20.0, 8.0, 6.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8896484375, -0.859161376953125, -0.82867431640625, -0.798187255859375, -0.7677001953125, -0.737213134765625, -0.70672607421875, -0.676239013671875, -0.645751953125, -0.615264892578125, -0.58477783203125, -0.554290771484375, -0.5238037109375, -0.493316650390625, -0.46282958984375, -0.432342529296875, -0.40185546875, -0.371368408203125, -0.34088134765625, -0.310394287109375, -0.2799072265625, -0.249420166015625, -0.21893310546875, -0.188446044921875, -0.157958984375, -0.127471923828125, -0.09698486328125, -0.066497802734375, -0.0360107421875, -0.005523681640625, 0.02496337890625, 0.055450439453125, 0.0859375, 0.116424560546875, 0.14691162109375, 0.177398681640625, 0.2078857421875, 0.238372802734375, 0.26885986328125, 0.299346923828125, 0.329833984375, 0.360321044921875, 0.39080810546875, 0.421295166015625, 0.4517822265625, 0.482269287109375, 0.51275634765625, 0.543243408203125, 0.57373046875, 0.604217529296875, 0.63470458984375, 0.665191650390625, 0.6956787109375, 0.726165771484375, 0.75665283203125, 0.787139892578125, 0.817626953125, 0.848114013671875, 0.87860107421875, 0.909088134765625, 0.9395751953125, 0.970062255859375, 1.00054931640625, 1.031036376953125, 1.0615234375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 5.0, 1.0, 6.0, 5.0, 4.0, 8.0, 18.0, 16.0, 15.0, 20.0, 44.0, 52.0, 70.0, 102.0, 125.0, 125.0, 94.0, 79.0, 44.0, 51.0, 33.0, 23.0, 18.0, 12.0, 8.0, 7.0, 11.0, 3.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.208917617797852e-05, -8.839089423418045e-05, -8.469261229038239e-05, -8.099433034658432e-05, -7.729604840278625e-05, -7.359776645898819e-05, -6.989948451519012e-05, -6.620120257139206e-05, -6.2502920627594e-05, -5.880463868379593e-05, -5.5106356739997864e-05, -5.14080747961998e-05, -4.7709792852401733e-05, -4.401151090860367e-05, -4.03132289648056e-05, -3.661494702100754e-05, -3.291666507720947e-05, -2.9218383133411407e-05, -2.5520101189613342e-05, -2.1821819245815277e-05, -1.8123537302017212e-05, -1.4425255358219147e-05, -1.0726973414421082e-05, -7.028691470623016e-06, -3.330409526824951e-06, 3.67872416973114e-07, 4.066154360771179e-06, 7.764436304569244e-06, 1.146271824836731e-05, 1.5161000192165375e-05, 1.885928213596344e-05, 2.2557564079761505e-05, 2.625584602355957e-05, 2.9954127967357635e-05, 3.36524099111557e-05, 3.7350691854953766e-05, 4.104897379875183e-05, 4.4747255742549896e-05, 4.844553768634796e-05, 5.2143819630146027e-05, 5.584210157394409e-05, 5.954038351774216e-05, 6.323866546154022e-05, 6.693694740533829e-05, 7.063522934913635e-05, 7.433351129293442e-05, 7.803179323673248e-05, 8.173007518053055e-05, 8.542835712432861e-05, 8.912663906812668e-05, 9.282492101192474e-05, 9.652320295572281e-05, 0.00010022148489952087, 0.00010391976684331894, 0.000107618048787117, 0.00011131633073091507, 0.00011501461267471313, 0.0001187128946185112, 0.00012241117656230927, 0.00012610945850610733, 0.0001298077404499054, 0.00013350602239370346, 0.00013720430433750153, 0.0001409025862812996, 0.00014460086822509766]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 3.0, 7.0, 6.0, 8.0, 9.0, 19.0, 25.0, 49.0, 80.0, 131.0, 237.0, 475.0, 933.0, 2120.0, 5015.0, 13595.0, 45326.0, 228861.0, 560996.0, 141683.0, 31499.0, 10191.0, 3836.0, 1694.0, 786.0, 415.0, 216.0, 115.0, 83.0, 53.0, 35.0, 22.0, 10.0, 10.0, 11.0, 4.0, 3.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.73828125, -0.716796875, -0.6953125, -0.673828125, -0.65234375, -0.630859375, -0.609375, -0.587890625, -0.56640625, -0.544921875, -0.5234375, -0.501953125, -0.48046875, -0.458984375, -0.4375, -0.416015625, -0.39453125, -0.373046875, -0.3515625, -0.330078125, -0.30859375, -0.287109375, -0.265625, -0.244140625, -0.22265625, -0.201171875, -0.1796875, -0.158203125, -0.13671875, -0.115234375, -0.09375, -0.072265625, -0.05078125, -0.029296875, -0.0078125, 0.013671875, 0.03515625, 0.056640625, 0.078125, 0.099609375, 0.12109375, 0.142578125, 0.1640625, 0.185546875, 0.20703125, 0.228515625, 0.25, 0.271484375, 0.29296875, 0.314453125, 0.3359375, 0.357421875, 0.37890625, 0.400390625, 0.421875, 0.443359375, 0.46484375, 0.486328125, 0.5078125, 0.529296875, 0.55078125, 0.572265625, 0.59375, 0.615234375, 0.63671875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 2.0, 5.0, 8.0, 7.0, 7.0, 13.0, 16.0, 25.0, 30.0, 33.0, 50.0, 63.0, 77.0, 87.0, 102.0, 93.0, 74.0, 77.0, 56.0, 47.0, 26.0, 29.0, 12.0, 17.0, 10.0, 9.0, 5.0, 7.0, 6.0, 4.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56005859375, -0.5383529663085938, -0.5166473388671875, -0.49494171142578125, -0.473236083984375, -0.45153045654296875, -0.4298248291015625, -0.40811920166015625, -0.38641357421875, -0.36470794677734375, -0.3430023193359375, -0.32129669189453125, -0.299591064453125, -0.27788543701171875, -0.2561798095703125, -0.23447418212890625, -0.2127685546875, -0.19106292724609375, -0.1693572998046875, -0.14765167236328125, -0.125946044921875, -0.10424041748046875, -0.0825347900390625, -0.06082916259765625, -0.03912353515625, -0.01741790771484375, 0.0042877197265625, 0.02599334716796875, 0.047698974609375, 0.06940460205078125, 0.0911102294921875, 0.11281585693359375, 0.134521484375, 0.15622711181640625, 0.1779327392578125, 0.19963836669921875, 0.221343994140625, 0.24304962158203125, 0.2647552490234375, 0.28646087646484375, 0.30816650390625, 0.32987213134765625, 0.3515777587890625, 0.37328338623046875, 0.394989013671875, 0.41669464111328125, 0.4384002685546875, 0.46010589599609375, 0.4818115234375, 0.5035171508789062, 0.5252227783203125, 0.5469284057617188, 0.568634033203125, 0.5903396606445312, 0.6120452880859375, 0.6337509155273438, 0.65545654296875, 0.6771621704101562, 0.6988677978515625, 0.7205734252929688, 0.742279052734375, 0.7639846801757812, 0.7856903076171875, 0.8073959350585938, 0.8291015625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 7.0, 14.0, 22.0, 30.0, 45.0, 97.0, 148.0, 212.0, 178.0, 108.0, 62.0, 25.0, 24.0, 14.0, 5.0, 4.0, 4.0, 4.0, 4.0, 5.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.951412200927734, -6.431809902191162, -5.91220760345459, -5.392605781555176, -4.8730034828186035, -4.353401184082031, -3.833799123764038, -3.314197063446045, -2.7945947647094727, -2.2749924659729004, -1.7553904056549072, -1.2357882261276245, -0.7161860466003418, -0.19658374786376953, 0.32301831245422363, 0.8426203727722168, 1.362222671508789, 1.8818248510360718, 2.4014270305633545, 2.9210290908813477, 3.44063138961792, 3.960233688354492, 4.479835510253906, 4.9994378089904785, 5.519040107727051, 6.038642406463623, 6.558244705200195, 7.077846527099609, 7.597448825836182, 8.117051124572754, 8.636652946472168, 9.156255722045898, 9.675857543945312, 10.195459365844727, 10.715062141418457, 11.234663963317871, 11.754266738891602, 12.273868560791016, 12.79347038269043, 13.313072204589844, 13.832674980163574, 14.352276802062988, 14.871879577636719, 15.391481399536133, 15.911083221435547, 16.430686950683594, 16.950288772583008, 17.469890594482422, 17.989492416381836, 18.50909423828125, 19.028696060180664, 19.54829978942871, 20.067901611328125, 20.58750343322754, 21.107105255126953, 21.626707077026367, 22.14630889892578, 22.665910720825195, 23.18551254272461, 23.705116271972656, 24.22471809387207, 24.744319915771484, 25.2639217376709, 25.783523559570312, 26.30312728881836]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 8.0, 11.0, 11.0, 7.0, 12.0, 15.0, 14.0, 18.0, 26.0, 20.0, 26.0, 16.0, 33.0, 35.0, 25.0, 34.0, 38.0, 48.0, 41.0, 44.0, 43.0, 39.0, 38.0, 39.0, 43.0, 40.0, 32.0, 29.0, 24.0, 36.0, 20.0, 26.0, 20.0, 14.0, 17.0, 15.0, 12.0, 9.0, 7.0, 5.0, 5.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-10.637847900390625, -10.328468322753906, -10.019089698791504, -9.709711074829102, -9.400331497192383, -9.090951919555664, -8.781573295593262, -8.47219467163086, -8.16281509399414, -7.85343599319458, -7.5440568923950195, -7.234677791595459, -6.925298690795898, -6.615919589996338, -6.306540489196777, -5.997161388397217, -5.687782287597656, -5.378403186798096, -5.069024085998535, -4.759644985198975, -4.450265884399414, -4.1408867835998535, -3.831507682800293, -3.5221285820007324, -3.212749481201172, -2.9033703804016113, -2.593991279602051, -2.2846121788024902, -1.9752330780029297, -1.6658539772033691, -1.3564748764038086, -1.047095775604248, -0.7377157211303711, -0.42833662033081055, -0.11895751953125, 0.19042158126831055, 0.4998006820678711, 0.8091797828674316, 1.1185588836669922, 1.4279379844665527, 1.7373170852661133, 2.046696186065674, 2.3560752868652344, 2.665454387664795, 2.9748334884643555, 3.284212589263916, 3.5935916900634766, 3.902970790863037, 4.212349891662598, 4.521728992462158, 4.831108093261719, 5.140487194061279, 5.44986629486084, 5.7592453956604, 6.068624496459961, 6.3780035972595215, 6.687382698059082, 6.996761798858643, 7.306140899658203, 7.615520000457764, 7.924899101257324, 8.234277725219727, 8.543657302856445, 8.853036880493164, 9.162415504455566]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 7.0, 5.0, 3.0, 5.0, 12.0, 11.0, 4.0, 13.0, 16.0, 23.0, 36.0, 45.0, 74.0, 119.0, 210.0, 408.0, 1090.0, 3611.0, 17685.0, 4011008.0, 145358.0, 10059.0, 2634.0, 923.0, 459.0, 184.0, 110.0, 68.0, 35.0, 20.0, 14.0, 11.0, 7.0, 8.0, 1.0, 4.0, 4.0, 3.0], "bins": [-8.7265625, -8.53619384765625, -8.3458251953125, -8.15545654296875, -7.965087890625, -7.77471923828125, -7.5843505859375, -7.39398193359375, -7.20361328125, -7.01324462890625, -6.8228759765625, -6.63250732421875, -6.442138671875, -6.25177001953125, -6.0614013671875, -5.87103271484375, -5.6806640625, -5.49029541015625, -5.2999267578125, -5.10955810546875, -4.919189453125, -4.72882080078125, -4.5384521484375, -4.34808349609375, -4.15771484375, -3.96734619140625, -3.7769775390625, -3.58660888671875, -3.396240234375, -3.20587158203125, -3.0155029296875, -2.82513427734375, -2.634765625, -2.44439697265625, -2.2540283203125, -2.06365966796875, -1.873291015625, -1.68292236328125, -1.4925537109375, -1.30218505859375, -1.11181640625, -0.92144775390625, -0.7310791015625, -0.54071044921875, -0.350341796875, -0.15997314453125, 0.0303955078125, 0.22076416015625, 0.4111328125, 0.60150146484375, 0.7918701171875, 0.98223876953125, 1.172607421875, 1.36297607421875, 1.5533447265625, 1.74371337890625, 1.93408203125, 2.12445068359375, 2.3148193359375, 2.50518798828125, 2.695556640625, 2.88592529296875, 3.0762939453125, 3.26666259765625, 3.45703125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 4.0, 5.0, 8.0, 15.0, 16.0, 30.0, 24.0, 25.0, 41.0, 49.0, 53.0, 53.0, 53.0, 51.0, 49.0, 65.0, 62.0, 51.0, 45.0, 52.0, 55.0, 26.0, 36.0, 30.0, 22.0, 16.0, 20.0, 11.0, 9.0, 7.0, 7.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.84326171875, -0.8217697143554688, -0.8002777099609375, -0.7787857055664062, -0.757293701171875, -0.7358016967773438, -0.7143096923828125, -0.6928176879882812, -0.67132568359375, -0.6498336791992188, -0.6283416748046875, -0.6068496704101562, -0.585357666015625, -0.5638656616210938, -0.5423736572265625, -0.5208816528320312, -0.4993896484375, -0.47789764404296875, -0.4564056396484375, -0.43491363525390625, -0.413421630859375, -0.39192962646484375, -0.3704376220703125, -0.34894561767578125, -0.32745361328125, -0.30596160888671875, -0.2844696044921875, -0.26297760009765625, -0.241485595703125, -0.21999359130859375, -0.1985015869140625, -0.17700958251953125, -0.155517578125, -0.13402557373046875, -0.1125335693359375, -0.09104156494140625, -0.069549560546875, -0.04805755615234375, -0.0265655517578125, -0.00507354736328125, 0.01641845703125, 0.03791046142578125, 0.0594024658203125, 0.08089447021484375, 0.102386474609375, 0.12387847900390625, 0.1453704833984375, 0.16686248779296875, 0.1883544921875, 0.20984649658203125, 0.2313385009765625, 0.25283050537109375, 0.274322509765625, 0.29581451416015625, 0.3173065185546875, 0.33879852294921875, 0.36029052734375, 0.38178253173828125, 0.4032745361328125, 0.42476654052734375, 0.446258544921875, 0.46775054931640625, 0.4892425537109375, 0.5107345581054688, 0.5322265625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 1.0, 2.0, 6.0, 8.0, 12.0, 10.0, 25.0, 23.0, 29.0, 45.0, 43.0, 71.0, 121.0, 149.0, 195.0, 262.0, 396.0, 586.0, 985.0, 1690.0, 3390.0, 7604.0, 22448.0, 149516.0, 3900723.0, 76745.0, 16310.0, 5914.0, 2805.0, 1492.0, 904.0, 581.0, 352.0, 241.0, 167.0, 105.0, 65.0, 59.0, 51.0, 41.0, 24.0, 30.0, 10.0, 15.0, 12.0, 9.0, 2.0, 3.0, 5.0, 3.0, 2.0, 1.0, 3.0, 2.0], "bins": [-2.962890625, -2.876678466796875, -2.79046630859375, -2.704254150390625, -2.6180419921875, -2.531829833984375, -2.44561767578125, -2.359405517578125, -2.273193359375, -2.186981201171875, -2.10076904296875, -2.014556884765625, -1.9283447265625, -1.842132568359375, -1.75592041015625, -1.669708251953125, -1.58349609375, -1.497283935546875, -1.41107177734375, -1.324859619140625, -1.2386474609375, -1.152435302734375, -1.06622314453125, -0.980010986328125, -0.893798828125, -0.807586669921875, -0.72137451171875, -0.635162353515625, -0.5489501953125, -0.462738037109375, -0.37652587890625, -0.290313720703125, -0.2041015625, -0.117889404296875, -0.03167724609375, 0.054534912109375, 0.1407470703125, 0.226959228515625, 0.31317138671875, 0.399383544921875, 0.485595703125, 0.571807861328125, 0.65802001953125, 0.744232177734375, 0.8304443359375, 0.916656494140625, 1.00286865234375, 1.089080810546875, 1.17529296875, 1.261505126953125, 1.34771728515625, 1.433929443359375, 1.5201416015625, 1.606353759765625, 1.69256591796875, 1.778778076171875, 1.864990234375, 1.951202392578125, 2.03741455078125, 2.123626708984375, 2.2098388671875, 2.296051025390625, 2.38226318359375, 2.468475341796875, 2.5546875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 6.0, 7.0, 9.0, 8.0, 17.0, 16.0, 59.0, 81.0, 239.0, 3150.0, 277.0, 81.0, 51.0, 25.0, 14.0, 8.0, 5.0, 5.0, 7.0, 4.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.703125, -1.6492156982421875, -1.595306396484375, -1.5413970947265625, -1.48748779296875, -1.4335784912109375, -1.379669189453125, -1.3257598876953125, -1.2718505859375, -1.2179412841796875, -1.164031982421875, -1.1101226806640625, -1.05621337890625, -1.0023040771484375, -0.948394775390625, -0.8944854736328125, -0.840576171875, -0.7866668701171875, -0.732757568359375, -0.6788482666015625, -0.62493896484375, -0.5710296630859375, -0.517120361328125, -0.4632110595703125, -0.4093017578125, -0.3553924560546875, -0.301483154296875, -0.2475738525390625, -0.19366455078125, -0.1397552490234375, -0.085845947265625, -0.0319366455078125, 0.02197265625, 0.0758819580078125, 0.129791259765625, 0.1837005615234375, 0.23760986328125, 0.2915191650390625, 0.345428466796875, 0.3993377685546875, 0.4532470703125, 0.5071563720703125, 0.561065673828125, 0.6149749755859375, 0.66888427734375, 0.7227935791015625, 0.776702880859375, 0.8306121826171875, 0.884521484375, 0.9384307861328125, 0.992340087890625, 1.0462493896484375, 1.10015869140625, 1.1540679931640625, 1.207977294921875, 1.2618865966796875, 1.3157958984375, 1.3697052001953125, 1.423614501953125, 1.4775238037109375, 1.53143310546875, 1.5853424072265625, 1.639251708984375, 1.6931610107421875, 1.7470703125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 1.0, 10.0, 17.0, 41.0, 212.0, 493.0, 154.0, 50.0, 16.0, 7.0, 4.0, 3.0], "bins": [-33.299678802490234, -32.721900939941406, -32.14412307739258, -31.56634521484375, -30.988567352294922, -30.410791397094727, -29.8330135345459, -29.25523567199707, -28.677457809448242, -28.099679946899414, -27.521902084350586, -26.944124221801758, -26.366348266601562, -25.788570404052734, -25.210792541503906, -24.633014678955078, -24.05523681640625, -23.477458953857422, -22.899681091308594, -22.321903228759766, -21.744125366210938, -21.166349411010742, -20.588571548461914, -20.010793685913086, -19.433015823364258, -18.85523796081543, -18.2774600982666, -17.699682235717773, -17.121906280517578, -16.54412841796875, -15.966350555419922, -15.388572692871094, -14.810796737670898, -14.23301887512207, -13.655241012573242, -13.07746410369873, -12.499686241149902, -11.921908378601074, -11.344131469726562, -10.766353607177734, -10.188575744628906, -9.610797882080078, -9.03302001953125, -8.455243110656738, -7.87746524810791, -7.299687385559082, -6.721909999847412, -6.144132614135742, -5.566354751586914, -4.988576889038086, -4.410799503326416, -3.833021879196167, -3.255244255065918, -2.677466630935669, -2.09968900680542, -1.52191162109375, -0.9441335201263428, -0.36635589599609375, 0.21142172813415527, 0.7891993522644043, 1.3669769763946533, 1.9447546005249023, 2.5225322246551514, 3.1003096103668213, 3.6780874729156494]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 6.0, 7.0, 6.0, 9.0, 7.0, 14.0, 22.0, 16.0, 22.0, 20.0, 30.0, 36.0, 37.0, 57.0, 44.0, 59.0, 65.0, 60.0, 49.0, 63.0, 52.0, 55.0, 55.0, 43.0, 39.0, 39.0, 24.0, 22.0, 15.0, 12.0, 11.0, 8.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.914286136627197, -4.779231071472168, -4.644176006317139, -4.509120941162109, -4.374066352844238, -4.239011287689209, -4.10395622253418, -3.9689011573791504, -3.833846092224121, -3.698791027069092, -3.5637359619140625, -3.4286811351776123, -3.293626070022583, -3.1585710048675537, -3.0235161781311035, -2.888461112976074, -2.753406047821045, -2.6183509826660156, -2.4832959175109863, -2.348241090774536, -2.213186025619507, -2.0781309604644775, -1.9430760145187378, -1.808021068572998, -1.6729660034179688, -1.5379109382629395, -1.4028559923171997, -1.26780104637146, -1.1327459812164307, -0.9976909756660461, -0.8626359701156616, -0.7275809645652771, -0.5925259590148926, -0.45747095346450806, -0.32241594791412354, -0.187360942363739, -0.05230593681335449, 0.08274906873703003, 0.21780407428741455, 0.3528590798377991, 0.4879140853881836, 0.6229690909385681, 0.7580240964889526, 0.8930791020393372, 1.0281341075897217, 1.163189172744751, 1.2982441186904907, 1.4332990646362305, 1.5683541297912598, 1.703409194946289, 1.8384641408920288, 1.9735190868377686, 2.108574151992798, 2.243629217147827, 2.3786840438842773, 2.5137391090393066, 2.648794174194336, 2.7838492393493652, 2.9189043045043945, 3.0539591312408447, 3.189014196395874, 3.3240692615509033, 3.4591240882873535, 3.594179153442383, 3.729234218597412]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 2.0, 5.0, 4.0, 13.0, 13.0, 11.0, 27.0, 31.0, 59.0, 112.0, 205.0, 337.0, 775.0, 2124.0, 7820.0, 47686.0, 679151.0, 277715.0, 24803.0, 4922.0, 1507.0, 609.0, 261.0, 118.0, 95.0, 49.0, 33.0, 18.0, 11.0, 10.0, 11.0, 8.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4453125, -5.27947998046875, -5.1136474609375, -4.94781494140625, -4.781982421875, -4.61614990234375, -4.4503173828125, -4.28448486328125, -4.11865234375, -3.95281982421875, -3.7869873046875, -3.62115478515625, -3.455322265625, -3.28948974609375, -3.1236572265625, -2.95782470703125, -2.7919921875, -2.62615966796875, -2.4603271484375, -2.29449462890625, -2.128662109375, -1.96282958984375, -1.7969970703125, -1.63116455078125, -1.46533203125, -1.29949951171875, -1.1336669921875, -0.96783447265625, -0.802001953125, -0.63616943359375, -0.4703369140625, -0.30450439453125, -0.138671875, 0.02716064453125, 0.1929931640625, 0.35882568359375, 0.524658203125, 0.69049072265625, 0.8563232421875, 1.02215576171875, 1.18798828125, 1.35382080078125, 1.5196533203125, 1.68548583984375, 1.851318359375, 2.01715087890625, 2.1829833984375, 2.34881591796875, 2.5146484375, 2.68048095703125, 2.8463134765625, 3.01214599609375, 3.177978515625, 3.34381103515625, 3.5096435546875, 3.67547607421875, 3.84130859375, 4.00714111328125, 4.1729736328125, 4.33880615234375, 4.504638671875, 4.67047119140625, 4.8363037109375, 5.00213623046875, 5.16796875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 2.0, 5.0, 7.0, 7.0, 10.0, 26.0, 20.0, 19.0, 46.0, 33.0, 46.0, 50.0, 42.0, 47.0, 52.0, 63.0, 61.0, 63.0, 40.0, 53.0, 56.0, 40.0, 42.0, 36.0, 24.0, 35.0, 19.0, 15.0, 14.0, 8.0, 7.0, 2.0, 5.0, 3.0, 0.0, 4.0, 3.0, 2.0, 0.0, 2.0], "bins": [-0.9091796875, -0.8866424560546875, -0.864105224609375, -0.8415679931640625, -0.81903076171875, -0.7964935302734375, -0.773956298828125, -0.7514190673828125, -0.7288818359375, -0.7063446044921875, -0.683807373046875, -0.6612701416015625, -0.63873291015625, -0.6161956787109375, -0.593658447265625, -0.5711212158203125, -0.548583984375, -0.5260467529296875, -0.503509521484375, -0.4809722900390625, -0.45843505859375, -0.4358978271484375, -0.413360595703125, -0.3908233642578125, -0.3682861328125, -0.3457489013671875, -0.323211669921875, -0.3006744384765625, -0.27813720703125, -0.2555999755859375, -0.233062744140625, -0.2105255126953125, -0.18798828125, -0.1654510498046875, -0.142913818359375, -0.1203765869140625, -0.09783935546875, -0.0753021240234375, -0.052764892578125, -0.0302276611328125, -0.0076904296875, 0.0148468017578125, 0.037384033203125, 0.0599212646484375, 0.08245849609375, 0.1049957275390625, 0.127532958984375, 0.1500701904296875, 0.172607421875, 0.1951446533203125, 0.217681884765625, 0.2402191162109375, 0.26275634765625, 0.2852935791015625, 0.307830810546875, 0.3303680419921875, 0.3529052734375, 0.3754425048828125, 0.397979736328125, 0.4205169677734375, 0.44305419921875, 0.4655914306640625, 0.488128662109375, 0.5106658935546875, 0.533203125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 9.0, 11.0, 20.0, 32.0, 45.0, 68.0, 126.0, 242.0, 459.0, 975.0, 2165.0, 5220.0, 15516.0, 58808.0, 366602.0, 494023.0, 74692.0, 18703.0, 6150.0, 2456.0, 1117.0, 514.0, 244.0, 143.0, 82.0, 41.0, 32.0, 20.0, 8.0, 6.0, 6.0, 3.0, 4.0, 4.0, 6.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.197265625, -2.116119384765625, -2.03497314453125, -1.953826904296875, -1.8726806640625, -1.791534423828125, -1.71038818359375, -1.629241943359375, -1.548095703125, -1.466949462890625, -1.38580322265625, -1.304656982421875, -1.2235107421875, -1.142364501953125, -1.06121826171875, -0.980072021484375, -0.89892578125, -0.817779541015625, -0.73663330078125, -0.655487060546875, -0.5743408203125, -0.493194580078125, -0.41204833984375, -0.330902099609375, -0.249755859375, -0.168609619140625, -0.08746337890625, -0.006317138671875, 0.0748291015625, 0.155975341796875, 0.23712158203125, 0.318267822265625, 0.3994140625, 0.480560302734375, 0.56170654296875, 0.642852783203125, 0.7239990234375, 0.805145263671875, 0.88629150390625, 0.967437744140625, 1.048583984375, 1.129730224609375, 1.21087646484375, 1.292022705078125, 1.3731689453125, 1.454315185546875, 1.53546142578125, 1.616607666015625, 1.69775390625, 1.778900146484375, 1.86004638671875, 1.941192626953125, 2.0223388671875, 2.103485107421875, 2.18463134765625, 2.265777587890625, 2.346923828125, 2.428070068359375, 2.50921630859375, 2.590362548828125, 2.6715087890625, 2.752655029296875, 2.83380126953125, 2.914947509765625, 2.99609375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 7.0, 3.0, 4.0, 3.0, 13.0, 10.0, 6.0, 23.0, 27.0, 22.0, 31.0, 26.0, 41.0, 44.0, 42.0, 51.0, 70.0, 66.0, 68.0, 52.0, 66.0, 50.0, 56.0, 48.0, 25.0, 35.0, 25.0, 21.0, 23.0, 10.0, 8.0, 9.0, 9.0, 4.0, 5.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.072265625, -2.966827392578125, -2.86138916015625, -2.755950927734375, -2.6505126953125, -2.545074462890625, -2.43963623046875, -2.334197998046875, -2.228759765625, -2.123321533203125, -2.01788330078125, -1.912445068359375, -1.8070068359375, -1.701568603515625, -1.59613037109375, -1.490692138671875, -1.38525390625, -1.279815673828125, -1.17437744140625, -1.068939208984375, -0.9635009765625, -0.858062744140625, -0.75262451171875, -0.647186279296875, -0.541748046875, -0.436309814453125, -0.33087158203125, -0.225433349609375, -0.1199951171875, -0.014556884765625, 0.09088134765625, 0.196319580078125, 0.3017578125, 0.407196044921875, 0.51263427734375, 0.618072509765625, 0.7235107421875, 0.828948974609375, 0.93438720703125, 1.039825439453125, 1.145263671875, 1.250701904296875, 1.35614013671875, 1.461578369140625, 1.5670166015625, 1.672454833984375, 1.77789306640625, 1.883331298828125, 1.98876953125, 2.094207763671875, 2.19964599609375, 2.305084228515625, 2.4105224609375, 2.515960693359375, 2.62139892578125, 2.726837158203125, 2.832275390625, 2.937713623046875, 3.04315185546875, 3.148590087890625, 3.2540283203125, 3.359466552734375, 3.46490478515625, 3.570343017578125, 3.67578125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 7.0, 6.0, 3.0, 11.0, 8.0, 14.0, 20.0, 20.0, 33.0, 39.0, 63.0, 98.0, 137.0, 282.0, 583.0, 1055.0, 2172.0, 4919.0, 13520.0, 57975.0, 621973.0, 295760.0, 33052.0, 9451.0, 3725.0, 1691.0, 839.0, 458.0, 230.0, 133.0, 100.0, 61.0, 44.0, 25.0, 21.0, 9.0, 11.0, 3.0, 6.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.359375, -1.3152923583984375, -1.271209716796875, -1.2271270751953125, -1.18304443359375, -1.1389617919921875, -1.094879150390625, -1.0507965087890625, -1.0067138671875, -0.9626312255859375, -0.918548583984375, -0.8744659423828125, -0.83038330078125, -0.7863006591796875, -0.742218017578125, -0.6981353759765625, -0.654052734375, -0.6099700927734375, -0.565887451171875, -0.5218048095703125, -0.47772216796875, -0.4336395263671875, -0.389556884765625, -0.3454742431640625, -0.3013916015625, -0.2573089599609375, -0.213226318359375, -0.1691436767578125, -0.12506103515625, -0.0809783935546875, -0.036895751953125, 0.0071868896484375, 0.05126953125, 0.0953521728515625, 0.139434814453125, 0.1835174560546875, 0.22760009765625, 0.2716827392578125, 0.315765380859375, 0.3598480224609375, 0.4039306640625, 0.4480133056640625, 0.492095947265625, 0.5361785888671875, 0.58026123046875, 0.6243438720703125, 0.668426513671875, 0.7125091552734375, 0.756591796875, 0.8006744384765625, 0.844757080078125, 0.8888397216796875, 0.93292236328125, 0.9770050048828125, 1.021087646484375, 1.0651702880859375, 1.1092529296875, 1.1533355712890625, 1.197418212890625, 1.2415008544921875, 1.28558349609375, 1.3296661376953125, 1.373748779296875, 1.4178314208984375, 1.4619140625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 7.0, 17.0, 24.0, 44.0, 97.0, 184.0, 286.0, 172.0, 76.0, 36.0, 22.0, 14.0, 7.0, 9.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.0006213188171386719, -0.0006070025265216827, -0.0005926862359046936, -0.0005783699452877045, -0.0005640536546707153, -0.0005497373640537262, -0.0005354210734367371, -0.0005211047828197479, -0.0005067884922027588, -0.0004924722015857697, -0.0004781559109687805, -0.0004638396203517914, -0.00044952332973480225, -0.0004352070391178131, -0.000420890748500824, -0.00040657445788383484, -0.0003922581672668457, -0.00037794187664985657, -0.00036362558603286743, -0.0003493092954158783, -0.00033499300479888916, -0.0003206767141819, -0.0003063604235649109, -0.00029204413294792175, -0.0002777278423309326, -0.0002634115517139435, -0.00024909526109695435, -0.0002347789704799652, -0.00022046267986297607, -0.00020614638924598694, -0.0001918300986289978, -0.00017751380801200867, -0.00016319751739501953, -0.0001488812267780304, -0.00013456493616104126, -0.00012024864554405212, -0.00010593235492706299, -9.161606431007385e-05, -7.729977369308472e-05, -6.298348307609558e-05, -4.8667192459106445e-05, -3.435090184211731e-05, -2.0034611225128174e-05, -5.718320608139038e-06, 8.597970008850098e-06, 2.2914260625839233e-05, 3.723055124282837e-05, 5.1546841859817505e-05, 6.586313247680664e-05, 8.017942309379578e-05, 9.449571371078491e-05, 0.00010881200432777405, 0.00012312829494476318, 0.00013744458556175232, 0.00015176087617874146, 0.0001660771667957306, 0.00018039345741271973, 0.00019470974802970886, 0.000209026038646698, 0.00022334232926368713, 0.00023765861988067627, 0.0002519749104976654, 0.00026629120111465454, 0.0002806074917316437, 0.0002949237823486328]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 6.0, 5.0, 6.0, 6.0, 8.0, 16.0, 22.0, 16.0, 40.0, 40.0, 62.0, 100.0, 165.0, 256.0, 510.0, 1064.0, 2553.0, 6573.0, 21189.0, 155973.0, 748961.0, 86205.0, 15402.0, 5274.0, 2085.0, 915.0, 441.0, 222.0, 142.0, 78.0, 48.0, 41.0, 29.0, 22.0, 17.0, 15.0, 14.0, 9.0, 4.0, 6.0, 6.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.58984375, -1.5422210693359375, -1.494598388671875, -1.4469757080078125, -1.39935302734375, -1.3517303466796875, -1.304107666015625, -1.2564849853515625, -1.2088623046875, -1.1612396240234375, -1.113616943359375, -1.0659942626953125, -1.01837158203125, -0.9707489013671875, -0.923126220703125, -0.8755035400390625, -0.827880859375, -0.7802581787109375, -0.732635498046875, -0.6850128173828125, -0.63739013671875, -0.5897674560546875, -0.542144775390625, -0.4945220947265625, -0.4468994140625, -0.3992767333984375, -0.351654052734375, -0.3040313720703125, -0.25640869140625, -0.2087860107421875, -0.161163330078125, -0.1135406494140625, -0.06591796875, -0.0182952880859375, 0.029327392578125, 0.0769500732421875, 0.12457275390625, 0.1721954345703125, 0.219818115234375, 0.2674407958984375, 0.3150634765625, 0.3626861572265625, 0.410308837890625, 0.4579315185546875, 0.50555419921875, 0.5531768798828125, 0.600799560546875, 0.6484222412109375, 0.696044921875, 0.7436676025390625, 0.791290283203125, 0.8389129638671875, 0.88653564453125, 0.9341583251953125, 0.981781005859375, 1.0294036865234375, 1.0770263671875, 1.1246490478515625, 1.172271728515625, 1.2198944091796875, 1.26751708984375, 1.3151397705078125, 1.362762451171875, 1.4103851318359375, 1.4580078125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 13.0, 11.0, 16.0, 24.0, 44.0, 82.0, 130.0, 208.0, 181.0, 106.0, 73.0, 39.0, 31.0, 13.0, 9.0, 12.0, 4.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5146484375, -1.4512176513671875, -1.387786865234375, -1.3243560791015625, -1.26092529296875, -1.1974945068359375, -1.134063720703125, -1.0706329345703125, -1.0072021484375, -0.9437713623046875, -0.880340576171875, -0.8169097900390625, -0.75347900390625, -0.6900482177734375, -0.626617431640625, -0.5631866455078125, -0.499755859375, -0.4363250732421875, -0.372894287109375, -0.3094635009765625, -0.24603271484375, -0.1826019287109375, -0.119171142578125, -0.0557403564453125, 0.0076904296875, 0.0711212158203125, 0.134552001953125, 0.1979827880859375, 0.26141357421875, 0.3248443603515625, 0.388275146484375, 0.4517059326171875, 0.51513671875, 0.5785675048828125, 0.641998291015625, 0.7054290771484375, 0.76885986328125, 0.8322906494140625, 0.895721435546875, 0.9591522216796875, 1.0225830078125, 1.0860137939453125, 1.149444580078125, 1.2128753662109375, 1.27630615234375, 1.3397369384765625, 1.403167724609375, 1.4665985107421875, 1.530029296875, 1.5934600830078125, 1.656890869140625, 1.7203216552734375, 1.78375244140625, 1.8471832275390625, 1.910614013671875, 1.9740447998046875, 2.0374755859375, 2.1009063720703125, 2.164337158203125, 2.2277679443359375, 2.29119873046875, 2.3546295166015625, 2.418060302734375, 2.4814910888671875, 2.544921875]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 2.0, 10.0, 25.0, 47.0, 103.0, 195.0, 255.0, 194.0, 88.0, 44.0, 19.0, 15.0, 5.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.73603057861328, -24.730749130249023, -23.725467681884766, -22.720184326171875, -21.714902877807617, -20.70962142944336, -19.7043399810791, -18.699058532714844, -17.693775177001953, -16.688493728637695, -15.683211326599121, -14.677929878234863, -13.672647476196289, -12.667366027832031, -11.662084579467773, -10.656803131103516, -9.651521682739258, -8.646240234375, -7.640957832336426, -6.635676383972168, -5.630394458770752, -4.625112533569336, -3.619831085205078, -2.614549160003662, -1.609267234802246, -0.6039854288101196, 0.40129637718200684, 1.4065780639648438, 2.4118599891662598, 3.417141914367676, 4.422423362731934, 5.42770528793335, 6.432987213134766, 7.438269138336182, 8.443551063537598, 9.448832511901855, 10.45411491394043, 11.459396362304688, 12.464677810668945, 13.469959259033203, 14.475241661071777, 15.480523109436035, 16.48580551147461, 17.491086959838867, 18.496368408203125, 19.501651763916016, 20.50693130493164, 21.51221466064453, 22.51749610900879, 23.522777557373047, 24.528059005737305, 25.533340454101562, 26.538623809814453, 27.54390525817871, 28.54918670654297, 29.554468154907227, 30.559749603271484, 31.565031051635742, 32.5703125, 33.57559585571289, 34.580875396728516, 35.586158752441406, 36.59143829345703, 37.59672164916992, 38.60200500488281]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 4.0, 3.0, 4.0, 9.0, 6.0, 14.0, 14.0, 15.0, 20.0, 19.0, 31.0, 15.0, 18.0, 37.0, 32.0, 38.0, 34.0, 46.0, 41.0, 44.0, 43.0, 32.0, 54.0, 51.0, 45.0, 35.0, 37.0, 37.0, 37.0, 28.0, 24.0, 21.0, 18.0, 26.0, 18.0, 17.0, 10.0, 7.0, 6.0, 7.0, 6.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.705894470214844, -12.238492012023926, -11.771088600158691, -11.303686141967773, -10.836282730102539, -10.368880271911621, -9.901477813720703, -9.434074401855469, -8.96667194366455, -8.499269485473633, -8.031866073608398, -7.5644636154174805, -7.097060680389404, -6.629657745361328, -6.16225528717041, -5.694852352142334, -5.227449417114258, -4.760046482086182, -4.2926435470581055, -3.8252410888671875, -3.3578381538391113, -2.890435218811035, -2.423032522201538, -1.955629825592041, -1.4882268905639648, -1.0208240747451782, -0.5534212589263916, -0.08601844310760498, 0.38138437271118164, 0.8487873077392578, 1.3161900043487549, 1.783592700958252, 2.250995635986328, 2.7183985710144043, 3.1858012676239014, 3.6532039642333984, 4.120606899261475, 4.588009834289551, 5.055412292480469, 5.522815227508545, 5.990218162536621, 6.457621097564697, 6.925024032592773, 7.392426490783691, 7.859829425811768, 8.327232360839844, 8.794634819030762, 9.26203727722168, 9.729440689086914, 10.196843147277832, 10.664246559143066, 11.131649017333984, 11.599052429199219, 12.066454887390137, 12.533857345581055, 13.001260757446289, 13.468663215637207, 13.936065673828125, 14.40346908569336, 14.870871543884277, 15.338274002075195, 15.80567741394043, 16.273080825805664, 16.740482330322266, 17.2078857421875]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 7.0, 4.0, 8.0, 18.0, 19.0, 21.0, 60.0, 91.0, 154.0, 246.0, 467.0, 1190.0, 24697.0, 4164331.0, 1669.0, 571.0, 289.0, 147.0, 112.0, 62.0, 40.0, 27.0, 24.0, 5.0, 8.0, 6.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-23.171875, -22.6466064453125, -22.121337890625, -21.5960693359375, -21.07080078125, -20.5455322265625, -20.020263671875, -19.4949951171875, -18.9697265625, -18.4444580078125, -17.919189453125, -17.3939208984375, -16.86865234375, -16.3433837890625, -15.818115234375, -15.2928466796875, -14.767578125, -14.2423095703125, -13.717041015625, -13.1917724609375, -12.66650390625, -12.1412353515625, -11.615966796875, -11.0906982421875, -10.5654296875, -10.0401611328125, -9.514892578125, -8.9896240234375, -8.46435546875, -7.9390869140625, -7.413818359375, -6.8885498046875, -6.36328125, -5.8380126953125, -5.312744140625, -4.7874755859375, -4.26220703125, -3.7369384765625, -3.211669921875, -2.6864013671875, -2.1611328125, -1.6358642578125, -1.110595703125, -0.5853271484375, -0.06005859375, 0.4652099609375, 0.990478515625, 1.5157470703125, 2.041015625, 2.5662841796875, 3.091552734375, 3.6168212890625, 4.14208984375, 4.6673583984375, 5.192626953125, 5.7178955078125, 6.2431640625, 6.7684326171875, 7.293701171875, 7.8189697265625, 8.34423828125, 8.8695068359375, 9.394775390625, 9.9200439453125, 10.4453125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 6.0, 3.0, 5.0, 6.0, 8.0, 4.0, 11.0, 9.0, 16.0, 18.0, 20.0, 28.0, 28.0, 30.0, 35.0, 42.0, 53.0, 33.0, 53.0, 58.0, 39.0, 49.0, 35.0, 57.0, 42.0, 43.0, 35.0, 39.0, 36.0, 23.0, 23.0, 28.0, 22.0, 12.0, 12.0, 12.0, 5.0, 5.0, 9.0, 4.0, 5.0, 5.0, 0.0, 3.0, 5.0], "bins": [-0.953125, -0.9292831420898438, -0.9054412841796875, -0.8815994262695312, -0.857757568359375, -0.8339157104492188, -0.8100738525390625, -0.7862319946289062, -0.76239013671875, -0.7385482788085938, -0.7147064208984375, -0.6908645629882812, -0.667022705078125, -0.6431808471679688, -0.6193389892578125, -0.5954971313476562, -0.5716552734375, -0.5478134155273438, -0.5239715576171875, -0.5001296997070312, -0.476287841796875, -0.45244598388671875, -0.4286041259765625, -0.40476226806640625, -0.38092041015625, -0.35707855224609375, -0.3332366943359375, -0.30939483642578125, -0.285552978515625, -0.26171112060546875, -0.2378692626953125, -0.21402740478515625, -0.190185546875, -0.16634368896484375, -0.1425018310546875, -0.11865997314453125, -0.094818115234375, -0.07097625732421875, -0.0471343994140625, -0.02329254150390625, 0.00054931640625, 0.02439117431640625, 0.0482330322265625, 0.07207489013671875, 0.095916748046875, 0.11975860595703125, 0.1436004638671875, 0.16744232177734375, 0.1912841796875, 0.21512603759765625, 0.2389678955078125, 0.26280975341796875, 0.286651611328125, 0.31049346923828125, 0.3343353271484375, 0.35817718505859375, 0.38201904296875, 0.40586090087890625, 0.4297027587890625, 0.45354461669921875, 0.477386474609375, 0.5012283325195312, 0.5250701904296875, 0.5489120483398438, 0.57275390625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 7.0, 8.0, 8.0, 17.0, 30.0, 38.0, 34.0, 39.0, 66.0, 97.0, 140.0, 201.0, 244.0, 341.0, 491.0, 698.0, 1106.0, 1629.0, 2742.0, 5602.0, 16344.0, 4011046.0, 128143.0, 12969.0, 4894.0, 2478.0, 1524.0, 1031.0, 671.0, 468.0, 322.0, 254.0, 159.0, 108.0, 84.0, 73.0, 49.0, 44.0, 32.0, 13.0, 13.0, 11.0, 5.0, 3.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.341796875, -3.23370361328125, -3.1256103515625, -3.01751708984375, -2.909423828125, -2.80133056640625, -2.6932373046875, -2.58514404296875, -2.47705078125, -2.36895751953125, -2.2608642578125, -2.15277099609375, -2.044677734375, -1.93658447265625, -1.8284912109375, -1.72039794921875, -1.6123046875, -1.50421142578125, -1.3961181640625, -1.28802490234375, -1.179931640625, -1.07183837890625, -0.9637451171875, -0.85565185546875, -0.74755859375, -0.63946533203125, -0.5313720703125, -0.42327880859375, -0.315185546875, -0.20709228515625, -0.0989990234375, 0.00909423828125, 0.1171875, 0.22528076171875, 0.3333740234375, 0.44146728515625, 0.549560546875, 0.65765380859375, 0.7657470703125, 0.87384033203125, 0.98193359375, 1.09002685546875, 1.1981201171875, 1.30621337890625, 1.414306640625, 1.52239990234375, 1.6304931640625, 1.73858642578125, 1.8466796875, 1.95477294921875, 2.0628662109375, 2.17095947265625, 2.279052734375, 2.38714599609375, 2.4952392578125, 2.60333251953125, 2.71142578125, 2.81951904296875, 2.9276123046875, 3.03570556640625, 3.143798828125, 3.25189208984375, 3.3599853515625, 3.46807861328125, 3.576171875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 4.0, 4.0, 7.0, 11.0, 26.0, 82.0, 3859.0, 34.0, 15.0, 9.0, 6.0, 5.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1474609375, -1.1109161376953125, -1.074371337890625, -1.0378265380859375, -1.00128173828125, -0.9647369384765625, -0.928192138671875, -0.8916473388671875, -0.8551025390625, -0.8185577392578125, -0.782012939453125, -0.7454681396484375, -0.70892333984375, -0.6723785400390625, -0.635833740234375, -0.5992889404296875, -0.562744140625, -0.5261993408203125, -0.489654541015625, -0.4531097412109375, -0.41656494140625, -0.3800201416015625, -0.343475341796875, -0.3069305419921875, -0.2703857421875, -0.2338409423828125, -0.197296142578125, -0.1607513427734375, -0.12420654296875, -0.0876617431640625, -0.051116943359375, -0.0145721435546875, 0.02197265625, 0.0585174560546875, 0.095062255859375, 0.1316070556640625, 0.16815185546875, 0.2046966552734375, 0.241241455078125, 0.2777862548828125, 0.3143310546875, 0.3508758544921875, 0.387420654296875, 0.4239654541015625, 0.46051025390625, 0.4970550537109375, 0.533599853515625, 0.5701446533203125, 0.606689453125, 0.6432342529296875, 0.679779052734375, 0.7163238525390625, 0.75286865234375, 0.7894134521484375, 0.825958251953125, 0.8625030517578125, 0.8990478515625, 0.9355926513671875, 0.972137451171875, 1.0086822509765625, 1.04522705078125, 1.0817718505859375, 1.118316650390625, 1.1548614501953125, 1.19140625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 13.0, 40.0, 69.0, 148.0, 236.0, 255.0, 154.0, 56.0, 24.0, 11.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.558355331420898, -6.387140274047852, -6.215925216674805, -6.044710159301758, -5.873495101928711, -5.702280044555664, -5.531064987182617, -5.3598504066467285, -5.188635349273682, -5.017420291900635, -4.846205234527588, -4.674990177154541, -4.503775119781494, -4.3325605392456055, -4.161345481872559, -3.9901304244995117, -3.8189151287078857, -3.647700071334839, -3.476485013961792, -3.305270195007324, -3.1340551376342773, -2.9628400802612305, -2.7916250228881836, -2.6204099655151367, -2.44919490814209, -2.277979850769043, -2.106764793395996, -1.9355498552322388, -1.7643349170684814, -1.5931198596954346, -1.4219048023223877, -1.2506898641586304, -1.079474925994873, -0.908259928226471, -0.7370449304580688, -0.565829873085022, -0.3946148753166199, -0.22339987754821777, -0.0521848201751709, 0.11903011798858643, 0.2902451753616333, 0.4614601731300354, 0.6326751708984375, 0.8038902282714844, 0.9751052260398865, 1.1463202238082886, 1.3175352811813354, 1.4887502193450928, 1.6599652767181396, 1.8311803340911865, 2.0023953914642334, 2.173610210418701, 2.344825267791748, 2.516040325164795, 2.687255382537842, 2.8584704399108887, 3.0296854972839355, 3.2009005546569824, 3.3721156120300293, 3.543330669403076, 3.714545488357544, 3.885760545730591, 4.056975364685059, 4.2281904220581055, 4.399405479431152]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 5.0, 2.0, 5.0, 7.0, 7.0, 5.0, 5.0, 5.0, 10.0, 19.0, 18.0, 17.0, 16.0, 19.0, 24.0, 32.0, 28.0, 31.0, 30.0, 30.0, 46.0, 41.0, 39.0, 31.0, 58.0, 35.0, 38.0, 40.0, 45.0, 31.0, 35.0, 34.0, 35.0, 25.0, 31.0, 23.0, 18.0, 15.0, 20.0, 18.0, 9.0, 8.0, 5.0, 4.0, 3.0, 0.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4997920989990234, -1.4447956085205078, -1.3897989988327026, -1.334802508354187, -1.2798058986663818, -1.2248094081878662, -1.1698129177093506, -1.1148163080215454, -1.0598198175430298, -1.0048233270645142, -0.949826717376709, -0.8948302268981934, -0.839833676815033, -0.7848371267318726, -0.7298405766487122, -0.6748440265655518, -0.6198474764823914, -0.564850926399231, -0.5098543763160706, -0.45485785603523254, -0.39986133575439453, -0.34486478567123413, -0.28986823558807373, -0.23487171530723572, -0.17987516522407532, -0.12487863004207611, -0.06988208740949631, -0.014885544776916504, 0.0401109904050827, 0.09510752558708191, 0.1501040756702423, 0.20510059595108032, 0.2600971460342407, 0.3150936961174011, 0.37009021639823914, 0.42508676648139954, 0.48008328676223755, 0.535079836845398, 0.5900763869285583, 0.6450729370117188, 0.7000694274902344, 0.7550659775733948, 0.8100625276565552, 0.8650590181350708, 0.9200555682182312, 0.9750521183013916, 1.0300486087799072, 1.0850452184677124, 1.1400418281555176, 1.1950383186340332, 1.2500349283218384, 1.305031418800354, 1.3600280284881592, 1.4150245189666748, 1.4700210094451904, 1.5250176191329956, 1.5800141096115112, 1.6350106000900269, 1.690007209777832, 1.7450037002563477, 1.8000003099441528, 1.8549968004226685, 1.9099934101104736, 1.9649899005889893, 2.019986391067505]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 7.0, 8.0, 8.0, 13.0, 40.0, 32.0, 65.0, 79.0, 164.0, 294.0, 623.0, 1288.0, 3091.0, 7962.0, 24336.0, 92875.0, 451799.0, 360918.0, 73095.0, 20183.0, 6722.0, 2659.0, 1078.0, 594.0, 265.0, 134.0, 94.0, 37.0, 30.0, 15.0, 10.0, 6.0, 8.0, 12.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.443359375, -2.349090576171875, -2.25482177734375, -2.160552978515625, -2.0662841796875, -1.972015380859375, -1.87774658203125, -1.783477783203125, -1.689208984375, -1.594940185546875, -1.50067138671875, -1.406402587890625, -1.3121337890625, -1.217864990234375, -1.12359619140625, -1.029327392578125, -0.93505859375, -0.840789794921875, -0.74652099609375, -0.652252197265625, -0.5579833984375, -0.463714599609375, -0.36944580078125, -0.275177001953125, -0.180908203125, -0.086639404296875, 0.00762939453125, 0.101898193359375, 0.1961669921875, 0.290435791015625, 0.38470458984375, 0.478973388671875, 0.5732421875, 0.667510986328125, 0.76177978515625, 0.856048583984375, 0.9503173828125, 1.044586181640625, 1.13885498046875, 1.233123779296875, 1.327392578125, 1.421661376953125, 1.51593017578125, 1.610198974609375, 1.7044677734375, 1.798736572265625, 1.89300537109375, 1.987274169921875, 2.08154296875, 2.175811767578125, 2.27008056640625, 2.364349365234375, 2.4586181640625, 2.552886962890625, 2.64715576171875, 2.741424560546875, 2.835693359375, 2.929962158203125, 3.02423095703125, 3.118499755859375, 3.2127685546875, 3.307037353515625, 3.40130615234375, 3.495574951171875, 3.58984375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 7.0, 10.0, 8.0, 4.0, 11.0, 7.0, 13.0, 15.0, 18.0, 19.0, 30.0, 22.0, 35.0, 32.0, 45.0, 43.0, 40.0, 44.0, 48.0, 44.0, 58.0, 59.0, 51.0, 34.0, 46.0, 26.0, 32.0, 37.0, 31.0, 25.0, 22.0, 17.0, 14.0, 8.0, 16.0, 7.0, 6.0, 7.0, 3.0, 4.0, 4.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.90673828125, -0.880706787109375, -0.85467529296875, -0.828643798828125, -0.8026123046875, -0.776580810546875, -0.75054931640625, -0.724517822265625, -0.698486328125, -0.672454833984375, -0.64642333984375, -0.620391845703125, -0.5943603515625, -0.568328857421875, -0.54229736328125, -0.516265869140625, -0.490234375, -0.464202880859375, -0.43817138671875, -0.412139892578125, -0.3861083984375, -0.360076904296875, -0.33404541015625, -0.308013916015625, -0.281982421875, -0.255950927734375, -0.22991943359375, -0.203887939453125, -0.1778564453125, -0.151824951171875, -0.12579345703125, -0.099761962890625, -0.07373046875, -0.047698974609375, -0.02166748046875, 0.004364013671875, 0.0303955078125, 0.056427001953125, 0.08245849609375, 0.108489990234375, 0.134521484375, 0.160552978515625, 0.18658447265625, 0.212615966796875, 0.2386474609375, 0.264678955078125, 0.29071044921875, 0.316741943359375, 0.3427734375, 0.368804931640625, 0.39483642578125, 0.420867919921875, 0.4468994140625, 0.472930908203125, 0.49896240234375, 0.524993896484375, 0.551025390625, 0.577056884765625, 0.60308837890625, 0.629119873046875, 0.6551513671875, 0.681182861328125, 0.70721435546875, 0.733245849609375, 0.75927734375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 7.0, 6.0, 3.0, 11.0, 12.0, 11.0, 19.0, 47.0, 52.0, 84.0, 145.0, 224.0, 447.0, 845.0, 1686.0, 3774.0, 9396.0, 25246.0, 80632.0, 306771.0, 443306.0, 118428.0, 35549.0, 12484.0, 4935.0, 2116.0, 1112.0, 497.0, 257.0, 145.0, 92.0, 58.0, 31.0, 27.0, 29.0, 13.0, 15.0, 10.0, 8.0, 7.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-2.291015625, -2.219757080078125, -2.14849853515625, -2.077239990234375, -2.0059814453125, -1.934722900390625, -1.86346435546875, -1.792205810546875, -1.720947265625, -1.649688720703125, -1.57843017578125, -1.507171630859375, -1.4359130859375, -1.364654541015625, -1.29339599609375, -1.222137451171875, -1.15087890625, -1.079620361328125, -1.00836181640625, -0.937103271484375, -0.8658447265625, -0.794586181640625, -0.72332763671875, -0.652069091796875, -0.580810546875, -0.509552001953125, -0.43829345703125, -0.367034912109375, -0.2957763671875, -0.224517822265625, -0.15325927734375, -0.082000732421875, -0.0107421875, 0.060516357421875, 0.13177490234375, 0.203033447265625, 0.2742919921875, 0.345550537109375, 0.41680908203125, 0.488067626953125, 0.559326171875, 0.630584716796875, 0.70184326171875, 0.773101806640625, 0.8443603515625, 0.915618896484375, 0.98687744140625, 1.058135986328125, 1.12939453125, 1.200653076171875, 1.27191162109375, 1.343170166015625, 1.4144287109375, 1.485687255859375, 1.55694580078125, 1.628204345703125, 1.699462890625, 1.770721435546875, 1.84197998046875, 1.913238525390625, 1.9844970703125, 2.055755615234375, 2.12701416015625, 2.198272705078125, 2.26953125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 1.0, 3.0, 5.0, 1.0, 6.0, 6.0, 7.0, 8.0, 12.0, 14.0, 17.0, 30.0, 20.0, 39.0, 43.0, 32.0, 53.0, 38.0, 48.0, 38.0, 43.0, 41.0, 39.0, 52.0, 43.0, 53.0, 50.0, 31.0, 29.0, 23.0, 37.0, 31.0, 22.0, 20.0, 10.0, 8.0, 8.0, 14.0, 8.0, 6.0, 3.0, 3.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0], "bins": [-4.86328125, -4.723876953125, -4.58447265625, -4.445068359375, -4.3056640625, -4.166259765625, -4.02685546875, -3.887451171875, -3.748046875, -3.608642578125, -3.46923828125, -3.329833984375, -3.1904296875, -3.051025390625, -2.91162109375, -2.772216796875, -2.6328125, -2.493408203125, -2.35400390625, -2.214599609375, -2.0751953125, -1.935791015625, -1.79638671875, -1.656982421875, -1.517578125, -1.378173828125, -1.23876953125, -1.099365234375, -0.9599609375, -0.820556640625, -0.68115234375, -0.541748046875, -0.40234375, -0.262939453125, -0.12353515625, 0.015869140625, 0.1552734375, 0.294677734375, 0.43408203125, 0.573486328125, 0.712890625, 0.852294921875, 0.99169921875, 1.131103515625, 1.2705078125, 1.409912109375, 1.54931640625, 1.688720703125, 1.828125, 1.967529296875, 2.10693359375, 2.246337890625, 2.3857421875, 2.525146484375, 2.66455078125, 2.803955078125, 2.943359375, 3.082763671875, 3.22216796875, 3.361572265625, 3.5009765625, 3.640380859375, 3.77978515625, 3.919189453125, 4.05859375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 3.0, 4.0, 9.0, 13.0, 20.0, 31.0, 72.0, 112.0, 244.0, 680.0, 1962.0, 8091.0, 85004.0, 887011.0, 56191.0, 6482.0, 1618.0, 521.0, 244.0, 117.0, 51.0, 25.0, 17.0, 8.0, 7.0, 8.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.396484375, -2.3150634765625, -2.233642578125, -2.1522216796875, -2.07080078125, -1.9893798828125, -1.907958984375, -1.8265380859375, -1.7451171875, -1.6636962890625, -1.582275390625, -1.5008544921875, -1.41943359375, -1.3380126953125, -1.256591796875, -1.1751708984375, -1.09375, -1.0123291015625, -0.930908203125, -0.8494873046875, -0.76806640625, -0.6866455078125, -0.605224609375, -0.5238037109375, -0.4423828125, -0.3609619140625, -0.279541015625, -0.1981201171875, -0.11669921875, -0.0352783203125, 0.046142578125, 0.1275634765625, 0.208984375, 0.2904052734375, 0.371826171875, 0.4532470703125, 0.53466796875, 0.6160888671875, 0.697509765625, 0.7789306640625, 0.8603515625, 0.9417724609375, 1.023193359375, 1.1046142578125, 1.18603515625, 1.2674560546875, 1.348876953125, 1.4302978515625, 1.51171875, 1.5931396484375, 1.674560546875, 1.7559814453125, 1.83740234375, 1.9188232421875, 2.000244140625, 2.0816650390625, 2.1630859375, 2.2445068359375, 2.325927734375, 2.4073486328125, 2.48876953125, 2.5701904296875, 2.651611328125, 2.7330322265625, 2.814453125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 9.0, 3.0, 6.0, 6.0, 9.0, 11.0, 31.0, 45.0, 59.0, 89.0, 122.0, 162.0, 121.0, 106.0, 59.0, 54.0, 34.0, 23.0, 12.0, 16.0, 13.0, 8.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0003066062927246094, -0.0002987012267112732, -0.000290796160697937, -0.00028289109468460083, -0.00027498602867126465, -0.00026708096265792847, -0.0002591758966445923, -0.0002512708306312561, -0.00024336576461791992, -0.00023546069860458374, -0.00022755563259124756, -0.00021965056657791138, -0.0002117455005645752, -0.00020384043455123901, -0.00019593536853790283, -0.00018803030252456665, -0.00018012523651123047, -0.0001722201704978943, -0.0001643151044845581, -0.00015641003847122192, -0.00014850497245788574, -0.00014059990644454956, -0.00013269484043121338, -0.0001247897744178772, -0.00011688470840454102, -0.00010897964239120483, -0.00010107457637786865, -9.316951036453247e-05, -8.526444435119629e-05, -7.735937833786011e-05, -6.945431232452393e-05, -6.154924631118774e-05, -5.364418029785156e-05, -4.573911428451538e-05, -3.78340482711792e-05, -2.9928982257843018e-05, -2.2023916244506836e-05, -1.4118850231170654e-05, -6.213784217834473e-06, 1.691281795501709e-06, 9.59634780883789e-06, 1.7501413822174072e-05, 2.5406479835510254e-05, 3.3311545848846436e-05, 4.121661186218262e-05, 4.91216778755188e-05, 5.702674388885498e-05, 6.493180990219116e-05, 7.283687591552734e-05, 8.074194192886353e-05, 8.864700794219971e-05, 9.655207395553589e-05, 0.00010445713996887207, 0.00011236220598220825, 0.00012026727199554443, 0.00012817233800888062, 0.0001360774040222168, 0.00014398247003555298, 0.00015188753604888916, 0.00015979260206222534, 0.00016769766807556152, 0.0001756027340888977, 0.0001835078001022339, 0.00019141286611557007, 0.00019931793212890625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 8.0, 12.0, 20.0, 38.0, 66.0, 165.0, 500.0, 2195.0, 20533.0, 797894.0, 217294.0, 8056.0, 1204.0, 346.0, 121.0, 52.0, 25.0, 17.0, 9.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.888671875, -3.795684814453125, -3.70269775390625, -3.609710693359375, -3.5167236328125, -3.423736572265625, -3.33074951171875, -3.237762451171875, -3.144775390625, -3.051788330078125, -2.95880126953125, -2.865814208984375, -2.7728271484375, -2.679840087890625, -2.58685302734375, -2.493865966796875, -2.40087890625, -2.307891845703125, -2.21490478515625, -2.121917724609375, -2.0289306640625, -1.935943603515625, -1.84295654296875, -1.749969482421875, -1.656982421875, -1.563995361328125, -1.47100830078125, -1.378021240234375, -1.2850341796875, -1.192047119140625, -1.09906005859375, -1.006072998046875, -0.9130859375, -0.820098876953125, -0.72711181640625, -0.634124755859375, -0.5411376953125, -0.448150634765625, -0.35516357421875, -0.262176513671875, -0.169189453125, -0.076202392578125, 0.01678466796875, 0.109771728515625, 0.2027587890625, 0.295745849609375, 0.38873291015625, 0.481719970703125, 0.57470703125, 0.667694091796875, 0.76068115234375, 0.853668212890625, 0.9466552734375, 1.039642333984375, 1.13262939453125, 1.225616455078125, 1.318603515625, 1.411590576171875, 1.50457763671875, 1.597564697265625, 1.6905517578125, 1.783538818359375, 1.87652587890625, 1.969512939453125, 2.0625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 11.0, 14.0, 18.0, 30.0, 41.0, 65.0, 102.0, 138.0, 158.0, 133.0, 101.0, 68.0, 36.0, 25.0, 20.0, 8.0, 11.0, 7.0, 3.0, 5.0, 3.0, 3.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.1328125, -3.0576324462890625, -2.982452392578125, -2.9072723388671875, -2.83209228515625, -2.7569122314453125, -2.681732177734375, -2.6065521240234375, -2.5313720703125, -2.4561920166015625, -2.381011962890625, -2.3058319091796875, -2.23065185546875, -2.1554718017578125, -2.080291748046875, -2.0051116943359375, -1.929931640625, -1.8547515869140625, -1.779571533203125, -1.7043914794921875, -1.62921142578125, -1.5540313720703125, -1.478851318359375, -1.4036712646484375, -1.3284912109375, -1.2533111572265625, -1.178131103515625, -1.1029510498046875, -1.02777099609375, -0.9525909423828125, -0.877410888671875, -0.8022308349609375, -0.72705078125, -0.6518707275390625, -0.576690673828125, -0.5015106201171875, -0.42633056640625, -0.3511505126953125, -0.275970458984375, -0.2007904052734375, -0.1256103515625, -0.0504302978515625, 0.024749755859375, 0.0999298095703125, 0.17510986328125, 0.2502899169921875, 0.325469970703125, 0.4006500244140625, 0.475830078125, 0.5510101318359375, 0.626190185546875, 0.7013702392578125, 0.77655029296875, 0.8517303466796875, 0.926910400390625, 1.0020904541015625, 1.0772705078125, 1.1524505615234375, 1.227630615234375, 1.3028106689453125, 1.37799072265625, 1.4531707763671875, 1.528350830078125, 1.6035308837890625, 1.6787109375]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 8.0, 16.0, 40.0, 81.0, 137.0, 202.0, 239.0, 151.0, 62.0, 37.0, 17.0, 7.0, 5.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-55.89295196533203, -54.72303009033203, -53.55310821533203, -52.3831901550293, -51.2132682800293, -50.0433464050293, -48.87342834472656, -47.70350646972656, -46.53358459472656, -45.36366271972656, -44.19374084472656, -43.02382278442383, -41.85390090942383, -40.68397903442383, -39.514060974121094, -38.344139099121094, -37.174217224121094, -36.004295349121094, -34.834373474121094, -33.66445541381836, -32.49453353881836, -31.32461166381836, -30.154691696166992, -28.984771728515625, -27.814849853515625, -26.644927978515625, -25.475008010864258, -24.30508804321289, -23.13516616821289, -21.96524429321289, -20.795324325561523, -19.625404357910156, -18.45547866821289, -17.28555679321289, -16.115636825561523, -14.94571590423584, -13.775794982910156, -12.605874061584473, -11.435953140258789, -10.266032218933105, -9.096111297607422, -7.926190376281738, -6.756269454956055, -5.586348533630371, -4.4164276123046875, -3.246506690979004, -2.0765857696533203, -0.9066648483276367, 0.2632560729980469, 1.4331769943237305, 2.603097915649414, 3.7730188369750977, 4.942939758300781, 6.112860679626465, 7.282781600952148, 8.452702522277832, 9.622623443603516, 10.7925443649292, 11.962465286254883, 13.132386207580566, 14.30230712890625, 15.472228050231934, 16.642148971557617, 17.812068939208984, 18.981990814208984]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 3.0, 6.0, 4.0, 7.0, 4.0, 11.0, 8.0, 22.0, 17.0, 19.0, 26.0, 25.0, 22.0, 34.0, 42.0, 50.0, 46.0, 60.0, 58.0, 54.0, 60.0, 66.0, 59.0, 29.0, 56.0, 26.0, 30.0, 29.0, 24.0, 26.0, 19.0, 21.0, 7.0, 10.0, 7.0, 6.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.85089683532715, -24.063228607177734, -23.27556037902832, -22.487892150878906, -21.700225830078125, -20.91255760192871, -20.124889373779297, -19.337221145629883, -18.54955291748047, -17.761884689331055, -16.97421646118164, -16.18655014038086, -15.398881912231445, -14.611213684082031, -13.823545455932617, -13.035877227783203, -12.248210906982422, -11.460542678833008, -10.67287540435791, -9.885207176208496, -9.097539901733398, -8.309871673583984, -7.52220344543457, -6.7345356941223145, -5.946867942810059, -5.159200191497803, -4.371532440185547, -3.583864212036133, -2.796196460723877, -2.008528709411621, -1.220860481262207, -0.43319272994995117, 0.3544769287109375, 1.142144799232483, 1.9298126697540283, 2.7174806594848633, 3.505148410797119, 4.292816162109375, 5.080484390258789, 5.868152141571045, 6.655819892883301, 7.443487644195557, 8.231155395507812, 9.018823623657227, 9.80649185180664, 10.594159126281738, 11.381827354431152, 12.16949462890625, 12.957162857055664, 13.744831085205078, 14.532498359680176, 15.32016658782959, 16.107833862304688, 16.8955020904541, 17.683170318603516, 18.47083854675293, 19.258506774902344, 20.046175003051758, 20.833843231201172, 21.621509552001953, 22.409177780151367, 23.19684600830078, 23.984514236450195, 24.77218246459961, 25.55984878540039]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 6.0, 8.0, 8.0, 13.0, 17.0, 20.0, 45.0, 59.0, 90.0, 135.0, 305.0, 688.0, 2274.0, 12297.0, 4165595.0, 9358.0, 1986.0, 681.0, 263.0, 156.0, 97.0, 56.0, 33.0, 33.0, 17.0, 14.0, 10.0, 4.0, 3.0, 6.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-10.6484375, -10.40338134765625, -10.1583251953125, -9.91326904296875, -9.668212890625, -9.42315673828125, -9.1781005859375, -8.93304443359375, -8.68798828125, -8.44293212890625, -8.1978759765625, -7.95281982421875, -7.707763671875, -7.46270751953125, -7.2176513671875, -6.97259521484375, -6.7275390625, -6.48248291015625, -6.2374267578125, -5.99237060546875, -5.747314453125, -5.50225830078125, -5.2572021484375, -5.01214599609375, -4.76708984375, -4.52203369140625, -4.2769775390625, -4.03192138671875, -3.786865234375, -3.54180908203125, -3.2967529296875, -3.05169677734375, -2.806640625, -2.56158447265625, -2.3165283203125, -2.07147216796875, -1.826416015625, -1.58135986328125, -1.3363037109375, -1.09124755859375, -0.84619140625, -0.60113525390625, -0.3560791015625, -0.11102294921875, 0.134033203125, 0.37908935546875, 0.6241455078125, 0.86920166015625, 1.1142578125, 1.35931396484375, 1.6043701171875, 1.84942626953125, 2.094482421875, 2.33953857421875, 2.5845947265625, 2.82965087890625, 3.07470703125, 3.31976318359375, 3.5648193359375, 3.80987548828125, 4.054931640625, 4.29998779296875, 4.5450439453125, 4.79010009765625, 5.03515625]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 3.0, 4.0, 4.0, 7.0, 7.0, 7.0, 8.0, 12.0, 18.0, 15.0, 24.0, 27.0, 31.0, 43.0, 34.0, 40.0, 57.0, 72.0, 82.0, 55.0, 58.0, 63.0, 44.0, 39.0, 42.0, 38.0, 32.0, 26.0, 34.0, 20.0, 15.0, 10.0, 8.0, 10.0, 2.0, 6.0, 3.0, 3.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.46484375, -1.4275131225585938, -1.3901824951171875, -1.3528518676757812, -1.315521240234375, -1.2781906127929688, -1.2408599853515625, -1.2035293579101562, -1.16619873046875, -1.1288681030273438, -1.0915374755859375, -1.0542068481445312, -1.016876220703125, -0.9795455932617188, -0.9422149658203125, -0.9048843383789062, -0.8675537109375, -0.8302230834960938, -0.7928924560546875, -0.7555618286132812, -0.718231201171875, -0.6809005737304688, -0.6435699462890625, -0.6062393188476562, -0.56890869140625, -0.5315780639648438, -0.4942474365234375, -0.45691680908203125, -0.419586181640625, -0.38225555419921875, -0.3449249267578125, -0.30759429931640625, -0.270263671875, -0.23293304443359375, -0.1956024169921875, -0.15827178955078125, -0.120941162109375, -0.08361053466796875, -0.0462799072265625, -0.00894927978515625, 0.02838134765625, 0.06571197509765625, 0.1030426025390625, 0.14037322998046875, 0.177703857421875, 0.21503448486328125, 0.2523651123046875, 0.28969573974609375, 0.3270263671875, 0.36435699462890625, 0.4016876220703125, 0.43901824951171875, 0.476348876953125, 0.5136795043945312, 0.5510101318359375, 0.5883407592773438, 0.62567138671875, 0.6630020141601562, 0.7003326416015625, 0.7376632690429688, 0.774993896484375, 0.8123245239257812, 0.8496551513671875, 0.8869857788085938, 0.92431640625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 4.0, 8.0, 13.0, 15.0, 22.0, 25.0, 50.0, 50.0, 60.0, 92.0, 130.0, 154.0, 226.0, 334.0, 451.0, 589.0, 901.0, 1320.0, 1997.0, 3182.0, 5958.0, 12707.0, 50032.0, 4057579.0, 33622.0, 10860.0, 5103.0, 2902.0, 1779.0, 1244.0, 781.0, 580.0, 372.0, 311.0, 225.0, 168.0, 114.0, 90.0, 62.0, 52.0, 31.0, 19.0, 30.0, 14.0, 8.0, 10.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.44140625, -2.366058349609375, -2.29071044921875, -2.215362548828125, -2.1400146484375, -2.064666748046875, -1.98931884765625, -1.913970947265625, -1.838623046875, -1.763275146484375, -1.68792724609375, -1.612579345703125, -1.5372314453125, -1.461883544921875, -1.38653564453125, -1.311187744140625, -1.23583984375, -1.160491943359375, -1.08514404296875, -1.009796142578125, -0.9344482421875, -0.859100341796875, -0.78375244140625, -0.708404541015625, -0.633056640625, -0.557708740234375, -0.48236083984375, -0.407012939453125, -0.3316650390625, -0.256317138671875, -0.18096923828125, -0.105621337890625, -0.0302734375, 0.045074462890625, 0.12042236328125, 0.195770263671875, 0.2711181640625, 0.346466064453125, 0.42181396484375, 0.497161865234375, 0.572509765625, 0.647857666015625, 0.72320556640625, 0.798553466796875, 0.8739013671875, 0.949249267578125, 1.02459716796875, 1.099945068359375, 1.17529296875, 1.250640869140625, 1.32598876953125, 1.401336669921875, 1.4766845703125, 1.552032470703125, 1.62738037109375, 1.702728271484375, 1.778076171875, 1.853424072265625, 1.92877197265625, 2.004119873046875, 2.0794677734375, 2.154815673828125, 2.23016357421875, 2.305511474609375, 2.380859375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 8.0, 7.0, 6.0, 16.0, 27.0, 31.0, 3330.0, 553.0, 38.0, 15.0, 8.0, 4.0, 6.0, 5.0, 5.0, 4.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.8076171875, -0.7806777954101562, -0.7537384033203125, -0.7267990112304688, -0.699859619140625, -0.6729202270507812, -0.6459808349609375, -0.6190414428710938, -0.59210205078125, -0.5651626586914062, -0.5382232666015625, -0.5112838745117188, -0.484344482421875, -0.45740509033203125, -0.4304656982421875, -0.40352630615234375, -0.3765869140625, -0.34964752197265625, -0.3227081298828125, -0.29576873779296875, -0.268829345703125, -0.24188995361328125, -0.2149505615234375, -0.18801116943359375, -0.16107177734375, -0.13413238525390625, -0.1071929931640625, -0.08025360107421875, -0.053314208984375, -0.02637481689453125, 0.0005645751953125, 0.02750396728515625, 0.054443359375, 0.08138275146484375, 0.1083221435546875, 0.13526153564453125, 0.162200927734375, 0.18914031982421875, 0.2160797119140625, 0.24301910400390625, 0.26995849609375, 0.29689788818359375, 0.3238372802734375, 0.35077667236328125, 0.377716064453125, 0.40465545654296875, 0.4315948486328125, 0.45853424072265625, 0.4854736328125, 0.5124130249023438, 0.5393524169921875, 0.5662918090820312, 0.593231201171875, 0.6201705932617188, 0.6471099853515625, 0.6740493774414062, 0.70098876953125, 0.7279281616210938, 0.7548675537109375, 0.7818069458007812, 0.808746337890625, 0.8356857299804688, 0.8626251220703125, 0.8895645141601562, 0.91650390625]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 5.0, 6.0, 13.0, 26.0, 51.0, 100.0, 169.0, 220.0, 181.0, 119.0, 63.0, 27.0, 11.0, 9.0, 3.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.136025905609131, -5.000357627868652, -4.864689350128174, -4.729021072387695, -4.593353271484375, -4.4576849937438965, -4.322016716003418, -4.1863484382629395, -4.050680160522461, -3.9150118827819824, -3.779343605041504, -3.6436755657196045, -3.508007287979126, -3.3723390102386475, -3.236670970916748, -3.1010026931762695, -2.965334415435791, -2.8296661376953125, -2.693997859954834, -2.5583298206329346, -2.422661542892456, -2.2869932651519775, -2.151325225830078, -2.0156569480895996, -1.879988670349121, -1.7443203926086426, -1.6086522340774536, -1.4729840755462646, -1.3373157978057861, -1.2016475200653076, -1.0659793615341187, -0.9303111433982849, -0.7946429252624512, -0.6589747071266174, -0.5233064889907837, -0.38763827085494995, -0.2519700527191162, -0.11630183458328247, 0.01936638355255127, 0.155034601688385, 0.29070281982421875, 0.4263710379600525, 0.5620392560958862, 0.69770747423172, 0.8333756923675537, 0.9690439105033875, 1.1047121286392212, 1.2403802871704102, 1.3760485649108887, 1.5117168426513672, 1.6473850011825562, 1.7830531597137451, 1.9187214374542236, 2.054389715194702, 2.1900577545166016, 2.32572603225708, 2.4613943099975586, 2.597062587738037, 2.7327308654785156, 2.868398904800415, 3.0040671825408936, 3.139735460281372, 3.2754034996032715, 3.41107177734375, 3.5467400550842285]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 7.0, 4.0, 5.0, 11.0, 14.0, 14.0, 23.0, 22.0, 21.0, 34.0, 48.0, 36.0, 51.0, 59.0, 51.0, 60.0, 49.0, 63.0, 46.0, 51.0, 49.0, 34.0, 39.0, 44.0, 40.0, 36.0, 15.0, 16.0, 14.0, 11.0, 10.0, 13.0, 5.0, 6.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.8371754884719849, -1.7770426273345947, -1.7169097661972046, -1.6567769050598145, -1.5966440439224243, -1.5365111827850342, -1.4763782024383545, -1.416245460510254, -1.3561124801635742, -1.295979619026184, -1.235846757888794, -1.1757138967514038, -1.1155810356140137, -1.0554481744766235, -0.9953152537345886, -0.9351823925971985, -0.8750495910644531, -0.814916729927063, -0.7547838687896729, -0.6946510076522827, -0.6345181465148926, -0.5743852853775024, -0.5142523646354675, -0.4541195034980774, -0.39398664236068726, -0.3338537812232971, -0.273720920085907, -0.21358802914619446, -0.15345516800880432, -0.09332230687141418, -0.03318941593170166, 0.026943445205688477, 0.08707618713378906, 0.1472090482711792, 0.20734192430973053, 0.26747480034828186, 0.327607661485672, 0.38774052262306213, 0.44787341356277466, 0.5080062747001648, 0.5681391358375549, 0.6282719969749451, 0.6884048581123352, 0.7485377788543701, 0.8086706399917603, 0.8688035011291504, 0.9289363622665405, 0.9890692234039307, 1.0492020845413208, 1.109334945678711, 1.169467806816101, 1.2296006679534912, 1.2897335290908813, 1.3498663902282715, 1.4099993705749512, 1.4701321125030518, 1.5302650928497314, 1.5903979539871216, 1.6505308151245117, 1.7106636762619019, 1.770796537399292, 1.8309293985366821, 1.8910622596740723, 1.951195240020752, 2.0113279819488525]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 6.0, 4.0, 14.0, 17.0, 25.0, 44.0, 55.0, 72.0, 128.0, 232.0, 411.0, 807.0, 1556.0, 3598.0, 9183.0, 27171.0, 100450.0, 453898.0, 342711.0, 73703.0, 20957.0, 7439.0, 3117.0, 1407.0, 666.0, 319.0, 197.0, 129.0, 87.0, 51.0, 29.0, 17.0, 16.0, 12.0, 5.0, 2.0, 4.0, 5.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.150390625, -3.051605224609375, -2.95281982421875, -2.854034423828125, -2.7552490234375, -2.656463623046875, -2.55767822265625, -2.458892822265625, -2.360107421875, -2.261322021484375, -2.16253662109375, -2.063751220703125, -1.9649658203125, -1.866180419921875, -1.76739501953125, -1.668609619140625, -1.56982421875, -1.471038818359375, -1.37225341796875, -1.273468017578125, -1.1746826171875, -1.075897216796875, -0.97711181640625, -0.878326416015625, -0.779541015625, -0.680755615234375, -0.58197021484375, -0.483184814453125, -0.3843994140625, -0.285614013671875, -0.18682861328125, -0.088043212890625, 0.0107421875, 0.109527587890625, 0.20831298828125, 0.307098388671875, 0.4058837890625, 0.504669189453125, 0.60345458984375, 0.702239990234375, 0.801025390625, 0.899810791015625, 0.99859619140625, 1.097381591796875, 1.1961669921875, 1.294952392578125, 1.39373779296875, 1.492523193359375, 1.59130859375, 1.690093994140625, 1.78887939453125, 1.887664794921875, 1.9864501953125, 2.085235595703125, 2.18402099609375, 2.282806396484375, 2.381591796875, 2.480377197265625, 2.57916259765625, 2.677947998046875, 2.7767333984375, 2.875518798828125, 2.97430419921875, 3.073089599609375, 3.171875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 7.0, 12.0, 9.0, 7.0, 8.0, 11.0, 21.0, 17.0, 21.0, 38.0, 36.0, 46.0, 42.0, 56.0, 52.0, 76.0, 67.0, 56.0, 61.0, 37.0, 56.0, 47.0, 42.0, 30.0, 26.0, 26.0, 20.0, 15.0, 22.0, 13.0, 2.0, 6.0, 2.0, 4.0, 3.0, 3.0, 2.0, 0.0, 4.0], "bins": [-1.55859375, -1.5210113525390625, -1.483428955078125, -1.4458465576171875, -1.40826416015625, -1.3706817626953125, -1.333099365234375, -1.2955169677734375, -1.2579345703125, -1.2203521728515625, -1.182769775390625, -1.1451873779296875, -1.10760498046875, -1.0700225830078125, -1.032440185546875, -0.9948577880859375, -0.957275390625, -0.9196929931640625, -0.882110595703125, -0.8445281982421875, -0.80694580078125, -0.7693634033203125, -0.731781005859375, -0.6941986083984375, -0.6566162109375, -0.6190338134765625, -0.581451416015625, -0.5438690185546875, -0.50628662109375, -0.4687042236328125, -0.431121826171875, -0.3935394287109375, -0.35595703125, -0.3183746337890625, -0.280792236328125, -0.2432098388671875, -0.20562744140625, -0.1680450439453125, -0.130462646484375, -0.0928802490234375, -0.0552978515625, -0.0177154541015625, 0.019866943359375, 0.0574493408203125, 0.09503173828125, 0.1326141357421875, 0.170196533203125, 0.2077789306640625, 0.245361328125, 0.2829437255859375, 0.320526123046875, 0.3581085205078125, 0.39569091796875, 0.4332733154296875, 0.470855712890625, 0.5084381103515625, 0.5460205078125, 0.5836029052734375, 0.621185302734375, 0.6587677001953125, 0.69635009765625, 0.7339324951171875, 0.771514892578125, 0.8090972900390625, 0.8466796875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 12.0, 10.0, 9.0, 31.0, 37.0, 51.0, 99.0, 166.0, 330.0, 669.0, 1680.0, 5866.0, 34863.0, 581983.0, 388561.0, 26374.0, 4989.0, 1531.0, 613.0, 293.0, 140.0, 93.0, 48.0, 40.0, 24.0, 15.0, 9.0, 8.0, 4.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.09375, -4.9290771484375, -4.764404296875, -4.5997314453125, -4.43505859375, -4.2703857421875, -4.105712890625, -3.9410400390625, -3.7763671875, -3.6116943359375, -3.447021484375, -3.2823486328125, -3.11767578125, -2.9530029296875, -2.788330078125, -2.6236572265625, -2.458984375, -2.2943115234375, -2.129638671875, -1.9649658203125, -1.80029296875, -1.6356201171875, -1.470947265625, -1.3062744140625, -1.1416015625, -0.9769287109375, -0.812255859375, -0.6475830078125, -0.48291015625, -0.3182373046875, -0.153564453125, 0.0111083984375, 0.17578125, 0.3404541015625, 0.505126953125, 0.6697998046875, 0.83447265625, 0.9991455078125, 1.163818359375, 1.3284912109375, 1.4931640625, 1.6578369140625, 1.822509765625, 1.9871826171875, 2.15185546875, 2.3165283203125, 2.481201171875, 2.6458740234375, 2.810546875, 2.9752197265625, 3.139892578125, 3.3045654296875, 3.46923828125, 3.6339111328125, 3.798583984375, 3.9632568359375, 4.1279296875, 4.2926025390625, 4.457275390625, 4.6219482421875, 4.78662109375, 4.9512939453125, 5.115966796875, 5.2806396484375, 5.4453125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 6.0, 9.0, 14.0, 21.0, 27.0, 34.0, 63.0, 67.0, 86.0, 96.0, 88.0, 91.0, 102.0, 84.0, 60.0, 51.0, 41.0, 24.0, 10.0, 10.0, 6.0, 3.0, 5.0, 0.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.015625, -9.71630859375, -9.4169921875, -9.11767578125, -8.818359375, -8.51904296875, -8.2197265625, -7.92041015625, -7.62109375, -7.32177734375, -7.0224609375, -6.72314453125, -6.423828125, -6.12451171875, -5.8251953125, -5.52587890625, -5.2265625, -4.92724609375, -4.6279296875, -4.32861328125, -4.029296875, -3.72998046875, -3.4306640625, -3.13134765625, -2.83203125, -2.53271484375, -2.2333984375, -1.93408203125, -1.634765625, -1.33544921875, -1.0361328125, -0.73681640625, -0.4375, -0.13818359375, 0.1611328125, 0.46044921875, 0.759765625, 1.05908203125, 1.3583984375, 1.65771484375, 1.95703125, 2.25634765625, 2.5556640625, 2.85498046875, 3.154296875, 3.45361328125, 3.7529296875, 4.05224609375, 4.3515625, 4.65087890625, 4.9501953125, 5.24951171875, 5.548828125, 5.84814453125, 6.1474609375, 6.44677734375, 6.74609375, 7.04541015625, 7.3447265625, 7.64404296875, 7.943359375, 8.24267578125, 8.5419921875, 8.84130859375, 9.140625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 6.0, 3.0, 7.0, 15.0, 24.0, 37.0, 50.0, 95.0, 234.0, 674.0, 3118.0, 46174.0, 973512.0, 21582.0, 2084.0, 530.0, 204.0, 95.0, 41.0, 24.0, 21.0, 14.0, 5.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.5390625, -6.36419677734375, -6.1893310546875, -6.01446533203125, -5.839599609375, -5.66473388671875, -5.4898681640625, -5.31500244140625, -5.14013671875, -4.96527099609375, -4.7904052734375, -4.61553955078125, -4.440673828125, -4.26580810546875, -4.0909423828125, -3.91607666015625, -3.7412109375, -3.56634521484375, -3.3914794921875, -3.21661376953125, -3.041748046875, -2.86688232421875, -2.6920166015625, -2.51715087890625, -2.34228515625, -2.16741943359375, -1.9925537109375, -1.81768798828125, -1.642822265625, -1.46795654296875, -1.2930908203125, -1.11822509765625, -0.943359375, -0.76849365234375, -0.5936279296875, -0.41876220703125, -0.243896484375, -0.06903076171875, 0.1058349609375, 0.28070068359375, 0.45556640625, 0.63043212890625, 0.8052978515625, 0.98016357421875, 1.155029296875, 1.32989501953125, 1.5047607421875, 1.67962646484375, 1.8544921875, 2.02935791015625, 2.2042236328125, 2.37908935546875, 2.553955078125, 2.72882080078125, 2.9036865234375, 3.07855224609375, 3.25341796875, 3.42828369140625, 3.6031494140625, 3.77801513671875, 3.952880859375, 4.12774658203125, 4.3026123046875, 4.47747802734375, 4.65234375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 8.0, 9.0, 24.0, 42.0, 96.0, 212.0, 297.0, 174.0, 70.0, 35.0, 15.0, 7.0, 7.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008101463317871094, -0.0007895380258560181, -0.0007689297199249268, -0.0007483214139938354, -0.0007277131080627441, -0.0007071048021316528, -0.0006864964962005615, -0.0006658881902694702, -0.0006452798843383789, -0.0006246715784072876, -0.0006040632724761963, -0.000583454966545105, -0.0005628466606140137, -0.0005422383546829224, -0.0005216300487518311, -0.0005010217428207397, -0.00048041343688964844, -0.00045980513095855713, -0.0004391968250274658, -0.0004185885190963745, -0.0003979802131652832, -0.0003773719072341919, -0.0003567636013031006, -0.0003361552953720093, -0.00031554698944091797, -0.00029493868350982666, -0.00027433037757873535, -0.00025372207164764404, -0.00023311376571655273, -0.00021250545978546143, -0.00019189715385437012, -0.0001712888479232788, -0.0001506805419921875, -0.0001300722360610962, -0.00010946393013000488, -8.885562419891357e-05, -6.824731826782227e-05, -4.763901233673096e-05, -2.703070640563965e-05, -6.42240047454834e-06, 1.4185905456542969e-05, 3.479421138763428e-05, 5.5402517318725586e-05, 7.60108232498169e-05, 9.66191291809082e-05, 0.00011722743511199951, 0.00013783574104309082, 0.00015844404697418213, 0.00017905235290527344, 0.00019966065883636475, 0.00022026896476745605, 0.00024087727069854736, 0.00026148557662963867, 0.00028209388256073, 0.0003027021884918213, 0.0003233104944229126, 0.0003439188003540039, 0.0003645271062850952, 0.0003851354122161865, 0.00040574371814727783, 0.00042635202407836914, 0.00044696033000946045, 0.00046756863594055176, 0.00048817694187164307, 0.0005087852478027344]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 10.0, 9.0, 9.0, 15.0, 34.0, 47.0, 95.0, 143.0, 324.0, 650.0, 1711.0, 6508.0, 70387.0, 917085.0, 43696.0, 5131.0, 1516.0, 542.0, 288.0, 151.0, 90.0, 46.0, 23.0, 16.0, 9.0, 2.0, 6.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.439453125, -3.326416015625, -3.21337890625, -3.100341796875, -2.9873046875, -2.874267578125, -2.76123046875, -2.648193359375, -2.53515625, -2.422119140625, -2.30908203125, -2.196044921875, -2.0830078125, -1.969970703125, -1.85693359375, -1.743896484375, -1.630859375, -1.517822265625, -1.40478515625, -1.291748046875, -1.1787109375, -1.065673828125, -0.95263671875, -0.839599609375, -0.7265625, -0.613525390625, -0.50048828125, -0.387451171875, -0.2744140625, -0.161376953125, -0.04833984375, 0.064697265625, 0.177734375, 0.290771484375, 0.40380859375, 0.516845703125, 0.6298828125, 0.742919921875, 0.85595703125, 0.968994140625, 1.08203125, 1.195068359375, 1.30810546875, 1.421142578125, 1.5341796875, 1.647216796875, 1.76025390625, 1.873291015625, 1.986328125, 2.099365234375, 2.21240234375, 2.325439453125, 2.4384765625, 2.551513671875, 2.66455078125, 2.777587890625, 2.890625, 3.003662109375, 3.11669921875, 3.229736328125, 3.3427734375, 3.455810546875, 3.56884765625, 3.681884765625, 3.794921875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 7.0, 6.0, 8.0, 29.0, 38.0, 58.0, 154.0, 210.0, 225.0, 115.0, 73.0, 32.0, 19.0, 10.0, 6.0, 6.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1015625, -4.959442138671875, -4.81732177734375, -4.675201416015625, -4.5330810546875, -4.390960693359375, -4.24884033203125, -4.106719970703125, -3.964599609375, -3.822479248046875, -3.68035888671875, -3.538238525390625, -3.3961181640625, -3.253997802734375, -3.11187744140625, -2.969757080078125, -2.82763671875, -2.685516357421875, -2.54339599609375, -2.401275634765625, -2.2591552734375, -2.117034912109375, -1.97491455078125, -1.832794189453125, -1.690673828125, -1.548553466796875, -1.40643310546875, -1.264312744140625, -1.1221923828125, -0.980072021484375, -0.83795166015625, -0.695831298828125, -0.5537109375, -0.411590576171875, -0.26947021484375, -0.127349853515625, 0.0147705078125, 0.156890869140625, 0.29901123046875, 0.441131591796875, 0.583251953125, 0.725372314453125, 0.86749267578125, 1.009613037109375, 1.1517333984375, 1.293853759765625, 1.43597412109375, 1.578094482421875, 1.72021484375, 1.862335205078125, 2.00445556640625, 2.146575927734375, 2.2886962890625, 2.430816650390625, 2.57293701171875, 2.715057373046875, 2.857177734375, 2.999298095703125, 3.14141845703125, 3.283538818359375, 3.4256591796875, 3.567779541015625, 3.70989990234375, 3.852020263671875, 3.994140625]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 12.0, 25.0, 129.0, 348.0, 320.0, 119.0, 30.0, 12.0, 5.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.49012756347656, -30.878982543945312, -28.267837524414062, -25.656692504882812, -23.045547485351562, -20.434402465820312, -17.823257446289062, -15.212112426757812, -12.600967407226562, -9.989822387695312, -7.3786773681640625, -4.7675323486328125, -2.1563873291015625, 0.4547576904296875, 3.0659027099609375, 5.6770477294921875, 8.288192749023438, 10.899337768554688, 13.510482788085938, 16.121627807617188, 18.732772827148438, 21.343917846679688, 23.955062866210938, 26.566207885742188, 29.177352905273438, 31.788497924804688, 34.39964294433594, 37.01078796386719, 39.62193298339844, 42.23307800292969, 44.84422302246094, 47.45536804199219, 50.06651306152344, 52.67765808105469, 55.28880310058594, 57.89994812011719, 60.51109313964844, 63.12223815917969, 65.73338317871094, 68.34452819824219, 70.95567321777344, 73.56681823730469, 76.17796325683594, 78.78910827636719, 81.40025329589844, 84.01139831542969, 86.62254333496094, 89.23368835449219, 91.84483337402344, 94.45597839355469, 97.06712341308594, 99.67826843261719, 102.28941345214844, 104.90055847167969, 107.51170349121094, 110.12284851074219, 112.73399353027344, 115.34513854980469, 117.95628356933594, 120.56742858886719, 123.17857360839844, 125.78971862792969, 128.40086364746094, 131.0120086669922, 133.62315368652344]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 8.0, 3.0, 5.0, 1.0, 5.0, 5.0, 10.0, 17.0, 14.0, 14.0, 14.0, 27.0, 31.0, 30.0, 32.0, 42.0, 43.0, 43.0, 60.0, 44.0, 47.0, 49.0, 59.0, 61.0, 53.0, 44.0, 43.0, 35.0, 44.0, 25.0, 11.0, 23.0, 16.0, 10.0, 4.0, 9.0, 8.0, 4.0, 7.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-25.342876434326172, -24.474384307861328, -23.605892181396484, -22.73740005493164, -21.868907928466797, -21.000415802001953, -20.13192367553711, -19.2634334564209, -18.394941329956055, -17.52644920349121, -16.657957077026367, -15.789464950561523, -14.920973777770996, -14.052481651306152, -13.183989524841309, -12.315498352050781, -11.447005271911621, -10.578513145446777, -9.710021018981934, -8.841529846191406, -7.9730377197265625, -7.104545593261719, -6.236053466796875, -5.3675618171691895, -4.499069690704346, -3.630577802658081, -2.7620859146118164, -1.8935937881469727, -1.025101900100708, -0.15661001205444336, 0.7118821144104004, 1.580373764038086, 2.4488658905029297, 3.3173577785491943, 4.185849666595459, 5.054341793060303, 5.922833442687988, 6.791325569152832, 7.659817695617676, 8.528308868408203, 9.396800994873047, 10.26529312133789, 11.133785247802734, 12.002277374267578, 12.870768547058105, 13.73926067352295, 14.607752799987793, 15.47624397277832, 16.344738006591797, 17.21323013305664, 18.081722259521484, 18.950214385986328, 19.818706512451172, 20.687198638916016, 21.55569076538086, 22.42418098449707, 23.292673110961914, 24.161165237426758, 25.0296573638916, 25.898149490356445, 26.76664161682129, 27.6351318359375, 28.503623962402344, 29.372116088867188, 30.24060821533203]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 4.0, 8.0, 17.0, 25.0, 40.0, 50.0, 99.0, 150.0, 281.0, 514.0, 1412.0, 7739.0, 4171354.0, 9800.0, 1530.0, 530.0, 272.0, 172.0, 110.0, 47.0, 36.0, 25.0, 22.0, 8.0, 11.0, 5.0, 1.0, 4.0, 6.0, 3.0, 2.0, 4.0], "bins": [-17.421875, -17.03076171875, -16.6396484375, -16.24853515625, -15.857421875, -15.46630859375, -15.0751953125, -14.68408203125, -14.29296875, -13.90185546875, -13.5107421875, -13.11962890625, -12.728515625, -12.33740234375, -11.9462890625, -11.55517578125, -11.1640625, -10.77294921875, -10.3818359375, -9.99072265625, -9.599609375, -9.20849609375, -8.8173828125, -8.42626953125, -8.03515625, -7.64404296875, -7.2529296875, -6.86181640625, -6.470703125, -6.07958984375, -5.6884765625, -5.29736328125, -4.90625, -4.51513671875, -4.1240234375, -3.73291015625, -3.341796875, -2.95068359375, -2.5595703125, -2.16845703125, -1.77734375, -1.38623046875, -0.9951171875, -0.60400390625, -0.212890625, 0.17822265625, 0.5693359375, 0.96044921875, 1.3515625, 1.74267578125, 2.1337890625, 2.52490234375, 2.916015625, 3.30712890625, 3.6982421875, 4.08935546875, 4.48046875, 4.87158203125, 5.2626953125, 5.65380859375, 6.044921875, 6.43603515625, 6.8271484375, 7.21826171875, 7.609375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 5.0, 3.0, 9.0, 14.0, 7.0, 14.0, 13.0, 19.0, 14.0, 16.0, 26.0, 35.0, 49.0, 46.0, 74.0, 74.0, 71.0, 70.0, 66.0, 64.0, 53.0, 56.0, 37.0, 36.0, 31.0, 20.0, 26.0, 13.0, 12.0, 13.0, 7.0, 5.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2021484375, -1.1544342041015625, -1.106719970703125, -1.0590057373046875, -1.01129150390625, -0.9635772705078125, -0.915863037109375, -0.8681488037109375, -0.8204345703125, -0.7727203369140625, -0.725006103515625, -0.6772918701171875, -0.62957763671875, -0.5818634033203125, -0.534149169921875, -0.4864349365234375, -0.438720703125, -0.3910064697265625, -0.343292236328125, -0.2955780029296875, -0.24786376953125, -0.2001495361328125, -0.152435302734375, -0.1047210693359375, -0.0570068359375, -0.0092926025390625, 0.038421630859375, 0.0861358642578125, 0.13385009765625, 0.1815643310546875, 0.229278564453125, 0.2769927978515625, 0.32470703125, 0.3724212646484375, 0.420135498046875, 0.4678497314453125, 0.51556396484375, 0.5632781982421875, 0.610992431640625, 0.6587066650390625, 0.7064208984375, 0.7541351318359375, 0.801849365234375, 0.8495635986328125, 0.89727783203125, 0.9449920654296875, 0.992706298828125, 1.0404205322265625, 1.088134765625, 1.1358489990234375, 1.183563232421875, 1.2312774658203125, 1.27899169921875, 1.3267059326171875, 1.374420166015625, 1.4221343994140625, 1.4698486328125, 1.5175628662109375, 1.565277099609375, 1.6129913330078125, 1.66070556640625, 1.7084197998046875, 1.756134033203125, 1.8038482666015625, 1.8515625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 4.0, 5.0, 8.0, 14.0, 18.0, 30.0, 53.0, 51.0, 70.0, 123.0, 192.0, 255.0, 390.0, 575.0, 864.0, 1569.0, 2985.0, 6139.0, 17631.0, 4081843.0, 60523.0, 10779.0, 4445.0, 2241.0, 1253.0, 749.0, 481.0, 330.0, 213.0, 150.0, 98.0, 66.0, 43.0, 22.0, 16.0, 17.0, 15.0, 7.0, 3.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.640625, -4.507293701171875, -4.37396240234375, -4.240631103515625, -4.1072998046875, -3.973968505859375, -3.84063720703125, -3.707305908203125, -3.573974609375, -3.440643310546875, -3.30731201171875, -3.173980712890625, -3.0406494140625, -2.907318115234375, -2.77398681640625, -2.640655517578125, -2.50732421875, -2.373992919921875, -2.24066162109375, -2.107330322265625, -1.9739990234375, -1.840667724609375, -1.70733642578125, -1.574005126953125, -1.440673828125, -1.307342529296875, -1.17401123046875, -1.040679931640625, -0.9073486328125, -0.774017333984375, -0.64068603515625, -0.507354736328125, -0.3740234375, -0.240692138671875, -0.10736083984375, 0.025970458984375, 0.1593017578125, 0.292633056640625, 0.42596435546875, 0.559295654296875, 0.692626953125, 0.825958251953125, 0.95928955078125, 1.092620849609375, 1.2259521484375, 1.359283447265625, 1.49261474609375, 1.625946044921875, 1.75927734375, 1.892608642578125, 2.02593994140625, 2.159271240234375, 2.2926025390625, 2.425933837890625, 2.55926513671875, 2.692596435546875, 2.825927734375, 2.959259033203125, 3.09259033203125, 3.225921630859375, 3.3592529296875, 3.492584228515625, 3.62591552734375, 3.759246826171875, 3.892578125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 1.0, 5.0, 8.0, 8.0, 5.0, 21.0, 25.0, 45.0, 3861.0, 48.0, 18.0, 8.0, 4.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.34765625, -1.311676025390625, -1.27569580078125, -1.239715576171875, -1.2037353515625, -1.167755126953125, -1.13177490234375, -1.095794677734375, -1.059814453125, -1.023834228515625, -0.98785400390625, -0.951873779296875, -0.9158935546875, -0.879913330078125, -0.84393310546875, -0.807952880859375, -0.77197265625, -0.735992431640625, -0.70001220703125, -0.664031982421875, -0.6280517578125, -0.592071533203125, -0.55609130859375, -0.520111083984375, -0.484130859375, -0.448150634765625, -0.41217041015625, -0.376190185546875, -0.3402099609375, -0.304229736328125, -0.26824951171875, -0.232269287109375, -0.1962890625, -0.160308837890625, -0.12432861328125, -0.088348388671875, -0.0523681640625, -0.016387939453125, 0.01959228515625, 0.055572509765625, 0.091552734375, 0.127532958984375, 0.16351318359375, 0.199493408203125, 0.2354736328125, 0.271453857421875, 0.30743408203125, 0.343414306640625, 0.37939453125, 0.415374755859375, 0.45135498046875, 0.487335205078125, 0.5233154296875, 0.559295654296875, 0.59527587890625, 0.631256103515625, 0.667236328125, 0.703216552734375, 0.73919677734375, 0.775177001953125, 0.8111572265625, 0.847137451171875, 0.88311767578125, 0.919097900390625, 0.955078125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 4.0, 20.0, 90.0, 557.0, 323.0, 22.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.89754867553711, -29.21845245361328, -28.53935432434082, -27.860258102416992, -27.181161880493164, -26.502063751220703, -25.822967529296875, -25.143871307373047, -24.46477508544922, -23.78567886352539, -23.10658073425293, -22.4274845123291, -21.748388290405273, -21.069290161132812, -20.390193939208984, -19.711097717285156, -19.031999588012695, -18.352903366088867, -17.673805236816406, -16.994709014892578, -16.31561279296875, -15.636515617370605, -14.957418441772461, -14.278322219848633, -13.599225044250488, -12.920127868652344, -12.241031646728516, -11.561934471130371, -10.882837295532227, -10.203741073608398, -9.524643898010254, -8.84554672241211, -8.166452407836914, -7.487355709075928, -6.808259010314941, -6.129161834716797, -5.4500651359558105, -4.770968437194824, -4.09187126159668, -3.4127745628356934, -2.733677864074707, -2.0545811653137207, -1.3754842281341553, -0.6963872909545898, -0.017290592193603516, 0.6618061065673828, 1.3409032821655273, 2.0199999809265137, 2.6990966796875, 3.3781933784484863, 4.057290077209473, 4.736387252807617, 5.4154839515686035, 6.09458065032959, 6.773677825927734, 7.452774524688721, 8.131871223449707, 8.810968399047852, 9.49006462097168, 10.169161796569824, 10.848258972167969, 11.527355194091797, 12.206452369689941, 12.885549545288086, 13.564645767211914]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 10.0, 5.0, 17.0, 10.0, 17.0, 34.0, 25.0, 30.0, 28.0, 48.0, 39.0, 50.0, 39.0, 51.0, 48.0, 65.0, 57.0, 55.0, 54.0, 44.0, 31.0, 38.0, 41.0, 34.0, 30.0, 32.0, 23.0, 17.0, 9.0, 6.0, 9.0, 3.0, 3.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8470027446746826, -3.7406296730041504, -3.6342568397521973, -3.527883768081665, -3.421510696411133, -3.3151378631591797, -3.2087647914886475, -3.1023917198181152, -2.996018886566162, -2.88964581489563, -2.7832729816436768, -2.6768999099731445, -2.5705270767211914, -2.464154005050659, -2.357780933380127, -2.251408100128174, -2.1450350284576416, -2.0386619567871094, -1.9322891235351562, -1.825916051864624, -1.7195430994033813, -1.6131701469421387, -1.5067970752716064, -1.4004241228103638, -1.294051170349121, -1.1876782178878784, -1.0813052654266357, -0.9749321937561035, -0.8685592412948608, -0.7621862888336182, -0.6558132767677307, -0.5494402647018433, -0.4430673122406006, -0.3366943299770355, -0.23032134771347046, -0.1239483654499054, -0.017575383186340332, 0.08879756927490234, 0.1951705813407898, 0.30154359340667725, 0.4079165458679199, 0.5142894983291626, 0.62066251039505, 0.7270355224609375, 0.8334084749221802, 0.9397814273834229, 1.046154499053955, 1.1525274515151978, 1.2589004039764404, 1.365273356437683, 1.4716463088989258, 1.578019380569458, 1.6843923330307007, 1.7907652854919434, 1.8971383571624756, 2.003511428833008, 2.109884262084961, 2.216257333755493, 2.3226301670074463, 2.4290032386779785, 2.5353760719299316, 2.641749143600464, 2.748122215270996, 2.854495048522949, 2.9608681201934814]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 6.0, 9.0, 13.0, 22.0, 22.0, 28.0, 61.0, 85.0, 139.0, 273.0, 455.0, 790.0, 1572.0, 3461.0, 7723.0, 19960.0, 58355.0, 202002.0, 475170.0, 189649.0, 55211.0, 19242.0, 7617.0, 3284.0, 1601.0, 816.0, 381.0, 249.0, 127.0, 89.0, 49.0, 30.0, 20.0, 12.0, 8.0, 5.0, 4.0, 8.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.455078125, -2.368865966796875, -2.28265380859375, -2.196441650390625, -2.1102294921875, -2.024017333984375, -1.93780517578125, -1.851593017578125, -1.765380859375, -1.679168701171875, -1.59295654296875, -1.506744384765625, -1.4205322265625, -1.334320068359375, -1.24810791015625, -1.161895751953125, -1.07568359375, -0.989471435546875, -0.90325927734375, -0.817047119140625, -0.7308349609375, -0.644622802734375, -0.55841064453125, -0.472198486328125, -0.385986328125, -0.299774169921875, -0.21356201171875, -0.127349853515625, -0.0411376953125, 0.045074462890625, 0.13128662109375, 0.217498779296875, 0.3037109375, 0.389923095703125, 0.47613525390625, 0.562347412109375, 0.6485595703125, 0.734771728515625, 0.82098388671875, 0.907196044921875, 0.993408203125, 1.079620361328125, 1.16583251953125, 1.252044677734375, 1.3382568359375, 1.424468994140625, 1.51068115234375, 1.596893310546875, 1.68310546875, 1.769317626953125, 1.85552978515625, 1.941741943359375, 2.0279541015625, 2.114166259765625, 2.20037841796875, 2.286590576171875, 2.372802734375, 2.459014892578125, 2.54522705078125, 2.631439208984375, 2.7176513671875, 2.803863525390625, 2.89007568359375, 2.976287841796875, 3.0625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 2.0, 5.0, 5.0, 6.0, 3.0, 8.0, 11.0, 14.0, 18.0, 19.0, 25.0, 26.0, 23.0, 25.0, 47.0, 47.0, 44.0, 64.0, 56.0, 64.0, 65.0, 62.0, 62.0, 47.0, 42.0, 44.0, 31.0, 23.0, 27.0, 16.0, 14.0, 19.0, 9.0, 12.0, 6.0, 6.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.087890625, -1.0420074462890625, -0.996124267578125, -0.9502410888671875, -0.90435791015625, -0.8584747314453125, -0.812591552734375, -0.7667083740234375, -0.7208251953125, -0.6749420166015625, -0.629058837890625, -0.5831756591796875, -0.53729248046875, -0.4914093017578125, -0.445526123046875, -0.3996429443359375, -0.353759765625, -0.3078765869140625, -0.261993408203125, -0.2161102294921875, -0.17022705078125, -0.1243438720703125, -0.078460693359375, -0.0325775146484375, 0.0133056640625, 0.0591888427734375, 0.105072021484375, 0.1509552001953125, 0.19683837890625, 0.2427215576171875, 0.288604736328125, 0.3344879150390625, 0.38037109375, 0.4262542724609375, 0.472137451171875, 0.5180206298828125, 0.56390380859375, 0.6097869873046875, 0.655670166015625, 0.7015533447265625, 0.7474365234375, 0.7933197021484375, 0.839202880859375, 0.8850860595703125, 0.93096923828125, 0.9768524169921875, 1.022735595703125, 1.0686187744140625, 1.114501953125, 1.1603851318359375, 1.206268310546875, 1.2521514892578125, 1.29803466796875, 1.3439178466796875, 1.389801025390625, 1.4356842041015625, 1.4815673828125, 1.5274505615234375, 1.573333740234375, 1.6192169189453125, 1.66510009765625, 1.7109832763671875, 1.756866455078125, 1.8027496337890625, 1.8486328125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 1.0, 6.0, 8.0, 6.0, 12.0, 16.0, 27.0, 26.0, 44.0, 65.0, 102.0, 159.0, 234.0, 388.0, 721.0, 1570.0, 3569.0, 9764.0, 34736.0, 192015.0, 632619.0, 132005.0, 26519.0, 7891.0, 3082.0, 1334.0, 665.0, 334.0, 208.0, 132.0, 92.0, 57.0, 45.0, 30.0, 19.0, 9.0, 17.0, 5.0, 7.0, 3.0, 3.0, 3.0, 3.0, 2.0, 1.0, 5.0, 0.0, 2.0, 0.0, 2.0], "bins": [-3.6328125, -3.5272216796875, -3.421630859375, -3.3160400390625, -3.21044921875, -3.1048583984375, -2.999267578125, -2.8936767578125, -2.7880859375, -2.6824951171875, -2.576904296875, -2.4713134765625, -2.36572265625, -2.2601318359375, -2.154541015625, -2.0489501953125, -1.943359375, -1.8377685546875, -1.732177734375, -1.6265869140625, -1.52099609375, -1.4154052734375, -1.309814453125, -1.2042236328125, -1.0986328125, -0.9930419921875, -0.887451171875, -0.7818603515625, -0.67626953125, -0.5706787109375, -0.465087890625, -0.3594970703125, -0.25390625, -0.1483154296875, -0.042724609375, 0.0628662109375, 0.16845703125, 0.2740478515625, 0.379638671875, 0.4852294921875, 0.5908203125, 0.6964111328125, 0.802001953125, 0.9075927734375, 1.01318359375, 1.1187744140625, 1.224365234375, 1.3299560546875, 1.435546875, 1.5411376953125, 1.646728515625, 1.7523193359375, 1.85791015625, 1.9635009765625, 2.069091796875, 2.1746826171875, 2.2802734375, 2.3858642578125, 2.491455078125, 2.5970458984375, 2.70263671875, 2.8082275390625, 2.913818359375, 3.0194091796875, 3.125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 4.0, 5.0, 4.0, 7.0, 12.0, 16.0, 22.0, 29.0, 40.0, 61.0, 45.0, 70.0, 62.0, 78.0, 73.0, 75.0, 77.0, 63.0, 70.0, 48.0, 34.0, 31.0, 19.0, 17.0, 14.0, 10.0, 6.0, 4.0, 5.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.984375, -9.68017578125, -9.3759765625, -9.07177734375, -8.767578125, -8.46337890625, -8.1591796875, -7.85498046875, -7.55078125, -7.24658203125, -6.9423828125, -6.63818359375, -6.333984375, -6.02978515625, -5.7255859375, -5.42138671875, -5.1171875, -4.81298828125, -4.5087890625, -4.20458984375, -3.900390625, -3.59619140625, -3.2919921875, -2.98779296875, -2.68359375, -2.37939453125, -2.0751953125, -1.77099609375, -1.466796875, -1.16259765625, -0.8583984375, -0.55419921875, -0.25, 0.05419921875, 0.3583984375, 0.66259765625, 0.966796875, 1.27099609375, 1.5751953125, 1.87939453125, 2.18359375, 2.48779296875, 2.7919921875, 3.09619140625, 3.400390625, 3.70458984375, 4.0087890625, 4.31298828125, 4.6171875, 4.92138671875, 5.2255859375, 5.52978515625, 5.833984375, 6.13818359375, 6.4423828125, 6.74658203125, 7.05078125, 7.35498046875, 7.6591796875, 7.96337890625, 8.267578125, 8.57177734375, 8.8759765625, 9.18017578125, 9.484375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 1.0, 4.0, 4.0, 3.0, 14.0, 10.0, 32.0, 39.0, 79.0, 258.0, 874.0, 5086.0, 523585.0, 512223.0, 5028.0, 855.0, 255.0, 115.0, 35.0, 23.0, 14.0, 7.0, 2.0, 3.0, 6.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.81640625, -4.59747314453125, -4.3785400390625, -4.15960693359375, -3.940673828125, -3.72174072265625, -3.5028076171875, -3.28387451171875, -3.06494140625, -2.84600830078125, -2.6270751953125, -2.40814208984375, -2.189208984375, -1.97027587890625, -1.7513427734375, -1.53240966796875, -1.3134765625, -1.09454345703125, -0.8756103515625, -0.65667724609375, -0.437744140625, -0.21881103515625, 0.0001220703125, 0.21905517578125, 0.43798828125, 0.65692138671875, 0.8758544921875, 1.09478759765625, 1.313720703125, 1.53265380859375, 1.7515869140625, 1.97052001953125, 2.189453125, 2.40838623046875, 2.6273193359375, 2.84625244140625, 3.065185546875, 3.28411865234375, 3.5030517578125, 3.72198486328125, 3.94091796875, 4.15985107421875, 4.3787841796875, 4.59771728515625, 4.816650390625, 5.03558349609375, 5.2545166015625, 5.47344970703125, 5.6923828125, 5.91131591796875, 6.1302490234375, 6.34918212890625, 6.568115234375, 6.78704833984375, 7.0059814453125, 7.22491455078125, 7.44384765625, 7.66278076171875, 7.8817138671875, 8.10064697265625, 8.319580078125, 8.53851318359375, 8.7574462890625, 8.97637939453125, 9.1953125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 6.0, 3.0, 1.0, 6.0, 9.0, 9.0, 11.0, 25.0, 32.0, 47.0, 75.0, 106.0, 138.0, 134.0, 118.0, 89.0, 73.0, 37.0, 27.0, 19.0, 11.0, 10.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.0003991127014160156, -0.00038889050483703613, -0.00037866830825805664, -0.00036844611167907715, -0.00035822391510009766, -0.00034800171852111816, -0.00033777952194213867, -0.0003275573253631592, -0.0003173351287841797, -0.0003071129322052002, -0.0002968907356262207, -0.0002866685390472412, -0.0002764463424682617, -0.0002662241458892822, -0.00025600194931030273, -0.00024577975273132324, -0.00023555755615234375, -0.00022533535957336426, -0.00021511316299438477, -0.00020489096641540527, -0.00019466876983642578, -0.0001844465732574463, -0.0001742243766784668, -0.0001640021800994873, -0.0001537799835205078, -0.00014355778694152832, -0.00013333559036254883, -0.00012311339378356934, -0.00011289119720458984, -0.00010266900062561035, -9.244680404663086e-05, -8.222460746765137e-05, -7.200241088867188e-05, -6.178021430969238e-05, -5.155801773071289e-05, -4.13358211517334e-05, -3.1113624572753906e-05, -2.0891427993774414e-05, -1.0669231414794922e-05, -4.470348358154297e-07, 9.775161743164062e-06, 1.9997358322143555e-05, 3.0219554901123047e-05, 4.044175148010254e-05, 5.066394805908203e-05, 6.0886144638061523e-05, 7.110834121704102e-05, 8.133053779602051e-05, 9.1552734375e-05, 0.00010177493095397949, 0.00011199712753295898, 0.00012221932411193848, 0.00013244152069091797, 0.00014266371726989746, 0.00015288591384887695, 0.00016310811042785645, 0.00017333030700683594, 0.00018355250358581543, 0.00019377470016479492, 0.00020399689674377441, 0.0002142190933227539, 0.0002244412899017334, 0.0002346634864807129, 0.0002448856830596924, 0.0002551078796386719]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 10.0, 22.0, 28.0, 51.0, 137.0, 260.0, 729.0, 2673.0, 21599.0, 974258.0, 43503.0, 3821.0, 891.0, 307.0, 125.0, 51.0, 31.0, 19.0, 15.0, 9.0, 4.0, 2.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.47265625, -6.28558349609375, -6.0985107421875, -5.91143798828125, -5.724365234375, -5.53729248046875, -5.3502197265625, -5.16314697265625, -4.97607421875, -4.78900146484375, -4.6019287109375, -4.41485595703125, -4.227783203125, -4.04071044921875, -3.8536376953125, -3.66656494140625, -3.4794921875, -3.29241943359375, -3.1053466796875, -2.91827392578125, -2.731201171875, -2.54412841796875, -2.3570556640625, -2.16998291015625, -1.98291015625, -1.79583740234375, -1.6087646484375, -1.42169189453125, -1.234619140625, -1.04754638671875, -0.8604736328125, -0.67340087890625, -0.486328125, -0.29925537109375, -0.1121826171875, 0.07489013671875, 0.261962890625, 0.44903564453125, 0.6361083984375, 0.82318115234375, 1.01025390625, 1.19732666015625, 1.3843994140625, 1.57147216796875, 1.758544921875, 1.94561767578125, 2.1326904296875, 2.31976318359375, 2.5068359375, 2.69390869140625, 2.8809814453125, 3.06805419921875, 3.255126953125, 3.44219970703125, 3.6292724609375, 3.81634521484375, 4.00341796875, 4.19049072265625, 4.3775634765625, 4.56463623046875, 4.751708984375, 4.93878173828125, 5.1258544921875, 5.31292724609375, 5.5]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 7.0, 4.0, 2.0, 7.0, 14.0, 20.0, 34.0, 98.0, 237.0, 279.0, 177.0, 50.0, 18.0, 14.0, 3.0, 8.0, 6.0, 6.0, 2.0, 4.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.234375, -8.0006103515625, -7.766845703125, -7.5330810546875, -7.29931640625, -7.0655517578125, -6.831787109375, -6.5980224609375, -6.3642578125, -6.1304931640625, -5.896728515625, -5.6629638671875, -5.42919921875, -5.1954345703125, -4.961669921875, -4.7279052734375, -4.494140625, -4.2603759765625, -4.026611328125, -3.7928466796875, -3.55908203125, -3.3253173828125, -3.091552734375, -2.8577880859375, -2.6240234375, -2.3902587890625, -2.156494140625, -1.9227294921875, -1.68896484375, -1.4552001953125, -1.221435546875, -0.9876708984375, -0.75390625, -0.5201416015625, -0.286376953125, -0.0526123046875, 0.18115234375, 0.4149169921875, 0.648681640625, 0.8824462890625, 1.1162109375, 1.3499755859375, 1.583740234375, 1.8175048828125, 2.05126953125, 2.2850341796875, 2.518798828125, 2.7525634765625, 2.986328125, 3.2200927734375, 3.453857421875, 3.6876220703125, 3.92138671875, 4.1551513671875, 4.388916015625, 4.6226806640625, 4.8564453125, 5.0902099609375, 5.323974609375, 5.5577392578125, 5.79150390625, 6.0252685546875, 6.259033203125, 6.4927978515625, 6.7265625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 7.0, 27.0, 38.0, 97.0, 210.0, 290.0, 189.0, 87.0, 36.0, 14.0, 2.0, 4.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.40178680419922, -76.41718292236328, -74.43258666992188, -72.44798278808594, -70.46337890625, -68.4787826538086, -66.49417877197266, -64.50957489013672, -62.52497482299805, -60.540374755859375, -58.55577087402344, -56.571170806884766, -54.586570739746094, -52.601966857910156, -50.617366790771484, -48.63276672363281, -46.648162841796875, -44.6635627746582, -42.678958892822266, -40.694358825683594, -38.70975875854492, -36.725154876708984, -34.74055480957031, -32.755950927734375, -30.77135467529297, -28.786752700805664, -26.802152633666992, -24.817550659179688, -22.832948684692383, -20.848346710205078, -18.863746643066406, -16.8791446685791, -14.894542694091797, -12.909941673278809, -10.925339698791504, -8.940738677978516, -6.956137180328369, -4.971535682678223, -2.9869346618652344, -1.0023326873779297, 0.9822683334350586, 2.966869831085205, 4.951471328735352, 6.93607234954834, 8.920673370361328, 10.905275344848633, 12.889876365661621, 14.874478340148926, 16.859079360961914, 18.84368133544922, 20.82828140258789, 22.812883377075195, 24.7974853515625, 26.782085418701172, 28.766687393188477, 30.75128936767578, 32.73588943481445, 34.720489501953125, 36.70509338378906, 38.689693450927734, 40.674293518066406, 42.658897399902344, 44.643497467041016, 46.62809753417969, 48.612701416015625]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 5.0, 2.0, 0.0, 6.0, 9.0, 2.0, 22.0, 12.0, 16.0, 15.0, 13.0, 27.0, 29.0, 39.0, 50.0, 45.0, 55.0, 60.0, 56.0, 58.0, 52.0, 71.0, 59.0, 46.0, 43.0, 30.0, 25.0, 34.0, 26.0, 19.0, 17.0, 13.0, 12.0, 11.0, 8.0, 6.0, 4.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-43.80224609375, -42.636138916015625, -41.47003173828125, -40.303924560546875, -39.1378173828125, -37.971710205078125, -36.80560302734375, -35.63949203491211, -34.473384857177734, -33.30727767944336, -32.141170501708984, -30.97506332397461, -29.8089542388916, -28.642847061157227, -27.47673988342285, -26.310630798339844, -25.1445255279541, -23.978418350219727, -22.81231117248535, -21.646202087402344, -20.48009490966797, -19.313987731933594, -18.14788055419922, -16.981773376464844, -15.815665245056152, -14.649558067321777, -13.483449935913086, -12.317342758178711, -11.151235580444336, -9.985127449035645, -8.81902027130127, -7.652912139892578, -6.486804962158203, -5.32069730758667, -4.154589653015137, -2.9884824752807617, -1.8223748207092285, -0.6562671661376953, 0.5098400115966797, 1.675948143005371, 2.842055320739746, 4.008162975311279, 5.1742706298828125, 6.3403778076171875, 7.506485462188721, 8.672593116760254, 9.838700294494629, 11.00480842590332, 12.170915603637695, 13.33702278137207, 14.503130912780762, 15.669238090515137, 16.835346221923828, 18.001453399658203, 19.167560577392578, 20.333667755126953, 21.499774932861328, 22.665882110595703, 23.831989288330078, 24.998096466064453, 26.16420555114746, 27.330312728881836, 28.49641990661621, 29.66252899169922, 30.828636169433594]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 6.0, 7.0, 10.0, 16.0, 21.0, 24.0, 45.0, 60.0, 96.0, 158.0, 293.0, 575.0, 1472.0, 5971.0, 3974754.0, 202767.0, 5455.0, 1405.0, 534.0, 281.0, 115.0, 74.0, 39.0, 33.0, 19.0, 12.0, 11.0, 10.0, 4.0, 2.0, 5.0, 3.0, 1.0, 3.0, 1.0], "bins": [-11.1484375, -10.8948974609375, -10.641357421875, -10.3878173828125, -10.13427734375, -9.8807373046875, -9.627197265625, -9.3736572265625, -9.1201171875, -8.8665771484375, -8.613037109375, -8.3594970703125, -8.10595703125, -7.8524169921875, -7.598876953125, -7.3453369140625, -7.091796875, -6.8382568359375, -6.584716796875, -6.3311767578125, -6.07763671875, -5.8240966796875, -5.570556640625, -5.3170166015625, -5.0634765625, -4.8099365234375, -4.556396484375, -4.3028564453125, -4.04931640625, -3.7957763671875, -3.542236328125, -3.2886962890625, -3.03515625, -2.7816162109375, -2.528076171875, -2.2745361328125, -2.02099609375, -1.7674560546875, -1.513916015625, -1.2603759765625, -1.0068359375, -0.7532958984375, -0.499755859375, -0.2462158203125, 0.00732421875, 0.2608642578125, 0.514404296875, 0.7679443359375, 1.021484375, 1.2750244140625, 1.528564453125, 1.7821044921875, 2.03564453125, 2.2891845703125, 2.542724609375, 2.7962646484375, 3.0498046875, 3.3033447265625, 3.556884765625, 3.8104248046875, 4.06396484375, 4.3175048828125, 4.571044921875, 4.8245849609375, 5.078125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 4.0, 5.0, 5.0, 11.0, 13.0, 13.0, 32.0, 50.0, 55.0, 83.0, 96.0, 90.0, 104.0, 98.0, 105.0, 74.0, 51.0, 37.0, 28.0, 16.0, 15.0, 11.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0], "bins": [-3.798828125, -3.7198333740234375, -3.640838623046875, -3.5618438720703125, -3.48284912109375, -3.4038543701171875, -3.324859619140625, -3.2458648681640625, -3.1668701171875, -3.0878753662109375, -3.008880615234375, -2.9298858642578125, -2.85089111328125, -2.7718963623046875, -2.692901611328125, -2.6139068603515625, -2.534912109375, -2.4559173583984375, -2.376922607421875, -2.2979278564453125, -2.21893310546875, -2.1399383544921875, -2.060943603515625, -1.9819488525390625, -1.9029541015625, -1.8239593505859375, -1.744964599609375, -1.6659698486328125, -1.58697509765625, -1.5079803466796875, -1.428985595703125, -1.3499908447265625, -1.27099609375, -1.1920013427734375, -1.113006591796875, -1.0340118408203125, -0.95501708984375, -0.8760223388671875, -0.797027587890625, -0.7180328369140625, -0.6390380859375, -0.5600433349609375, -0.481048583984375, -0.4020538330078125, -0.32305908203125, -0.2440643310546875, -0.165069580078125, -0.0860748291015625, -0.007080078125, 0.0719146728515625, 0.150909423828125, 0.2299041748046875, 0.30889892578125, 0.3878936767578125, 0.466888427734375, 0.5458831787109375, 0.6248779296875, 0.7038726806640625, 0.782867431640625, 0.8618621826171875, 0.94085693359375, 1.0198516845703125, 1.098846435546875, 1.1778411865234375, 1.2568359375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 5.0, 3.0, 6.0, 8.0, 13.0, 15.0, 18.0, 21.0, 11.0, 27.0, 39.0, 56.0, 70.0, 100.0, 132.0, 186.0, 237.0, 326.0, 634.0, 3306.0, 4108137.0, 77050.0, 2095.0, 537.0, 316.0, 270.0, 158.0, 111.0, 88.0, 61.0, 56.0, 45.0, 38.0, 38.0, 13.0, 16.0, 14.0, 12.0, 5.0, 4.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.390625, -15.860107421875, -15.32958984375, -14.799072265625, -14.2685546875, -13.738037109375, -13.20751953125, -12.677001953125, -12.146484375, -11.615966796875, -11.08544921875, -10.554931640625, -10.0244140625, -9.493896484375, -8.96337890625, -8.432861328125, -7.90234375, -7.371826171875, -6.84130859375, -6.310791015625, -5.7802734375, -5.249755859375, -4.71923828125, -4.188720703125, -3.658203125, -3.127685546875, -2.59716796875, -2.066650390625, -1.5361328125, -1.005615234375, -0.47509765625, 0.055419921875, 0.5859375, 1.116455078125, 1.64697265625, 2.177490234375, 2.7080078125, 3.238525390625, 3.76904296875, 4.299560546875, 4.830078125, 5.360595703125, 5.89111328125, 6.421630859375, 6.9521484375, 7.482666015625, 8.01318359375, 8.543701171875, 9.07421875, 9.604736328125, 10.13525390625, 10.665771484375, 11.1962890625, 11.726806640625, 12.25732421875, 12.787841796875, 13.318359375, 13.848876953125, 14.37939453125, 14.909912109375, 15.4404296875, 15.970947265625, 16.50146484375, 17.031982421875, 17.5625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 10.0, 26.0, 180.0, 3810.0, 44.0, 8.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.7265625, -5.4560546875, -5.185546875, -4.9150390625, -4.64453125, -4.3740234375, -4.103515625, -3.8330078125, -3.5625, -3.2919921875, -3.021484375, -2.7509765625, -2.48046875, -2.2099609375, -1.939453125, -1.6689453125, -1.3984375, -1.1279296875, -0.857421875, -0.5869140625, -0.31640625, -0.0458984375, 0.224609375, 0.4951171875, 0.765625, 1.0361328125, 1.306640625, 1.5771484375, 1.84765625, 2.1181640625, 2.388671875, 2.6591796875, 2.9296875, 3.2001953125, 3.470703125, 3.7412109375, 4.01171875, 4.2822265625, 4.552734375, 4.8232421875, 5.09375, 5.3642578125, 5.634765625, 5.9052734375, 6.17578125, 6.4462890625, 6.716796875, 6.9873046875, 7.2578125, 7.5283203125, 7.798828125, 8.0693359375, 8.33984375, 8.6103515625, 8.880859375, 9.1513671875, 9.421875, 9.6923828125, 9.962890625, 10.2333984375, 10.50390625, 10.7744140625, 11.044921875, 11.3154296875, 11.5859375]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 10.0, 16.0, 62.0, 183.0, 406.0, 234.0, 65.0, 21.0, 5.0, 5.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.848400115966797, -18.786211013793945, -17.724021911621094, -16.661832809448242, -15.59964370727539, -14.537454605102539, -13.475265502929688, -12.413076400756836, -11.350887298583984, -10.288698196411133, -9.226509094238281, -8.16431999206543, -7.102130889892578, -6.039941787719727, -4.977752685546875, -3.9155635833740234, -2.853374481201172, -1.7911853790283203, -0.7289962768554688, 0.3331928253173828, 1.3953819274902344, 2.457571029663086, 3.5197601318359375, 4.581949234008789, 5.644138336181641, 6.706327438354492, 7.768516540527344, 8.830705642700195, 9.892894744873047, 10.955083847045898, 12.01727294921875, 13.079462051391602, 14.141651153564453, 15.203840255737305, 16.266029357910156, 17.328218460083008, 18.39040756225586, 19.45259666442871, 20.514785766601562, 21.576974868774414, 22.639163970947266, 23.701353073120117, 24.76354217529297, 25.82573127746582, 26.887920379638672, 27.950109481811523, 29.012298583984375, 30.074487686157227, 31.136676788330078, 32.19886779785156, 33.26105499267578, 34.3232421875, 35.385433197021484, 36.44762420654297, 37.50981140136719, 38.571998596191406, 39.63418960571289, 40.696380615234375, 41.758567810058594, 42.82075500488281, 43.8829460144043, 44.94513702392578, 46.00732421875, 47.06951141357422, 48.1317024230957]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 7.0, 5.0, 6.0, 14.0, 11.0, 15.0, 24.0, 41.0, 44.0, 56.0, 96.0, 105.0, 109.0, 136.0, 92.0, 74.0, 53.0, 33.0, 19.0, 31.0, 14.0, 13.0, 3.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.51900863647461, -21.865917205810547, -21.212825775146484, -20.559734344482422, -19.90664291381836, -19.253551483154297, -18.600460052490234, -17.947368621826172, -17.29427719116211, -16.641185760498047, -15.988094329833984, -15.335002899169922, -14.68191146850586, -14.028820037841797, -13.375728607177734, -12.722637176513672, -12.069544792175293, -11.41645336151123, -10.763361930847168, -10.110270500183105, -9.457179069519043, -8.80408763885498, -8.150995254516602, -7.497904300689697, -6.844812870025635, -6.191721439361572, -5.53863000869751, -4.885538101196289, -4.232446670532227, -3.579355478286743, -2.9262638092041016, -2.273172378540039, -1.6200809478759766, -0.9669894576072693, -0.313897967338562, 0.33919358253479004, 0.9922850131988525, 1.645376443862915, 2.2984681129455566, 2.951559543609619, 3.6046509742736816, 4.257742404937744, 4.910833835601807, 5.563925743103027, 6.21701717376709, 6.870108604431152, 7.523200035095215, 8.176291465759277, 8.82938289642334, 9.482474327087402, 10.135565757751465, 10.788657188415527, 11.44174861907959, 12.094840049743652, 12.747932434082031, 13.401023864746094, 14.054115295410156, 14.707206726074219, 15.360298156738281, 16.013389587402344, 16.666481018066406, 17.31957244873047, 17.97266387939453, 18.625755310058594, 19.278846740722656]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 8.0, 12.0, 11.0, 28.0, 35.0, 52.0, 103.0, 172.0, 356.0, 935.0, 2548.0, 9715.0, 56759.0, 553011.0, 374893.0, 38748.0, 7457.0, 2208.0, 756.0, 332.0, 162.0, 100.0, 57.0, 30.0, 27.0, 10.0, 15.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.46484375, -6.2896728515625, -6.114501953125, -5.9393310546875, -5.76416015625, -5.5889892578125, -5.413818359375, -5.2386474609375, -5.0634765625, -4.8883056640625, -4.713134765625, -4.5379638671875, -4.36279296875, -4.1876220703125, -4.012451171875, -3.8372802734375, -3.662109375, -3.4869384765625, -3.311767578125, -3.1365966796875, -2.96142578125, -2.7862548828125, -2.611083984375, -2.4359130859375, -2.2607421875, -2.0855712890625, -1.910400390625, -1.7352294921875, -1.56005859375, -1.3848876953125, -1.209716796875, -1.0345458984375, -0.859375, -0.6842041015625, -0.509033203125, -0.3338623046875, -0.15869140625, 0.0164794921875, 0.191650390625, 0.3668212890625, 0.5419921875, 0.7171630859375, 0.892333984375, 1.0675048828125, 1.24267578125, 1.4178466796875, 1.593017578125, 1.7681884765625, 1.943359375, 2.1185302734375, 2.293701171875, 2.4688720703125, 2.64404296875, 2.8192138671875, 2.994384765625, 3.1695556640625, 3.3447265625, 3.5198974609375, 3.695068359375, 3.8702392578125, 4.04541015625, 4.2205810546875, 4.395751953125, 4.5709228515625, 4.74609375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 1.0, 7.0, 5.0, 8.0, 22.0, 26.0, 32.0, 47.0, 66.0, 71.0, 82.0, 115.0, 95.0, 94.0, 78.0, 71.0, 57.0, 37.0, 27.0, 15.0, 17.0, 11.0, 7.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-3.953125, -3.86151123046875, -3.7698974609375, -3.67828369140625, -3.586669921875, -3.49505615234375, -3.4034423828125, -3.31182861328125, -3.22021484375, -3.12860107421875, -3.0369873046875, -2.94537353515625, -2.853759765625, -2.76214599609375, -2.6705322265625, -2.57891845703125, -2.4873046875, -2.39569091796875, -2.3040771484375, -2.21246337890625, -2.120849609375, -2.02923583984375, -1.9376220703125, -1.84600830078125, -1.75439453125, -1.66278076171875, -1.5711669921875, -1.47955322265625, -1.387939453125, -1.29632568359375, -1.2047119140625, -1.11309814453125, -1.021484375, -0.92987060546875, -0.8382568359375, -0.74664306640625, -0.655029296875, -0.56341552734375, -0.4718017578125, -0.38018798828125, -0.28857421875, -0.19696044921875, -0.1053466796875, -0.01373291015625, 0.077880859375, 0.16949462890625, 0.2611083984375, 0.35272216796875, 0.4443359375, 0.53594970703125, 0.6275634765625, 0.71917724609375, 0.810791015625, 0.90240478515625, 0.9940185546875, 1.08563232421875, 1.17724609375, 1.26885986328125, 1.3604736328125, 1.45208740234375, 1.543701171875, 1.63531494140625, 1.7269287109375, 1.81854248046875, 1.91015625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 4.0, 6.0, 13.0, 18.0, 47.0, 88.0, 205.0, 676.0, 5374.0, 1022834.0, 17820.0, 945.0, 300.0, 115.0, 52.0, 25.0, 15.0, 5.0, 5.0, 2.0, 0.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-30.796875, -30.019775390625, -29.24267578125, -28.465576171875, -27.6884765625, -26.911376953125, -26.13427734375, -25.357177734375, -24.580078125, -23.802978515625, -23.02587890625, -22.248779296875, -21.4716796875, -20.694580078125, -19.91748046875, -19.140380859375, -18.36328125, -17.586181640625, -16.80908203125, -16.031982421875, -15.2548828125, -14.477783203125, -13.70068359375, -12.923583984375, -12.146484375, -11.369384765625, -10.59228515625, -9.815185546875, -9.0380859375, -8.260986328125, -7.48388671875, -6.706787109375, -5.9296875, -5.152587890625, -4.37548828125, -3.598388671875, -2.8212890625, -2.044189453125, -1.26708984375, -0.489990234375, 0.287109375, 1.064208984375, 1.84130859375, 2.618408203125, 3.3955078125, 4.172607421875, 4.94970703125, 5.726806640625, 6.50390625, 7.281005859375, 8.05810546875, 8.835205078125, 9.6123046875, 10.389404296875, 11.16650390625, 11.943603515625, 12.720703125, 13.497802734375, 14.27490234375, 15.052001953125, 15.8291015625, 16.606201171875, 17.38330078125, 18.160400390625, 18.9375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 6.0, 3.0, 5.0, 17.0, 19.0, 37.0, 59.0, 66.0, 83.0, 102.0, 123.0, 105.0, 123.0, 87.0, 53.0, 49.0, 35.0, 18.0, 11.0, 10.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.5625, -11.0576171875, -10.552734375, -10.0478515625, -9.54296875, -9.0380859375, -8.533203125, -8.0283203125, -7.5234375, -7.0185546875, -6.513671875, -6.0087890625, -5.50390625, -4.9990234375, -4.494140625, -3.9892578125, -3.484375, -2.9794921875, -2.474609375, -1.9697265625, -1.46484375, -0.9599609375, -0.455078125, 0.0498046875, 0.5546875, 1.0595703125, 1.564453125, 2.0693359375, 2.57421875, 3.0791015625, 3.583984375, 4.0888671875, 4.59375, 5.0986328125, 5.603515625, 6.1083984375, 6.61328125, 7.1181640625, 7.623046875, 8.1279296875, 8.6328125, 9.1376953125, 9.642578125, 10.1474609375, 10.65234375, 11.1572265625, 11.662109375, 12.1669921875, 12.671875, 13.1767578125, 13.681640625, 14.1865234375, 14.69140625, 15.1962890625, 15.701171875, 16.2060546875, 16.7109375, 17.2158203125, 17.720703125, 18.2255859375, 18.73046875, 19.2353515625, 19.740234375, 20.2451171875, 20.75]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [5.0, 3.0, 2.0, 0.0, 2.0, 3.0, 2.0, 6.0, 2.0, 7.0, 7.0, 13.0, 9.0, 29.0, 20.0, 36.0, 67.0, 112.0, 173.0, 331.0, 838.0, 2371.0, 10834.0, 131204.0, 844665.0, 48933.0, 6090.0, 1550.0, 576.0, 274.0, 133.0, 78.0, 59.0, 27.0, 24.0, 28.0, 16.0, 9.0, 6.0, 8.0, 3.0, 5.0, 6.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8251953125, -1.7501983642578125, -1.675201416015625, -1.6002044677734375, -1.52520751953125, -1.4502105712890625, -1.375213623046875, -1.3002166748046875, -1.2252197265625, -1.1502227783203125, -1.075225830078125, -1.0002288818359375, -0.92523193359375, -0.8502349853515625, -0.775238037109375, -0.7002410888671875, -0.625244140625, -0.5502471923828125, -0.475250244140625, -0.4002532958984375, -0.32525634765625, -0.2502593994140625, -0.175262451171875, -0.1002655029296875, -0.0252685546875, 0.0497283935546875, 0.124725341796875, 0.1997222900390625, 0.27471923828125, 0.3497161865234375, 0.424713134765625, 0.4997100830078125, 0.57470703125, 0.6497039794921875, 0.724700927734375, 0.7996978759765625, 0.87469482421875, 0.9496917724609375, 1.024688720703125, 1.0996856689453125, 1.1746826171875, 1.2496795654296875, 1.324676513671875, 1.3996734619140625, 1.47467041015625, 1.5496673583984375, 1.624664306640625, 1.6996612548828125, 1.774658203125, 1.8496551513671875, 1.924652099609375, 1.9996490478515625, 2.07464599609375, 2.1496429443359375, 2.224639892578125, 2.2996368408203125, 2.3746337890625, 2.4496307373046875, 2.524627685546875, 2.5996246337890625, 2.67462158203125, 2.7496185302734375, 2.824615478515625, 2.8996124267578125, 2.974609375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 2.0, 3.0, 6.0, 6.0, 8.0, 12.0, 18.0, 18.0, 38.0, 49.0, 95.0, 106.0, 145.0, 149.0, 103.0, 89.0, 38.0, 43.0, 17.0, 18.0, 16.0, 9.0, 3.0, 4.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00033593177795410156, -0.0003247074782848358, -0.00031348317861557007, -0.0003022588789463043, -0.0002910345792770386, -0.00027981027960777283, -0.0002685859799385071, -0.00025736168026924133, -0.0002461373805999756, -0.00023491308093070984, -0.0002236887812614441, -0.00021246448159217834, -0.0002012401819229126, -0.00019001588225364685, -0.0001787915825843811, -0.00016756728291511536, -0.0001563429832458496, -0.00014511868357658386, -0.00013389438390731812, -0.00012267008423805237, -0.00011144578456878662, -0.00010022148489952087, -8.899718523025513e-05, -7.777288556098938e-05, -6.654858589172363e-05, -5.5324286222457886e-05, -4.409998655319214e-05, -3.287568688392639e-05, -2.1651387214660645e-05, -1.0427087545394897e-05, 7.972121238708496e-07, 1.2021511793136597e-05, 2.3245811462402344e-05, 3.447011113166809e-05, 4.569441080093384e-05, 5.6918710470199585e-05, 6.814301013946533e-05, 7.936730980873108e-05, 9.059160947799683e-05, 0.00010181590914726257, 0.00011304020881652832, 0.00012426450848579407, 0.00013548880815505981, 0.00014671310782432556, 0.0001579374074935913, 0.00016916170716285706, 0.0001803860068321228, 0.00019161030650138855, 0.0002028346061706543, 0.00021405890583992004, 0.0002252832055091858, 0.00023650750517845154, 0.0002477318048477173, 0.00025895610451698303, 0.0002701804041862488, 0.0002814047038555145, 0.0002926290035247803, 0.000303853303194046, 0.00031507760286331177, 0.0003263019025325775, 0.00033752620220184326, 0.000348750501871109, 0.00035997480154037476, 0.0003711991012096405, 0.00038242340087890625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 4.0, 3.0, 20.0, 28.0, 60.0, 163.0, 610.0, 7223.0, 1001231.0, 37577.0, 1202.0, 258.0, 106.0, 42.0, 10.0, 11.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.28125, -8.08721923828125, -7.8931884765625, -7.69915771484375, -7.505126953125, -7.31109619140625, -7.1170654296875, -6.92303466796875, -6.72900390625, -6.53497314453125, -6.3409423828125, -6.14691162109375, -5.952880859375, -5.75885009765625, -5.5648193359375, -5.37078857421875, -5.1767578125, -4.98272705078125, -4.7886962890625, -4.59466552734375, -4.400634765625, -4.20660400390625, -4.0125732421875, -3.81854248046875, -3.62451171875, -3.43048095703125, -3.2364501953125, -3.04241943359375, -2.848388671875, -2.65435791015625, -2.4603271484375, -2.26629638671875, -2.072265625, -1.87823486328125, -1.6842041015625, -1.49017333984375, -1.296142578125, -1.10211181640625, -0.9080810546875, -0.71405029296875, -0.52001953125, -0.32598876953125, -0.1319580078125, 0.06207275390625, 0.256103515625, 0.45013427734375, 0.6441650390625, 0.83819580078125, 1.0322265625, 1.22625732421875, 1.4202880859375, 1.61431884765625, 1.808349609375, 2.00238037109375, 2.1964111328125, 2.39044189453125, 2.58447265625, 2.77850341796875, 2.9725341796875, 3.16656494140625, 3.360595703125, 3.55462646484375, 3.7486572265625, 3.94268798828125, 4.13671875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 7.0, 5.0, 13.0, 6.0, 30.0, 54.0, 77.0, 154.0, 226.0, 190.0, 108.0, 56.0, 34.0, 24.0, 12.0, 6.0, 5.0, 8.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.978515625, -1.853240966796875, -1.72796630859375, -1.602691650390625, -1.4774169921875, -1.352142333984375, -1.22686767578125, -1.101593017578125, -0.976318359375, -0.851043701171875, -0.72576904296875, -0.600494384765625, -0.4752197265625, -0.349945068359375, -0.22467041015625, -0.099395751953125, 0.02587890625, 0.151153564453125, 0.27642822265625, 0.401702880859375, 0.5269775390625, 0.652252197265625, 0.77752685546875, 0.902801513671875, 1.028076171875, 1.153350830078125, 1.27862548828125, 1.403900146484375, 1.5291748046875, 1.654449462890625, 1.77972412109375, 1.904998779296875, 2.0302734375, 2.155548095703125, 2.28082275390625, 2.406097412109375, 2.5313720703125, 2.656646728515625, 2.78192138671875, 2.907196044921875, 3.032470703125, 3.157745361328125, 3.28302001953125, 3.408294677734375, 3.5335693359375, 3.658843994140625, 3.78411865234375, 3.909393310546875, 4.03466796875, 4.159942626953125, 4.28521728515625, 4.410491943359375, 4.5357666015625, 4.661041259765625, 4.78631591796875, 4.911590576171875, 5.036865234375, 5.162139892578125, 5.28741455078125, 5.412689208984375, 5.5379638671875, 5.663238525390625, 5.78851318359375, 5.913787841796875, 6.0390625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 16.0, 135.0, 697.0, 149.0, 11.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-243.15692138671875, -235.42755126953125, -227.69818115234375, -219.96881103515625, -212.23944091796875, -204.51007080078125, -196.7806854248047, -189.0513153076172, -181.3219451904297, -173.5925750732422, -165.8632049560547, -158.1338348388672, -150.40444946289062, -142.67507934570312, -134.94570922851562, -127.21633911132812, -119.48696899414062, -111.75759887695312, -104.02822875976562, -96.2988510131836, -88.5694808959961, -80.8401107788086, -73.11073303222656, -65.38136291503906, -57.65199279785156, -49.92262268066406, -42.1932487487793, -34.46387481689453, -26.73450469970703, -19.00513458251953, -11.275760650634766, -3.54638671875, 4.1829681396484375, 11.91234016418457, 19.641712188720703, 27.371084213256836, 35.10045623779297, 42.82982635498047, 50.559200286865234, 58.28857421875, 66.0179443359375, 73.747314453125, 81.4766845703125, 89.20606231689453, 96.93543243408203, 104.66480255126953, 112.39418029785156, 120.12355041503906, 127.85292053222656, 135.58229064941406, 143.31166076660156, 151.04103088378906, 158.77041625976562, 166.49978637695312, 174.22915649414062, 181.95852661132812, 189.68789672851562, 197.41726684570312, 205.14663696289062, 212.87600708007812, 220.60537719726562, 228.33474731445312, 236.0641326904297, 243.7935028076172, 251.5228729248047]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 5.0, 7.0, 9.0, 2.0, 9.0, 15.0, 14.0, 24.0, 27.0, 24.0, 32.0, 47.0, 61.0, 52.0, 76.0, 65.0, 79.0, 51.0, 63.0, 49.0, 55.0, 44.0, 35.0, 27.0, 29.0, 26.0, 19.0, 15.0, 6.0, 12.0, 5.0, 7.0, 5.0, 1.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-44.706390380859375, -43.2441291809082, -41.7818717956543, -40.319610595703125, -38.85734939575195, -37.39508819580078, -35.932830810546875, -34.4705696105957, -33.00830841064453, -31.546049118041992, -30.08378791809082, -28.62152862548828, -27.15926742553711, -25.69700813293457, -24.23474884033203, -22.77248764038086, -21.310230255126953, -19.847970962524414, -18.385709762573242, -16.923450469970703, -15.461190223693848, -13.998929977416992, -12.536670684814453, -11.074410438537598, -9.612150192260742, -8.149889945983887, -6.6876301765441895, -5.225370407104492, -3.7631101608276367, -2.3008499145507812, -0.8385906219482422, 0.6236696243286133, 2.0859336853027344, 3.5481936931610107, 5.010453701019287, 6.472713470458984, 7.93497371673584, 9.397233963012695, 10.859493255615234, 12.32175350189209, 13.784013748168945, 15.2462739944458, 16.708534240722656, 18.170793533325195, 19.633052825927734, 21.095314025878906, 22.557573318481445, 24.019832611083984, 25.482093811035156, 26.944353103637695, 28.406614303588867, 29.868873596191406, 31.331134796142578, 32.79339599609375, 34.255653381347656, 35.71791458129883, 37.18017578125, 38.64243698120117, 40.10469436645508, 41.56695556640625, 43.02921676635742, 44.491477966308594, 45.9537353515625, 47.41599655151367, 48.87825393676758]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 4.0, 2.0, 5.0, 3.0, 4.0, 16.0, 15.0, 26.0, 27.0, 39.0, 51.0, 87.0, 134.0, 212.0, 357.0, 640.0, 1057.0, 1929.0, 3905.0, 8896.0, 22970.0, 100105.0, 3231571.0, 739418.0, 53464.0, 16222.0, 6597.0, 3164.0, 1493.0, 788.0, 398.0, 261.0, 158.0, 101.0, 56.0, 39.0, 30.0, 21.0, 11.0, 1.0, 6.0, 5.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.876953125, -2.786529541015625, -2.69610595703125, -2.605682373046875, -2.5152587890625, -2.424835205078125, -2.33441162109375, -2.243988037109375, -2.153564453125, -2.063140869140625, -1.97271728515625, -1.882293701171875, -1.7918701171875, -1.701446533203125, -1.61102294921875, -1.520599365234375, -1.43017578125, -1.339752197265625, -1.24932861328125, -1.158905029296875, -1.0684814453125, -0.978057861328125, -0.88763427734375, -0.797210693359375, -0.706787109375, -0.616363525390625, -0.52593994140625, -0.435516357421875, -0.3450927734375, -0.254669189453125, -0.16424560546875, -0.073822021484375, 0.0166015625, 0.107025146484375, 0.19744873046875, 0.287872314453125, 0.3782958984375, 0.468719482421875, 0.55914306640625, 0.649566650390625, 0.739990234375, 0.830413818359375, 0.92083740234375, 1.011260986328125, 1.1016845703125, 1.192108154296875, 1.28253173828125, 1.372955322265625, 1.46337890625, 1.553802490234375, 1.64422607421875, 1.734649658203125, 1.8250732421875, 1.915496826171875, 2.00592041015625, 2.096343994140625, 2.186767578125, 2.277191162109375, 2.36761474609375, 2.458038330078125, 2.5484619140625, 2.638885498046875, 2.72930908203125, 2.819732666015625, 2.91015625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 5.0, 5.0, 5.0, 7.0, 9.0, 8.0, 16.0, 15.0, 17.0, 27.0, 43.0, 47.0, 40.0, 41.0, 51.0, 67.0, 52.0, 51.0, 53.0, 50.0, 64.0, 54.0, 47.0, 45.0, 47.0, 23.0, 22.0, 22.0, 18.0, 10.0, 12.0, 10.0, 7.0, 8.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5048828125, -1.4543304443359375, -1.403778076171875, -1.3532257080078125, -1.30267333984375, -1.2521209716796875, -1.201568603515625, -1.1510162353515625, -1.1004638671875, -1.0499114990234375, -0.999359130859375, -0.9488067626953125, -0.89825439453125, -0.8477020263671875, -0.797149658203125, -0.7465972900390625, -0.696044921875, -0.6454925537109375, -0.594940185546875, -0.5443878173828125, -0.49383544921875, -0.4432830810546875, -0.392730712890625, -0.3421783447265625, -0.2916259765625, -0.2410736083984375, -0.190521240234375, -0.1399688720703125, -0.08941650390625, -0.0388641357421875, 0.011688232421875, 0.0622406005859375, 0.11279296875, 0.1633453369140625, 0.213897705078125, 0.2644500732421875, 0.31500244140625, 0.3655548095703125, 0.416107177734375, 0.4666595458984375, 0.5172119140625, 0.5677642822265625, 0.618316650390625, 0.6688690185546875, 0.71942138671875, 0.7699737548828125, 0.820526123046875, 0.8710784912109375, 0.921630859375, 0.9721832275390625, 1.022735595703125, 1.0732879638671875, 1.12384033203125, 1.1743927001953125, 1.224945068359375, 1.2754974365234375, 1.3260498046875, 1.3766021728515625, 1.427154541015625, 1.4777069091796875, 1.52825927734375, 1.5788116455078125, 1.629364013671875, 1.6799163818359375, 1.73046875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 9.0, 4.0, 4.0, 9.0, 6.0, 23.0, 42.0, 94.0, 179.0, 474.0, 1652.0, 8244.0, 108860.0, 4015345.0, 51817.0, 5580.0, 1268.0, 387.0, 130.0, 54.0, 38.0, 18.0, 10.0, 13.0, 6.0, 7.0, 5.0, 0.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.5390625, -7.298828125, -7.05859375, -6.818359375, -6.578125, -6.337890625, -6.09765625, -5.857421875, -5.6171875, -5.376953125, -5.13671875, -4.896484375, -4.65625, -4.416015625, -4.17578125, -3.935546875, -3.6953125, -3.455078125, -3.21484375, -2.974609375, -2.734375, -2.494140625, -2.25390625, -2.013671875, -1.7734375, -1.533203125, -1.29296875, -1.052734375, -0.8125, -0.572265625, -0.33203125, -0.091796875, 0.1484375, 0.388671875, 0.62890625, 0.869140625, 1.109375, 1.349609375, 1.58984375, 1.830078125, 2.0703125, 2.310546875, 2.55078125, 2.791015625, 3.03125, 3.271484375, 3.51171875, 3.751953125, 3.9921875, 4.232421875, 4.47265625, 4.712890625, 4.953125, 5.193359375, 5.43359375, 5.673828125, 5.9140625, 6.154296875, 6.39453125, 6.634765625, 6.875, 7.115234375, 7.35546875, 7.595703125, 7.8359375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 2.0, 4.0, 3.0, 6.0, 6.0, 14.0, 13.0, 24.0, 35.0, 68.0, 147.0, 517.0, 2019.0, 738.0, 194.0, 98.0, 67.0, 35.0, 21.0, 15.0, 11.0, 10.0, 7.0, 6.0, 5.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.8203125, -6.6439208984375, -6.467529296875, -6.2911376953125, -6.11474609375, -5.9383544921875, -5.761962890625, -5.5855712890625, -5.4091796875, -5.2327880859375, -5.056396484375, -4.8800048828125, -4.70361328125, -4.5272216796875, -4.350830078125, -4.1744384765625, -3.998046875, -3.8216552734375, -3.645263671875, -3.4688720703125, -3.29248046875, -3.1160888671875, -2.939697265625, -2.7633056640625, -2.5869140625, -2.4105224609375, -2.234130859375, -2.0577392578125, -1.88134765625, -1.7049560546875, -1.528564453125, -1.3521728515625, -1.17578125, -0.9993896484375, -0.822998046875, -0.6466064453125, -0.47021484375, -0.2938232421875, -0.117431640625, 0.0589599609375, 0.2353515625, 0.4117431640625, 0.588134765625, 0.7645263671875, 0.94091796875, 1.1173095703125, 1.293701171875, 1.4700927734375, 1.646484375, 1.8228759765625, 1.999267578125, 2.1756591796875, 2.35205078125, 2.5284423828125, 2.704833984375, 2.8812255859375, 3.0576171875, 3.2340087890625, 3.410400390625, 3.5867919921875, 3.76318359375, 3.9395751953125, 4.115966796875, 4.2923583984375, 4.46875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 11.0, 4.0, 23.0, 43.0, 115.0, 280.0, 266.0, 141.0, 55.0, 23.0, 11.0, 10.0, 6.0, 6.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-43.76212692260742, -42.295501708984375, -40.82887268066406, -39.362247467041016, -37.89562225341797, -36.428993225097656, -34.96236801147461, -33.49574279785156, -32.02911376953125, -30.56248664855957, -29.09585952758789, -27.629234313964844, -26.162607192993164, -24.695980072021484, -23.229354858398438, -21.762727737426758, -20.296100616455078, -18.8294734954834, -17.36284637451172, -15.896221160888672, -14.429594039916992, -12.962966918945312, -11.49634075164795, -10.029714584350586, -8.563087463378906, -7.096460819244385, -5.629834175109863, -4.163207530975342, -2.6965808868408203, -1.2299542427062988, 0.23667240142822266, 1.703298568725586, 3.169921875, 4.6365485191345215, 6.103175163269043, 7.5698018074035645, 9.036428451538086, 10.503055572509766, 11.969681739807129, 13.436307907104492, 14.902935028076172, 16.36956214904785, 17.83618927001953, 19.302814483642578, 20.769441604614258, 22.236068725585938, 23.702693939208984, 25.169321060180664, 26.635948181152344, 28.102575302124023, 29.569202423095703, 31.03582763671875, 32.50245666503906, 33.96908187866211, 35.435707092285156, 36.90233612060547, 38.368961334228516, 39.83558654785156, 41.302215576171875, 42.76884078979492, 44.23546600341797, 45.70209503173828, 47.16872024536133, 48.635345458984375, 50.10197448730469]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 3.0, 4.0, 7.0, 10.0, 14.0, 16.0, 32.0, 34.0, 37.0, 44.0, 46.0, 61.0, 59.0, 65.0, 72.0, 80.0, 53.0, 57.0, 51.0, 52.0, 51.0, 37.0, 35.0, 20.0, 18.0, 8.0, 8.0, 6.0, 7.0, 4.0, 6.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-31.536386489868164, -30.722824096679688, -29.90926170349121, -29.095699310302734, -28.28213882446289, -27.468576431274414, -26.655014038085938, -25.84145164489746, -25.027889251708984, -24.214326858520508, -23.40076446533203, -22.587203979492188, -21.77364158630371, -20.960079193115234, -20.146516799926758, -19.33295440673828, -18.519393920898438, -17.70583152770996, -16.892269134521484, -16.07870864868164, -15.265146255493164, -14.451583862304688, -13.638021469116211, -12.824459075927734, -12.010897636413574, -11.197335243225098, -10.383773803710938, -9.570211410522461, -8.756649017333984, -7.943087577819824, -7.129525184631348, -6.315963268280029, -5.502403259277344, -4.688841342926025, -3.875279188156128, -3.0617170333862305, -2.248155117034912, -1.4345932006835938, -0.6210308074951172, 0.19253110885620117, 1.0060930252075195, 1.8196550607681274, 2.6332170963287354, 3.446779251098633, 4.260341167449951, 5.0739030838012695, 5.887465476989746, 6.7010273933410645, 7.514589309692383, 8.32815170288086, 9.14171314239502, 9.955275535583496, 10.768836975097656, 11.582399368286133, 12.39596176147461, 13.209524154663086, 14.023085594177246, 14.836647987365723, 15.650209426879883, 16.46377182006836, 17.277334213256836, 18.090896606445312, 18.904457092285156, 19.718019485473633, 20.53158187866211]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 6.0, 2.0, 5.0, 12.0, 9.0, 26.0, 23.0, 26.0, 73.0, 109.0, 157.0, 223.0, 397.0, 648.0, 1287.0, 2341.0, 4845.0, 10577.0, 25110.0, 64198.0, 171855.0, 374673.0, 240214.0, 89952.0, 34690.0, 14258.0, 6198.0, 3018.0, 1545.0, 870.0, 438.0, 294.0, 174.0, 98.0, 58.0, 42.0, 34.0, 23.0, 20.0, 13.0, 6.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.955078125, -1.889190673828125, -1.82330322265625, -1.757415771484375, -1.6915283203125, -1.625640869140625, -1.55975341796875, -1.493865966796875, -1.427978515625, -1.362091064453125, -1.29620361328125, -1.230316162109375, -1.1644287109375, -1.098541259765625, -1.03265380859375, -0.966766357421875, -0.90087890625, -0.834991455078125, -0.76910400390625, -0.703216552734375, -0.6373291015625, -0.571441650390625, -0.50555419921875, -0.439666748046875, -0.373779296875, -0.307891845703125, -0.24200439453125, -0.176116943359375, -0.1102294921875, -0.044342041015625, 0.02154541015625, 0.087432861328125, 0.1533203125, 0.219207763671875, 0.28509521484375, 0.350982666015625, 0.4168701171875, 0.482757568359375, 0.54864501953125, 0.614532470703125, 0.680419921875, 0.746307373046875, 0.81219482421875, 0.878082275390625, 0.9439697265625, 1.009857177734375, 1.07574462890625, 1.141632080078125, 1.20751953125, 1.273406982421875, 1.33929443359375, 1.405181884765625, 1.4710693359375, 1.536956787109375, 1.60284423828125, 1.668731689453125, 1.734619140625, 1.800506591796875, 1.86639404296875, 1.932281494140625, 1.9981689453125, 2.064056396484375, 2.12994384765625, 2.195831298828125, 2.26171875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 7.0, 3.0, 4.0, 8.0, 11.0, 11.0, 19.0, 20.0, 21.0, 38.0, 30.0, 36.0, 43.0, 44.0, 36.0, 56.0, 46.0, 51.0, 50.0, 65.0, 48.0, 49.0, 43.0, 40.0, 32.0, 38.0, 23.0, 29.0, 21.0, 21.0, 11.0, 11.0, 6.0, 8.0, 6.0, 7.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.5009765625, -1.4569244384765625, -1.412872314453125, -1.3688201904296875, -1.32476806640625, -1.2807159423828125, -1.236663818359375, -1.1926116943359375, -1.1485595703125, -1.1045074462890625, -1.060455322265625, -1.0164031982421875, -0.97235107421875, -0.9282989501953125, -0.884246826171875, -0.8401947021484375, -0.796142578125, -0.7520904541015625, -0.708038330078125, -0.6639862060546875, -0.61993408203125, -0.5758819580078125, -0.531829833984375, -0.4877777099609375, -0.4437255859375, -0.3996734619140625, -0.355621337890625, -0.3115692138671875, -0.26751708984375, -0.2234649658203125, -0.179412841796875, -0.1353607177734375, -0.09130859375, -0.0472564697265625, -0.003204345703125, 0.0408477783203125, 0.08489990234375, 0.1289520263671875, 0.173004150390625, 0.2170562744140625, 0.2611083984375, 0.3051605224609375, 0.349212646484375, 0.3932647705078125, 0.43731689453125, 0.4813690185546875, 0.525421142578125, 0.5694732666015625, 0.613525390625, 0.6575775146484375, 0.701629638671875, 0.7456817626953125, 0.78973388671875, 0.8337860107421875, 0.877838134765625, 0.9218902587890625, 0.9659423828125, 1.0099945068359375, 1.054046630859375, 1.0980987548828125, 1.14215087890625, 1.1862030029296875, 1.230255126953125, 1.2743072509765625, 1.318359375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 7.0, 2.0, 6.0, 12.0, 16.0, 21.0, 46.0, 91.0, 160.0, 304.0, 691.0, 1607.0, 6224.0, 65768.0, 877767.0, 85240.0, 7305.0, 1757.0, 746.0, 362.0, 156.0, 90.0, 68.0, 41.0, 27.0, 17.0, 9.0, 5.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5625, -8.34033203125, -8.1181640625, -7.89599609375, -7.673828125, -7.45166015625, -7.2294921875, -7.00732421875, -6.78515625, -6.56298828125, -6.3408203125, -6.11865234375, -5.896484375, -5.67431640625, -5.4521484375, -5.22998046875, -5.0078125, -4.78564453125, -4.5634765625, -4.34130859375, -4.119140625, -3.89697265625, -3.6748046875, -3.45263671875, -3.23046875, -3.00830078125, -2.7861328125, -2.56396484375, -2.341796875, -2.11962890625, -1.8974609375, -1.67529296875, -1.453125, -1.23095703125, -1.0087890625, -0.78662109375, -0.564453125, -0.34228515625, -0.1201171875, 0.10205078125, 0.32421875, 0.54638671875, 0.7685546875, 0.99072265625, 1.212890625, 1.43505859375, 1.6572265625, 1.87939453125, 2.1015625, 2.32373046875, 2.5458984375, 2.76806640625, 2.990234375, 3.21240234375, 3.4345703125, 3.65673828125, 3.87890625, 4.10107421875, 4.3232421875, 4.54541015625, 4.767578125, 4.98974609375, 5.2119140625, 5.43408203125, 5.65625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 6.0, 5.0, 13.0, 16.0, 24.0, 22.0, 41.0, 34.0, 46.0, 61.0, 79.0, 85.0, 71.0, 65.0, 70.0, 60.0, 59.0, 62.0, 42.0, 31.0, 24.0, 28.0, 14.0, 15.0, 10.0, 10.0, 3.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.96875, -9.675537109375, -9.38232421875, -9.089111328125, -8.7958984375, -8.502685546875, -8.20947265625, -7.916259765625, -7.623046875, -7.329833984375, -7.03662109375, -6.743408203125, -6.4501953125, -6.156982421875, -5.86376953125, -5.570556640625, -5.27734375, -4.984130859375, -4.69091796875, -4.397705078125, -4.1044921875, -3.811279296875, -3.51806640625, -3.224853515625, -2.931640625, -2.638427734375, -2.34521484375, -2.052001953125, -1.7587890625, -1.465576171875, -1.17236328125, -0.879150390625, -0.5859375, -0.292724609375, 0.00048828125, 0.293701171875, 0.5869140625, 0.880126953125, 1.17333984375, 1.466552734375, 1.759765625, 2.052978515625, 2.34619140625, 2.639404296875, 2.9326171875, 3.225830078125, 3.51904296875, 3.812255859375, 4.10546875, 4.398681640625, 4.69189453125, 4.985107421875, 5.2783203125, 5.571533203125, 5.86474609375, 6.157958984375, 6.451171875, 6.744384765625, 7.03759765625, 7.330810546875, 7.6240234375, 7.917236328125, 8.21044921875, 8.503662109375, 8.796875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 6.0, 4.0, 1.0, 11.0, 12.0, 12.0, 25.0, 18.0, 37.0, 72.0, 109.0, 184.0, 248.0, 486.0, 1091.0, 2931.0, 10671.0, 99042.0, 863978.0, 57002.0, 8070.0, 2454.0, 1002.0, 449.0, 244.0, 137.0, 80.0, 51.0, 37.0, 26.0, 18.0, 13.0, 7.0, 6.0, 9.0, 5.0, 3.0, 5.0, 5.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9443359375, -1.8707122802734375, -1.797088623046875, -1.7234649658203125, -1.64984130859375, -1.5762176513671875, -1.502593994140625, -1.4289703369140625, -1.3553466796875, -1.2817230224609375, -1.208099365234375, -1.1344757080078125, -1.06085205078125, -0.9872283935546875, -0.913604736328125, -0.8399810791015625, -0.766357421875, -0.6927337646484375, -0.619110107421875, -0.5454864501953125, -0.47186279296875, -0.3982391357421875, -0.324615478515625, -0.2509918212890625, -0.1773681640625, -0.1037445068359375, -0.030120849609375, 0.0435028076171875, 0.11712646484375, 0.1907501220703125, 0.264373779296875, 0.3379974365234375, 0.41162109375, 0.4852447509765625, 0.558868408203125, 0.6324920654296875, 0.70611572265625, 0.7797393798828125, 0.853363037109375, 0.9269866943359375, 1.0006103515625, 1.0742340087890625, 1.147857666015625, 1.2214813232421875, 1.29510498046875, 1.3687286376953125, 1.442352294921875, 1.5159759521484375, 1.589599609375, 1.6632232666015625, 1.736846923828125, 1.8104705810546875, 1.88409423828125, 1.9577178955078125, 2.031341552734375, 2.1049652099609375, 2.1785888671875, 2.2522125244140625, 2.325836181640625, 2.3994598388671875, 2.47308349609375, 2.5467071533203125, 2.620330810546875, 2.6939544677734375, 2.767578125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 8.0, 5.0, 12.0, 15.0, 25.0, 54.0, 115.0, 259.0, 237.0, 138.0, 66.0, 24.0, 14.0, 9.0, 9.0, 5.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006961822509765625, -0.0006737560033798218, -0.0006513297557830811, -0.0006289035081863403, -0.0006064772605895996, -0.0005840510129928589, -0.0005616247653961182, -0.0005391985177993774, -0.0005167722702026367, -0.000494346022605896, -0.0004719197750091553, -0.00044949352741241455, -0.00042706727981567383, -0.0004046410322189331, -0.0003822147846221924, -0.00035978853702545166, -0.00033736228942871094, -0.0003149360418319702, -0.0002925097942352295, -0.00027008354663848877, -0.00024765729904174805, -0.00022523105144500732, -0.0002028048038482666, -0.00018037855625152588, -0.00015795230865478516, -0.00013552606105804443, -0.00011309981346130371, -9.067356586456299e-05, -6.824731826782227e-05, -4.582107067108154e-05, -2.339482307434082e-05, -9.685754776000977e-07, 2.1457672119140625e-05, 4.388391971588135e-05, 6.631016731262207e-05, 8.873641490936279e-05, 0.00011116266250610352, 0.00013358891010284424, 0.00015601515769958496, 0.00017844140529632568, 0.0002008676528930664, 0.00022329390048980713, 0.00024572014808654785, 0.0002681463956832886, 0.0002905726432800293, 0.00031299889087677, 0.00033542513847351074, 0.00035785138607025146, 0.0003802776336669922, 0.0004027038812637329, 0.00042513012886047363, 0.00044755637645721436, 0.0004699826240539551, 0.0004924088716506958, 0.0005148351192474365, 0.0005372613668441772, 0.000559687614440918, 0.0005821138620376587, 0.0006045401096343994, 0.0006269663572311401, 0.0006493926048278809, 0.0006718188524246216, 0.0006942451000213623, 0.000716671347618103, 0.0007390975952148438]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 4.0, 3.0, 3.0, 3.0, 6.0, 15.0, 17.0, 16.0, 16.0, 39.0, 50.0, 79.0, 170.0, 279.0, 678.0, 1803.0, 5480.0, 31986.0, 748000.0, 238995.0, 15062.0, 3490.0, 1226.0, 537.0, 255.0, 137.0, 63.0, 39.0, 30.0, 21.0, 19.0, 6.0, 8.0, 9.0, 8.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.037109375, -1.9664306640625, -1.895751953125, -1.8250732421875, -1.75439453125, -1.6837158203125, -1.613037109375, -1.5423583984375, -1.4716796875, -1.4010009765625, -1.330322265625, -1.2596435546875, -1.18896484375, -1.1182861328125, -1.047607421875, -0.9769287109375, -0.90625, -0.8355712890625, -0.764892578125, -0.6942138671875, -0.62353515625, -0.5528564453125, -0.482177734375, -0.4114990234375, -0.3408203125, -0.2701416015625, -0.199462890625, -0.1287841796875, -0.05810546875, 0.0125732421875, 0.083251953125, 0.1539306640625, 0.224609375, 0.2952880859375, 0.365966796875, 0.4366455078125, 0.50732421875, 0.5780029296875, 0.648681640625, 0.7193603515625, 0.7900390625, 0.8607177734375, 0.931396484375, 1.0020751953125, 1.07275390625, 1.1434326171875, 1.214111328125, 1.2847900390625, 1.35546875, 1.4261474609375, 1.496826171875, 1.5675048828125, 1.63818359375, 1.7088623046875, 1.779541015625, 1.8502197265625, 1.9208984375, 1.9915771484375, 2.062255859375, 2.1329345703125, 2.20361328125, 2.2742919921875, 2.344970703125, 2.4156494140625, 2.486328125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 6.0, 2.0, 4.0, 12.0, 14.0, 18.0, 22.0, 33.0, 39.0, 59.0, 73.0, 75.0, 100.0, 97.0, 103.0, 84.0, 64.0, 51.0, 35.0, 21.0, 27.0, 12.0, 6.0, 11.0, 9.0, 7.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.990234375, -1.924652099609375, -1.85906982421875, -1.793487548828125, -1.7279052734375, -1.662322998046875, -1.59674072265625, -1.531158447265625, -1.465576171875, -1.399993896484375, -1.33441162109375, -1.268829345703125, -1.2032470703125, -1.137664794921875, -1.07208251953125, -1.006500244140625, -0.94091796875, -0.875335693359375, -0.80975341796875, -0.744171142578125, -0.6785888671875, -0.613006591796875, -0.54742431640625, -0.481842041015625, -0.416259765625, -0.350677490234375, -0.28509521484375, -0.219512939453125, -0.1539306640625, -0.088348388671875, -0.02276611328125, 0.042816162109375, 0.1083984375, 0.173980712890625, 0.23956298828125, 0.305145263671875, 0.3707275390625, 0.436309814453125, 0.50189208984375, 0.567474365234375, 0.633056640625, 0.698638916015625, 0.76422119140625, 0.829803466796875, 0.8953857421875, 0.960968017578125, 1.02655029296875, 1.092132568359375, 1.15771484375, 1.223297119140625, 1.28887939453125, 1.354461669921875, 1.4200439453125, 1.485626220703125, 1.55120849609375, 1.616790771484375, 1.682373046875, 1.747955322265625, 1.81353759765625, 1.879119873046875, 1.9447021484375, 2.010284423828125, 2.07586669921875, 2.141448974609375, 2.20703125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 3.0, 6.0, 5.0, 11.0, 27.0, 43.0, 60.0, 92.0, 121.0, 169.0, 162.0, 107.0, 85.0, 46.0, 17.0, 17.0, 8.0, 7.0, 4.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.712684631347656, -35.81606674194336, -34.91944885253906, -34.02283477783203, -33.126216888427734, -32.22959899902344, -31.33298110961914, -30.436365127563477, -29.539749145507812, -28.643131256103516, -27.74651527404785, -26.849897384643555, -25.95328140258789, -25.056663513183594, -24.160045623779297, -23.263429641723633, -22.366811752319336, -21.47019386291504, -20.573577880859375, -19.676959991455078, -18.780344009399414, -17.883726119995117, -16.987110137939453, -16.090492248535156, -15.193875312805176, -14.297258377075195, -13.400641441345215, -12.504024505615234, -11.607406616210938, -10.710790634155273, -9.814172744750977, -8.917555809020996, -8.020936965942383, -7.124320030212402, -6.227703094482422, -5.331085681915283, -4.434468746185303, -3.5378518104553223, -2.6412343978881836, -1.7446174621582031, -0.8480005264282227, 0.04861652851104736, 0.9452335834503174, 1.841850757598877, 2.7384676933288574, 3.635084629058838, 4.531702041625977, 5.428318977355957, 6.3249359130859375, 7.221552848815918, 8.118169784545898, 9.014787673950195, 9.91140365600586, 10.808021545410156, 11.704638481140137, 12.601255416870117, 13.497872352600098, 14.394489288330078, 15.291106224060059, 16.18772315979004, 17.084341049194336, 17.98095703125, 18.877574920654297, 19.774192810058594, 20.670808792114258]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 8.0, 3.0, 7.0, 17.0, 31.0, 49.0, 55.0, 60.0, 67.0, 94.0, 119.0, 95.0, 95.0, 85.0, 74.0, 47.0, 32.0, 34.0, 13.0, 13.0, 6.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-78.02153778076172, -76.28306579589844, -74.54458618164062, -72.80611419677734, -71.06764221191406, -69.32916259765625, -67.59069061279297, -65.85221099853516, -64.11373901367188, -62.37526321411133, -60.63678741455078, -58.8983154296875, -57.15983963012695, -55.421363830566406, -53.682891845703125, -51.94441604614258, -50.20594024658203, -48.467464447021484, -46.72898864746094, -44.990516662597656, -43.25204086303711, -41.51356506347656, -39.77509307861328, -38.036617279052734, -36.29814147949219, -34.55966567993164, -32.821189880371094, -31.082717895507812, -29.344242095947266, -27.60576629638672, -25.867292404174805, -24.12881851196289, -22.390342712402344, -20.651866912841797, -18.913393020629883, -17.17491912841797, -15.436443328857422, -13.697968482971191, -11.959493637084961, -10.22101879119873, -8.4825439453125, -6.7440690994262695, -5.005594253540039, -3.2671194076538086, -1.5286445617675781, 0.20983028411865234, 1.9483051300048828, 3.6867799758911133, 5.425254821777344, 7.163729667663574, 8.902204513549805, 10.640679359436035, 12.379154205322266, 14.117629051208496, 15.856103897094727, 17.59457778930664, 19.333053588867188, 21.071529388427734, 22.81000328063965, 24.548477172851562, 26.28695297241211, 28.025428771972656, 29.76390266418457, 31.502376556396484, 33.24085235595703]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 4.0, 2.0, 5.0, 8.0, 8.0, 12.0, 13.0, 15.0, 31.0, 31.0, 43.0, 62.0, 84.0, 184.0, 399.0, 1238.0, 7205.0, 451409.0, 3713498.0, 16295.0, 2541.0, 732.0, 266.0, 74.0, 43.0, 27.0, 21.0, 7.0, 7.0, 7.0, 3.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.70703125, -7.481201171875, -7.25537109375, -7.029541015625, -6.8037109375, -6.577880859375, -6.35205078125, -6.126220703125, -5.900390625, -5.674560546875, -5.44873046875, -5.222900390625, -4.9970703125, -4.771240234375, -4.54541015625, -4.319580078125, -4.09375, -3.867919921875, -3.64208984375, -3.416259765625, -3.1904296875, -2.964599609375, -2.73876953125, -2.512939453125, -2.287109375, -2.061279296875, -1.83544921875, -1.609619140625, -1.3837890625, -1.157958984375, -0.93212890625, -0.706298828125, -0.48046875, -0.254638671875, -0.02880859375, 0.197021484375, 0.4228515625, 0.648681640625, 0.87451171875, 1.100341796875, 1.326171875, 1.552001953125, 1.77783203125, 2.003662109375, 2.2294921875, 2.455322265625, 2.68115234375, 2.906982421875, 3.1328125, 3.358642578125, 3.58447265625, 3.810302734375, 4.0361328125, 4.261962890625, 4.48779296875, 4.713623046875, 4.939453125, 5.165283203125, 5.39111328125, 5.616943359375, 5.8427734375, 6.068603515625, 6.29443359375, 6.520263671875, 6.74609375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 5.0, 15.0, 52.0, 108.0, 154.0, 221.0, 201.0, 137.0, 81.0, 27.0, 10.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.78125, -9.588287353515625, -9.39532470703125, -9.202362060546875, -9.0093994140625, -8.816436767578125, -8.62347412109375, -8.430511474609375, -8.237548828125, -8.044586181640625, -7.85162353515625, -7.658660888671875, -7.4656982421875, -7.272735595703125, -7.07977294921875, -6.886810302734375, -6.69384765625, -6.500885009765625, -6.30792236328125, -6.114959716796875, -5.9219970703125, -5.729034423828125, -5.53607177734375, -5.343109130859375, -5.150146484375, -4.957183837890625, -4.76422119140625, -4.571258544921875, -4.3782958984375, -4.185333251953125, -3.99237060546875, -3.799407958984375, -3.6064453125, -3.413482666015625, -3.22052001953125, -3.027557373046875, -2.8345947265625, -2.641632080078125, -2.44866943359375, -2.255706787109375, -2.062744140625, -1.869781494140625, -1.67681884765625, -1.483856201171875, -1.2908935546875, -1.097930908203125, -0.90496826171875, -0.712005615234375, -0.51904296875, -0.326080322265625, -0.13311767578125, 0.059844970703125, 0.2528076171875, 0.445770263671875, 0.63873291015625, 0.831695556640625, 1.024658203125, 1.217620849609375, 1.41058349609375, 1.603546142578125, 1.7965087890625, 1.989471435546875, 2.18243408203125, 2.375396728515625, 2.568359375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 5.0, 10.0, 10.0, 20.0, 37.0, 54.0, 140.0, 200.0, 408.0, 828.0, 2165.0, 6598.0, 26330.0, 320949.0, 3735721.0, 79598.0, 14200.0, 4152.0, 1598.0, 660.0, 294.0, 138.0, 65.0, 44.0, 25.0, 13.0, 10.0, 7.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-6.21484375, -6.074462890625, -5.93408203125, -5.793701171875, -5.6533203125, -5.512939453125, -5.37255859375, -5.232177734375, -5.091796875, -4.951416015625, -4.81103515625, -4.670654296875, -4.5302734375, -4.389892578125, -4.24951171875, -4.109130859375, -3.96875, -3.828369140625, -3.68798828125, -3.547607421875, -3.4072265625, -3.266845703125, -3.12646484375, -2.986083984375, -2.845703125, -2.705322265625, -2.56494140625, -2.424560546875, -2.2841796875, -2.143798828125, -2.00341796875, -1.863037109375, -1.72265625, -1.582275390625, -1.44189453125, -1.301513671875, -1.1611328125, -1.020751953125, -0.88037109375, -0.739990234375, -0.599609375, -0.459228515625, -0.31884765625, -0.178466796875, -0.0380859375, 0.102294921875, 0.24267578125, 0.383056640625, 0.5234375, 0.663818359375, 0.80419921875, 0.944580078125, 1.0849609375, 1.225341796875, 1.36572265625, 1.506103515625, 1.646484375, 1.786865234375, 1.92724609375, 2.067626953125, 2.2080078125, 2.348388671875, 2.48876953125, 2.629150390625, 2.76953125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 6.0, 4.0, 5.0, 8.0, 12.0, 14.0, 10.0, 23.0, 46.0, 98.0, 304.0, 1242.0, 1480.0, 467.0, 158.0, 69.0, 43.0, 23.0, 25.0, 10.0, 5.0, 5.0, 5.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.01171875, -5.8541259765625, -5.696533203125, -5.5389404296875, -5.38134765625, -5.2237548828125, -5.066162109375, -4.9085693359375, -4.7509765625, -4.5933837890625, -4.435791015625, -4.2781982421875, -4.12060546875, -3.9630126953125, -3.805419921875, -3.6478271484375, -3.490234375, -3.3326416015625, -3.175048828125, -3.0174560546875, -2.85986328125, -2.7022705078125, -2.544677734375, -2.3870849609375, -2.2294921875, -2.0718994140625, -1.914306640625, -1.7567138671875, -1.59912109375, -1.4415283203125, -1.283935546875, -1.1263427734375, -0.96875, -0.8111572265625, -0.653564453125, -0.4959716796875, -0.33837890625, -0.1807861328125, -0.023193359375, 0.1343994140625, 0.2919921875, 0.4495849609375, 0.607177734375, 0.7647705078125, 0.92236328125, 1.0799560546875, 1.237548828125, 1.3951416015625, 1.552734375, 1.7103271484375, 1.867919921875, 2.0255126953125, 2.18310546875, 2.3406982421875, 2.498291015625, 2.6558837890625, 2.8134765625, 2.9710693359375, 3.128662109375, 3.2862548828125, 3.44384765625, 3.6014404296875, 3.759033203125, 3.9166259765625, 4.07421875]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 2.0, 7.0, 11.0, 18.0, 58.0, 196.0, 288.0, 243.0, 99.0, 39.0, 19.0, 6.0, 8.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.51406478881836, -22.253549575805664, -20.99303436279297, -19.73251724243164, -18.472002029418945, -17.21148681640625, -15.950971603393555, -14.690455436706543, -13.429940223693848, -12.169425010681152, -10.90890884399414, -9.648393630981445, -8.38787841796875, -7.127362251281738, -5.866847038269043, -4.606330871582031, -3.345815658569336, -2.0852999687194824, -0.824784517288208, 0.4357309341430664, 1.69624662399292, 2.9567623138427734, 4.217277526855469, 5.4777936935424805, 6.738308906555176, 7.998824596405029, 9.259340286254883, 10.519855499267578, 11.780370712280273, 13.040886878967285, 14.30140209197998, 15.561918258666992, 16.822433471679688, 18.082948684692383, 19.343463897705078, 20.603981018066406, 21.8644962310791, 23.125011444091797, 24.385526657104492, 25.646041870117188, 26.906558990478516, 28.16707420349121, 29.427589416503906, 30.688106536865234, 31.94862174987793, 33.209136962890625, 34.46965026855469, 35.730167388916016, 36.990684509277344, 38.25120162963867, 39.511714935302734, 40.77223205566406, 42.032745361328125, 43.29326248168945, 44.55377960205078, 45.814292907714844, 47.074806213378906, 48.335323333740234, 49.5958366394043, 50.856353759765625, 52.11686706542969, 53.377384185791016, 54.637901306152344, 55.898414611816406, 57.158931732177734]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 7.0, 12.0, 10.0, 14.0, 21.0, 30.0, 44.0, 56.0, 77.0, 77.0, 91.0, 90.0, 104.0, 77.0, 64.0, 58.0, 61.0, 39.0, 31.0, 16.0, 8.0, 7.0, 8.0, 5.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.051332473754883, -14.153173446655273, -13.255014419555664, -12.356855392456055, -11.458696365356445, -10.560537338256836, -9.662378311157227, -8.764219284057617, -7.866060256958008, -6.967901229858398, -6.069742202758789, -5.17158317565918, -4.27342414855957, -3.375265121459961, -2.4771060943603516, -1.5789470672607422, -0.6807880401611328, 0.21737098693847656, 1.115530014038086, 2.0136890411376953, 2.9118480682373047, 3.810007095336914, 4.708166122436523, 5.606325149536133, 6.504484176635742, 7.402643203735352, 8.300802230834961, 9.19896125793457, 10.09712028503418, 10.995279312133789, 11.893438339233398, 12.791597366333008, 13.68975830078125, 14.58791732788086, 15.486076354980469, 16.384235382080078, 17.282394409179688, 18.180553436279297, 19.078712463378906, 19.976871490478516, 20.875030517578125, 21.773189544677734, 22.671348571777344, 23.569507598876953, 24.467666625976562, 25.365825653076172, 26.26398468017578, 27.16214370727539, 28.060302734375, 28.95846176147461, 29.85662078857422, 30.754779815673828, 31.652938842773438, 32.55109786987305, 33.449256896972656, 34.347415924072266, 35.245574951171875, 36.143733978271484, 37.041893005371094, 37.9400520324707, 38.83821105957031, 39.73637008666992, 40.63452911376953, 41.53268814086914, 42.43084716796875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 5.0, 6.0, 7.0, 15.0, 23.0, 64.0, 97.0, 217.0, 423.0, 1141.0, 3562.0, 15098.0, 84270.0, 543181.0, 337593.0, 49147.0, 9670.0, 2513.0, 822.0, 357.0, 157.0, 77.0, 43.0, 25.0, 20.0, 17.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.25390625, -5.1151123046875, -4.976318359375, -4.8375244140625, -4.69873046875, -4.5599365234375, -4.421142578125, -4.2823486328125, -4.1435546875, -4.0047607421875, -3.865966796875, -3.7271728515625, -3.58837890625, -3.4495849609375, -3.310791015625, -3.1719970703125, -3.033203125, -2.8944091796875, -2.755615234375, -2.6168212890625, -2.47802734375, -2.3392333984375, -2.200439453125, -2.0616455078125, -1.9228515625, -1.7840576171875, -1.645263671875, -1.5064697265625, -1.36767578125, -1.2288818359375, -1.090087890625, -0.9512939453125, -0.8125, -0.6737060546875, -0.534912109375, -0.3961181640625, -0.25732421875, -0.1185302734375, 0.020263671875, 0.1590576171875, 0.2978515625, 0.4366455078125, 0.575439453125, 0.7142333984375, 0.85302734375, 0.9918212890625, 1.130615234375, 1.2694091796875, 1.408203125, 1.5469970703125, 1.685791015625, 1.8245849609375, 1.96337890625, 2.1021728515625, 2.240966796875, 2.3797607421875, 2.5185546875, 2.6573486328125, 2.796142578125, 2.9349365234375, 3.07373046875, 3.2125244140625, 3.351318359375, 3.4901123046875, 3.62890625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 4.0, 11.0, 12.0, 20.0, 25.0, 39.0, 53.0, 53.0, 56.0, 87.0, 82.0, 85.0, 76.0, 79.0, 86.0, 67.0, 48.0, 35.0, 29.0, 22.0, 14.0, 12.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-3.6875, -3.608306884765625, -3.52911376953125, -3.449920654296875, -3.3707275390625, -3.291534423828125, -3.21234130859375, -3.133148193359375, -3.053955078125, -2.974761962890625, -2.89556884765625, -2.816375732421875, -2.7371826171875, -2.657989501953125, -2.57879638671875, -2.499603271484375, -2.42041015625, -2.341217041015625, -2.26202392578125, -2.182830810546875, -2.1036376953125, -2.024444580078125, -1.94525146484375, -1.866058349609375, -1.786865234375, -1.707672119140625, -1.62847900390625, -1.549285888671875, -1.4700927734375, -1.390899658203125, -1.31170654296875, -1.232513427734375, -1.1533203125, -1.074127197265625, -0.99493408203125, -0.915740966796875, -0.8365478515625, -0.757354736328125, -0.67816162109375, -0.598968505859375, -0.519775390625, -0.440582275390625, -0.36138916015625, -0.282196044921875, -0.2030029296875, -0.123809814453125, -0.04461669921875, 0.034576416015625, 0.11376953125, 0.192962646484375, 0.27215576171875, 0.351348876953125, 0.4305419921875, 0.509735107421875, 0.58892822265625, 0.668121337890625, 0.747314453125, 0.826507568359375, 0.90570068359375, 0.984893798828125, 1.0640869140625, 1.143280029296875, 1.22247314453125, 1.301666259765625, 1.380859375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 7.0, 1.0, 3.0, 3.0, 4.0, 8.0, 11.0, 24.0, 21.0, 32.0, 52.0, 89.0, 176.0, 330.0, 693.0, 1877.0, 6741.0, 53542.0, 764973.0, 198980.0, 15688.0, 3208.0, 1082.0, 474.0, 217.0, 114.0, 74.0, 51.0, 31.0, 19.0, 13.0, 9.0, 5.0, 3.0, 6.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1328125, -4.933349609375, -4.73388671875, -4.534423828125, -4.3349609375, -4.135498046875, -3.93603515625, -3.736572265625, -3.537109375, -3.337646484375, -3.13818359375, -2.938720703125, -2.7392578125, -2.539794921875, -2.34033203125, -2.140869140625, -1.94140625, -1.741943359375, -1.54248046875, -1.343017578125, -1.1435546875, -0.944091796875, -0.74462890625, -0.545166015625, -0.345703125, -0.146240234375, 0.05322265625, 0.252685546875, 0.4521484375, 0.651611328125, 0.85107421875, 1.050537109375, 1.25, 1.449462890625, 1.64892578125, 1.848388671875, 2.0478515625, 2.247314453125, 2.44677734375, 2.646240234375, 2.845703125, 3.045166015625, 3.24462890625, 3.444091796875, 3.6435546875, 3.843017578125, 4.04248046875, 4.241943359375, 4.44140625, 4.640869140625, 4.84033203125, 5.039794921875, 5.2392578125, 5.438720703125, 5.63818359375, 5.837646484375, 6.037109375, 6.236572265625, 6.43603515625, 6.635498046875, 6.8349609375, 7.034423828125, 7.23388671875, 7.433349609375, 7.6328125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 6.0, 4.0, 7.0, 12.0, 16.0, 18.0, 19.0, 31.0, 43.0, 53.0, 64.0, 62.0, 60.0, 62.0, 67.0, 72.0, 65.0, 58.0, 61.0, 37.0, 26.0, 38.0, 35.0, 28.0, 21.0, 10.0, 7.0, 2.0, 5.0, 4.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.72265625, -7.4783935546875, -7.234130859375, -6.9898681640625, -6.74560546875, -6.5013427734375, -6.257080078125, -6.0128173828125, -5.7685546875, -5.5242919921875, -5.280029296875, -5.0357666015625, -4.79150390625, -4.5472412109375, -4.302978515625, -4.0587158203125, -3.814453125, -3.5701904296875, -3.325927734375, -3.0816650390625, -2.83740234375, -2.5931396484375, -2.348876953125, -2.1046142578125, -1.8603515625, -1.6160888671875, -1.371826171875, -1.1275634765625, -0.88330078125, -0.6390380859375, -0.394775390625, -0.1505126953125, 0.09375, 0.3380126953125, 0.582275390625, 0.8265380859375, 1.07080078125, 1.3150634765625, 1.559326171875, 1.8035888671875, 2.0478515625, 2.2921142578125, 2.536376953125, 2.7806396484375, 3.02490234375, 3.2691650390625, 3.513427734375, 3.7576904296875, 4.001953125, 4.2462158203125, 4.490478515625, 4.7347412109375, 4.97900390625, 5.2232666015625, 5.467529296875, 5.7117919921875, 5.9560546875, 6.2003173828125, 6.444580078125, 6.6888427734375, 6.93310546875, 7.1773681640625, 7.421630859375, 7.6658935546875, 7.91015625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 6.0, 11.0, 15.0, 28.0, 53.0, 89.0, 222.0, 638.0, 2869.0, 39507.0, 935631.0, 64528.0, 3692.0, 771.0, 248.0, 92.0, 56.0, 34.0, 21.0, 15.0, 6.0, 4.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.818359375, -3.716705322265625, -3.61505126953125, -3.513397216796875, -3.4117431640625, -3.310089111328125, -3.20843505859375, -3.106781005859375, -3.005126953125, -2.903472900390625, -2.80181884765625, -2.700164794921875, -2.5985107421875, -2.496856689453125, -2.39520263671875, -2.293548583984375, -2.19189453125, -2.090240478515625, -1.98858642578125, -1.886932373046875, -1.7852783203125, -1.683624267578125, -1.58197021484375, -1.480316162109375, -1.378662109375, -1.277008056640625, -1.17535400390625, -1.073699951171875, -0.9720458984375, -0.870391845703125, -0.76873779296875, -0.667083740234375, -0.5654296875, -0.463775634765625, -0.36212158203125, -0.260467529296875, -0.1588134765625, -0.057159423828125, 0.04449462890625, 0.146148681640625, 0.247802734375, 0.349456787109375, 0.45111083984375, 0.552764892578125, 0.6544189453125, 0.756072998046875, 0.85772705078125, 0.959381103515625, 1.06103515625, 1.162689208984375, 1.26434326171875, 1.365997314453125, 1.4676513671875, 1.569305419921875, 1.67095947265625, 1.772613525390625, 1.874267578125, 1.975921630859375, 2.07757568359375, 2.179229736328125, 2.2808837890625, 2.382537841796875, 2.48419189453125, 2.585845947265625, 2.6875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 8.0, 4.0, 7.0, 15.0, 28.0, 17.0, 29.0, 34.0, 50.0, 66.0, 60.0, 96.0, 99.0, 97.0, 87.0, 63.0, 54.0, 50.0, 33.0, 34.0, 21.0, 12.0, 14.0, 6.0, 7.0, 4.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0003509521484375, -0.00034191086888313293, -0.00033286958932876587, -0.0003238283097743988, -0.00031478703022003174, -0.00030574575066566467, -0.0002967044711112976, -0.00028766319155693054, -0.0002786219120025635, -0.0002695806324481964, -0.00026053935289382935, -0.0002514980733394623, -0.00024245679378509521, -0.00023341551423072815, -0.00022437423467636108, -0.00021533295512199402, -0.00020629167556762695, -0.0001972503960132599, -0.00018820911645889282, -0.00017916783690452576, -0.0001701265573501587, -0.00016108527779579163, -0.00015204399824142456, -0.0001430027186870575, -0.00013396143913269043, -0.00012492015957832336, -0.0001158788800239563, -0.00010683760046958923, -9.779632091522217e-05, -8.87550413608551e-05, -7.971376180648804e-05, -7.067248225212097e-05, -6.16312026977539e-05, -5.258992314338684e-05, -4.3548643589019775e-05, -3.450736403465271e-05, -2.5466084480285645e-05, -1.642480492591858e-05, -7.383525371551514e-06, 1.6577541828155518e-06, 1.0699033737182617e-05, 1.9740313291549683e-05, 2.8781592845916748e-05, 3.7822872400283813e-05, 4.686415195465088e-05, 5.5905431509017944e-05, 6.494671106338501e-05, 7.398799061775208e-05, 8.302927017211914e-05, 9.20705497264862e-05, 0.00010111182928085327, 0.00011015310883522034, 0.0001191943883895874, 0.00012823566794395447, 0.00013727694749832153, 0.0001463182270526886, 0.00015535950660705566, 0.00016440078616142273, 0.0001734420657157898, 0.00018248334527015686, 0.00019152462482452393, 0.000200565904378891, 0.00020960718393325806, 0.00021864846348762512, 0.0002276897430419922]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 4.0, 5.0, 8.0, 10.0, 16.0, 18.0, 29.0, 66.0, 105.0, 187.0, 343.0, 680.0, 1749.0, 6217.0, 42863.0, 646300.0, 319513.0, 23642.0, 4177.0, 1339.0, 585.0, 263.0, 159.0, 102.0, 61.0, 41.0, 14.0, 14.0, 12.0, 6.0, 8.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.12890625, -2.0711669921875, -2.013427734375, -1.9556884765625, -1.89794921875, -1.8402099609375, -1.782470703125, -1.7247314453125, -1.6669921875, -1.6092529296875, -1.551513671875, -1.4937744140625, -1.43603515625, -1.3782958984375, -1.320556640625, -1.2628173828125, -1.205078125, -1.1473388671875, -1.089599609375, -1.0318603515625, -0.97412109375, -0.9163818359375, -0.858642578125, -0.8009033203125, -0.7431640625, -0.6854248046875, -0.627685546875, -0.5699462890625, -0.51220703125, -0.4544677734375, -0.396728515625, -0.3389892578125, -0.28125, -0.2235107421875, -0.165771484375, -0.1080322265625, -0.05029296875, 0.0074462890625, 0.065185546875, 0.1229248046875, 0.1806640625, 0.2384033203125, 0.296142578125, 0.3538818359375, 0.41162109375, 0.4693603515625, 0.527099609375, 0.5848388671875, 0.642578125, 0.7003173828125, 0.758056640625, 0.8157958984375, 0.87353515625, 0.9312744140625, 0.989013671875, 1.0467529296875, 1.1044921875, 1.1622314453125, 1.219970703125, 1.2777099609375, 1.33544921875, 1.3931884765625, 1.450927734375, 1.5086669921875, 1.56640625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 7.0, 5.0, 9.0, 12.0, 19.0, 35.0, 30.0, 55.0, 85.0, 81.0, 126.0, 128.0, 102.0, 101.0, 68.0, 52.0, 37.0, 19.0, 20.0, 6.0, 5.0, 6.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3125, -3.237518310546875, -3.16253662109375, -3.087554931640625, -3.0125732421875, -2.937591552734375, -2.86260986328125, -2.787628173828125, -2.712646484375, -2.637664794921875, -2.56268310546875, -2.487701416015625, -2.4127197265625, -2.337738037109375, -2.26275634765625, -2.187774658203125, -2.11279296875, -2.037811279296875, -1.96282958984375, -1.887847900390625, -1.8128662109375, -1.737884521484375, -1.66290283203125, -1.587921142578125, -1.512939453125, -1.437957763671875, -1.36297607421875, -1.287994384765625, -1.2130126953125, -1.138031005859375, -1.06304931640625, -0.988067626953125, -0.9130859375, -0.838104248046875, -0.76312255859375, -0.688140869140625, -0.6131591796875, -0.538177490234375, -0.46319580078125, -0.388214111328125, -0.313232421875, -0.238250732421875, -0.16326904296875, -0.088287353515625, -0.0133056640625, 0.061676025390625, 0.13665771484375, 0.211639404296875, 0.28662109375, 0.361602783203125, 0.43658447265625, 0.511566162109375, 0.5865478515625, 0.661529541015625, 0.73651123046875, 0.811492919921875, 0.886474609375, 0.961456298828125, 1.03643798828125, 1.111419677734375, 1.1864013671875, 1.261383056640625, 1.33636474609375, 1.411346435546875, 1.486328125]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 7.0, 12.0, 58.0, 246.0, 453.0, 173.0, 40.0, 11.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.93656921386719, -70.539794921875, -68.14302825927734, -65.74625396728516, -63.3494873046875, -60.95271301269531, -58.55594253540039, -56.15917205810547, -53.76240158081055, -51.365631103515625, -48.9688606262207, -46.57209014892578, -44.175315856933594, -41.77854919433594, -39.38177490234375, -36.98500442504883, -34.588233947753906, -32.191463470458984, -29.794692993164062, -27.397920608520508, -25.001150131225586, -22.604379653930664, -20.20760726928711, -17.810836791992188, -15.414066314697266, -13.017295837402344, -10.620524406433105, -8.223752975463867, -5.826982498168945, -3.4302120208740234, -1.0334405899047852, 1.3633308410644531, 3.760101318359375, 6.156872272491455, 8.553643226623535, 10.950414657592773, 13.347185134887695, 15.743955612182617, 18.140727996826172, 20.537498474121094, 22.934268951416016, 25.331039428710938, 27.72780990600586, 30.124582290649414, 32.52135467529297, 34.918121337890625, 37.31489562988281, 39.711666107177734, 42.108436584472656, 44.50520706176758, 46.9019775390625, 49.29874801635742, 51.695518493652344, 54.09229278564453, 56.48906326293945, 58.885833740234375, 61.2826042175293, 63.67937469482422, 66.0761489868164, 68.47291564941406, 70.86968994140625, 73.2664566040039, 75.6632308959961, 78.05999755859375, 80.45677185058594]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 5.0, 5.0, 3.0, 11.0, 14.0, 17.0, 25.0, 30.0, 35.0, 35.0, 42.0, 55.0, 65.0, 80.0, 75.0, 116.0, 57.0, 61.0, 53.0, 48.0, 31.0, 34.0, 40.0, 26.0, 17.0, 10.0, 7.0, 6.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.69707489013672, -35.58203887939453, -34.467002868652344, -33.351966857910156, -32.23693084716797, -31.12189292907715, -30.006855010986328, -28.89181900024414, -27.776782989501953, -26.661746978759766, -25.546710968017578, -24.431673049926758, -23.31663703918457, -22.201601028442383, -21.086563110351562, -19.971527099609375, -18.856491088867188, -17.741455078125, -16.626419067382812, -15.511381149291992, -14.396345138549805, -13.281309127807617, -12.166272163391113, -11.05123519897461, -9.936199188232422, -8.821163177490234, -7.7061262130737305, -6.591089725494385, -5.476053237915039, -4.361016750335693, -3.2459802627563477, -2.130943775177002, -1.0159072875976562, 0.09912919998168945, 1.2141656875610352, 2.329202175140381, 3.4442386627197266, 4.559275150299072, 5.674311637878418, 6.789348125457764, 7.904384613037109, 9.019420623779297, 10.1344575881958, 11.249494552612305, 12.364530563354492, 13.47956657409668, 14.594603538513184, 15.709640502929688, 16.824676513671875, 17.939712524414062, 19.05474853515625, 20.16978645324707, 21.284822463989258, 22.399858474731445, 23.514896392822266, 24.629932403564453, 25.74496841430664, 26.860004425048828, 27.975040435791016, 29.090078353881836, 30.205114364624023, 31.32015037536621, 32.43518829345703, 33.55022430419922, 34.665260314941406]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 4.0, 4.0, 5.0, 9.0, 10.0, 11.0, 15.0, 20.0, 19.0, 37.0, 33.0, 54.0, 90.0, 118.0, 173.0, 342.0, 649.0, 1307.0, 3018.0, 7338.0, 23637.0, 133898.0, 1574841.0, 2205906.0, 191774.0, 32914.0, 10139.0, 4200.0, 1881.0, 888.0, 447.0, 239.0, 119.0, 70.0, 37.0, 19.0, 6.0, 7.0, 4.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.552734375, -2.4948272705078125, -2.436920166015625, -2.3790130615234375, -2.32110595703125, -2.2631988525390625, -2.205291748046875, -2.1473846435546875, -2.0894775390625, -2.0315704345703125, -1.973663330078125, -1.9157562255859375, -1.85784912109375, -1.7999420166015625, -1.742034912109375, -1.6841278076171875, -1.626220703125, -1.5683135986328125, -1.510406494140625, -1.4524993896484375, -1.39459228515625, -1.3366851806640625, -1.278778076171875, -1.2208709716796875, -1.1629638671875, -1.1050567626953125, -1.047149658203125, -0.9892425537109375, -0.93133544921875, -0.8734283447265625, -0.815521240234375, -0.7576141357421875, -0.69970703125, -0.6417999267578125, -0.583892822265625, -0.5259857177734375, -0.46807861328125, -0.4101715087890625, -0.352264404296875, -0.2943572998046875, -0.2364501953125, -0.1785430908203125, -0.120635986328125, -0.0627288818359375, -0.00482177734375, 0.0530853271484375, 0.110992431640625, 0.1688995361328125, 0.226806640625, 0.2847137451171875, 0.342620849609375, 0.4005279541015625, 0.45843505859375, 0.5163421630859375, 0.574249267578125, 0.6321563720703125, 0.6900634765625, 0.7479705810546875, 0.805877685546875, 0.8637847900390625, 0.92169189453125, 0.9795989990234375, 1.037506103515625, 1.0954132080078125, 1.1533203125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 7.0, 11.0, 15.0, 24.0, 32.0, 63.0, 70.0, 68.0, 67.0, 96.0, 94.0, 84.0, 90.0, 73.0, 60.0, 47.0, 43.0, 29.0, 16.0, 8.0, 6.0, 6.0, 3.0, 1.0], "bins": [-3.7890625, -3.71392822265625, -3.6387939453125, -3.56365966796875, -3.488525390625, -3.41339111328125, -3.3382568359375, -3.26312255859375, -3.18798828125, -3.11285400390625, -3.0377197265625, -2.96258544921875, -2.887451171875, -2.81231689453125, -2.7371826171875, -2.66204833984375, -2.5869140625, -2.51177978515625, -2.4366455078125, -2.36151123046875, -2.286376953125, -2.21124267578125, -2.1361083984375, -2.06097412109375, -1.98583984375, -1.91070556640625, -1.8355712890625, -1.76043701171875, -1.685302734375, -1.61016845703125, -1.5350341796875, -1.45989990234375, -1.384765625, -1.30963134765625, -1.2344970703125, -1.15936279296875, -1.084228515625, -1.00909423828125, -0.9339599609375, -0.85882568359375, -0.78369140625, -0.70855712890625, -0.6334228515625, -0.55828857421875, -0.483154296875, -0.40802001953125, -0.3328857421875, -0.25775146484375, -0.1826171875, -0.10748291015625, -0.0323486328125, 0.04278564453125, 0.117919921875, 0.19305419921875, 0.2681884765625, 0.34332275390625, 0.41845703125, 0.49359130859375, 0.5687255859375, 0.64385986328125, 0.718994140625, 0.79412841796875, 0.8692626953125, 0.94439697265625, 1.01953125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 7.0, 5.0, 6.0, 5.0, 19.0, 20.0, 39.0, 59.0, 104.0, 222.0, 469.0, 1238.0, 4406.0, 24762.0, 354711.0, 3668403.0, 120029.0, 14291.0, 3448.0, 1136.0, 442.0, 191.0, 135.0, 47.0, 31.0, 22.0, 14.0, 7.0, 2.0, 8.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.205078125, -3.083282470703125, -2.96148681640625, -2.839691162109375, -2.7178955078125, -2.596099853515625, -2.47430419921875, -2.352508544921875, -2.230712890625, -2.108917236328125, -1.98712158203125, -1.865325927734375, -1.7435302734375, -1.621734619140625, -1.49993896484375, -1.378143310546875, -1.25634765625, -1.134552001953125, -1.01275634765625, -0.890960693359375, -0.7691650390625, -0.647369384765625, -0.52557373046875, -0.403778076171875, -0.281982421875, -0.160186767578125, -0.03839111328125, 0.083404541015625, 0.2052001953125, 0.326995849609375, 0.44879150390625, 0.570587158203125, 0.6923828125, 0.814178466796875, 0.93597412109375, 1.057769775390625, 1.1795654296875, 1.301361083984375, 1.42315673828125, 1.544952392578125, 1.666748046875, 1.788543701171875, 1.91033935546875, 2.032135009765625, 2.1539306640625, 2.275726318359375, 2.39752197265625, 2.519317626953125, 2.64111328125, 2.762908935546875, 2.88470458984375, 3.006500244140625, 3.1282958984375, 3.250091552734375, 3.37188720703125, 3.493682861328125, 3.615478515625, 3.737274169921875, 3.85906982421875, 3.980865478515625, 4.1026611328125, 4.224456787109375, 4.34625244140625, 4.468048095703125, 4.58984375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 7.0, 2.0, 5.0, 4.0, 9.0, 12.0, 16.0, 14.0, 36.0, 28.0, 40.0, 65.0, 105.0, 206.0, 367.0, 721.0, 890.0, 592.0, 313.0, 202.0, 116.0, 70.0, 60.0, 43.0, 49.0, 18.0, 16.0, 18.0, 10.0, 8.0, 7.0, 5.0, 4.0, 5.0, 5.0, 2.0, 2.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.826171875, -2.736358642578125, -2.64654541015625, -2.556732177734375, -2.4669189453125, -2.377105712890625, -2.28729248046875, -2.197479248046875, -2.107666015625, -2.017852783203125, -1.92803955078125, -1.838226318359375, -1.7484130859375, -1.658599853515625, -1.56878662109375, -1.478973388671875, -1.38916015625, -1.299346923828125, -1.20953369140625, -1.119720458984375, -1.0299072265625, -0.940093994140625, -0.85028076171875, -0.760467529296875, -0.670654296875, -0.580841064453125, -0.49102783203125, -0.401214599609375, -0.3114013671875, -0.221588134765625, -0.13177490234375, -0.041961669921875, 0.0478515625, 0.137664794921875, 0.22747802734375, 0.317291259765625, 0.4071044921875, 0.496917724609375, 0.58673095703125, 0.676544189453125, 0.766357421875, 0.856170654296875, 0.94598388671875, 1.035797119140625, 1.1256103515625, 1.215423583984375, 1.30523681640625, 1.395050048828125, 1.48486328125, 1.574676513671875, 1.66448974609375, 1.754302978515625, 1.8441162109375, 1.933929443359375, 2.02374267578125, 2.113555908203125, 2.203369140625, 2.293182373046875, 2.38299560546875, 2.472808837890625, 2.5626220703125, 2.652435302734375, 2.74224853515625, 2.832061767578125, 2.921875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 3.0, 16.0, 60.0, 170.0, 312.0, 240.0, 120.0, 38.0, 19.0, 8.0, 2.0, 7.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.404640197753906, -28.107379913330078, -26.810117721557617, -25.51285743713379, -24.215595245361328, -22.9183349609375, -21.621074676513672, -20.323814392089844, -19.026552200317383, -17.729291915893555, -16.432029724121094, -15.134769439697266, -13.837508201599121, -12.540246963500977, -11.242986679077148, -9.945725440979004, -8.64846420288086, -7.351202964782715, -6.0539422035217285, -4.756681442260742, -3.4594202041625977, -2.162158966064453, -0.8648982048034668, 0.43236255645751953, 1.729623794555664, 3.0268847942352295, 4.324145793914795, 5.621406555175781, 6.918667793273926, 8.21592903137207, 9.513189315795898, 10.810450553894043, 12.107707977294922, 13.404969215393066, 14.702230453491211, 15.999490737915039, 17.2967529296875, 18.594013214111328, 19.891273498535156, 21.188533782958984, 22.485795974731445, 23.783056259155273, 25.080318450927734, 26.377578735351562, 27.67483901977539, 28.97210121154785, 30.26936149597168, 31.56662368774414, 32.86388397216797, 34.1611442565918, 35.458404541015625, 36.75566864013672, 38.05292892456055, 39.350189208984375, 40.6474494934082, 41.94470977783203, 43.241973876953125, 44.53923416137695, 45.83649444580078, 47.133758544921875, 48.4310188293457, 49.72827911376953, 51.02553939819336, 52.32279968261719, 53.620059967041016]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 5.0, 4.0, 6.0, 9.0, 11.0, 26.0, 30.0, 27.0, 42.0, 41.0, 53.0, 52.0, 62.0, 60.0, 70.0, 65.0, 67.0, 62.0, 63.0, 53.0, 45.0, 36.0, 35.0, 19.0, 17.0, 15.0, 15.0, 7.0, 6.0, 5.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.672584533691406, -16.075815200805664, -15.479044914245605, -14.882274627685547, -14.285505294799805, -13.688735008239746, -13.091964721679688, -12.495195388793945, -11.898426055908203, -11.301655769348145, -10.704886436462402, -10.108116149902344, -9.511346817016602, -8.914576530456543, -8.317806243896484, -7.721036911010742, -7.124266624450684, -6.527496814727783, -5.930727005004883, -5.333956718444824, -4.737187385559082, -4.140417098999023, -3.543647289276123, -2.9468774795532227, -2.3501076698303223, -1.7533378601074219, -1.156567931175232, -0.559798002243042, 0.0369718074798584, 0.6337416172027588, 1.2305116653442383, 1.8272814750671387, 2.424051284790039, 3.0208210945129395, 3.61759090423584, 4.214361190795898, 4.811130523681641, 5.407900810241699, 6.0046706199646, 6.6014404296875, 7.1982102394104, 7.794980049133301, 8.39175033569336, 8.988519668579102, 9.58528995513916, 10.182059288024902, 10.778829574584961, 11.375598907470703, 11.972369194030762, 12.56913948059082, 13.165908813476562, 13.762679100036621, 14.359448432922363, 14.956218719482422, 15.552988052368164, 16.149757385253906, 16.74652862548828, 17.343297958374023, 17.9400691986084, 18.53683853149414, 19.133607864379883, 19.730377197265625, 20.3271484375, 20.923917770385742, 21.520687103271484]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 2.0, 6.0, 5.0, 23.0, 25.0, 41.0, 52.0, 93.0, 173.0, 262.0, 532.0, 1025.0, 2010.0, 4063.0, 9145.0, 20787.0, 47935.0, 111028.0, 239903.0, 309448.0, 168586.0, 74474.0, 32377.0, 14243.0, 6333.0, 2903.0, 1406.0, 705.0, 426.0, 206.0, 136.0, 76.0, 33.0, 23.0, 24.0, 17.0, 10.0, 6.0, 7.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.681640625, -1.6295166015625, -1.577392578125, -1.5252685546875, -1.47314453125, -1.4210205078125, -1.368896484375, -1.3167724609375, -1.2646484375, -1.2125244140625, -1.160400390625, -1.1082763671875, -1.05615234375, -1.0040283203125, -0.951904296875, -0.8997802734375, -0.84765625, -0.7955322265625, -0.743408203125, -0.6912841796875, -0.63916015625, -0.5870361328125, -0.534912109375, -0.4827880859375, -0.4306640625, -0.3785400390625, -0.326416015625, -0.2742919921875, -0.22216796875, -0.1700439453125, -0.117919921875, -0.0657958984375, -0.013671875, 0.0384521484375, 0.090576171875, 0.1427001953125, 0.19482421875, 0.2469482421875, 0.299072265625, 0.3511962890625, 0.4033203125, 0.4554443359375, 0.507568359375, 0.5596923828125, 0.61181640625, 0.6639404296875, 0.716064453125, 0.7681884765625, 0.8203125, 0.8724365234375, 0.924560546875, 0.9766845703125, 1.02880859375, 1.0809326171875, 1.133056640625, 1.1851806640625, 1.2373046875, 1.2894287109375, 1.341552734375, 1.3936767578125, 1.44580078125, 1.4979248046875, 1.550048828125, 1.6021728515625, 1.654296875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 3.0, 7.0, 6.0, 8.0, 18.0, 27.0, 21.0, 25.0, 28.0, 32.0, 32.0, 35.0, 45.0, 43.0, 39.0, 54.0, 61.0, 53.0, 51.0, 50.0, 46.0, 50.0, 33.0, 36.0, 39.0, 31.0, 22.0, 26.0, 18.0, 14.0, 15.0, 8.0, 6.0, 6.0, 8.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0], "bins": [-1.666015625, -1.6234893798828125, -1.580963134765625, -1.5384368896484375, -1.49591064453125, -1.4533843994140625, -1.410858154296875, -1.3683319091796875, -1.3258056640625, -1.2832794189453125, -1.240753173828125, -1.1982269287109375, -1.15570068359375, -1.1131744384765625, -1.070648193359375, -1.0281219482421875, -0.985595703125, -0.9430694580078125, -0.900543212890625, -0.8580169677734375, -0.81549072265625, -0.7729644775390625, -0.730438232421875, -0.6879119873046875, -0.6453857421875, -0.6028594970703125, -0.560333251953125, -0.5178070068359375, -0.47528076171875, -0.4327545166015625, -0.390228271484375, -0.3477020263671875, -0.30517578125, -0.2626495361328125, -0.220123291015625, -0.1775970458984375, -0.13507080078125, -0.0925445556640625, -0.050018310546875, -0.0074920654296875, 0.0350341796875, 0.0775604248046875, 0.120086669921875, 0.1626129150390625, 0.20513916015625, 0.2476654052734375, 0.290191650390625, 0.3327178955078125, 0.375244140625, 0.4177703857421875, 0.460296630859375, 0.5028228759765625, 0.54534912109375, 0.5878753662109375, 0.630401611328125, 0.6729278564453125, 0.7154541015625, 0.7579803466796875, 0.800506591796875, 0.8430328369140625, 0.88555908203125, 0.9280853271484375, 0.970611572265625, 1.0131378173828125, 1.0556640625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 5.0, 7.0, 5.0, 11.0, 14.0, 20.0, 27.0, 32.0, 66.0, 71.0, 100.0, 137.0, 176.0, 238.0, 357.0, 552.0, 1014.0, 2053.0, 5783.0, 28945.0, 254326.0, 668946.0, 68571.0, 10509.0, 3039.0, 1388.0, 710.0, 418.0, 292.0, 213.0, 147.0, 84.0, 61.0, 54.0, 48.0, 33.0, 21.0, 24.0, 19.0, 18.0, 8.0, 5.0, 5.0, 2.0, 0.0, 2.0, 2.0, 3.0], "bins": [-4.77734375, -4.648956298828125, -4.52056884765625, -4.392181396484375, -4.2637939453125, -4.135406494140625, -4.00701904296875, -3.878631591796875, -3.750244140625, -3.621856689453125, -3.49346923828125, -3.365081787109375, -3.2366943359375, -3.108306884765625, -2.97991943359375, -2.851531982421875, -2.72314453125, -2.594757080078125, -2.46636962890625, -2.337982177734375, -2.2095947265625, -2.081207275390625, -1.95281982421875, -1.824432373046875, -1.696044921875, -1.567657470703125, -1.43927001953125, -1.310882568359375, -1.1824951171875, -1.054107666015625, -0.92572021484375, -0.797332763671875, -0.6689453125, -0.540557861328125, -0.41217041015625, -0.283782958984375, -0.1553955078125, -0.027008056640625, 0.10137939453125, 0.229766845703125, 0.358154296875, 0.486541748046875, 0.61492919921875, 0.743316650390625, 0.8717041015625, 1.000091552734375, 1.12847900390625, 1.256866455078125, 1.38525390625, 1.513641357421875, 1.64202880859375, 1.770416259765625, 1.8988037109375, 2.027191162109375, 2.15557861328125, 2.283966064453125, 2.412353515625, 2.540740966796875, 2.66912841796875, 2.797515869140625, 2.9259033203125, 3.054290771484375, 3.18267822265625, 3.311065673828125, 3.439453125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 5.0, 2.0, 13.0, 8.0, 10.0, 14.0, 20.0, 26.0, 22.0, 37.0, 35.0, 33.0, 39.0, 45.0, 60.0, 44.0, 55.0, 63.0, 59.0, 52.0, 53.0, 47.0, 53.0, 34.0, 41.0, 34.0, 25.0, 22.0, 9.0, 10.0, 10.0, 11.0, 5.0, 6.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0], "bins": [-7.921875, -7.72052001953125, -7.5191650390625, -7.31781005859375, -7.116455078125, -6.91510009765625, -6.7137451171875, -6.51239013671875, -6.31103515625, -6.10968017578125, -5.9083251953125, -5.70697021484375, -5.505615234375, -5.30426025390625, -5.1029052734375, -4.90155029296875, -4.7001953125, -4.49884033203125, -4.2974853515625, -4.09613037109375, -3.894775390625, -3.69342041015625, -3.4920654296875, -3.29071044921875, -3.08935546875, -2.88800048828125, -2.6866455078125, -2.48529052734375, -2.283935546875, -2.08258056640625, -1.8812255859375, -1.67987060546875, -1.478515625, -1.27716064453125, -1.0758056640625, -0.87445068359375, -0.673095703125, -0.47174072265625, -0.2703857421875, -0.06903076171875, 0.13232421875, 0.33367919921875, 0.5350341796875, 0.73638916015625, 0.937744140625, 1.13909912109375, 1.3404541015625, 1.54180908203125, 1.7431640625, 1.94451904296875, 2.1458740234375, 2.34722900390625, 2.548583984375, 2.74993896484375, 2.9512939453125, 3.15264892578125, 3.35400390625, 3.55535888671875, 3.7567138671875, 3.95806884765625, 4.159423828125, 4.36077880859375, 4.5621337890625, 4.76348876953125, 4.96484375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 6.0, 4.0, 7.0, 4.0, 14.0, 18.0, 28.0, 30.0, 56.0, 79.0, 169.0, 335.0, 783.0, 2765.0, 18032.0, 638512.0, 369023.0, 14850.0, 2361.0, 792.0, 304.0, 139.0, 89.0, 44.0, 38.0, 20.0, 11.0, 7.0, 7.0, 6.0, 5.0, 4.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.16015625, -2.092559814453125, -2.02496337890625, -1.957366943359375, -1.8897705078125, -1.822174072265625, -1.75457763671875, -1.686981201171875, -1.619384765625, -1.551788330078125, -1.48419189453125, -1.416595458984375, -1.3489990234375, -1.281402587890625, -1.21380615234375, -1.146209716796875, -1.07861328125, -1.011016845703125, -0.94342041015625, -0.875823974609375, -0.8082275390625, -0.740631103515625, -0.67303466796875, -0.605438232421875, -0.537841796875, -0.470245361328125, -0.40264892578125, -0.335052490234375, -0.2674560546875, -0.199859619140625, -0.13226318359375, -0.064666748046875, 0.0029296875, 0.070526123046875, 0.13812255859375, 0.205718994140625, 0.2733154296875, 0.340911865234375, 0.40850830078125, 0.476104736328125, 0.543701171875, 0.611297607421875, 0.67889404296875, 0.746490478515625, 0.8140869140625, 0.881683349609375, 0.94927978515625, 1.016876220703125, 1.08447265625, 1.152069091796875, 1.21966552734375, 1.287261962890625, 1.3548583984375, 1.422454833984375, 1.49005126953125, 1.557647705078125, 1.625244140625, 1.692840576171875, 1.76043701171875, 1.828033447265625, 1.8956298828125, 1.963226318359375, 2.03082275390625, 2.098419189453125, 2.166015625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 8.0, 3.0, 16.0, 16.0, 37.0, 35.0, 41.0, 73.0, 108.0, 116.0, 159.0, 98.0, 92.0, 55.0, 52.0, 36.0, 15.0, 14.0, 11.0, 9.0, 0.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000438690185546875, -0.00042686983942985535, -0.0004150494933128357, -0.00040322914719581604, -0.0003914088010787964, -0.00037958845496177673, -0.0003677681088447571, -0.0003559477627277374, -0.0003441274166107178, -0.0003323070704936981, -0.00032048672437667847, -0.0003086663782596588, -0.00029684603214263916, -0.0002850256860256195, -0.00027320533990859985, -0.0002613849937915802, -0.00024956464767456055, -0.0002377443015575409, -0.00022592395544052124, -0.0002141036093235016, -0.00020228326320648193, -0.00019046291708946228, -0.00017864257097244263, -0.00016682222485542297, -0.00015500187873840332, -0.00014318153262138367, -0.00013136118650436401, -0.00011954084038734436, -0.00010772049427032471, -9.590014815330505e-05, -8.40798020362854e-05, -7.225945591926575e-05, -6.0439109802246094e-05, -4.861876368522644e-05, -3.679841756820679e-05, -2.4978071451187134e-05, -1.315772533416748e-05, -1.3373792171478271e-06, 1.0482966899871826e-05, 2.230331301689148e-05, 3.412365913391113e-05, 4.5944005250930786e-05, 5.776435136795044e-05, 6.958469748497009e-05, 8.140504360198975e-05, 9.32253897190094e-05, 0.00010504573583602905, 0.0001168660819530487, 0.00012868642807006836, 0.000140506774187088, 0.00015232712030410767, 0.00016414746642112732, 0.00017596781253814697, 0.00018778815865516663, 0.00019960850477218628, 0.00021142885088920593, 0.00022324919700622559, 0.00023506954312324524, 0.0002468898892402649, 0.00025871023535728455, 0.0002705305814743042, 0.00028235092759132385, 0.0002941712737083435, 0.00030599161982536316, 0.0003178119659423828]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 3.0, 4.0, 5.0, 10.0, 8.0, 11.0, 27.0, 34.0, 79.0, 112.0, 274.0, 483.0, 1180.0, 4154.0, 28770.0, 837520.0, 162412.0, 9843.0, 2100.0, 751.0, 337.0, 176.0, 87.0, 61.0, 38.0, 18.0, 17.0, 16.0, 8.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.087890625, -2.02215576171875, -1.9564208984375, -1.89068603515625, -1.824951171875, -1.75921630859375, -1.6934814453125, -1.62774658203125, -1.56201171875, -1.49627685546875, -1.4305419921875, -1.36480712890625, -1.299072265625, -1.23333740234375, -1.1676025390625, -1.10186767578125, -1.0361328125, -0.97039794921875, -0.9046630859375, -0.83892822265625, -0.773193359375, -0.70745849609375, -0.6417236328125, -0.57598876953125, -0.51025390625, -0.44451904296875, -0.3787841796875, -0.31304931640625, -0.247314453125, -0.18157958984375, -0.1158447265625, -0.05010986328125, 0.015625, 0.08135986328125, 0.1470947265625, 0.21282958984375, 0.278564453125, 0.34429931640625, 0.4100341796875, 0.47576904296875, 0.54150390625, 0.60723876953125, 0.6729736328125, 0.73870849609375, 0.804443359375, 0.87017822265625, 0.9359130859375, 1.00164794921875, 1.0673828125, 1.13311767578125, 1.1988525390625, 1.26458740234375, 1.330322265625, 1.39605712890625, 1.4617919921875, 1.52752685546875, 1.59326171875, 1.65899658203125, 1.7247314453125, 1.79046630859375, 1.856201171875, 1.92193603515625, 1.9876708984375, 2.05340576171875, 2.119140625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 9.0, 6.0, 8.0, 9.0, 11.0, 7.0, 13.0, 22.0, 22.0, 29.0, 26.0, 40.0, 42.0, 59.0, 66.0, 74.0, 72.0, 82.0, 76.0, 65.0, 60.0, 45.0, 38.0, 24.0, 21.0, 17.0, 11.0, 13.0, 3.0, 8.0, 9.0, 7.0, 3.0, 1.0, 5.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.90576171875, -0.8703231811523438, -0.8348846435546875, -0.7994461059570312, -0.764007568359375, -0.7285690307617188, -0.6931304931640625, -0.6576919555664062, -0.62225341796875, -0.5868148803710938, -0.5513763427734375, -0.5159378051757812, -0.480499267578125, -0.44506072998046875, -0.4096221923828125, -0.37418365478515625, -0.3387451171875, -0.30330657958984375, -0.2678680419921875, -0.23242950439453125, -0.196990966796875, -0.16155242919921875, -0.1261138916015625, -0.09067535400390625, -0.05523681640625, -0.01979827880859375, 0.0156402587890625, 0.05107879638671875, 0.086517333984375, 0.12195587158203125, 0.1573944091796875, 0.19283294677734375, 0.228271484375, 0.26371002197265625, 0.2991485595703125, 0.33458709716796875, 0.370025634765625, 0.40546417236328125, 0.4409027099609375, 0.47634124755859375, 0.51177978515625, 0.5472183227539062, 0.5826568603515625, 0.6180953979492188, 0.653533935546875, 0.6889724731445312, 0.7244110107421875, 0.7598495483398438, 0.7952880859375, 0.8307266235351562, 0.8661651611328125, 0.9016036987304688, 0.937042236328125, 0.9724807739257812, 1.0079193115234375, 1.0433578491210938, 1.07879638671875, 1.1142349243164062, 1.1496734619140625, 1.1851119995117188, 1.220550537109375, 1.2559890747070312, 1.2914276123046875, 1.3268661499023438, 1.3623046875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 12.0, 21.0, 49.0, 116.0, 239.0, 263.0, 149.0, 68.0, 39.0, 20.0, 8.0, 4.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.169200897216797, -21.063152313232422, -19.957103729248047, -18.851055145263672, -17.745006561279297, -16.638957977294922, -15.532910346984863, -14.426861763000488, -13.320813179016113, -12.214764595031738, -11.108716011047363, -10.002668380737305, -8.89661979675293, -7.7905707359313965, -6.68452262878418, -5.578474044799805, -4.47242546081543, -3.3663768768310547, -2.260328531265259, -1.154280185699463, -0.04823160171508789, 1.057816982269287, 2.163865089416504, 3.269913673400879, 4.375962257385254, 5.482010841369629, 6.588059425354004, 7.694107532501221, 8.800155639648438, 9.906204223632812, 11.012252807617188, 12.118301391601562, 13.224349975585938, 14.330398559570312, 15.436447143554688, 16.542495727539062, 17.648544311523438, 18.754592895507812, 19.860641479492188, 20.966690063476562, 22.072738647460938, 23.178787231445312, 24.284835815429688, 25.390884399414062, 26.496932983398438, 27.602981567382812, 28.709030151367188, 29.815078735351562, 30.921125411987305, 32.02717208862305, 33.13322067260742, 34.2392692565918, 35.34531784057617, 36.45136642456055, 37.55741500854492, 38.6634635925293, 39.76951217651367, 40.87556076049805, 41.98160934448242, 43.0876579284668, 44.19370651245117, 45.29975509643555, 46.40580368041992, 47.5118522644043, 48.61790084838867]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 6.0, 2.0, 1.0, 5.0, 5.0, 8.0, 11.0, 9.0, 10.0, 11.0, 13.0, 20.0, 18.0, 26.0, 29.0, 36.0, 47.0, 40.0, 46.0, 57.0, 74.0, 80.0, 75.0, 57.0, 40.0, 36.0, 30.0, 27.0, 34.0, 25.0, 23.0, 18.0, 19.0, 18.0, 8.0, 9.0, 10.0, 4.0, 5.0, 8.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-20.92884635925293, -20.237842559814453, -19.54684066772461, -18.855836868286133, -18.164833068847656, -17.47382926940918, -16.782825469970703, -16.09182357788086, -15.400819778442383, -14.709815979003906, -14.018813133239746, -13.327810287475586, -12.63680648803711, -11.945802688598633, -11.254799842834473, -10.563796997070312, -9.872793197631836, -9.18178939819336, -8.4907865524292, -7.799783229827881, -7.1087799072265625, -6.417776584625244, -5.726773262023926, -5.035769939422607, -4.344766616821289, -3.6537632942199707, -2.9627599716186523, -2.271756649017334, -1.5807533264160156, -0.8897500038146973, -0.1987466812133789, 0.49225664138793945, 1.183258056640625, 1.8742613792419434, 2.5652647018432617, 3.25626802444458, 3.9472713470458984, 4.638274669647217, 5.329277992248535, 6.0202813148498535, 6.711284637451172, 7.40228796005249, 8.093291282653809, 8.784294128417969, 9.475297927856445, 10.166301727294922, 10.857304573059082, 11.548307418823242, 12.239311218261719, 12.930315017700195, 13.621317863464355, 14.312320709228516, 15.003324508666992, 15.694328308105469, 16.385330200195312, 17.07633399963379, 17.767337799072266, 18.458341598510742, 19.14934539794922, 19.840347290039062, 20.53135108947754, 21.222354888916016, 21.91335678100586, 22.604360580444336, 23.295364379882812]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 7.0, 6.0, 9.0, 11.0, 15.0, 19.0, 47.0, 56.0, 125.0, 259.0, 695.0, 2294.0, 11517.0, 211375.0, 3724057.0, 227525.0, 12647.0, 2433.0, 717.0, 240.0, 106.0, 57.0, 23.0, 21.0, 14.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-4.6015625, -4.493316650390625, -4.38507080078125, -4.276824951171875, -4.1685791015625, -4.060333251953125, -3.95208740234375, -3.843841552734375, -3.735595703125, -3.627349853515625, -3.51910400390625, -3.410858154296875, -3.3026123046875, -3.194366455078125, -3.08612060546875, -2.977874755859375, -2.86962890625, -2.761383056640625, -2.65313720703125, -2.544891357421875, -2.4366455078125, -2.328399658203125, -2.22015380859375, -2.111907958984375, -2.003662109375, -1.895416259765625, -1.78717041015625, -1.678924560546875, -1.5706787109375, -1.462432861328125, -1.35418701171875, -1.245941162109375, -1.1376953125, -1.029449462890625, -0.92120361328125, -0.812957763671875, -0.7047119140625, -0.596466064453125, -0.48822021484375, -0.379974365234375, -0.271728515625, -0.163482666015625, -0.05523681640625, 0.053009033203125, 0.1612548828125, 0.269500732421875, 0.37774658203125, 0.485992431640625, 0.59423828125, 0.702484130859375, 0.81072998046875, 0.918975830078125, 1.0272216796875, 1.135467529296875, 1.24371337890625, 1.351959228515625, 1.460205078125, 1.568450927734375, 1.67669677734375, 1.784942626953125, 1.8931884765625, 2.001434326171875, 2.10968017578125, 2.217926025390625, 2.326171875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 7.0, 5.0, 6.0, 7.0, 6.0, 8.0, 14.0, 13.0, 15.0, 18.0, 12.0, 37.0, 29.0, 33.0, 31.0, 38.0, 39.0, 32.0, 44.0, 38.0, 54.0, 62.0, 36.0, 40.0, 43.0, 40.0, 36.0, 45.0, 28.0, 24.0, 24.0, 19.0, 26.0, 16.0, 16.0, 19.0, 8.0, 13.0, 9.0, 3.0, 2.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.2109375, -1.1745758056640625, -1.138214111328125, -1.1018524169921875, -1.06549072265625, -1.0291290283203125, -0.992767333984375, -0.9564056396484375, -0.9200439453125, -0.8836822509765625, -0.847320556640625, -0.8109588623046875, -0.77459716796875, -0.7382354736328125, -0.701873779296875, -0.6655120849609375, -0.629150390625, -0.5927886962890625, -0.556427001953125, -0.5200653076171875, -0.48370361328125, -0.4473419189453125, -0.410980224609375, -0.3746185302734375, -0.3382568359375, -0.3018951416015625, -0.265533447265625, -0.2291717529296875, -0.19281005859375, -0.1564483642578125, -0.120086669921875, -0.0837249755859375, -0.04736328125, -0.0110015869140625, 0.025360107421875, 0.0617218017578125, 0.09808349609375, 0.1344451904296875, 0.170806884765625, 0.2071685791015625, 0.2435302734375, 0.2798919677734375, 0.316253662109375, 0.3526153564453125, 0.38897705078125, 0.4253387451171875, 0.461700439453125, 0.4980621337890625, 0.534423828125, 0.5707855224609375, 0.607147216796875, 0.6435089111328125, 0.67987060546875, 0.7162322998046875, 0.752593994140625, 0.7889556884765625, 0.8253173828125, 0.8616790771484375, 0.898040771484375, 0.9344024658203125, 0.97076416015625, 1.0071258544921875, 1.043487548828125, 1.0798492431640625, 1.1162109375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 9.0, 6.0, 6.0, 11.0, 10.0, 18.0, 24.0, 23.0, 38.0, 64.0, 113.0, 160.0, 276.0, 560.0, 1019.0, 2077.0, 5450.0, 16228.0, 65698.0, 559439.0, 3245794.0, 238806.0, 40297.0, 10974.0, 3941.0, 1568.0, 768.0, 377.0, 190.0, 109.0, 72.0, 48.0, 33.0, 19.0, 18.0, 17.0, 5.0, 9.0, 4.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 3.0, 2.0], "bins": [-2.482421875, -2.41595458984375, -2.3494873046875, -2.28302001953125, -2.216552734375, -2.15008544921875, -2.0836181640625, -2.01715087890625, -1.95068359375, -1.88421630859375, -1.8177490234375, -1.75128173828125, -1.684814453125, -1.61834716796875, -1.5518798828125, -1.48541259765625, -1.4189453125, -1.35247802734375, -1.2860107421875, -1.21954345703125, -1.153076171875, -1.08660888671875, -1.0201416015625, -0.95367431640625, -0.88720703125, -0.82073974609375, -0.7542724609375, -0.68780517578125, -0.621337890625, -0.55487060546875, -0.4884033203125, -0.42193603515625, -0.35546875, -0.28900146484375, -0.2225341796875, -0.15606689453125, -0.089599609375, -0.02313232421875, 0.0433349609375, 0.10980224609375, 0.17626953125, 0.24273681640625, 0.3092041015625, 0.37567138671875, 0.442138671875, 0.50860595703125, 0.5750732421875, 0.64154052734375, 0.7080078125, 0.77447509765625, 0.8409423828125, 0.90740966796875, 0.973876953125, 1.04034423828125, 1.1068115234375, 1.17327880859375, 1.23974609375, 1.30621337890625, 1.3726806640625, 1.43914794921875, 1.505615234375, 1.57208251953125, 1.6385498046875, 1.70501708984375, 1.771484375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 3.0, 3.0, 7.0, 10.0, 11.0, 10.0, 17.0, 24.0, 31.0, 51.0, 70.0, 88.0, 154.0, 317.0, 624.0, 862.0, 768.0, 427.0, 203.0, 117.0, 85.0, 49.0, 43.0, 21.0, 20.0, 14.0, 10.0, 4.0, 8.0, 2.0, 5.0, 3.0, 4.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-3.24609375, -3.157806396484375, -3.06951904296875, -2.981231689453125, -2.8929443359375, -2.804656982421875, -2.71636962890625, -2.628082275390625, -2.539794921875, -2.451507568359375, -2.36322021484375, -2.274932861328125, -2.1866455078125, -2.098358154296875, -2.01007080078125, -1.921783447265625, -1.83349609375, -1.745208740234375, -1.65692138671875, -1.568634033203125, -1.4803466796875, -1.392059326171875, -1.30377197265625, -1.215484619140625, -1.127197265625, -1.038909912109375, -0.95062255859375, -0.862335205078125, -0.7740478515625, -0.685760498046875, -0.59747314453125, -0.509185791015625, -0.4208984375, -0.332611083984375, -0.24432373046875, -0.156036376953125, -0.0677490234375, 0.020538330078125, 0.10882568359375, 0.197113037109375, 0.285400390625, 0.373687744140625, 0.46197509765625, 0.550262451171875, 0.6385498046875, 0.726837158203125, 0.81512451171875, 0.903411865234375, 0.99169921875, 1.079986572265625, 1.16827392578125, 1.256561279296875, 1.3448486328125, 1.433135986328125, 1.52142333984375, 1.609710693359375, 1.697998046875, 1.786285400390625, 1.87457275390625, 1.962860107421875, 2.0511474609375, 2.139434814453125, 2.22772216796875, 2.316009521484375, 2.404296875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 21.0, 49.0, 203.0, 394.0, 229.0, 67.0, 14.0, 9.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-73.00104522705078, -71.52763366699219, -70.05421447753906, -68.58080291748047, -67.10739135742188, -65.63397979736328, -64.16056823730469, -62.68714904785156, -61.21373748779297, -59.740325927734375, -58.266910552978516, -56.793495178222656, -55.32008361816406, -53.84667205810547, -52.37325668334961, -50.89984130859375, -49.426429748535156, -47.95301818847656, -46.4796028137207, -45.006187438964844, -43.53277587890625, -42.059364318847656, -40.5859489440918, -39.11253356933594, -37.639122009277344, -36.16571044921875, -34.69229507446289, -33.21887969970703, -31.745468139648438, -30.27205467224121, -28.798641204833984, -27.325227737426758, -25.851810455322266, -24.37839698791504, -22.904983520507812, -21.431570053100586, -19.95815658569336, -18.484743118286133, -17.011329650878906, -15.53791618347168, -14.064502716064453, -12.591089248657227, -11.11767578125, -9.644262313842773, -8.170848846435547, -6.69743537902832, -5.224021911621094, -3.750608444213867, -2.2771949768066406, -0.8037815093994141, 0.6696319580078125, 2.143045425415039, 3.6164588928222656, 5.089872360229492, 6.563285827636719, 8.036699295043945, 9.510112762451172, 10.983526229858398, 12.456939697265625, 13.930353164672852, 15.403766632080078, 16.877180099487305, 18.35059356689453, 19.824007034301758, 21.297420501708984]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 5.0, 5.0, 11.0, 8.0, 15.0, 26.0, 21.0, 23.0, 34.0, 30.0, 32.0, 41.0, 40.0, 54.0, 52.0, 46.0, 70.0, 55.0, 70.0, 54.0, 45.0, 56.0, 32.0, 43.0, 37.0, 19.0, 15.0, 12.0, 13.0, 10.0, 2.0, 6.0, 5.0, 6.0, 7.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.72243309020996, -16.26786231994629, -15.813292503356934, -15.358721733093262, -14.904151916503906, -14.449581146240234, -13.995010375976562, -13.54043960571289, -13.085869789123535, -12.631299018859863, -12.176729202270508, -11.722158432006836, -11.267587661743164, -10.813017845153809, -10.358447074890137, -9.903877258300781, -9.44930648803711, -8.994735717773438, -8.540165901184082, -8.08559513092041, -7.6310248374938965, -7.176454544067383, -6.721883773803711, -6.267313480377197, -5.812743186950684, -5.35817289352417, -4.903602600097656, -4.449031829833984, -3.9944615364074707, -3.539891242980957, -3.0853207111358643, -2.6307501792907715, -2.176180839538574, -1.721610426902771, -1.2670400142669678, -0.8124696016311646, -0.35789918899536133, 0.09667110443115234, 0.5512416362762451, 1.005812168121338, 1.4603824615478516, 1.9149528741836548, 2.369523286819458, 2.824093818664551, 3.2786641120910645, 3.733234405517578, 4.18780517578125, 4.642375469207764, 5.096945762634277, 5.551516056060791, 6.006086349487305, 6.460657119750977, 6.91522741317749, 7.369797706604004, 7.824368476867676, 8.278938293457031, 8.733509063720703, 9.188079833984375, 9.64264965057373, 10.097220420837402, 10.551790237426758, 11.00636100769043, 11.460931777954102, 11.915502548217773, 12.370072364807129]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 5.0, 14.0, 15.0, 10.0, 23.0, 29.0, 55.0, 104.0, 138.0, 227.0, 408.0, 704.0, 1156.0, 2243.0, 4302.0, 8101.0, 16099.0, 32362.0, 67581.0, 143015.0, 286828.0, 252101.0, 119365.0, 57044.0, 27868.0, 13706.0, 6962.0, 3582.0, 1912.0, 1078.0, 615.0, 354.0, 211.0, 127.0, 75.0, 51.0, 32.0, 20.0, 10.0, 6.0, 3.0, 5.0, 6.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.736328125, -1.686553955078125, -1.63677978515625, -1.587005615234375, -1.5372314453125, -1.487457275390625, -1.43768310546875, -1.387908935546875, -1.338134765625, -1.288360595703125, -1.23858642578125, -1.188812255859375, -1.1390380859375, -1.089263916015625, -1.03948974609375, -0.989715576171875, -0.93994140625, -0.890167236328125, -0.84039306640625, -0.790618896484375, -0.7408447265625, -0.691070556640625, -0.64129638671875, -0.591522216796875, -0.541748046875, -0.491973876953125, -0.44219970703125, -0.392425537109375, -0.3426513671875, -0.292877197265625, -0.24310302734375, -0.193328857421875, -0.1435546875, -0.093780517578125, -0.04400634765625, 0.005767822265625, 0.0555419921875, 0.105316162109375, 0.15509033203125, 0.204864501953125, 0.254638671875, 0.304412841796875, 0.35418701171875, 0.403961181640625, 0.4537353515625, 0.503509521484375, 0.55328369140625, 0.603057861328125, 0.65283203125, 0.702606201171875, 0.75238037109375, 0.802154541015625, 0.8519287109375, 0.901702880859375, 0.95147705078125, 1.001251220703125, 1.051025390625, 1.100799560546875, 1.15057373046875, 1.200347900390625, 1.2501220703125, 1.299896240234375, 1.34967041015625, 1.399444580078125, 1.44921875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 5.0, 4.0, 7.0, 2.0, 3.0, 8.0, 7.0, 8.0, 13.0, 13.0, 19.0, 14.0, 21.0, 20.0, 22.0, 23.0, 35.0, 38.0, 36.0, 31.0, 39.0, 48.0, 42.0, 36.0, 35.0, 51.0, 37.0, 48.0, 47.0, 34.0, 39.0, 39.0, 26.0, 24.0, 15.0, 21.0, 14.0, 14.0, 21.0, 9.0, 5.0, 10.0, 5.0, 6.0, 7.0, 3.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0], "bins": [-1.23046875, -1.1962966918945312, -1.1621246337890625, -1.1279525756835938, -1.093780517578125, -1.0596084594726562, -1.0254364013671875, -0.9912643432617188, -0.95709228515625, -0.9229202270507812, -0.8887481689453125, -0.8545761108398438, -0.820404052734375, -0.7862319946289062, -0.7520599365234375, -0.7178878784179688, -0.6837158203125, -0.6495437622070312, -0.6153717041015625, -0.5811996459960938, -0.547027587890625, -0.5128555297851562, -0.4786834716796875, -0.44451141357421875, -0.41033935546875, -0.37616729736328125, -0.3419952392578125, -0.30782318115234375, -0.273651123046875, -0.23947906494140625, -0.2053070068359375, -0.17113494873046875, -0.136962890625, -0.10279083251953125, -0.0686187744140625, -0.03444671630859375, -0.000274658203125, 0.03389739990234375, 0.0680694580078125, 0.10224151611328125, 0.13641357421875, 0.17058563232421875, 0.2047576904296875, 0.23892974853515625, 0.273101806640625, 0.30727386474609375, 0.3414459228515625, 0.37561798095703125, 0.4097900390625, 0.44396209716796875, 0.4781341552734375, 0.5123062133789062, 0.546478271484375, 0.5806503295898438, 0.6148223876953125, 0.6489944458007812, 0.68316650390625, 0.7173385620117188, 0.7515106201171875, 0.7856826782226562, 0.819854736328125, 0.8540267944335938, 0.8881988525390625, 0.9223709106445312, 0.95654296875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 4.0, 6.0, 2.0, 9.0, 8.0, 13.0, 15.0, 22.0, 23.0, 47.0, 47.0, 64.0, 101.0, 139.0, 165.0, 305.0, 382.0, 619.0, 1142.0, 2361.0, 6779.0, 27554.0, 169590.0, 697183.0, 112110.0, 19617.0, 5234.0, 2021.0, 1078.0, 591.0, 352.0, 285.0, 189.0, 125.0, 98.0, 54.0, 62.0, 41.0, 45.0, 17.0, 20.0, 11.0, 11.0, 4.0, 4.0, 3.0, 5.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.4921875, -3.380950927734375, -3.26971435546875, -3.158477783203125, -3.0472412109375, -2.936004638671875, -2.82476806640625, -2.713531494140625, -2.602294921875, -2.491058349609375, -2.37982177734375, -2.268585205078125, -2.1573486328125, -2.046112060546875, -1.93487548828125, -1.823638916015625, -1.71240234375, -1.601165771484375, -1.48992919921875, -1.378692626953125, -1.2674560546875, -1.156219482421875, -1.04498291015625, -0.933746337890625, -0.822509765625, -0.711273193359375, -0.60003662109375, -0.488800048828125, -0.3775634765625, -0.266326904296875, -0.15509033203125, -0.043853759765625, 0.0673828125, 0.178619384765625, 0.28985595703125, 0.401092529296875, 0.5123291015625, 0.623565673828125, 0.73480224609375, 0.846038818359375, 0.957275390625, 1.068511962890625, 1.17974853515625, 1.290985107421875, 1.4022216796875, 1.513458251953125, 1.62469482421875, 1.735931396484375, 1.84716796875, 1.958404541015625, 2.06964111328125, 2.180877685546875, 2.2921142578125, 2.403350830078125, 2.51458740234375, 2.625823974609375, 2.737060546875, 2.848297119140625, 2.95953369140625, 3.070770263671875, 3.1820068359375, 3.293243408203125, 3.40447998046875, 3.515716552734375, 3.626953125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 3.0, 1.0, 1.0, 8.0, 6.0, 6.0, 11.0, 9.0, 6.0, 17.0, 28.0, 16.0, 28.0, 34.0, 31.0, 35.0, 39.0, 35.0, 56.0, 58.0, 65.0, 44.0, 49.0, 48.0, 50.0, 33.0, 37.0, 53.0, 34.0, 23.0, 24.0, 21.0, 19.0, 19.0, 7.0, 12.0, 8.0, 7.0, 5.0, 5.0, 5.0, 3.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.37890625, -4.2374267578125, -4.095947265625, -3.9544677734375, -3.81298828125, -3.6715087890625, -3.530029296875, -3.3885498046875, -3.2470703125, -3.1055908203125, -2.964111328125, -2.8226318359375, -2.68115234375, -2.5396728515625, -2.398193359375, -2.2567138671875, -2.115234375, -1.9737548828125, -1.832275390625, -1.6907958984375, -1.54931640625, -1.4078369140625, -1.266357421875, -1.1248779296875, -0.9833984375, -0.8419189453125, -0.700439453125, -0.5589599609375, -0.41748046875, -0.2760009765625, -0.134521484375, 0.0069580078125, 0.1484375, 0.2899169921875, 0.431396484375, 0.5728759765625, 0.71435546875, 0.8558349609375, 0.997314453125, 1.1387939453125, 1.2802734375, 1.4217529296875, 1.563232421875, 1.7047119140625, 1.84619140625, 1.9876708984375, 2.129150390625, 2.2706298828125, 2.412109375, 2.5535888671875, 2.695068359375, 2.8365478515625, 2.97802734375, 3.1195068359375, 3.260986328125, 3.4024658203125, 3.5439453125, 3.6854248046875, 3.826904296875, 3.9683837890625, 4.10986328125, 4.2513427734375, 4.392822265625, 4.5343017578125, 4.67578125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 8.0, 4.0, 13.0, 17.0, 30.0, 41.0, 84.0, 161.0, 369.0, 940.0, 3336.0, 20067.0, 264097.0, 709587.0, 41962.0, 5580.0, 1387.0, 436.0, 177.0, 108.0, 41.0, 32.0, 19.0, 17.0, 11.0, 3.0, 2.0, 4.0, 4.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.7216796875, -1.6727142333984375, -1.623748779296875, -1.5747833251953125, -1.52581787109375, -1.4768524169921875, -1.427886962890625, -1.3789215087890625, -1.3299560546875, -1.2809906005859375, -1.232025146484375, -1.1830596923828125, -1.13409423828125, -1.0851287841796875, -1.036163330078125, -0.9871978759765625, -0.938232421875, -0.8892669677734375, -0.840301513671875, -0.7913360595703125, -0.74237060546875, -0.6934051513671875, -0.644439697265625, -0.5954742431640625, -0.5465087890625, -0.4975433349609375, -0.448577880859375, -0.3996124267578125, -0.35064697265625, -0.3016815185546875, -0.252716064453125, -0.2037506103515625, -0.15478515625, -0.1058197021484375, -0.056854248046875, -0.0078887939453125, 0.04107666015625, 0.0900421142578125, 0.139007568359375, 0.1879730224609375, 0.2369384765625, 0.2859039306640625, 0.334869384765625, 0.3838348388671875, 0.43280029296875, 0.4817657470703125, 0.530731201171875, 0.5796966552734375, 0.628662109375, 0.6776275634765625, 0.726593017578125, 0.7755584716796875, 0.82452392578125, 0.8734893798828125, 0.922454833984375, 0.9714202880859375, 1.0203857421875, 1.0693511962890625, 1.118316650390625, 1.1672821044921875, 1.21624755859375, 1.2652130126953125, 1.314178466796875, 1.3631439208984375, 1.412109375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 7.0, 9.0, 6.0, 14.0, 7.0, 21.0, 22.0, 38.0, 52.0, 81.0, 124.0, 143.0, 135.0, 113.0, 74.0, 47.0, 39.0, 33.0, 17.0, 10.0, 7.0, 0.0, 0.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002570152282714844, -0.0002446472644805908, -0.00023227930068969727, -0.0002199113368988037, -0.00020754337310791016, -0.0001951754093170166, -0.00018280744552612305, -0.0001704394817352295, -0.00015807151794433594, -0.00014570355415344238, -0.00013333559036254883, -0.00012096762657165527, -0.00010859966278076172, -9.623169898986816e-05, -8.386373519897461e-05, -7.149577140808105e-05, -5.91278076171875e-05, -4.6759843826293945e-05, -3.439188003540039e-05, -2.2023916244506836e-05, -9.655952453613281e-06, 2.7120113372802734e-06, 1.5079975128173828e-05, 2.7447938919067383e-05, 3.981590270996094e-05, 5.218386650085449e-05, 6.455183029174805e-05, 7.69197940826416e-05, 8.928775787353516e-05, 0.00010165572166442871, 0.00011402368545532227, 0.00012639164924621582, 0.00013875961303710938, 0.00015112757682800293, 0.00016349554061889648, 0.00017586350440979004, 0.0001882314682006836, 0.00020059943199157715, 0.0002129673957824707, 0.00022533535957336426, 0.0002377033233642578, 0.00025007128715515137, 0.0002624392509460449, 0.0002748072147369385, 0.00028717517852783203, 0.0002995431423187256, 0.00031191110610961914, 0.0003242790699005127, 0.00033664703369140625, 0.0003490149974822998, 0.00036138296127319336, 0.0003737509250640869, 0.00038611888885498047, 0.000398486852645874, 0.0004108548164367676, 0.00042322278022766113, 0.0004355907440185547, 0.00044795870780944824, 0.0004603266716003418, 0.00047269463539123535, 0.0004850625991821289, 0.0004974305629730225, 0.000509798526763916, 0.0005221664905548096, 0.0005345344543457031]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 4.0, 9.0, 8.0, 11.0, 23.0, 20.0, 44.0, 52.0, 90.0, 170.0, 295.0, 507.0, 1090.0, 2854.0, 11222.0, 85504.0, 758394.0, 163869.0, 17763.0, 3914.0, 1399.0, 568.0, 301.0, 150.0, 96.0, 57.0, 42.0, 33.0, 18.0, 14.0, 9.0, 6.0, 5.0, 7.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.103515625, -1.064971923828125, -1.02642822265625, -0.987884521484375, -0.9493408203125, -0.910797119140625, -0.87225341796875, -0.833709716796875, -0.795166015625, -0.756622314453125, -0.71807861328125, -0.679534912109375, -0.6409912109375, -0.602447509765625, -0.56390380859375, -0.525360107421875, -0.48681640625, -0.448272705078125, -0.40972900390625, -0.371185302734375, -0.3326416015625, -0.294097900390625, -0.25555419921875, -0.217010498046875, -0.178466796875, -0.139923095703125, -0.10137939453125, -0.062835693359375, -0.0242919921875, 0.014251708984375, 0.05279541015625, 0.091339111328125, 0.1298828125, 0.168426513671875, 0.20697021484375, 0.245513916015625, 0.2840576171875, 0.322601318359375, 0.36114501953125, 0.399688720703125, 0.438232421875, 0.476776123046875, 0.51531982421875, 0.553863525390625, 0.5924072265625, 0.630950927734375, 0.66949462890625, 0.708038330078125, 0.74658203125, 0.785125732421875, 0.82366943359375, 0.862213134765625, 0.9007568359375, 0.939300537109375, 0.97784423828125, 1.016387939453125, 1.054931640625, 1.093475341796875, 1.13201904296875, 1.170562744140625, 1.2091064453125, 1.247650146484375, 1.28619384765625, 1.324737548828125, 1.36328125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 6.0, 1.0, 5.0, 6.0, 3.0, 3.0, 8.0, 14.0, 16.0, 25.0, 27.0, 22.0, 36.0, 52.0, 50.0, 63.0, 69.0, 91.0, 75.0, 72.0, 70.0, 57.0, 63.0, 39.0, 26.0, 33.0, 17.0, 14.0, 12.0, 9.0, 10.0, 5.0, 1.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.08203125, -1.0498504638671875, -1.017669677734375, -0.9854888916015625, -0.95330810546875, -0.9211273193359375, -0.888946533203125, -0.8567657470703125, -0.8245849609375, -0.7924041748046875, -0.760223388671875, -0.7280426025390625, -0.69586181640625, -0.6636810302734375, -0.631500244140625, -0.5993194580078125, -0.567138671875, -0.5349578857421875, -0.502777099609375, -0.4705963134765625, -0.43841552734375, -0.4062347412109375, -0.374053955078125, -0.3418731689453125, -0.3096923828125, -0.2775115966796875, -0.245330810546875, -0.2131500244140625, -0.18096923828125, -0.1487884521484375, -0.116607666015625, -0.0844268798828125, -0.05224609375, -0.0200653076171875, 0.012115478515625, 0.0442962646484375, 0.07647705078125, 0.1086578369140625, 0.140838623046875, 0.1730194091796875, 0.2052001953125, 0.2373809814453125, 0.269561767578125, 0.3017425537109375, 0.33392333984375, 0.3661041259765625, 0.398284912109375, 0.4304656982421875, 0.462646484375, 0.4948272705078125, 0.527008056640625, 0.5591888427734375, 0.59136962890625, 0.6235504150390625, 0.655731201171875, 0.6879119873046875, 0.7200927734375, 0.7522735595703125, 0.784454345703125, 0.8166351318359375, 0.84881591796875, 0.8809967041015625, 0.913177490234375, 0.9453582763671875, 0.9775390625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 13.0, 4.0, 18.0, 75.0, 157.0, 368.0, 188.0, 100.0, 38.0, 16.0, 14.0, 5.0, 2.0, 3.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-36.955230712890625, -35.78152084350586, -34.607810974121094, -33.434104919433594, -32.26039505004883, -31.086685180664062, -29.91297721862793, -28.739269256591797, -27.56555938720703, -26.391849517822266, -25.218141555786133, -24.04443359375, -22.870723724365234, -21.69701385498047, -20.523305892944336, -19.349597930908203, -18.175888061523438, -17.002178192138672, -15.828470230102539, -14.65476131439209, -13.48105239868164, -12.307343482971191, -11.133634567260742, -9.959925651550293, -8.786216735839844, -7.6125078201293945, -6.438798904418945, -5.265089988708496, -4.091381072998047, -2.9176721572875977, -1.7439632415771484, -0.5702543258666992, 0.6034584045410156, 1.7771673202514648, 2.950876235961914, 4.124585151672363, 5.2982940673828125, 6.472002983093262, 7.645711898803711, 8.81942081451416, 9.99312973022461, 11.166838645935059, 12.340547561645508, 13.514256477355957, 14.687965393066406, 15.861674308776855, 17.035383224487305, 18.209091186523438, 19.382801055908203, 20.55651092529297, 21.7302188873291, 22.903926849365234, 24.07763671875, 25.251346588134766, 26.4250545501709, 27.59876251220703, 28.772472381591797, 29.946182250976562, 31.119890213012695, 32.29359817504883, 33.467308044433594, 34.64101791381836, 35.814727783203125, 36.988433837890625, 38.16214370727539]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 6.0, 1.0, 2.0, 3.0, 6.0, 4.0, 6.0, 4.0, 9.0, 15.0, 14.0, 16.0, 14.0, 15.0, 18.0, 22.0, 21.0, 21.0, 34.0, 31.0, 28.0, 31.0, 45.0, 52.0, 73.0, 63.0, 72.0, 52.0, 29.0, 35.0, 31.0, 18.0, 33.0, 23.0, 26.0, 26.0, 15.0, 17.0, 14.0, 11.0, 10.0, 10.0, 7.0, 6.0, 5.0, 4.0, 4.0, 2.0, 5.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-16.901779174804688, -16.37803077697754, -15.85428237915039, -15.330534934997559, -14.80678653717041, -14.283038139343262, -13.75929069519043, -13.235542297363281, -12.711793899536133, -12.188045501708984, -11.664297103881836, -11.140549659729004, -10.616801261901855, -10.093052864074707, -9.569305419921875, -9.045557022094727, -8.521808624267578, -7.99806022644043, -7.4743123054504395, -6.950564384460449, -6.426815986633301, -5.903067588806152, -5.379319667816162, -4.855571746826172, -4.331823348999023, -3.808075189590454, -3.2843270301818848, -2.7605788707733154, -2.236830711364746, -1.7130825519561768, -1.1893343925476074, -0.6655862331390381, -0.14183807373046875, 0.3819100856781006, 0.9056582450866699, 1.4294064044952393, 1.9531545639038086, 2.476902723312378, 3.0006508827209473, 3.5243990421295166, 4.048147201538086, 4.571895599365234, 5.095643520355225, 5.619391441345215, 6.143139839172363, 6.666888236999512, 7.190636157989502, 7.714384078979492, 8.23813247680664, 8.761880874633789, 9.285629272460938, 9.80937671661377, 10.333125114440918, 10.856873512268066, 11.380620956420898, 11.904369354248047, 12.428117752075195, 12.951866149902344, 13.475614547729492, 13.999361991882324, 14.523110389709473, 15.046858787536621, 15.570606231689453, 16.0943546295166, 16.61810302734375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 3.0, 0.0, 4.0, 4.0, 8.0, 4.0, 11.0, 2.0, 7.0, 15.0, 20.0, 27.0, 48.0, 34.0, 54.0, 120.0, 145.0, 199.0, 391.0, 702.0, 1497.0, 3975.0, 12402.0, 84602.0, 1159292.0, 2612154.0, 277931.0, 28935.0, 6836.0, 2423.0, 1044.0, 542.0, 313.0, 186.0, 104.0, 87.0, 41.0, 37.0, 25.0, 21.0, 11.0, 8.0, 8.0, 8.0, 7.0, 4.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.20703125, -2.1507720947265625, -2.094512939453125, -2.0382537841796875, -1.98199462890625, -1.9257354736328125, -1.869476318359375, -1.8132171630859375, -1.7569580078125, -1.7006988525390625, -1.644439697265625, -1.5881805419921875, -1.53192138671875, -1.4756622314453125, -1.419403076171875, -1.3631439208984375, -1.306884765625, -1.2506256103515625, -1.194366455078125, -1.1381072998046875, -1.08184814453125, -1.0255889892578125, -0.969329833984375, -0.9130706787109375, -0.8568115234375, -0.8005523681640625, -0.744293212890625, -0.6880340576171875, -0.63177490234375, -0.5755157470703125, -0.519256591796875, -0.4629974365234375, -0.40673828125, -0.3504791259765625, -0.294219970703125, -0.2379608154296875, -0.18170166015625, -0.1254425048828125, -0.069183349609375, -0.0129241943359375, 0.0433349609375, 0.0995941162109375, 0.155853271484375, 0.2121124267578125, 0.26837158203125, 0.3246307373046875, 0.380889892578125, 0.4371490478515625, 0.493408203125, 0.5496673583984375, 0.605926513671875, 0.6621856689453125, 0.71844482421875, 0.7747039794921875, 0.830963134765625, 0.8872222900390625, 0.9434814453125, 0.9997406005859375, 1.055999755859375, 1.1122589111328125, 1.16851806640625, 1.2247772216796875, 1.281036376953125, 1.3372955322265625, 1.3935546875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 1.0, 5.0, 2.0, 1.0, 2.0, 5.0, 6.0, 5.0, 4.0, 9.0, 4.0, 4.0, 11.0, 12.0, 14.0, 19.0, 18.0, 19.0, 17.0, 29.0, 16.0, 37.0, 24.0, 29.0, 38.0, 39.0, 34.0, 31.0, 29.0, 28.0, 30.0, 42.0, 44.0, 41.0, 34.0, 39.0, 36.0, 30.0, 37.0, 29.0, 17.0, 16.0, 17.0, 11.0, 20.0, 10.0, 8.0, 7.0, 12.0, 9.0, 12.0, 2.0, 2.0, 8.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.91162109375, -0.8837966918945312, -0.8559722900390625, -0.8281478881835938, -0.800323486328125, -0.7724990844726562, -0.7446746826171875, -0.7168502807617188, -0.68902587890625, -0.6612014770507812, -0.6333770751953125, -0.6055526733398438, -0.577728271484375, -0.5499038696289062, -0.5220794677734375, -0.49425506591796875, -0.4664306640625, -0.43860626220703125, -0.4107818603515625, -0.38295745849609375, -0.355133056640625, -0.32730865478515625, -0.2994842529296875, -0.27165985107421875, -0.24383544921875, -0.21601104736328125, -0.1881866455078125, -0.16036224365234375, -0.132537841796875, -0.10471343994140625, -0.0768890380859375, -0.04906463623046875, -0.021240234375, 0.00658416748046875, 0.0344085693359375, 0.06223297119140625, 0.090057373046875, 0.11788177490234375, 0.1457061767578125, 0.17353057861328125, 0.20135498046875, 0.22917938232421875, 0.2570037841796875, 0.28482818603515625, 0.312652587890625, 0.34047698974609375, 0.3683013916015625, 0.39612579345703125, 0.4239501953125, 0.45177459716796875, 0.4795989990234375, 0.5074234008789062, 0.535247802734375, 0.5630722045898438, 0.5908966064453125, 0.6187210083007812, 0.64654541015625, 0.6743698120117188, 0.7021942138671875, 0.7300186157226562, 0.757843017578125, 0.7856674194335938, 0.8134918212890625, 0.8413162231445312, 0.869140625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 4.0, 8.0, 16.0, 23.0, 50.0, 90.0, 199.0, 456.0, 1415.0, 8402.0, 851206.0, 3314364.0, 14644.0, 2099.0, 700.0, 268.0, 132.0, 76.0, 56.0, 20.0, 22.0, 12.0, 10.0, 6.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.6953125, -6.5147705078125, -6.334228515625, -6.1536865234375, -5.97314453125, -5.7926025390625, -5.612060546875, -5.4315185546875, -5.2509765625, -5.0704345703125, -4.889892578125, -4.7093505859375, -4.52880859375, -4.3482666015625, -4.167724609375, -3.9871826171875, -3.806640625, -3.6260986328125, -3.445556640625, -3.2650146484375, -3.08447265625, -2.9039306640625, -2.723388671875, -2.5428466796875, -2.3623046875, -2.1817626953125, -2.001220703125, -1.8206787109375, -1.64013671875, -1.4595947265625, -1.279052734375, -1.0985107421875, -0.91796875, -0.7374267578125, -0.556884765625, -0.3763427734375, -0.19580078125, -0.0152587890625, 0.165283203125, 0.3458251953125, 0.5263671875, 0.7069091796875, 0.887451171875, 1.0679931640625, 1.24853515625, 1.4290771484375, 1.609619140625, 1.7901611328125, 1.970703125, 2.1512451171875, 2.331787109375, 2.5123291015625, 2.69287109375, 2.8734130859375, 3.053955078125, 3.2344970703125, 3.4150390625, 3.5955810546875, 3.776123046875, 3.9566650390625, 4.13720703125, 4.3177490234375, 4.498291015625, 4.6788330078125, 4.859375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 18.0, 16.0, 46.0, 103.0, 290.0, 1077.0, 1616.0, 577.0, 194.0, 57.0, 32.0, 15.0, 11.0, 7.0, 6.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.716796875, -3.549468994140625, -3.38214111328125, -3.214813232421875, -3.0474853515625, -2.880157470703125, -2.71282958984375, -2.545501708984375, -2.378173828125, -2.210845947265625, -2.04351806640625, -1.876190185546875, -1.7088623046875, -1.541534423828125, -1.37420654296875, -1.206878662109375, -1.03955078125, -0.872222900390625, -0.70489501953125, -0.537567138671875, -0.3702392578125, -0.202911376953125, -0.03558349609375, 0.131744384765625, 0.299072265625, 0.466400146484375, 0.63372802734375, 0.801055908203125, 0.9683837890625, 1.135711669921875, 1.30303955078125, 1.470367431640625, 1.6376953125, 1.805023193359375, 1.97235107421875, 2.139678955078125, 2.3070068359375, 2.474334716796875, 2.64166259765625, 2.808990478515625, 2.976318359375, 3.143646240234375, 3.31097412109375, 3.478302001953125, 3.6456298828125, 3.812957763671875, 3.98028564453125, 4.147613525390625, 4.31494140625, 4.482269287109375, 4.64959716796875, 4.816925048828125, 4.9842529296875, 5.151580810546875, 5.31890869140625, 5.486236572265625, 5.653564453125, 5.820892333984375, 5.98822021484375, 6.155548095703125, 6.3228759765625, 6.490203857421875, 6.65753173828125, 6.824859619140625, 6.9921875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 6.0, 54.0, 566.0, 324.0, 31.0, 11.0, 11.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.50987243652344, -42.62980651855469, -39.7497444152832, -36.86968231201172, -33.98961639404297, -31.10955238342285, -28.229488372802734, -25.349424362182617, -22.4693603515625, -19.589296340942383, -16.709232330322266, -13.829168319702148, -10.949104309082031, -8.069040298461914, -5.188976287841797, -2.3089122772216797, 0.5711517333984375, 3.4512157440185547, 6.331279754638672, 9.211343765258789, 12.091407775878906, 14.971471786499023, 17.85153579711914, 20.731599807739258, 23.611663818359375, 26.491727828979492, 29.37179183959961, 32.251853942871094, 35.131919860839844, 38.011985778808594, 40.89204788208008, 43.77210998535156, 46.65217590332031, 49.53224182128906, 52.41230392456055, 55.29236602783203, 58.17243194580078, 61.05249786376953, 63.932559967041016, 66.8126220703125, 69.69268798828125, 72.57275390625, 75.45281982421875, 78.33287811279297, 81.21294403076172, 84.09300994873047, 86.97306823730469, 89.85313415527344, 92.73320007324219, 95.61326599121094, 98.49333190917969, 101.3733901977539, 104.25345611572266, 107.1335220336914, 110.01358032226562, 112.89364624023438, 115.77371215820312, 118.65377807617188, 121.53384399414062, 124.41390228271484, 127.2939682006836, 130.1740264892578, 133.05409240722656, 135.9341583251953, 138.81422424316406]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 13.0, 13.0, 27.0, 33.0, 40.0, 59.0, 61.0, 71.0, 81.0, 78.0, 84.0, 82.0, 83.0, 58.0, 63.0, 43.0, 36.0, 25.0, 16.0, 8.0, 8.0, 7.0, 7.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.883245468139648, -15.182271003723145, -14.481297492980957, -13.780323028564453, -13.079349517822266, -12.378375053405762, -11.677400588989258, -10.97642707824707, -10.275452613830566, -9.574478149414062, -8.873504638671875, -8.172530174255371, -7.471556186676025, -6.77058219909668, -6.069607734680176, -5.36863374710083, -4.667659759521484, -3.9666857719421387, -3.265711545944214, -2.564737319946289, -1.8637633323669434, -1.1627893447875977, -0.46181488037109375, 0.23915910720825195, 0.9401330947875977, 1.641107201576233, 2.342081308364868, 3.043055534362793, 3.7440295219421387, 4.445003509521484, 5.145977973937988, 5.846951961517334, 6.5479278564453125, 7.248901844024658, 7.949875831604004, 8.650850296020508, 9.351823806762695, 10.0527982711792, 10.753772735595703, 11.45474624633789, 12.155720710754395, 12.856695175170898, 13.557668685913086, 14.25864315032959, 14.959617614746094, 15.660591125488281, 16.36156463623047, 17.06254005432129, 17.763513565063477, 18.464487075805664, 19.165462493896484, 19.866436004638672, 20.56740951538086, 21.268383026123047, 21.969358444213867, 22.670331954956055, 23.371307373046875, 24.072280883789062, 24.773256301879883, 25.47422981262207, 26.175203323364258, 26.876178741455078, 27.577152252197266, 28.278125762939453, 28.97909927368164]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 2.0, 8.0, 13.0, 18.0, 19.0, 34.0, 39.0, 76.0, 87.0, 165.0, 256.0, 468.0, 730.0, 1309.0, 2163.0, 3995.0, 7825.0, 15229.0, 31440.0, 67813.0, 150284.0, 284203.0, 250751.0, 122619.0, 55383.0, 26100.0, 12749.0, 6579.0, 3507.0, 1926.0, 1141.0, 630.0, 368.0, 229.0, 155.0, 94.0, 56.0, 33.0, 24.0, 20.0, 11.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.28125, -1.2383575439453125, -1.195465087890625, -1.1525726318359375, -1.10968017578125, -1.0667877197265625, -1.023895263671875, -0.9810028076171875, -0.9381103515625, -0.8952178955078125, -0.852325439453125, -0.8094329833984375, -0.76654052734375, -0.7236480712890625, -0.680755615234375, -0.6378631591796875, -0.594970703125, -0.5520782470703125, -0.509185791015625, -0.4662933349609375, -0.42340087890625, -0.3805084228515625, -0.337615966796875, -0.2947235107421875, -0.2518310546875, -0.2089385986328125, -0.166046142578125, -0.1231536865234375, -0.08026123046875, -0.0373687744140625, 0.005523681640625, 0.0484161376953125, 0.09130859375, 0.1342010498046875, 0.177093505859375, 0.2199859619140625, 0.26287841796875, 0.3057708740234375, 0.348663330078125, 0.3915557861328125, 0.4344482421875, 0.4773406982421875, 0.520233154296875, 0.5631256103515625, 0.60601806640625, 0.6489105224609375, 0.691802978515625, 0.7346954345703125, 0.777587890625, 0.8204803466796875, 0.863372802734375, 0.9062652587890625, 0.94915771484375, 0.9920501708984375, 1.034942626953125, 1.0778350830078125, 1.1207275390625, 1.1636199951171875, 1.206512451171875, 1.2494049072265625, 1.29229736328125, 1.3351898193359375, 1.378082275390625, 1.4209747314453125, 1.4638671875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 2.0, 2.0, 5.0, 6.0, 9.0, 8.0, 6.0, 17.0, 13.0, 10.0, 19.0, 21.0, 21.0, 17.0, 30.0, 20.0, 26.0, 28.0, 21.0, 31.0, 27.0, 39.0, 40.0, 42.0, 33.0, 40.0, 39.0, 42.0, 35.0, 38.0, 34.0, 25.0, 38.0, 30.0, 27.0, 21.0, 17.0, 16.0, 21.0, 16.0, 14.0, 9.0, 13.0, 5.0, 7.0, 6.0, 9.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.0458984375, -1.0148391723632812, -0.9837799072265625, -0.9527206420898438, -0.921661376953125, -0.8906021118164062, -0.8595428466796875, -0.8284835815429688, -0.79742431640625, -0.7663650512695312, -0.7353057861328125, -0.7042465209960938, -0.673187255859375, -0.6421279907226562, -0.6110687255859375, -0.5800094604492188, -0.5489501953125, -0.5178909301757812, -0.4868316650390625, -0.45577239990234375, -0.424713134765625, -0.39365386962890625, -0.3625946044921875, -0.33153533935546875, -0.30047607421875, -0.26941680908203125, -0.2383575439453125, -0.20729827880859375, -0.176239013671875, -0.14517974853515625, -0.1141204833984375, -0.08306121826171875, -0.052001953125, -0.02094268798828125, 0.0101165771484375, 0.04117584228515625, 0.072235107421875, 0.10329437255859375, 0.1343536376953125, 0.16541290283203125, 0.19647216796875, 0.22753143310546875, 0.2585906982421875, 0.28964996337890625, 0.320709228515625, 0.35176849365234375, 0.3828277587890625, 0.41388702392578125, 0.4449462890625, 0.47600555419921875, 0.5070648193359375, 0.5381240844726562, 0.569183349609375, 0.6002426147460938, 0.6313018798828125, 0.6623611450195312, 0.69342041015625, 0.7244796752929688, 0.7555389404296875, 0.7865982055664062, 0.817657470703125, 0.8487167358398438, 0.8797760009765625, 0.9108352661132812, 0.94189453125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 1.0, 2.0, 5.0, 4.0, 4.0, 11.0, 13.0, 17.0, 30.0, 46.0, 53.0, 93.0, 159.0, 294.0, 617.0, 1414.0, 3846.0, 12605.0, 50275.0, 260224.0, 598727.0, 90161.0, 20270.0, 5894.0, 2064.0, 782.0, 363.0, 211.0, 101.0, 83.0, 53.0, 31.0, 33.0, 15.0, 20.0, 10.0, 11.0, 5.0, 4.0, 1.0, 3.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0], "bins": [-3.0078125, -2.919830322265625, -2.83184814453125, -2.743865966796875, -2.6558837890625, -2.567901611328125, -2.47991943359375, -2.391937255859375, -2.303955078125, -2.215972900390625, -2.12799072265625, -2.040008544921875, -1.9520263671875, -1.864044189453125, -1.77606201171875, -1.688079833984375, -1.60009765625, -1.512115478515625, -1.42413330078125, -1.336151123046875, -1.2481689453125, -1.160186767578125, -1.07220458984375, -0.984222412109375, -0.896240234375, -0.808258056640625, -0.72027587890625, -0.632293701171875, -0.5443115234375, -0.456329345703125, -0.36834716796875, -0.280364990234375, -0.1923828125, -0.104400634765625, -0.01641845703125, 0.071563720703125, 0.1595458984375, 0.247528076171875, 0.33551025390625, 0.423492431640625, 0.511474609375, 0.599456787109375, 0.68743896484375, 0.775421142578125, 0.8634033203125, 0.951385498046875, 1.03936767578125, 1.127349853515625, 1.21533203125, 1.303314208984375, 1.39129638671875, 1.479278564453125, 1.5672607421875, 1.655242919921875, 1.74322509765625, 1.831207275390625, 1.919189453125, 2.007171630859375, 2.09515380859375, 2.183135986328125, 2.2711181640625, 2.359100341796875, 2.44708251953125, 2.535064697265625, 2.623046875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 7.0, 3.0, 5.0, 6.0, 9.0, 9.0, 9.0, 13.0, 9.0, 21.0, 27.0, 34.0, 36.0, 44.0, 36.0, 48.0, 44.0, 51.0, 44.0, 64.0, 49.0, 40.0, 49.0, 43.0, 36.0, 37.0, 31.0, 39.0, 30.0, 23.0, 17.0, 25.0, 13.0, 10.0, 8.0, 15.0, 9.0, 6.0, 0.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.71875, -4.57049560546875, -4.4222412109375, -4.27398681640625, -4.125732421875, -3.97747802734375, -3.8292236328125, -3.68096923828125, -3.53271484375, -3.38446044921875, -3.2362060546875, -3.08795166015625, -2.939697265625, -2.79144287109375, -2.6431884765625, -2.49493408203125, -2.3466796875, -2.19842529296875, -2.0501708984375, -1.90191650390625, -1.753662109375, -1.60540771484375, -1.4571533203125, -1.30889892578125, -1.16064453125, -1.01239013671875, -0.8641357421875, -0.71588134765625, -0.567626953125, -0.41937255859375, -0.2711181640625, -0.12286376953125, 0.025390625, 0.17364501953125, 0.3218994140625, 0.47015380859375, 0.618408203125, 0.76666259765625, 0.9149169921875, 1.06317138671875, 1.21142578125, 1.35968017578125, 1.5079345703125, 1.65618896484375, 1.804443359375, 1.95269775390625, 2.1009521484375, 2.24920654296875, 2.3974609375, 2.54571533203125, 2.6939697265625, 2.84222412109375, 2.990478515625, 3.13873291015625, 3.2869873046875, 3.43524169921875, 3.58349609375, 3.73175048828125, 3.8800048828125, 4.02825927734375, 4.176513671875, 4.32476806640625, 4.4730224609375, 4.62127685546875, 4.76953125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 7.0, 7.0, 7.0, 8.0, 13.0, 18.0, 33.0, 58.0, 71.0, 104.0, 144.0, 258.0, 393.0, 699.0, 1357.0, 2647.0, 5839.0, 15170.0, 49232.0, 224850.0, 607027.0, 97816.0, 25637.0, 9169.0, 3762.0, 1789.0, 1001.0, 563.0, 287.0, 190.0, 130.0, 86.0, 50.0, 39.0, 30.0, 15.0, 11.0, 16.0, 8.0, 7.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.91748046875, -0.89068603515625, -0.8638916015625, -0.83709716796875, -0.810302734375, -0.78350830078125, -0.7567138671875, -0.72991943359375, -0.703125, -0.67633056640625, -0.6495361328125, -0.62274169921875, -0.595947265625, -0.56915283203125, -0.5423583984375, -0.51556396484375, -0.48876953125, -0.46197509765625, -0.4351806640625, -0.40838623046875, -0.381591796875, -0.35479736328125, -0.3280029296875, -0.30120849609375, -0.2744140625, -0.24761962890625, -0.2208251953125, -0.19403076171875, -0.167236328125, -0.14044189453125, -0.1136474609375, -0.08685302734375, -0.06005859375, -0.03326416015625, -0.0064697265625, 0.02032470703125, 0.047119140625, 0.07391357421875, 0.1007080078125, 0.12750244140625, 0.154296875, 0.18109130859375, 0.2078857421875, 0.23468017578125, 0.261474609375, 0.28826904296875, 0.3150634765625, 0.34185791015625, 0.36865234375, 0.39544677734375, 0.4222412109375, 0.44903564453125, 0.475830078125, 0.50262451171875, 0.5294189453125, 0.55621337890625, 0.5830078125, 0.60980224609375, 0.6365966796875, 0.66339111328125, 0.690185546875, 0.71697998046875, 0.7437744140625, 0.77056884765625, 0.79736328125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 9.0, 7.0, 7.0, 12.0, 9.0, 23.0, 28.0, 39.0, 62.0, 92.0, 128.0, 136.0, 126.0, 71.0, 78.0, 51.0, 31.0, 19.0, 21.0, 9.0, 10.0, 7.0, 4.0, 1.0, 6.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0003864765167236328, -0.0003762058913707733, -0.0003659352660179138, -0.0003556646406650543, -0.0003453940153121948, -0.00033512338995933533, -0.00032485276460647583, -0.00031458213925361633, -0.00030431151390075684, -0.00029404088854789734, -0.00028377026319503784, -0.00027349963784217834, -0.00026322901248931885, -0.00025295838713645935, -0.00024268776178359985, -0.00023241713643074036, -0.00022214651107788086, -0.00021187588572502136, -0.00020160526037216187, -0.00019133463501930237, -0.00018106400966644287, -0.00017079338431358337, -0.00016052275896072388, -0.00015025213360786438, -0.00013998150825500488, -0.00012971088290214539, -0.00011944025754928589, -0.00010916963219642639, -9.88990068435669e-05, -8.86283814907074e-05, -7.83577561378479e-05, -6.80871307849884e-05, -5.7816505432128906e-05, -4.754588007926941e-05, -3.727525472640991e-05, -2.7004629373550415e-05, -1.6734004020690918e-05, -6.463378667831421e-06, 3.807246685028076e-06, 1.4077872037887573e-05, 2.434849739074707e-05, 3.461912274360657e-05, 4.4889748096466064e-05, 5.516037344932556e-05, 6.543099880218506e-05, 7.570162415504456e-05, 8.597224950790405e-05, 9.624287486076355e-05, 0.00010651350021362305, 0.00011678412556648254, 0.00012705475091934204, 0.00013732537627220154, 0.00014759600162506104, 0.00015786662697792053, 0.00016813725233078003, 0.00017840787768363953, 0.00018867850303649902, 0.00019894912838935852, 0.00020921975374221802, 0.00021949037909507751, 0.000229761004447937, 0.0002400316298007965, 0.000250302255153656, 0.0002605728805065155, 0.000270843505859375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 11.0, 13.0, 20.0, 31.0, 57.0, 93.0, 187.0, 327.0, 751.0, 1954.0, 6268.0, 25735.0, 156224.0, 713049.0, 115216.0, 20468.0, 5090.0, 1700.0, 688.0, 306.0, 160.0, 87.0, 48.0, 23.0, 16.0, 9.0, 5.0, 10.0, 9.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.037109375, -1.003021240234375, -0.96893310546875, -0.934844970703125, -0.9007568359375, -0.866668701171875, -0.83258056640625, -0.798492431640625, -0.764404296875, -0.730316162109375, -0.69622802734375, -0.662139892578125, -0.6280517578125, -0.593963623046875, -0.55987548828125, -0.525787353515625, -0.49169921875, -0.457611083984375, -0.42352294921875, -0.389434814453125, -0.3553466796875, -0.321258544921875, -0.28717041015625, -0.253082275390625, -0.218994140625, -0.184906005859375, -0.15081787109375, -0.116729736328125, -0.0826416015625, -0.048553466796875, -0.01446533203125, 0.019622802734375, 0.0537109375, 0.087799072265625, 0.12188720703125, 0.155975341796875, 0.1900634765625, 0.224151611328125, 0.25823974609375, 0.292327880859375, 0.326416015625, 0.360504150390625, 0.39459228515625, 0.428680419921875, 0.4627685546875, 0.496856689453125, 0.53094482421875, 0.565032958984375, 0.59912109375, 0.633209228515625, 0.66729736328125, 0.701385498046875, 0.7354736328125, 0.769561767578125, 0.80364990234375, 0.837738037109375, 0.871826171875, 0.905914306640625, 0.94000244140625, 0.974090576171875, 1.0081787109375, 1.042266845703125, 1.07635498046875, 1.110443115234375, 1.14453125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 8.0, 3.0, 1.0, 2.0, 6.0, 7.0, 6.0, 6.0, 6.0, 11.0, 17.0, 29.0, 33.0, 30.0, 32.0, 39.0, 50.0, 56.0, 60.0, 69.0, 63.0, 63.0, 73.0, 50.0, 52.0, 45.0, 26.0, 32.0, 21.0, 20.0, 16.0, 9.0, 9.0, 9.0, 4.0, 7.0, 6.0, 8.0, 5.0, 4.0, 2.0, 3.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.841796875, -0.8165130615234375, -0.791229248046875, -0.7659454345703125, -0.74066162109375, -0.7153778076171875, -0.690093994140625, -0.6648101806640625, -0.6395263671875, -0.6142425537109375, -0.588958740234375, -0.5636749267578125, -0.53839111328125, -0.5131072998046875, -0.487823486328125, -0.4625396728515625, -0.437255859375, -0.4119720458984375, -0.386688232421875, -0.3614044189453125, -0.33612060546875, -0.3108367919921875, -0.285552978515625, -0.2602691650390625, -0.2349853515625, -0.2097015380859375, -0.184417724609375, -0.1591339111328125, -0.13385009765625, -0.1085662841796875, -0.083282470703125, -0.0579986572265625, -0.03271484375, -0.0074310302734375, 0.017852783203125, 0.0431365966796875, 0.06842041015625, 0.0937042236328125, 0.118988037109375, 0.1442718505859375, 0.1695556640625, 0.1948394775390625, 0.220123291015625, 0.2454071044921875, 0.27069091796875, 0.2959747314453125, 0.321258544921875, 0.3465423583984375, 0.371826171875, 0.3971099853515625, 0.422393798828125, 0.4476776123046875, 0.47296142578125, 0.4982452392578125, 0.523529052734375, 0.5488128662109375, 0.5740966796875, 0.5993804931640625, 0.624664306640625, 0.6499481201171875, 0.67523193359375, 0.7005157470703125, 0.725799560546875, 0.7510833740234375, 0.7763671875]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 11.0, 20.0, 29.0, 81.0, 204.0, 380.0, 160.0, 71.0, 25.0, 8.0, 7.0, 2.0, 4.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.35211944580078, -38.14035415649414, -36.928592681884766, -35.716827392578125, -34.505062103271484, -33.293296813964844, -32.08153533935547, -30.869770050048828, -29.658004760742188, -28.44624137878418, -27.23447608947754, -26.02271270751953, -24.81094741821289, -23.599184036254883, -22.387420654296875, -21.175655364990234, -19.963891983032227, -18.75212860107422, -17.540363311767578, -16.32859992980957, -15.11683464050293, -13.905071258544922, -12.693306922912598, -11.481542587280273, -10.26977825164795, -9.058013916015625, -7.846249580383301, -6.634485721588135, -5.4227213859558105, -4.210957050323486, -2.9991931915283203, -1.787428855895996, -0.5756645202636719, 0.6360996961593628, 1.8478639125823975, 3.0596280097961426, 4.271392345428467, 5.483156681060791, 6.694920539855957, 7.906684875488281, 9.118449211120605, 10.33021354675293, 11.541977882385254, 12.753742218017578, 13.965505599975586, 15.177270889282227, 16.389034271240234, 17.600799560546875, 18.812562942504883, 20.02432632446289, 21.23609161376953, 22.44785499572754, 23.65962028503418, 24.871383666992188, 26.083148956298828, 27.294912338256836, 28.506675720214844, 29.71843910217285, 30.930204391479492, 32.1419677734375, 33.35373306274414, 34.56549835205078, 35.777259826660156, 36.9890251159668, 38.20079040527344]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 3.0, 4.0, 0.0, 8.0, 3.0, 15.0, 7.0, 12.0, 9.0, 14.0, 17.0, 26.0, 26.0, 22.0, 34.0, 35.0, 39.0, 38.0, 38.0, 54.0, 77.0, 84.0, 68.0, 53.0, 30.0, 29.0, 36.0, 24.0, 24.0, 28.0, 20.0, 23.0, 22.0, 15.0, 15.0, 11.0, 10.0, 6.0, 10.0, 3.0, 3.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.370031356811523, -18.75562286376953, -18.141216278076172, -17.52680778503418, -16.912399291992188, -16.297992706298828, -15.683584213256836, -15.06917667388916, -14.454769134521484, -13.840361595153809, -13.225954055786133, -12.61154556274414, -11.997138023376465, -11.382730484008789, -10.768321990966797, -10.153914451599121, -9.539506912231445, -8.92509937286377, -8.310691833496094, -7.696283340454102, -7.081875801086426, -6.46746826171875, -5.853060245513916, -5.238652229309082, -4.624244689941406, -4.0098371505737305, -3.3954291343688965, -2.7810213565826416, -2.1666135787963867, -1.5522058010101318, -0.937798023223877, -0.32339000701904297, 0.291015625, 0.9054234027862549, 1.5198311805725098, 2.1342389583587646, 2.7486467361450195, 3.3630545139312744, 3.9774622917175293, 4.591870307922363, 5.206277847290039, 5.820685386657715, 6.435093402862549, 7.049501419067383, 7.663908958435059, 8.278316497802734, 8.892724990844727, 9.507132530212402, 10.121540069580078, 10.735947608947754, 11.35035514831543, 11.964763641357422, 12.579171180725098, 13.193578720092773, 13.807987213134766, 14.422394752502441, 15.036802291870117, 15.651209831237793, 16.26561737060547, 16.88002586364746, 17.494434356689453, 18.108840942382812, 18.723249435424805, 19.337657928466797, 19.952064514160156]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 5.0, 5.0, 6.0, 7.0, 22.0, 30.0, 42.0, 57.0, 99.0, 177.0, 292.0, 502.0, 1200.0, 3301.0, 13255.0, 146837.0, 2224783.0, 1683382.0, 104053.0, 11071.0, 2902.0, 1110.0, 511.0, 261.0, 154.0, 90.0, 50.0, 32.0, 26.0, 7.0, 10.0, 8.0, 3.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.390625, -2.327606201171875, -2.26458740234375, -2.201568603515625, -2.1385498046875, -2.075531005859375, -2.01251220703125, -1.949493408203125, -1.886474609375, -1.823455810546875, -1.76043701171875, -1.697418212890625, -1.6343994140625, -1.571380615234375, -1.50836181640625, -1.445343017578125, -1.38232421875, -1.319305419921875, -1.25628662109375, -1.193267822265625, -1.1302490234375, -1.067230224609375, -1.00421142578125, -0.941192626953125, -0.878173828125, -0.815155029296875, -0.75213623046875, -0.689117431640625, -0.6260986328125, -0.563079833984375, -0.50006103515625, -0.437042236328125, -0.3740234375, -0.311004638671875, -0.24798583984375, -0.184967041015625, -0.1219482421875, -0.058929443359375, 0.00408935546875, 0.067108154296875, 0.130126953125, 0.193145751953125, 0.25616455078125, 0.319183349609375, 0.3822021484375, 0.445220947265625, 0.50823974609375, 0.571258544921875, 0.63427734375, 0.697296142578125, 0.76031494140625, 0.823333740234375, 0.8863525390625, 0.949371337890625, 1.01239013671875, 1.075408935546875, 1.138427734375, 1.201446533203125, 1.26446533203125, 1.327484130859375, 1.3905029296875, 1.453521728515625, 1.51654052734375, 1.579559326171875, 1.642578125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 7.0, 8.0, 10.0, 13.0, 11.0, 9.0, 16.0, 21.0, 21.0, 31.0, 22.0, 26.0, 32.0, 36.0, 47.0, 42.0, 40.0, 37.0, 41.0, 38.0, 38.0, 39.0, 42.0, 42.0, 36.0, 37.0, 42.0, 29.0, 26.0, 35.0, 18.0, 22.0, 16.0, 16.0, 13.0, 6.0, 6.0, 4.0, 6.0, 3.0, 2.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.0703125, -1.0362701416015625, -1.002227783203125, -0.9681854248046875, -0.93414306640625, -0.9001007080078125, -0.866058349609375, -0.8320159912109375, -0.7979736328125, -0.7639312744140625, -0.729888916015625, -0.6958465576171875, -0.66180419921875, -0.6277618408203125, -0.593719482421875, -0.5596771240234375, -0.525634765625, -0.4915924072265625, -0.457550048828125, -0.4235076904296875, -0.38946533203125, -0.3554229736328125, -0.321380615234375, -0.2873382568359375, -0.2532958984375, -0.2192535400390625, -0.185211181640625, -0.1511688232421875, -0.11712646484375, -0.0830841064453125, -0.049041748046875, -0.0149993896484375, 0.01904296875, 0.0530853271484375, 0.087127685546875, 0.1211700439453125, 0.15521240234375, 0.1892547607421875, 0.223297119140625, 0.2573394775390625, 0.2913818359375, 0.3254241943359375, 0.359466552734375, 0.3935089111328125, 0.42755126953125, 0.4615936279296875, 0.495635986328125, 0.5296783447265625, 0.563720703125, 0.5977630615234375, 0.631805419921875, 0.6658477783203125, 0.69989013671875, 0.7339324951171875, 0.767974853515625, 0.8020172119140625, 0.8360595703125, 0.8701019287109375, 0.904144287109375, 0.9381866455078125, 0.97222900390625, 1.0062713623046875, 1.040313720703125, 1.0743560791015625, 1.1083984375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 9.0, 11.0, 21.0, 46.0, 96.0, 247.0, 578.0, 1911.0, 20022.0, 4027214.0, 139264.0, 3656.0, 721.0, 273.0, 125.0, 35.0, 23.0, 13.0, 8.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.84375, -4.65533447265625, -4.4669189453125, -4.27850341796875, -4.090087890625, -3.90167236328125, -3.7132568359375, -3.52484130859375, -3.33642578125, -3.14801025390625, -2.9595947265625, -2.77117919921875, -2.582763671875, -2.39434814453125, -2.2059326171875, -2.01751708984375, -1.8291015625, -1.64068603515625, -1.4522705078125, -1.26385498046875, -1.075439453125, -0.88702392578125, -0.6986083984375, -0.51019287109375, -0.32177734375, -0.13336181640625, 0.0550537109375, 0.24346923828125, 0.431884765625, 0.62030029296875, 0.8087158203125, 0.99713134765625, 1.185546875, 1.37396240234375, 1.5623779296875, 1.75079345703125, 1.939208984375, 2.12762451171875, 2.3160400390625, 2.50445556640625, 2.69287109375, 2.88128662109375, 3.0697021484375, 3.25811767578125, 3.446533203125, 3.63494873046875, 3.8233642578125, 4.01177978515625, 4.2001953125, 4.38861083984375, 4.5770263671875, 4.76544189453125, 4.953857421875, 5.14227294921875, 5.3306884765625, 5.51910400390625, 5.70751953125, 5.89593505859375, 6.0843505859375, 6.27276611328125, 6.461181640625, 6.64959716796875, 6.8380126953125, 7.02642822265625, 7.21484375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 3.0, 11.0, 11.0, 8.0, 20.0, 23.0, 47.0, 91.0, 147.0, 239.0, 526.0, 886.0, 898.0, 536.0, 296.0, 132.0, 78.0, 39.0, 32.0, 12.0, 12.0, 6.0, 3.0, 3.0, 6.0, 1.0, 3.0, 0.0, 1.0], "bins": [-4.1796875, -4.0907440185546875, -4.001800537109375, -3.9128570556640625, -3.82391357421875, -3.7349700927734375, -3.646026611328125, -3.5570831298828125, -3.4681396484375, -3.3791961669921875, -3.290252685546875, -3.2013092041015625, -3.11236572265625, -3.0234222412109375, -2.934478759765625, -2.8455352783203125, -2.756591796875, -2.6676483154296875, -2.578704833984375, -2.4897613525390625, -2.40081787109375, -2.3118743896484375, -2.222930908203125, -2.1339874267578125, -2.0450439453125, -1.9561004638671875, -1.867156982421875, -1.7782135009765625, -1.68927001953125, -1.6003265380859375, -1.511383056640625, -1.4224395751953125, -1.33349609375, -1.2445526123046875, -1.155609130859375, -1.0666656494140625, -0.97772216796875, -0.8887786865234375, -0.799835205078125, -0.7108917236328125, -0.6219482421875, -0.5330047607421875, -0.444061279296875, -0.3551177978515625, -0.26617431640625, -0.1772308349609375, -0.088287353515625, 0.0006561279296875, 0.089599609375, 0.1785430908203125, 0.267486572265625, 0.3564300537109375, 0.44537353515625, 0.5343170166015625, 0.623260498046875, 0.7122039794921875, 0.8011474609375, 0.8900909423828125, 0.979034423828125, 1.0679779052734375, 1.15692138671875, 1.2458648681640625, 1.334808349609375, 1.4237518310546875, 1.5126953125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 3.0, 4.0, 4.0, 9.0, 21.0, 17.0, 31.0, 54.0, 79.0, 153.0, 206.0, 184.0, 118.0, 52.0, 36.0, 13.0, 8.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0], "bins": [-34.154048919677734, -33.486019134521484, -32.817989349365234, -32.14995574951172, -31.4819278717041, -30.81389617919922, -30.14586639404297, -29.47783660888672, -28.809804916381836, -28.141775131225586, -27.473743438720703, -26.805713653564453, -26.137683868408203, -25.46965217590332, -24.80162239074707, -24.133590698242188, -23.465560913085938, -22.797531127929688, -22.129499435424805, -21.461469650268555, -20.793439865112305, -20.125408172607422, -19.457378387451172, -18.789348602294922, -18.121318817138672, -17.453289031982422, -16.78525733947754, -16.11722755432129, -15.449196815490723, -14.781166076660156, -14.113136291503906, -13.44510555267334, -12.777074813842773, -12.109044075012207, -11.441014289855957, -10.77298355102539, -10.104952812194824, -9.436922073364258, -8.768892288208008, -8.100861549377441, -7.432831287384033, -6.764801025390625, -6.096770286560059, -5.42874002456665, -4.760709762573242, -4.092679023742676, -3.4246487617492676, -2.756618022918701, -2.088587760925293, -1.4205572605133057, -0.7525268793106079, -0.08449649810791016, 0.5835340023040771, 1.2515645027160645, 1.9195947647094727, 2.587625503540039, 3.2556557655334473, 3.9236862659454346, 4.591716766357422, 5.25974702835083, 5.927777290344238, 6.595808029174805, 7.263838291168213, 7.931869029998779, 8.599899291992188]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 7.0, 5.0, 9.0, 10.0, 17.0, 7.0, 23.0, 21.0, 20.0, 27.0, 24.0, 36.0, 24.0, 31.0, 30.0, 40.0, 36.0, 38.0, 43.0, 52.0, 38.0, 29.0, 45.0, 43.0, 38.0, 35.0, 32.0, 39.0, 33.0, 25.0, 23.0, 21.0, 14.0, 14.0, 19.0, 10.0, 11.0, 4.0, 7.0, 7.0, 4.0, 4.0, 6.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-10.439665794372559, -10.1176176071167, -9.79556941986084, -9.47352123260498, -9.151473999023438, -8.829425811767578, -8.507377624511719, -8.18532943725586, -7.86328125, -7.541233062744141, -7.219184875488281, -6.89713716506958, -6.575088977813721, -6.253040790557861, -5.93099308013916, -5.608944892883301, -5.286896705627441, -4.964848518371582, -4.642800331115723, -4.3207526206970215, -3.998704433441162, -3.6766562461853027, -3.3546082973480225, -3.032560348510742, -2.710512161254883, -2.3884639739990234, -2.066416025161743, -1.7443679571151733, -1.4223198890686035, -1.1002718210220337, -0.7782237529754639, -0.4561758041381836, -0.1341266632080078, 0.187921404838562, 0.5099694728851318, 0.8320175409317017, 1.1540656089782715, 1.4761136770248413, 1.7981617450714111, 2.1202096939086914, 2.442257881164551, 2.76430606842041, 3.0863540172576904, 3.4084019660949707, 3.73045015335083, 4.0524983406066895, 4.374546051025391, 4.69659423828125, 5.018642425537109, 5.340690612792969, 5.662738800048828, 5.984786510467529, 6.306834697723389, 6.628882884979248, 6.950930595397949, 7.272978782653809, 7.595026969909668, 7.917075157165527, 8.239123344421387, 8.561171531677246, 8.883218765258789, 9.205266952514648, 9.527315139770508, 9.849363327026367, 10.171411514282227]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 5.0, 3.0, 4.0, 6.0, 12.0, 17.0, 23.0, 43.0, 54.0, 84.0, 134.0, 153.0, 248.0, 366.0, 537.0, 849.0, 1315.0, 2029.0, 3177.0, 5020.0, 8280.0, 13410.0, 21994.0, 38108.0, 65789.0, 117242.0, 196929.0, 223486.0, 147637.0, 83353.0, 47251.0, 27740.0, 16418.0, 9925.0, 6003.0, 3809.0, 2396.0, 1615.0, 1015.0, 680.0, 449.0, 314.0, 189.0, 142.0, 85.0, 74.0, 50.0, 38.0, 27.0, 11.0, 13.0, 3.0, 3.0, 3.0, 0.0, 5.0, 2.0], "bins": [-0.98486328125, -0.9560699462890625, -0.927276611328125, -0.8984832763671875, -0.86968994140625, -0.8408966064453125, -0.812103271484375, -0.7833099365234375, -0.7545166015625, -0.7257232666015625, -0.696929931640625, -0.6681365966796875, -0.63934326171875, -0.6105499267578125, -0.581756591796875, -0.5529632568359375, -0.524169921875, -0.4953765869140625, -0.466583251953125, -0.4377899169921875, -0.40899658203125, -0.3802032470703125, -0.351409912109375, -0.3226165771484375, -0.2938232421875, -0.2650299072265625, -0.236236572265625, -0.2074432373046875, -0.17864990234375, -0.1498565673828125, -0.121063232421875, -0.0922698974609375, -0.0634765625, -0.0346832275390625, -0.005889892578125, 0.0229034423828125, 0.05169677734375, 0.0804901123046875, 0.109283447265625, 0.1380767822265625, 0.1668701171875, 0.1956634521484375, 0.224456787109375, 0.2532501220703125, 0.28204345703125, 0.3108367919921875, 0.339630126953125, 0.3684234619140625, 0.397216796875, 0.4260101318359375, 0.454803466796875, 0.4835968017578125, 0.51239013671875, 0.5411834716796875, 0.569976806640625, 0.5987701416015625, 0.6275634765625, 0.6563568115234375, 0.685150146484375, 0.7139434814453125, 0.74273681640625, 0.7715301513671875, 0.800323486328125, 0.8291168212890625, 0.85791015625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 0.0, 5.0, 2.0, 5.0, 3.0, 3.0, 8.0, 12.0, 11.0, 6.0, 12.0, 10.0, 11.0, 23.0, 24.0, 20.0, 22.0, 32.0, 36.0, 29.0, 33.0, 39.0, 27.0, 49.0, 34.0, 40.0, 43.0, 36.0, 39.0, 35.0, 47.0, 28.0, 37.0, 28.0, 27.0, 31.0, 22.0, 25.0, 28.0, 18.0, 13.0, 12.0, 10.0, 8.0, 7.0, 7.0, 3.0, 5.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9794921875, -0.9458770751953125, -0.912261962890625, -0.8786468505859375, -0.84503173828125, -0.8114166259765625, -0.777801513671875, -0.7441864013671875, -0.7105712890625, -0.6769561767578125, -0.643341064453125, -0.6097259521484375, -0.57611083984375, -0.5424957275390625, -0.508880615234375, -0.4752655029296875, -0.441650390625, -0.4080352783203125, -0.374420166015625, -0.3408050537109375, -0.30718994140625, -0.2735748291015625, -0.239959716796875, -0.2063446044921875, -0.1727294921875, -0.1391143798828125, -0.105499267578125, -0.0718841552734375, -0.03826904296875, -0.0046539306640625, 0.028961181640625, 0.0625762939453125, 0.09619140625, 0.1298065185546875, 0.163421630859375, 0.1970367431640625, 0.23065185546875, 0.2642669677734375, 0.297882080078125, 0.3314971923828125, 0.3651123046875, 0.3987274169921875, 0.432342529296875, 0.4659576416015625, 0.49957275390625, 0.5331878662109375, 0.566802978515625, 0.6004180908203125, 0.634033203125, 0.6676483154296875, 0.701263427734375, 0.7348785400390625, 0.76849365234375, 0.8021087646484375, 0.835723876953125, 0.8693389892578125, 0.9029541015625, 0.9365692138671875, 0.970184326171875, 1.0037994384765625, 1.03741455078125, 1.0710296630859375, 1.104644775390625, 1.1382598876953125, 1.171875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 3.0, 9.0, 10.0, 16.0, 25.0, 27.0, 39.0, 71.0, 87.0, 116.0, 210.0, 298.0, 548.0, 972.0, 2460.0, 7980.0, 38012.0, 314379.0, 618667.0, 49515.0, 9766.0, 2729.0, 1070.0, 570.0, 345.0, 189.0, 148.0, 79.0, 52.0, 55.0, 37.0, 15.0, 19.0, 9.0, 9.0, 5.0, 1.0, 4.0, 0.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.876953125, -3.76947021484375, -3.6619873046875, -3.55450439453125, -3.447021484375, -3.33953857421875, -3.2320556640625, -3.12457275390625, -3.01708984375, -2.90960693359375, -2.8021240234375, -2.69464111328125, -2.587158203125, -2.47967529296875, -2.3721923828125, -2.26470947265625, -2.1572265625, -2.04974365234375, -1.9422607421875, -1.83477783203125, -1.727294921875, -1.61981201171875, -1.5123291015625, -1.40484619140625, -1.29736328125, -1.18988037109375, -1.0823974609375, -0.97491455078125, -0.867431640625, -0.75994873046875, -0.6524658203125, -0.54498291015625, -0.4375, -0.33001708984375, -0.2225341796875, -0.11505126953125, -0.007568359375, 0.09991455078125, 0.2073974609375, 0.31488037109375, 0.42236328125, 0.52984619140625, 0.6373291015625, 0.74481201171875, 0.852294921875, 0.95977783203125, 1.0672607421875, 1.17474365234375, 1.2822265625, 1.38970947265625, 1.4971923828125, 1.60467529296875, 1.712158203125, 1.81964111328125, 1.9271240234375, 2.03460693359375, 2.14208984375, 2.24957275390625, 2.3570556640625, 2.46453857421875, 2.572021484375, 2.67950439453125, 2.7869873046875, 2.89447021484375, 3.001953125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 7.0, 10.0, 7.0, 16.0, 12.0, 25.0, 30.0, 36.0, 29.0, 52.0, 37.0, 49.0, 74.0, 68.0, 65.0, 65.0, 66.0, 64.0, 50.0, 46.0, 29.0, 31.0, 14.0, 25.0, 22.0, 13.0, 16.0, 11.0, 10.0, 8.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.81640625, -6.63665771484375, -6.4569091796875, -6.27716064453125, -6.097412109375, -5.91766357421875, -5.7379150390625, -5.55816650390625, -5.37841796875, -5.19866943359375, -5.0189208984375, -4.83917236328125, -4.659423828125, -4.47967529296875, -4.2999267578125, -4.12017822265625, -3.9404296875, -3.76068115234375, -3.5809326171875, -3.40118408203125, -3.221435546875, -3.04168701171875, -2.8619384765625, -2.68218994140625, -2.50244140625, -2.32269287109375, -2.1429443359375, -1.96319580078125, -1.783447265625, -1.60369873046875, -1.4239501953125, -1.24420166015625, -1.064453125, -0.88470458984375, -0.7049560546875, -0.52520751953125, -0.345458984375, -0.16571044921875, 0.0140380859375, 0.19378662109375, 0.37353515625, 0.55328369140625, 0.7330322265625, 0.91278076171875, 1.092529296875, 1.27227783203125, 1.4520263671875, 1.63177490234375, 1.8115234375, 1.99127197265625, 2.1710205078125, 2.35076904296875, 2.530517578125, 2.71026611328125, 2.8900146484375, 3.06976318359375, 3.24951171875, 3.42926025390625, 3.6090087890625, 3.78875732421875, 3.968505859375, 4.14825439453125, 4.3280029296875, 4.50775146484375, 4.6875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 0.0, 4.0, 3.0, 4.0, 3.0, 8.0, 6.0, 4.0, 10.0, 17.0, 20.0, 27.0, 35.0, 62.0, 86.0, 171.0, 320.0, 809.0, 2091.0, 7341.0, 32176.0, 246136.0, 688418.0, 54837.0, 10957.0, 2953.0, 1010.0, 490.0, 210.0, 127.0, 60.0, 41.0, 28.0, 27.0, 14.0, 15.0, 9.0, 9.0, 8.0, 4.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-1.048828125, -1.0189895629882812, -0.9891510009765625, -0.9593124389648438, -0.929473876953125, -0.8996353149414062, -0.8697967529296875, -0.8399581909179688, -0.81011962890625, -0.7802810668945312, -0.7504425048828125, -0.7206039428710938, -0.690765380859375, -0.6609268188476562, -0.6310882568359375, -0.6012496948242188, -0.5714111328125, -0.5415725708007812, -0.5117340087890625, -0.48189544677734375, -0.452056884765625, -0.42221832275390625, -0.3923797607421875, -0.36254119873046875, -0.33270263671875, -0.30286407470703125, -0.2730255126953125, -0.24318695068359375, -0.213348388671875, -0.18350982666015625, -0.1536712646484375, -0.12383270263671875, -0.093994140625, -0.06415557861328125, -0.0343170166015625, -0.00447845458984375, 0.025360107421875, 0.05519866943359375, 0.0850372314453125, 0.11487579345703125, 0.14471435546875, 0.17455291748046875, 0.2043914794921875, 0.23423004150390625, 0.264068603515625, 0.29390716552734375, 0.3237457275390625, 0.35358428955078125, 0.3834228515625, 0.41326141357421875, 0.4430999755859375, 0.47293853759765625, 0.502777099609375, 0.5326156616210938, 0.5624542236328125, 0.5922927856445312, 0.62213134765625, 0.6519699096679688, 0.6818084716796875, 0.7116470336914062, 0.741485595703125, 0.7713241577148438, 0.8011627197265625, 0.8310012817382812, 0.86083984375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 4.0, 3.0, 4.0, 13.0, 11.0, 17.0, 9.0, 19.0, 34.0, 49.0, 72.0, 97.0, 118.0, 130.0, 113.0, 78.0, 60.0, 43.0, 26.0, 25.0, 14.0, 18.0, 11.0, 6.0, 5.0, 3.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002524852752685547, -0.0002441816031932831, -0.00023587793111801147, -0.00022757425904273987, -0.00021927058696746826, -0.00021096691489219666, -0.00020266324281692505, -0.00019435957074165344, -0.00018605589866638184, -0.00017775222659111023, -0.00016944855451583862, -0.00016114488244056702, -0.0001528412103652954, -0.0001445375382900238, -0.0001362338662147522, -0.0001279301941394806, -0.00011962652206420898, -0.00011132284998893738, -0.00010301917791366577, -9.471550583839417e-05, -8.641183376312256e-05, -7.810816168785095e-05, -6.980448961257935e-05, -6.150081753730774e-05, -5.319714546203613e-05, -4.4893473386764526e-05, -3.658980131149292e-05, -2.8286129236221313e-05, -1.9982457160949707e-05, -1.16787850856781e-05, -3.375113010406494e-06, 4.928559064865112e-06, 1.3232231140136719e-05, 2.1535903215408325e-05, 2.983957529067993e-05, 3.814324736595154e-05, 4.6446919441223145e-05, 5.475059151649475e-05, 6.305426359176636e-05, 7.135793566703796e-05, 7.966160774230957e-05, 8.796527981758118e-05, 9.626895189285278e-05, 0.00010457262396812439, 0.000112876296043396, 0.0001211799681186676, 0.0001294836401939392, 0.00013778731226921082, 0.00014609098434448242, 0.00015439465641975403, 0.00016269832849502563, 0.00017100200057029724, 0.00017930567264556885, 0.00018760934472084045, 0.00019591301679611206, 0.00020421668887138367, 0.00021252036094665527, 0.00022082403302192688, 0.00022912770509719849, 0.0002374313771724701, 0.0002457350492477417, 0.0002540387213230133, 0.0002623423933982849, 0.0002706460654735565, 0.0002789497375488281]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 5.0, 3.0, 3.0, 5.0, 9.0, 10.0, 20.0, 33.0, 48.0, 58.0, 137.0, 291.0, 731.0, 2485.0, 13670.0, 187218.0, 803004.0, 34203.0, 4624.0, 1158.0, 409.0, 196.0, 96.0, 55.0, 36.0, 13.0, 15.0, 9.0, 8.0, 3.0, 3.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.095703125, -1.0522308349609375, -1.008758544921875, -0.9652862548828125, -0.92181396484375, -0.8783416748046875, -0.834869384765625, -0.7913970947265625, -0.7479248046875, -0.7044525146484375, -0.660980224609375, -0.6175079345703125, -0.57403564453125, -0.5305633544921875, -0.487091064453125, -0.4436187744140625, -0.400146484375, -0.3566741943359375, -0.313201904296875, -0.2697296142578125, -0.22625732421875, -0.1827850341796875, -0.139312744140625, -0.0958404541015625, -0.0523681640625, -0.0088958740234375, 0.034576416015625, 0.0780487060546875, 0.12152099609375, 0.1649932861328125, 0.208465576171875, 0.2519378662109375, 0.29541015625, 0.3388824462890625, 0.382354736328125, 0.4258270263671875, 0.46929931640625, 0.5127716064453125, 0.556243896484375, 0.5997161865234375, 0.6431884765625, 0.6866607666015625, 0.730133056640625, 0.7736053466796875, 0.81707763671875, 0.8605499267578125, 0.904022216796875, 0.9474945068359375, 0.990966796875, 1.0344390869140625, 1.077911376953125, 1.1213836669921875, 1.16485595703125, 1.2083282470703125, 1.251800537109375, 1.2952728271484375, 1.3387451171875, 1.3822174072265625, 1.425689697265625, 1.4691619873046875, 1.51263427734375, 1.5561065673828125, 1.599578857421875, 1.6430511474609375, 1.6865234375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 2.0, 0.0, 4.0, 4.0, 5.0, 8.0, 8.0, 9.0, 10.0, 12.0, 24.0, 29.0, 21.0, 44.0, 53.0, 64.0, 78.0, 113.0, 84.0, 105.0, 71.0, 57.0, 49.0, 37.0, 19.0, 23.0, 17.0, 13.0, 11.0, 4.0, 5.0, 5.0, 3.0, 3.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.7578125, -0.732818603515625, -0.70782470703125, -0.682830810546875, -0.6578369140625, -0.632843017578125, -0.60784912109375, -0.582855224609375, -0.557861328125, -0.532867431640625, -0.50787353515625, -0.482879638671875, -0.4578857421875, -0.432891845703125, -0.40789794921875, -0.382904052734375, -0.35791015625, -0.332916259765625, -0.30792236328125, -0.282928466796875, -0.2579345703125, -0.232940673828125, -0.20794677734375, -0.182952880859375, -0.157958984375, -0.132965087890625, -0.10797119140625, -0.082977294921875, -0.0579833984375, -0.032989501953125, -0.00799560546875, 0.016998291015625, 0.0419921875, 0.066986083984375, 0.09197998046875, 0.116973876953125, 0.1419677734375, 0.166961669921875, 0.19195556640625, 0.216949462890625, 0.241943359375, 0.266937255859375, 0.29193115234375, 0.316925048828125, 0.3419189453125, 0.366912841796875, 0.39190673828125, 0.416900634765625, 0.44189453125, 0.466888427734375, 0.49188232421875, 0.516876220703125, 0.5418701171875, 0.566864013671875, 0.59185791015625, 0.616851806640625, 0.641845703125, 0.666839599609375, 0.69183349609375, 0.716827392578125, 0.7418212890625, 0.766815185546875, 0.79180908203125, 0.816802978515625, 0.841796875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 6.0, 3.0, 11.0, 18.0, 21.0, 57.0, 90.0, 161.0, 324.0, 140.0, 79.0, 37.0, 28.0, 11.0, 6.0, 4.0, 3.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.53421401977539, -26.800222396850586, -26.06622886657715, -25.332237243652344, -24.59824562072754, -23.8642520904541, -23.130260467529297, -22.39626693725586, -21.662275314331055, -20.92828369140625, -20.194290161132812, -19.460298538208008, -18.726306915283203, -17.992313385009766, -17.25832176208496, -16.524330139160156, -15.790337562561035, -15.056344985961914, -14.32235336303711, -13.588360786437988, -12.854368209838867, -12.120376586914062, -11.386384010314941, -10.65239143371582, -9.918399810791016, -9.184407234191895, -8.45041561126709, -7.716423034667969, -6.982430458068848, -6.248438358306885, -5.514446258544922, -4.780453681945801, -4.04646110534668, -3.3124687671661377, -2.5784764289855957, -1.8444843292236328, -1.1104919910430908, -0.37649965286254883, 0.35749244689941406, 1.0914850234985352, 1.825477123260498, 2.55946946144104, 3.293461799621582, 4.027453899383545, 4.761445999145508, 5.495438575744629, 6.229430675506592, 6.963423252105713, 7.697415351867676, 8.431407928466797, 9.165399551391602, 9.899392127990723, 10.633384704589844, 11.367376327514648, 12.10136890411377, 12.83536148071289, 13.569353103637695, 14.303345680236816, 15.037337303161621, 15.771329879760742, 16.505321502685547, 17.239315032958984, 17.97330665588379, 18.707298278808594, 19.44129180908203]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 8.0, 3.0, 8.0, 9.0, 16.0, 8.0, 17.0, 18.0, 15.0, 27.0, 25.0, 27.0, 45.0, 38.0, 44.0, 64.0, 99.0, 126.0, 67.0, 59.0, 32.0, 26.0, 29.0, 40.0, 16.0, 23.0, 20.0, 19.0, 16.0, 16.0, 10.0, 10.0, 5.0, 3.0, 1.0, 0.0, 5.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-23.951622009277344, -23.26797103881836, -22.584318161010742, -21.900667190551758, -21.217016220092773, -20.533363342285156, -19.849712371826172, -19.166061401367188, -18.48240852355957, -17.798757553100586, -17.11510467529297, -16.431453704833984, -15.747801780700684, -15.064149856567383, -14.380498886108398, -13.696846961975098, -13.013195991516113, -12.329544067382812, -11.645893096923828, -10.962241172790527, -10.278589248657227, -9.594938278198242, -8.911286354064941, -8.22763442993164, -7.543982982635498, -6.8603315353393555, -6.176679611206055, -5.493028163909912, -4.8093767166137695, -4.125724792480469, -3.442073345184326, -2.7584214210510254, -2.074769973754883, -1.3911182880401611, -0.707466721534729, -0.023815155029296875, 0.6598365306854248, 1.3434882164001465, 2.027139663696289, 2.71079158782959, 3.3944430351257324, 4.078094482421875, 4.761746406555176, 5.445397853851318, 6.129049301147461, 6.812701225280762, 7.496352672576904, 8.180004119873047, 8.863656044006348, 9.547307968139648, 10.230958938598633, 10.914610862731934, 11.598262786865234, 12.281913757324219, 12.96556568145752, 13.64921760559082, 14.332868576049805, 15.016520500183105, 15.70017147064209, 16.38382339477539, 17.067474365234375, 17.751127243041992, 18.434778213500977, 19.118431091308594, 19.802082061767578]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 6.0, 6.0, 6.0, 7.0, 14.0, 19.0, 27.0, 48.0, 56.0, 93.0, 126.0, 223.0, 396.0, 727.0, 1758.0, 4590.0, 17928.0, 115418.0, 810377.0, 2391786.0, 710973.0, 112273.0, 19039.0, 5007.0, 1770.0, 737.0, 355.0, 197.0, 110.0, 66.0, 45.0, 45.0, 23.0, 14.0, 5.0, 6.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.642578125, -1.599884033203125, -1.55718994140625, -1.514495849609375, -1.4718017578125, -1.429107666015625, -1.38641357421875, -1.343719482421875, -1.301025390625, -1.258331298828125, -1.21563720703125, -1.172943115234375, -1.1302490234375, -1.087554931640625, -1.04486083984375, -1.002166748046875, -0.95947265625, -0.916778564453125, -0.87408447265625, -0.831390380859375, -0.7886962890625, -0.746002197265625, -0.70330810546875, -0.660614013671875, -0.617919921875, -0.575225830078125, -0.53253173828125, -0.489837646484375, -0.4471435546875, -0.404449462890625, -0.36175537109375, -0.319061279296875, -0.2763671875, -0.233673095703125, -0.19097900390625, -0.148284912109375, -0.1055908203125, -0.062896728515625, -0.02020263671875, 0.022491455078125, 0.065185546875, 0.107879638671875, 0.15057373046875, 0.193267822265625, 0.2359619140625, 0.278656005859375, 0.32135009765625, 0.364044189453125, 0.40673828125, 0.449432373046875, 0.49212646484375, 0.534820556640625, 0.5775146484375, 0.620208740234375, 0.66290283203125, 0.705596923828125, 0.748291015625, 0.790985107421875, 0.83367919921875, 0.876373291015625, 0.9190673828125, 0.961761474609375, 1.00445556640625, 1.047149658203125, 1.08984375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 6.0, 5.0, 3.0, 8.0, 11.0, 9.0, 10.0, 10.0, 9.0, 13.0, 22.0, 19.0, 21.0, 32.0, 26.0, 34.0, 29.0, 45.0, 39.0, 61.0, 40.0, 44.0, 43.0, 41.0, 47.0, 37.0, 46.0, 30.0, 45.0, 35.0, 34.0, 30.0, 12.0, 30.0, 20.0, 10.0, 10.0, 7.0, 7.0, 13.0, 5.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2841796875, -1.247528076171875, -1.21087646484375, -1.174224853515625, -1.1375732421875, -1.100921630859375, -1.06427001953125, -1.027618408203125, -0.990966796875, -0.954315185546875, -0.91766357421875, -0.881011962890625, -0.8443603515625, -0.807708740234375, -0.77105712890625, -0.734405517578125, -0.69775390625, -0.661102294921875, -0.62445068359375, -0.587799072265625, -0.5511474609375, -0.514495849609375, -0.47784423828125, -0.441192626953125, -0.404541015625, -0.367889404296875, -0.33123779296875, -0.294586181640625, -0.2579345703125, -0.221282958984375, -0.18463134765625, -0.147979736328125, -0.111328125, -0.074676513671875, -0.03802490234375, -0.001373291015625, 0.0352783203125, 0.071929931640625, 0.10858154296875, 0.145233154296875, 0.181884765625, 0.218536376953125, 0.25518798828125, 0.291839599609375, 0.3284912109375, 0.365142822265625, 0.40179443359375, 0.438446044921875, 0.47509765625, 0.511749267578125, 0.54840087890625, 0.585052490234375, 0.6217041015625, 0.658355712890625, 0.69500732421875, 0.731658935546875, 0.768310546875, 0.804962158203125, 0.84161376953125, 0.878265380859375, 0.9149169921875, 0.951568603515625, 0.98822021484375, 1.024871826171875, 1.0615234375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 3.0, 6.0, 3.0, 5.0, 3.0, 3.0, 8.0, 9.0, 8.0, 17.0, 14.0, 21.0, 36.0, 77.0, 85.0, 214.0, 415.0, 1037.0, 3536.0, 18396.0, 328835.0, 3711428.0, 115556.0, 10742.0, 2379.0, 740.0, 296.0, 157.0, 87.0, 51.0, 37.0, 19.0, 12.0, 9.0, 11.0, 7.0, 6.0, 4.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.58203125, -2.49407958984375, -2.4061279296875, -2.31817626953125, -2.230224609375, -2.14227294921875, -2.0543212890625, -1.96636962890625, -1.87841796875, -1.79046630859375, -1.7025146484375, -1.61456298828125, -1.526611328125, -1.43865966796875, -1.3507080078125, -1.26275634765625, -1.1748046875, -1.08685302734375, -0.9989013671875, -0.91094970703125, -0.822998046875, -0.73504638671875, -0.6470947265625, -0.55914306640625, -0.47119140625, -0.38323974609375, -0.2952880859375, -0.20733642578125, -0.119384765625, -0.03143310546875, 0.0565185546875, 0.14447021484375, 0.232421875, 0.32037353515625, 0.4083251953125, 0.49627685546875, 0.584228515625, 0.67218017578125, 0.7601318359375, 0.84808349609375, 0.93603515625, 1.02398681640625, 1.1119384765625, 1.19989013671875, 1.287841796875, 1.37579345703125, 1.4637451171875, 1.55169677734375, 1.6396484375, 1.72760009765625, 1.8155517578125, 1.90350341796875, 1.991455078125, 2.07940673828125, 2.1673583984375, 2.25531005859375, 2.34326171875, 2.43121337890625, 2.5191650390625, 2.60711669921875, 2.695068359375, 2.78302001953125, 2.8709716796875, 2.95892333984375, 3.046875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 7.0, 3.0, 9.0, 14.0, 13.0, 21.0, 26.0, 63.0, 81.0, 155.0, 291.0, 528.0, 724.0, 776.0, 549.0, 331.0, 188.0, 108.0, 60.0, 48.0, 28.0, 17.0, 9.0, 10.0, 10.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.166015625, -3.0869293212890625, -3.007843017578125, -2.9287567138671875, -2.84967041015625, -2.7705841064453125, -2.691497802734375, -2.6124114990234375, -2.5333251953125, -2.4542388916015625, -2.375152587890625, -2.2960662841796875, -2.21697998046875, -2.1378936767578125, -2.058807373046875, -1.9797210693359375, -1.900634765625, -1.8215484619140625, -1.742462158203125, -1.6633758544921875, -1.58428955078125, -1.5052032470703125, -1.426116943359375, -1.3470306396484375, -1.2679443359375, -1.1888580322265625, -1.109771728515625, -1.0306854248046875, -0.95159912109375, -0.8725128173828125, -0.793426513671875, -0.7143402099609375, -0.63525390625, -0.5561676025390625, -0.477081298828125, -0.3979949951171875, -0.31890869140625, -0.2398223876953125, -0.160736083984375, -0.0816497802734375, -0.0025634765625, 0.0765228271484375, 0.155609130859375, 0.2346954345703125, 0.31378173828125, 0.3928680419921875, 0.471954345703125, 0.5510406494140625, 0.630126953125, 0.7092132568359375, 0.788299560546875, 0.8673858642578125, 0.94647216796875, 1.0255584716796875, 1.104644775390625, 1.1837310791015625, 1.2628173828125, 1.3419036865234375, 1.420989990234375, 1.5000762939453125, 1.57916259765625, 1.6582489013671875, 1.737335205078125, 1.8164215087890625, 1.8955078125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 8.0, 4.0, 2.0, 10.0, 29.0, 59.0, 85.0, 170.0, 211.0, 179.0, 116.0, 64.0, 32.0, 13.0, 6.0, 2.0, 4.0, 5.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.250326156616211, -12.634613990783691, -12.018901824951172, -11.403189659118652, -10.787477493286133, -10.17176628112793, -9.55605411529541, -8.94034194946289, -8.324629783630371, -7.708917617797852, -7.093205451965332, -6.477493762969971, -5.861781597137451, -5.246069431304932, -4.63035774230957, -4.014645576477051, -3.3989334106445312, -2.7832212448120117, -2.1675093173980713, -1.5517972707748413, -0.9360852241516113, -0.3203730583190918, 0.29533886909484863, 0.9110507965087891, 1.5267629623413086, 2.142475128173828, 2.7581870555877686, 3.373898983001709, 3.9896111488342285, 4.605323314666748, 5.221035003662109, 5.836747169494629, 6.452461242675781, 7.068173408508301, 7.68388557434082, 8.29959774017334, 8.91530990600586, 9.531021118164062, 10.146733283996582, 10.762445449829102, 11.378157615661621, 11.99386978149414, 12.60958194732666, 13.22529411315918, 13.841005325317383, 14.456718444824219, 15.072429656982422, 15.688141822814941, 16.30385398864746, 16.919565200805664, 17.5352783203125, 18.150989532470703, 18.76670265197754, 19.382413864135742, 19.998126983642578, 20.61383819580078, 21.229549407958984, 21.845260620117188, 22.460973739624023, 23.076684951782227, 23.692398071289062, 24.308109283447266, 24.9238224029541, 25.539533615112305, 26.15524673461914]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 0.0, 0.0, 5.0, 3.0, 7.0, 5.0, 16.0, 20.0, 16.0, 18.0, 19.0, 31.0, 25.0, 26.0, 26.0, 40.0, 44.0, 47.0, 54.0, 47.0, 50.0, 52.0, 58.0, 48.0, 51.0, 42.0, 47.0, 33.0, 23.0, 28.0, 23.0, 23.0, 21.0, 10.0, 11.0, 8.0, 8.0, 7.0, 5.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.652399063110352, -8.357359886169434, -8.062320709228516, -7.7672810554504395, -7.4722418785095215, -7.177202224731445, -6.882163047790527, -6.587123870849609, -6.292084693908691, -5.997045516967773, -5.702005863189697, -5.406966686248779, -5.111927509307861, -4.816887855529785, -4.521848678588867, -4.226809501647949, -3.931769847869873, -3.636730432510376, -3.341691255569458, -3.046651840209961, -2.751612663269043, -2.456573247909546, -2.161533832550049, -1.8664946556091309, -1.5714552402496338, -1.2764159440994263, -0.981376588344574, -0.6863372325897217, -0.39129793643951416, -0.09625864028930664, 0.19878077507019043, 0.4938199520111084, 0.7888593673706055, 1.083898663520813, 1.3789379596710205, 1.6739773750305176, 1.969016671180725, 2.2640559673309326, 2.5590953826904297, 2.8541345596313477, 3.1491739749908447, 3.444213390350342, 3.7392525672912598, 4.034292221069336, 4.329331398010254, 4.624370574951172, 4.91940975189209, 5.214448928833008, 5.509488582611084, 5.804527759552002, 6.099567413330078, 6.394606590270996, 6.689645767211914, 6.984684944152832, 7.279724597930908, 7.574763774871826, 7.869803428649902, 8.16484260559082, 8.459881782531738, 8.754920959472656, 9.04996109008789, 9.345000267028809, 9.640039443969727, 9.935078620910645, 10.230117797851562]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 5.0, 3.0, 4.0, 7.0, 6.0, 5.0, 14.0, 23.0, 26.0, 46.0, 76.0, 89.0, 146.0, 238.0, 365.0, 506.0, 804.0, 1332.0, 2347.0, 4075.0, 7551.0, 14355.0, 29420.0, 66467.0, 162606.0, 350860.0, 232912.0, 93201.0, 40172.0, 18845.0, 9569.0, 5023.0, 2957.0, 1661.0, 1031.0, 642.0, 380.0, 280.0, 158.0, 112.0, 74.0, 54.0, 37.0, 30.0, 20.0, 11.0, 10.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.416015625, -1.366668701171875, -1.31732177734375, -1.267974853515625, -1.2186279296875, -1.169281005859375, -1.11993408203125, -1.070587158203125, -1.021240234375, -0.971893310546875, -0.92254638671875, -0.873199462890625, -0.8238525390625, -0.774505615234375, -0.72515869140625, -0.675811767578125, -0.62646484375, -0.577117919921875, -0.52777099609375, -0.478424072265625, -0.4290771484375, -0.379730224609375, -0.33038330078125, -0.281036376953125, -0.231689453125, -0.182342529296875, -0.13299560546875, -0.083648681640625, -0.0343017578125, 0.015045166015625, 0.06439208984375, 0.113739013671875, 0.1630859375, 0.212432861328125, 0.26177978515625, 0.311126708984375, 0.3604736328125, 0.409820556640625, 0.45916748046875, 0.508514404296875, 0.557861328125, 0.607208251953125, 0.65655517578125, 0.705902099609375, 0.7552490234375, 0.804595947265625, 0.85394287109375, 0.903289794921875, 0.95263671875, 1.001983642578125, 1.05133056640625, 1.100677490234375, 1.1500244140625, 1.199371337890625, 1.24871826171875, 1.298065185546875, 1.347412109375, 1.396759033203125, 1.44610595703125, 1.495452880859375, 1.5447998046875, 1.594146728515625, 1.64349365234375, 1.692840576171875, 1.7421875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 6.0, 6.0, 7.0, 7.0, 6.0, 18.0, 17.0, 8.0, 17.0, 14.0, 15.0, 25.0, 25.0, 27.0, 29.0, 39.0, 38.0, 33.0, 48.0, 42.0, 46.0, 45.0, 47.0, 53.0, 32.0, 52.0, 36.0, 43.0, 34.0, 23.0, 27.0, 26.0, 25.0, 17.0, 22.0, 5.0, 10.0, 12.0, 9.0, 6.0, 4.0, 1.0, 1.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1162109375, -1.0803985595703125, -1.044586181640625, -1.0087738037109375, -0.97296142578125, -0.9371490478515625, -0.901336669921875, -0.8655242919921875, -0.8297119140625, -0.7938995361328125, -0.758087158203125, -0.7222747802734375, -0.68646240234375, -0.6506500244140625, -0.614837646484375, -0.5790252685546875, -0.543212890625, -0.5074005126953125, -0.471588134765625, -0.4357757568359375, -0.39996337890625, -0.3641510009765625, -0.328338623046875, -0.2925262451171875, -0.2567138671875, -0.2209014892578125, -0.185089111328125, -0.1492767333984375, -0.11346435546875, -0.0776519775390625, -0.041839599609375, -0.0060272216796875, 0.02978515625, 0.0655975341796875, 0.101409912109375, 0.1372222900390625, 0.17303466796875, 0.2088470458984375, 0.244659423828125, 0.2804718017578125, 0.3162841796875, 0.3520965576171875, 0.387908935546875, 0.4237213134765625, 0.45953369140625, 0.4953460693359375, 0.531158447265625, 0.5669708251953125, 0.602783203125, 0.6385955810546875, 0.674407958984375, 0.7102203369140625, 0.74603271484375, 0.7818450927734375, 0.817657470703125, 0.8534698486328125, 0.8892822265625, 0.9250946044921875, 0.960906982421875, 0.9967193603515625, 1.03253173828125, 1.0683441162109375, 1.104156494140625, 1.1399688720703125, 1.17578125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 6.0, 6.0, 6.0, 15.0, 9.0, 19.0, 21.0, 21.0, 37.0, 68.0, 74.0, 91.0, 158.0, 194.0, 315.0, 500.0, 789.0, 1518.0, 3524.0, 13889.0, 119896.0, 823366.0, 68306.0, 9528.0, 2760.0, 1279.0, 729.0, 433.0, 284.0, 201.0, 145.0, 105.0, 65.0, 60.0, 46.0, 24.0, 22.0, 9.0, 7.0, 11.0, 4.0, 6.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-4.078125, -3.95953369140625, -3.8409423828125, -3.72235107421875, -3.603759765625, -3.48516845703125, -3.3665771484375, -3.24798583984375, -3.12939453125, -3.01080322265625, -2.8922119140625, -2.77362060546875, -2.655029296875, -2.53643798828125, -2.4178466796875, -2.29925537109375, -2.1806640625, -2.06207275390625, -1.9434814453125, -1.82489013671875, -1.706298828125, -1.58770751953125, -1.4691162109375, -1.35052490234375, -1.23193359375, -1.11334228515625, -0.9947509765625, -0.87615966796875, -0.757568359375, -0.63897705078125, -0.5203857421875, -0.40179443359375, -0.283203125, -0.16461181640625, -0.0460205078125, 0.07257080078125, 0.191162109375, 0.30975341796875, 0.4283447265625, 0.54693603515625, 0.66552734375, 0.78411865234375, 0.9027099609375, 1.02130126953125, 1.139892578125, 1.25848388671875, 1.3770751953125, 1.49566650390625, 1.6142578125, 1.73284912109375, 1.8514404296875, 1.97003173828125, 2.088623046875, 2.20721435546875, 2.3258056640625, 2.44439697265625, 2.56298828125, 2.68157958984375, 2.8001708984375, 2.91876220703125, 3.037353515625, 3.15594482421875, 3.2745361328125, 3.39312744140625, 3.51171875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 5.0, 5.0, 4.0, 10.0, 11.0, 12.0, 18.0, 28.0, 38.0, 42.0, 45.0, 63.0, 52.0, 71.0, 67.0, 75.0, 67.0, 73.0, 53.0, 59.0, 55.0, 33.0, 27.0, 22.0, 15.0, 19.0, 5.0, 7.0, 7.0, 4.0, 5.0, 1.0, 0.0, 0.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.390625, -6.21356201171875, -6.0364990234375, -5.85943603515625, -5.682373046875, -5.50531005859375, -5.3282470703125, -5.15118408203125, -4.97412109375, -4.79705810546875, -4.6199951171875, -4.44293212890625, -4.265869140625, -4.08880615234375, -3.9117431640625, -3.73468017578125, -3.5576171875, -3.38055419921875, -3.2034912109375, -3.02642822265625, -2.849365234375, -2.67230224609375, -2.4952392578125, -2.31817626953125, -2.14111328125, -1.96405029296875, -1.7869873046875, -1.60992431640625, -1.432861328125, -1.25579833984375, -1.0787353515625, -0.90167236328125, -0.724609375, -0.54754638671875, -0.3704833984375, -0.19342041015625, -0.016357421875, 0.16070556640625, 0.3377685546875, 0.51483154296875, 0.69189453125, 0.86895751953125, 1.0460205078125, 1.22308349609375, 1.400146484375, 1.57720947265625, 1.7542724609375, 1.93133544921875, 2.1083984375, 2.28546142578125, 2.4625244140625, 2.63958740234375, 2.816650390625, 2.99371337890625, 3.1707763671875, 3.34783935546875, 3.52490234375, 3.70196533203125, 3.8790283203125, 4.05609130859375, 4.233154296875, 4.41021728515625, 4.5872802734375, 4.76434326171875, 4.94140625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 6.0, 7.0, 12.0, 26.0, 29.0, 51.0, 98.0, 180.0, 388.0, 1104.0, 4680.0, 41215.0, 882816.0, 107020.0, 8253.0, 1611.0, 541.0, 219.0, 136.0, 55.0, 44.0, 21.0, 10.0, 8.0, 6.0, 10.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2265625, -1.186553955078125, -1.14654541015625, -1.106536865234375, -1.0665283203125, -1.026519775390625, -0.98651123046875, -0.946502685546875, -0.906494140625, -0.866485595703125, -0.82647705078125, -0.786468505859375, -0.7464599609375, -0.706451416015625, -0.66644287109375, -0.626434326171875, -0.58642578125, -0.546417236328125, -0.50640869140625, -0.466400146484375, -0.4263916015625, -0.386383056640625, -0.34637451171875, -0.306365966796875, -0.266357421875, -0.226348876953125, -0.18634033203125, -0.146331787109375, -0.1063232421875, -0.066314697265625, -0.02630615234375, 0.013702392578125, 0.0537109375, 0.093719482421875, 0.13372802734375, 0.173736572265625, 0.2137451171875, 0.253753662109375, 0.29376220703125, 0.333770751953125, 0.373779296875, 0.413787841796875, 0.45379638671875, 0.493804931640625, 0.5338134765625, 0.573822021484375, 0.61383056640625, 0.653839111328125, 0.69384765625, 0.733856201171875, 0.77386474609375, 0.813873291015625, 0.8538818359375, 0.893890380859375, 0.93389892578125, 0.973907470703125, 1.013916015625, 1.053924560546875, 1.09393310546875, 1.133941650390625, 1.1739501953125, 1.213958740234375, 1.25396728515625, 1.293975830078125, 1.333984375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 5.0, 5.0, 4.0, 6.0, 9.0, 6.0, 6.0, 16.0, 18.0, 19.0, 28.0, 25.0, 41.0, 66.0, 75.0, 109.0, 135.0, 101.0, 81.0, 58.0, 39.0, 22.0, 24.0, 19.0, 15.0, 14.0, 13.0, 9.0, 6.0, 3.0, 2.0, 5.0, 3.0, 4.0, 2.0, 1.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00022077560424804688, -0.00021305307745933533, -0.00020533055067062378, -0.00019760802388191223, -0.00018988549709320068, -0.00018216297030448914, -0.0001744404435157776, -0.00016671791672706604, -0.0001589953899383545, -0.00015127286314964294, -0.0001435503363609314, -0.00013582780957221985, -0.0001281052827835083, -0.00012038275599479675, -0.0001126602292060852, -0.00010493770241737366, -9.721517562866211e-05, -8.949264883995056e-05, -8.177012205123901e-05, -7.404759526252747e-05, -6.632506847381592e-05, -5.860254168510437e-05, -5.088001489639282e-05, -4.3157488107681274e-05, -3.5434961318969727e-05, -2.771243453025818e-05, -1.998990774154663e-05, -1.2267380952835083e-05, -4.544854164123535e-06, 3.1776726245880127e-06, 1.090019941329956e-05, 1.862272620201111e-05, 2.6345252990722656e-05, 3.4067779779434204e-05, 4.179030656814575e-05, 4.95128333568573e-05, 5.723536014556885e-05, 6.49578869342804e-05, 7.268041372299194e-05, 8.040294051170349e-05, 8.812546730041504e-05, 9.584799408912659e-05, 0.00010357052087783813, 0.00011129304766654968, 0.00011901557445526123, 0.00012673810124397278, 0.00013446062803268433, 0.00014218315482139587, 0.00014990568161010742, 0.00015762820839881897, 0.00016535073518753052, 0.00017307326197624207, 0.0001807957887649536, 0.00018851831555366516, 0.0001962408423423767, 0.00020396336913108826, 0.0002116858959197998, 0.00021940842270851135, 0.0002271309494972229, 0.00023485347628593445, 0.000242576003074646, 0.00025029852986335754, 0.0002580210566520691, 0.00026574358344078064, 0.0002734661102294922]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 4.0, 6.0, 12.0, 21.0, 33.0, 68.0, 93.0, 200.0, 313.0, 692.0, 1590.0, 5277.0, 37293.0, 750037.0, 229287.0, 17825.0, 3404.0, 1152.0, 572.0, 291.0, 152.0, 88.0, 55.0, 32.0, 23.0, 18.0, 6.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.841796875, -0.8135833740234375, -0.785369873046875, -0.7571563720703125, -0.72894287109375, -0.7007293701171875, -0.672515869140625, -0.6443023681640625, -0.6160888671875, -0.5878753662109375, -0.559661865234375, -0.5314483642578125, -0.50323486328125, -0.4750213623046875, -0.446807861328125, -0.4185943603515625, -0.390380859375, -0.3621673583984375, -0.333953857421875, -0.3057403564453125, -0.27752685546875, -0.2493133544921875, -0.221099853515625, -0.1928863525390625, -0.1646728515625, -0.1364593505859375, -0.108245849609375, -0.0800323486328125, -0.05181884765625, -0.0236053466796875, 0.004608154296875, 0.0328216552734375, 0.06103515625, 0.0892486572265625, 0.117462158203125, 0.1456756591796875, 0.17388916015625, 0.2021026611328125, 0.230316162109375, 0.2585296630859375, 0.2867431640625, 0.3149566650390625, 0.343170166015625, 0.3713836669921875, 0.39959716796875, 0.4278106689453125, 0.456024169921875, 0.4842376708984375, 0.512451171875, 0.5406646728515625, 0.568878173828125, 0.5970916748046875, 0.62530517578125, 0.6535186767578125, 0.681732177734375, 0.7099456787109375, 0.7381591796875, 0.7663726806640625, 0.794586181640625, 0.8227996826171875, 0.85101318359375, 0.8792266845703125, 0.907440185546875, 0.9356536865234375, 0.9638671875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 4.0, 3.0, 5.0, 2.0, 6.0, 10.0, 17.0, 17.0, 26.0, 22.0, 24.0, 46.0, 52.0, 77.0, 88.0, 89.0, 82.0, 67.0, 63.0, 67.0, 50.0, 44.0, 32.0, 23.0, 19.0, 16.0, 18.0, 10.0, 11.0, 10.0, 0.0, 1.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.74951171875, -0.725616455078125, -0.70172119140625, -0.677825927734375, -0.6539306640625, -0.630035400390625, -0.60614013671875, -0.582244873046875, -0.558349609375, -0.534454345703125, -0.51055908203125, -0.486663818359375, -0.4627685546875, -0.438873291015625, -0.41497802734375, -0.391082763671875, -0.3671875, -0.343292236328125, -0.31939697265625, -0.295501708984375, -0.2716064453125, -0.247711181640625, -0.22381591796875, -0.199920654296875, -0.176025390625, -0.152130126953125, -0.12823486328125, -0.104339599609375, -0.0804443359375, -0.056549072265625, -0.03265380859375, -0.008758544921875, 0.01513671875, 0.039031982421875, 0.06292724609375, 0.086822509765625, 0.1107177734375, 0.134613037109375, 0.15850830078125, 0.182403564453125, 0.206298828125, 0.230194091796875, 0.25408935546875, 0.277984619140625, 0.3018798828125, 0.325775146484375, 0.34967041015625, 0.373565673828125, 0.3974609375, 0.421356201171875, 0.44525146484375, 0.469146728515625, 0.4930419921875, 0.516937255859375, 0.54083251953125, 0.564727783203125, 0.588623046875, 0.612518310546875, 0.63641357421875, 0.660308837890625, 0.6842041015625, 0.708099365234375, 0.73199462890625, 0.755889892578125, 0.77978515625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 10.0, 7.0, 18.0, 73.0, 174.0, 474.0, 148.0, 52.0, 26.0, 7.0, 6.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.35542678833008, -37.32943344116211, -36.303436279296875, -35.277442932128906, -34.25144958496094, -33.22545623779297, -32.199459075927734, -31.173465728759766, -30.147472381591797, -29.121477127075195, -28.095483779907227, -27.069488525390625, -26.043495178222656, -25.017499923706055, -23.991504669189453, -22.965511322021484, -21.939516067504883, -20.91352081298828, -19.887527465820312, -18.86153221130371, -17.835538864135742, -16.80954360961914, -15.783549308776855, -14.75755500793457, -13.731560707092285, -12.70556640625, -11.679572105407715, -10.65357780456543, -9.627582550048828, -8.60158920288086, -7.575593948364258, -6.549599647521973, -5.52360725402832, -4.497612953186035, -3.471618413925171, -2.4456238746643066, -1.4196295738220215, -0.39363527297973633, 0.632359504699707, 1.6583538055419922, 2.6843481063842773, 3.7103424072265625, 4.736336708068848, 5.762331485748291, 6.788325786590576, 7.814320087432861, 8.840314865112305, 9.86630916595459, 10.892303466796875, 11.91829776763916, 12.944292068481445, 13.970287322998047, 14.996280670166016, 16.022275924682617, 17.04827117919922, 18.074264526367188, 19.100257873535156, 20.126253128051758, 21.152246475219727, 22.178241729736328, 23.204235076904297, 24.2302303314209, 25.2562255859375, 26.28221893310547, 27.30821418762207]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 9.0, 7.0, 7.0, 9.0, 8.0, 9.0, 18.0, 13.0, 23.0, 26.0, 19.0, 28.0, 36.0, 31.0, 29.0, 52.0, 132.0, 158.0, 69.0, 44.0, 39.0, 36.0, 22.0, 27.0, 31.0, 23.0, 31.0, 10.0, 14.0, 8.0, 9.0, 3.0, 7.0, 6.0, 3.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-19.00809669494629, -18.48225212097168, -17.956409454345703, -17.430564880371094, -16.904720306396484, -16.378877639770508, -15.853033065795898, -15.327189445495605, -14.801345825195312, -14.27550220489502, -13.749658584594727, -13.223814010620117, -12.697970390319824, -12.172126770019531, -11.646282196044922, -11.120438575744629, -10.594594955444336, -10.068751335144043, -9.54290771484375, -9.01706314086914, -8.491219520568848, -7.965375900268555, -7.4395318031311035, -6.913687705993652, -6.387844085693359, -5.862000465393066, -5.336156368255615, -4.810312271118164, -4.284468650817871, -3.758624792098999, -3.232780933380127, -2.706937074661255, -2.1810951232910156, -1.6552512645721436, -1.1294074058532715, -0.6035635471343994, -0.07771968841552734, 0.4481241703033447, 0.9739680290222168, 1.4998118877410889, 2.025655746459961, 2.551499605178833, 3.077343463897705, 3.603187322616577, 4.129031181335449, 4.654874801635742, 5.180718898773193, 5.7065629959106445, 6.2324066162109375, 6.7582502365112305, 7.284094333648682, 7.809938430786133, 8.335782051086426, 8.861625671386719, 9.387470245361328, 9.913313865661621, 10.439157485961914, 10.965001106262207, 11.4908447265625, 12.01668930053711, 12.542532920837402, 13.068376541137695, 13.594221115112305, 14.120064735412598, 14.64590835571289]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 9.0, 17.0, 13.0, 29.0, 60.0, 101.0, 196.0, 337.0, 643.0, 1325.0, 3096.0, 10929.0, 66652.0, 811823.0, 2615823.0, 612108.0, 55682.0, 9835.0, 3229.0, 1214.0, 581.0, 301.0, 127.0, 76.0, 47.0, 22.0, 9.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.13671875, -3.06768798828125, -2.9986572265625, -2.92962646484375, -2.860595703125, -2.79156494140625, -2.7225341796875, -2.65350341796875, -2.58447265625, -2.51544189453125, -2.4464111328125, -2.37738037109375, -2.308349609375, -2.23931884765625, -2.1702880859375, -2.10125732421875, -2.0322265625, -1.96319580078125, -1.8941650390625, -1.82513427734375, -1.756103515625, -1.68707275390625, -1.6180419921875, -1.54901123046875, -1.47998046875, -1.41094970703125, -1.3419189453125, -1.27288818359375, -1.203857421875, -1.13482666015625, -1.0657958984375, -0.99676513671875, -0.927734375, -0.85870361328125, -0.7896728515625, -0.72064208984375, -0.651611328125, -0.58258056640625, -0.5135498046875, -0.44451904296875, -0.37548828125, -0.30645751953125, -0.2374267578125, -0.16839599609375, -0.099365234375, -0.03033447265625, 0.0386962890625, 0.10772705078125, 0.1767578125, 0.24578857421875, 0.3148193359375, 0.38385009765625, 0.452880859375, 0.52191162109375, 0.5909423828125, 0.65997314453125, 0.72900390625, 0.79803466796875, 0.8670654296875, 0.93609619140625, 1.005126953125, 1.07415771484375, 1.1431884765625, 1.21221923828125, 1.28125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 3.0, 4.0, 10.0, 5.0, 18.0, 14.0, 20.0, 27.0, 41.0, 40.0, 41.0, 56.0, 58.0, 56.0, 61.0, 63.0, 63.0, 63.0, 67.0, 64.0, 45.0, 36.0, 39.0, 32.0, 25.0, 19.0, 7.0, 16.0, 4.0, 9.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.88671875, -1.8377838134765625, -1.788848876953125, -1.7399139404296875, -1.69097900390625, -1.6420440673828125, -1.593109130859375, -1.5441741943359375, -1.4952392578125, -1.4463043212890625, -1.397369384765625, -1.3484344482421875, -1.29949951171875, -1.2505645751953125, -1.201629638671875, -1.1526947021484375, -1.103759765625, -1.0548248291015625, -1.005889892578125, -0.9569549560546875, -0.90802001953125, -0.8590850830078125, -0.810150146484375, -0.7612152099609375, -0.7122802734375, -0.6633453369140625, -0.614410400390625, -0.5654754638671875, -0.51654052734375, -0.4676055908203125, -0.418670654296875, -0.3697357177734375, -0.32080078125, -0.2718658447265625, -0.222930908203125, -0.1739959716796875, -0.12506103515625, -0.0761260986328125, -0.027191162109375, 0.0217437744140625, 0.0706787109375, 0.1196136474609375, 0.168548583984375, 0.2174835205078125, 0.26641845703125, 0.3153533935546875, 0.364288330078125, 0.4132232666015625, 0.462158203125, 0.5110931396484375, 0.560028076171875, 0.6089630126953125, 0.65789794921875, 0.7068328857421875, 0.755767822265625, 0.8047027587890625, 0.8536376953125, 0.9025726318359375, 0.951507568359375, 1.0004425048828125, 1.04937744140625, 1.0983123779296875, 1.147247314453125, 1.1961822509765625, 1.2451171875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 10.0, 8.0, 9.0, 16.0, 21.0, 39.0, 88.0, 129.0, 278.0, 729.0, 2255.0, 19101.0, 4094836.0, 71924.0, 3331.0, 827.0, 298.0, 165.0, 95.0, 40.0, 20.0, 17.0, 18.0, 5.0, 6.0, 2.0, 4.0, 1.0, 3.0, 1.0, 3.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.9609375, -7.662353515625, -7.36376953125, -7.065185546875, -6.7666015625, -6.468017578125, -6.16943359375, -5.870849609375, -5.572265625, -5.273681640625, -4.97509765625, -4.676513671875, -4.3779296875, -4.079345703125, -3.78076171875, -3.482177734375, -3.18359375, -2.885009765625, -2.58642578125, -2.287841796875, -1.9892578125, -1.690673828125, -1.39208984375, -1.093505859375, -0.794921875, -0.496337890625, -0.19775390625, 0.100830078125, 0.3994140625, 0.697998046875, 0.99658203125, 1.295166015625, 1.59375, 1.892333984375, 2.19091796875, 2.489501953125, 2.7880859375, 3.086669921875, 3.38525390625, 3.683837890625, 3.982421875, 4.281005859375, 4.57958984375, 4.878173828125, 5.1767578125, 5.475341796875, 5.77392578125, 6.072509765625, 6.37109375, 6.669677734375, 6.96826171875, 7.266845703125, 7.5654296875, 7.864013671875, 8.16259765625, 8.461181640625, 8.759765625, 9.058349609375, 9.35693359375, 9.655517578125, 9.9541015625, 10.252685546875, 10.55126953125, 10.849853515625, 11.1484375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 10.0, 12.0, 15.0, 23.0, 54.0, 69.0, 97.0, 188.0, 336.0, 720.0, 1135.0, 704.0, 316.0, 178.0, 92.0, 52.0, 33.0, 10.0, 8.0, 11.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.5859375, -6.41021728515625, -6.2344970703125, -6.05877685546875, -5.883056640625, -5.70733642578125, -5.5316162109375, -5.35589599609375, -5.18017578125, -5.00445556640625, -4.8287353515625, -4.65301513671875, -4.477294921875, -4.30157470703125, -4.1258544921875, -3.95013427734375, -3.7744140625, -3.59869384765625, -3.4229736328125, -3.24725341796875, -3.071533203125, -2.89581298828125, -2.7200927734375, -2.54437255859375, -2.36865234375, -2.19293212890625, -2.0172119140625, -1.84149169921875, -1.665771484375, -1.49005126953125, -1.3143310546875, -1.13861083984375, -0.962890625, -0.78717041015625, -0.6114501953125, -0.43572998046875, -0.260009765625, -0.08428955078125, 0.0914306640625, 0.26715087890625, 0.44287109375, 0.61859130859375, 0.7943115234375, 0.97003173828125, 1.145751953125, 1.32147216796875, 1.4971923828125, 1.67291259765625, 1.8486328125, 2.02435302734375, 2.2000732421875, 2.37579345703125, 2.551513671875, 2.72723388671875, 2.9029541015625, 3.07867431640625, 3.25439453125, 3.43011474609375, 3.6058349609375, 3.78155517578125, 3.957275390625, 4.13299560546875, 4.3087158203125, 4.48443603515625, 4.66015625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 1.0, 1.0, 6.0, 2.0, 3.0, 4.0, 8.0, 10.0, 12.0, 32.0, 73.0, 149.0, 262.0, 268.0, 95.0, 44.0, 14.0, 7.0, 5.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0], "bins": [-90.1289291381836, -88.39374542236328, -86.6585693359375, -84.92338562011719, -83.1882095336914, -81.4530258178711, -79.71784973144531, -77.982666015625, -76.24748992919922, -74.5123062133789, -72.77713012695312, -71.04194641113281, -69.30677032470703, -67.57158660888672, -65.83641052246094, -64.10122680664062, -62.36604690551758, -60.63086700439453, -58.895687103271484, -57.16050720214844, -55.42532730102539, -53.690147399902344, -51.95496368408203, -50.21978759765625, -48.48460388183594, -46.74942398071289, -45.014244079589844, -43.2790641784668, -41.54388427734375, -39.8087043762207, -38.073524475097656, -36.338340759277344, -34.60316467285156, -32.867984771728516, -31.13280487060547, -29.397624969482422, -27.662445068359375, -25.927265167236328, -24.19208335876465, -22.4569034576416, -20.721725463867188, -18.98654556274414, -17.251365661621094, -15.51618480682373, -13.781004905700684, -12.045825004577637, -10.310644149780273, -8.575464248657227, -6.84028434753418, -5.105104446411133, -3.3699240684509277, -1.6347436904907227, 0.10043621063232422, 1.835616111755371, 3.5707969665527344, 5.305976867675781, 7.041156768798828, 8.776336669921875, 10.511516571044922, 12.246697425842285, 13.981877326965332, 15.717057228088379, 17.452238082885742, 19.18741798400879, 20.922597885131836]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 6.0, 4.0, 4.0, 6.0, 9.0, 15.0, 12.0, 31.0, 24.0, 52.0, 49.0, 53.0, 75.0, 95.0, 97.0, 66.0, 70.0, 62.0, 55.0, 46.0, 39.0, 28.0, 34.0, 23.0, 15.0, 8.0, 14.0, 7.0, 6.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.352680206298828, -26.396947860717773, -25.441213607788086, -24.48548126220703, -23.529748916625977, -22.574016571044922, -21.618282318115234, -20.66254997253418, -19.706817626953125, -18.75108528137207, -17.795351028442383, -16.839618682861328, -15.883886337280273, -14.928153038024902, -13.972419738769531, -13.016687393188477, -12.060954093933105, -11.105220794677734, -10.14948844909668, -9.193755149841309, -8.238022804260254, -7.282289505004883, -6.32655668258667, -5.370823860168457, -4.415091037750244, -3.4593582153320312, -2.5036253929138184, -1.5478923320770264, -0.5921595096588135, 0.3635735511779785, 1.3193063735961914, 2.2750391960144043, 3.230772018432617, 4.18650484085083, 5.142237663269043, 6.097970962524414, 7.053703308105469, 8.00943660736084, 8.965169906616211, 9.920902252197266, 10.87663459777832, 11.832367897033691, 12.788100242614746, 13.743833541870117, 14.699565887451172, 15.655299186706543, 16.611032485961914, 17.56676483154297, 18.522499084472656, 19.47823143005371, 20.4339656829834, 21.389698028564453, 22.345430374145508, 23.301162719726562, 24.25689697265625, 25.212629318237305, 26.16836166381836, 27.124094009399414, 28.0798282623291, 29.035560607910156, 29.99129295349121, 30.947025299072266, 31.902759552001953, 32.858489990234375, 33.81422424316406]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 6.0, 7.0, 5.0, 6.0, 14.0, 22.0, 34.0, 58.0, 106.0, 188.0, 321.0, 705.0, 1302.0, 3241.0, 9747.0, 41672.0, 417229.0, 510913.0, 46102.0, 10518.0, 3387.0, 1433.0, 654.0, 377.0, 204.0, 133.0, 65.0, 29.0, 25.0, 20.0, 8.0, 9.0, 6.0, 6.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.625, -3.521514892578125, -3.41802978515625, -3.314544677734375, -3.2110595703125, -3.107574462890625, -3.00408935546875, -2.900604248046875, -2.797119140625, -2.693634033203125, -2.59014892578125, -2.486663818359375, -2.3831787109375, -2.279693603515625, -2.17620849609375, -2.072723388671875, -1.96923828125, -1.865753173828125, -1.76226806640625, -1.658782958984375, -1.5552978515625, -1.451812744140625, -1.34832763671875, -1.244842529296875, -1.141357421875, -1.037872314453125, -0.93438720703125, -0.830902099609375, -0.7274169921875, -0.623931884765625, -0.52044677734375, -0.416961669921875, -0.3134765625, -0.209991455078125, -0.10650634765625, -0.003021240234375, 0.1004638671875, 0.203948974609375, 0.30743408203125, 0.410919189453125, 0.514404296875, 0.617889404296875, 0.72137451171875, 0.824859619140625, 0.9283447265625, 1.031829833984375, 1.13531494140625, 1.238800048828125, 1.34228515625, 1.445770263671875, 1.54925537109375, 1.652740478515625, 1.7562255859375, 1.859710693359375, 1.96319580078125, 2.066680908203125, 2.170166015625, 2.273651123046875, 2.37713623046875, 2.480621337890625, 2.5841064453125, 2.687591552734375, 2.79107666015625, 2.894561767578125, 2.998046875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 11.0, 10.0, 10.0, 28.0, 31.0, 28.0, 46.0, 51.0, 56.0, 71.0, 83.0, 75.0, 87.0, 85.0, 74.0, 57.0, 47.0, 34.0, 38.0, 32.0, 18.0, 7.0, 9.0, 9.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.12109375, -2.052093505859375, -1.98309326171875, -1.914093017578125, -1.8450927734375, -1.776092529296875, -1.70709228515625, -1.638092041015625, -1.569091796875, -1.500091552734375, -1.43109130859375, -1.362091064453125, -1.2930908203125, -1.224090576171875, -1.15509033203125, -1.086090087890625, -1.01708984375, -0.948089599609375, -0.87908935546875, -0.810089111328125, -0.7410888671875, -0.672088623046875, -0.60308837890625, -0.534088134765625, -0.465087890625, -0.396087646484375, -0.32708740234375, -0.258087158203125, -0.1890869140625, -0.120086669921875, -0.05108642578125, 0.017913818359375, 0.0869140625, 0.155914306640625, 0.22491455078125, 0.293914794921875, 0.3629150390625, 0.431915283203125, 0.50091552734375, 0.569915771484375, 0.638916015625, 0.707916259765625, 0.77691650390625, 0.845916748046875, 0.9149169921875, 0.983917236328125, 1.05291748046875, 1.121917724609375, 1.19091796875, 1.259918212890625, 1.32891845703125, 1.397918701171875, 1.4669189453125, 1.535919189453125, 1.60491943359375, 1.673919677734375, 1.742919921875, 1.811920166015625, 1.88092041015625, 1.949920654296875, 2.0189208984375, 2.087921142578125, 2.15692138671875, 2.225921630859375, 2.294921875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 0.0, 3.0, 1.0, 2.0, 4.0, 3.0, 5.0, 9.0, 7.0, 14.0, 16.0, 11.0, 26.0, 32.0, 44.0, 54.0, 73.0, 105.0, 145.0, 218.0, 351.0, 633.0, 1421.0, 3740.0, 14948.0, 120249.0, 858540.0, 36342.0, 7054.0, 2254.0, 915.0, 460.0, 271.0, 180.0, 117.0, 81.0, 63.0, 48.0, 24.0, 22.0, 16.0, 13.0, 13.0, 10.0, 6.0, 5.0, 6.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.12109375, -3.0242919921875, -2.927490234375, -2.8306884765625, -2.73388671875, -2.6370849609375, -2.540283203125, -2.4434814453125, -2.3466796875, -2.2498779296875, -2.153076171875, -2.0562744140625, -1.95947265625, -1.8626708984375, -1.765869140625, -1.6690673828125, -1.572265625, -1.4754638671875, -1.378662109375, -1.2818603515625, -1.18505859375, -1.0882568359375, -0.991455078125, -0.8946533203125, -0.7978515625, -0.7010498046875, -0.604248046875, -0.5074462890625, -0.41064453125, -0.3138427734375, -0.217041015625, -0.1202392578125, -0.0234375, 0.0733642578125, 0.170166015625, 0.2669677734375, 0.36376953125, 0.4605712890625, 0.557373046875, 0.6541748046875, 0.7509765625, 0.8477783203125, 0.944580078125, 1.0413818359375, 1.13818359375, 1.2349853515625, 1.331787109375, 1.4285888671875, 1.525390625, 1.6221923828125, 1.718994140625, 1.8157958984375, 1.91259765625, 2.0093994140625, 2.106201171875, 2.2030029296875, 2.2998046875, 2.3966064453125, 2.493408203125, 2.5902099609375, 2.68701171875, 2.7838134765625, 2.880615234375, 2.9774169921875, 3.07421875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 5.0, 6.0, 5.0, 6.0, 5.0, 9.0, 11.0, 11.0, 17.0, 18.0, 17.0, 20.0, 35.0, 32.0, 38.0, 45.0, 45.0, 68.0, 67.0, 97.0, 65.0, 55.0, 49.0, 51.0, 40.0, 28.0, 26.0, 18.0, 25.0, 19.0, 14.0, 9.0, 13.0, 9.0, 7.0, 7.0, 3.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.87890625, -5.69683837890625, -5.5147705078125, -5.33270263671875, -5.150634765625, -4.96856689453125, -4.7864990234375, -4.60443115234375, -4.42236328125, -4.24029541015625, -4.0582275390625, -3.87615966796875, -3.694091796875, -3.51202392578125, -3.3299560546875, -3.14788818359375, -2.9658203125, -2.78375244140625, -2.6016845703125, -2.41961669921875, -2.237548828125, -2.05548095703125, -1.8734130859375, -1.69134521484375, -1.50927734375, -1.32720947265625, -1.1451416015625, -0.96307373046875, -0.781005859375, -0.59893798828125, -0.4168701171875, -0.23480224609375, -0.052734375, 0.12933349609375, 0.3114013671875, 0.49346923828125, 0.675537109375, 0.85760498046875, 1.0396728515625, 1.22174072265625, 1.40380859375, 1.58587646484375, 1.7679443359375, 1.95001220703125, 2.132080078125, 2.31414794921875, 2.4962158203125, 2.67828369140625, 2.8603515625, 3.04241943359375, 3.2244873046875, 3.40655517578125, 3.588623046875, 3.77069091796875, 3.9527587890625, 4.13482666015625, 4.31689453125, 4.49896240234375, 4.6810302734375, 4.86309814453125, 5.045166015625, 5.22723388671875, 5.4093017578125, 5.59136962890625, 5.7734375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 9.0, 5.0, 4.0, 3.0, 11.0, 11.0, 21.0, 21.0, 23.0, 40.0, 75.0, 112.0, 206.0, 319.0, 774.0, 2009.0, 5594.0, 20387.0, 148587.0, 821344.0, 35520.0, 8402.0, 2786.0, 1116.0, 491.0, 247.0, 152.0, 89.0, 60.0, 42.0, 29.0, 23.0, 13.0, 11.0, 9.0, 3.0, 7.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.70263671875, -0.6842308044433594, -0.6658248901367188, -0.6474189758300781, -0.6290130615234375, -0.6106071472167969, -0.5922012329101562, -0.5737953186035156, -0.555389404296875, -0.5369834899902344, -0.5185775756835938, -0.5001716613769531, -0.4817657470703125, -0.4633598327636719, -0.44495391845703125, -0.4265480041503906, -0.40814208984375, -0.3897361755371094, -0.37133026123046875, -0.3529243469238281, -0.3345184326171875, -0.3161125183105469, -0.29770660400390625, -0.2793006896972656, -0.260894775390625, -0.24248886108398438, -0.22408294677734375, -0.20567703247070312, -0.1872711181640625, -0.16886520385742188, -0.15045928955078125, -0.13205337524414062, -0.1136474609375, -0.09524154663085938, -0.07683563232421875, -0.058429718017578125, -0.0400238037109375, -0.021617889404296875, -0.00321197509765625, 0.015193939208984375, 0.033599853515625, 0.052005767822265625, 0.07041168212890625, 0.08881759643554688, 0.1072235107421875, 0.12562942504882812, 0.14403533935546875, 0.16244125366210938, 0.18084716796875, 0.19925308227539062, 0.21765899658203125, 0.23606491088867188, 0.2544708251953125, 0.2728767395019531, 0.29128265380859375, 0.3096885681152344, 0.328094482421875, 0.3465003967285156, 0.36490631103515625, 0.3833122253417969, 0.4017181396484375, 0.4201240539550781, 0.43852996826171875, 0.4569358825683594, 0.475341796875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 1.0, 4.0, 7.0, 7.0, 6.0, 8.0, 10.0, 16.0, 25.0, 17.0, 35.0, 39.0, 57.0, 87.0, 116.0, 156.0, 115.0, 77.0, 44.0, 48.0, 31.0, 37.0, 18.0, 9.0, 8.0, 7.0, 6.0, 4.0, 3.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002295970916748047, -0.00022292137145996094, -0.0002162456512451172, -0.00020956993103027344, -0.0002028942108154297, -0.00019621849060058594, -0.0001895427703857422, -0.00018286705017089844, -0.0001761913299560547, -0.00016951560974121094, -0.0001628398895263672, -0.00015616416931152344, -0.0001494884490966797, -0.00014281272888183594, -0.0001361370086669922, -0.00012946128845214844, -0.0001227855682373047, -0.00011610984802246094, -0.00010943412780761719, -0.00010275840759277344, -9.608268737792969e-05, -8.940696716308594e-05, -8.273124694824219e-05, -7.605552673339844e-05, -6.937980651855469e-05, -6.270408630371094e-05, -5.602836608886719e-05, -4.935264587402344e-05, -4.267692565917969e-05, -3.600120544433594e-05, -2.9325485229492188e-05, -2.2649765014648438e-05, -1.5974044799804688e-05, -9.298324584960938e-06, -2.6226043701171875e-06, 4.0531158447265625e-06, 1.0728836059570312e-05, 1.7404556274414062e-05, 2.4080276489257812e-05, 3.075599670410156e-05, 3.743171691894531e-05, 4.410743713378906e-05, 5.078315734863281e-05, 5.745887756347656e-05, 6.413459777832031e-05, 7.081031799316406e-05, 7.748603820800781e-05, 8.416175842285156e-05, 9.083747863769531e-05, 9.751319885253906e-05, 0.00010418891906738281, 0.00011086463928222656, 0.00011754035949707031, 0.00012421607971191406, 0.0001308917999267578, 0.00013756752014160156, 0.0001442432403564453, 0.00015091896057128906, 0.0001575946807861328, 0.00016427040100097656, 0.0001709461212158203, 0.00017762184143066406, 0.0001842975616455078, 0.00019097328186035156, 0.0001976490020751953]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 4.0, 8.0, 4.0, 6.0, 16.0, 17.0, 24.0, 36.0, 50.0, 51.0, 88.0, 117.0, 181.0, 222.0, 337.0, 541.0, 897.0, 1489.0, 2840.0, 5894.0, 14164.0, 45556.0, 734559.0, 185783.0, 33396.0, 11405.0, 4913.0, 2424.0, 1287.0, 771.0, 467.0, 308.0, 195.0, 139.0, 105.0, 73.0, 44.0, 36.0, 26.0, 19.0, 20.0, 7.0, 8.0, 6.0, 5.0, 5.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0], "bins": [-0.35986328125, -0.3489189147949219, -0.33797454833984375, -0.3270301818847656, -0.3160858154296875, -0.3051414489746094, -0.29419708251953125, -0.2832527160644531, -0.272308349609375, -0.2613639831542969, -0.25041961669921875, -0.23947525024414062, -0.2285308837890625, -0.21758651733398438, -0.20664215087890625, -0.19569778442382812, -0.18475341796875, -0.17380905151367188, -0.16286468505859375, -0.15192031860351562, -0.1409759521484375, -0.13003158569335938, -0.11908721923828125, -0.10814285278320312, -0.097198486328125, -0.08625411987304688, -0.07530975341796875, -0.06436538696289062, -0.0534210205078125, -0.042476654052734375, -0.03153228759765625, -0.020587921142578125, -0.0096435546875, 0.001300811767578125, 0.01224517822265625, 0.023189544677734375, 0.0341339111328125, 0.045078277587890625, 0.05602264404296875, 0.06696701049804688, 0.077911376953125, 0.08885574340820312, 0.09980010986328125, 0.11074447631835938, 0.1216888427734375, 0.13263320922851562, 0.14357757568359375, 0.15452194213867188, 0.16546630859375, 0.17641067504882812, 0.18735504150390625, 0.19829940795898438, 0.2092437744140625, 0.22018814086914062, 0.23113250732421875, 0.24207687377929688, 0.253021240234375, 0.2639656066894531, 0.27490997314453125, 0.2858543395996094, 0.2967987060546875, 0.3077430725097656, 0.31868743896484375, 0.3296318054199219, 0.340576171875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 3.0, 4.0, 4.0, 4.0, 3.0, 9.0, 8.0, 11.0, 19.0, 14.0, 24.0, 33.0, 60.0, 64.0, 76.0, 104.0, 105.0, 119.0, 97.0, 58.0, 44.0, 34.0, 20.0, 25.0, 26.0, 7.0, 8.0, 7.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.6376953125, -0.6215972900390625, -0.605499267578125, -0.5894012451171875, -0.57330322265625, -0.5572052001953125, -0.541107177734375, -0.5250091552734375, -0.5089111328125, -0.4928131103515625, -0.476715087890625, -0.4606170654296875, -0.44451904296875, -0.4284210205078125, -0.412322998046875, -0.3962249755859375, -0.380126953125, -0.3640289306640625, -0.347930908203125, -0.3318328857421875, -0.31573486328125, -0.2996368408203125, -0.283538818359375, -0.2674407958984375, -0.2513427734375, -0.2352447509765625, -0.219146728515625, -0.2030487060546875, -0.18695068359375, -0.1708526611328125, -0.154754638671875, -0.1386566162109375, -0.12255859375, -0.1064605712890625, -0.090362548828125, -0.0742645263671875, -0.05816650390625, -0.0420684814453125, -0.025970458984375, -0.0098724365234375, 0.0062255859375, 0.0223236083984375, 0.038421630859375, 0.0545196533203125, 0.07061767578125, 0.0867156982421875, 0.102813720703125, 0.1189117431640625, 0.135009765625, 0.1511077880859375, 0.167205810546875, 0.1833038330078125, 0.19940185546875, 0.2154998779296875, 0.231597900390625, 0.2476959228515625, 0.2637939453125, 0.2798919677734375, 0.295989990234375, 0.3120880126953125, 0.32818603515625, 0.3442840576171875, 0.360382080078125, 0.3764801025390625, 0.392578125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 8.0, 17.0, 41.0, 86.0, 586.0, 148.0, 64.0, 35.0, 13.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.19683837890625, -59.010616302490234, -57.82439422607422, -56.63816833496094, -55.45194625854492, -54.265724182128906, -53.07950210571289, -51.893280029296875, -50.70705795288086, -49.520835876464844, -48.33461380004883, -47.14839172363281, -45.96216583251953, -44.775943756103516, -43.5897216796875, -42.403499603271484, -41.21727752685547, -40.03105545043945, -38.84483337402344, -37.658607482910156, -36.47238540649414, -35.286163330078125, -34.09994125366211, -32.913719177246094, -31.727493286132812, -30.541271209716797, -29.35504722595215, -28.168825149536133, -26.982603073120117, -25.79637908935547, -24.610157012939453, -23.423934936523438, -22.237714767456055, -21.05149269104004, -19.86526870727539, -18.679046630859375, -17.49282455444336, -16.306602478027344, -15.120378494262695, -13.93415641784668, -12.747933387756348, -11.561710357666016, -10.37548828125, -9.189265251159668, -8.003042221069336, -6.81682014465332, -5.630597114562988, -4.444375038146973, -3.2581520080566406, -2.071929454803467, -0.8857066631317139, 0.30051612854003906, 1.486738681793213, 2.6729612350463867, 3.8591842651367188, 5.045406341552734, 6.231629371643066, 7.41785192489624, 8.604074478149414, 9.790297508239746, 10.976520538330078, 12.162742614746094, 13.348965644836426, 14.535187721252441, 15.721410751342773]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 3.0, 6.0, 11.0, 16.0, 16.0, 26.0, 31.0, 35.0, 52.0, 112.0, 423.0, 76.0, 48.0, 37.0, 44.0, 28.0, 16.0, 10.0, 6.0, 6.0, 7.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.350799560546875, -42.39469909667969, -41.4385986328125, -40.48249816894531, -39.526397705078125, -38.57029724121094, -37.61419677734375, -36.65809631347656, -35.70199203491211, -34.74589157104492, -33.789791107177734, -32.83369064331055, -31.877588272094727, -30.92148780822754, -29.96538734436035, -29.009286880493164, -28.05318832397461, -27.097087860107422, -26.140987396240234, -25.184886932373047, -24.228784561157227, -23.27268409729004, -22.31658363342285, -21.360483169555664, -20.404380798339844, -19.448280334472656, -18.49217987060547, -17.53607940673828, -16.57997703552246, -15.623876571655273, -14.667776107788086, -13.711675643920898, -12.755575180053711, -11.799474716186523, -10.84337329864502, -9.887272834777832, -8.931172370910645, -7.975071430206299, -7.018970489501953, -6.062870025634766, -5.10676908493042, -4.150668144226074, -3.1945676803588867, -2.238466739654541, -1.2823660373687744, -0.3262653350830078, 0.6298356056213379, 1.5859360694885254, 2.542037010192871, 3.4981377124786377, 4.454238414764404, 5.41033935546875, 6.3664398193359375, 7.322540760040283, 8.278641700744629, 9.234742164611816, 10.19084358215332, 11.146944046020508, 12.103045463562012, 13.0591459274292, 14.015246391296387, 14.97134780883789, 15.927448272705078, 16.883548736572266, 17.839649200439453]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 5.0, 5.0, 9.0, 8.0, 8.0, 9.0, 17.0, 20.0, 27.0, 24.0, 44.0, 52.0, 102.0, 293.0, 118.0, 44.0, 37.0, 42.0, 31.0, 31.0, 18.0, 19.0, 15.0, 13.0, 6.0, 6.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-2.525390625, -2.467254638671875, -2.40911865234375, -2.350982666015625, -2.2928466796875, -2.234710693359375, -2.17657470703125, -2.118438720703125, -2.060302734375, -2.002166748046875, -1.94403076171875, -1.885894775390625, -1.8277587890625, -1.769622802734375, -1.71148681640625, -1.653350830078125, -1.59521484375, -1.537078857421875, -1.47894287109375, -1.420806884765625, -1.3626708984375, -1.304534912109375, -1.24639892578125, -1.188262939453125, -1.130126953125, -1.071990966796875, -1.01385498046875, -0.955718994140625, -0.8975830078125, -0.839447021484375, -0.78131103515625, -0.723175048828125, -0.6650390625, -0.606903076171875, -0.54876708984375, -0.490631103515625, -0.4324951171875, -0.374359130859375, -0.31622314453125, -0.258087158203125, -0.199951171875, -0.141815185546875, -0.08367919921875, -0.025543212890625, 0.0325927734375, 0.090728759765625, 0.14886474609375, 0.207000732421875, 0.26513671875, 0.323272705078125, 0.38140869140625, 0.439544677734375, 0.4976806640625, 0.555816650390625, 0.61395263671875, 0.672088623046875, 0.730224609375, 0.788360595703125, 0.84649658203125, 0.904632568359375, 0.9627685546875, 1.020904541015625, 1.07904052734375, 1.137176513671875, 1.1953125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 11.0, 1.0, 0.0, 5.0, 2.0, 5.0, 13.0, 8.0, 6.0, 42.0, 65.0, 98.0, 323.0, 7154.0, 8378349.0, 2063.0, 244.0, 61.0, 45.0, 20.0, 23.0, 11.0, 4.0, 3.0, 9.0, 11.0, 2.0, 9.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0], "bins": [-35.27680587768555, -34.074520111083984, -32.872230529785156, -31.669944763183594, -30.46765899658203, -29.265371322631836, -28.06308364868164, -26.860797882080078, -25.658510208129883, -24.456222534179688, -23.253936767578125, -22.05164909362793, -20.849361419677734, -19.647075653076172, -18.444787979125977, -17.24250030517578, -16.04021453857422, -14.83792781829834, -13.635641098022461, -12.433353424072266, -11.231066703796387, -10.028779983520508, -8.826492309570312, -7.624205589294434, -6.421918869018555, -5.219632148742676, -4.017344951629639, -2.8150579929351807, -1.6127710342407227, -0.41048431396484375, 0.7918028831481934, 1.9940900802612305, 3.196380615234375, 4.398667335510254, 5.600954532623291, 6.803241729736328, 8.005528450012207, 9.207815170288086, 10.410102844238281, 11.61238956451416, 12.814676284790039, 14.016963005065918, 15.219249725341797, 16.421537399291992, 17.623825073242188, 18.82611083984375, 20.028398513793945, 21.23068618774414, 22.432971954345703, 23.6352596282959, 24.83754539489746, 26.039833068847656, 27.24211883544922, 28.444406509399414, 29.64669418334961, 30.848979949951172, 32.05126953125, 33.25355529785156, 34.45584487915039, 35.65813064575195, 36.860416412353516, 38.062705993652344, 39.264991760253906, 40.46727752685547, 41.66956329345703]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 3.0, 2.0, 1.0, 5.0, 0.0, 6.0, 5.0, 2.0, 3.0, 5.0, 4.0, 3.0, 2.0, 2.0, 3.0, 7.0, 5.0, 4.0, 3.0, 6.0, 1.0, 1.0, 5.0, 3.0, 2.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.726543426513672, -5.4754533767700195, -5.224363327026367, -4.973273277282715, -4.7221832275390625, -4.47109317779541, -4.2200026512146, -3.9689126014709473, -3.717822551727295, -3.4667325019836426, -3.2156424522399902, -2.964552164077759, -2.7134621143341064, -2.462372064590454, -2.2112817764282227, -1.9601917266845703, -1.709101676940918, -1.4580116271972656, -1.2069214582443237, -0.9558313488960266, -0.7047412395477295, -0.45365118980407715, -0.20256102085113525, 0.04852914810180664, 0.299619197845459, 0.5507093071937561, 0.8017994165420532, 1.0528895854949951, 1.3039796352386475, 1.5550696849822998, 1.8061598539352417, 2.0572500228881836, 2.3083391189575195, 2.559429168701172, 2.810519218444824, 3.0616095066070557, 3.312699556350708, 3.5637896060943604, 3.814879894256592, 4.065969944000244, 4.3170599937438965, 4.568150043487549, 4.819240093231201, 5.0703301429748535, 5.321420669555664, 5.572510719299316, 5.823600769042969, 6.074690818786621, 6.325780868530273, 6.576870918273926, 6.827960968017578, 7.0790510177612305, 7.330141067504883, 7.581231117248535, 7.832321643829346, 8.083412170410156, 8.334501266479492, 8.585591316223145, 8.836681365966797, 9.08777141571045, 9.338861465454102, 9.589951515197754, 9.841041564941406, 10.092132568359375, 10.343222618103027]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 7.0, 2.0, 4.0, 7.0, 14.0, 24.0, 19.0, 46.0, 67.0, 116.0, 185.0, 352.0, 762.0, 1897.0, 6652.0, 31785.0, 198553.0, 235179.0, 37507.0, 7579.0, 1990.0, 708.0, 318.0, 151.0, 96.0, 71.0, 39.0, 32.0, 29.0, 13.0, 14.0, 9.0, 11.0, 8.0, 3.0, 5.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.984375, -13.503173828125, -13.02197265625, -12.540771484375, -12.0595703125, -11.578369140625, -11.09716796875, -10.615966796875, -10.134765625, -9.653564453125, -9.17236328125, -8.691162109375, -8.2099609375, -7.728759765625, -7.24755859375, -6.766357421875, -6.28515625, -5.803955078125, -5.32275390625, -4.841552734375, -4.3603515625, -3.879150390625, -3.39794921875, -2.916748046875, -2.435546875, -1.954345703125, -1.47314453125, -0.991943359375, -0.5107421875, -0.029541015625, 0.45166015625, 0.932861328125, 1.4140625, 1.895263671875, 2.37646484375, 2.857666015625, 3.3388671875, 3.820068359375, 4.30126953125, 4.782470703125, 5.263671875, 5.744873046875, 6.22607421875, 6.707275390625, 7.1884765625, 7.669677734375, 8.15087890625, 8.632080078125, 9.11328125, 9.594482421875, 10.07568359375, 10.556884765625, 11.0380859375, 11.519287109375, 12.00048828125, 12.481689453125, 12.962890625, 13.444091796875, 13.92529296875, 14.406494140625, 14.8876953125, 15.368896484375, 15.85009765625, 16.331298828125, 16.8125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 4.0, 3.0, 9.0, 10.0, 19.0, 25.0, 16.0, 42.0, 42.0, 78.0, 91.0, 127.0, 123.0, 114.0, 84.0, 65.0, 41.0, 37.0, 26.0, 15.0, 13.0, 10.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.98046875, -2.8917236328125, -2.802978515625, -2.7142333984375, -2.62548828125, -2.5367431640625, -2.447998046875, -2.3592529296875, -2.2705078125, -2.1817626953125, -2.093017578125, -2.0042724609375, -1.91552734375, -1.8267822265625, -1.738037109375, -1.6492919921875, -1.560546875, -1.4718017578125, -1.383056640625, -1.2943115234375, -1.20556640625, -1.1168212890625, -1.028076171875, -0.9393310546875, -0.8505859375, -0.7618408203125, -0.673095703125, -0.5843505859375, -0.49560546875, -0.4068603515625, -0.318115234375, -0.2293701171875, -0.140625, -0.0518798828125, 0.036865234375, 0.1256103515625, 0.21435546875, 0.3031005859375, 0.391845703125, 0.4805908203125, 0.5693359375, 0.6580810546875, 0.746826171875, 0.8355712890625, 0.92431640625, 1.0130615234375, 1.101806640625, 1.1905517578125, 1.279296875, 1.3680419921875, 1.456787109375, 1.5455322265625, 1.63427734375, 1.7230224609375, 1.811767578125, 1.9005126953125, 1.9892578125, 2.0780029296875, 2.166748046875, 2.2554931640625, 2.34423828125, 2.4329833984375, 2.521728515625, 2.6104736328125, 2.69921875]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 5.0, 2.0, 2.0, 4.0, 5.0, 4.0, 10.0, 14.0, 27.0, 80.0, 159.0, 104.0, 44.0, 20.0, 11.0, 1.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.074398040771484, -14.489947319030762, -13.905495643615723, -13.321044921875, -12.736594200134277, -12.152143478393555, -11.567691802978516, -10.983241081237793, -10.39879035949707, -9.814339637756348, -9.229887962341309, -8.645437240600586, -8.060986518859863, -7.476535320281982, -6.892084121704102, -6.307633399963379, -5.72318172454834, -5.138730525970459, -4.554279804229736, -3.9698286056518555, -3.3853776454925537, -2.800926685333252, -2.216475486755371, -1.6320247650146484, -1.0475735664367676, -0.46312254667282104, 0.12132847309112549, 0.7057795524597168, 1.2902305126190186, 1.8746814727783203, 2.459132671356201, 3.043583393096924, 3.6280345916748047, 4.2124857902526855, 4.796936511993408, 5.381387710571289, 5.965838432312012, 6.550289630889893, 7.134740829467773, 7.719191551208496, 8.303642272949219, 8.888092994689941, 9.47254467010498, 10.056995391845703, 10.641446113586426, 11.225896835327148, 11.810348510742188, 12.39479923248291, 12.97925090789795, 13.563701629638672, 14.148153305053711, 14.732604026794434, 15.317054748535156, 15.901506423950195, 16.485958099365234, 17.07040786743164, 17.65485954284668, 18.23931121826172, 18.823760986328125, 19.408212661743164, 19.992664337158203, 20.57711410522461, 21.16156578063965, 21.746017456054688, 22.330467224121094]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 5.0, 1.0, 2.0, 4.0, 2.0, 4.0, 6.0, 4.0, 5.0, 3.0, 13.0, 17.0, 48.0, 107.0, 104.0, 68.0, 29.0, 20.0, 8.0, 5.0, 5.0, 5.0, 2.0, 7.0, 3.0, 9.0, 3.0, 4.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.336945533752441, -11.991554260253906, -11.646163940429688, -11.300772666931152, -10.955381393432617, -10.609991073608398, -10.264599800109863, -9.919208526611328, -9.57381820678711, -9.228426933288574, -8.883036613464355, -8.53764533996582, -8.192254066467285, -7.846863269805908, -7.501472473144531, -7.156081199645996, -6.810689926147461, -6.465299129486084, -6.119907855987549, -5.774517059326172, -5.429125785827637, -5.08373498916626, -4.738344192504883, -4.392952919006348, -4.047562122344971, -3.7021710872650146, -3.3567800521850586, -3.0113892555236816, -2.6659982204437256, -2.3206071853637695, -1.9752163887023926, -1.6298253536224365, -1.2844343185424805, -0.9390433430671692, -0.5936523675918579, -0.2482614517211914, 0.09712958335876465, 0.4425206184387207, 0.7879114151000977, 1.1333024501800537, 1.4786934852600098, 1.8240845203399658, 2.169475555419922, 2.514866352081299, 2.860257387161255, 3.205648422241211, 3.551039218902588, 3.896430253982544, 4.2418212890625, 4.587212085723877, 4.932603359222412, 5.277994155883789, 5.623385429382324, 5.968776226043701, 6.314167022705078, 6.659558296203613, 7.00494909286499, 7.350339889526367, 7.695731163024902, 8.041122436523438, 8.386512756347656, 8.731904029846191, 9.077295303344727, 9.422685623168945, 9.76807689666748]}, "eval/loss": 4.31812047958374, "eval/wer": 1.8917096390321302, "eval/runtime": 787.054, "eval/samples_per_second": 3.357, "eval/steps_per_second": 0.281} \ No newline at end of file +{"train/loss": 4.4804, "train/learning_rate": 8.403483309143687e-06, "train/epoch": 0.84, "train/global_step": 1000, "_runtime": 5811, "_timestamp": 1646128663, "_step": 1001, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 70.0, 942.0, 4.0, 1.0], "bins": [-1010.7235107421875, -994.23681640625, -977.7501220703125, -961.263427734375, -944.7767333984375, -928.2900390625, -911.8033447265625, -895.316650390625, -878.8299560546875, -862.34326171875, -845.8565673828125, -829.369873046875, -812.8831787109375, -796.396484375, -779.9097900390625, -763.423095703125, -746.9364013671875, -730.44970703125, -713.9630126953125, -697.476318359375, -680.9896240234375, -664.5029296875, -648.0162353515625, -631.529541015625, -615.0429077148438, -598.5562133789062, -582.0695190429688, -565.5828247070312, -549.0961303710938, -532.6094360351562, -516.1227416992188, -499.63604736328125, -483.1492919921875, -466.66259765625, -450.1759033203125, -433.689208984375, -417.2025146484375, -400.7158203125, -384.2291259765625, -367.742431640625, -351.2557678222656, -334.7690734863281, -318.2823791503906, -301.7956848144531, -285.3089904785156, -268.8222961425781, -252.3356170654297, -235.8489227294922, -219.3622283935547, -202.8755340576172, -186.3888397216797, -169.90216064453125, -153.41546630859375, -136.92877197265625, -120.44207763671875, -103.95538330078125, -87.46868896484375, -70.98199462890625, -54.495304107666016, -38.00861358642578, -21.52191925048828, -5.035224914550781, 11.451461791992188, 27.938156127929688, 44.42485427856445]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 8.0, 7.0, 12.0, 15.0, 13.0, 27.0, 33.0, 36.0, 44.0, 59.0, 52.0, 54.0, 74.0, 68.0, 69.0, 71.0, 83.0, 52.0, 68.0, 43.0, 31.0, 28.0, 16.0, 8.0, 16.0, 5.0, 6.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-88.25445556640625, -85.712890625, -83.17133331298828, -80.62977600097656, -78.08821105957031, -75.54664611816406, -73.00508880615234, -70.46353149414062, -67.92196655273438, -65.38040161132812, -62.838844299316406, -60.29728317260742, -57.75572204589844, -55.21416091918945, -52.67259979248047, -50.131038665771484, -47.5894775390625, -45.047916412353516, -42.50635528564453, -39.96479415893555, -37.42323303222656, -34.88167190551758, -32.340110778808594, -29.79854965209961, -27.256988525390625, -24.71542739868164, -22.173866271972656, -19.632305145263672, -17.090744018554688, -14.549182891845703, -12.007621765136719, -9.466060638427734, -6.92449951171875, -4.382938385009766, -1.8413772583007812, 0.7001838684082031, 3.2417449951171875, 5.783306121826172, 8.324867248535156, 10.86642837524414, 13.407989501953125, 15.94955062866211, 18.491111755371094, 21.032672882080078, 23.574234008789062, 26.115795135498047, 28.65735626220703, 31.198917388916016, 33.740478515625, 36.282039642333984, 38.82360076904297, 41.36516189575195, 43.90672302246094, 46.44828414916992, 48.989845275878906, 51.53140640258789, 54.072967529296875, 56.61452865600586, 59.156089782714844, 61.69765090942383, 64.23921203613281, 66.78077697753906, 69.32233428955078, 71.8638916015625, 74.40545654296875]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 6.0, 6.0, 6.0, 10.0, 8.0, 11.0, 24.0, 23.0, 24.0, 26.0, 30.0, 30.0, 29.0, 35.0, 40.0, 49.0, 40.0, 44.0, 56.0, 33.0, 58.0, 48.0, 52.0, 46.0, 43.0, 38.0, 34.0, 34.0, 22.0, 23.0, 16.0, 16.0, 13.0, 10.0, 6.0, 4.0, 9.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.740234375, -2.645721435546875, -2.55120849609375, -2.456695556640625, -2.3621826171875, -2.267669677734375, -2.17315673828125, -2.078643798828125, -1.984130859375, -1.889617919921875, -1.79510498046875, -1.700592041015625, -1.6060791015625, -1.511566162109375, -1.41705322265625, -1.322540283203125, -1.22802734375, -1.133514404296875, -1.03900146484375, -0.944488525390625, -0.8499755859375, -0.755462646484375, -0.66094970703125, -0.566436767578125, -0.471923828125, -0.377410888671875, -0.28289794921875, -0.188385009765625, -0.0938720703125, 0.000640869140625, 0.09515380859375, 0.189666748046875, 0.2841796875, 0.378692626953125, 0.47320556640625, 0.567718505859375, 0.6622314453125, 0.756744384765625, 0.85125732421875, 0.945770263671875, 1.040283203125, 1.134796142578125, 1.22930908203125, 1.323822021484375, 1.4183349609375, 1.512847900390625, 1.60736083984375, 1.701873779296875, 1.79638671875, 1.890899658203125, 1.98541259765625, 2.079925537109375, 2.1744384765625, 2.268951416015625, 2.36346435546875, 2.457977294921875, 2.552490234375, 2.647003173828125, 2.74151611328125, 2.836029052734375, 2.9305419921875, 3.025054931640625, 3.11956787109375, 3.214080810546875, 3.30859375]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 9.0, 6.0, 14.0, 15.0, 15.0, 18.0, 37.0, 53.0, 67.0, 83.0, 139.0, 161.0, 242.0, 379.0, 597.0, 1060.0, 1913.0, 3964.0, 9416.0, 28342.0, 137510.0, 1417279.0, 2290309.0, 239549.0, 40803.0, 12052.0, 4796.0, 2235.0, 1185.0, 687.0, 427.0, 259.0, 184.0, 129.0, 92.0, 63.0, 62.0, 31.0, 24.0, 18.0, 11.0, 16.0, 6.0, 8.0, 8.0, 1.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.265625, -9.9461669921875, -9.626708984375, -9.3072509765625, -8.98779296875, -8.6683349609375, -8.348876953125, -8.0294189453125, -7.7099609375, -7.3905029296875, -7.071044921875, -6.7515869140625, -6.43212890625, -6.1126708984375, -5.793212890625, -5.4737548828125, -5.154296875, -4.8348388671875, -4.515380859375, -4.1959228515625, -3.87646484375, -3.5570068359375, -3.237548828125, -2.9180908203125, -2.5986328125, -2.2791748046875, -1.959716796875, -1.6402587890625, -1.32080078125, -1.0013427734375, -0.681884765625, -0.3624267578125, -0.04296875, 0.2764892578125, 0.595947265625, 0.9154052734375, 1.23486328125, 1.5543212890625, 1.873779296875, 2.1932373046875, 2.5126953125, 2.8321533203125, 3.151611328125, 3.4710693359375, 3.79052734375, 4.1099853515625, 4.429443359375, 4.7489013671875, 5.068359375, 5.3878173828125, 5.707275390625, 6.0267333984375, 6.34619140625, 6.6656494140625, 6.985107421875, 7.3045654296875, 7.6240234375, 7.9434814453125, 8.262939453125, 8.5823974609375, 8.90185546875, 9.2213134765625, 9.540771484375, 9.8602294921875, 10.1796875]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 5.0, 4.0, 10.0, 22.0, 31.0, 91.0, 197.0, 331.0, 726.0, 1163.0, 766.0, 393.0, 185.0, 85.0, 42.0, 16.0, 8.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.828125, -31.024169921875, -30.22021484375, -29.416259765625, -28.6123046875, -27.808349609375, -27.00439453125, -26.200439453125, -25.396484375, -24.592529296875, -23.78857421875, -22.984619140625, -22.1806640625, -21.376708984375, -20.57275390625, -19.768798828125, -18.96484375, -18.160888671875, -17.35693359375, -16.552978515625, -15.7490234375, -14.945068359375, -14.14111328125, -13.337158203125, -12.533203125, -11.729248046875, -10.92529296875, -10.121337890625, -9.3173828125, -8.513427734375, -7.70947265625, -6.905517578125, -6.1015625, -5.297607421875, -4.49365234375, -3.689697265625, -2.8857421875, -2.081787109375, -1.27783203125, -0.473876953125, 0.330078125, 1.134033203125, 1.93798828125, 2.741943359375, 3.5458984375, 4.349853515625, 5.15380859375, 5.957763671875, 6.76171875, 7.565673828125, 8.36962890625, 9.173583984375, 9.9775390625, 10.781494140625, 11.58544921875, 12.389404296875, 13.193359375, 13.997314453125, 14.80126953125, 15.605224609375, 16.4091796875, 17.213134765625, 18.01708984375, 18.821044921875, 19.625]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 5.0, 3.0, 2.0, 16.0, 14.0, 18.0, 63.0, 170.0, 428.0, 1179.0, 5299.0, 3992841.0, 190540.0, 2456.0, 776.0, 264.0, 118.0, 43.0, 20.0, 10.0, 8.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.1875, -91.4013671875, -88.615234375, -85.8291015625, -83.04296875, -80.2568359375, -77.470703125, -74.6845703125, -71.8984375, -69.1123046875, -66.326171875, -63.5400390625, -60.75390625, -57.9677734375, -55.181640625, -52.3955078125, -49.609375, -46.8232421875, -44.037109375, -41.2509765625, -38.46484375, -35.6787109375, -32.892578125, -30.1064453125, -27.3203125, -24.5341796875, -21.748046875, -18.9619140625, -16.17578125, -13.3896484375, -10.603515625, -7.8173828125, -5.03125, -2.2451171875, 0.541015625, 3.3271484375, 6.11328125, 8.8994140625, 11.685546875, 14.4716796875, 17.2578125, 20.0439453125, 22.830078125, 25.6162109375, 28.40234375, 31.1884765625, 33.974609375, 36.7607421875, 39.546875, 42.3330078125, 45.119140625, 47.9052734375, 50.69140625, 53.4775390625, 56.263671875, 59.0498046875, 61.8359375, 64.6220703125, 67.408203125, 70.1943359375, 72.98046875, 75.7666015625, 78.552734375, 81.3388671875, 84.125]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [16.0, 667.0, 329.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.600341796875, -8.848542213439941, 0.9032573699951172, 10.65505599975586, 20.406856536865234, 30.15865707397461, 39.91045379638672, 49.662254333496094, 59.41405487060547, 69.16585540771484, 78.91765594482422, 88.66944885253906, 98.42124938964844, 108.17304992675781, 117.92485046386719, 127.67665100097656, 137.42845153808594, 147.1802520751953, 156.9320526123047, 166.68385314941406, 176.43565368652344, 186.1874542236328, 195.93923950195312, 205.6910400390625, 215.44284057617188, 225.19464111328125, 234.94644165039062, 244.6982421875, 254.45004272460938, 264.20184326171875, 273.9536437988281, 283.7054443359375, 293.4572448730469, 303.20904541015625, 312.9608459472656, 322.712646484375, 332.4644470214844, 342.21624755859375, 351.9680480957031, 361.7198486328125, 371.4716491699219, 381.22344970703125, 390.9752502441406, 400.72705078125, 410.4788513183594, 420.23065185546875, 429.9824523925781, 439.7342529296875, 449.48602294921875, 459.2378234863281, 468.9896240234375, 478.7414245605469, 488.49322509765625, 498.2450256347656, 507.996826171875, 517.7485961914062, 527.5004272460938, 537.252197265625, 547.0040283203125, 556.7557983398438, 566.5076293945312, 576.2593994140625, 586.01123046875, 595.7630004882812, 605.5148315429688]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 2.0, 5.0, 1.0, 5.0, 7.0, 6.0, 11.0, 15.0, 14.0, 27.0, 27.0, 24.0, 29.0, 41.0, 31.0, 40.0, 43.0, 48.0, 45.0, 52.0, 43.0, 38.0, 42.0, 42.0, 61.0, 31.0, 37.0, 38.0, 43.0, 24.0, 22.0, 17.0, 22.0, 11.0, 10.0, 12.0, 11.0, 9.0, 4.0, 8.0, 7.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.319793701171875, -43.89503860473633, -42.47028350830078, -41.0455322265625, -39.62077713012695, -38.196022033691406, -36.771270751953125, -35.34651565551758, -33.92176055908203, -32.497005462646484, -31.07225227355957, -29.647499084472656, -28.22274398803711, -26.797988891601562, -25.37323570251465, -23.948482513427734, -22.523727416992188, -21.09897232055664, -19.674219131469727, -18.249465942382812, -16.824710845947266, -15.399956703186035, -13.975202560424805, -12.550448417663574, -11.125694274902344, -9.700940132141113, -8.276185989379883, -6.851431846618652, -5.426677703857422, -4.001923561096191, -2.577169418334961, -1.1524152755737305, 0.2723388671875, 1.6970930099487305, 3.121847152709961, 4.546601295471191, 5.971355438232422, 7.396109580993652, 8.820863723754883, 10.245617866516113, 11.670372009277344, 13.095126152038574, 14.519880294799805, 15.944634437561035, 17.369388580322266, 18.794143676757812, 20.218896865844727, 21.64365005493164, 23.068405151367188, 24.493160247802734, 25.91791343688965, 27.342666625976562, 28.76742172241211, 30.192176818847656, 31.61693000793457, 33.041683197021484, 34.46643829345703, 35.89119338989258, 37.315948486328125, 38.740699768066406, 40.16545486450195, 41.5902099609375, 43.01496124267578, 44.43971633911133, 45.864471435546875]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 5.0, 10.0, 8.0, 12.0, 14.0, 16.0, 19.0, 6.0, 20.0, 20.0, 24.0, 21.0, 27.0, 27.0, 27.0, 34.0, 33.0, 49.0, 49.0, 39.0, 46.0, 38.0, 38.0, 47.0, 35.0, 31.0, 31.0, 26.0, 42.0, 31.0, 30.0, 25.0, 25.0, 14.0, 15.0, 12.0, 12.0, 9.0, 7.0, 7.0, 6.0, 2.0, 2.0, 3.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.80078125, -2.717620849609375, -2.63446044921875, -2.551300048828125, -2.4681396484375, -2.384979248046875, -2.30181884765625, -2.218658447265625, -2.135498046875, -2.052337646484375, -1.96917724609375, -1.886016845703125, -1.8028564453125, -1.719696044921875, -1.63653564453125, -1.553375244140625, -1.47021484375, -1.387054443359375, -1.30389404296875, -1.220733642578125, -1.1375732421875, -1.054412841796875, -0.97125244140625, -0.888092041015625, -0.804931640625, -0.721771240234375, -0.63861083984375, -0.555450439453125, -0.4722900390625, -0.389129638671875, -0.30596923828125, -0.222808837890625, -0.1396484375, -0.056488037109375, 0.02667236328125, 0.109832763671875, 0.1929931640625, 0.276153564453125, 0.35931396484375, 0.442474365234375, 0.525634765625, 0.608795166015625, 0.69195556640625, 0.775115966796875, 0.8582763671875, 0.941436767578125, 1.02459716796875, 1.107757568359375, 1.19091796875, 1.274078369140625, 1.35723876953125, 1.440399169921875, 1.5235595703125, 1.606719970703125, 1.68988037109375, 1.773040771484375, 1.856201171875, 1.939361572265625, 2.02252197265625, 2.105682373046875, 2.1888427734375, 2.272003173828125, 2.35516357421875, 2.438323974609375, 2.521484375]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 12.0, 22.0, 20.0, 38.0, 54.0, 86.0, 111.0, 185.0, 245.0, 353.0, 535.0, 776.0, 1130.0, 1632.0, 2470.0, 3559.0, 5528.0, 8482.0, 13039.0, 20233.0, 32698.0, 54002.0, 89584.0, 143711.0, 196412.0, 172581.0, 115594.0, 69889.0, 42308.0, 25868.0, 16247.0, 10269.0, 7023.0, 4536.0, 2999.0, 1964.0, 1356.0, 948.0, 687.0, 440.0, 301.0, 198.0, 137.0, 93.0, 60.0, 50.0, 35.0, 19.0, 11.0, 10.0, 12.0, 4.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.306884765625, -0.297515869140625, -0.28814697265625, -0.278778076171875, -0.2694091796875, -0.260040283203125, -0.25067138671875, -0.241302490234375, -0.23193359375, -0.222564697265625, -0.21319580078125, -0.203826904296875, -0.1944580078125, -0.185089111328125, -0.17572021484375, -0.166351318359375, -0.156982421875, -0.147613525390625, -0.13824462890625, -0.128875732421875, -0.1195068359375, -0.110137939453125, -0.10076904296875, -0.091400146484375, -0.08203125, -0.072662353515625, -0.06329345703125, -0.053924560546875, -0.0445556640625, -0.035186767578125, -0.02581787109375, -0.016448974609375, -0.007080078125, 0.002288818359375, 0.01165771484375, 0.021026611328125, 0.0303955078125, 0.039764404296875, 0.04913330078125, 0.058502197265625, 0.06787109375, 0.077239990234375, 0.08660888671875, 0.095977783203125, 0.1053466796875, 0.114715576171875, 0.12408447265625, 0.133453369140625, 0.142822265625, 0.152191162109375, 0.16156005859375, 0.170928955078125, 0.1802978515625, 0.189666748046875, 0.19903564453125, 0.208404541015625, 0.2177734375, 0.227142333984375, 0.23651123046875, 0.245880126953125, 0.2552490234375, 0.264617919921875, 0.27398681640625, 0.283355712890625, 0.292724609375]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 6.0, 2.0, 1.0, 6.0, 7.0, 12.0, 9.0, 9.0, 11.0, 13.0, 18.0, 25.0, 17.0, 17.0, 22.0, 29.0, 28.0, 31.0, 30.0, 33.0, 29.0, 39.0, 37.0, 35.0, 1072.0, 30.0, 36.0, 28.0, 44.0, 43.0, 38.0, 35.0, 27.0, 24.0, 25.0, 22.0, 13.0, 25.0, 18.0, 16.0, 18.0, 8.0, 6.0, 10.0, 7.0, 4.0, 5.0, 3.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0], "bins": [-1.7138671875, -1.663970947265625, -1.61407470703125, -1.564178466796875, -1.5142822265625, -1.464385986328125, -1.41448974609375, -1.364593505859375, -1.314697265625, -1.264801025390625, -1.21490478515625, -1.165008544921875, -1.1151123046875, -1.065216064453125, -1.01531982421875, -0.965423583984375, -0.91552734375, -0.865631103515625, -0.81573486328125, -0.765838623046875, -0.7159423828125, -0.666046142578125, -0.61614990234375, -0.566253662109375, -0.516357421875, -0.466461181640625, -0.41656494140625, -0.366668701171875, -0.3167724609375, -0.266876220703125, -0.21697998046875, -0.167083740234375, -0.1171875, -0.067291259765625, -0.01739501953125, 0.032501220703125, 0.0823974609375, 0.132293701171875, 0.18218994140625, 0.232086181640625, 0.281982421875, 0.331878662109375, 0.38177490234375, 0.431671142578125, 0.4815673828125, 0.531463623046875, 0.58135986328125, 0.631256103515625, 0.68115234375, 0.731048583984375, 0.78094482421875, 0.830841064453125, 0.8807373046875, 0.930633544921875, 0.98052978515625, 1.030426025390625, 1.080322265625, 1.130218505859375, 1.18011474609375, 1.230010986328125, 1.2799072265625, 1.329803466796875, 1.37969970703125, 1.429595947265625, 1.4794921875]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 7.0, 11.0, 5.0, 21.0, 23.0, 36.0, 81.0, 95.0, 150.0, 217.0, 381.0, 587.0, 937.0, 1472.0, 2550.0, 4038.0, 6875.0, 11920.0, 20571.0, 35461.0, 64655.0, 112891.0, 176343.0, 1256137.0, 164676.0, 102401.0, 57449.0, 31951.0, 18485.0, 10683.0, 6339.0, 3710.0, 2318.0, 1384.0, 833.0, 499.0, 331.0, 224.0, 146.0, 85.0, 57.0, 38.0, 21.0, 17.0, 8.0, 6.0, 5.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.266357421875, -0.25838470458984375, -0.2504119873046875, -0.24243927001953125, -0.234466552734375, -0.22649383544921875, -0.2185211181640625, -0.21054840087890625, -0.20257568359375, -0.19460296630859375, -0.1866302490234375, -0.17865753173828125, -0.170684814453125, -0.16271209716796875, -0.1547393798828125, -0.14676666259765625, -0.1387939453125, -0.13082122802734375, -0.1228485107421875, -0.11487579345703125, -0.106903076171875, -0.09893035888671875, -0.0909576416015625, -0.08298492431640625, -0.07501220703125, -0.06703948974609375, -0.0590667724609375, -0.05109405517578125, -0.043121337890625, -0.03514862060546875, -0.0271759033203125, -0.01920318603515625, -0.01123046875, -0.00325775146484375, 0.0047149658203125, 0.01268768310546875, 0.020660400390625, 0.02863311767578125, 0.0366058349609375, 0.04457855224609375, 0.05255126953125, 0.06052398681640625, 0.0684967041015625, 0.07646942138671875, 0.084442138671875, 0.09241485595703125, 0.1003875732421875, 0.10836029052734375, 0.1163330078125, 0.12430572509765625, 0.1322784423828125, 0.14025115966796875, 0.148223876953125, 0.15619659423828125, 0.1641693115234375, 0.17214202880859375, 0.18011474609375, 0.18808746337890625, 0.1960601806640625, 0.20403289794921875, 0.212005615234375, 0.21997833251953125, 0.2279510498046875, 0.23592376708984375, 0.243896484375]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 0.0, 6.0, 3.0, 4.0, 8.0, 7.0, 8.0, 15.0, 12.0, 15.0, 28.0, 22.0, 25.0, 34.0, 41.0, 31.0, 48.0, 45.0, 40.0, 55.0, 54.0, 57.0, 50.0, 53.0, 42.0, 34.0, 48.0, 41.0, 30.0, 28.0, 19.0, 25.0, 16.0, 7.0, 9.0, 10.0, 5.0, 15.0, 1.0, 2.0, 5.0, 1.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006809234619140625, -0.0006574913859367371, -0.0006340593099594116, -0.0006106272339820862, -0.0005871951580047607, -0.0005637630820274353, -0.0005403310060501099, -0.0005168989300727844, -0.000493466854095459, -0.00047003477811813354, -0.0004466027021408081, -0.00042317062616348267, -0.0003997385501861572, -0.0003763064742088318, -0.00035287439823150635, -0.0003294423222541809, -0.00030601024627685547, -0.00028257817029953003, -0.0002591460943222046, -0.00023571401834487915, -0.0002122819423675537, -0.00018884986639022827, -0.00016541779041290283, -0.0001419857144355774, -0.00011855363845825195, -9.512156248092651e-05, -7.168948650360107e-05, -4.8257410526275635e-05, -2.4825334548950195e-05, -1.3932585716247559e-06, 2.2038817405700684e-05, 4.547089338302612e-05, 6.890296936035156e-05, 9.2335045337677e-05, 0.00011576712131500244, 0.00013919919729232788, 0.00016263127326965332, 0.00018606334924697876, 0.0002094954252243042, 0.00023292750120162964, 0.0002563595771789551, 0.0002797916531562805, 0.00030322372913360596, 0.0003266558051109314, 0.00035008788108825684, 0.0003735199570655823, 0.0003969520330429077, 0.00042038410902023315, 0.0004438161849975586, 0.00046724826097488403, 0.0004906803369522095, 0.0005141124129295349, 0.0005375444889068604, 0.0005609765648841858, 0.0005844086408615112, 0.0006078407168388367, 0.0006312727928161621, 0.0006547048687934875, 0.000678136944770813, 0.0007015690207481384, 0.0007250010967254639, 0.0007484331727027893, 0.0007718652486801147, 0.0007952973246574402, 0.0008187294006347656]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 8.0, 5.0, 5.0, 6.0, 11.0, 12.0, 16.0, 14.0, 22.0, 26.0, 43.0, 59.0, 68.0, 72.0, 88.0, 107.0, 115.0, 175.0, 193.0, 302.0, 504.0, 1620.0, 976887.0, 65873.0, 757.0, 400.0, 248.0, 210.0, 142.0, 103.0, 100.0, 75.0, 59.0, 55.0, 36.0, 31.0, 23.0, 19.0, 21.0, 10.0, 9.0, 9.0, 12.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.01454925537109375, -0.014105558395385742, -0.013661861419677734, -0.013218164443969727, -0.012774467468261719, -0.012330770492553711, -0.011887073516845703, -0.011443376541137695, -0.010999679565429688, -0.01055598258972168, -0.010112285614013672, -0.009668588638305664, -0.009224891662597656, -0.008781194686889648, -0.00833749771118164, -0.007893800735473633, -0.007450103759765625, -0.007006406784057617, -0.006562709808349609, -0.0061190128326416016, -0.005675315856933594, -0.005231618881225586, -0.004787921905517578, -0.00434422492980957, -0.0039005279541015625, -0.0034568309783935547, -0.003013134002685547, -0.002569437026977539, -0.0021257400512695312, -0.0016820430755615234, -0.0012383460998535156, -0.0007946491241455078, -0.0003509521484375, 9.274482727050781e-05, 0.0005364418029785156, 0.0009801387786865234, 0.0014238357543945312, 0.001867532730102539, 0.002311229705810547, 0.0027549266815185547, 0.0031986236572265625, 0.0036423206329345703, 0.004086017608642578, 0.004529714584350586, 0.004973411560058594, 0.0054171085357666016, 0.005860805511474609, 0.006304502487182617, 0.006748199462890625, 0.007191896438598633, 0.007635593414306641, 0.008079290390014648, 0.008522987365722656, 0.008966684341430664, 0.009410381317138672, 0.00985407829284668, 0.010297775268554688, 0.010741472244262695, 0.011185169219970703, 0.011628866195678711, 0.012072563171386719, 0.012516260147094727, 0.012959957122802734, 0.013403654098510742, 0.01384735107421875]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 24.0, 606.0, 374.0, 9.0, 2.0, 2.0, 1.0], "bins": [-0.0055391015484929085, -0.005445042159408331, -0.005350982770323753, -0.005256923381239176, -0.005162863992154598, -0.005068804137408733, -0.004974744748324156, -0.004880685359239578, -0.004786625970155001, -0.004692566581070423, -0.0045985071919858456, -0.004504447802901268, -0.0044103884138166904, -0.004316328559070826, -0.004222269169986248, -0.0041282097809016705, -0.004034150391817093, -0.003940091002732515, -0.0038460316136479378, -0.0037519719917327166, -0.003657912602648139, -0.0035638532135635614, -0.003469793824478984, -0.0033757342025637627, -0.0032816750463098288, -0.003187615657225251, -0.0030935562681406736, -0.0029994966462254524, -0.002905437257140875, -0.0028113778680562973, -0.0027173184789717197, -0.002623259089887142, -0.002529199467971921, -0.0024351400788873434, -0.002341080689802766, -0.0022470210678875446, -0.002152961678802967, -0.0020589022897183895, -0.001964842900633812, -0.0018707833951339126, -0.001776724006049335, -0.0016826646169647574, -0.001588605111464858, -0.0014945457223802805, -0.001400486216880381, -0.0013064268277958035, -0.0012123673222959042, -0.0011183079332113266, -0.0010242484277114272, -0.0009301889804191887, -0.0008361295331269503, -0.0007420701440423727, -0.0006480106385424733, -0.0005539512494578958, -0.0004598918021656573, -0.0003658323548734188, -0.0002717729366850108, -0.00017771348939277232, -8.365405665244907e-05, 1.0405376087874174e-05, 0.00010446482338011265, 0.00019852427067235112, 0.00029258368886075914, 0.0003866431361529976, 0.0004807025834452361]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 5.0, 6.0, 4.0, 5.0, 11.0, 9.0, 10.0, 15.0, 9.0, 15.0, 17.0, 27.0, 21.0, 27.0, 38.0, 38.0, 40.0, 37.0, 44.0, 36.0, 56.0, 43.0, 45.0, 53.0, 48.0, 41.0, 36.0, 36.0, 35.0, 28.0, 35.0, 17.0, 22.0, 17.0, 16.0, 9.0, 15.0, 12.0, 7.0, 7.0, 2.0, 6.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.00046753883361816406, -0.0004540616646409035, -0.0004405844956636429, -0.0004271073266863823, -0.0004136301577091217, -0.0004001529887318611, -0.0003866758197546005, -0.00037319865077733994, -0.00035972148180007935, -0.00034624431282281876, -0.00033276714384555817, -0.0003192899748682976, -0.000305812805891037, -0.0002923356369137764, -0.0002788584679365158, -0.0002653812989592552, -0.00025190412998199463, -0.00023842696100473404, -0.00022494979202747345, -0.00021147262305021286, -0.00019799545407295227, -0.00018451828509569168, -0.0001710411161184311, -0.0001575639471411705, -0.0001440867781639099, -0.00013060960918664932, -0.00011713244020938873, -0.00010365527123212814, -9.017810225486755e-05, -7.670093327760696e-05, -6.322376430034637e-05, -4.9746595323085785e-05, -3.6269426345825195e-05, -2.2792257368564606e-05, -9.315088391304016e-06, 4.1620805859565735e-06, 1.7639249563217163e-05, 3.111641854047775e-05, 4.459358751773834e-05, 5.807075649499893e-05, 7.154792547225952e-05, 8.502509444952011e-05, 9.85022634267807e-05, 0.00011197943240404129, 0.00012545660138130188, 0.00013893377035856247, 0.00015241093933582306, 0.00016588810831308365, 0.00017936527729034424, 0.00019284244626760483, 0.00020631961524486542, 0.000219796784222126, 0.0002332739531993866, 0.0002467511221766472, 0.0002602282911539078, 0.00027370546013116837, 0.00028718262910842896, 0.00030065979808568954, 0.00031413696706295013, 0.0003276141360402107, 0.0003410913050174713, 0.0003545684739947319, 0.0003680456429719925, 0.0003815228119492531, 0.00039499998092651367]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 5.0, 10.0, 8.0, 12.0, 14.0, 16.0, 19.0, 6.0, 20.0, 20.0, 24.0, 21.0, 27.0, 27.0, 27.0, 34.0, 33.0, 49.0, 49.0, 39.0, 46.0, 38.0, 38.0, 47.0, 35.0, 31.0, 31.0, 26.0, 42.0, 31.0, 30.0, 25.0, 25.0, 14.0, 15.0, 12.0, 12.0, 9.0, 7.0, 7.0, 6.0, 2.0, 2.0, 3.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.80078125, -2.717620849609375, -2.63446044921875, -2.551300048828125, -2.4681396484375, -2.384979248046875, -2.30181884765625, -2.218658447265625, -2.135498046875, -2.052337646484375, -1.96917724609375, -1.886016845703125, -1.8028564453125, -1.719696044921875, -1.63653564453125, -1.553375244140625, -1.47021484375, -1.387054443359375, -1.30389404296875, -1.220733642578125, -1.1375732421875, -1.054412841796875, -0.97125244140625, -0.888092041015625, -0.804931640625, -0.721771240234375, -0.63861083984375, -0.555450439453125, -0.4722900390625, -0.389129638671875, -0.30596923828125, -0.222808837890625, -0.1396484375, -0.056488037109375, 0.02667236328125, 0.109832763671875, 0.1929931640625, 0.276153564453125, 0.35931396484375, 0.442474365234375, 0.525634765625, 0.608795166015625, 0.69195556640625, 0.775115966796875, 0.8582763671875, 0.941436767578125, 1.02459716796875, 1.107757568359375, 1.19091796875, 1.274078369140625, 1.35723876953125, 1.440399169921875, 1.5235595703125, 1.606719970703125, 1.68988037109375, 1.773040771484375, 1.856201171875, 1.939361572265625, 2.02252197265625, 2.105682373046875, 2.1888427734375, 2.272003173828125, 2.35516357421875, 2.438323974609375, 2.521484375]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 5.0, 4.0, 8.0, 11.0, 9.0, 21.0, 27.0, 23.0, 51.0, 48.0, 66.0, 75.0, 118.0, 137.0, 205.0, 289.0, 369.0, 518.0, 704.0, 1015.0, 1360.0, 2194.0, 3378.0, 5427.0, 9746.0, 19933.0, 83465.0, 716898.0, 148796.0, 24586.0, 11022.0, 6254.0, 3825.0, 2416.0, 1666.0, 1110.0, 667.0, 532.0, 420.0, 292.0, 206.0, 162.0, 118.0, 96.0, 70.0, 62.0, 39.0, 26.0, 30.0, 18.0, 15.0, 12.0, 5.0, 7.0, 2.0, 5.0, 1.0, 0.0, 2.0, 1.0], "bins": [-13.1171875, -12.7022705078125, -12.287353515625, -11.8724365234375, -11.45751953125, -11.0426025390625, -10.627685546875, -10.2127685546875, -9.7978515625, -9.3829345703125, -8.968017578125, -8.5531005859375, -8.13818359375, -7.7232666015625, -7.308349609375, -6.8934326171875, -6.478515625, -6.0635986328125, -5.648681640625, -5.2337646484375, -4.81884765625, -4.4039306640625, -3.989013671875, -3.5740966796875, -3.1591796875, -2.7442626953125, -2.329345703125, -1.9144287109375, -1.49951171875, -1.0845947265625, -0.669677734375, -0.2547607421875, 0.16015625, 0.5750732421875, 0.989990234375, 1.4049072265625, 1.81982421875, 2.2347412109375, 2.649658203125, 3.0645751953125, 3.4794921875, 3.8944091796875, 4.309326171875, 4.7242431640625, 5.13916015625, 5.5540771484375, 5.968994140625, 6.3839111328125, 6.798828125, 7.2137451171875, 7.628662109375, 8.0435791015625, 8.45849609375, 8.8734130859375, 9.288330078125, 9.7032470703125, 10.1181640625, 10.5330810546875, 10.947998046875, 11.3629150390625, 11.77783203125, 12.1927490234375, 12.607666015625, 13.0225830078125, 13.4375]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 0.0, 2.0, 1.0, 6.0, 7.0, 6.0, 7.0, 10.0, 12.0, 15.0, 27.0, 18.0, 29.0, 30.0, 31.0, 32.0, 31.0, 30.0, 43.0, 42.0, 69.0, 127.0, 311.0, 1490.0, 187.0, 100.0, 67.0, 38.0, 42.0, 33.0, 29.0, 20.0, 27.0, 22.0, 18.0, 18.0, 19.0, 10.0, 8.0, 10.0, 2.0, 10.0, 5.0, 2.0, 2.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.9609375, -8.68310546875, -8.4052734375, -8.12744140625, -7.849609375, -7.57177734375, -7.2939453125, -7.01611328125, -6.73828125, -6.46044921875, -6.1826171875, -5.90478515625, -5.626953125, -5.34912109375, -5.0712890625, -4.79345703125, -4.515625, -4.23779296875, -3.9599609375, -3.68212890625, -3.404296875, -3.12646484375, -2.8486328125, -2.57080078125, -2.29296875, -2.01513671875, -1.7373046875, -1.45947265625, -1.181640625, -0.90380859375, -0.6259765625, -0.34814453125, -0.0703125, 0.20751953125, 0.4853515625, 0.76318359375, 1.041015625, 1.31884765625, 1.5966796875, 1.87451171875, 2.15234375, 2.43017578125, 2.7080078125, 2.98583984375, 3.263671875, 3.54150390625, 3.8193359375, 4.09716796875, 4.375, 4.65283203125, 4.9306640625, 5.20849609375, 5.486328125, 5.76416015625, 6.0419921875, 6.31982421875, 6.59765625, 6.87548828125, 7.1533203125, 7.43115234375, 7.708984375, 7.98681640625, 8.2646484375, 8.54248046875, 8.8203125]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 5.0, 1.0, 3.0, 3.0, 1.0, 13.0, 6.0, 10.0, 11.0, 13.0, 15.0, 23.0, 23.0, 20.0, 19.0, 36.0, 38.0, 43.0, 77.0, 140.0, 389.0, 1828.0, 937768.0, 2202051.0, 2164.0, 420.0, 180.0, 67.0, 57.0, 40.0, 41.0, 30.0, 25.0, 32.0, 23.0, 15.0, 22.0, 10.0, 12.0, 10.0, 5.0, 6.0, 3.0, 4.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-37.46875, -36.26123046875, -35.0537109375, -33.84619140625, -32.638671875, -31.43115234375, -30.2236328125, -29.01611328125, -27.80859375, -26.60107421875, -25.3935546875, -24.18603515625, -22.978515625, -21.77099609375, -20.5634765625, -19.35595703125, -18.1484375, -16.94091796875, -15.7333984375, -14.52587890625, -13.318359375, -12.11083984375, -10.9033203125, -9.69580078125, -8.48828125, -7.28076171875, -6.0732421875, -4.86572265625, -3.658203125, -2.45068359375, -1.2431640625, -0.03564453125, 1.171875, 2.37939453125, 3.5869140625, 4.79443359375, 6.001953125, 7.20947265625, 8.4169921875, 9.62451171875, 10.83203125, 12.03955078125, 13.2470703125, 14.45458984375, 15.662109375, 16.86962890625, 18.0771484375, 19.28466796875, 20.4921875, 21.69970703125, 22.9072265625, 24.11474609375, 25.322265625, 26.52978515625, 27.7373046875, 28.94482421875, 30.15234375, 31.35986328125, 32.5673828125, 33.77490234375, 34.982421875, 36.18994140625, 37.3974609375, 38.60498046875, 39.8125]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 826.0, 191.0, 2.0, 1.0, 1.0], "bins": [-514.5261840820312, -505.9359130859375, -497.34564208984375, -488.75537109375, -480.16510009765625, -471.5748291015625, -462.98455810546875, -454.394287109375, -445.80401611328125, -437.2137451171875, -428.62347412109375, -420.033203125, -411.44293212890625, -402.8526611328125, -394.26239013671875, -385.672119140625, -377.0818176269531, -368.4915466308594, -359.9012756347656, -351.3110046386719, -342.7207336425781, -334.1304626464844, -325.5401916503906, -316.94989013671875, -308.359619140625, -299.76934814453125, -291.1790771484375, -282.58880615234375, -273.99853515625, -265.40826416015625, -256.8179931640625, -248.2277069091797, -239.637451171875, -231.04718017578125, -222.4569091796875, -213.86663818359375, -205.2763671875, -196.68609619140625, -188.09580993652344, -179.5055389404297, -170.91526794433594, -162.3249969482422, -153.73472595214844, -145.1444549560547, -136.55416870117188, -127.96390533447266, -119.37362670898438, -110.78335571289062, -102.19308471679688, -93.60281372070312, -85.01254272460938, -76.4222640991211, -67.83199310302734, -59.241722106933594, -50.65144729614258, -42.06117248535156, -33.47090530395508, -24.880632400512695, -16.290359497070312, -7.70008659362793, 0.8901863098144531, 9.480457305908203, 18.07073211669922, 26.661006927490234, 35.251277923583984]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 7.0, 11.0, 7.0, 10.0, 9.0, 6.0, 21.0, 17.0, 11.0, 15.0, 23.0, 30.0, 38.0, 42.0, 29.0, 47.0, 35.0, 39.0, 37.0, 44.0, 48.0, 41.0, 24.0, 42.0, 42.0, 47.0, 40.0, 37.0, 21.0, 32.0, 20.0, 25.0, 16.0, 22.0, 8.0, 16.0, 9.0, 10.0, 10.0, 6.0, 3.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.235851287841797, -29.38324546813965, -28.530641555786133, -27.678035736083984, -26.82543182373047, -25.97282600402832, -25.120220184326172, -24.267616271972656, -23.415010452270508, -22.56240463256836, -21.709800720214844, -20.857194900512695, -20.00459098815918, -19.15198516845703, -18.299381256103516, -17.446775436401367, -16.59416961669922, -15.741564750671387, -14.888959884643555, -14.036354064941406, -13.183749198913574, -12.331144332885742, -11.47853946685791, -10.625934600830078, -9.773330688476562, -8.92072582244873, -8.068120956420898, -7.215515613555908, -6.362910270690918, -5.510305404663086, -4.657700538635254, -3.8050951957702637, -2.9524898529052734, -2.0998847484588623, -1.2472797632217407, -0.39467477798461914, 0.457930326461792, 1.3105354309082031, 2.163140296936035, 3.0157456398010254, 3.8683505058288574, 4.7209553718566895, 5.57356071472168, 6.426165580749512, 7.278770446777344, 8.131376266479492, 8.983980178833008, 9.836585998535156, 10.689190864562988, 11.54179573059082, 12.394400596618652, 13.247005462646484, 14.099611282348633, 14.952216148376465, 15.804821014404297, 16.657426834106445, 17.51003074645996, 18.36263656616211, 19.215240478515625, 20.067846298217773, 20.92045021057129, 21.773056030273438, 22.625659942626953, 23.4782657623291, 24.33087158203125]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 5.0, 7.0, 8.0, 11.0, 14.0, 6.0, 12.0, 16.0, 18.0, 17.0, 14.0, 24.0, 26.0, 20.0, 30.0, 27.0, 36.0, 34.0, 42.0, 38.0, 59.0, 46.0, 46.0, 35.0, 37.0, 30.0, 29.0, 36.0, 38.0, 32.0, 30.0, 35.0, 20.0, 24.0, 17.0, 19.0, 12.0, 13.0, 10.0, 4.0, 8.0, 3.0, 3.0, 4.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.892578125, -2.80419921875, -2.7158203125, -2.62744140625, -2.5390625, -2.45068359375, -2.3623046875, -2.27392578125, -2.185546875, -2.09716796875, -2.0087890625, -1.92041015625, -1.83203125, -1.74365234375, -1.6552734375, -1.56689453125, -1.478515625, -1.39013671875, -1.3017578125, -1.21337890625, -1.125, -1.03662109375, -0.9482421875, -0.85986328125, -0.771484375, -0.68310546875, -0.5947265625, -0.50634765625, -0.41796875, -0.32958984375, -0.2412109375, -0.15283203125, -0.064453125, 0.02392578125, 0.1123046875, 0.20068359375, 0.2890625, 0.37744140625, 0.4658203125, 0.55419921875, 0.642578125, 0.73095703125, 0.8193359375, 0.90771484375, 0.99609375, 1.08447265625, 1.1728515625, 1.26123046875, 1.349609375, 1.43798828125, 1.5263671875, 1.61474609375, 1.703125, 1.79150390625, 1.8798828125, 1.96826171875, 2.056640625, 2.14501953125, 2.2333984375, 2.32177734375, 2.41015625, 2.49853515625, 2.5869140625, 2.67529296875, 2.763671875]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 6.0, 8.0, 6.0, 15.0, 10.0, 16.0, 13.0, 24.0, 35.0, 57.0, 51.0, 110.0, 111.0, 175.0, 241.0, 354.0, 609.0, 1058.0, 1877.0, 3503.0, 7508.0, 19865.0, 79653.0, 778175.0, 2899368.0, 326942.0, 48385.0, 13945.0, 5637.0, 2744.0, 1466.0, 814.0, 463.0, 298.0, 225.0, 149.0, 104.0, 74.0, 45.0, 39.0, 23.0, 23.0, 14.0, 5.0, 8.0, 12.0, 5.0, 7.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 2.0], "bins": [-13.7109375, -13.2996826171875, -12.888427734375, -12.4771728515625, -12.06591796875, -11.6546630859375, -11.243408203125, -10.8321533203125, -10.4208984375, -10.0096435546875, -9.598388671875, -9.1871337890625, -8.77587890625, -8.3646240234375, -7.953369140625, -7.5421142578125, -7.130859375, -6.7196044921875, -6.308349609375, -5.8970947265625, -5.48583984375, -5.0745849609375, -4.663330078125, -4.2520751953125, -3.8408203125, -3.4295654296875, -3.018310546875, -2.6070556640625, -2.19580078125, -1.7845458984375, -1.373291015625, -0.9620361328125, -0.55078125, -0.1395263671875, 0.271728515625, 0.6829833984375, 1.09423828125, 1.5054931640625, 1.916748046875, 2.3280029296875, 2.7392578125, 3.1505126953125, 3.561767578125, 3.9730224609375, 4.38427734375, 4.7955322265625, 5.206787109375, 5.6180419921875, 6.029296875, 6.4405517578125, 6.851806640625, 7.2630615234375, 7.67431640625, 8.0855712890625, 8.496826171875, 8.9080810546875, 9.3193359375, 9.7305908203125, 10.141845703125, 10.5531005859375, 10.96435546875, 11.3756103515625, 11.786865234375, 12.1981201171875, 12.609375]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 6.0, 13.0, 11.0, 12.0, 25.0, 45.0, 53.0, 66.0, 92.0, 155.0, 214.0, 324.0, 477.0, 574.0, 604.0, 455.0, 357.0, 205.0, 120.0, 96.0, 60.0, 39.0, 33.0, 22.0, 10.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.46875, -15.9697265625, -15.470703125, -14.9716796875, -14.47265625, -13.9736328125, -13.474609375, -12.9755859375, -12.4765625, -11.9775390625, -11.478515625, -10.9794921875, -10.48046875, -9.9814453125, -9.482421875, -8.9833984375, -8.484375, -7.9853515625, -7.486328125, -6.9873046875, -6.48828125, -5.9892578125, -5.490234375, -4.9912109375, -4.4921875, -3.9931640625, -3.494140625, -2.9951171875, -2.49609375, -1.9970703125, -1.498046875, -0.9990234375, -0.5, -0.0009765625, 0.498046875, 0.9970703125, 1.49609375, 1.9951171875, 2.494140625, 2.9931640625, 3.4921875, 3.9912109375, 4.490234375, 4.9892578125, 5.48828125, 5.9873046875, 6.486328125, 6.9853515625, 7.484375, 7.9833984375, 8.482421875, 8.9814453125, 9.48046875, 9.9794921875, 10.478515625, 10.9775390625, 11.4765625, 11.9755859375, 12.474609375, 12.9736328125, 13.47265625, 13.9716796875, 14.470703125, 14.9697265625, 15.46875]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 11.0, 10.0, 22.0, 25.0, 48.0, 62.0, 108.0, 212.0, 541.0, 2429.0, 1561779.0, 2624873.0, 2872.0, 600.0, 263.0, 153.0, 94.0, 58.0, 42.0, 26.0, 15.0, 15.0, 9.0, 8.0, 2.0, 7.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.0, -70.6474609375, -68.294921875, -65.9423828125, -63.58984375, -61.2373046875, -58.884765625, -56.5322265625, -54.1796875, -51.8271484375, -49.474609375, -47.1220703125, -44.76953125, -42.4169921875, -40.064453125, -37.7119140625, -35.359375, -33.0068359375, -30.654296875, -28.3017578125, -25.94921875, -23.5966796875, -21.244140625, -18.8916015625, -16.5390625, -14.1865234375, -11.833984375, -9.4814453125, -7.12890625, -4.7763671875, -2.423828125, -0.0712890625, 2.28125, 4.6337890625, 6.986328125, 9.3388671875, 11.69140625, 14.0439453125, 16.396484375, 18.7490234375, 21.1015625, 23.4541015625, 25.806640625, 28.1591796875, 30.51171875, 32.8642578125, 35.216796875, 37.5693359375, 39.921875, 42.2744140625, 44.626953125, 46.9794921875, 49.33203125, 51.6845703125, 54.037109375, 56.3896484375, 58.7421875, 61.0947265625, 63.447265625, 65.7998046875, 68.15234375, 70.5048828125, 72.857421875, 75.2099609375, 77.5625]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 14.0, 65.0, 237.0, 368.0, 251.0, 67.0, 9.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-164.59982299804688, -161.06324768066406, -157.5266876220703, -153.9901123046875, -150.45355224609375, -146.91697692871094, -143.38040161132812, -139.84384155273438, -136.30726623535156, -132.77069091796875, -129.234130859375, -125.69755554199219, -122.1609878540039, -118.62442016601562, -115.08785247802734, -111.55128479003906, -108.01472473144531, -104.47815704345703, -100.94158935546875, -97.40501403808594, -93.86844635009766, -90.33187866210938, -86.7953109741211, -83.25874328613281, -79.72216796875, -76.18560028076172, -72.64903259277344, -69.11245727539062, -65.57588958740234, -62.03932189941406, -58.50275421142578, -54.9661865234375, -51.42961502075195, -47.89304733276367, -44.356475830078125, -40.819908142089844, -37.28334045410156, -33.74677276611328, -30.210201263427734, -26.673633575439453, -23.13706398010254, -19.600494384765625, -16.063926696777344, -12.52735710144043, -8.990788459777832, -5.454219818115234, -1.9176502227783203, 1.618917465209961, 5.155487060546875, 8.692055702209473, 12.22862434387207, 15.765193939208984, 19.301761627197266, 22.83833122253418, 26.374900817871094, 29.911468505859375, 33.448036193847656, 36.98460388183594, 40.521175384521484, 44.057743072509766, 47.59431076049805, 51.130882263183594, 54.667449951171875, 58.204017639160156, 61.7405891418457]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 6.0, 12.0, 16.0, 9.0, 12.0, 15.0, 19.0, 21.0, 23.0, 16.0, 31.0, 27.0, 27.0, 38.0, 27.0, 39.0, 25.0, 47.0, 46.0, 51.0, 43.0, 42.0, 39.0, 29.0, 40.0, 41.0, 29.0, 35.0, 23.0, 22.0, 22.0, 16.0, 22.0, 19.0, 14.0, 18.0, 5.0, 6.0, 8.0, 4.0, 5.0, 4.0, 6.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.191436767578125, -43.72285461425781, -42.2542724609375, -40.78569030761719, -39.31710433959961, -37.8485221862793, -36.379940032958984, -34.91135787963867, -33.44277572631836, -31.974193572998047, -30.5056095123291, -29.03702735900879, -27.568445205688477, -26.09986114501953, -24.63127899169922, -23.162696838378906, -21.69411277770996, -20.22553062438965, -18.756946563720703, -17.28836441040039, -15.819782257080078, -14.35119915008545, -12.88261604309082, -11.414033889770508, -9.945450782775879, -8.47686767578125, -7.0082855224609375, -5.539702415466309, -4.071119785308838, -2.602537155151367, -1.1339540481567383, 0.3346281051635742, 1.8032112121582031, 3.271793842315674, 4.7403764724731445, 6.208959579467773, 7.677542209625244, 9.146124839782715, 10.614707946777344, 12.083290100097656, 13.551873207092285, 15.020456314086914, 16.489038467407227, 17.957622528076172, 19.426204681396484, 20.894786834716797, 22.36336898803711, 23.831951141357422, 25.300535202026367, 26.76911735534668, 28.237701416015625, 29.706283569335938, 31.17486572265625, 32.64344787597656, 34.112030029296875, 35.58061218261719, 37.049198150634766, 38.51778030395508, 39.98636245727539, 41.45494842529297, 42.92353057861328, 44.392112731933594, 45.860694885253906, 47.32927703857422, 48.79785919189453]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 7.0, 7.0, 8.0, 9.0, 13.0, 9.0, 10.0, 8.0, 12.0, 20.0, 18.0, 25.0, 17.0, 28.0, 32.0, 26.0, 32.0, 28.0, 35.0, 47.0, 44.0, 38.0, 45.0, 42.0, 36.0, 41.0, 38.0, 37.0, 34.0, 27.0, 45.0, 34.0, 23.0, 21.0, 16.0, 14.0, 20.0, 13.0, 7.0, 12.0, 6.0, 7.0, 3.0, 3.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0], "bins": [-3.24609375, -3.1541748046875, -3.062255859375, -2.9703369140625, -2.87841796875, -2.7864990234375, -2.694580078125, -2.6026611328125, -2.5107421875, -2.4188232421875, -2.326904296875, -2.2349853515625, -2.14306640625, -2.0511474609375, -1.959228515625, -1.8673095703125, -1.775390625, -1.6834716796875, -1.591552734375, -1.4996337890625, -1.40771484375, -1.3157958984375, -1.223876953125, -1.1319580078125, -1.0400390625, -0.9481201171875, -0.856201171875, -0.7642822265625, -0.67236328125, -0.5804443359375, -0.488525390625, -0.3966064453125, -0.3046875, -0.2127685546875, -0.120849609375, -0.0289306640625, 0.06298828125, 0.1549072265625, 0.246826171875, 0.3387451171875, 0.4306640625, 0.5225830078125, 0.614501953125, 0.7064208984375, 0.79833984375, 0.8902587890625, 0.982177734375, 1.0740966796875, 1.166015625, 1.2579345703125, 1.349853515625, 1.4417724609375, 1.53369140625, 1.6256103515625, 1.717529296875, 1.8094482421875, 1.9013671875, 1.9932861328125, 2.085205078125, 2.1771240234375, 2.26904296875, 2.3609619140625, 2.452880859375, 2.5447998046875, 2.63671875]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 5.0, 5.0, 1.0, 3.0, 2.0, 26.0, 12.0, 22.0, 40.0, 64.0, 78.0, 112.0, 171.0, 253.0, 286.0, 451.0, 640.0, 872.0, 1294.0, 1803.0, 2484.0, 3595.0, 5346.0, 7594.0, 10895.0, 16436.0, 25164.0, 39452.0, 63357.0, 101761.0, 154299.0, 190031.0, 150290.0, 97954.0, 61078.0, 38199.0, 24456.0, 15732.0, 10227.0, 7310.0, 4843.0, 3519.0, 2424.0, 1798.0, 1163.0, 846.0, 677.0, 452.0, 325.0, 214.0, 150.0, 88.0, 89.0, 55.0, 43.0, 25.0, 25.0, 7.0, 8.0, 6.0, 10.0, 3.0, 3.0], "bins": [-0.296142578125, -0.287017822265625, -0.27789306640625, -0.268768310546875, -0.2596435546875, -0.250518798828125, -0.24139404296875, -0.232269287109375, -0.22314453125, -0.214019775390625, -0.20489501953125, -0.195770263671875, -0.1866455078125, -0.177520751953125, -0.16839599609375, -0.159271240234375, -0.150146484375, -0.141021728515625, -0.13189697265625, -0.122772216796875, -0.1136474609375, -0.104522705078125, -0.09539794921875, -0.086273193359375, -0.0771484375, -0.068023681640625, -0.05889892578125, -0.049774169921875, -0.0406494140625, -0.031524658203125, -0.02239990234375, -0.013275146484375, -0.004150390625, 0.004974365234375, 0.01409912109375, 0.023223876953125, 0.0323486328125, 0.041473388671875, 0.05059814453125, 0.059722900390625, 0.06884765625, 0.077972412109375, 0.08709716796875, 0.096221923828125, 0.1053466796875, 0.114471435546875, 0.12359619140625, 0.132720947265625, 0.141845703125, 0.150970458984375, 0.16009521484375, 0.169219970703125, 0.1783447265625, 0.187469482421875, 0.19659423828125, 0.205718994140625, 0.21484375, 0.223968505859375, 0.23309326171875, 0.242218017578125, 0.2513427734375, 0.260467529296875, 0.26959228515625, 0.278717041015625, 0.287841796875]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 5.0, 3.0, 11.0, 7.0, 8.0, 9.0, 15.0, 21.0, 15.0, 24.0, 26.0, 22.0, 32.0, 28.0, 24.0, 40.0, 38.0, 51.0, 43.0, 43.0, 1071.0, 49.0, 43.0, 43.0, 36.0, 47.0, 40.0, 32.0, 30.0, 28.0, 27.0, 17.0, 24.0, 11.0, 13.0, 10.0, 7.0, 8.0, 9.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.216796875, -2.15228271484375, -2.0877685546875, -2.02325439453125, -1.958740234375, -1.89422607421875, -1.8297119140625, -1.76519775390625, -1.70068359375, -1.63616943359375, -1.5716552734375, -1.50714111328125, -1.442626953125, -1.37811279296875, -1.3135986328125, -1.24908447265625, -1.1845703125, -1.12005615234375, -1.0555419921875, -0.99102783203125, -0.926513671875, -0.86199951171875, -0.7974853515625, -0.73297119140625, -0.66845703125, -0.60394287109375, -0.5394287109375, -0.47491455078125, -0.410400390625, -0.34588623046875, -0.2813720703125, -0.21685791015625, -0.15234375, -0.08782958984375, -0.0233154296875, 0.04119873046875, 0.105712890625, 0.17022705078125, 0.2347412109375, 0.29925537109375, 0.36376953125, 0.42828369140625, 0.4927978515625, 0.55731201171875, 0.621826171875, 0.68634033203125, 0.7508544921875, 0.81536865234375, 0.8798828125, 0.94439697265625, 1.0089111328125, 1.07342529296875, 1.137939453125, 1.20245361328125, 1.2669677734375, 1.33148193359375, 1.39599609375, 1.46051025390625, 1.5250244140625, 1.58953857421875, 1.654052734375, 1.71856689453125, 1.7830810546875, 1.84759521484375, 1.912109375]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 0.0, 6.0, 5.0, 7.0, 8.0, 11.0, 19.0, 34.0, 51.0, 79.0, 115.0, 192.0, 264.0, 424.0, 704.0, 1060.0, 1681.0, 2778.0, 4632.0, 7439.0, 12176.0, 20805.0, 34792.0, 59033.0, 97904.0, 148988.0, 1234082.0, 168918.0, 119160.0, 73449.0, 43673.0, 25545.0, 15276.0, 9227.0, 5485.0, 3399.0, 2082.0, 1329.0, 824.0, 542.0, 309.0, 225.0, 143.0, 92.0, 58.0, 40.0, 21.0, 18.0, 16.0, 4.0, 8.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2464599609375, -0.2384357452392578, -0.23041152954101562, -0.22238731384277344, -0.21436309814453125, -0.20633888244628906, -0.19831466674804688, -0.1902904510498047, -0.1822662353515625, -0.1742420196533203, -0.16621780395507812, -0.15819358825683594, -0.15016937255859375, -0.14214515686035156, -0.13412094116210938, -0.1260967254638672, -0.118072509765625, -0.11004829406738281, -0.10202407836914062, -0.09399986267089844, -0.08597564697265625, -0.07795143127441406, -0.06992721557617188, -0.06190299987792969, -0.0538787841796875, -0.04585456848144531, -0.037830352783203125, -0.029806137084960938, -0.02178192138671875, -0.013757705688476562, -0.005733489990234375, 0.0022907257080078125, 0.01031494140625, 0.018339157104492188, 0.026363372802734375, 0.03438758850097656, 0.04241180419921875, 0.05043601989746094, 0.058460235595703125, 0.06648445129394531, 0.0745086669921875, 0.08253288269042969, 0.09055709838867188, 0.09858131408691406, 0.10660552978515625, 0.11462974548339844, 0.12265396118164062, 0.1306781768798828, 0.138702392578125, 0.1467266082763672, 0.15475082397460938, 0.16277503967285156, 0.17079925537109375, 0.17882347106933594, 0.18684768676757812, 0.1948719024658203, 0.2028961181640625, 0.2109203338623047, 0.21894454956054688, 0.22696876525878906, 0.23499298095703125, 0.24301719665527344, 0.2510414123535156, 0.2590656280517578, 0.26708984375]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 4.0, 5.0, 9.0, 11.0, 15.0, 17.0, 14.0, 31.0, 32.0, 41.0, 34.0, 58.0, 60.0, 81.0, 67.0, 60.0, 62.0, 69.0, 58.0, 62.0, 40.0, 41.0, 31.0, 19.0, 17.0, 19.0, 16.0, 7.0, 11.0, 7.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010042190551757812, -0.0009712129831314087, -0.0009382069110870361, -0.0009052008390426636, -0.000872194766998291, -0.0008391886949539185, -0.0008061826229095459, -0.0007731765508651733, -0.0007401704788208008, -0.0007071644067764282, -0.0006741583347320557, -0.0006411522626876831, -0.0006081461906433105, -0.000575140118598938, -0.0005421340465545654, -0.0005091279745101929, -0.0004761219024658203, -0.00044311583042144775, -0.0004101097583770752, -0.00037710368633270264, -0.0003440976142883301, -0.0003110915422439575, -0.00027808547019958496, -0.0002450793981552124, -0.00021207332611083984, -0.00017906725406646729, -0.00014606118202209473, -0.00011305510997772217, -8.004903793334961e-05, -4.704296588897705e-05, -1.4036893844604492e-05, 1.8969178199768066e-05, 5.1975250244140625e-05, 8.498132228851318e-05, 0.00011798739433288574, 0.0001509934663772583, 0.00018399953842163086, 0.00021700561046600342, 0.000250011682510376, 0.00028301775455474854, 0.0003160238265991211, 0.00034902989864349365, 0.0003820359706878662, 0.00041504204273223877, 0.00044804811477661133, 0.0004810541868209839, 0.0005140602588653564, 0.000547066330909729, 0.0005800724029541016, 0.0006130784749984741, 0.0006460845470428467, 0.0006790906190872192, 0.0007120966911315918, 0.0007451027631759644, 0.0007781088352203369, 0.0008111149072647095, 0.000844120979309082, 0.0008771270513534546, 0.0009101331233978271, 0.0009431391954421997, 0.0009761452674865723, 0.0010091513395309448, 0.0010421574115753174, 0.00107516348361969, 0.0011081695556640625]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 6.0, 3.0, 0.0, 9.0, 6.0, 6.0, 10.0, 7.0, 23.0, 21.0, 39.0, 54.0, 65.0, 95.0, 102.0, 173.0, 235.0, 373.0, 1080.0, 731996.0, 312217.0, 877.0, 355.0, 190.0, 172.0, 115.0, 89.0, 81.0, 42.0, 32.0, 25.0, 18.0, 15.0, 9.0, 8.0, 4.0, 3.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.023345947265625, -0.022696495056152344, -0.022047042846679688, -0.02139759063720703, -0.020748138427734375, -0.02009868621826172, -0.019449234008789062, -0.018799781799316406, -0.01815032958984375, -0.017500877380371094, -0.016851425170898438, -0.01620197296142578, -0.015552520751953125, -0.014903068542480469, -0.014253616333007812, -0.013604164123535156, -0.0129547119140625, -0.012305259704589844, -0.011655807495117188, -0.011006355285644531, -0.010356903076171875, -0.009707450866699219, -0.009057998657226562, -0.008408546447753906, -0.00775909423828125, -0.007109642028808594, -0.0064601898193359375, -0.005810737609863281, -0.005161285400390625, -0.004511833190917969, -0.0038623809814453125, -0.0032129287719726562, -0.0025634765625, -0.0019140243530273438, -0.0012645721435546875, -0.0006151199340820312, 3.4332275390625e-05, 0.0006837844848632812, 0.0013332366943359375, 0.0019826889038085938, 0.00263214111328125, 0.0032815933227539062, 0.0039310455322265625, 0.004580497741699219, 0.005229949951171875, 0.005879402160644531, 0.0065288543701171875, 0.007178306579589844, 0.0078277587890625, 0.008477210998535156, 0.009126663208007812, 0.009776115417480469, 0.010425567626953125, 0.011075019836425781, 0.011724472045898438, 0.012373924255371094, 0.01302337646484375, 0.013672828674316406, 0.014322280883789062, 0.014971733093261719, 0.015621185302734375, 0.01627063751220703, 0.016920089721679688, 0.017569541931152344, 0.018218994140625]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 811.0, 207.0, 0.0, 0.0, 1.0], "bins": [-0.017217513173818588, -0.016929911449551582, -0.016642309725284576, -0.01635470800101757, -0.016067106276750565, -0.01577950455248356, -0.015491901896893978, -0.015204300172626972, -0.014916698448359966, -0.01462909672409296, -0.014341494999825954, -0.014053892344236374, -0.013766290619969368, -0.013478688895702362, -0.013191087171435356, -0.01290348544716835, -0.012615883722901344, -0.012328281998634338, -0.012040680274367332, -0.011753078550100327, -0.011465475894510746, -0.01117787417024374, -0.010890272445976734, -0.010602670721709728, -0.010315068066120148, -0.010027466341853142, -0.009739864617586136, -0.00945226289331913, -0.00916466023772955, -0.008877058513462543, -0.008589456789195538, -0.008301855064928532, -0.008014253340661526, -0.00772665161639452, -0.007439049426466227, -0.007151447702199221, -0.006863845977932215, -0.0065762437880039215, -0.006288642063736916, -0.00600104033946991, -0.005713438615202904, -0.005425836890935898, -0.005138234701007605, -0.004850632976740599, -0.004563031252473593, -0.0042754290625452995, -0.003987827338278294, -0.0037002256140112877, -0.0034126238897442818, -0.003125021932646632, -0.0028374202083796263, -0.0025498182512819767, -0.0022622165270149708, -0.001974614569917321, -0.0016870126128196716, -0.0013994108885526657, -0.0011118088150396943, -0.0008242069743573666, -0.0005366050754673779, -0.00024900317657738924, 3.859866410493851e-05, 0.00032620050478726625, 0.0006138024618849158, 0.0009014041861519217, 0.0011890061432495713]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 1.0, 8.0, 10.0, 11.0, 19.0, 28.0, 20.0, 22.0, 27.0, 31.0, 34.0, 44.0, 40.0, 28.0, 33.0, 67.0, 42.0, 50.0, 41.0, 54.0, 50.0, 40.0, 47.0, 29.0, 42.0, 31.0, 28.0, 28.0, 19.0, 15.0, 16.0, 10.0, 9.0, 2.0, 8.0, 4.0, 5.0, 6.0, 2.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00046622753143310547, -0.0004495270550251007, -0.00043282657861709595, -0.0004161261022090912, -0.0003994256258010864, -0.00038272514939308167, -0.0003660246729850769, -0.00034932419657707214, -0.0003326237201690674, -0.0003159232437610626, -0.00029922276735305786, -0.0002825222909450531, -0.00026582181453704834, -0.0002491213381290436, -0.00023242086172103882, -0.00021572038531303406, -0.0001990199089050293, -0.00018231943249702454, -0.00016561895608901978, -0.00014891847968101501, -0.00013221800327301025, -0.00011551752686500549, -9.881705045700073e-05, -8.211657404899597e-05, -6.541609764099121e-05, -4.871562123298645e-05, -3.201514482498169e-05, -1.531466841697693e-05, 1.385807991027832e-06, 1.8086284399032593e-05, 3.4786760807037354e-05, 5.1487237215042114e-05, 6.818771362304688e-05, 8.488819003105164e-05, 0.0001015886664390564, 0.00011828914284706116, 0.00013498961925506592, 0.00015169009566307068, 0.00016839057207107544, 0.0001850910484790802, 0.00020179152488708496, 0.00021849200129508972, 0.00023519247770309448, 0.00025189295411109924, 0.000268593430519104, 0.00028529390692710876, 0.0003019943833351135, 0.0003186948597431183, 0.00033539533615112305, 0.0003520958125591278, 0.00036879628896713257, 0.00038549676537513733, 0.0004021972417831421, 0.00041889771819114685, 0.0004355981945991516, 0.00045229867100715637, 0.00046899914741516113, 0.0004856996238231659, 0.0005024001002311707, 0.0005191005766391754, 0.0005358010530471802, 0.0005525015294551849, 0.0005692020058631897, 0.0005859024822711945, 0.0006026029586791992]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 7.0, 7.0, 8.0, 9.0, 13.0, 9.0, 10.0, 8.0, 12.0, 20.0, 18.0, 25.0, 17.0, 28.0, 32.0, 26.0, 32.0, 28.0, 35.0, 47.0, 44.0, 38.0, 45.0, 42.0, 36.0, 41.0, 38.0, 37.0, 34.0, 27.0, 45.0, 34.0, 23.0, 21.0, 16.0, 14.0, 20.0, 13.0, 7.0, 12.0, 6.0, 7.0, 3.0, 3.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0], "bins": [-3.24609375, -3.1541748046875, -3.062255859375, -2.9703369140625, -2.87841796875, -2.7864990234375, -2.694580078125, -2.6026611328125, -2.5107421875, -2.4188232421875, -2.326904296875, -2.2349853515625, -2.14306640625, -2.0511474609375, -1.959228515625, -1.8673095703125, -1.775390625, -1.6834716796875, -1.591552734375, -1.4996337890625, -1.40771484375, -1.3157958984375, -1.223876953125, -1.1319580078125, -1.0400390625, -0.9481201171875, -0.856201171875, -0.7642822265625, -0.67236328125, -0.5804443359375, -0.488525390625, -0.3966064453125, -0.3046875, -0.2127685546875, -0.120849609375, -0.0289306640625, 0.06298828125, 0.1549072265625, 0.246826171875, 0.3387451171875, 0.4306640625, 0.5225830078125, 0.614501953125, 0.7064208984375, 0.79833984375, 0.8902587890625, 0.982177734375, 1.0740966796875, 1.166015625, 1.2579345703125, 1.349853515625, 1.4417724609375, 1.53369140625, 1.6256103515625, 1.717529296875, 1.8094482421875, 1.9013671875, 1.9932861328125, 2.085205078125, 2.1771240234375, 2.26904296875, 2.3609619140625, 2.452880859375, 2.5447998046875, 2.63671875]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 7.0, 5.0, 10.0, 17.0, 22.0, 19.0, 38.0, 38.0, 44.0, 86.0, 114.0, 142.0, 204.0, 281.0, 433.0, 687.0, 1339.0, 2701.0, 6341.0, 17451.0, 52963.0, 173754.0, 423534.0, 249896.0, 77005.0, 24980.0, 8699.0, 3513.0, 1683.0, 885.0, 482.0, 338.0, 260.0, 168.0, 117.0, 70.0, 69.0, 47.0, 32.0, 26.0, 14.0, 13.0, 8.0, 4.0, 7.0, 5.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-3.265625, -3.168609619140625, -3.07159423828125, -2.974578857421875, -2.8775634765625, -2.780548095703125, -2.68353271484375, -2.586517333984375, -2.489501953125, -2.392486572265625, -2.29547119140625, -2.198455810546875, -2.1014404296875, -2.004425048828125, -1.90740966796875, -1.810394287109375, -1.71337890625, -1.616363525390625, -1.51934814453125, -1.422332763671875, -1.3253173828125, -1.228302001953125, -1.13128662109375, -1.034271240234375, -0.937255859375, -0.840240478515625, -0.74322509765625, -0.646209716796875, -0.5491943359375, -0.452178955078125, -0.35516357421875, -0.258148193359375, -0.1611328125, -0.064117431640625, 0.03289794921875, 0.129913330078125, 0.2269287109375, 0.323944091796875, 0.42095947265625, 0.517974853515625, 0.614990234375, 0.712005615234375, 0.80902099609375, 0.906036376953125, 1.0030517578125, 1.100067138671875, 1.19708251953125, 1.294097900390625, 1.39111328125, 1.488128662109375, 1.58514404296875, 1.682159423828125, 1.7791748046875, 1.876190185546875, 1.97320556640625, 2.070220947265625, 2.167236328125, 2.264251708984375, 2.36126708984375, 2.458282470703125, 2.5552978515625, 2.652313232421875, 2.74932861328125, 2.846343994140625, 2.943359375]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 7.0, 5.0, 5.0, 5.0, 9.0, 9.0, 10.0, 13.0, 13.0, 19.0, 22.0, 22.0, 34.0, 24.0, 20.0, 32.0, 38.0, 27.0, 38.0, 65.0, 66.0, 223.0, 1598.0, 241.0, 82.0, 50.0, 49.0, 37.0, 29.0, 44.0, 38.0, 29.0, 28.0, 22.0, 18.0, 12.0, 17.0, 10.0, 9.0, 10.0, 5.0, 2.0, 3.0, 3.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-10.828125, -10.5054931640625, -10.182861328125, -9.8602294921875, -9.53759765625, -9.2149658203125, -8.892333984375, -8.5697021484375, -8.2470703125, -7.9244384765625, -7.601806640625, -7.2791748046875, -6.95654296875, -6.6339111328125, -6.311279296875, -5.9886474609375, -5.666015625, -5.3433837890625, -5.020751953125, -4.6981201171875, -4.37548828125, -4.0528564453125, -3.730224609375, -3.4075927734375, -3.0849609375, -2.7623291015625, -2.439697265625, -2.1170654296875, -1.79443359375, -1.4718017578125, -1.149169921875, -0.8265380859375, -0.50390625, -0.1812744140625, 0.141357421875, 0.4639892578125, 0.78662109375, 1.1092529296875, 1.431884765625, 1.7545166015625, 2.0771484375, 2.3997802734375, 2.722412109375, 3.0450439453125, 3.36767578125, 3.6903076171875, 4.012939453125, 4.3355712890625, 4.658203125, 4.9808349609375, 5.303466796875, 5.6260986328125, 5.94873046875, 6.2713623046875, 6.593994140625, 6.9166259765625, 7.2392578125, 7.5618896484375, 7.884521484375, 8.2071533203125, 8.52978515625, 8.8524169921875, 9.175048828125, 9.4976806640625, 9.8203125]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 6.0, 1.0, 2.0, 4.0, 6.0, 5.0, 10.0, 14.0, 13.0, 11.0, 17.0, 18.0, 39.0, 30.0, 38.0, 60.0, 69.0, 95.0, 160.0, 343.0, 964.0, 10441.0, 3094080.0, 36668.0, 1454.0, 469.0, 190.0, 116.0, 70.0, 60.0, 43.0, 33.0, 25.0, 28.0, 28.0, 22.0, 13.0, 7.0, 10.0, 11.0, 7.0, 4.0, 9.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.515625, -21.7802734375, -21.044921875, -20.3095703125, -19.57421875, -18.8388671875, -18.103515625, -17.3681640625, -16.6328125, -15.8974609375, -15.162109375, -14.4267578125, -13.69140625, -12.9560546875, -12.220703125, -11.4853515625, -10.75, -10.0146484375, -9.279296875, -8.5439453125, -7.80859375, -7.0732421875, -6.337890625, -5.6025390625, -4.8671875, -4.1318359375, -3.396484375, -2.6611328125, -1.92578125, -1.1904296875, -0.455078125, 0.2802734375, 1.015625, 1.7509765625, 2.486328125, 3.2216796875, 3.95703125, 4.6923828125, 5.427734375, 6.1630859375, 6.8984375, 7.6337890625, 8.369140625, 9.1044921875, 9.83984375, 10.5751953125, 11.310546875, 12.0458984375, 12.78125, 13.5166015625, 14.251953125, 14.9873046875, 15.72265625, 16.4580078125, 17.193359375, 17.9287109375, 18.6640625, 19.3994140625, 20.134765625, 20.8701171875, 21.60546875, 22.3408203125, 23.076171875, 23.8115234375, 24.546875]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [572.0, 445.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.790811061859131, 0.052968740463256836, 3.8967485427856445, 7.740528583526611, 11.584308624267578, 15.42808723449707, 19.271867752075195, 23.115646362304688, 26.959426879882812, 30.803207397460938, 34.64698791503906, 38.49076843261719, 42.33454513549805, 46.17832565307617, 50.0221061706543, 53.865882873535156, 57.70966720581055, 61.55344772338867, 65.39722442626953, 69.24100494384766, 73.08478546142578, 76.9285659790039, 80.77234649658203, 84.61612701416016, 88.45990753173828, 92.3036880493164, 96.14746856689453, 99.99124908447266, 103.83502960205078, 107.67880249023438, 111.5225830078125, 115.36636352539062, 119.21013641357422, 123.05391693115234, 126.89769744873047, 130.74147033691406, 134.5852508544922, 138.4290313720703, 142.27281188964844, 146.11659240722656, 149.9603729248047, 153.8041534423828, 157.64793395996094, 161.49171447753906, 165.3354949951172, 169.1792755126953, 173.02305603027344, 176.86683654785156, 180.7106170654297, 184.5543975830078, 188.39817810058594, 192.24195861816406, 196.0857391357422, 199.9295196533203, 203.77330017089844, 207.61708068847656, 211.46084594726562, 215.30462646484375, 219.14840698242188, 222.9921875, 226.83596801757812, 230.67974853515625, 234.52352905273438, 238.3673095703125, 242.21109008789062]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 7.0, 7.0, 8.0, 8.0, 7.0, 13.0, 19.0, 24.0, 16.0, 30.0, 23.0, 27.0, 27.0, 34.0, 46.0, 34.0, 32.0, 43.0, 50.0, 37.0, 58.0, 38.0, 46.0, 44.0, 41.0, 37.0, 37.0, 30.0, 25.0, 20.0, 19.0, 13.0, 12.0, 12.0, 16.0, 13.0, 6.0, 9.0, 7.0, 1.0, 4.0, 7.0, 5.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-34.27735137939453, -33.21554946899414, -32.153743743896484, -31.091941833496094, -30.030139923095703, -28.96833610534668, -27.906532287597656, -26.844730377197266, -25.782926559448242, -24.72112274169922, -23.659320831298828, -22.597517013549805, -21.53571319580078, -20.47391128540039, -19.412107467651367, -18.350303649902344, -17.288501739501953, -16.22669792175293, -15.164896011352539, -14.103092193603516, -13.041289329528809, -11.979486465454102, -10.917682647705078, -9.855879783630371, -8.794076919555664, -7.732274055480957, -6.670470714569092, -5.608667373657227, -4.5468645095825195, -3.4850616455078125, -2.4232583045959473, -1.361454963684082, -0.299652099609375, 0.7621510028839111, 1.8239541053771973, 2.8857572078704834, 3.9475603103637695, 5.009363174438477, 6.071166515350342, 7.132969856262207, 8.194772720336914, 9.256575584411621, 10.318378448486328, 11.380182266235352, 12.441985130310059, 13.503787994384766, 14.565591812133789, 15.627394676208496, 16.689197540283203, 17.751001358032227, 18.812803268432617, 19.87460708618164, 20.93640899658203, 21.998212814331055, 23.060016632080078, 24.12181854248047, 25.183622360229492, 26.245426177978516, 27.307228088378906, 28.36903190612793, 29.430835723876953, 30.492637634277344, 31.554441452026367, 32.61624526977539, 33.67804718017578]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 8.0, 9.0, 5.0, 7.0, 8.0, 13.0, 9.0, 9.0, 12.0, 17.0, 18.0, 19.0, 16.0, 25.0, 22.0, 32.0, 27.0, 22.0, 35.0, 36.0, 40.0, 40.0, 30.0, 48.0, 36.0, 45.0, 34.0, 34.0, 30.0, 46.0, 31.0, 25.0, 38.0, 30.0, 23.0, 19.0, 17.0, 10.0, 19.0, 6.0, 10.0, 17.0, 6.0, 4.0, 8.0, 1.0, 3.0, 1.0, 4.0, 0.0, 0.0, 2.0, 3.0], "bins": [-3.048828125, -2.96026611328125, -2.8717041015625, -2.78314208984375, -2.694580078125, -2.60601806640625, -2.5174560546875, -2.42889404296875, -2.34033203125, -2.25177001953125, -2.1632080078125, -2.07464599609375, -1.986083984375, -1.89752197265625, -1.8089599609375, -1.72039794921875, -1.6318359375, -1.54327392578125, -1.4547119140625, -1.36614990234375, -1.277587890625, -1.18902587890625, -1.1004638671875, -1.01190185546875, -0.92333984375, -0.83477783203125, -0.7462158203125, -0.65765380859375, -0.569091796875, -0.48052978515625, -0.3919677734375, -0.30340576171875, -0.21484375, -0.12628173828125, -0.0377197265625, 0.05084228515625, 0.139404296875, 0.22796630859375, 0.3165283203125, 0.40509033203125, 0.49365234375, 0.58221435546875, 0.6707763671875, 0.75933837890625, 0.847900390625, 0.93646240234375, 1.0250244140625, 1.11358642578125, 1.2021484375, 1.29071044921875, 1.3792724609375, 1.46783447265625, 1.556396484375, 1.64495849609375, 1.7335205078125, 1.82208251953125, 1.91064453125, 1.99920654296875, 2.0877685546875, 2.17633056640625, 2.264892578125, 2.35345458984375, 2.4420166015625, 2.53057861328125, 2.619140625]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 5.0, 1.0, 4.0, 7.0, 6.0, 7.0, 13.0, 10.0, 18.0, 12.0, 20.0, 25.0, 19.0, 44.0, 53.0, 42.0, 63.0, 90.0, 159.0, 295.0, 731.0, 2591.0, 15352.0, 141118.0, 2084101.0, 1811594.0, 120235.0, 13506.0, 2552.0, 743.0, 305.0, 142.0, 121.0, 63.0, 36.0, 38.0, 41.0, 21.0, 22.0, 22.0, 17.0, 7.0, 8.0, 6.0, 6.0, 8.0, 3.0, 3.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.734375, -11.3673095703125, -11.000244140625, -10.6331787109375, -10.26611328125, -9.8990478515625, -9.531982421875, -9.1649169921875, -8.7978515625, -8.4307861328125, -8.063720703125, -7.6966552734375, -7.32958984375, -6.9625244140625, -6.595458984375, -6.2283935546875, -5.861328125, -5.4942626953125, -5.127197265625, -4.7601318359375, -4.39306640625, -4.0260009765625, -3.658935546875, -3.2918701171875, -2.9248046875, -2.5577392578125, -2.190673828125, -1.8236083984375, -1.45654296875, -1.0894775390625, -0.722412109375, -0.3553466796875, 0.01171875, 0.3787841796875, 0.745849609375, 1.1129150390625, 1.47998046875, 1.8470458984375, 2.214111328125, 2.5811767578125, 2.9482421875, 3.3153076171875, 3.682373046875, 4.0494384765625, 4.41650390625, 4.7835693359375, 5.150634765625, 5.5177001953125, 5.884765625, 6.2518310546875, 6.618896484375, 6.9859619140625, 7.35302734375, 7.7200927734375, 8.087158203125, 8.4542236328125, 8.8212890625, 9.1883544921875, 9.555419921875, 9.9224853515625, 10.28955078125, 10.6566162109375, 11.023681640625, 11.3907470703125, 11.7578125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 7.0, 8.0, 11.0, 18.0, 28.0, 36.0, 46.0, 64.0, 121.0, 139.0, 222.0, 293.0, 400.0, 489.0, 509.0, 458.0, 362.0, 257.0, 184.0, 137.0, 85.0, 59.0, 44.0, 37.0, 17.0, 18.0, 5.0, 6.0, 5.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.5625, -12.1605224609375, -11.758544921875, -11.3565673828125, -10.95458984375, -10.5526123046875, -10.150634765625, -9.7486572265625, -9.3466796875, -8.9447021484375, -8.542724609375, -8.1407470703125, -7.73876953125, -7.3367919921875, -6.934814453125, -6.5328369140625, -6.130859375, -5.7288818359375, -5.326904296875, -4.9249267578125, -4.52294921875, -4.1209716796875, -3.718994140625, -3.3170166015625, -2.9150390625, -2.5130615234375, -2.111083984375, -1.7091064453125, -1.30712890625, -0.9051513671875, -0.503173828125, -0.1011962890625, 0.30078125, 0.7027587890625, 1.104736328125, 1.5067138671875, 1.90869140625, 2.3106689453125, 2.712646484375, 3.1146240234375, 3.5166015625, 3.9185791015625, 4.320556640625, 4.7225341796875, 5.12451171875, 5.5264892578125, 5.928466796875, 6.3304443359375, 6.732421875, 7.1343994140625, 7.536376953125, 7.9383544921875, 8.34033203125, 8.7423095703125, 9.144287109375, 9.5462646484375, 9.9482421875, 10.3502197265625, 10.752197265625, 11.1541748046875, 11.55615234375, 11.9581298828125, 12.360107421875, 12.7620849609375, 13.1640625]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 7.0, 11.0, 7.0, 16.0, 17.0, 31.0, 55.0, 58.0, 93.0, 142.0, 268.0, 591.0, 2039.0, 24765.0, 2410212.0, 1733886.0, 19134.0, 1708.0, 523.0, 265.0, 142.0, 90.0, 58.0, 53.0, 40.0, 14.0, 10.0, 13.0, 8.0, 6.0, 8.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-34.46875, -33.318359375, -32.16796875, -31.017578125, -29.8671875, -28.716796875, -27.56640625, -26.416015625, -25.265625, -24.115234375, -22.96484375, -21.814453125, -20.6640625, -19.513671875, -18.36328125, -17.212890625, -16.0625, -14.912109375, -13.76171875, -12.611328125, -11.4609375, -10.310546875, -9.16015625, -8.009765625, -6.859375, -5.708984375, -4.55859375, -3.408203125, -2.2578125, -1.107421875, 0.04296875, 1.193359375, 2.34375, 3.494140625, 4.64453125, 5.794921875, 6.9453125, 8.095703125, 9.24609375, 10.396484375, 11.546875, 12.697265625, 13.84765625, 14.998046875, 16.1484375, 17.298828125, 18.44921875, 19.599609375, 20.75, 21.900390625, 23.05078125, 24.201171875, 25.3515625, 26.501953125, 27.65234375, 28.802734375, 29.953125, 31.103515625, 32.25390625, 33.404296875, 34.5546875, 35.705078125, 36.85546875, 38.005859375, 39.15625]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 11.0, 54.0, 206.0, 385.0, 259.0, 77.0, 19.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.69924926757812, -65.49522399902344, -61.291194915771484, -57.08716583251953, -52.883140563964844, -48.679115295410156, -44.4750862121582, -40.27105712890625, -36.06703186035156, -31.863004684448242, -27.658977508544922, -23.4549503326416, -19.25092315673828, -15.046895980834961, -10.84286880493164, -6.63884162902832, -2.434814453125, 1.7692127227783203, 5.973239898681641, 10.177267074584961, 14.381294250488281, 18.5853214263916, 22.789348602294922, 26.993375778198242, 31.197402954101562, 35.40142822265625, 39.6054573059082, 43.809486389160156, 48.013511657714844, 52.21753692626953, 56.421566009521484, 60.62559509277344, 64.82963562011719, 69.03366088867188, 73.23768615722656, 77.44171905517578, 81.64574432373047, 85.84976959228516, 90.05380249023438, 94.25782775878906, 98.46185302734375, 102.66587829589844, 106.86990356445312, 111.07393646240234, 115.27796173095703, 119.48198699951172, 123.68601989746094, 127.89004516601562, 132.0940704345703, 136.298095703125, 140.5021209716797, 144.70614624023438, 148.91018676757812, 153.1142120361328, 157.3182373046875, 161.5222625732422, 165.72628784179688, 169.93031311035156, 174.13433837890625, 178.33836364746094, 182.54238891601562, 186.74642944335938, 190.95045471191406, 195.15447998046875, 199.35850524902344]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 4.0, 2.0, 2.0, 4.0, 7.0, 5.0, 9.0, 9.0, 15.0, 12.0, 19.0, 22.0, 26.0, 22.0, 27.0, 27.0, 38.0, 38.0, 34.0, 42.0, 37.0, 42.0, 35.0, 49.0, 45.0, 52.0, 40.0, 26.0, 30.0, 28.0, 35.0, 32.0, 27.0, 25.0, 27.0, 24.0, 21.0, 16.0, 8.0, 10.0, 10.0, 12.0, 6.0, 1.0, 0.0, 2.0, 0.0, 5.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.288360595703125, -33.15347671508789, -32.01859664916992, -30.88371467590332, -29.74883270263672, -28.613948822021484, -27.479066848754883, -26.34418487548828, -25.20930290222168, -24.074420928955078, -22.939538955688477, -21.804656982421875, -20.66977310180664, -19.534893035888672, -18.400009155273438, -17.265127182006836, -16.130245208740234, -14.995363235473633, -13.860481262207031, -12.725598335266113, -11.590716361999512, -10.45583438873291, -9.320951461791992, -8.18606948852539, -7.051187515258789, -5.9163055419921875, -4.781423091888428, -3.646540880203247, -2.5116586685180664, -1.3767766952514648, -0.24189424514770508, 0.8929882049560547, 2.0278701782226562, 3.162752389907837, 4.297634601593018, 5.432517051696777, 6.567399024963379, 7.7022809982299805, 8.837163925170898, 9.9720458984375, 11.106927871704102, 12.241809844970703, 13.376691818237305, 14.511574745178223, 15.646456718444824, 16.78133773803711, 17.916221618652344, 19.051103591918945, 20.185985565185547, 21.32086753845215, 22.45574951171875, 23.59063148498535, 24.725513458251953, 25.860397338867188, 26.99527931213379, 28.13016128540039, 29.265043258666992, 30.399925231933594, 31.534807205200195, 32.6696891784668, 33.80457305908203, 34.939453125, 36.074337005615234, 37.20922088623047, 38.34410095214844]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 3.0, 4.0, 9.0, 8.0, 13.0, 8.0, 14.0, 20.0, 9.0, 18.0, 22.0, 27.0, 26.0, 26.0, 41.0, 29.0, 36.0, 42.0, 40.0, 39.0, 45.0, 52.0, 40.0, 53.0, 42.0, 40.0, 30.0, 27.0, 34.0, 25.0, 29.0, 27.0, 20.0, 28.0, 14.0, 15.0, 12.0, 6.0, 7.0, 6.0, 9.0, 4.0, 3.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.54296875, -3.439300537109375, -3.33563232421875, -3.231964111328125, -3.1282958984375, -3.024627685546875, -2.92095947265625, -2.817291259765625, -2.713623046875, -2.609954833984375, -2.50628662109375, -2.402618408203125, -2.2989501953125, -2.195281982421875, -2.09161376953125, -1.987945556640625, -1.88427734375, -1.780609130859375, -1.67694091796875, -1.573272705078125, -1.4696044921875, -1.365936279296875, -1.26226806640625, -1.158599853515625, -1.054931640625, -0.951263427734375, -0.84759521484375, -0.743927001953125, -0.6402587890625, -0.536590576171875, -0.43292236328125, -0.329254150390625, -0.2255859375, -0.121917724609375, -0.01824951171875, 0.085418701171875, 0.1890869140625, 0.292755126953125, 0.39642333984375, 0.500091552734375, 0.603759765625, 0.707427978515625, 0.81109619140625, 0.914764404296875, 1.0184326171875, 1.122100830078125, 1.22576904296875, 1.329437255859375, 1.43310546875, 1.536773681640625, 1.64044189453125, 1.744110107421875, 1.8477783203125, 1.951446533203125, 2.05511474609375, 2.158782958984375, 2.262451171875, 2.366119384765625, 2.46978759765625, 2.573455810546875, 2.6771240234375, 2.780792236328125, 2.88446044921875, 2.988128662109375, 3.091796875]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 5.0, 6.0, 20.0, 17.0, 33.0, 41.0, 79.0, 113.0, 196.0, 240.0, 360.0, 563.0, 835.0, 1352.0, 2025.0, 2924.0, 4491.0, 6314.0, 9856.0, 14548.0, 22662.0, 35057.0, 56287.0, 89834.0, 140233.0, 187482.0, 165258.0, 112151.0, 69939.0, 44297.0, 27686.0, 18066.0, 11898.0, 7788.0, 5290.0, 3497.0, 2341.0, 1615.0, 1048.0, 703.0, 482.0, 296.0, 215.0, 135.0, 83.0, 65.0, 44.0, 40.0, 23.0, 11.0, 5.0, 5.0, 1.0, 2.0, 3.0, 4.0], "bins": [-0.3388671875, -0.3288230895996094, -0.31877899169921875, -0.3087348937988281, -0.2986907958984375, -0.2886466979980469, -0.27860260009765625, -0.2685585021972656, -0.258514404296875, -0.24847030639648438, -0.23842620849609375, -0.22838211059570312, -0.2183380126953125, -0.20829391479492188, -0.19824981689453125, -0.18820571899414062, -0.17816162109375, -0.16811752319335938, -0.15807342529296875, -0.14802932739257812, -0.1379852294921875, -0.12794113159179688, -0.11789703369140625, -0.10785293579101562, -0.097808837890625, -0.08776473999023438, -0.07772064208984375, -0.06767654418945312, -0.0576324462890625, -0.047588348388671875, -0.03754425048828125, -0.027500152587890625, -0.0174560546875, -0.007411956787109375, 0.00263214111328125, 0.012676239013671875, 0.0227203369140625, 0.032764434814453125, 0.04280853271484375, 0.052852630615234375, 0.062896728515625, 0.07294082641601562, 0.08298492431640625, 0.09302902221679688, 0.1030731201171875, 0.11311721801757812, 0.12316131591796875, 0.13320541381835938, 0.14324951171875, 0.15329360961914062, 0.16333770751953125, 0.17338180541992188, 0.1834259033203125, 0.19347000122070312, 0.20351409912109375, 0.21355819702148438, 0.223602294921875, 0.23364639282226562, 0.24369049072265625, 0.2537345886230469, 0.2637786865234375, 0.2738227844238281, 0.28386688232421875, 0.2939109802246094, 0.303955078125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 4.0, 1.0, 3.0, 6.0, 0.0, 2.0, 10.0, 9.0, 10.0, 14.0, 13.0, 19.0, 13.0, 16.0, 20.0, 22.0, 30.0, 35.0, 33.0, 31.0, 32.0, 36.0, 33.0, 32.0, 36.0, 1072.0, 32.0, 49.0, 29.0, 27.0, 38.0, 32.0, 31.0, 37.0, 32.0, 34.0, 19.0, 20.0, 14.0, 16.0, 19.0, 12.0, 9.0, 14.0, 9.0, 5.0, 4.0, 5.0, 4.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-2.11328125, -2.05145263671875, -1.9896240234375, -1.92779541015625, -1.865966796875, -1.80413818359375, -1.7423095703125, -1.68048095703125, -1.61865234375, -1.55682373046875, -1.4949951171875, -1.43316650390625, -1.371337890625, -1.30950927734375, -1.2476806640625, -1.18585205078125, -1.1240234375, -1.06219482421875, -1.0003662109375, -0.93853759765625, -0.876708984375, -0.81488037109375, -0.7530517578125, -0.69122314453125, -0.62939453125, -0.56756591796875, -0.5057373046875, -0.44390869140625, -0.382080078125, -0.32025146484375, -0.2584228515625, -0.19659423828125, -0.134765625, -0.07293701171875, -0.0111083984375, 0.05072021484375, 0.112548828125, 0.17437744140625, 0.2362060546875, 0.29803466796875, 0.35986328125, 0.42169189453125, 0.4835205078125, 0.54534912109375, 0.607177734375, 0.66900634765625, 0.7308349609375, 0.79266357421875, 0.8544921875, 0.91632080078125, 0.9781494140625, 1.03997802734375, 1.101806640625, 1.16363525390625, 1.2254638671875, 1.28729248046875, 1.34912109375, 1.41094970703125, 1.4727783203125, 1.53460693359375, 1.596435546875, 1.65826416015625, 1.7200927734375, 1.78192138671875, 1.84375]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 8.0, 6.0, 17.0, 21.0, 32.0, 42.0, 67.0, 78.0, 157.0, 227.0, 278.0, 494.0, 779.0, 1167.0, 1898.0, 2909.0, 4608.0, 7244.0, 11929.0, 18915.0, 30836.0, 50917.0, 85678.0, 133883.0, 1148261.0, 255115.0, 130140.0, 82422.0, 49731.0, 29689.0, 18571.0, 11286.0, 7171.0, 4518.0, 2885.0, 1858.0, 1176.0, 720.0, 501.0, 299.0, 223.0, 115.0, 94.0, 67.0, 31.0, 28.0, 19.0, 5.0, 8.0, 10.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0], "bins": [-0.266845703125, -0.25875091552734375, -0.2506561279296875, -0.24256134033203125, -0.234466552734375, -0.22637176513671875, -0.2182769775390625, -0.21018218994140625, -0.20208740234375, -0.19399261474609375, -0.1858978271484375, -0.17780303955078125, -0.169708251953125, -0.16161346435546875, -0.1535186767578125, -0.14542388916015625, -0.1373291015625, -0.12923431396484375, -0.1211395263671875, -0.11304473876953125, -0.104949951171875, -0.09685516357421875, -0.0887603759765625, -0.08066558837890625, -0.07257080078125, -0.06447601318359375, -0.0563812255859375, -0.04828643798828125, -0.040191650390625, -0.03209686279296875, -0.0240020751953125, -0.01590728759765625, -0.0078125, 0.00028228759765625, 0.0083770751953125, 0.01647186279296875, 0.024566650390625, 0.03266143798828125, 0.0407562255859375, 0.04885101318359375, 0.05694580078125, 0.06504058837890625, 0.0731353759765625, 0.08123016357421875, 0.089324951171875, 0.09741973876953125, 0.1055145263671875, 0.11360931396484375, 0.1217041015625, 0.12979888916015625, 0.1378936767578125, 0.14598846435546875, 0.154083251953125, 0.16217803955078125, 0.1702728271484375, 0.17836761474609375, 0.18646240234375, 0.19455718994140625, 0.2026519775390625, 0.21074676513671875, 0.218841552734375, 0.22693634033203125, 0.2350311279296875, 0.24312591552734375, 0.251220703125]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 4.0, 5.0, 12.0, 15.0, 7.0, 17.0, 26.0, 17.0, 28.0, 26.0, 24.0, 41.0, 47.0, 40.0, 44.0, 44.0, 49.0, 39.0, 51.0, 46.0, 50.0, 45.0, 45.0, 38.0, 42.0, 33.0, 27.0, 23.0, 20.0, 19.0, 16.0, 12.0, 9.0, 4.0, 8.0, 1.0, 7.0, 5.0, 3.0, 1.0, 1.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.0008268356323242188, -0.0008020699024200439, -0.0007773041725158691, -0.0007525384426116943, -0.0007277727127075195, -0.0007030069828033447, -0.0006782412528991699, -0.0006534755229949951, -0.0006287097930908203, -0.0006039440631866455, -0.0005791783332824707, -0.0005544126033782959, -0.0005296468734741211, -0.0005048811435699463, -0.0004801154136657715, -0.0004553496837615967, -0.0004305839538574219, -0.00040581822395324707, -0.00038105249404907227, -0.00035628676414489746, -0.00033152103424072266, -0.00030675530433654785, -0.00028198957443237305, -0.00025722384452819824, -0.00023245811462402344, -0.00020769238471984863, -0.00018292665481567383, -0.00015816092491149902, -0.00013339519500732422, -0.00010862946510314941, -8.386373519897461e-05, -5.9098005294799805e-05, -3.4332275390625e-05, -9.566545486450195e-06, 1.519918441772461e-05, 3.9964914321899414e-05, 6.473064422607422e-05, 8.949637413024902e-05, 0.00011426210403442383, 0.00013902783393859863, 0.00016379356384277344, 0.00018855929374694824, 0.00021332502365112305, 0.00023809075355529785, 0.00026285648345947266, 0.00028762221336364746, 0.00031238794326782227, 0.00033715367317199707, 0.0003619194030761719, 0.0003866851329803467, 0.0004114508628845215, 0.0004362165927886963, 0.0004609823226928711, 0.0004857480525970459, 0.0005105137825012207, 0.0005352795124053955, 0.0005600452423095703, 0.0005848109722137451, 0.0006095767021179199, 0.0006343424320220947, 0.0006591081619262695, 0.0006838738918304443, 0.0007086396217346191, 0.0007334053516387939, 0.0007581710815429688]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 2.0, 8.0, 8.0, 10.0, 15.0, 14.0, 16.0, 34.0, 32.0, 52.0, 56.0, 65.0, 87.0, 114.0, 144.0, 227.0, 323.0, 804.0, 37304.0, 1001516.0, 6052.0, 555.0, 294.0, 199.0, 127.0, 94.0, 82.0, 86.0, 57.0, 26.0, 33.0, 18.0, 30.0, 15.0, 19.0, 9.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0169219970703125, -0.016398906707763672, -0.015875816345214844, -0.015352725982666016, -0.014829635620117188, -0.01430654525756836, -0.013783454895019531, -0.013260364532470703, -0.012737274169921875, -0.012214183807373047, -0.011691093444824219, -0.01116800308227539, -0.010644912719726562, -0.010121822357177734, -0.009598731994628906, -0.009075641632080078, -0.00855255126953125, -0.008029460906982422, -0.007506370544433594, -0.006983280181884766, -0.0064601898193359375, -0.005937099456787109, -0.005414009094238281, -0.004890918731689453, -0.004367828369140625, -0.003844738006591797, -0.0033216476440429688, -0.0027985572814941406, -0.0022754669189453125, -0.0017523765563964844, -0.0012292861938476562, -0.0007061958312988281, -0.00018310546875, 0.0003399848937988281, 0.0008630752563476562, 0.0013861656188964844, 0.0019092559814453125, 0.0024323463439941406, 0.0029554367065429688, 0.003478527069091797, 0.004001617431640625, 0.004524707794189453, 0.005047798156738281, 0.005570888519287109, 0.0060939788818359375, 0.006617069244384766, 0.007140159606933594, 0.007663249969482422, 0.00818634033203125, 0.008709430694580078, 0.009232521057128906, 0.009755611419677734, 0.010278701782226562, 0.01080179214477539, 0.011324882507324219, 0.011847972869873047, 0.012371063232421875, 0.012894153594970703, 0.013417243957519531, 0.01394033432006836, 0.014463424682617188, 0.014986515045166016, 0.015509605407714844, 0.016032695770263672, 0.0165557861328125]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 11.0, 44.0, 90.0, 185.0, 277.0, 208.0, 122.0, 48.0, 18.0, 4.0, 2.0, 0.0, 1.0], "bins": [-0.002124866470694542, -0.002086655469611287, -0.0020484444685280323, -0.0020102334674447775, -0.0019720224663615227, -0.0019338115816935897, -0.0018956005806103349, -0.0018573896959424019, -0.001819178694859147, -0.0017809676937758923, -0.0017427566926926374, -0.0017045458080247045, -0.0016663348069414496, -0.0016281238058581948, -0.00158991280477494, -0.001551701920107007, -0.0015134909190237522, -0.0014752799179404974, -0.0014370689168572426, -0.0013988580321893096, -0.0013606470311060548, -0.0013224360300228, -0.0012842250289395452, -0.0012460141442716122, -0.0012078030267730355, -0.0011695920256897807, -0.001131381024606526, -0.001093170139938593, -0.001054959138855338, -0.0010167481377720833, -0.0009785371366888285, -0.0009403261938132346, -0.0009021152509376407, -0.0008639042498543859, -0.000825693306978792, -0.0007874823058955371, -0.0007492713630199432, -0.0007110603619366884, -0.0006728493608534336, -0.0006346384179778397, -0.0005964274751022458, -0.000558216474018991, -0.0005200055311433971, -0.0004817945300601423, -0.0004435835871845484, -0.00040537258610129356, -0.0003671616141218692, -0.00032895064214244485, -0.0002907396701630205, -0.00025252869818359613, -0.00021431772620417178, -0.0001761067396728322, -0.00013789576769340783, -9.968479571398348e-05, -6.147380918264389e-05, -2.3262837203219533e-05, 1.4948134776204824e-05, 5.315911039360799e-05, 9.137008601101115e-05, 0.00012958106526639313, 0.00016779203724581748, 0.00020600300922524184, 0.0002442139957565814, 0.0002824249677360058, 0.00032063593971543014]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 3.0, 8.0, 4.0, 10.0, 7.0, 7.0, 12.0, 16.0, 26.0, 16.0, 27.0, 34.0, 23.0, 33.0, 31.0, 44.0, 45.0, 39.0, 34.0, 35.0, 40.0, 38.0, 38.0, 40.0, 32.0, 42.0, 34.0, 32.0, 26.0, 29.0, 21.0, 23.0, 18.0, 18.0, 22.0, 11.0, 17.0, 11.0, 18.0, 11.0, 5.0, 6.0, 4.0, 2.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0004457235336303711, -0.0004318300634622574, -0.0004179365932941437, -0.00040404312312602997, -0.00039014965295791626, -0.00037625618278980255, -0.00036236271262168884, -0.00034846924245357513, -0.0003345757722854614, -0.0003206823021173477, -0.000306788831949234, -0.0002928953617811203, -0.0002790018916130066, -0.0002651084214448929, -0.0002512149512767792, -0.00023732148110866547, -0.00022342801094055176, -0.00020953454077243805, -0.00019564107060432434, -0.00018174760043621063, -0.00016785413026809692, -0.00015396066009998322, -0.0001400671899318695, -0.0001261737197637558, -0.00011228024959564209, -9.838677942752838e-05, -8.449330925941467e-05, -7.059983909130096e-05, -5.6706368923187256e-05, -4.281289875507355e-05, -2.891942858695984e-05, -1.502595841884613e-05, -1.1324882507324219e-06, 1.2760981917381287e-05, 2.6654452085494995e-05, 4.0547922253608704e-05, 5.444139242172241e-05, 6.833486258983612e-05, 8.222833275794983e-05, 9.612180292606354e-05, 0.00011001527309417725, 0.00012390874326229095, 0.00013780221343040466, 0.00015169568359851837, 0.00016558915376663208, 0.0001794826239347458, 0.0001933760941028595, 0.0002072695642709732, 0.00022116303443908691, 0.00023505650460720062, 0.00024894997477531433, 0.00026284344494342804, 0.00027673691511154175, 0.00029063038527965546, 0.00030452385544776917, 0.0003184173256158829, 0.0003323107957839966, 0.0003462042659521103, 0.000360097736120224, 0.0003739912062883377, 0.0003878846764564514, 0.0004017781466245651, 0.00041567161679267883, 0.00042956508696079254, 0.00044345855712890625]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 3.0, 4.0, 9.0, 8.0, 13.0, 8.0, 14.0, 20.0, 9.0, 18.0, 22.0, 27.0, 26.0, 26.0, 41.0, 29.0, 36.0, 41.0, 41.0, 39.0, 45.0, 52.0, 40.0, 53.0, 42.0, 40.0, 30.0, 27.0, 34.0, 25.0, 29.0, 27.0, 20.0, 28.0, 14.0, 15.0, 12.0, 6.0, 7.0, 6.0, 9.0, 4.0, 3.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.54296875, -3.439300537109375, -3.33563232421875, -3.231964111328125, -3.1282958984375, -3.024627685546875, -2.92095947265625, -2.817291259765625, -2.713623046875, -2.609954833984375, -2.50628662109375, -2.402618408203125, -2.2989501953125, -2.195281982421875, -2.09161376953125, -1.987945556640625, -1.88427734375, -1.780609130859375, -1.67694091796875, -1.573272705078125, -1.4696044921875, -1.365936279296875, -1.26226806640625, -1.158599853515625, -1.054931640625, -0.951263427734375, -0.84759521484375, -0.743927001953125, -0.6402587890625, -0.536590576171875, -0.43292236328125, -0.329254150390625, -0.2255859375, -0.121917724609375, -0.01824951171875, 0.085418701171875, 0.1890869140625, 0.292755126953125, 0.39642333984375, 0.500091552734375, 0.603759765625, 0.707427978515625, 0.81109619140625, 0.914764404296875, 1.0184326171875, 1.122100830078125, 1.22576904296875, 1.329437255859375, 1.43310546875, 1.536773681640625, 1.64044189453125, 1.744110107421875, 1.8477783203125, 1.951446533203125, 2.05511474609375, 2.158782958984375, 2.262451171875, 2.366119384765625, 2.46978759765625, 2.573455810546875, 2.6771240234375, 2.780792236328125, 2.88446044921875, 2.988128662109375, 3.091796875]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 5.0, 8.0, 17.0, 20.0, 26.0, 33.0, 52.0, 75.0, 122.0, 133.0, 216.0, 375.0, 481.0, 770.0, 1223.0, 2055.0, 3324.0, 5474.0, 9521.0, 17482.0, 34472.0, 75683.0, 189118.0, 378165.0, 182292.0, 73389.0, 33463.0, 16893.0, 9320.0, 5445.0, 3242.0, 1940.0, 1301.0, 823.0, 508.0, 322.0, 262.0, 150.0, 109.0, 75.0, 39.0, 39.0, 32.0, 29.0, 10.0, 5.0, 8.0, 5.0, 1.0, 4.0, 2.0, 0.0, 1.0], "bins": [-2.482421875, -2.410430908203125, -2.33843994140625, -2.266448974609375, -2.1944580078125, -2.122467041015625, -2.05047607421875, -1.978485107421875, -1.906494140625, -1.834503173828125, -1.76251220703125, -1.690521240234375, -1.6185302734375, -1.546539306640625, -1.47454833984375, -1.402557373046875, -1.33056640625, -1.258575439453125, -1.18658447265625, -1.114593505859375, -1.0426025390625, -0.970611572265625, -0.89862060546875, -0.826629638671875, -0.754638671875, -0.682647705078125, -0.61065673828125, -0.538665771484375, -0.4666748046875, -0.394683837890625, -0.32269287109375, -0.250701904296875, -0.1787109375, -0.106719970703125, -0.03472900390625, 0.037261962890625, 0.1092529296875, 0.181243896484375, 0.25323486328125, 0.325225830078125, 0.397216796875, 0.469207763671875, 0.54119873046875, 0.613189697265625, 0.6851806640625, 0.757171630859375, 0.82916259765625, 0.901153564453125, 0.97314453125, 1.045135498046875, 1.11712646484375, 1.189117431640625, 1.2611083984375, 1.333099365234375, 1.40509033203125, 1.477081298828125, 1.549072265625, 1.621063232421875, 1.69305419921875, 1.765045166015625, 1.8370361328125, 1.909027099609375, 1.98101806640625, 2.053009033203125, 2.125]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 2.0, 6.0, 7.0, 6.0, 11.0, 17.0, 16.0, 19.0, 22.0, 29.0, 28.0, 29.0, 43.0, 35.0, 39.0, 37.0, 52.0, 77.0, 188.0, 1709.0, 200.0, 71.0, 58.0, 39.0, 43.0, 40.0, 31.0, 29.0, 28.0, 25.0, 17.0, 10.0, 20.0, 18.0, 9.0, 11.0, 5.0, 6.0, 4.0, 3.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.640625, -12.2403564453125, -11.840087890625, -11.4398193359375, -11.03955078125, -10.6392822265625, -10.239013671875, -9.8387451171875, -9.4384765625, -9.0382080078125, -8.637939453125, -8.2376708984375, -7.83740234375, -7.4371337890625, -7.036865234375, -6.6365966796875, -6.236328125, -5.8360595703125, -5.435791015625, -5.0355224609375, -4.63525390625, -4.2349853515625, -3.834716796875, -3.4344482421875, -3.0341796875, -2.6339111328125, -2.233642578125, -1.8333740234375, -1.43310546875, -1.0328369140625, -0.632568359375, -0.2322998046875, 0.16796875, 0.5682373046875, 0.968505859375, 1.3687744140625, 1.76904296875, 2.1693115234375, 2.569580078125, 2.9698486328125, 3.3701171875, 3.7703857421875, 4.170654296875, 4.5709228515625, 4.97119140625, 5.3714599609375, 5.771728515625, 6.1719970703125, 6.572265625, 6.9725341796875, 7.372802734375, 7.7730712890625, 8.17333984375, 8.5736083984375, 8.973876953125, 9.3741455078125, 9.7744140625, 10.1746826171875, 10.574951171875, 10.9752197265625, 11.37548828125, 11.7757568359375, 12.176025390625, 12.5762939453125, 12.9765625]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 5.0, 5.0, 5.0, 3.0, 6.0, 5.0, 15.0, 12.0, 16.0, 24.0, 25.0, 29.0, 32.0, 38.0, 65.0, 84.0, 113.0, 245.0, 447.0, 1389.0, 13595.0, 2611454.0, 508394.0, 7566.0, 1096.0, 350.0, 193.0, 130.0, 75.0, 55.0, 51.0, 43.0, 28.0, 20.0, 18.0, 17.0, 14.0, 11.0, 7.0, 12.0, 9.0, 4.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.9375, -20.281005859375, -19.62451171875, -18.968017578125, -18.3115234375, -17.655029296875, -16.99853515625, -16.342041015625, -15.685546875, -15.029052734375, -14.37255859375, -13.716064453125, -13.0595703125, -12.403076171875, -11.74658203125, -11.090087890625, -10.43359375, -9.777099609375, -9.12060546875, -8.464111328125, -7.8076171875, -7.151123046875, -6.49462890625, -5.838134765625, -5.181640625, -4.525146484375, -3.86865234375, -3.212158203125, -2.5556640625, -1.899169921875, -1.24267578125, -0.586181640625, 0.0703125, 0.726806640625, 1.38330078125, 2.039794921875, 2.6962890625, 3.352783203125, 4.00927734375, 4.665771484375, 5.322265625, 5.978759765625, 6.63525390625, 7.291748046875, 7.9482421875, 8.604736328125, 9.26123046875, 9.917724609375, 10.57421875, 11.230712890625, 11.88720703125, 12.543701171875, 13.2001953125, 13.856689453125, 14.51318359375, 15.169677734375, 15.826171875, 16.482666015625, 17.13916015625, 17.795654296875, 18.4521484375, 19.108642578125, 19.76513671875, 20.421630859375, 21.078125]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 62.0, 953.0, 3.0, 0.0, 1.0], "bins": [-456.1365051269531, -448.56988525390625, -441.0032958984375, -433.4366760253906, -425.87005615234375, -418.303466796875, -410.7368469238281, -403.17022705078125, -395.6036376953125, -388.0370178222656, -380.4704284667969, -372.90380859375, -365.3371887207031, -357.77056884765625, -350.2039794921875, -342.6373596191406, -335.07073974609375, -327.5041198730469, -319.9375305175781, -312.37091064453125, -304.8042907714844, -297.2376708984375, -289.67108154296875, -282.1044616699219, -274.537841796875, -266.9712219238281, -259.4046325683594, -251.8380126953125, -244.27139282226562, -236.7047882080078, -229.13818359375, -221.57156372070312, -214.00497436523438, -206.43836975097656, -198.8717498779297, -191.30514526367188, -183.738525390625, -176.1719207763672, -168.60531616210938, -161.0386962890625, -153.4720916748047, -145.90548706054688, -138.3388671875, -130.7722625732422, -123.20565032958984, -115.6390380859375, -108.07243347167969, -100.50582122802734, -92.939208984375, -85.37259674072266, -77.80598449707031, -70.2393798828125, -62.672767639160156, -55.10615539550781, -47.539546966552734, -39.972938537597656, -32.40632629394531, -24.8397159576416, -17.27310562133789, -9.70649528503418, -2.1398849487304688, 5.426727294921875, 12.993335723876953, 20.55994415283203, 28.126558303833008]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 7.0, 3.0, 3.0, 7.0, 15.0, 8.0, 17.0, 12.0, 22.0, 14.0, 31.0, 22.0, 34.0, 26.0, 39.0, 35.0, 39.0, 36.0, 31.0, 46.0, 41.0, 49.0, 45.0, 44.0, 40.0, 40.0, 34.0, 31.0, 35.0, 33.0, 26.0, 23.0, 22.0, 20.0, 13.0, 11.0, 13.0, 3.0, 7.0, 7.0, 10.0, 3.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-34.53909683227539, -33.306514739990234, -32.07393264770508, -30.841350555419922, -29.608768463134766, -28.37618637084961, -27.143606185913086, -25.91102409362793, -24.678442001342773, -23.445859909057617, -22.21327781677246, -20.980695724487305, -19.74811553955078, -18.515533447265625, -17.28295135498047, -16.050369262695312, -14.817787170410156, -13.585205078125, -12.352622985839844, -11.120041847229004, -9.887459754943848, -8.654877662658691, -7.422296047210693, -6.189714431762695, -4.957132339477539, -3.724550485610962, -2.4919686317443848, -1.2593867778778076, -0.02680492401123047, 1.2057771682739258, 2.438358783721924, 3.670940399169922, 4.9035186767578125, 6.136100769042969, 7.368682384490967, 8.601263999938965, 9.833846092224121, 11.066428184509277, 12.299009323120117, 13.531591415405273, 14.76417350769043, 15.996755599975586, 17.229337692260742, 18.4619197845459, 19.694499969482422, 20.927082061767578, 22.159664154052734, 23.39224624633789, 24.624828338623047, 25.857410430908203, 27.08999252319336, 28.322574615478516, 29.555156707763672, 30.787738800048828, 32.020320892333984, 33.252899169921875, 34.48548126220703, 35.71806335449219, 36.950645446777344, 38.1832275390625, 39.415809631347656, 40.64839172363281, 41.88097381591797, 43.113555908203125, 44.34613800048828]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 3.0, 5.0, 8.0, 13.0, 9.0, 6.0, 23.0, 15.0, 16.0, 18.0, 20.0, 23.0, 28.0, 32.0, 29.0, 39.0, 37.0, 38.0, 39.0, 47.0, 44.0, 42.0, 59.0, 39.0, 33.0, 40.0, 40.0, 30.0, 26.0, 20.0, 32.0, 33.0, 21.0, 16.0, 17.0, 16.0, 9.0, 12.0, 3.0, 5.0, 6.0, 4.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.560546875, -3.4522705078125, -3.343994140625, -3.2357177734375, -3.12744140625, -3.0191650390625, -2.910888671875, -2.8026123046875, -2.6943359375, -2.5860595703125, -2.477783203125, -2.3695068359375, -2.26123046875, -2.1529541015625, -2.044677734375, -1.9364013671875, -1.828125, -1.7198486328125, -1.611572265625, -1.5032958984375, -1.39501953125, -1.2867431640625, -1.178466796875, -1.0701904296875, -0.9619140625, -0.8536376953125, -0.745361328125, -0.6370849609375, -0.52880859375, -0.4205322265625, -0.312255859375, -0.2039794921875, -0.095703125, 0.0125732421875, 0.120849609375, 0.2291259765625, 0.33740234375, 0.4456787109375, 0.553955078125, 0.6622314453125, 0.7705078125, 0.8787841796875, 0.987060546875, 1.0953369140625, 1.20361328125, 1.3118896484375, 1.420166015625, 1.5284423828125, 1.63671875, 1.7449951171875, 1.853271484375, 1.9615478515625, 2.06982421875, 2.1781005859375, 2.286376953125, 2.3946533203125, 2.5029296875, 2.6112060546875, 2.719482421875, 2.8277587890625, 2.93603515625, 3.0443115234375, 3.152587890625, 3.2608642578125, 3.369140625]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 5.0, 8.0, 10.0, 7.0, 5.0, 10.0, 13.0, 16.0, 18.0, 21.0, 13.0, 14.0, 27.0, 30.0, 29.0, 54.0, 85.0, 137.0, 315.0, 1414.0, 15721.0, 503418.0, 3510550.0, 153821.0, 7042.0, 805.0, 243.0, 106.0, 59.0, 42.0, 36.0, 28.0, 20.0, 33.0, 20.0, 18.0, 24.0, 15.0, 12.0, 6.0, 11.0, 6.0, 2.0, 4.0, 5.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-19.03125, -18.477294921875, -17.92333984375, -17.369384765625, -16.8154296875, -16.261474609375, -15.70751953125, -15.153564453125, -14.599609375, -14.045654296875, -13.49169921875, -12.937744140625, -12.3837890625, -11.829833984375, -11.27587890625, -10.721923828125, -10.16796875, -9.614013671875, -9.06005859375, -8.506103515625, -7.9521484375, -7.398193359375, -6.84423828125, -6.290283203125, -5.736328125, -5.182373046875, -4.62841796875, -4.074462890625, -3.5205078125, -2.966552734375, -2.41259765625, -1.858642578125, -1.3046875, -0.750732421875, -0.19677734375, 0.357177734375, 0.9111328125, 1.465087890625, 2.01904296875, 2.572998046875, 3.126953125, 3.680908203125, 4.23486328125, 4.788818359375, 5.3427734375, 5.896728515625, 6.45068359375, 7.004638671875, 7.55859375, 8.112548828125, 8.66650390625, 9.220458984375, 9.7744140625, 10.328369140625, 10.88232421875, 11.436279296875, 11.990234375, 12.544189453125, 13.09814453125, 13.652099609375, 14.2060546875, 14.760009765625, 15.31396484375, 15.867919921875, 16.421875]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 7.0, 7.0, 17.0, 20.0, 37.0, 37.0, 58.0, 77.0, 119.0, 165.0, 224.0, 315.0, 423.0, 504.0, 510.0, 443.0, 333.0, 242.0, 176.0, 107.0, 87.0, 64.0, 35.0, 17.0, 10.0, 10.0, 13.0, 7.0, 6.0, 3.0, 5.0, 1.0], "bins": [-17.875, -17.48712158203125, -17.0992431640625, -16.71136474609375, -16.323486328125, -15.93560791015625, -15.5477294921875, -15.15985107421875, -14.77197265625, -14.38409423828125, -13.9962158203125, -13.60833740234375, -13.220458984375, -12.83258056640625, -12.4447021484375, -12.05682373046875, -11.6689453125, -11.28106689453125, -10.8931884765625, -10.50531005859375, -10.117431640625, -9.72955322265625, -9.3416748046875, -8.95379638671875, -8.56591796875, -8.17803955078125, -7.7901611328125, -7.40228271484375, -7.014404296875, -6.62652587890625, -6.2386474609375, -5.85076904296875, -5.462890625, -5.07501220703125, -4.6871337890625, -4.29925537109375, -3.911376953125, -3.52349853515625, -3.1356201171875, -2.74774169921875, -2.35986328125, -1.97198486328125, -1.5841064453125, -1.19622802734375, -0.808349609375, -0.42047119140625, -0.0325927734375, 0.35528564453125, 0.7431640625, 1.13104248046875, 1.5189208984375, 1.90679931640625, 2.294677734375, 2.68255615234375, 3.0704345703125, 3.45831298828125, 3.84619140625, 4.23406982421875, 4.6219482421875, 5.00982666015625, 5.397705078125, 5.78558349609375, 6.1734619140625, 6.56134033203125, 6.94921875]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 13.0, 11.0, 10.0, 24.0, 39.0, 35.0, 59.0, 81.0, 174.0, 317.0, 635.0, 2402.0, 90552.0, 3970264.0, 125268.0, 2830.0, 696.0, 321.0, 183.0, 132.0, 71.0, 60.0, 34.0, 27.0, 18.0, 8.0, 5.0, 5.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-42.21875, -40.8359375, -39.453125, -38.0703125, -36.6875, -35.3046875, -33.921875, -32.5390625, -31.15625, -29.7734375, -28.390625, -27.0078125, -25.625, -24.2421875, -22.859375, -21.4765625, -20.09375, -18.7109375, -17.328125, -15.9453125, -14.5625, -13.1796875, -11.796875, -10.4140625, -9.03125, -7.6484375, -6.265625, -4.8828125, -3.5, -2.1171875, -0.734375, 0.6484375, 2.03125, 3.4140625, 4.796875, 6.1796875, 7.5625, 8.9453125, 10.328125, 11.7109375, 13.09375, 14.4765625, 15.859375, 17.2421875, 18.625, 20.0078125, 21.390625, 22.7734375, 24.15625, 25.5390625, 26.921875, 28.3046875, 29.6875, 31.0703125, 32.453125, 33.8359375, 35.21875, 36.6015625, 37.984375, 39.3671875, 40.75, 42.1328125, 43.515625, 44.8984375, 46.28125]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 13.0, 88.0, 254.0, 372.0, 208.0, 62.0, 15.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.20643615722656, -55.73166275024414, -51.25688934326172, -46.7821159362793, -42.307342529296875, -37.83256912231445, -33.35779571533203, -28.88302230834961, -24.408248901367188, -19.933475494384766, -15.458702087402344, -10.983928680419922, -6.5091552734375, -2.034381866455078, 2.4403915405273438, 6.915164947509766, 11.389938354492188, 15.86471176147461, 20.33948516845703, 24.814258575439453, 29.289031982421875, 33.7638053894043, 38.23857879638672, 42.71335220336914, 47.18812561035156, 51.662899017333984, 56.137672424316406, 60.61244583129883, 65.08721923828125, 69.56199645996094, 74.0367660522461, 78.51153564453125, 82.98631286621094, 87.46109008789062, 91.93585968017578, 96.41062927246094, 100.88540649414062, 105.36018371582031, 109.83495330810547, 114.30972290039062, 118.78450012207031, 123.25927734375, 127.73404693603516, 132.2088165283203, 136.68359375, 141.1583709716797, 145.63314819335938, 150.10791015625, 154.5826873779297, 159.05746459960938, 163.5322265625, 168.0070037841797, 172.48178100585938, 176.95655822753906, 181.43133544921875, 185.90609741210938, 190.38087463378906, 194.85565185546875, 199.33041381835938, 203.80519104003906, 208.27996826171875, 212.75474548339844, 217.22952270507812, 221.70428466796875, 226.17906188964844]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 5.0, 3.0, 7.0, 12.0, 8.0, 15.0, 15.0, 15.0, 20.0, 18.0, 19.0, 19.0, 20.0, 22.0, 24.0, 43.0, 30.0, 22.0, 38.0, 42.0, 33.0, 31.0, 48.0, 31.0, 40.0, 34.0, 40.0, 34.0, 32.0, 30.0, 29.0, 21.0, 15.0, 23.0, 17.0, 15.0, 18.0, 14.0, 19.0, 12.0, 11.0, 7.0, 9.0, 7.0, 4.0, 6.0, 9.0, 2.0, 3.0, 1.0, 3.0, 4.0, 2.0, 5.0], "bins": [-35.346435546875, -34.28113555908203, -33.21583557128906, -32.15053939819336, -31.08523941040039, -30.019939422607422, -28.954641342163086, -27.88934326171875, -26.82404327392578, -25.758743286132812, -24.693445205688477, -23.62814712524414, -22.562847137451172, -21.497547149658203, -20.432249069213867, -19.36695098876953, -18.301651000976562, -17.236351013183594, -16.171052932739258, -15.105753898620605, -14.040454864501953, -12.9751558303833, -11.909856796264648, -10.844557762145996, -9.779258728027344, -8.713959693908691, -7.648660659790039, -6.583361625671387, -5.518062591552734, -4.452763557434082, -3.3874645233154297, -2.3221654891967773, -1.256866455078125, -0.19156742095947266, 0.8737316131591797, 1.939030647277832, 3.0043296813964844, 4.069628715515137, 5.134927749633789, 6.200226783752441, 7.265525817871094, 8.330824851989746, 9.396123886108398, 10.46142292022705, 11.526721954345703, 12.592020988464355, 13.657320022583008, 14.72261905670166, 15.787918090820312, 16.85321807861328, 17.918516159057617, 18.983814239501953, 20.049114227294922, 21.11441421508789, 22.179712295532227, 23.245010375976562, 24.31031036376953, 25.3756103515625, 26.440908432006836, 27.506206512451172, 28.57150650024414, 29.63680648803711, 30.702104568481445, 31.76740264892578, 32.83270263671875]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 3.0, 1.0, 2.0, 6.0, 4.0, 5.0, 8.0, 9.0, 9.0, 17.0, 14.0, 13.0, 19.0, 28.0, 31.0, 32.0, 23.0, 28.0, 31.0, 34.0, 47.0, 41.0, 46.0, 40.0, 54.0, 42.0, 46.0, 36.0, 36.0, 37.0, 28.0, 32.0, 29.0, 36.0, 21.0, 25.0, 21.0, 15.0, 12.0, 13.0, 8.0, 11.0, 5.0, 7.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.234375, -4.11993408203125, -4.0054931640625, -3.89105224609375, -3.776611328125, -3.66217041015625, -3.5477294921875, -3.43328857421875, -3.31884765625, -3.20440673828125, -3.0899658203125, -2.97552490234375, -2.861083984375, -2.74664306640625, -2.6322021484375, -2.51776123046875, -2.4033203125, -2.28887939453125, -2.1744384765625, -2.05999755859375, -1.945556640625, -1.83111572265625, -1.7166748046875, -1.60223388671875, -1.48779296875, -1.37335205078125, -1.2589111328125, -1.14447021484375, -1.030029296875, -0.91558837890625, -0.8011474609375, -0.68670654296875, -0.572265625, -0.45782470703125, -0.3433837890625, -0.22894287109375, -0.114501953125, -6.103515625e-05, 0.1143798828125, 0.22882080078125, 0.34326171875, 0.45770263671875, 0.5721435546875, 0.68658447265625, 0.801025390625, 0.91546630859375, 1.0299072265625, 1.14434814453125, 1.2587890625, 1.37322998046875, 1.4876708984375, 1.60211181640625, 1.716552734375, 1.83099365234375, 1.9454345703125, 2.05987548828125, 2.17431640625, 2.28875732421875, 2.4031982421875, 2.51763916015625, 2.632080078125, 2.74652099609375, 2.8609619140625, 2.97540283203125, 3.08984375]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 5.0, 4.0, 5.0, 13.0, 24.0, 33.0, 57.0, 57.0, 102.0, 123.0, 228.0, 303.0, 428.0, 641.0, 887.0, 1366.0, 1925.0, 2928.0, 4086.0, 5966.0, 9002.0, 13419.0, 20235.0, 31620.0, 50999.0, 83689.0, 134134.0, 186031.0, 175545.0, 120487.0, 74158.0, 45512.0, 28408.0, 18418.0, 12260.0, 8067.0, 5440.0, 3664.0, 2508.0, 1860.0, 1248.0, 856.0, 588.0, 370.0, 271.0, 194.0, 132.0, 87.0, 71.0, 40.0, 35.0, 12.0, 10.0, 5.0, 4.0, 5.0, 1.0, 1.0, 2.0], "bins": [-0.3515625, -0.3408699035644531, -0.33017730712890625, -0.3194847106933594, -0.3087921142578125, -0.2980995178222656, -0.28740692138671875, -0.2767143249511719, -0.266021728515625, -0.2553291320800781, -0.24463653564453125, -0.23394393920898438, -0.2232513427734375, -0.21255874633789062, -0.20186614990234375, -0.19117355346679688, -0.18048095703125, -0.16978836059570312, -0.15909576416015625, -0.14840316772460938, -0.1377105712890625, -0.12701797485351562, -0.11632537841796875, -0.10563278198242188, -0.094940185546875, -0.08424758911132812, -0.07355499267578125, -0.06286239624023438, -0.0521697998046875, -0.041477203369140625, -0.03078460693359375, -0.020092010498046875, -0.0093994140625, 0.001293182373046875, 0.01198577880859375, 0.022678375244140625, 0.0333709716796875, 0.044063568115234375, 0.05475616455078125, 0.06544876098632812, 0.076141357421875, 0.08683395385742188, 0.09752655029296875, 0.10821914672851562, 0.1189117431640625, 0.12960433959960938, 0.14029693603515625, 0.15098953247070312, 0.16168212890625, 0.17237472534179688, 0.18306732177734375, 0.19375991821289062, 0.2044525146484375, 0.21514511108398438, 0.22583770751953125, 0.23653030395507812, 0.247222900390625, 0.2579154968261719, 0.26860809326171875, 0.2793006896972656, 0.2899932861328125, 0.3006858825683594, 0.31137847900390625, 0.3220710754394531, 0.332763671875]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 3.0, 6.0, 5.0, 6.0, 5.0, 5.0, 6.0, 3.0, 9.0, 8.0, 11.0, 14.0, 13.0, 16.0, 25.0, 19.0, 29.0, 38.0, 19.0, 22.0, 42.0, 28.0, 37.0, 38.0, 32.0, 30.0, 1069.0, 36.0, 29.0, 38.0, 40.0, 35.0, 18.0, 20.0, 36.0, 31.0, 26.0, 29.0, 20.0, 17.0, 21.0, 15.0, 16.0, 10.0, 12.0, 5.0, 5.0, 11.0, 4.0, 8.0, 7.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 2.0], "bins": [-1.984375, -1.920135498046875, -1.85589599609375, -1.791656494140625, -1.7274169921875, -1.663177490234375, -1.59893798828125, -1.534698486328125, -1.470458984375, -1.406219482421875, -1.34197998046875, -1.277740478515625, -1.2135009765625, -1.149261474609375, -1.08502197265625, -1.020782470703125, -0.95654296875, -0.892303466796875, -0.82806396484375, -0.763824462890625, -0.6995849609375, -0.635345458984375, -0.57110595703125, -0.506866455078125, -0.442626953125, -0.378387451171875, -0.31414794921875, -0.249908447265625, -0.1856689453125, -0.121429443359375, -0.05718994140625, 0.007049560546875, 0.0712890625, 0.135528564453125, 0.19976806640625, 0.264007568359375, 0.3282470703125, 0.392486572265625, 0.45672607421875, 0.520965576171875, 0.585205078125, 0.649444580078125, 0.71368408203125, 0.777923583984375, 0.8421630859375, 0.906402587890625, 0.97064208984375, 1.034881591796875, 1.09912109375, 1.163360595703125, 1.22760009765625, 1.291839599609375, 1.3560791015625, 1.420318603515625, 1.48455810546875, 1.548797607421875, 1.613037109375, 1.677276611328125, 1.74151611328125, 1.805755615234375, 1.8699951171875, 1.934234619140625, 1.99847412109375, 2.062713623046875, 2.126953125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 4.0, 7.0, 10.0, 17.0, 23.0, 41.0, 43.0, 63.0, 106.0, 143.0, 238.0, 309.0, 437.0, 732.0, 1154.0, 1770.0, 2750.0, 4485.0, 7443.0, 11963.0, 19683.0, 33267.0, 56020.0, 93002.0, 145683.0, 1234483.0, 173181.0, 121877.0, 75213.0, 44619.0, 26718.0, 15978.0, 9626.0, 6023.0, 3605.0, 2288.0, 1452.0, 934.0, 586.0, 405.0, 234.0, 169.0, 122.0, 76.0, 45.0, 34.0, 21.0, 21.0, 9.0, 11.0, 8.0, 1.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.26123046875, -0.2521553039550781, -0.24308013916015625, -0.23400497436523438, -0.2249298095703125, -0.21585464477539062, -0.20677947998046875, -0.19770431518554688, -0.188629150390625, -0.17955398559570312, -0.17047882080078125, -0.16140365600585938, -0.1523284912109375, -0.14325332641601562, -0.13417816162109375, -0.12510299682617188, -0.11602783203125, -0.10695266723632812, -0.09787750244140625, -0.08880233764648438, -0.0797271728515625, -0.07065200805664062, -0.06157684326171875, -0.052501678466796875, -0.043426513671875, -0.034351348876953125, -0.02527618408203125, -0.016201019287109375, -0.0071258544921875, 0.001949310302734375, 0.01102447509765625, 0.020099639892578125, 0.0291748046875, 0.038249969482421875, 0.04732513427734375, 0.056400299072265625, 0.0654754638671875, 0.07455062866210938, 0.08362579345703125, 0.09270095825195312, 0.101776123046875, 0.11085128784179688, 0.11992645263671875, 0.12900161743164062, 0.1380767822265625, 0.14715194702148438, 0.15622711181640625, 0.16530227661132812, 0.17437744140625, 0.18345260620117188, 0.19252777099609375, 0.20160293579101562, 0.2106781005859375, 0.21975326538085938, 0.22882843017578125, 0.23790359497070312, 0.246978759765625, 0.2560539245605469, 0.26512908935546875, 0.2742042541503906, 0.2832794189453125, 0.2923545837402344, 0.30142974853515625, 0.3105049133300781, 0.319580078125]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 4.0, 1.0, 15.0, 7.0, 13.0, 18.0, 17.0, 22.0, 17.0, 25.0, 28.0, 34.0, 31.0, 28.0, 50.0, 45.0, 49.0, 39.0, 61.0, 43.0, 47.0, 49.0, 35.0, 41.0, 33.0, 28.0, 31.0, 27.0, 22.0, 23.0, 28.0, 17.0, 13.0, 12.0, 7.0, 7.0, 4.0, 8.0, 6.0, 6.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.0008392333984375, -0.0008132904767990112, -0.0007873475551605225, -0.0007614046335220337, -0.0007354617118835449, -0.0007095187902450562, -0.0006835758686065674, -0.0006576329469680786, -0.0006316900253295898, -0.0006057471036911011, -0.0005798041820526123, -0.0005538612604141235, -0.0005279183387756348, -0.000501975417137146, -0.0004760324954986572, -0.00045008957386016846, -0.0004241466522216797, -0.0003982037305831909, -0.00037226080894470215, -0.0003463178873062134, -0.0003203749656677246, -0.00029443204402923584, -0.00026848912239074707, -0.0002425462007522583, -0.00021660327911376953, -0.00019066035747528076, -0.000164717435836792, -0.00013877451419830322, -0.00011283159255981445, -8.688867092132568e-05, -6.0945749282836914e-05, -3.5002827644348145e-05, -9.059906005859375e-06, 1.6883015632629395e-05, 4.2825937271118164e-05, 6.876885890960693e-05, 9.47117805480957e-05, 0.00012065470218658447, 0.00014659762382507324, 0.000172540545463562, 0.00019848346710205078, 0.00022442638874053955, 0.0002503693103790283, 0.0002763122320175171, 0.00030225515365600586, 0.00032819807529449463, 0.0003541409969329834, 0.00038008391857147217, 0.00040602684020996094, 0.0004319697618484497, 0.0004579126834869385, 0.00048385560512542725, 0.000509798526763916, 0.0005357414484024048, 0.0005616843700408936, 0.0005876272916793823, 0.0006135702133178711, 0.0006395131349563599, 0.0006654560565948486, 0.0006913989782333374, 0.0007173418998718262, 0.0007432848215103149, 0.0007692277431488037, 0.0007951706647872925, 0.0008211135864257812]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 5.0, 5.0, 9.0, 8.0, 10.0, 16.0, 18.0, 31.0, 26.0, 25.0, 51.0, 63.0, 62.0, 120.0, 132.0, 183.0, 276.0, 445.0, 2024.0, 381307.0, 659019.0, 3157.0, 511.0, 279.0, 139.0, 147.0, 102.0, 99.0, 68.0, 43.0, 41.0, 37.0, 25.0, 22.0, 15.0, 10.0, 5.0, 5.0, 6.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0171966552734375, -0.016643047332763672, -0.016089439392089844, -0.015535831451416016, -0.014982223510742188, -0.01442861557006836, -0.013875007629394531, -0.013321399688720703, -0.012767791748046875, -0.012214183807373047, -0.011660575866699219, -0.01110696792602539, -0.010553359985351562, -0.009999752044677734, -0.009446144104003906, -0.008892536163330078, -0.00833892822265625, -0.007785320281982422, -0.007231712341308594, -0.006678104400634766, -0.0061244964599609375, -0.005570888519287109, -0.005017280578613281, -0.004463672637939453, -0.003910064697265625, -0.003356456756591797, -0.0028028488159179688, -0.0022492408752441406, -0.0016956329345703125, -0.0011420249938964844, -0.0005884170532226562, -3.4809112548828125e-05, 0.000518798828125, 0.0010724067687988281, 0.0016260147094726562, 0.0021796226501464844, 0.0027332305908203125, 0.0032868385314941406, 0.0038404464721679688, 0.004394054412841797, 0.004947662353515625, 0.005501270294189453, 0.006054878234863281, 0.006608486175537109, 0.0071620941162109375, 0.007715702056884766, 0.008269309997558594, 0.008822917938232422, 0.00937652587890625, 0.009930133819580078, 0.010483741760253906, 0.011037349700927734, 0.011590957641601562, 0.01214456558227539, 0.012698173522949219, 0.013251781463623047, 0.013805389404296875, 0.014358997344970703, 0.014912605285644531, 0.01546621322631836, 0.016019821166992188, 0.016573429107666016, 0.017127037048339844, 0.017680644989013672, 0.0182342529296875]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 9.0, 111.0, 634.0, 245.0, 18.0, 3.0, 1.0], "bins": [-0.008335847407579422, -0.008196127600967884, -0.008056406863033772, -0.007916687056422234, -0.007776966784149408, -0.007637246511876583, -0.007497526705265045, -0.00735780643299222, -0.007218086160719395, -0.0070783658884465694, -0.006938645616173744, -0.006798925809562206, -0.006659205537289381, -0.006519485265016556, -0.006379765458405018, -0.006240045186132193, -0.006100324913859367, -0.005960604641586542, -0.005820884369313717, -0.005681164562702179, -0.005541444290429354, -0.0054017240181565285, -0.0052620042115449905, -0.005122283939272165, -0.00498256366699934, -0.004842843394726515, -0.00470312312245369, -0.004563403315842152, -0.004423683043569326, -0.004283962771296501, -0.004144242964684963, -0.004004522692412138, -0.0038648024201393127, -0.0037250821478664875, -0.003585362108424306, -0.0034456420689821243, -0.003305921796709299, -0.003166201524436474, -0.0030264814849942923, -0.0028867614455521107, -0.0027470411732792854, -0.00260732090100646, -0.0024676008615642786, -0.002327880822122097, -0.0021881605498492718, -0.0020484402775764465, -0.001908720238134265, -0.0017690000822767615, -0.00162928004283458, -0.0014895598869770765, -0.0013498397311195731, -0.0012101195752620697, -0.0010703994194045663, -0.0009306792635470629, -0.0007909591076895595, -0.000651238951832056, -0.0005115187959745526, -0.0003717986401170492, -0.0002320784842595458, -9.235832840204239e-05, 4.7361827455461025e-05, 0.00018708198331296444, 0.00032680213917046785, 0.00046652229502797127, 0.0006062424508854747]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 1.0, 5.0, 4.0, 4.0, 13.0, 11.0, 6.0, 10.0, 9.0, 24.0, 27.0, 23.0, 23.0, 33.0, 35.0, 46.0, 33.0, 39.0, 41.0, 30.0, 37.0, 49.0, 50.0, 45.0, 30.0, 32.0, 47.0, 38.0, 33.0, 29.0, 32.0, 30.0, 20.0, 21.0, 20.0, 14.0, 13.0, 15.0, 5.0, 4.0, 5.0, 8.0, 2.0, 4.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.0005630254745483398, -0.0005469545722007751, -0.0005308836698532104, -0.0005148127675056458, -0.0004987418651580811, -0.00048267096281051636, -0.00046660006046295166, -0.00045052915811538696, -0.00043445825576782227, -0.00041838735342025757, -0.00040231645107269287, -0.0003862455487251282, -0.0003701746463775635, -0.0003541037440299988, -0.0003380328416824341, -0.0003219619393348694, -0.0003058910369873047, -0.00028982013463974, -0.0002737492322921753, -0.0002576783299446106, -0.0002416074275970459, -0.0002255365252494812, -0.0002094656229019165, -0.0001933947205543518, -0.0001773238182067871, -0.0001612529158592224, -0.00014518201351165771, -0.00012911111116409302, -0.00011304020881652832, -9.696930646896362e-05, -8.089840412139893e-05, -6.482750177383423e-05, -4.875659942626953e-05, -3.2685697078704834e-05, -1.6614794731140137e-05, -5.438923835754395e-07, 1.5527009963989258e-05, 3.1597912311553955e-05, 4.766881465911865e-05, 6.373971700668335e-05, 7.981061935424805e-05, 9.588152170181274e-05, 0.00011195242404937744, 0.00012802332639694214, 0.00014409422874450684, 0.00016016513109207153, 0.00017623603343963623, 0.00019230693578720093, 0.00020837783813476562, 0.00022444874048233032, 0.00024051964282989502, 0.0002565905451774597, 0.0002726614475250244, 0.0002887323498725891, 0.0003048032522201538, 0.0003208741545677185, 0.0003369450569152832, 0.0003530159592628479, 0.0003690868616104126, 0.0003851577639579773, 0.000401228666305542, 0.0004172995686531067, 0.0004333704710006714, 0.0004494413733482361, 0.0004655122756958008]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 3.0, 1.0, 2.0, 6.0, 4.0, 5.0, 8.0, 9.0, 9.0, 17.0, 14.0, 13.0, 19.0, 28.0, 31.0, 32.0, 23.0, 28.0, 31.0, 33.0, 48.0, 41.0, 46.0, 40.0, 54.0, 42.0, 46.0, 36.0, 36.0, 37.0, 28.0, 32.0, 29.0, 36.0, 21.0, 25.0, 21.0, 15.0, 12.0, 13.0, 8.0, 11.0, 5.0, 7.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.234375, -4.11993408203125, -4.0054931640625, -3.89105224609375, -3.776611328125, -3.66217041015625, -3.5477294921875, -3.43328857421875, -3.31884765625, -3.20440673828125, -3.0899658203125, -2.97552490234375, -2.861083984375, -2.74664306640625, -2.6322021484375, -2.51776123046875, -2.4033203125, -2.28887939453125, -2.1744384765625, -2.05999755859375, -1.945556640625, -1.83111572265625, -1.7166748046875, -1.60223388671875, -1.48779296875, -1.37335205078125, -1.2589111328125, -1.14447021484375, -1.030029296875, -0.91558837890625, -0.8011474609375, -0.68670654296875, -0.572265625, -0.45782470703125, -0.3433837890625, -0.22894287109375, -0.114501953125, -6.103515625e-05, 0.1143798828125, 0.22882080078125, 0.34326171875, 0.45770263671875, 0.5721435546875, 0.68658447265625, 0.801025390625, 0.91546630859375, 1.0299072265625, 1.14434814453125, 1.2587890625, 1.37322998046875, 1.4876708984375, 1.60211181640625, 1.716552734375, 1.83099365234375, 1.9454345703125, 2.05987548828125, 2.17431640625, 2.28875732421875, 2.4031982421875, 2.51763916015625, 2.632080078125, 2.74652099609375, 2.8609619140625, 2.97540283203125, 3.08984375]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 3.0, 9.0, 5.0, 11.0, 16.0, 22.0, 34.0, 38.0, 63.0, 88.0, 128.0, 229.0, 348.0, 509.0, 832.0, 1487.0, 2750.0, 5526.0, 12331.0, 31732.0, 97724.0, 326635.0, 382716.0, 119720.0, 37749.0, 14082.0, 6208.0, 3176.0, 1697.0, 1014.0, 609.0, 371.0, 250.0, 159.0, 83.0, 63.0, 36.0, 29.0, 29.0, 11.0, 9.0, 9.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.162109375, -3.0693359375, -2.9765625, -2.8837890625, -2.791015625, -2.6982421875, -2.60546875, -2.5126953125, -2.419921875, -2.3271484375, -2.234375, -2.1416015625, -2.048828125, -1.9560546875, -1.86328125, -1.7705078125, -1.677734375, -1.5849609375, -1.4921875, -1.3994140625, -1.306640625, -1.2138671875, -1.12109375, -1.0283203125, -0.935546875, -0.8427734375, -0.75, -0.6572265625, -0.564453125, -0.4716796875, -0.37890625, -0.2861328125, -0.193359375, -0.1005859375, -0.0078125, 0.0849609375, 0.177734375, 0.2705078125, 0.36328125, 0.4560546875, 0.548828125, 0.6416015625, 0.734375, 0.8271484375, 0.919921875, 1.0126953125, 1.10546875, 1.1982421875, 1.291015625, 1.3837890625, 1.4765625, 1.5693359375, 1.662109375, 1.7548828125, 1.84765625, 1.9404296875, 2.033203125, 2.1259765625, 2.21875, 2.3115234375, 2.404296875, 2.4970703125, 2.58984375, 2.6826171875, 2.775390625]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 4.0, 3.0, 6.0, 10.0, 8.0, 12.0, 23.0, 10.0, 26.0, 18.0, 23.0, 39.0, 29.0, 40.0, 49.0, 45.0, 36.0, 59.0, 133.0, 1713.0, 290.0, 86.0, 57.0, 50.0, 39.0, 43.0, 26.0, 33.0, 22.0, 27.0, 25.0, 20.0, 9.0, 12.0, 9.0, 5.0, 5.0, 2.0, 2.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.5625, -12.1258544921875, -11.689208984375, -11.2525634765625, -10.81591796875, -10.3792724609375, -9.942626953125, -9.5059814453125, -9.0693359375, -8.6326904296875, -8.196044921875, -7.7593994140625, -7.32275390625, -6.8861083984375, -6.449462890625, -6.0128173828125, -5.576171875, -5.1395263671875, -4.702880859375, -4.2662353515625, -3.82958984375, -3.3929443359375, -2.956298828125, -2.5196533203125, -2.0830078125, -1.6463623046875, -1.209716796875, -0.7730712890625, -0.33642578125, 0.1002197265625, 0.536865234375, 0.9735107421875, 1.41015625, 1.8468017578125, 2.283447265625, 2.7200927734375, 3.15673828125, 3.5933837890625, 4.030029296875, 4.4666748046875, 4.9033203125, 5.3399658203125, 5.776611328125, 6.2132568359375, 6.64990234375, 7.0865478515625, 7.523193359375, 7.9598388671875, 8.396484375, 8.8331298828125, 9.269775390625, 9.7064208984375, 10.14306640625, 10.5797119140625, 11.016357421875, 11.4530029296875, 11.8896484375, 12.3262939453125, 12.762939453125, 13.1995849609375, 13.63623046875, 14.0728759765625, 14.509521484375, 14.9461669921875, 15.3828125]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 0.0, 6.0, 4.0, 8.0, 9.0, 13.0, 13.0, 25.0, 32.0, 40.0, 32.0, 54.0, 77.0, 102.0, 219.0, 481.0, 1403.0, 9895.0, 2662709.0, 462585.0, 5783.0, 1150.0, 417.0, 209.0, 111.0, 80.0, 54.0, 36.0, 30.0, 34.0, 18.0, 13.0, 18.0, 15.0, 8.0, 3.0, 10.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.640625, -23.9345703125, -23.228515625, -22.5224609375, -21.81640625, -21.1103515625, -20.404296875, -19.6982421875, -18.9921875, -18.2861328125, -17.580078125, -16.8740234375, -16.16796875, -15.4619140625, -14.755859375, -14.0498046875, -13.34375, -12.6376953125, -11.931640625, -11.2255859375, -10.51953125, -9.8134765625, -9.107421875, -8.4013671875, -7.6953125, -6.9892578125, -6.283203125, -5.5771484375, -4.87109375, -4.1650390625, -3.458984375, -2.7529296875, -2.046875, -1.3408203125, -0.634765625, 0.0712890625, 0.77734375, 1.4833984375, 2.189453125, 2.8955078125, 3.6015625, 4.3076171875, 5.013671875, 5.7197265625, 6.42578125, 7.1318359375, 7.837890625, 8.5439453125, 9.25, 9.9560546875, 10.662109375, 11.3681640625, 12.07421875, 12.7802734375, 13.486328125, 14.1923828125, 14.8984375, 15.6044921875, 16.310546875, 17.0166015625, 17.72265625, 18.4287109375, 19.134765625, 19.8408203125, 20.546875]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 77.0, 932.0, 9.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.892574310302734, -7.472862243652344, -2.053150177001953, 3.3665618896484375, 8.786273956298828, 14.205986022949219, 19.62569808959961, 25.04541015625, 30.46512222290039, 35.88483428955078, 41.30454635620117, 46.72425842285156, 52.14397048950195, 57.563682556152344, 62.983394622802734, 68.40310668945312, 73.82281494140625, 79.24252319335938, 84.66223907470703, 90.08195495605469, 95.50166320800781, 100.92137145996094, 106.3410873413086, 111.76080322265625, 117.18051147460938, 122.6002197265625, 128.01992797851562, 133.4396514892578, 138.85935974121094, 144.27906799316406, 149.69879150390625, 155.11849975585938, 160.5382080078125, 165.95791625976562, 171.37762451171875, 176.79734802246094, 182.21705627441406, 187.6367645263672, 193.05648803710938, 198.4761962890625, 203.89590454101562, 209.31561279296875, 214.73532104492188, 220.15504455566406, 225.5747528076172, 230.9944610595703, 236.4141845703125, 241.83389282226562, 247.25360107421875, 252.67330932617188, 258.093017578125, 263.5127258300781, 268.93243408203125, 274.3521728515625, 279.7718811035156, 285.19158935546875, 290.6112976074219, 296.031005859375, 301.4507141113281, 306.87042236328125, 312.2901611328125, 317.7098693847656, 323.12957763671875, 328.5492858886719, 333.968994140625]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 5.0, 4.0, 4.0, 5.0, 12.0, 11.0, 12.0, 20.0, 16.0, 22.0, 24.0, 31.0, 28.0, 26.0, 31.0, 34.0, 39.0, 44.0, 44.0, 41.0, 39.0, 63.0, 33.0, 39.0, 47.0, 37.0, 25.0, 36.0, 20.0, 27.0, 26.0, 28.0, 23.0, 21.0, 23.0, 11.0, 17.0, 8.0, 4.0, 5.0, 5.0, 6.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0], "bins": [-43.85280227661133, -42.60800552368164, -41.36321258544922, -40.11841583251953, -38.87362289428711, -37.62882614135742, -36.384033203125, -35.13923645019531, -33.894439697265625, -32.64964294433594, -31.404850006103516, -30.160053253173828, -28.915258407592773, -27.67046356201172, -26.425668716430664, -25.18087387084961, -23.936079025268555, -22.6912841796875, -21.446489334106445, -20.20169448852539, -18.956897735595703, -17.71210289001465, -16.467308044433594, -15.222512245178223, -13.977717399597168, -12.732922554016113, -11.488126754760742, -10.243331909179688, -8.998537063598633, -7.753741264343262, -6.508946418762207, -5.264150619506836, -4.019355773925781, -2.7745604515075684, -1.5297653675079346, -0.2849702835083008, 0.9598250389099121, 2.204620361328125, 3.4494152069091797, 4.694211006164551, 5.9390058517456055, 7.183801174163818, 8.428596496582031, 9.673391342163086, 10.91818618774414, 12.162981986999512, 13.407776832580566, 14.652572631835938, 15.897367477416992, 17.142162322998047, 18.3869571685791, 19.631752014160156, 20.876548767089844, 22.1213436126709, 23.366138458251953, 24.61093521118164, 25.855728149414062, 27.100522994995117, 28.345317840576172, 29.59011459350586, 30.834909439086914, 32.07970428466797, 33.324501037597656, 34.56929397583008, 35.814090728759766]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 0.0, 1.0, 5.0, 6.0, 4.0, 6.0, 8.0, 13.0, 8.0, 14.0, 19.0, 13.0, 26.0, 31.0, 28.0, 26.0, 31.0, 25.0, 35.0, 40.0, 31.0, 53.0, 43.0, 44.0, 49.0, 45.0, 46.0, 33.0, 40.0, 30.0, 34.0, 28.0, 28.0, 26.0, 28.0, 23.0, 17.0, 20.0, 12.0, 5.0, 7.0, 12.0, 7.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.375, -4.25836181640625, -4.1417236328125, -4.02508544921875, -3.908447265625, -3.79180908203125, -3.6751708984375, -3.55853271484375, -3.44189453125, -3.32525634765625, -3.2086181640625, -3.09197998046875, -2.975341796875, -2.85870361328125, -2.7420654296875, -2.62542724609375, -2.5087890625, -2.39215087890625, -2.2755126953125, -2.15887451171875, -2.042236328125, -1.92559814453125, -1.8089599609375, -1.69232177734375, -1.57568359375, -1.45904541015625, -1.3424072265625, -1.22576904296875, -1.109130859375, -0.99249267578125, -0.8758544921875, -0.75921630859375, -0.642578125, -0.52593994140625, -0.4093017578125, -0.29266357421875, -0.176025390625, -0.05938720703125, 0.0572509765625, 0.17388916015625, 0.29052734375, 0.40716552734375, 0.5238037109375, 0.64044189453125, 0.757080078125, 0.87371826171875, 0.9903564453125, 1.10699462890625, 1.2236328125, 1.34027099609375, 1.4569091796875, 1.57354736328125, 1.690185546875, 1.80682373046875, 1.9234619140625, 2.04010009765625, 2.15673828125, 2.27337646484375, 2.3900146484375, 2.50665283203125, 2.623291015625, 2.73992919921875, 2.8565673828125, 2.97320556640625, 3.08984375]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 4.0, 6.0, 5.0, 6.0, 9.0, 9.0, 14.0, 19.0, 24.0, 29.0, 48.0, 57.0, 92.0, 188.0, 310.0, 656.0, 1799.0, 6148.0, 24191.0, 118035.0, 845851.0, 2346026.0, 715651.0, 105228.0, 21384.0, 5510.0, 1644.0, 609.0, 291.0, 143.0, 94.0, 52.0, 33.0, 27.0, 31.0, 14.0, 13.0, 7.0, 10.0, 10.0, 8.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-9.8515625, -9.59539794921875, -9.3392333984375, -9.08306884765625, -8.826904296875, -8.57073974609375, -8.3145751953125, -8.05841064453125, -7.80224609375, -7.54608154296875, -7.2899169921875, -7.03375244140625, -6.777587890625, -6.52142333984375, -6.2652587890625, -6.00909423828125, -5.7529296875, -5.49676513671875, -5.2406005859375, -4.98443603515625, -4.728271484375, -4.47210693359375, -4.2159423828125, -3.95977783203125, -3.70361328125, -3.44744873046875, -3.1912841796875, -2.93511962890625, -2.678955078125, -2.42279052734375, -2.1666259765625, -1.91046142578125, -1.654296875, -1.39813232421875, -1.1419677734375, -0.88580322265625, -0.629638671875, -0.37347412109375, -0.1173095703125, 0.13885498046875, 0.39501953125, 0.65118408203125, 0.9073486328125, 1.16351318359375, 1.419677734375, 1.67584228515625, 1.9320068359375, 2.18817138671875, 2.4443359375, 2.70050048828125, 2.9566650390625, 3.21282958984375, 3.468994140625, 3.72515869140625, 3.9813232421875, 4.23748779296875, 4.49365234375, 4.74981689453125, 5.0059814453125, 5.26214599609375, 5.518310546875, 5.77447509765625, 6.0306396484375, 6.28680419921875, 6.54296875]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 6.0, 7.0, 6.0, 4.0, 12.0, 22.0, 32.0, 28.0, 38.0, 81.0, 99.0, 165.0, 197.0, 303.0, 347.0, 432.0, 518.0, 483.0, 343.0, 264.0, 208.0, 137.0, 101.0, 82.0, 54.0, 39.0, 13.0, 18.0, 16.0, 6.0, 7.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.890625, -11.511962890625, -11.13330078125, -10.754638671875, -10.3759765625, -9.997314453125, -9.61865234375, -9.239990234375, -8.861328125, -8.482666015625, -8.10400390625, -7.725341796875, -7.3466796875, -6.968017578125, -6.58935546875, -6.210693359375, -5.83203125, -5.453369140625, -5.07470703125, -4.696044921875, -4.3173828125, -3.938720703125, -3.56005859375, -3.181396484375, -2.802734375, -2.424072265625, -2.04541015625, -1.666748046875, -1.2880859375, -0.909423828125, -0.53076171875, -0.152099609375, 0.2265625, 0.605224609375, 0.98388671875, 1.362548828125, 1.7412109375, 2.119873046875, 2.49853515625, 2.877197265625, 3.255859375, 3.634521484375, 4.01318359375, 4.391845703125, 4.7705078125, 5.149169921875, 5.52783203125, 5.906494140625, 6.28515625, 6.663818359375, 7.04248046875, 7.421142578125, 7.7998046875, 8.178466796875, 8.55712890625, 8.935791015625, 9.314453125, 9.693115234375, 10.07177734375, 10.450439453125, 10.8291015625, 11.207763671875, 11.58642578125, 11.965087890625, 12.34375]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 6.0, 9.0, 12.0, 10.0, 16.0, 27.0, 35.0, 41.0, 66.0, 118.0, 215.0, 438.0, 1467.0, 17892.0, 3077717.0, 1085786.0, 8502.0, 1066.0, 360.0, 189.0, 88.0, 75.0, 43.0, 41.0, 20.0, 15.0, 7.0, 7.0, 10.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.875, -35.50390625, -34.1328125, -32.76171875, -31.390625, -30.01953125, -28.6484375, -27.27734375, -25.90625, -24.53515625, -23.1640625, -21.79296875, -20.421875, -19.05078125, -17.6796875, -16.30859375, -14.9375, -13.56640625, -12.1953125, -10.82421875, -9.453125, -8.08203125, -6.7109375, -5.33984375, -3.96875, -2.59765625, -1.2265625, 0.14453125, 1.515625, 2.88671875, 4.2578125, 5.62890625, 7.0, 8.37109375, 9.7421875, 11.11328125, 12.484375, 13.85546875, 15.2265625, 16.59765625, 17.96875, 19.33984375, 20.7109375, 22.08203125, 23.453125, 24.82421875, 26.1953125, 27.56640625, 28.9375, 30.30859375, 31.6796875, 33.05078125, 34.421875, 35.79296875, 37.1640625, 38.53515625, 39.90625, 41.27734375, 42.6484375, 44.01953125, 45.390625, 46.76171875, 48.1328125, 49.50390625, 50.875]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 11.0, 54.0, 133.0, 294.0, 305.0, 150.0, 54.0, 6.0, 4.0, 1.0, 0.0, 1.0, 2.0], "bins": [-218.33181762695312, -214.36318969726562, -210.39456176757812, -206.4259490966797, -202.4573211669922, -198.4886932373047, -194.5200653076172, -190.55145263671875, -186.58282470703125, -182.61419677734375, -178.64556884765625, -174.6769561767578, -170.7083282470703, -166.7397003173828, -162.7710723876953, -158.80245971679688, -154.83383178710938, -150.86520385742188, -146.89657592773438, -142.92796325683594, -138.95933532714844, -134.99070739746094, -131.02207946777344, -127.05345916748047, -123.08483123779297, -119.11620330810547, -115.1475830078125, -111.178955078125, -107.21033477783203, -103.24170684814453, -99.27308654785156, -95.30445861816406, -91.33583068847656, -87.36720275878906, -83.3985824584961, -79.4299545288086, -75.46133422851562, -71.49270629882812, -67.52408599853516, -63.555458068847656, -59.58683776855469, -55.61821365356445, -51.64958953857422, -47.680965423583984, -43.71234130859375, -39.74371337890625, -35.77509307861328, -31.806467056274414, -27.837844848632812, -23.869220733642578, -19.900596618652344, -15.931971549987793, -11.963347434997559, -7.994722366333008, -4.026098251342773, -0.05747413635253906, 3.9111499786376953, 7.87977409362793, 11.848398208618164, 15.817023277282715, 19.785648345947266, 23.7542724609375, 27.722896575927734, 31.69152069091797, 35.6601448059082]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 3.0, 6.0, 12.0, 8.0, 12.0, 7.0, 13.0, 25.0, 17.0, 13.0, 15.0, 17.0, 21.0, 22.0, 35.0, 29.0, 34.0, 34.0, 24.0, 39.0, 27.0, 46.0, 39.0, 38.0, 38.0, 33.0, 31.0, 33.0, 34.0, 26.0, 28.0, 33.0, 21.0, 32.0, 24.0, 19.0, 16.0, 20.0, 18.0, 12.0, 10.0, 8.0, 6.0, 7.0, 5.0, 4.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-34.68035125732422, -33.65359878540039, -32.62684631347656, -31.600093841552734, -30.57334327697754, -29.54659080505371, -28.519838333129883, -27.493085861206055, -26.46633529663086, -25.43958282470703, -24.412830352783203, -23.386077880859375, -22.35932731628418, -21.33257484436035, -20.305822372436523, -19.279069900512695, -18.252317428588867, -17.22556495666504, -16.19881248474121, -15.1720609664917, -14.145309448242188, -13.11855697631836, -12.091804504394531, -11.065052032470703, -10.038300514221191, -9.011548042297363, -7.984796524047852, -6.958044052124023, -5.9312920570373535, -4.904540061950684, -3.8777875900268555, -2.8510355949401855, -1.8242835998535156, -0.7975314855575562, 0.22922062873840332, 1.2559728622436523, 2.2827248573303223, 3.309476852416992, 4.33622932434082, 5.36298131942749, 6.38973331451416, 7.41648530960083, 8.4432373046875, 9.469989776611328, 10.496742248535156, 11.523493766784668, 12.550246238708496, 13.576997756958008, 14.603750228881836, 15.630502700805664, 16.657255172729492, 17.684005737304688, 18.710758209228516, 19.737510681152344, 20.764263153076172, 21.791015625, 22.817768096923828, 23.844520568847656, 24.871273040771484, 25.898025512695312, 26.924776077270508, 27.951528549194336, 28.978281021118164, 30.005033493041992, 31.031784057617188]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 4.0, 5.0, 1.0, 6.0, 2.0, 2.0, 3.0, 11.0, 7.0, 11.0, 17.0, 21.0, 13.0, 19.0, 35.0, 28.0, 15.0, 31.0, 43.0, 39.0, 41.0, 48.0, 46.0, 41.0, 49.0, 46.0, 52.0, 31.0, 41.0, 38.0, 33.0, 39.0, 32.0, 28.0, 20.0, 25.0, 23.0, 19.0, 14.0, 11.0, 4.0, 7.0, 5.0, 3.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-4.734375, -4.6068115234375, -4.479248046875, -4.3516845703125, -4.22412109375, -4.0965576171875, -3.968994140625, -3.8414306640625, -3.7138671875, -3.5863037109375, -3.458740234375, -3.3311767578125, -3.20361328125, -3.0760498046875, -2.948486328125, -2.8209228515625, -2.693359375, -2.5657958984375, -2.438232421875, -2.3106689453125, -2.18310546875, -2.0555419921875, -1.927978515625, -1.8004150390625, -1.6728515625, -1.5452880859375, -1.417724609375, -1.2901611328125, -1.16259765625, -1.0350341796875, -0.907470703125, -0.7799072265625, -0.65234375, -0.5247802734375, -0.397216796875, -0.2696533203125, -0.14208984375, -0.0145263671875, 0.113037109375, 0.2406005859375, 0.3681640625, 0.4957275390625, 0.623291015625, 0.7508544921875, 0.87841796875, 1.0059814453125, 1.133544921875, 1.2611083984375, 1.388671875, 1.5162353515625, 1.643798828125, 1.7713623046875, 1.89892578125, 2.0264892578125, 2.154052734375, 2.2816162109375, 2.4091796875, 2.5367431640625, 2.664306640625, 2.7918701171875, 2.91943359375, 3.0469970703125, 3.174560546875, 3.3021240234375, 3.4296875]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 8.0, 10.0, 20.0, 19.0, 29.0, 53.0, 50.0, 105.0, 162.0, 225.0, 373.0, 530.0, 776.0, 1176.0, 1802.0, 2630.0, 4127.0, 6425.0, 9639.0, 15333.0, 24459.0, 40418.0, 67592.0, 111361.0, 172249.0, 199800.0, 149279.0, 92860.0, 55522.0, 33646.0, 20846.0, 13059.0, 8323.0, 5360.0, 3442.0, 2306.0, 1493.0, 1034.0, 643.0, 435.0, 292.0, 211.0, 141.0, 113.0, 66.0, 41.0, 27.0, 15.0, 20.0, 9.0, 3.0, 6.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.398681640625, -0.38634490966796875, -0.3740081787109375, -0.36167144775390625, -0.349334716796875, -0.33699798583984375, -0.3246612548828125, -0.31232452392578125, -0.29998779296875, -0.28765106201171875, -0.2753143310546875, -0.26297760009765625, -0.250640869140625, -0.23830413818359375, -0.2259674072265625, -0.21363067626953125, -0.2012939453125, -0.18895721435546875, -0.1766204833984375, -0.16428375244140625, -0.151947021484375, -0.13961029052734375, -0.1272735595703125, -0.11493682861328125, -0.10260009765625, -0.09026336669921875, -0.0779266357421875, -0.06558990478515625, -0.053253173828125, -0.04091644287109375, -0.0285797119140625, -0.01624298095703125, -0.00390625, 0.00843048095703125, 0.0207672119140625, 0.03310394287109375, 0.045440673828125, 0.05777740478515625, 0.0701141357421875, 0.08245086669921875, 0.09478759765625, 0.10712432861328125, 0.1194610595703125, 0.13179779052734375, 0.144134521484375, 0.15647125244140625, 0.1688079833984375, 0.18114471435546875, 0.1934814453125, 0.20581817626953125, 0.2181549072265625, 0.23049163818359375, 0.242828369140625, 0.25516510009765625, 0.2675018310546875, 0.27983856201171875, 0.29217529296875, 0.30451202392578125, 0.3168487548828125, 0.32918548583984375, 0.341522216796875, 0.35385894775390625, 0.3661956787109375, 0.37853240966796875, 0.390869140625]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 2.0, 9.0, 8.0, 10.0, 5.0, 11.0, 13.0, 19.0, 23.0, 19.0, 21.0, 29.0, 26.0, 21.0, 36.0, 37.0, 32.0, 31.0, 36.0, 27.0, 52.0, 1071.0, 39.0, 25.0, 39.0, 44.0, 38.0, 36.0, 22.0, 26.0, 24.0, 28.0, 23.0, 29.0, 14.0, 16.0, 11.0, 13.0, 10.0, 11.0, 11.0, 6.0, 6.0, 5.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-2.31640625, -2.246856689453125, -2.17730712890625, -2.107757568359375, -2.0382080078125, -1.968658447265625, -1.89910888671875, -1.829559326171875, -1.760009765625, -1.690460205078125, -1.62091064453125, -1.551361083984375, -1.4818115234375, -1.412261962890625, -1.34271240234375, -1.273162841796875, -1.20361328125, -1.134063720703125, -1.06451416015625, -0.994964599609375, -0.9254150390625, -0.855865478515625, -0.78631591796875, -0.716766357421875, -0.647216796875, -0.577667236328125, -0.50811767578125, -0.438568115234375, -0.3690185546875, -0.299468994140625, -0.22991943359375, -0.160369873046875, -0.0908203125, -0.021270751953125, 0.04827880859375, 0.117828369140625, 0.1873779296875, 0.256927490234375, 0.32647705078125, 0.396026611328125, 0.465576171875, 0.535125732421875, 0.60467529296875, 0.674224853515625, 0.7437744140625, 0.813323974609375, 0.88287353515625, 0.952423095703125, 1.02197265625, 1.091522216796875, 1.16107177734375, 1.230621337890625, 1.3001708984375, 1.369720458984375, 1.43927001953125, 1.508819580078125, 1.578369140625, 1.647918701171875, 1.71746826171875, 1.787017822265625, 1.8565673828125, 1.926116943359375, 1.99566650390625, 2.065216064453125, 2.134765625]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 5.0, 3.0, 0.0, 2.0, 8.0, 6.0, 9.0, 9.0, 11.0, 36.0, 44.0, 70.0, 89.0, 154.0, 216.0, 313.0, 426.0, 684.0, 1119.0, 1605.0, 2515.0, 3747.0, 5775.0, 9153.0, 13909.0, 21791.0, 33936.0, 53403.0, 83035.0, 122401.0, 184683.0, 1184701.0, 128063.0, 87529.0, 56515.0, 36103.0, 22957.0, 14693.0, 9391.0, 6238.0, 3999.0, 2666.0, 1728.0, 1116.0, 758.0, 522.0, 297.0, 241.0, 154.0, 100.0, 65.0, 57.0, 40.0, 25.0, 11.0, 9.0, 2.0, 2.0, 4.0, 5.0, 2.0, 0.0, 1.0], "bins": [-0.265869140625, -0.25757598876953125, -0.2492828369140625, -0.24098968505859375, -0.232696533203125, -0.22440338134765625, -0.2161102294921875, -0.20781707763671875, -0.19952392578125, -0.19123077392578125, -0.1829376220703125, -0.17464447021484375, -0.166351318359375, -0.15805816650390625, -0.1497650146484375, -0.14147186279296875, -0.1331787109375, -0.12488555908203125, -0.1165924072265625, -0.10829925537109375, -0.100006103515625, -0.09171295166015625, -0.0834197998046875, -0.07512664794921875, -0.06683349609375, -0.05854034423828125, -0.0502471923828125, -0.04195404052734375, -0.033660888671875, -0.02536773681640625, -0.0170745849609375, -0.00878143310546875, -0.00048828125, 0.00780487060546875, 0.0160980224609375, 0.02439117431640625, 0.032684326171875, 0.04097747802734375, 0.0492706298828125, 0.05756378173828125, 0.06585693359375, 0.07415008544921875, 0.0824432373046875, 0.09073638916015625, 0.099029541015625, 0.10732269287109375, 0.1156158447265625, 0.12390899658203125, 0.1322021484375, 0.14049530029296875, 0.1487884521484375, 0.15708160400390625, 0.165374755859375, 0.17366790771484375, 0.1819610595703125, 0.19025421142578125, 0.19854736328125, 0.20684051513671875, 0.2151336669921875, 0.22342681884765625, 0.231719970703125, 0.24001312255859375, 0.2483062744140625, 0.25659942626953125, 0.264892578125]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 7.0, 2.0, 1.0, 2.0, 4.0, 6.0, 8.0, 10.0, 7.0, 15.0, 17.0, 22.0, 28.0, 24.0, 34.0, 48.0, 31.0, 40.0, 54.0, 52.0, 66.0, 69.0, 55.0, 65.0, 55.0, 50.0, 37.0, 31.0, 25.0, 38.0, 11.0, 19.0, 17.0, 12.0, 10.0, 5.0, 8.0, 9.0, 3.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0010013580322265625, -0.0009725242853164673, -0.0009436905384063721, -0.0009148567914962769, -0.0008860230445861816, -0.0008571892976760864, -0.0008283555507659912, -0.000799521803855896, -0.0007706880569458008, -0.0007418543100357056, -0.0007130205631256104, -0.0006841868162155151, -0.0006553530693054199, -0.0006265193223953247, -0.0005976855754852295, -0.0005688518285751343, -0.0005400180816650391, -0.0005111843347549438, -0.00048235058784484863, -0.0004535168409347534, -0.0004246830940246582, -0.000395849347114563, -0.0003670156002044678, -0.00033818185329437256, -0.00030934810638427734, -0.00028051435947418213, -0.0002516806125640869, -0.0002228468656539917, -0.00019401311874389648, -0.00016517937183380127, -0.00013634562492370605, -0.00010751187801361084, -7.867813110351562e-05, -4.984438419342041e-05, -2.1010637283325195e-05, 7.82310962677002e-06, 3.6656856536865234e-05, 6.549060344696045e-05, 9.432435035705566e-05, 0.00012315809726715088, 0.0001519918441772461, 0.0001808255910873413, 0.00020965933799743652, 0.00023849308490753174, 0.00026732683181762695, 0.00029616057872772217, 0.0003249943256378174, 0.0003538280725479126, 0.0003826618194580078, 0.00041149556636810303, 0.00044032931327819824, 0.00046916306018829346, 0.0004979968070983887, 0.0005268305540084839, 0.0005556643009185791, 0.0005844980478286743, 0.0006133317947387695, 0.0006421655416488647, 0.00067099928855896, 0.0006998330354690552, 0.0007286667823791504, 0.0007575005292892456, 0.0007863342761993408, 0.000815168023109436, 0.0008440017700195312]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 9.0, 10.0, 7.0, 11.0, 13.0, 22.0, 21.0, 31.0, 30.0, 39.0, 55.0, 63.0, 103.0, 157.0, 195.0, 305.0, 570.0, 3645.0, 470272.0, 567181.0, 4188.0, 607.0, 318.0, 182.0, 122.0, 86.0, 81.0, 57.0, 48.0, 31.0, 19.0, 16.0, 13.0, 13.0, 11.0, 8.0, 3.0, 7.0, 4.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.016571044921875, -0.016019105911254883, -0.015467166900634766, -0.014915227890014648, -0.014363288879394531, -0.013811349868774414, -0.013259410858154297, -0.01270747184753418, -0.012155532836914062, -0.011603593826293945, -0.011051654815673828, -0.010499715805053711, -0.009947776794433594, -0.009395837783813477, -0.00884389877319336, -0.008291959762573242, -0.007740020751953125, -0.007188081741333008, -0.006636142730712891, -0.0060842037200927734, -0.005532264709472656, -0.004980325698852539, -0.004428386688232422, -0.0038764476776123047, -0.0033245086669921875, -0.0027725696563720703, -0.002220630645751953, -0.001668691635131836, -0.0011167526245117188, -0.0005648136138916016, -1.2874603271484375e-05, 0.0005390644073486328, 0.00109100341796875, 0.0016429424285888672, 0.0021948814392089844, 0.0027468204498291016, 0.0032987594604492188, 0.003850698471069336, 0.004402637481689453, 0.00495457649230957, 0.0055065155029296875, 0.006058454513549805, 0.006610393524169922, 0.007162332534790039, 0.007714271545410156, 0.008266210556030273, 0.00881814956665039, 0.009370088577270508, 0.009922027587890625, 0.010473966598510742, 0.01102590560913086, 0.011577844619750977, 0.012129783630371094, 0.012681722640991211, 0.013233661651611328, 0.013785600662231445, 0.014337539672851562, 0.01488947868347168, 0.015441417694091797, 0.015993356704711914, 0.01654529571533203, 0.01709723472595215, 0.017649173736572266, 0.018201112747192383, 0.0187530517578125]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 41.0, 444.0, 486.0, 44.0], "bins": [-0.009929399937391281, -0.009769328869879246, -0.00960925780236721, -0.009449186734855175, -0.00928911566734314, -0.009129044599831104, -0.008968973532319069, -0.008808901533484459, -0.008648830465972424, -0.008488759398460388, -0.008328688330948353, -0.008168617263436317, -0.008008546195924282, -0.007848475128412247, -0.007688403595238924, -0.007528332527726889, -0.007368261925876141, -0.007208190858364105, -0.00704811979085207, -0.0068880487233400345, -0.006727977190166712, -0.0065679061226546764, -0.006407835055142641, -0.006247763987630606, -0.006087692454457283, -0.005927621386945248, -0.005767550319433212, -0.005607479251921177, -0.005447407718747854, -0.005287336651235819, -0.0051272655837237835, -0.004967194516211748, -0.004807123448699713, -0.004647052381187677, -0.004486981313675642, -0.004326909780502319, -0.004166838712990284, -0.004006767645478249, -0.0038466965779662132, -0.003686625510454178, -0.0035265544429421425, -0.003366483375430107, -0.003206412075087428, -0.0030463410075753927, -0.0028862699400633574, -0.0027261986397206783, -0.002566127572208643, -0.0024060565046966076, -0.0022459852043539286, -0.002085914136841893, -0.001925842952914536, -0.0017657717689871788, -0.0016057007014751434, -0.0014456295175477862, -0.001285558333620429, -0.0011254872661083937, -0.0009654160821810365, -0.0008053449564613402, -0.0006452738307416439, -0.0004852026468142867, -0.0003251315210945904, -0.00016506039537489414, -4.989211447536945e-06, 0.00015508185606449842, 0.0003151530399918556]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 4.0, 5.0, 4.0, 5.0, 6.0, 4.0, 18.0, 14.0, 15.0, 13.0, 23.0, 20.0, 19.0, 25.0, 33.0, 24.0, 40.0, 29.0, 50.0, 47.0, 42.0, 42.0, 45.0, 50.0, 35.0, 50.0, 36.0, 33.0, 29.0, 36.0, 33.0, 31.0, 30.0, 20.0, 17.0, 20.0, 14.0, 12.0, 6.0, 9.0, 8.0, 4.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00041961669921875, -0.0004038959741592407, -0.00038817524909973145, -0.00037245452404022217, -0.0003567337989807129, -0.0003410130739212036, -0.00032529234886169434, -0.00030957162380218506, -0.0002938508987426758, -0.0002781301736831665, -0.0002624094486236572, -0.00024668872356414795, -0.00023096799850463867, -0.0002152472734451294, -0.00019952654838562012, -0.00018380582332611084, -0.00016808509826660156, -0.00015236437320709229, -0.000136643648147583, -0.00012092292308807373, -0.00010520219802856445, -8.948147296905518e-05, -7.37607479095459e-05, -5.804002285003662e-05, -4.2319297790527344e-05, -2.6598572731018066e-05, -1.0877847671508789e-05, 4.842877388000488e-06, 2.0563602447509766e-05, 3.628432750701904e-05, 5.200505256652832e-05, 6.77257776260376e-05, 8.344650268554688e-05, 9.916722774505615e-05, 0.00011488795280456543, 0.0001306086778640747, 0.00014632940292358398, 0.00016205012798309326, 0.00017777085304260254, 0.00019349157810211182, 0.0002092123031616211, 0.00022493302822113037, 0.00024065375328063965, 0.0002563744783401489, 0.0002720952033996582, 0.0002878159284591675, 0.00030353665351867676, 0.00031925737857818604, 0.0003349781036376953, 0.0003506988286972046, 0.00036641955375671387, 0.00038214027881622314, 0.0003978610038757324, 0.0004135817289352417, 0.000429302453994751, 0.00044502317905426025, 0.00046074390411376953, 0.0004764646291732788, 0.0004921853542327881, 0.0005079060792922974, 0.0005236268043518066, 0.0005393475294113159, 0.0005550682544708252, 0.0005707889795303345, 0.0005865097045898438]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 4.0, 5.0, 1.0, 6.0, 2.0, 2.0, 3.0, 11.0, 7.0, 11.0, 17.0, 21.0, 13.0, 19.0, 35.0, 28.0, 15.0, 31.0, 43.0, 39.0, 41.0, 48.0, 46.0, 40.0, 50.0, 46.0, 52.0, 31.0, 41.0, 38.0, 33.0, 39.0, 32.0, 28.0, 20.0, 25.0, 23.0, 19.0, 14.0, 11.0, 4.0, 7.0, 5.0, 3.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-4.734375, -4.6068115234375, -4.479248046875, -4.3516845703125, -4.22412109375, -4.0965576171875, -3.968994140625, -3.8414306640625, -3.7138671875, -3.5863037109375, -3.458740234375, -3.3311767578125, -3.20361328125, -3.0760498046875, -2.948486328125, -2.8209228515625, -2.693359375, -2.5657958984375, -2.438232421875, -2.3106689453125, -2.18310546875, -2.0555419921875, -1.927978515625, -1.8004150390625, -1.6728515625, -1.5452880859375, -1.417724609375, -1.2901611328125, -1.16259765625, -1.0350341796875, -0.907470703125, -0.7799072265625, -0.65234375, -0.5247802734375, -0.397216796875, -0.2696533203125, -0.14208984375, -0.0145263671875, 0.113037109375, 0.2406005859375, 0.3681640625, 0.4957275390625, 0.623291015625, 0.7508544921875, 0.87841796875, 1.0059814453125, 1.133544921875, 1.2611083984375, 1.388671875, 1.5162353515625, 1.643798828125, 1.7713623046875, 1.89892578125, 2.0264892578125, 2.154052734375, 2.2816162109375, 2.4091796875, 2.5367431640625, 2.664306640625, 2.7918701171875, 2.91943359375, 3.0469970703125, 3.174560546875, 3.3021240234375, 3.4296875]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 6.0, 6.0, 8.0, 6.0, 12.0, 17.0, 40.0, 55.0, 80.0, 108.0, 190.0, 281.0, 504.0, 693.0, 1235.0, 2192.0, 3542.0, 6616.0, 13194.0, 29266.0, 77311.0, 219814.0, 383117.0, 190740.0, 67208.0, 26029.0, 11668.0, 6128.0, 3386.0, 1987.0, 1186.0, 681.0, 476.0, 251.0, 181.0, 118.0, 82.0, 49.0, 37.0, 24.0, 12.0, 9.0, 3.0, 2.0, 1.0, 4.0, 4.0, 0.0, 1.0, 1.0], "bins": [-3.04296875, -2.959442138671875, -2.87591552734375, -2.792388916015625, -2.7088623046875, -2.625335693359375, -2.54180908203125, -2.458282470703125, -2.374755859375, -2.291229248046875, -2.20770263671875, -2.124176025390625, -2.0406494140625, -1.957122802734375, -1.87359619140625, -1.790069580078125, -1.70654296875, -1.623016357421875, -1.53948974609375, -1.455963134765625, -1.3724365234375, -1.288909912109375, -1.20538330078125, -1.121856689453125, -1.038330078125, -0.954803466796875, -0.87127685546875, -0.787750244140625, -0.7042236328125, -0.620697021484375, -0.53717041015625, -0.453643798828125, -0.3701171875, -0.286590576171875, -0.20306396484375, -0.119537353515625, -0.0360107421875, 0.047515869140625, 0.13104248046875, 0.214569091796875, 0.298095703125, 0.381622314453125, 0.46514892578125, 0.548675537109375, 0.6322021484375, 0.715728759765625, 0.79925537109375, 0.882781982421875, 0.96630859375, 1.049835205078125, 1.13336181640625, 1.216888427734375, 1.3004150390625, 1.383941650390625, 1.46746826171875, 1.550994873046875, 1.634521484375, 1.718048095703125, 1.80157470703125, 1.885101318359375, 1.9686279296875, 2.052154541015625, 2.13568115234375, 2.219207763671875, 2.302734375]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 3.0, 5.0, 3.0, 1.0, 4.0, 6.0, 7.0, 12.0, 5.0, 17.0, 14.0, 17.0, 21.0, 30.0, 28.0, 40.0, 30.0, 40.0, 39.0, 46.0, 41.0, 70.0, 268.0, 1653.0, 175.0, 74.0, 50.0, 52.0, 44.0, 38.0, 32.0, 32.0, 19.0, 21.0, 23.0, 20.0, 14.0, 12.0, 13.0, 7.0, 7.0, 5.0, 2.0, 2.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.953125, -13.52197265625, -13.0908203125, -12.65966796875, -12.228515625, -11.79736328125, -11.3662109375, -10.93505859375, -10.50390625, -10.07275390625, -9.6416015625, -9.21044921875, -8.779296875, -8.34814453125, -7.9169921875, -7.48583984375, -7.0546875, -6.62353515625, -6.1923828125, -5.76123046875, -5.330078125, -4.89892578125, -4.4677734375, -4.03662109375, -3.60546875, -3.17431640625, -2.7431640625, -2.31201171875, -1.880859375, -1.44970703125, -1.0185546875, -0.58740234375, -0.15625, 0.27490234375, 0.7060546875, 1.13720703125, 1.568359375, 1.99951171875, 2.4306640625, 2.86181640625, 3.29296875, 3.72412109375, 4.1552734375, 4.58642578125, 5.017578125, 5.44873046875, 5.8798828125, 6.31103515625, 6.7421875, 7.17333984375, 7.6044921875, 8.03564453125, 8.466796875, 8.89794921875, 9.3291015625, 9.76025390625, 10.19140625, 10.62255859375, 11.0537109375, 11.48486328125, 11.916015625, 12.34716796875, 12.7783203125, 13.20947265625, 13.640625]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 1.0, 7.0, 10.0, 9.0, 10.0, 21.0, 20.0, 36.0, 29.0, 47.0, 61.0, 93.0, 142.0, 246.0, 519.0, 1580.0, 22637.0, 3076970.0, 39973.0, 1909.0, 565.0, 257.0, 147.0, 91.0, 86.0, 62.0, 42.0, 29.0, 26.0, 13.0, 11.0, 15.0, 6.0, 8.0, 5.0, 4.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-28.78125, -27.971923828125, -27.16259765625, -26.353271484375, -25.5439453125, -24.734619140625, -23.92529296875, -23.115966796875, -22.306640625, -21.497314453125, -20.68798828125, -19.878662109375, -19.0693359375, -18.260009765625, -17.45068359375, -16.641357421875, -15.83203125, -15.022705078125, -14.21337890625, -13.404052734375, -12.5947265625, -11.785400390625, -10.97607421875, -10.166748046875, -9.357421875, -8.548095703125, -7.73876953125, -6.929443359375, -6.1201171875, -5.310791015625, -4.50146484375, -3.692138671875, -2.8828125, -2.073486328125, -1.26416015625, -0.454833984375, 0.3544921875, 1.163818359375, 1.97314453125, 2.782470703125, 3.591796875, 4.401123046875, 5.21044921875, 6.019775390625, 6.8291015625, 7.638427734375, 8.44775390625, 9.257080078125, 10.06640625, 10.875732421875, 11.68505859375, 12.494384765625, 13.3037109375, 14.113037109375, 14.92236328125, 15.731689453125, 16.541015625, 17.350341796875, 18.15966796875, 18.968994140625, 19.7783203125, 20.587646484375, 21.39697265625, 22.206298828125, 23.015625]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 14.0, 927.0, 76.0, 0.0, 1.0], "bins": [-343.09576416015625, -337.4305114746094, -331.7652587890625, -326.0999755859375, -320.4347229003906, -314.76947021484375, -309.1042175292969, -303.43896484375, -297.773681640625, -292.1084289550781, -286.44317626953125, -280.77789306640625, -275.1126403808594, -269.4473876953125, -263.7821350097656, -258.11688232421875, -252.45162963867188, -246.786376953125, -241.12110900878906, -235.4558563232422, -229.79058837890625, -224.12533569335938, -218.4600830078125, -212.79483032226562, -207.1295623779297, -201.4643096923828, -195.79904174804688, -190.1337890625, -184.46853637695312, -178.8032684326172, -173.1380157470703, -167.47274780273438, -161.80751037597656, -156.1422576904297, -150.47698974609375, -144.81173706054688, -139.146484375, -133.48121643066406, -127.81596374511719, -122.15070343017578, -116.48544311523438, -110.82018280029297, -105.15492248535156, -99.48966979980469, -93.82440948486328, -88.15914916992188, -82.493896484375, -76.8286361694336, -71.16337585449219, -65.49811553955078, -59.83285903930664, -54.1676025390625, -48.502342224121094, -42.83708190917969, -37.17182540893555, -31.506568908691406, -25.841306686401367, -20.176048278808594, -14.51078987121582, -8.845531463623047, -3.1802730560302734, 2.4849853515625, 8.150243759155273, 13.815500259399414, 19.48076057434082]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 3.0, 4.0, 4.0, 6.0, 19.0, 16.0, 10.0, 12.0, 16.0, 17.0, 15.0, 18.0, 22.0, 16.0, 24.0, 36.0, 40.0, 40.0, 30.0, 45.0, 38.0, 33.0, 39.0, 30.0, 30.0, 49.0, 38.0, 27.0, 34.0, 32.0, 27.0, 18.0, 24.0, 26.0, 29.0, 15.0, 16.0, 13.0, 15.0, 19.0, 14.0, 9.0, 8.0, 7.0, 5.0, 1.0, 2.0, 5.0, 2.0, 3.0, 3.0, 0.0, 1.0], "bins": [-38.482540130615234, -37.325347900390625, -36.16815185546875, -35.01095962524414, -33.853763580322266, -32.696571350097656, -31.539377212524414, -30.382183074951172, -29.22498893737793, -28.067794799804688, -26.910600662231445, -25.753406524658203, -24.596214294433594, -23.43901824951172, -22.28182601928711, -21.124631881713867, -19.967437744140625, -18.810243606567383, -17.65304946899414, -16.4958553314209, -15.338662147521973, -14.18146800994873, -13.024274826049805, -11.867080688476562, -10.70988655090332, -9.552692413330078, -8.395498275756836, -7.23830509185791, -6.081110954284668, -4.923916816711426, -3.766723155975342, -2.609529495239258, -1.4523353576660156, -0.29514145851135254, 0.8620524406433105, 2.0192463397979736, 3.1764402389526367, 4.333634376525879, 5.490828037261963, 6.648021697998047, 7.805215835571289, 8.962409973144531, 10.119604110717773, 11.2767972946167, 12.433991432189941, 13.591185569763184, 14.74837875366211, 15.905572891235352, 17.062767028808594, 18.219961166381836, 19.377155303955078, 20.53434944152832, 21.691543579101562, 22.848735809326172, 24.005929946899414, 25.163124084472656, 26.3203182220459, 27.47751235961914, 28.634706497192383, 29.791900634765625, 30.949092864990234, 32.10628890991211, 33.26348114013672, 34.420677185058594, 35.5778694152832]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 2.0, 1.0, 5.0, 4.0, 2.0, 3.0, 6.0, 12.0, 7.0, 14.0, 14.0, 19.0, 19.0, 33.0, 19.0, 26.0, 23.0, 20.0, 40.0, 34.0, 53.0, 53.0, 40.0, 55.0, 40.0, 52.0, 45.0, 29.0, 34.0, 42.0, 37.0, 32.0, 32.0, 27.0, 22.0, 19.0, 22.0, 20.0, 11.0, 10.0, 10.0, 6.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.75, -4.62127685546875, -4.4925537109375, -4.36383056640625, -4.235107421875, -4.10638427734375, -3.9776611328125, -3.84893798828125, -3.72021484375, -3.59149169921875, -3.4627685546875, -3.33404541015625, -3.205322265625, -3.07659912109375, -2.9478759765625, -2.81915283203125, -2.6904296875, -2.56170654296875, -2.4329833984375, -2.30426025390625, -2.175537109375, -2.04681396484375, -1.9180908203125, -1.78936767578125, -1.66064453125, -1.53192138671875, -1.4031982421875, -1.27447509765625, -1.145751953125, -1.01702880859375, -0.8883056640625, -0.75958251953125, -0.630859375, -0.50213623046875, -0.3734130859375, -0.24468994140625, -0.115966796875, 0.01275634765625, 0.1414794921875, 0.27020263671875, 0.39892578125, 0.52764892578125, 0.6563720703125, 0.78509521484375, 0.913818359375, 1.04254150390625, 1.1712646484375, 1.29998779296875, 1.4287109375, 1.55743408203125, 1.6861572265625, 1.81488037109375, 1.943603515625, 2.07232666015625, 2.2010498046875, 2.32977294921875, 2.45849609375, 2.58721923828125, 2.7159423828125, 2.84466552734375, 2.973388671875, 3.10211181640625, 3.2308349609375, 3.35955810546875, 3.48828125]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 3.0, 9.0, 4.0, 8.0, 10.0, 9.0, 13.0, 9.0, 22.0, 21.0, 40.0, 49.0, 69.0, 99.0, 201.0, 439.0, 1617.0, 8985.0, 73562.0, 1108855.0, 2709913.0, 261128.0, 24111.0, 3608.0, 770.0, 286.0, 136.0, 88.0, 52.0, 31.0, 25.0, 23.0, 22.0, 19.0, 13.0, 11.0, 9.0, 4.0, 3.0, 2.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.8125, -14.414794921875, -14.01708984375, -13.619384765625, -13.2216796875, -12.823974609375, -12.42626953125, -12.028564453125, -11.630859375, -11.233154296875, -10.83544921875, -10.437744140625, -10.0400390625, -9.642333984375, -9.24462890625, -8.846923828125, -8.44921875, -8.051513671875, -7.65380859375, -7.256103515625, -6.8583984375, -6.460693359375, -6.06298828125, -5.665283203125, -5.267578125, -4.869873046875, -4.47216796875, -4.074462890625, -3.6767578125, -3.279052734375, -2.88134765625, -2.483642578125, -2.0859375, -1.688232421875, -1.29052734375, -0.892822265625, -0.4951171875, -0.097412109375, 0.30029296875, 0.697998046875, 1.095703125, 1.493408203125, 1.89111328125, 2.288818359375, 2.6865234375, 3.084228515625, 3.48193359375, 3.879638671875, 4.27734375, 4.675048828125, 5.07275390625, 5.470458984375, 5.8681640625, 6.265869140625, 6.66357421875, 7.061279296875, 7.458984375, 7.856689453125, 8.25439453125, 8.652099609375, 9.0498046875, 9.447509765625, 9.84521484375, 10.242919921875, 10.640625]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 9.0, 17.0, 19.0, 33.0, 62.0, 112.0, 120.0, 166.0, 241.0, 343.0, 491.0, 571.0, 515.0, 404.0, 300.0, 202.0, 142.0, 114.0, 74.0, 50.0, 29.0, 21.0, 10.0, 9.0, 5.0, 5.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.46875, -16.0213623046875, -15.573974609375, -15.1265869140625, -14.67919921875, -14.2318115234375, -13.784423828125, -13.3370361328125, -12.8896484375, -12.4422607421875, -11.994873046875, -11.5474853515625, -11.10009765625, -10.6527099609375, -10.205322265625, -9.7579345703125, -9.310546875, -8.8631591796875, -8.415771484375, -7.9683837890625, -7.52099609375, -7.0736083984375, -6.626220703125, -6.1788330078125, -5.7314453125, -5.2840576171875, -4.836669921875, -4.3892822265625, -3.94189453125, -3.4945068359375, -3.047119140625, -2.5997314453125, -2.15234375, -1.7049560546875, -1.257568359375, -0.8101806640625, -0.36279296875, 0.0845947265625, 0.531982421875, 0.9793701171875, 1.4267578125, 1.8741455078125, 2.321533203125, 2.7689208984375, 3.21630859375, 3.6636962890625, 4.111083984375, 4.5584716796875, 5.005859375, 5.4532470703125, 5.900634765625, 6.3480224609375, 6.79541015625, 7.2427978515625, 7.690185546875, 8.1375732421875, 8.5849609375, 9.0323486328125, 9.479736328125, 9.9271240234375, 10.37451171875, 10.8218994140625, 11.269287109375, 11.7166748046875, 12.1640625]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 4.0, 8.0, 24.0, 15.0, 25.0, 34.0, 38.0, 65.0, 87.0, 106.0, 183.0, 258.0, 583.0, 1667.0, 14588.0, 607134.0, 3474986.0, 88043.0, 4374.0, 930.0, 399.0, 214.0, 159.0, 81.0, 62.0, 53.0, 45.0, 24.0, 25.0, 13.0, 10.0, 12.0, 8.0, 5.0, 7.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-32.625, -31.58154296875, -30.5380859375, -29.49462890625, -28.451171875, -27.40771484375, -26.3642578125, -25.32080078125, -24.27734375, -23.23388671875, -22.1904296875, -21.14697265625, -20.103515625, -19.06005859375, -18.0166015625, -16.97314453125, -15.9296875, -14.88623046875, -13.8427734375, -12.79931640625, -11.755859375, -10.71240234375, -9.6689453125, -8.62548828125, -7.58203125, -6.53857421875, -5.4951171875, -4.45166015625, -3.408203125, -2.36474609375, -1.3212890625, -0.27783203125, 0.765625, 1.80908203125, 2.8525390625, 3.89599609375, 4.939453125, 5.98291015625, 7.0263671875, 8.06982421875, 9.11328125, 10.15673828125, 11.2001953125, 12.24365234375, 13.287109375, 14.33056640625, 15.3740234375, 16.41748046875, 17.4609375, 18.50439453125, 19.5478515625, 20.59130859375, 21.634765625, 22.67822265625, 23.7216796875, 24.76513671875, 25.80859375, 26.85205078125, 27.8955078125, 28.93896484375, 29.982421875, 31.02587890625, 32.0693359375, 33.11279296875, 34.15625]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 11.0, 35.0, 111.0, 181.0, 272.0, 226.0, 115.0, 42.0, 12.0, 10.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.71157455444336, -36.8895263671875, -33.06747817993164, -29.24542999267578, -25.423381805419922, -21.601333618164062, -17.779285430908203, -13.957237243652344, -10.135189056396484, -6.313140869140625, -2.4910926818847656, 1.3309555053710938, 5.153003692626953, 8.975051879882812, 12.797100067138672, 16.61914825439453, 20.44119644165039, 24.26324462890625, 28.08529281616211, 31.90734100341797, 35.72938919067383, 39.55143737792969, 43.37348556518555, 47.195533752441406, 51.017581939697266, 54.839630126953125, 58.661678314208984, 62.483726501464844, 66.30577087402344, 70.12782287597656, 73.94987487792969, 77.77191925048828, 81.59396362304688, 85.416015625, 89.2380599975586, 93.06010437011719, 96.88215637207031, 100.70420837402344, 104.52625274658203, 108.34829711914062, 112.17034912109375, 115.99240112304688, 119.81444549560547, 123.63648986816406, 127.45854187011719, 131.2805938720703, 135.10263061523438, 138.9246826171875, 142.74673461914062, 146.56878662109375, 150.39083862304688, 154.21287536621094, 158.03492736816406, 161.8569793701172, 165.67901611328125, 169.50106811523438, 173.3231201171875, 177.14517211914062, 180.96722412109375, 184.7892608642578, 188.61131286621094, 192.43336486816406, 196.25540161132812, 200.07745361328125, 203.89950561523438]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 7.0, 7.0, 9.0, 6.0, 14.0, 13.0, 14.0, 19.0, 16.0, 23.0, 24.0, 21.0, 29.0, 34.0, 30.0, 33.0, 27.0, 37.0, 33.0, 30.0, 42.0, 47.0, 48.0, 39.0, 34.0, 34.0, 32.0, 31.0, 36.0, 33.0, 22.0, 25.0, 25.0, 25.0, 14.0, 19.0, 11.0, 11.0, 8.0, 10.0, 6.0, 7.0, 8.0, 1.0, 3.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-30.23828125, -29.138547897338867, -28.038814544677734, -26.9390811920166, -25.83934783935547, -24.739614486694336, -23.639881134033203, -22.54014778137207, -21.440414428710938, -20.340681076049805, -19.240947723388672, -18.14121437072754, -17.041481018066406, -15.941747665405273, -14.84201431274414, -13.742280960083008, -12.642547607421875, -11.542814254760742, -10.44308090209961, -9.343347549438477, -8.243614196777344, -7.143880844116211, -6.044147491455078, -4.944414138793945, -3.8446807861328125, -2.7449474334716797, -1.6452140808105469, -0.5454807281494141, 0.5542526245117188, 1.6539859771728516, 2.7537193298339844, 3.853452682495117, 4.95318603515625, 6.052919387817383, 7.152652740478516, 8.252386093139648, 9.352119445800781, 10.451852798461914, 11.551586151123047, 12.65131950378418, 13.751052856445312, 14.850786209106445, 15.950519561767578, 17.05025291442871, 18.149986267089844, 19.249719619750977, 20.34945297241211, 21.449186325073242, 22.548919677734375, 23.648653030395508, 24.74838638305664, 25.848119735717773, 26.947853088378906, 28.04758644104004, 29.147319793701172, 30.247053146362305, 31.346786499023438, 32.44651794433594, 33.5462532043457, 34.64598846435547, 35.74571990966797, 36.84545135498047, 37.945186614990234, 39.044921875, 40.1446533203125]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 5.0, 2.0, 2.0, 5.0, 9.0, 5.0, 2.0, 5.0, 11.0, 12.0, 21.0, 22.0, 24.0, 21.0, 30.0, 29.0, 33.0, 26.0, 21.0, 34.0, 39.0, 45.0, 50.0, 39.0, 41.0, 43.0, 43.0, 45.0, 37.0, 34.0, 29.0, 37.0, 38.0, 20.0, 21.0, 21.0, 18.0, 21.0, 13.0, 14.0, 5.0, 13.0, 7.0, 5.0, 2.0, 6.0, 3.0, 3.0, 3.0], "bins": [-4.859375, -4.734893798828125, -4.61041259765625, -4.485931396484375, -4.3614501953125, -4.236968994140625, -4.11248779296875, -3.988006591796875, -3.863525390625, -3.739044189453125, -3.61456298828125, -3.490081787109375, -3.3656005859375, -3.241119384765625, -3.11663818359375, -2.992156982421875, -2.86767578125, -2.743194580078125, -2.61871337890625, -2.494232177734375, -2.3697509765625, -2.245269775390625, -2.12078857421875, -1.996307373046875, -1.871826171875, -1.747344970703125, -1.62286376953125, -1.498382568359375, -1.3739013671875, -1.249420166015625, -1.12493896484375, -1.000457763671875, -0.8759765625, -0.751495361328125, -0.62701416015625, -0.502532958984375, -0.3780517578125, -0.253570556640625, -0.12908935546875, -0.004608154296875, 0.119873046875, 0.244354248046875, 0.36883544921875, 0.493316650390625, 0.6177978515625, 0.742279052734375, 0.86676025390625, 0.991241455078125, 1.11572265625, 1.240203857421875, 1.36468505859375, 1.489166259765625, 1.6136474609375, 1.738128662109375, 1.86260986328125, 1.987091064453125, 2.111572265625, 2.236053466796875, 2.36053466796875, 2.485015869140625, 2.6094970703125, 2.733978271484375, 2.85845947265625, 2.982940673828125, 3.107421875]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 8.0, 7.0, 17.0, 24.0, 34.0, 42.0, 55.0, 97.0, 126.0, 181.0, 259.0, 436.0, 700.0, 964.0, 1486.0, 2193.0, 3566.0, 5240.0, 7883.0, 12394.0, 18870.0, 29960.0, 48103.0, 79242.0, 130807.0, 189554.0, 185644.0, 126514.0, 76409.0, 46147.0, 28569.0, 18474.0, 11921.0, 7697.0, 5079.0, 3394.0, 2172.0, 1447.0, 968.0, 640.0, 412.0, 266.0, 181.0, 135.0, 73.0, 62.0, 39.0, 28.0, 14.0, 8.0, 10.0, 6.0, 3.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.40380859375, -0.3907661437988281, -0.37772369384765625, -0.3646812438964844, -0.3516387939453125, -0.3385963439941406, -0.32555389404296875, -0.3125114440917969, -0.299468994140625, -0.2864265441894531, -0.27338409423828125, -0.2603416442871094, -0.2472991943359375, -0.23425674438476562, -0.22121429443359375, -0.20817184448242188, -0.19512939453125, -0.18208694458007812, -0.16904449462890625, -0.15600204467773438, -0.1429595947265625, -0.12991714477539062, -0.11687469482421875, -0.10383224487304688, -0.090789794921875, -0.07774734497070312, -0.06470489501953125, -0.051662445068359375, -0.0386199951171875, -0.025577545166015625, -0.01253509521484375, 0.000507354736328125, 0.0135498046875, 0.026592254638671875, 0.03963470458984375, 0.052677154541015625, 0.0657196044921875, 0.07876205444335938, 0.09180450439453125, 0.10484695434570312, 0.117889404296875, 0.13093185424804688, 0.14397430419921875, 0.15701675415039062, 0.1700592041015625, 0.18310165405273438, 0.19614410400390625, 0.20918655395507812, 0.22222900390625, 0.23527145385742188, 0.24831390380859375, 0.2613563537597656, 0.2743988037109375, 0.2874412536621094, 0.30048370361328125, 0.3135261535644531, 0.326568603515625, 0.3396110534667969, 0.35265350341796875, 0.3656959533691406, 0.3787384033203125, 0.3917808532714844, 0.40482330322265625, 0.4178657531738281, 0.430908203125]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 5.0, 5.0, 8.0, 10.0, 6.0, 8.0, 11.0, 14.0, 24.0, 23.0, 20.0, 28.0, 23.0, 34.0, 19.0, 35.0, 40.0, 37.0, 27.0, 51.0, 35.0, 42.0, 1057.0, 52.0, 43.0, 35.0, 45.0, 45.0, 34.0, 31.0, 17.0, 25.0, 23.0, 24.0, 18.0, 13.0, 8.0, 8.0, 9.0, 8.0, 7.0, 4.0, 4.0, 2.0, 4.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0], "bins": [-2.517578125, -2.441436767578125, -2.36529541015625, -2.289154052734375, -2.2130126953125, -2.136871337890625, -2.06072998046875, -1.984588623046875, -1.908447265625, -1.832305908203125, -1.75616455078125, -1.680023193359375, -1.6038818359375, -1.527740478515625, -1.45159912109375, -1.375457763671875, -1.29931640625, -1.223175048828125, -1.14703369140625, -1.070892333984375, -0.9947509765625, -0.918609619140625, -0.84246826171875, -0.766326904296875, -0.690185546875, -0.614044189453125, -0.53790283203125, -0.461761474609375, -0.3856201171875, -0.309478759765625, -0.23333740234375, -0.157196044921875, -0.0810546875, -0.004913330078125, 0.07122802734375, 0.147369384765625, 0.2235107421875, 0.299652099609375, 0.37579345703125, 0.451934814453125, 0.528076171875, 0.604217529296875, 0.68035888671875, 0.756500244140625, 0.8326416015625, 0.908782958984375, 0.98492431640625, 1.061065673828125, 1.13720703125, 1.213348388671875, 1.28948974609375, 1.365631103515625, 1.4417724609375, 1.517913818359375, 1.59405517578125, 1.670196533203125, 1.746337890625, 1.822479248046875, 1.89862060546875, 1.974761962890625, 2.0509033203125, 2.127044677734375, 2.20318603515625, 2.279327392578125, 2.35546875]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 6.0, 8.0, 13.0, 15.0, 38.0, 39.0, 56.0, 100.0, 165.0, 221.0, 363.0, 573.0, 944.0, 1583.0, 2718.0, 4609.0, 8053.0, 14289.0, 25237.0, 46155.0, 85369.0, 149664.0, 1260436.0, 201090.0, 131265.0, 73158.0, 39574.0, 22006.0, 12400.0, 6987.0, 4121.0, 2335.0, 1389.0, 789.0, 498.0, 343.0, 179.0, 112.0, 85.0, 42.0, 31.0, 19.0, 17.0, 20.0, 9.0, 5.0, 5.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.35986328125, -0.34781646728515625, -0.3357696533203125, -0.32372283935546875, -0.311676025390625, -0.29962921142578125, -0.2875823974609375, -0.27553558349609375, -0.26348876953125, -0.25144195556640625, -0.2393951416015625, -0.22734832763671875, -0.215301513671875, -0.20325469970703125, -0.1912078857421875, -0.17916107177734375, -0.1671142578125, -0.15506744384765625, -0.1430206298828125, -0.13097381591796875, -0.118927001953125, -0.10688018798828125, -0.0948333740234375, -0.08278656005859375, -0.07073974609375, -0.05869293212890625, -0.0466461181640625, -0.03459930419921875, -0.022552490234375, -0.01050567626953125, 0.0015411376953125, 0.01358795166015625, 0.025634765625, 0.03768157958984375, 0.0497283935546875, 0.06177520751953125, 0.073822021484375, 0.08586883544921875, 0.0979156494140625, 0.10996246337890625, 0.12200927734375, 0.13405609130859375, 0.1461029052734375, 0.15814971923828125, 0.170196533203125, 0.18224334716796875, 0.1942901611328125, 0.20633697509765625, 0.2183837890625, 0.23043060302734375, 0.2424774169921875, 0.25452423095703125, 0.266571044921875, 0.27861785888671875, 0.2906646728515625, 0.30271148681640625, 0.31475830078125, 0.32680511474609375, 0.3388519287109375, 0.35089874267578125, 0.362945556640625, 0.37499237060546875, 0.3870391845703125, 0.39908599853515625, 0.4111328125]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 8.0, 9.0, 10.0, 9.0, 17.0, 26.0, 23.0, 31.0, 28.0, 51.0, 56.0, 62.0, 73.0, 75.0, 56.0, 62.0, 57.0, 44.0, 59.0, 31.0, 43.0, 28.0, 30.0, 24.0, 14.0, 18.0, 16.0, 11.0, 12.0, 4.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011186599731445312, -0.0010768920183181763, -0.0010351240634918213, -0.0009933561086654663, -0.0009515881538391113, -0.0009098201990127563, -0.0008680522441864014, -0.0008262842893600464, -0.0007845163345336914, -0.0007427483797073364, -0.0007009804248809814, -0.0006592124700546265, -0.0006174445152282715, -0.0005756765604019165, -0.0005339086055755615, -0.0004921406507492065, -0.00045037269592285156, -0.0004086047410964966, -0.0003668367862701416, -0.0003250688314437866, -0.00028330087661743164, -0.00024153292179107666, -0.00019976496696472168, -0.0001579970121383667, -0.00011622905731201172, -7.446110248565674e-05, -3.269314765930176e-05, 9.074807167053223e-06, 5.08427619934082e-05, 9.261071681976318e-05, 0.00013437867164611816, 0.00017614662647247314, 0.00021791458129882812, 0.0002596825361251831, 0.0003014504909515381, 0.00034321844577789307, 0.00038498640060424805, 0.00042675435543060303, 0.000468522310256958, 0.000510290265083313, 0.000552058219909668, 0.000593826174736023, 0.0006355941295623779, 0.0006773620843887329, 0.0007191300392150879, 0.0007608979940414429, 0.0008026659488677979, 0.0008444339036941528, 0.0008862018585205078, 0.0009279698133468628, 0.0009697377681732178, 0.0010115057229995728, 0.0010532736778259277, 0.0010950416326522827, 0.0011368095874786377, 0.0011785775423049927, 0.0012203454971313477, 0.0012621134519577026, 0.0013038814067840576, 0.0013456493616104126, 0.0013874173164367676, 0.0014291852712631226, 0.0014709532260894775, 0.0015127211809158325, 0.0015544891357421875]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 2.0, 4.0, 9.0, 12.0, 10.0, 17.0, 22.0, 35.0, 38.0, 46.0, 81.0, 117.0, 164.0, 313.0, 731.0, 22462.0, 1019491.0, 3724.0, 532.0, 240.0, 159.0, 103.0, 69.0, 43.0, 32.0, 23.0, 18.0, 18.0, 5.0, 8.0, 5.0, 7.0, 3.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0282745361328125, -0.02737283706665039, -0.02647113800048828, -0.025569438934326172, -0.024667739868164062, -0.023766040802001953, -0.022864341735839844, -0.021962642669677734, -0.021060943603515625, -0.020159244537353516, -0.019257545471191406, -0.018355846405029297, -0.017454147338867188, -0.016552448272705078, -0.01565074920654297, -0.01474905014038086, -0.01384735107421875, -0.01294565200805664, -0.012043952941894531, -0.011142253875732422, -0.010240554809570312, -0.009338855743408203, -0.008437156677246094, -0.007535457611083984, -0.006633758544921875, -0.005732059478759766, -0.004830360412597656, -0.003928661346435547, -0.0030269622802734375, -0.002125263214111328, -0.0012235641479492188, -0.0003218650817871094, 0.000579833984375, 0.0014815330505371094, 0.0023832321166992188, 0.003284931182861328, 0.0041866302490234375, 0.005088329315185547, 0.005990028381347656, 0.006891727447509766, 0.007793426513671875, 0.008695125579833984, 0.009596824645996094, 0.010498523712158203, 0.011400222778320312, 0.012301921844482422, 0.013203620910644531, 0.01410531997680664, 0.01500701904296875, 0.01590871810913086, 0.01681041717529297, 0.017712116241455078, 0.018613815307617188, 0.019515514373779297, 0.020417213439941406, 0.021318912506103516, 0.022220611572265625, 0.023122310638427734, 0.024024009704589844, 0.024925708770751953, 0.025827407836914062, 0.026729106903076172, 0.02763080596923828, 0.02853250503540039, 0.0294342041015625]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 162.0, 854.0], "bins": [-0.027364365756511688, -0.026931503787636757, -0.026498641818761826, -0.026065779849886894, -0.025632917881011963, -0.025200054049491882, -0.02476719208061695, -0.02433433011174202, -0.02390146814286709, -0.023468606173992157, -0.023035744205117226, -0.022602882236242294, -0.022170020267367363, -0.02173715829849243, -0.02130429446697235, -0.02087143249809742, -0.02043857052922249, -0.020005708560347557, -0.019572846591472626, -0.019139984622597694, -0.018707122653722763, -0.018274258822202682, -0.01784139685332775, -0.01740853488445282, -0.01697567291557789, -0.016542810946702957, -0.016109948977828026, -0.015677087008953094, -0.015244224108755589, -0.014811362139880657, -0.014378500171005726, -0.01394563727080822, -0.013512775301933289, -0.013079913333058357, -0.012647051364183426, -0.01221418846398592, -0.011781326495110989, -0.011348464526236057, -0.010915602557361126, -0.01048273965716362, -0.010049878619611263, -0.009617016650736332, -0.0091841546818614, -0.008751291781663895, -0.008318429812788963, -0.007885567843914032, -0.007452705875039101, -0.007019843440502882, -0.006586981005966663, -0.006154119037091732, -0.005721256602555513, -0.005288394633680582, -0.004855532199144363, -0.004422670230269432, -0.003989808261394501, -0.003556945826858282, -0.003124083625152707, -0.002691221423447132, -0.002258359221741557, -0.001825497136451304, -0.001392634934745729, -0.0009597728494554758, -0.0005269106477499008, -9.404844604432583e-05, 0.0003388137847650796]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 4.0, 4.0, 8.0, 3.0, 8.0, 11.0, 16.0, 24.0, 26.0, 19.0, 32.0, 34.0, 55.0, 37.0, 56.0, 42.0, 45.0, 49.0, 58.0, 38.0, 65.0, 53.0, 53.0, 31.0, 42.0, 35.0, 29.0, 23.0, 29.0, 21.0, 14.0, 17.0, 9.0, 7.0, 5.0, 6.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005638003349304199, -0.0005384916439652443, -0.0005131829530000687, -0.00048787426203489304, -0.0004625655710697174, -0.0004372568801045418, -0.00041194818913936615, -0.0003866394981741905, -0.0003613308072090149, -0.00033602211624383926, -0.00031071342527866364, -0.000285404734313488, -0.0002600960433483124, -0.00023478735238313675, -0.00020947866141796112, -0.0001841699704527855, -0.00015886127948760986, -0.00013355258852243423, -0.0001082438975572586, -8.293520659208298e-05, -5.762651562690735e-05, -3.231782466173172e-05, -7.009133696556091e-06, 1.8299557268619537e-05, 4.3608248233795166e-05, 6.89169391989708e-05, 9.422563016414642e-05, 0.00011953432112932205, 0.00014484301209449768, 0.0001701517030596733, 0.00019546039402484894, 0.00022076908499002457, 0.0002460777759552002, 0.0002713864669203758, 0.00029669515788555145, 0.0003220038488507271, 0.0003473125398159027, 0.00037262123078107834, 0.00039792992174625397, 0.0004232386127114296, 0.0004485473036766052, 0.00047385599464178085, 0.0004991646856069565, 0.0005244733765721321, 0.0005497820675373077, 0.0005750907585024834, 0.000600399449467659, 0.0006257081404328346, 0.0006510168313980103, 0.0006763255223631859, 0.0007016342133283615, 0.0007269429042935371, 0.0007522515952587128, 0.0007775602862238884, 0.000802868977189064, 0.0008281776681542397, 0.0008534863591194153, 0.0008787950500845909, 0.0009041037410497665, 0.0009294124320149422, 0.0009547211229801178, 0.0009800298139452934, 0.001005338504910469, 0.0010306471958756447, 0.0010559558868408203]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 5.0, 2.0, 2.0, 5.0, 9.0, 5.0, 2.0, 5.0, 11.0, 12.0, 21.0, 23.0, 23.0, 21.0, 30.0, 29.0, 33.0, 26.0, 21.0, 34.0, 39.0, 45.0, 50.0, 39.0, 41.0, 43.0, 43.0, 45.0, 37.0, 34.0, 29.0, 37.0, 38.0, 20.0, 21.0, 21.0, 18.0, 21.0, 13.0, 14.0, 5.0, 13.0, 7.0, 5.0, 2.0, 6.0, 3.0, 3.0, 3.0], "bins": [-4.859375, -4.734893798828125, -4.61041259765625, -4.485931396484375, -4.3614501953125, -4.236968994140625, -4.11248779296875, -3.988006591796875, -3.863525390625, -3.739044189453125, -3.61456298828125, -3.490081787109375, -3.3656005859375, -3.241119384765625, -3.11663818359375, -2.992156982421875, -2.86767578125, -2.743194580078125, -2.61871337890625, -2.494232177734375, -2.3697509765625, -2.245269775390625, -2.12078857421875, -1.996307373046875, -1.871826171875, -1.747344970703125, -1.62286376953125, -1.498382568359375, -1.3739013671875, -1.249420166015625, -1.12493896484375, -1.000457763671875, -0.8759765625, -0.751495361328125, -0.62701416015625, -0.502532958984375, -0.3780517578125, -0.253570556640625, -0.12908935546875, -0.004608154296875, 0.119873046875, 0.244354248046875, 0.36883544921875, 0.493316650390625, 0.6177978515625, 0.742279052734375, 0.86676025390625, 0.991241455078125, 1.11572265625, 1.240203857421875, 1.36468505859375, 1.489166259765625, 1.6136474609375, 1.738128662109375, 1.86260986328125, 1.987091064453125, 2.111572265625, 2.236053466796875, 2.36053466796875, 2.485015869140625, 2.6094970703125, 2.733978271484375, 2.85845947265625, 2.982940673828125, 3.107421875]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 5.0, 6.0, 7.0, 20.0, 27.0, 38.0, 52.0, 90.0, 135.0, 181.0, 303.0, 464.0, 690.0, 1112.0, 1639.0, 2829.0, 4329.0, 7318.0, 14322.0, 32804.0, 91854.0, 379489.0, 358623.0, 87578.0, 31636.0, 13922.0, 7313.0, 4348.0, 2597.0, 1685.0, 1081.0, 712.0, 473.0, 306.0, 205.0, 127.0, 77.0, 48.0, 26.0, 33.0, 11.0, 8.0, 8.0, 7.0, 6.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.666015625, -3.539520263671875, -3.41302490234375, -3.286529541015625, -3.1600341796875, -3.033538818359375, -2.90704345703125, -2.780548095703125, -2.654052734375, -2.527557373046875, -2.40106201171875, -2.274566650390625, -2.1480712890625, -2.021575927734375, -1.89508056640625, -1.768585205078125, -1.64208984375, -1.515594482421875, -1.38909912109375, -1.262603759765625, -1.1361083984375, -1.009613037109375, -0.88311767578125, -0.756622314453125, -0.630126953125, -0.503631591796875, -0.37713623046875, -0.250640869140625, -0.1241455078125, 0.002349853515625, 0.12884521484375, 0.255340576171875, 0.3818359375, 0.508331298828125, 0.63482666015625, 0.761322021484375, 0.8878173828125, 1.014312744140625, 1.14080810546875, 1.267303466796875, 1.393798828125, 1.520294189453125, 1.64678955078125, 1.773284912109375, 1.8997802734375, 2.026275634765625, 2.15277099609375, 2.279266357421875, 2.40576171875, 2.532257080078125, 2.65875244140625, 2.785247802734375, 2.9117431640625, 3.038238525390625, 3.16473388671875, 3.291229248046875, 3.417724609375, 3.544219970703125, 3.67071533203125, 3.797210693359375, 3.9237060546875, 4.050201416015625, 4.17669677734375, 4.303192138671875, 4.4296875]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 4.0, 1.0, 3.0, 5.0, 5.0, 11.0, 9.0, 14.0, 11.0, 9.0, 18.0, 14.0, 21.0, 27.0, 27.0, 34.0, 24.0, 36.0, 37.0, 34.0, 53.0, 59.0, 92.0, 300.0, 1595.0, 127.0, 85.0, 46.0, 48.0, 36.0, 44.0, 34.0, 36.0, 26.0, 22.0, 20.0, 11.0, 15.0, 12.0, 14.0, 6.0, 7.0, 2.0, 1.0, 6.0, 1.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-14.125, -13.712890625, -13.30078125, -12.888671875, -12.4765625, -12.064453125, -11.65234375, -11.240234375, -10.828125, -10.416015625, -10.00390625, -9.591796875, -9.1796875, -8.767578125, -8.35546875, -7.943359375, -7.53125, -7.119140625, -6.70703125, -6.294921875, -5.8828125, -5.470703125, -5.05859375, -4.646484375, -4.234375, -3.822265625, -3.41015625, -2.998046875, -2.5859375, -2.173828125, -1.76171875, -1.349609375, -0.9375, -0.525390625, -0.11328125, 0.298828125, 0.7109375, 1.123046875, 1.53515625, 1.947265625, 2.359375, 2.771484375, 3.18359375, 3.595703125, 4.0078125, 4.419921875, 4.83203125, 5.244140625, 5.65625, 6.068359375, 6.48046875, 6.892578125, 7.3046875, 7.716796875, 8.12890625, 8.541015625, 8.953125, 9.365234375, 9.77734375, 10.189453125, 10.6015625, 11.013671875, 11.42578125, 11.837890625, 12.25]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 5.0, 9.0, 3.0, 4.0, 4.0, 7.0, 18.0, 19.0, 26.0, 31.0, 49.0, 82.0, 134.0, 214.0, 345.0, 1069.0, 15103.0, 3053943.0, 71105.0, 2256.0, 477.0, 269.0, 157.0, 112.0, 61.0, 47.0, 35.0, 37.0, 19.0, 20.0, 15.0, 9.0, 7.0, 7.0, 6.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.40625, -34.32275390625, -33.2392578125, -32.15576171875, -31.072265625, -29.98876953125, -28.9052734375, -27.82177734375, -26.73828125, -25.65478515625, -24.5712890625, -23.48779296875, -22.404296875, -21.32080078125, -20.2373046875, -19.15380859375, -18.0703125, -16.98681640625, -15.9033203125, -14.81982421875, -13.736328125, -12.65283203125, -11.5693359375, -10.48583984375, -9.40234375, -8.31884765625, -7.2353515625, -6.15185546875, -5.068359375, -3.98486328125, -2.9013671875, -1.81787109375, -0.734375, 0.34912109375, 1.4326171875, 2.51611328125, 3.599609375, 4.68310546875, 5.7666015625, 6.85009765625, 7.93359375, 9.01708984375, 10.1005859375, 11.18408203125, 12.267578125, 13.35107421875, 14.4345703125, 15.51806640625, 16.6015625, 17.68505859375, 18.7685546875, 19.85205078125, 20.935546875, 22.01904296875, 23.1025390625, 24.18603515625, 25.26953125, 26.35302734375, 27.4365234375, 28.52001953125, 29.603515625, 30.68701171875, 31.7705078125, 32.85400390625, 33.9375]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 7.0, 21.0, 88.0, 232.0, 316.0, 228.0, 94.0, 26.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.308319091796875, -5.9836273193359375, -4.658935546875, -3.3342432975769043, -2.009551525115967, -0.6848597526550293, 0.6398324966430664, 1.964524269104004, 3.2892160415649414, 4.613907814025879, 5.938599586486816, 7.263291835784912, 8.587984085083008, 9.912675857543945, 11.237367630004883, 12.56205940246582, 13.886751174926758, 15.211442947387695, 16.536134719848633, 17.86082649230957, 19.185518264770508, 20.510210037231445, 21.834903717041016, 23.159595489501953, 24.48428726196289, 25.808979034423828, 27.133670806884766, 28.458362579345703, 29.78305435180664, 31.107746124267578, 32.432437896728516, 33.75712966918945, 35.08182144165039, 36.40651321411133, 37.731204986572266, 39.0558967590332, 40.38058853149414, 41.70528030395508, 43.029972076416016, 44.35466384887695, 45.67935562133789, 47.00404739379883, 48.328739166259766, 49.6534309387207, 50.97812271118164, 52.30281448364258, 53.627506256103516, 54.95219802856445, 56.276893615722656, 57.601585388183594, 58.92627716064453, 60.25096893310547, 61.575660705566406, 62.900352478027344, 64.22504425048828, 65.54973602294922, 66.87442779541016, 68.1991195678711, 69.52381134033203, 70.84850311279297, 72.1731948852539, 73.49788665771484, 74.82257843017578, 76.14727020263672, 77.47196197509766]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 2.0, 4.0, 2.0, 8.0, 7.0, 18.0, 16.0, 22.0, 19.0, 19.0, 25.0, 27.0, 29.0, 28.0, 19.0, 37.0, 33.0, 37.0, 30.0, 46.0, 34.0, 36.0, 38.0, 45.0, 41.0, 36.0, 34.0, 35.0, 35.0, 33.0, 19.0, 28.0, 29.0, 17.0, 17.0, 16.0, 20.0, 11.0, 14.0, 4.0, 6.0, 8.0, 4.0, 6.0, 3.0, 6.0, 1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.70394515991211, -34.50711441040039, -33.31028366088867, -32.11345291137695, -30.9166202545166, -29.719789505004883, -28.52295684814453, -27.326126098632812, -26.129295349121094, -24.932464599609375, -23.735633850097656, -22.538801193237305, -21.341970443725586, -20.145139694213867, -18.948307037353516, -17.751476287841797, -16.554645538330078, -15.35781478881836, -14.160983085632324, -12.964151382446289, -11.76732063293457, -10.570489883422852, -9.373658180236816, -8.176826477050781, -6.9799957275390625, -5.7831645011901855, -4.586333274841309, -3.3895020484924316, -2.1926708221435547, -0.9958395957946777, 0.20099163055419922, 1.3978233337402344, 2.5946578979492188, 3.7914891242980957, 4.988320350646973, 6.18515157699585, 7.381982803344727, 8.578813552856445, 9.77564525604248, 10.972476959228516, 12.169307708740234, 13.366138458251953, 14.562970161437988, 15.759801864624023, 16.956632614135742, 18.15346336364746, 19.350296020507812, 20.54712677001953, 21.74395751953125, 22.94078826904297, 24.137619018554688, 25.33445167541504, 26.531282424926758, 27.728113174438477, 28.924945831298828, 30.121776580810547, 31.318607330322266, 32.515438079833984, 33.7122688293457, 34.90909957885742, 36.105934143066406, 37.302764892578125, 38.499595642089844, 39.69642639160156, 40.89325714111328]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 3.0, 5.0, 4.0, 5.0, 3.0, 6.0, 8.0, 12.0, 16.0, 14.0, 19.0, 20.0, 34.0, 27.0, 27.0, 36.0, 38.0, 28.0, 31.0, 43.0, 38.0, 49.0, 54.0, 54.0, 38.0, 40.0, 31.0, 32.0, 41.0, 33.0, 33.0, 30.0, 24.0, 20.0, 26.0, 18.0, 13.0, 12.0, 7.0, 7.0, 7.0, 5.0, 4.0, 6.0, 3.0, 1.0, 4.0], "bins": [-5.26171875, -5.128204345703125, -4.99468994140625, -4.861175537109375, -4.7276611328125, -4.594146728515625, -4.46063232421875, -4.327117919921875, -4.193603515625, -4.060089111328125, -3.92657470703125, -3.793060302734375, -3.6595458984375, -3.526031494140625, -3.39251708984375, -3.259002685546875, -3.12548828125, -2.991973876953125, -2.85845947265625, -2.724945068359375, -2.5914306640625, -2.457916259765625, -2.32440185546875, -2.190887451171875, -2.057373046875, -1.923858642578125, -1.79034423828125, -1.656829833984375, -1.5233154296875, -1.389801025390625, -1.25628662109375, -1.122772216796875, -0.9892578125, -0.855743408203125, -0.72222900390625, -0.588714599609375, -0.4552001953125, -0.321685791015625, -0.18817138671875, -0.054656982421875, 0.078857421875, 0.212371826171875, 0.34588623046875, 0.479400634765625, 0.6129150390625, 0.746429443359375, 0.87994384765625, 1.013458251953125, 1.14697265625, 1.280487060546875, 1.41400146484375, 1.547515869140625, 1.6810302734375, 1.814544677734375, 1.94805908203125, 2.081573486328125, 2.215087890625, 2.348602294921875, 2.48211669921875, 2.615631103515625, 2.7491455078125, 2.882659912109375, 3.01617431640625, 3.149688720703125, 3.283203125]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 8.0, 13.0, 17.0, 19.0, 27.0, 31.0, 56.0, 121.0, 157.0, 293.0, 524.0, 1056.0, 2179.0, 4934.0, 12340.0, 31836.0, 93180.0, 329710.0, 1084018.0, 1573201.0, 746667.0, 211548.0, 63907.0, 22695.0, 8924.0, 3631.0, 1560.0, 712.0, 374.0, 212.0, 98.0, 84.0, 60.0, 30.0, 20.0, 18.0, 12.0, 4.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.61328125, -6.43609619140625, -6.2589111328125, -6.08172607421875, -5.904541015625, -5.72735595703125, -5.5501708984375, -5.37298583984375, -5.19580078125, -5.01861572265625, -4.8414306640625, -4.66424560546875, -4.487060546875, -4.30987548828125, -4.1326904296875, -3.95550537109375, -3.7783203125, -3.60113525390625, -3.4239501953125, -3.24676513671875, -3.069580078125, -2.89239501953125, -2.7152099609375, -2.53802490234375, -2.36083984375, -2.18365478515625, -2.0064697265625, -1.82928466796875, -1.652099609375, -1.47491455078125, -1.2977294921875, -1.12054443359375, -0.943359375, -0.76617431640625, -0.5889892578125, -0.41180419921875, -0.234619140625, -0.05743408203125, 0.1197509765625, 0.29693603515625, 0.47412109375, 0.65130615234375, 0.8284912109375, 1.00567626953125, 1.182861328125, 1.36004638671875, 1.5372314453125, 1.71441650390625, 1.8916015625, 2.06878662109375, 2.2459716796875, 2.42315673828125, 2.600341796875, 2.77752685546875, 2.9547119140625, 3.13189697265625, 3.30908203125, 3.48626708984375, 3.6634521484375, 3.84063720703125, 4.017822265625, 4.19500732421875, 4.3721923828125, 4.54937744140625, 4.7265625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 1.0, 9.0, 3.0, 8.0, 8.0, 6.0, 24.0, 31.0, 26.0, 39.0, 60.0, 68.0, 99.0, 148.0, 191.0, 230.0, 306.0, 362.0, 420.0, 392.0, 388.0, 277.0, 210.0, 194.0, 135.0, 114.0, 79.0, 72.0, 51.0, 34.0, 22.0, 15.0, 17.0, 11.0, 7.0, 3.0, 7.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.7265625, -10.3919677734375, -10.057373046875, -9.7227783203125, -9.38818359375, -9.0535888671875, -8.718994140625, -8.3843994140625, -8.0498046875, -7.7152099609375, -7.380615234375, -7.0460205078125, -6.71142578125, -6.3768310546875, -6.042236328125, -5.7076416015625, -5.373046875, -5.0384521484375, -4.703857421875, -4.3692626953125, -4.03466796875, -3.7000732421875, -3.365478515625, -3.0308837890625, -2.6962890625, -2.3616943359375, -2.027099609375, -1.6925048828125, -1.35791015625, -1.0233154296875, -0.688720703125, -0.3541259765625, -0.01953125, 0.3150634765625, 0.649658203125, 0.9842529296875, 1.31884765625, 1.6534423828125, 1.988037109375, 2.3226318359375, 2.6572265625, 2.9918212890625, 3.326416015625, 3.6610107421875, 3.99560546875, 4.3302001953125, 4.664794921875, 4.9993896484375, 5.333984375, 5.6685791015625, 6.003173828125, 6.3377685546875, 6.67236328125, 7.0069580078125, 7.341552734375, 7.6761474609375, 8.0107421875, 8.3453369140625, 8.679931640625, 9.0145263671875, 9.34912109375, 9.6837158203125, 10.018310546875, 10.3529052734375, 10.6875]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 3.0, 4.0, 2.0, 13.0, 12.0, 15.0, 20.0, 35.0, 44.0, 52.0, 75.0, 120.0, 117.0, 253.0, 532.0, 1979.0, 27546.0, 1966963.0, 2162929.0, 30206.0, 2148.0, 504.0, 217.0, 141.0, 99.0, 77.0, 46.0, 31.0, 21.0, 24.0, 7.0, 14.0, 10.0, 9.0, 8.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.25, -36.15478515625, -35.0595703125, -33.96435546875, -32.869140625, -31.77392578125, -30.6787109375, -29.58349609375, -28.48828125, -27.39306640625, -26.2978515625, -25.20263671875, -24.107421875, -23.01220703125, -21.9169921875, -20.82177734375, -19.7265625, -18.63134765625, -17.5361328125, -16.44091796875, -15.345703125, -14.25048828125, -13.1552734375, -12.06005859375, -10.96484375, -9.86962890625, -8.7744140625, -7.67919921875, -6.583984375, -5.48876953125, -4.3935546875, -3.29833984375, -2.203125, -1.10791015625, -0.0126953125, 1.08251953125, 2.177734375, 3.27294921875, 4.3681640625, 5.46337890625, 6.55859375, 7.65380859375, 8.7490234375, 9.84423828125, 10.939453125, 12.03466796875, 13.1298828125, 14.22509765625, 15.3203125, 16.41552734375, 17.5107421875, 18.60595703125, 19.701171875, 20.79638671875, 21.8916015625, 22.98681640625, 24.08203125, 25.17724609375, 26.2724609375, 27.36767578125, 28.462890625, 29.55810546875, 30.6533203125, 31.74853515625, 32.84375]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 12.0, 30.0, 32.0, 67.0, 111.0, 134.0, 181.0, 174.0, 110.0, 85.0, 38.0, 18.0, 8.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-117.48446655273438, -115.06231689453125, -112.64017486572266, -110.21802520751953, -107.79588317871094, -105.37373352050781, -102.95158386230469, -100.5294418334961, -98.10729217529297, -95.68514251708984, -93.26300048828125, -90.84085083007812, -88.41870880126953, -85.9965591430664, -83.57441711425781, -81.15226745605469, -78.73011779785156, -76.30796813964844, -73.88582611083984, -71.46367645263672, -69.04153442382812, -66.619384765625, -64.19723510742188, -61.77509307861328, -59.35295104980469, -56.93080520629883, -54.50865936279297, -52.086509704589844, -49.664363861083984, -47.242218017578125, -44.820072174072266, -42.397926330566406, -39.97577667236328, -37.55363082885742, -35.13148498535156, -32.70933532714844, -30.287189483642578, -27.86504364013672, -25.44289779663086, -23.020750045776367, -20.598604202270508, -18.17645835876465, -15.754310607910156, -13.332164764404297, -10.910017967224121, -8.487871170043945, -6.065725326538086, -3.6435775756835938, -1.2214317321777344, 1.2007148265838623, 3.622861385345459, 6.045007705688477, 8.467154502868652, 10.889301300048828, 13.311447143554688, 15.73359489440918, 18.15574073791504, 20.5778865814209, 23.00003433227539, 25.42218017578125, 27.84432601928711, 30.2664737701416, 32.688621520996094, 35.11076736450195, 37.53291320800781]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 7.0, 4.0, 7.0, 12.0, 9.0, 12.0, 15.0, 15.0, 27.0, 20.0, 21.0, 29.0, 29.0, 30.0, 36.0, 42.0, 46.0, 49.0, 34.0, 37.0, 55.0, 39.0, 37.0, 39.0, 48.0, 28.0, 30.0, 39.0, 32.0, 23.0, 27.0, 20.0, 16.0, 13.0, 18.0, 16.0, 16.0, 10.0, 8.0, 7.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-40.1024169921875, -38.86738967895508, -37.63235855102539, -36.39733123779297, -35.16230010986328, -33.92727279663086, -32.69224548339844, -31.45721435546875, -30.222187042236328, -28.987157821655273, -27.75212860107422, -26.517101287841797, -25.282072067260742, -24.047042846679688, -22.812013626098633, -21.576984405517578, -20.341955184936523, -19.10692596435547, -17.871896743774414, -16.63686752319336, -15.401840209960938, -14.166810989379883, -12.931781768798828, -11.69675350189209, -10.461724281311035, -9.22669506072998, -7.991666793823242, -6.7566375732421875, -5.521608829498291, -4.2865800857543945, -3.05155086517334, -1.8165225982666016, -0.5814933776855469, 0.6535354852676392, 1.8885643482208252, 3.123593330383301, 4.358622074127197, 5.593650817871094, 6.828680038452148, 8.063708305358887, 9.298737525939941, 10.533766746520996, 11.768795013427734, 13.003824234008789, 14.238853454589844, 15.473881721496582, 16.708911895751953, 17.943939208984375, 19.17896842956543, 20.413997650146484, 21.64902687072754, 22.884056091308594, 24.119083404541016, 25.35411262512207, 26.589141845703125, 27.824169158935547, 29.059200286865234, 30.29422950744629, 31.529258728027344, 32.764286041259766, 33.99931716918945, 35.234344482421875, 36.46937561035156, 37.704402923583984, 38.939430236816406]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 5.0, 1.0, 4.0, 4.0, 7.0, 11.0, 13.0, 5.0, 15.0, 28.0, 23.0, 25.0, 35.0, 36.0, 31.0, 36.0, 35.0, 35.0, 33.0, 45.0, 50.0, 52.0, 45.0, 43.0, 48.0, 52.0, 34.0, 34.0, 33.0, 37.0, 24.0, 23.0, 19.0, 11.0, 12.0, 13.0, 13.0, 10.0, 9.0, 10.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0], "bins": [-5.78125, -5.633636474609375, -5.48602294921875, -5.338409423828125, -5.1907958984375, -5.043182373046875, -4.89556884765625, -4.747955322265625, -4.600341796875, -4.452728271484375, -4.30511474609375, -4.157501220703125, -4.0098876953125, -3.862274169921875, -3.71466064453125, -3.567047119140625, -3.41943359375, -3.271820068359375, -3.12420654296875, -2.976593017578125, -2.8289794921875, -2.681365966796875, -2.53375244140625, -2.386138916015625, -2.238525390625, -2.090911865234375, -1.94329833984375, -1.795684814453125, -1.6480712890625, -1.500457763671875, -1.35284423828125, -1.205230712890625, -1.0576171875, -0.910003662109375, -0.76239013671875, -0.614776611328125, -0.4671630859375, -0.319549560546875, -0.17193603515625, -0.024322509765625, 0.123291015625, 0.270904541015625, 0.41851806640625, 0.566131591796875, 0.7137451171875, 0.861358642578125, 1.00897216796875, 1.156585693359375, 1.30419921875, 1.451812744140625, 1.59942626953125, 1.747039794921875, 1.8946533203125, 2.042266845703125, 2.18988037109375, 2.337493896484375, 2.485107421875, 2.632720947265625, 2.78033447265625, 2.927947998046875, 3.0755615234375, 3.223175048828125, 3.37078857421875, 3.518402099609375, 3.666015625]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 5.0, 7.0, 17.0, 14.0, 27.0, 30.0, 40.0, 84.0, 133.0, 194.0, 267.0, 413.0, 655.0, 1001.0, 1514.0, 2380.0, 3773.0, 6036.0, 9738.0, 15785.0, 26294.0, 44957.0, 77196.0, 134421.0, 207793.0, 203293.0, 128703.0, 74086.0, 43523.0, 25194.0, 15367.0, 9331.0, 5810.0, 3715.0, 2268.0, 1572.0, 1005.0, 616.0, 423.0, 298.0, 190.0, 122.0, 88.0, 70.0, 37.0, 25.0, 19.0, 9.0, 8.0, 5.0, 6.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.5546875, -0.5383567810058594, -0.5220260620117188, -0.5056953430175781, -0.4893646240234375, -0.4730339050292969, -0.45670318603515625, -0.4403724670410156, -0.424041748046875, -0.4077110290527344, -0.39138031005859375, -0.3750495910644531, -0.3587188720703125, -0.3423881530761719, -0.32605743408203125, -0.3097267150878906, -0.29339599609375, -0.2770652770996094, -0.26073455810546875, -0.24440383911132812, -0.2280731201171875, -0.21174240112304688, -0.19541168212890625, -0.17908096313476562, -0.162750244140625, -0.14641952514648438, -0.13008880615234375, -0.11375808715820312, -0.0974273681640625, -0.08109664916992188, -0.06476593017578125, -0.048435211181640625, -0.0321044921875, -0.015773773193359375, 0.00055694580078125, 0.016887664794921875, 0.0332183837890625, 0.049549102783203125, 0.06587982177734375, 0.08221054077148438, 0.098541259765625, 0.11487197875976562, 0.13120269775390625, 0.14753341674804688, 0.1638641357421875, 0.18019485473632812, 0.19652557373046875, 0.21285629272460938, 0.22918701171875, 0.24551773071289062, 0.26184844970703125, 0.2781791687011719, 0.2945098876953125, 0.3108406066894531, 0.32717132568359375, 0.3435020446777344, 0.359832763671875, 0.3761634826660156, 0.39249420166015625, 0.4088249206542969, 0.4251556396484375, 0.4414863586425781, 0.45781707763671875, 0.4741477966308594, 0.490478515625]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 3.0, 3.0, 5.0, 9.0, 5.0, 9.0, 11.0, 9.0, 24.0, 16.0, 21.0, 18.0, 21.0, 28.0, 22.0, 21.0, 33.0, 35.0, 37.0, 36.0, 35.0, 42.0, 38.0, 1058.0, 42.0, 47.0, 34.0, 28.0, 24.0, 31.0, 39.0, 27.0, 32.0, 20.0, 24.0, 22.0, 19.0, 11.0, 16.0, 12.0, 10.0, 11.0, 7.0, 12.0, 8.0, 4.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0], "bins": [-2.728515625, -2.6475830078125, -2.566650390625, -2.4857177734375, -2.40478515625, -2.3238525390625, -2.242919921875, -2.1619873046875, -2.0810546875, -2.0001220703125, -1.919189453125, -1.8382568359375, -1.75732421875, -1.6763916015625, -1.595458984375, -1.5145263671875, -1.43359375, -1.3526611328125, -1.271728515625, -1.1907958984375, -1.10986328125, -1.0289306640625, -0.947998046875, -0.8670654296875, -0.7861328125, -0.7052001953125, -0.624267578125, -0.5433349609375, -0.46240234375, -0.3814697265625, -0.300537109375, -0.2196044921875, -0.138671875, -0.0577392578125, 0.023193359375, 0.1041259765625, 0.18505859375, 0.2659912109375, 0.346923828125, 0.4278564453125, 0.5087890625, 0.5897216796875, 0.670654296875, 0.7515869140625, 0.83251953125, 0.9134521484375, 0.994384765625, 1.0753173828125, 1.15625, 1.2371826171875, 1.318115234375, 1.3990478515625, 1.47998046875, 1.5609130859375, 1.641845703125, 1.7227783203125, 1.8037109375, 1.8846435546875, 1.965576171875, 2.0465087890625, 2.12744140625, 2.2083740234375, 2.289306640625, 2.3702392578125, 2.451171875]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 6.0, 3.0, 8.0, 12.0, 26.0, 39.0, 57.0, 77.0, 107.0, 148.0, 257.0, 396.0, 651.0, 877.0, 1532.0, 2418.0, 4068.0, 6662.0, 11112.0, 18745.0, 31688.0, 54881.0, 95154.0, 154544.0, 1249419.0, 179063.0, 118224.0, 69401.0, 39824.0, 23173.0, 13494.0, 8187.0, 4920.0, 2959.0, 1846.0, 1102.0, 759.0, 441.0, 296.0, 204.0, 123.0, 74.0, 45.0, 41.0, 28.0, 16.0, 9.0, 7.0, 6.0, 4.0, 2.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.328369140625, -0.3165168762207031, -0.30466461181640625, -0.2928123474121094, -0.2809600830078125, -0.2691078186035156, -0.25725555419921875, -0.24540328979492188, -0.233551025390625, -0.22169876098632812, -0.20984649658203125, -0.19799423217773438, -0.1861419677734375, -0.17428970336914062, -0.16243743896484375, -0.15058517456054688, -0.13873291015625, -0.12688064575195312, -0.11502838134765625, -0.10317611694335938, -0.0913238525390625, -0.07947158813476562, -0.06761932373046875, -0.055767059326171875, -0.043914794921875, -0.032062530517578125, -0.02021026611328125, -0.008358001708984375, 0.0034942626953125, 0.015346527099609375, 0.02719879150390625, 0.039051055908203125, 0.0509033203125, 0.06275558471679688, 0.07460784912109375, 0.08646011352539062, 0.0983123779296875, 0.11016464233398438, 0.12201690673828125, 0.13386917114257812, 0.145721435546875, 0.15757369995117188, 0.16942596435546875, 0.18127822875976562, 0.1931304931640625, 0.20498275756835938, 0.21683502197265625, 0.22868728637695312, 0.24053955078125, 0.2523918151855469, 0.26424407958984375, 0.2760963439941406, 0.2879486083984375, 0.2998008728027344, 0.31165313720703125, 0.3235054016113281, 0.335357666015625, 0.3472099304199219, 0.35906219482421875, 0.3709144592285156, 0.3827667236328125, 0.3946189880371094, 0.40647125244140625, 0.4183235168457031, 0.43017578125]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 4.0, 5.0, 2.0, 4.0, 5.0, 11.0, 12.0, 9.0, 22.0, 23.0, 31.0, 32.0, 32.0, 41.0, 49.0, 60.0, 49.0, 65.0, 78.0, 63.0, 54.0, 52.0, 45.0, 47.0, 33.0, 29.0, 36.0, 20.0, 15.0, 14.0, 21.0, 7.0, 8.0, 7.0, 5.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0013685226440429688, -0.0013308972120285034, -0.001293271780014038, -0.0012556463479995728, -0.0012180209159851074, -0.001180395483970642, -0.0011427700519561768, -0.0011051446199417114, -0.001067519187927246, -0.0010298937559127808, -0.0009922683238983154, -0.0009546428918838501, -0.0009170174598693848, -0.0008793920278549194, -0.0008417665958404541, -0.0008041411638259888, -0.0007665157318115234, -0.0007288902997970581, -0.0006912648677825928, -0.0006536394357681274, -0.0006160140037536621, -0.0005783885717391968, -0.0005407631397247314, -0.0005031377077102661, -0.0004655122756958008, -0.00042788684368133545, -0.0003902614116668701, -0.0003526359796524048, -0.00031501054763793945, -0.0002773851156234741, -0.0002397596836090088, -0.00020213425159454346, -0.00016450881958007812, -0.0001268833875656128, -8.925795555114746e-05, -5.163252353668213e-05, -1.4007091522216797e-05, 2.3618340492248535e-05, 6.124377250671387e-05, 9.88692045211792e-05, 0.00013649463653564453, 0.00017412006855010986, 0.0002117455005645752, 0.00024937093257904053, 0.00028699636459350586, 0.0003246217966079712, 0.0003622472286224365, 0.00039987266063690186, 0.0004374980926513672, 0.0004751235246658325, 0.0005127489566802979, 0.0005503743886947632, 0.0005879998207092285, 0.0006256252527236938, 0.0006632506847381592, 0.0007008761167526245, 0.0007385015487670898, 0.0007761269807815552, 0.0008137524127960205, 0.0008513778448104858, 0.0008890032768249512, 0.0009266287088394165, 0.0009642541408538818, 0.0010018795728683472, 0.0010395050048828125]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 3.0, 7.0, 4.0, 4.0, 8.0, 4.0, 14.0, 16.0, 20.0, 15.0, 19.0, 42.0, 40.0, 61.0, 83.0, 104.0, 190.0, 319.0, 527.0, 2227.0, 356925.0, 682796.0, 3490.0, 637.0, 324.0, 188.0, 139.0, 80.0, 65.0, 47.0, 49.0, 28.0, 20.0, 12.0, 9.0, 7.0, 8.0, 5.0, 6.0, 5.0, 1.0, 3.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0224609375, -0.02178192138671875, -0.0211029052734375, -0.02042388916015625, -0.019744873046875, -0.01906585693359375, -0.0183868408203125, -0.01770782470703125, -0.01702880859375, -0.01634979248046875, -0.0156707763671875, -0.01499176025390625, -0.014312744140625, -0.01363372802734375, -0.0129547119140625, -0.01227569580078125, -0.0115966796875, -0.01091766357421875, -0.0102386474609375, -0.00955963134765625, -0.008880615234375, -0.00820159912109375, -0.0075225830078125, -0.00684356689453125, -0.00616455078125, -0.00548553466796875, -0.0048065185546875, -0.00412750244140625, -0.003448486328125, -0.00276947021484375, -0.0020904541015625, -0.00141143798828125, -0.000732421875, -5.340576171875e-05, 0.0006256103515625, 0.00130462646484375, 0.001983642578125, 0.00266265869140625, 0.0033416748046875, 0.00402069091796875, 0.00469970703125, 0.00537872314453125, 0.0060577392578125, 0.00673675537109375, 0.007415771484375, 0.00809478759765625, 0.0087738037109375, 0.00945281982421875, 0.0101318359375, 0.01081085205078125, 0.0114898681640625, 0.01216888427734375, 0.012847900390625, 0.01352691650390625, 0.0142059326171875, 0.01488494873046875, 0.01556396484375, 0.01624298095703125, 0.0169219970703125, 0.01760101318359375, 0.018280029296875, 0.01895904541015625, 0.0196380615234375, 0.02031707763671875, 0.02099609375]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 9.0, 6.0, 10.0, 33.0, 52.0, 71.0, 101.0, 143.0, 140.0, 133.0, 136.0, 77.0, 49.0, 24.0, 16.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0010579447261989117, -0.0010209851898252964, -0.0009840256534516811, -0.0009470661170780659, -0.0009101065807044506, -0.0008731470443308353, -0.0008361875079572201, -0.0007992279715836048, -0.0007622684352099895, -0.0007253088988363743, -0.000688349362462759, -0.0006513898260891438, -0.0006144302897155285, -0.0005774707533419132, -0.000540511216968298, -0.0005035516805946827, -0.0004665920860134065, -0.00042963254963979125, -0.000392673013266176, -0.0003557134768925607, -0.00031875394051894546, -0.0002817944041453302, -0.00024483483866788447, -0.0002078753022942692, -0.00017091576592065394, -0.00013395622954703867, -9.69966858974658e-05, -6.0037142247892916e-05, -2.307760587427765e-05, 1.3881930499337614e-05, 5.084148142486811e-05, 8.780101779848337e-05, 0.00012476055417209864, 0.0001617200905457139, 0.00019867962691932917, 0.00023563917784485966, 0.0002725986996665597, 0.00030955823604017496, 0.0003465178015176207, 0.00038347733789123595, 0.0004204368742648512, 0.0004573964106384665, 0.0004943559761159122, 0.0005313155124895275, 0.0005682750488631427, 0.000605234585236758, 0.0006421941216103733, 0.0006791536579839885, 0.0007161131943576038, 0.000753072730731219, 0.0007900322671048343, 0.0008269918034784496, 0.0008639513398520648, 0.0009009108762256801, 0.0009378704708069563, 0.0009748300071805716, 0.0010117895435541868, 0.001048749079927802, 0.0010857086163014174, 0.0011226681526750326, 0.0011596276890486479, 0.0011965872254222631, 0.0012335467617958784, 0.0012705062981694937, 0.001307465834543109]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 5.0, 4.0, 6.0, 10.0, 13.0, 19.0, 15.0, 14.0, 34.0, 27.0, 19.0, 21.0, 34.0, 40.0, 36.0, 34.0, 44.0, 47.0, 41.0, 45.0, 51.0, 48.0, 31.0, 30.0, 43.0, 30.0, 40.0, 32.0, 29.0, 27.0, 21.0, 23.0, 19.0, 25.0, 8.0, 14.0, 9.0, 8.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0], "bins": [-0.0006729364395141602, -0.0006530098617076874, -0.0006330832839012146, -0.0006131567060947418, -0.000593230128288269, -0.0005733035504817963, -0.0005533769726753235, -0.0005334503948688507, -0.0005135238170623779, -0.0004935972392559052, -0.0004736706614494324, -0.0004537440836429596, -0.0004338175058364868, -0.00041389092803001404, -0.00039396435022354126, -0.0003740377724170685, -0.0003541111946105957, -0.0003341846168041229, -0.00031425803899765015, -0.00029433146119117737, -0.0002744048833847046, -0.0002544783055782318, -0.00023455172777175903, -0.00021462514996528625, -0.00019469857215881348, -0.0001747719943523407, -0.00015484541654586792, -0.00013491883873939514, -0.00011499226093292236, -9.506568312644958e-05, -7.51391053199768e-05, -5.521252751350403e-05, -3.528594970703125e-05, -1.535937190055847e-05, 4.567205905914307e-06, 2.4493783712387085e-05, 4.442036151885986e-05, 6.434693932533264e-05, 8.427351713180542e-05, 0.0001042000949382782, 0.00012412667274475098, 0.00014405325055122375, 0.00016397982835769653, 0.0001839064061641693, 0.0002038329839706421, 0.00022375956177711487, 0.00024368613958358765, 0.0002636127173900604, 0.0002835392951965332, 0.000303465873003006, 0.00032339245080947876, 0.00034331902861595154, 0.0003632456064224243, 0.0003831721842288971, 0.0004030987620353699, 0.00042302533984184265, 0.00044295191764831543, 0.0004628784954547882, 0.000482805073261261, 0.0005027316510677338, 0.0005226582288742065, 0.0005425848066806793, 0.0005625113844871521, 0.0005824379622936249, 0.0006023645401000977]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 5.0, 1.0, 4.0, 4.0, 7.0, 11.0, 13.0, 5.0, 15.0, 28.0, 23.0, 25.0, 35.0, 36.0, 31.0, 36.0, 35.0, 35.0, 33.0, 45.0, 50.0, 52.0, 45.0, 43.0, 48.0, 52.0, 34.0, 34.0, 33.0, 37.0, 24.0, 23.0, 19.0, 11.0, 12.0, 13.0, 13.0, 10.0, 9.0, 10.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0], "bins": [-5.78125, -5.633636474609375, -5.48602294921875, -5.338409423828125, -5.1907958984375, -5.043182373046875, -4.89556884765625, -4.747955322265625, -4.600341796875, -4.452728271484375, -4.30511474609375, -4.157501220703125, -4.0098876953125, -3.862274169921875, -3.71466064453125, -3.567047119140625, -3.41943359375, -3.271820068359375, -3.12420654296875, -2.976593017578125, -2.8289794921875, -2.681365966796875, -2.53375244140625, -2.386138916015625, -2.238525390625, -2.090911865234375, -1.94329833984375, -1.795684814453125, -1.6480712890625, -1.500457763671875, -1.35284423828125, -1.205230712890625, -1.0576171875, -0.910003662109375, -0.76239013671875, -0.614776611328125, -0.4671630859375, -0.319549560546875, -0.17193603515625, -0.024322509765625, 0.123291015625, 0.270904541015625, 0.41851806640625, 0.566131591796875, 0.7137451171875, 0.861358642578125, 1.00897216796875, 1.156585693359375, 1.30419921875, 1.451812744140625, 1.59942626953125, 1.747039794921875, 1.8946533203125, 2.042266845703125, 2.18988037109375, 2.337493896484375, 2.485107421875, 2.632720947265625, 2.78033447265625, 2.927947998046875, 3.0755615234375, 3.223175048828125, 3.37078857421875, 3.518402099609375, 3.666015625]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 10.0, 5.0, 9.0, 8.0, 20.0, 30.0, 48.0, 59.0, 108.0, 161.0, 234.0, 439.0, 689.0, 1236.0, 2444.0, 5141.0, 11774.0, 30220.0, 86073.0, 273014.0, 414308.0, 142145.0, 47961.0, 18118.0, 7113.0, 3264.0, 1658.0, 912.0, 489.0, 319.0, 185.0, 124.0, 95.0, 44.0, 32.0, 23.0, 15.0, 10.0, 10.0, 5.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.80859375, -4.679412841796875, -4.55023193359375, -4.421051025390625, -4.2918701171875, -4.162689208984375, -4.03350830078125, -3.904327392578125, -3.775146484375, -3.645965576171875, -3.51678466796875, -3.387603759765625, -3.2584228515625, -3.129241943359375, -3.00006103515625, -2.870880126953125, -2.74169921875, -2.612518310546875, -2.48333740234375, -2.354156494140625, -2.2249755859375, -2.095794677734375, -1.96661376953125, -1.837432861328125, -1.708251953125, -1.579071044921875, -1.44989013671875, -1.320709228515625, -1.1915283203125, -1.062347412109375, -0.93316650390625, -0.803985595703125, -0.6748046875, -0.545623779296875, -0.41644287109375, -0.287261962890625, -0.1580810546875, -0.028900146484375, 0.10028076171875, 0.229461669921875, 0.358642578125, 0.487823486328125, 0.61700439453125, 0.746185302734375, 0.8753662109375, 1.004547119140625, 1.13372802734375, 1.262908935546875, 1.39208984375, 1.521270751953125, 1.65045166015625, 1.779632568359375, 1.9088134765625, 2.037994384765625, 2.16717529296875, 2.296356201171875, 2.425537109375, 2.554718017578125, 2.68389892578125, 2.813079833984375, 2.9422607421875, 3.071441650390625, 3.20062255859375, 3.329803466796875, 3.458984375]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 9.0, 8.0, 14.0, 17.0, 25.0, 28.0, 20.0, 30.0, 26.0, 35.0, 45.0, 53.0, 78.0, 81.0, 268.0, 1730.0, 161.0, 73.0, 62.0, 64.0, 47.0, 27.0, 37.0, 30.0, 11.0, 22.0, 12.0, 10.0, 8.0, 7.0, 5.0, 5.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-23.65625, -22.966552734375, -22.27685546875, -21.587158203125, -20.8974609375, -20.207763671875, -19.51806640625, -18.828369140625, -18.138671875, -17.448974609375, -16.75927734375, -16.069580078125, -15.3798828125, -14.690185546875, -14.00048828125, -13.310791015625, -12.62109375, -11.931396484375, -11.24169921875, -10.552001953125, -9.8623046875, -9.172607421875, -8.48291015625, -7.793212890625, -7.103515625, -6.413818359375, -5.72412109375, -5.034423828125, -4.3447265625, -3.655029296875, -2.96533203125, -2.275634765625, -1.5859375, -0.896240234375, -0.20654296875, 0.483154296875, 1.1728515625, 1.862548828125, 2.55224609375, 3.241943359375, 3.931640625, 4.621337890625, 5.31103515625, 6.000732421875, 6.6904296875, 7.380126953125, 8.06982421875, 8.759521484375, 9.44921875, 10.138916015625, 10.82861328125, 11.518310546875, 12.2080078125, 12.897705078125, 13.58740234375, 14.277099609375, 14.966796875, 15.656494140625, 16.34619140625, 17.035888671875, 17.7255859375, 18.415283203125, 19.10498046875, 19.794677734375, 20.484375]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 10.0, 13.0, 18.0, 21.0, 52.0, 54.0, 94.0, 149.0, 299.0, 756.0, 13607.0, 3124460.0, 4868.0, 608.0, 280.0, 156.0, 61.0, 64.0, 46.0, 36.0, 19.0, 17.0, 11.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-67.25, -65.294921875, -63.33984375, -61.384765625, -59.4296875, -57.474609375, -55.51953125, -53.564453125, -51.609375, -49.654296875, -47.69921875, -45.744140625, -43.7890625, -41.833984375, -39.87890625, -37.923828125, -35.96875, -34.013671875, -32.05859375, -30.103515625, -28.1484375, -26.193359375, -24.23828125, -22.283203125, -20.328125, -18.373046875, -16.41796875, -14.462890625, -12.5078125, -10.552734375, -8.59765625, -6.642578125, -4.6875, -2.732421875, -0.77734375, 1.177734375, 3.1328125, 5.087890625, 7.04296875, 8.998046875, 10.953125, 12.908203125, 14.86328125, 16.818359375, 18.7734375, 20.728515625, 22.68359375, 24.638671875, 26.59375, 28.548828125, 30.50390625, 32.458984375, 34.4140625, 36.369140625, 38.32421875, 40.279296875, 42.234375, 44.189453125, 46.14453125, 48.099609375, 50.0546875, 52.009765625, 53.96484375, 55.919921875, 57.875]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 410.0, 596.0, 6.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-306.86004638671875, -301.4834899902344, -296.10693359375, -290.73040771484375, -285.3538513183594, -279.977294921875, -274.6007385253906, -269.2242126464844, -263.84765625, -258.4710998535156, -253.0945587158203, -247.71800231933594, -242.34146118164062, -236.96490478515625, -231.58836364746094, -226.21180725097656, -220.83526611328125, -215.45870971679688, -210.08216857910156, -204.7056121826172, -199.32907104492188, -193.9525146484375, -188.5759735107422, -183.1994171142578, -177.82286071777344, -172.44630432128906, -167.06976318359375, -161.69320678710938, -156.31666564941406, -150.9401092529297, -145.56356811523438, -140.18701171875, -134.8104705810547, -129.4339141845703, -124.057373046875, -118.68082427978516, -113.30427551269531, -107.92772674560547, -102.55117797851562, -97.17462158203125, -91.79808044433594, -86.4215316772461, -81.04498291015625, -75.6684341430664, -70.29188537597656, -64.91533660888672, -59.53878402709961, -54.162235260009766, -48.78568649291992, -43.40913772583008, -38.032588958740234, -32.656036376953125, -27.279489517211914, -21.90294075012207, -16.526390075683594, -11.14984130859375, -5.773292541503906, -0.3967432975769043, 4.979805946350098, 10.356355667114258, 15.732904434204102, 21.109453201293945, 26.486003875732422, 31.862552642822266, 37.23910140991211]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 2.0, 1.0, 3.0, 2.0, 4.0, 3.0, 12.0, 7.0, 9.0, 16.0, 12.0, 15.0, 12.0, 17.0, 21.0, 21.0, 14.0, 20.0, 27.0, 36.0, 29.0, 29.0, 35.0, 37.0, 34.0, 33.0, 33.0, 41.0, 46.0, 39.0, 31.0, 23.0, 22.0, 34.0, 29.0, 29.0, 14.0, 24.0, 21.0, 20.0, 26.0, 18.0, 14.0, 18.0, 7.0, 13.0, 6.0, 13.0, 7.0, 6.0, 5.0, 4.0, 6.0, 7.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-34.619956970214844, -33.49950408935547, -32.37905502319336, -31.258602142333984, -30.13814926147461, -29.017698287963867, -27.897247314453125, -26.77679443359375, -25.656343460083008, -24.535892486572266, -23.41543960571289, -22.29498863220215, -21.174537658691406, -20.05408477783203, -18.93363380432129, -17.813182830810547, -16.692729949951172, -15.572278022766113, -14.451826095581055, -13.331375122070312, -12.210923194885254, -11.090471267700195, -9.970020294189453, -8.849568367004395, -7.729116439819336, -6.608664512634277, -5.488213062286377, -4.367761611938477, -3.247309684753418, -2.1268577575683594, -1.006406307220459, 0.1140451431274414, 1.2344970703125, 2.3549487590789795, 3.475400447845459, 4.595851898193359, 5.716303825378418, 6.836755752563477, 7.957207202911377, 9.077658653259277, 10.198110580444336, 11.318562507629395, 12.439014434814453, 13.559465408325195, 14.679917335510254, 15.800369262695312, 16.920820236206055, 18.041271209716797, 19.161724090576172, 20.282175064086914, 21.40262794494629, 22.52307891845703, 23.643531799316406, 24.76398277282715, 25.88443374633789, 27.004886627197266, 28.125337600708008, 29.24578857421875, 30.366241455078125, 31.486692428588867, 32.60714340209961, 33.727596282958984, 34.84804916381836, 35.96849822998047, 37.088951110839844]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 6.0, 1.0, 5.0, 3.0, 4.0, 5.0, 9.0, 10.0, 16.0, 13.0, 18.0, 22.0, 33.0, 28.0, 26.0, 35.0, 26.0, 39.0, 42.0, 31.0, 45.0, 53.0, 42.0, 43.0, 39.0, 42.0, 51.0, 36.0, 37.0, 35.0, 27.0, 29.0, 21.0, 26.0, 20.0, 15.0, 17.0, 9.0, 6.0, 11.0, 15.0, 5.0, 8.0, 2.0, 1.0, 3.0, 3.0], "bins": [-5.828125, -5.681365966796875, -5.53460693359375, -5.387847900390625, -5.2410888671875, -5.094329833984375, -4.94757080078125, -4.800811767578125, -4.654052734375, -4.507293701171875, -4.36053466796875, -4.213775634765625, -4.0670166015625, -3.920257568359375, -3.77349853515625, -3.626739501953125, -3.47998046875, -3.333221435546875, -3.18646240234375, -3.039703369140625, -2.8929443359375, -2.746185302734375, -2.59942626953125, -2.452667236328125, -2.305908203125, -2.159149169921875, -2.01239013671875, -1.865631103515625, -1.7188720703125, -1.572113037109375, -1.42535400390625, -1.278594970703125, -1.1318359375, -0.985076904296875, -0.83831787109375, -0.691558837890625, -0.5447998046875, -0.398040771484375, -0.25128173828125, -0.104522705078125, 0.042236328125, 0.188995361328125, 0.33575439453125, 0.482513427734375, 0.6292724609375, 0.776031494140625, 0.92279052734375, 1.069549560546875, 1.21630859375, 1.363067626953125, 1.50982666015625, 1.656585693359375, 1.8033447265625, 1.950103759765625, 2.09686279296875, 2.243621826171875, 2.390380859375, 2.537139892578125, 2.68389892578125, 2.830657958984375, 2.9774169921875, 3.124176025390625, 3.27093505859375, 3.417694091796875, 3.564453125]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 4.0, 6.0, 6.0, 9.0, 8.0, 12.0, 21.0, 13.0, 31.0, 40.0, 29.0, 38.0, 51.0, 80.0, 129.0, 218.0, 508.0, 3086.0, 63141.0, 3217772.0, 892279.0, 14703.0, 1210.0, 289.0, 180.0, 92.0, 68.0, 51.0, 40.0, 32.0, 15.0, 30.0, 21.0, 16.0, 14.0, 8.0, 9.0, 7.0, 5.0, 4.0, 3.0, 4.0, 4.0, 0.0, 1.0], "bins": [-28.296875, -27.5673828125, -26.837890625, -26.1083984375, -25.37890625, -24.6494140625, -23.919921875, -23.1904296875, -22.4609375, -21.7314453125, -21.001953125, -20.2724609375, -19.54296875, -18.8134765625, -18.083984375, -17.3544921875, -16.625, -15.8955078125, -15.166015625, -14.4365234375, -13.70703125, -12.9775390625, -12.248046875, -11.5185546875, -10.7890625, -10.0595703125, -9.330078125, -8.6005859375, -7.87109375, -7.1416015625, -6.412109375, -5.6826171875, -4.953125, -4.2236328125, -3.494140625, -2.7646484375, -2.03515625, -1.3056640625, -0.576171875, 0.1533203125, 0.8828125, 1.6123046875, 2.341796875, 3.0712890625, 3.80078125, 4.5302734375, 5.259765625, 5.9892578125, 6.71875, 7.4482421875, 8.177734375, 8.9072265625, 9.63671875, 10.3662109375, 11.095703125, 11.8251953125, 12.5546875, 13.2841796875, 14.013671875, 14.7431640625, 15.47265625, 16.2021484375, 16.931640625, 17.6611328125, 18.390625]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 4.0, 7.0, 13.0, 14.0, 23.0, 25.0, 46.0, 69.0, 86.0, 102.0, 188.0, 230.0, 357.0, 385.0, 486.0, 517.0, 391.0, 331.0, 221.0, 190.0, 131.0, 77.0, 52.0, 38.0, 28.0, 24.0, 17.0, 7.0, 7.0, 5.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.4453125, -13.0499267578125, -12.654541015625, -12.2591552734375, -11.86376953125, -11.4683837890625, -11.072998046875, -10.6776123046875, -10.2822265625, -9.8868408203125, -9.491455078125, -9.0960693359375, -8.70068359375, -8.3052978515625, -7.909912109375, -7.5145263671875, -7.119140625, -6.7237548828125, -6.328369140625, -5.9329833984375, -5.53759765625, -5.1422119140625, -4.746826171875, -4.3514404296875, -3.9560546875, -3.5606689453125, -3.165283203125, -2.7698974609375, -2.37451171875, -1.9791259765625, -1.583740234375, -1.1883544921875, -0.79296875, -0.3975830078125, -0.002197265625, 0.3931884765625, 0.78857421875, 1.1839599609375, 1.579345703125, 1.9747314453125, 2.3701171875, 2.7655029296875, 3.160888671875, 3.5562744140625, 3.95166015625, 4.3470458984375, 4.742431640625, 5.1378173828125, 5.533203125, 5.9285888671875, 6.323974609375, 6.7193603515625, 7.11474609375, 7.5101318359375, 7.905517578125, 8.3009033203125, 8.6962890625, 9.0916748046875, 9.487060546875, 9.8824462890625, 10.27783203125, 10.6732177734375, 11.068603515625, 11.4639892578125, 11.859375]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 4.0, 2.0, 9.0, 16.0, 3.0, 14.0, 23.0, 22.0, 45.0, 44.0, 55.0, 103.0, 111.0, 169.0, 227.0, 380.0, 894.0, 4931.0, 170860.0, 3822117.0, 186775.0, 5234.0, 942.0, 422.0, 252.0, 169.0, 123.0, 101.0, 74.0, 39.0, 35.0, 28.0, 17.0, 13.0, 12.0, 6.0, 6.0, 1.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-36.1875, -35.0390625, -33.890625, -32.7421875, -31.59375, -30.4453125, -29.296875, -28.1484375, -27.0, -25.8515625, -24.703125, -23.5546875, -22.40625, -21.2578125, -20.109375, -18.9609375, -17.8125, -16.6640625, -15.515625, -14.3671875, -13.21875, -12.0703125, -10.921875, -9.7734375, -8.625, -7.4765625, -6.328125, -5.1796875, -4.03125, -2.8828125, -1.734375, -0.5859375, 0.5625, 1.7109375, 2.859375, 4.0078125, 5.15625, 6.3046875, 7.453125, 8.6015625, 9.75, 10.8984375, 12.046875, 13.1953125, 14.34375, 15.4921875, 16.640625, 17.7890625, 18.9375, 20.0859375, 21.234375, 22.3828125, 23.53125, 24.6796875, 25.828125, 26.9765625, 28.125, 29.2734375, 30.421875, 31.5703125, 32.71875, 33.8671875, 35.015625, 36.1640625, 37.3125]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 8.0, 31.0, 78.0, 136.0, 200.0, 211.0, 169.0, 105.0, 51.0, 16.0, 7.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.55401611328125, -63.283809661865234, -60.01360321044922, -56.74340057373047, -53.47319030761719, -50.20298767089844, -46.93278121948242, -43.662574768066406, -40.39236831665039, -37.122161865234375, -33.85195541381836, -30.581750869750977, -27.31154441833496, -24.041337966918945, -20.771133422851562, -17.500926971435547, -14.230720520019531, -10.960514068603516, -7.690308570861816, -4.420103073120117, -1.1498966217041016, 2.120309829711914, 5.390514373779297, 8.660720825195312, 11.930927276611328, 15.201133728027344, 18.47134017944336, 21.741544723510742, 25.011751174926758, 28.281957626342773, 31.552162170410156, 34.82236862182617, 38.09257507324219, 41.3627815246582, 44.63298797607422, 47.90319061279297, 51.17340087890625, 54.443603515625, 57.713809967041016, 60.98401641845703, 64.25422668457031, 67.52442932128906, 70.79463958740234, 74.0648422241211, 77.33505249023438, 80.60525512695312, 83.87545776367188, 87.14566802978516, 90.4158706665039, 93.68607330322266, 96.95628356933594, 100.22648620605469, 103.49669647216797, 106.76689910888672, 110.037109375, 113.30731201171875, 116.5775146484375, 119.84771728515625, 123.11792755126953, 126.38813018798828, 129.65834045410156, 132.9285430908203, 136.19874572753906, 139.46896362304688, 142.73916625976562]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 4.0, 6.0, 4.0, 8.0, 2.0, 7.0, 28.0, 20.0, 18.0, 22.0, 21.0, 25.0, 41.0, 30.0, 33.0, 37.0, 46.0, 35.0, 47.0, 44.0, 45.0, 57.0, 39.0, 36.0, 32.0, 39.0, 33.0, 41.0, 30.0, 32.0, 21.0, 23.0, 19.0, 16.0, 15.0, 11.0, 8.0, 11.0, 6.0, 7.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.150726318359375, -34.92421340942383, -33.69770050048828, -32.471187591552734, -31.244674682617188, -30.01816177368164, -28.791648864746094, -27.565135955810547, -26.338623046875, -25.112110137939453, -23.885597229003906, -22.65908432006836, -21.432571411132812, -20.206058502197266, -18.97954559326172, -17.753032684326172, -16.526519775390625, -15.300006866455078, -14.073493957519531, -12.846981048583984, -11.620468139648438, -10.39395523071289, -9.167442321777344, -7.940929412841797, -6.71441650390625, -5.487903594970703, -4.261390686035156, -3.0348777770996094, -1.8083648681640625, -0.5818519592285156, 0.6446609497070312, 1.8711738586425781, 3.0976905822753906, 4.3242034912109375, 5.550716400146484, 6.777229309082031, 8.003742218017578, 9.230255126953125, 10.456768035888672, 11.683280944824219, 12.909793853759766, 14.136306762695312, 15.36281967163086, 16.589332580566406, 17.815845489501953, 19.0423583984375, 20.268871307373047, 21.495384216308594, 22.72189712524414, 23.948410034179688, 25.174922943115234, 26.40143585205078, 27.627948760986328, 28.854461669921875, 30.080974578857422, 31.30748748779297, 32.534000396728516, 33.76051330566406, 34.98702621459961, 36.213539123535156, 37.4400520324707, 38.66656494140625, 39.8930778503418, 41.119590759277344, 42.34610366821289]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 7.0, 8.0, 6.0, 8.0, 9.0, 8.0, 15.0, 20.0, 19.0, 19.0, 26.0, 30.0, 30.0, 52.0, 33.0, 46.0, 49.0, 42.0, 46.0, 42.0, 48.0, 41.0, 37.0, 45.0, 33.0, 43.0, 22.0, 23.0, 33.0, 32.0, 28.0, 16.0, 15.0, 10.0, 11.0, 9.0, 12.0, 11.0, 6.0, 3.0, 7.0, 4.0, 2.0], "bins": [-6.1953125, -6.04296875, -5.890625, -5.73828125, -5.5859375, -5.43359375, -5.28125, -5.12890625, -4.9765625, -4.82421875, -4.671875, -4.51953125, -4.3671875, -4.21484375, -4.0625, -3.91015625, -3.7578125, -3.60546875, -3.453125, -3.30078125, -3.1484375, -2.99609375, -2.84375, -2.69140625, -2.5390625, -2.38671875, -2.234375, -2.08203125, -1.9296875, -1.77734375, -1.625, -1.47265625, -1.3203125, -1.16796875, -1.015625, -0.86328125, -0.7109375, -0.55859375, -0.40625, -0.25390625, -0.1015625, 0.05078125, 0.203125, 0.35546875, 0.5078125, 0.66015625, 0.8125, 0.96484375, 1.1171875, 1.26953125, 1.421875, 1.57421875, 1.7265625, 1.87890625, 2.03125, 2.18359375, 2.3359375, 2.48828125, 2.640625, 2.79296875, 2.9453125, 3.09765625, 3.25, 3.40234375, 3.5546875]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 7.0, 4.0, 7.0, 11.0, 17.0, 29.0, 43.0, 64.0, 79.0, 134.0, 195.0, 275.0, 444.0, 672.0, 946.0, 1413.0, 2242.0, 3232.0, 5228.0, 8278.0, 12758.0, 20593.0, 33330.0, 54897.0, 91440.0, 151345.0, 207747.0, 174894.0, 108367.0, 64597.0, 39175.0, 24265.0, 14882.0, 9516.0, 6000.0, 4024.0, 2564.0, 1623.0, 1080.0, 760.0, 442.0, 330.0, 211.0, 133.0, 99.0, 72.0, 30.0, 23.0, 14.0, 15.0, 9.0, 6.0, 10.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.50732421875, -0.491302490234375, -0.47528076171875, -0.459259033203125, -0.4432373046875, -0.427215576171875, -0.41119384765625, -0.395172119140625, -0.379150390625, -0.363128662109375, -0.34710693359375, -0.331085205078125, -0.3150634765625, -0.299041748046875, -0.28302001953125, -0.266998291015625, -0.2509765625, -0.234954833984375, -0.21893310546875, -0.202911376953125, -0.1868896484375, -0.170867919921875, -0.15484619140625, -0.138824462890625, -0.122802734375, -0.106781005859375, -0.09075927734375, -0.074737548828125, -0.0587158203125, -0.042694091796875, -0.02667236328125, -0.010650634765625, 0.00537109375, 0.021392822265625, 0.03741455078125, 0.053436279296875, 0.0694580078125, 0.085479736328125, 0.10150146484375, 0.117523193359375, 0.133544921875, 0.149566650390625, 0.16558837890625, 0.181610107421875, 0.1976318359375, 0.213653564453125, 0.22967529296875, 0.245697021484375, 0.26171875, 0.277740478515625, 0.29376220703125, 0.309783935546875, 0.3258056640625, 0.341827392578125, 0.35784912109375, 0.373870849609375, 0.389892578125, 0.405914306640625, 0.42193603515625, 0.437957763671875, 0.4539794921875, 0.470001220703125, 0.48602294921875, 0.502044677734375, 0.51806640625]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 6.0, 0.0, 1.0, 2.0, 3.0, 6.0, 3.0, 6.0, 11.0, 12.0, 5.0, 16.0, 22.0, 22.0, 24.0, 26.0, 28.0, 22.0, 39.0, 30.0, 33.0, 33.0, 41.0, 31.0, 39.0, 1061.0, 45.0, 53.0, 41.0, 30.0, 45.0, 35.0, 29.0, 32.0, 25.0, 25.0, 29.0, 17.0, 13.0, 19.0, 20.0, 10.0, 8.0, 5.0, 11.0, 7.0, 8.0, 2.0, 5.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.849609375, -2.757293701171875, -2.66497802734375, -2.572662353515625, -2.4803466796875, -2.388031005859375, -2.29571533203125, -2.203399658203125, -2.111083984375, -2.018768310546875, -1.92645263671875, -1.834136962890625, -1.7418212890625, -1.649505615234375, -1.55718994140625, -1.464874267578125, -1.37255859375, -1.280242919921875, -1.18792724609375, -1.095611572265625, -1.0032958984375, -0.910980224609375, -0.81866455078125, -0.726348876953125, -0.634033203125, -0.541717529296875, -0.44940185546875, -0.357086181640625, -0.2647705078125, -0.172454833984375, -0.08013916015625, 0.012176513671875, 0.1044921875, 0.196807861328125, 0.28912353515625, 0.381439208984375, 0.4737548828125, 0.566070556640625, 0.65838623046875, 0.750701904296875, 0.843017578125, 0.935333251953125, 1.02764892578125, 1.119964599609375, 1.2122802734375, 1.304595947265625, 1.39691162109375, 1.489227294921875, 1.58154296875, 1.673858642578125, 1.76617431640625, 1.858489990234375, 1.9508056640625, 2.043121337890625, 2.13543701171875, 2.227752685546875, 2.320068359375, 2.412384033203125, 2.50469970703125, 2.597015380859375, 2.6893310546875, 2.781646728515625, 2.87396240234375, 2.966278076171875, 3.05859375]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 6.0, 5.0, 9.0, 8.0, 19.0, 20.0, 28.0, 62.0, 67.0, 98.0, 142.0, 213.0, 320.0, 476.0, 729.0, 1127.0, 1639.0, 2599.0, 4161.0, 6314.0, 10043.0, 15863.0, 26158.0, 42823.0, 70496.0, 114014.0, 162312.0, 1229071.0, 148895.0, 99700.0, 61294.0, 36968.0, 22736.0, 14131.0, 8556.0, 5678.0, 3529.0, 2224.0, 1562.0, 1016.0, 655.0, 439.0, 305.0, 211.0, 138.0, 87.0, 64.0, 38.0, 24.0, 25.0, 17.0, 10.0, 4.0, 8.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.349609375, -0.3384590148925781, -0.32730865478515625, -0.3161582946777344, -0.3050079345703125, -0.2938575744628906, -0.28270721435546875, -0.2715568542480469, -0.260406494140625, -0.24925613403320312, -0.23810577392578125, -0.22695541381835938, -0.2158050537109375, -0.20465469360351562, -0.19350433349609375, -0.18235397338867188, -0.17120361328125, -0.16005325317382812, -0.14890289306640625, -0.13775253295898438, -0.1266021728515625, -0.11545181274414062, -0.10430145263671875, -0.09315109252929688, -0.082000732421875, -0.07085037231445312, -0.05970001220703125, -0.048549652099609375, -0.0373992919921875, -0.026248931884765625, -0.01509857177734375, -0.003948211669921875, 0.0072021484375, 0.018352508544921875, 0.02950286865234375, 0.040653228759765625, 0.0518035888671875, 0.06295394897460938, 0.07410430908203125, 0.08525466918945312, 0.096405029296875, 0.10755538940429688, 0.11870574951171875, 0.12985610961914062, 0.1410064697265625, 0.15215682983398438, 0.16330718994140625, 0.17445755004882812, 0.18560791015625, 0.19675827026367188, 0.20790863037109375, 0.21905899047851562, 0.2302093505859375, 0.24135971069335938, 0.25251007080078125, 0.2636604309082031, 0.274810791015625, 0.2859611511230469, 0.29711151123046875, 0.3082618713378906, 0.3194122314453125, 0.3305625915527344, 0.34171295166015625, 0.3528633117675781, 0.364013671875]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 1.0, 10.0, 5.0, 10.0, 9.0, 13.0, 24.0, 22.0, 22.0, 30.0, 40.0, 42.0, 48.0, 66.0, 52.0, 57.0, 71.0, 59.0, 65.0, 58.0, 52.0, 45.0, 38.0, 35.0, 17.0, 21.0, 20.0, 19.0, 12.0, 9.0, 10.0, 4.0, 7.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012407302856445312, -0.0011986792087554932, -0.001156628131866455, -0.001114577054977417, -0.001072525978088379, -0.0010304749011993408, -0.0009884238243103027, -0.0009463727474212646, -0.0009043216705322266, -0.0008622705936431885, -0.0008202195167541504, -0.0007781684398651123, -0.0007361173629760742, -0.0006940662860870361, -0.000652015209197998, -0.00060996413230896, -0.0005679130554199219, -0.0005258619785308838, -0.0004838109016418457, -0.0004417598247528076, -0.00039970874786376953, -0.00035765767097473145, -0.00031560659408569336, -0.0002735555171966553, -0.0002315044403076172, -0.0001894533634185791, -0.00014740228652954102, -0.00010535120964050293, -6.330013275146484e-05, -2.1249055862426758e-05, 2.0802021026611328e-05, 6.285309791564941e-05, 0.0001049041748046875, 0.00014695525169372559, 0.00018900632858276367, 0.00023105740547180176, 0.00027310848236083984, 0.00031515955924987793, 0.000357210636138916, 0.0003992617130279541, 0.0004413127899169922, 0.0004833638668060303, 0.0005254149436950684, 0.0005674660205841064, 0.0006095170974731445, 0.0006515681743621826, 0.0006936192512512207, 0.0007356703281402588, 0.0007777214050292969, 0.000819772481918335, 0.000861823558807373, 0.0009038746356964111, 0.0009459257125854492, 0.0009879767894744873, 0.0010300278663635254, 0.0010720789432525635, 0.0011141300201416016, 0.0011561810970306396, 0.0011982321739196777, 0.0012402832508087158, 0.001282334327697754, 0.001324385404586792, 0.00136643648147583, 0.0014084875583648682, 0.0014505386352539062]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 2.0, 1.0, 3.0, 2.0, 5.0, 8.0, 9.0, 10.0, 16.0, 24.0, 26.0, 50.0, 50.0, 90.0, 143.0, 254.0, 456.0, 1816.0, 649730.0, 393263.0, 1451.0, 482.0, 258.0, 125.0, 80.0, 44.0, 35.0, 31.0, 26.0, 19.0, 10.0, 15.0, 5.0, 5.0, 3.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.03118896484375, -0.03027033805847168, -0.02935171127319336, -0.02843308448791504, -0.02751445770263672, -0.0265958309173584, -0.025677204132080078, -0.024758577346801758, -0.023839950561523438, -0.022921323776245117, -0.022002696990966797, -0.021084070205688477, -0.020165443420410156, -0.019246816635131836, -0.018328189849853516, -0.017409563064575195, -0.016490936279296875, -0.015572309494018555, -0.014653682708740234, -0.013735055923461914, -0.012816429138183594, -0.011897802352905273, -0.010979175567626953, -0.010060548782348633, -0.009141921997070312, -0.008223295211791992, -0.007304668426513672, -0.0063860416412353516, -0.005467414855957031, -0.004548788070678711, -0.0036301612854003906, -0.0027115345001220703, -0.00179290771484375, -0.0008742809295654297, 4.4345855712890625e-05, 0.0009629726409912109, 0.0018815994262695312, 0.0028002262115478516, 0.003718852996826172, 0.004637479782104492, 0.0055561065673828125, 0.006474733352661133, 0.007393360137939453, 0.008311986923217773, 0.009230613708496094, 0.010149240493774414, 0.011067867279052734, 0.011986494064331055, 0.012905120849609375, 0.013823747634887695, 0.014742374420166016, 0.015661001205444336, 0.016579627990722656, 0.017498254776000977, 0.018416881561279297, 0.019335508346557617, 0.020254135131835938, 0.021172761917114258, 0.022091388702392578, 0.0230100154876709, 0.02392864227294922, 0.02484726905822754, 0.02576589584350586, 0.02668452262878418, 0.0276031494140625]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 30.0, 927.0, 62.0], "bins": [-0.02315860614180565, -0.02278851717710495, -0.02241842821240425, -0.022048339247703552, -0.021678250283002853, -0.021308161318302155, -0.020938072353601456, -0.020567981526255608, -0.02019789256155491, -0.01982780359685421, -0.01945771463215351, -0.019087625667452812, -0.018717536702752113, -0.018347445875406265, -0.017977356910705566, -0.017607267946004868, -0.01723717898130417, -0.01686709001660347, -0.01649700105190277, -0.016126912087202072, -0.015756823122501373, -0.0153867332264781, -0.015016644261777401, -0.014646555297076702, -0.014276467263698578, -0.013906378298997879, -0.01353628933429718, -0.013166200369596481, -0.012796110473573208, -0.012426021508872509, -0.01205593254417181, -0.011685843579471111, -0.011315753683447838, -0.010945664718747139, -0.01057557575404644, -0.010205486789345741, -0.009835396893322468, -0.009465307928621769, -0.00909521896392107, -0.008725129999220371, -0.008355040103197098, -0.007984951138496399, -0.007614861708134413, -0.007244772743433714, -0.006874683313071728, -0.006504594348371029, -0.00613450538367033, -0.005764416418969631, -0.005394327454268932, -0.0050242384895682335, -0.004654149059206247, -0.0042840600945055485, -0.003913970664143562, -0.0035438816994428635, -0.0031737927347421646, -0.002803703537210822, -0.0024336143396794796, -0.002063525142148137, -0.0016934360610321164, -0.0013233469799160957, -0.0009532577823847532, -0.0005831685848534107, -0.00021307962015271187, 0.00015700957737863064, 0.0005270987749099731]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 5.0, 10.0, 11.0, 9.0, 20.0, 23.0, 22.0, 18.0, 32.0, 39.0, 48.0, 57.0, 55.0, 62.0, 48.0, 52.0, 55.0, 52.0, 50.0, 40.0, 54.0, 43.0, 37.0, 45.0, 30.0, 21.0, 12.0, 13.0, 16.0, 9.0, 5.0, 5.0, 1.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006859898567199707, -0.0006585754454135895, -0.0006311610341072083, -0.000603746622800827, -0.0005763322114944458, -0.0005489178001880646, -0.0005215033888816833, -0.0004940889775753021, -0.0004666745662689209, -0.00043926015496253967, -0.00041184574365615845, -0.0003844313323497772, -0.000357016921043396, -0.00032960250973701477, -0.00030218809843063354, -0.0002747736871242523, -0.0002473592758178711, -0.00021994486451148987, -0.00019253045320510864, -0.00016511604189872742, -0.0001377016305923462, -0.00011028721928596497, -8.287280797958374e-05, -5.5458396673202515e-05, -2.804398536682129e-05, -6.295740604400635e-07, 2.6784837245941162e-05, 5.419924855232239e-05, 8.161365985870361e-05, 0.00010902807116508484, 0.00013644248247146606, 0.0001638568937778473, 0.00019127130508422852, 0.00021868571639060974, 0.00024610012769699097, 0.0002735145390033722, 0.0003009289503097534, 0.00032834336161613464, 0.00035575777292251587, 0.0003831721842288971, 0.0004105865955352783, 0.00043800100684165955, 0.00046541541814804077, 0.000492829829454422, 0.0005202442407608032, 0.0005476586520671844, 0.0005750730633735657, 0.0006024874746799469, 0.0006299018859863281, 0.0006573162972927094, 0.0006847307085990906, 0.0007121451199054718, 0.000739559531211853, 0.0007669739425182343, 0.0007943883538246155, 0.0008218027651309967, 0.0008492171764373779, 0.0008766315877437592, 0.0009040459990501404, 0.0009314604103565216, 0.0009588748216629028, 0.000986289232969284, 0.0010137036442756653, 0.0010411180555820465, 0.0010685324668884277]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 7.0, 8.0, 6.0, 8.0, 9.0, 8.0, 15.0, 20.0, 19.0, 19.0, 26.0, 30.0, 30.0, 52.0, 33.0, 46.0, 49.0, 42.0, 46.0, 42.0, 48.0, 41.0, 37.0, 45.0, 33.0, 43.0, 22.0, 23.0, 33.0, 32.0, 28.0, 16.0, 15.0, 10.0, 11.0, 9.0, 12.0, 11.0, 6.0, 3.0, 7.0, 4.0, 2.0], "bins": [-6.1953125, -6.04296875, -5.890625, -5.73828125, -5.5859375, -5.43359375, -5.28125, -5.12890625, -4.9765625, -4.82421875, -4.671875, -4.51953125, -4.3671875, -4.21484375, -4.0625, -3.91015625, -3.7578125, -3.60546875, -3.453125, -3.30078125, -3.1484375, -2.99609375, -2.84375, -2.69140625, -2.5390625, -2.38671875, -2.234375, -2.08203125, -1.9296875, -1.77734375, -1.625, -1.47265625, -1.3203125, -1.16796875, -1.015625, -0.86328125, -0.7109375, -0.55859375, -0.40625, -0.25390625, -0.1015625, 0.05078125, 0.203125, 0.35546875, 0.5078125, 0.66015625, 0.8125, 0.96484375, 1.1171875, 1.26953125, 1.421875, 1.57421875, 1.7265625, 1.87890625, 2.03125, 2.18359375, 2.3359375, 2.48828125, 2.640625, 2.79296875, 2.9453125, 3.09765625, 3.25, 3.40234375, 3.5546875]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 4.0, 2.0, 11.0, 16.0, 28.0, 30.0, 81.0, 130.0, 249.0, 491.0, 878.0, 1745.0, 3457.0, 6839.0, 14517.0, 33167.0, 93482.0, 343523.0, 380973.0, 102505.0, 36116.0, 15384.0, 7449.0, 3684.0, 1825.0, 916.0, 474.0, 259.0, 140.0, 79.0, 42.0, 17.0, 15.0, 17.0, 7.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.91015625, -3.7755126953125, -3.640869140625, -3.5062255859375, -3.37158203125, -3.2369384765625, -3.102294921875, -2.9676513671875, -2.8330078125, -2.6983642578125, -2.563720703125, -2.4290771484375, -2.29443359375, -2.1597900390625, -2.025146484375, -1.8905029296875, -1.755859375, -1.6212158203125, -1.486572265625, -1.3519287109375, -1.21728515625, -1.0826416015625, -0.947998046875, -0.8133544921875, -0.6787109375, -0.5440673828125, -0.409423828125, -0.2747802734375, -0.14013671875, -0.0054931640625, 0.129150390625, 0.2637939453125, 0.3984375, 0.5330810546875, 0.667724609375, 0.8023681640625, 0.93701171875, 1.0716552734375, 1.206298828125, 1.3409423828125, 1.4755859375, 1.6102294921875, 1.744873046875, 1.8795166015625, 2.01416015625, 2.1488037109375, 2.283447265625, 2.4180908203125, 2.552734375, 2.6873779296875, 2.822021484375, 2.9566650390625, 3.09130859375, 3.2259521484375, 3.360595703125, 3.4952392578125, 3.6298828125, 3.7645263671875, 3.899169921875, 4.0338134765625, 4.16845703125, 4.3031005859375, 4.437744140625, 4.5723876953125, 4.70703125]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 4.0, 2.0, 3.0, 7.0, 4.0, 7.0, 5.0, 3.0, 18.0, 6.0, 12.0, 25.0, 20.0, 21.0, 33.0, 35.0, 36.0, 36.0, 44.0, 46.0, 52.0, 86.0, 157.0, 1571.0, 246.0, 107.0, 78.0, 55.0, 40.0, 35.0, 41.0, 22.0, 27.0, 29.0, 25.0, 16.0, 22.0, 13.0, 14.0, 12.0, 8.0, 8.0, 11.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-17.109375, -16.569580078125, -16.02978515625, -15.489990234375, -14.9501953125, -14.410400390625, -13.87060546875, -13.330810546875, -12.791015625, -12.251220703125, -11.71142578125, -11.171630859375, -10.6318359375, -10.092041015625, -9.55224609375, -9.012451171875, -8.47265625, -7.932861328125, -7.39306640625, -6.853271484375, -6.3134765625, -5.773681640625, -5.23388671875, -4.694091796875, -4.154296875, -3.614501953125, -3.07470703125, -2.534912109375, -1.9951171875, -1.455322265625, -0.91552734375, -0.375732421875, 0.1640625, 0.703857421875, 1.24365234375, 1.783447265625, 2.3232421875, 2.863037109375, 3.40283203125, 3.942626953125, 4.482421875, 5.022216796875, 5.56201171875, 6.101806640625, 6.6416015625, 7.181396484375, 7.72119140625, 8.260986328125, 8.80078125, 9.340576171875, 9.88037109375, 10.420166015625, 10.9599609375, 11.499755859375, 12.03955078125, 12.579345703125, 13.119140625, 13.658935546875, 14.19873046875, 14.738525390625, 15.2783203125, 15.818115234375, 16.35791015625, 16.897705078125, 17.4375]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 5.0, 4.0, 5.0, 8.0, 12.0, 13.0, 24.0, 21.0, 39.0, 51.0, 76.0, 148.0, 199.0, 367.0, 813.0, 9278.0, 3110508.0, 22072.0, 1064.0, 379.0, 199.0, 130.0, 94.0, 54.0, 45.0, 19.0, 26.0, 10.0, 14.0, 6.0, 7.0, 4.0, 8.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-57.34375, -55.5283203125, -53.712890625, -51.8974609375, -50.08203125, -48.2666015625, -46.451171875, -44.6357421875, -42.8203125, -41.0048828125, -39.189453125, -37.3740234375, -35.55859375, -33.7431640625, -31.927734375, -30.1123046875, -28.296875, -26.4814453125, -24.666015625, -22.8505859375, -21.03515625, -19.2197265625, -17.404296875, -15.5888671875, -13.7734375, -11.9580078125, -10.142578125, -8.3271484375, -6.51171875, -4.6962890625, -2.880859375, -1.0654296875, 0.75, 2.5654296875, 4.380859375, 6.1962890625, 8.01171875, 9.8271484375, 11.642578125, 13.4580078125, 15.2734375, 17.0888671875, 18.904296875, 20.7197265625, 22.53515625, 24.3505859375, 26.166015625, 27.9814453125, 29.796875, 31.6123046875, 33.427734375, 35.2431640625, 37.05859375, 38.8740234375, 40.689453125, 42.5048828125, 44.3203125, 46.1357421875, 47.951171875, 49.7666015625, 51.58203125, 53.3974609375, 55.212890625, 57.0283203125, 58.84375]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 8.0, 20.0, 40.0, 87.0, 158.0, 187.0, 203.0, 150.0, 92.0, 38.0, 19.0, 7.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.02022361755371, -18.85841178894043, -17.69659996032715, -16.534788131713867, -15.372976303100586, -14.211164474487305, -13.049351692199707, -11.887539863586426, -10.725728034973145, -9.563916206359863, -8.402104377746582, -7.240292072296143, -6.078480243682861, -4.91666841506958, -3.7548561096191406, -2.5930442810058594, -1.4312324523925781, -0.2694205045700073, 0.8923914432525635, 2.054203510284424, 3.216015338897705, 4.377827167510986, 5.539639472961426, 6.701451301574707, 7.863263130187988, 9.02507495880127, 10.18688678741455, 11.348699569702148, 12.51051139831543, 13.672323226928711, 14.834135055541992, 15.995946884155273, 17.157760620117188, 18.31957244873047, 19.48138427734375, 20.64319610595703, 21.805007934570312, 22.966819763183594, 24.128631591796875, 25.290443420410156, 26.452255249023438, 27.61406707763672, 28.77587890625, 29.93769073486328, 31.099502563476562, 32.261314392089844, 33.423126220703125, 34.584938049316406, 35.74674987792969, 36.90856170654297, 38.07037353515625, 39.23218536376953, 40.39399719238281, 41.555809020996094, 42.717620849609375, 43.879432678222656, 45.0412483215332, 46.203060150146484, 47.364871978759766, 48.52668380737305, 49.68849563598633, 50.85030746459961, 52.01211929321289, 53.17393112182617, 54.33574295043945]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 3.0, 2.0, 7.0, 10.0, 7.0, 11.0, 18.0, 13.0, 19.0, 15.0, 24.0, 22.0, 26.0, 37.0, 47.0, 28.0, 33.0, 40.0, 37.0, 40.0, 41.0, 35.0, 47.0, 42.0, 36.0, 39.0, 33.0, 34.0, 30.0, 29.0, 22.0, 28.0, 22.0, 21.0, 21.0, 20.0, 13.0, 9.0, 9.0, 11.0, 2.0, 4.0, 4.0, 2.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0], "bins": [-50.722442626953125, -49.169769287109375, -47.617095947265625, -46.064422607421875, -44.511749267578125, -42.959075927734375, -41.406402587890625, -39.853729248046875, -38.301055908203125, -36.748382568359375, -35.195709228515625, -33.643035888671875, -32.090362548828125, -30.537689208984375, -28.985013961791992, -27.432340621948242, -25.87966537475586, -24.32699203491211, -22.77431869506836, -21.22164535522461, -19.66897201538086, -18.11629867553711, -16.563623428344727, -15.010950088500977, -13.458276748657227, -11.905603408813477, -10.352930068969727, -8.80025577545166, -7.24758243560791, -5.69490909576416, -4.142234802246094, -2.5895614624023438, -1.0368881225585938, 0.5157854557037354, 2.0684590339660645, 3.6211328506469727, 5.173806190490723, 6.726479530334473, 8.279153823852539, 9.831827163696289, 11.384500503540039, 12.937173843383789, 14.489847183227539, 16.042522430419922, 17.595195770263672, 19.147869110107422, 20.700542449951172, 22.253215789794922, 23.805889129638672, 25.358562469482422, 26.911235809326172, 28.463909149169922, 30.016582489013672, 31.569255828857422, 33.12193298339844, 34.67460632324219, 36.22727966308594, 37.77995300292969, 39.33262634277344, 40.88529968261719, 42.43797302246094, 43.99064636230469, 45.54331970214844, 47.09599304199219, 48.64866638183594]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 5.0, 5.0, 4.0, 7.0, 9.0, 4.0, 14.0, 29.0, 13.0, 20.0, 29.0, 35.0, 24.0, 43.0, 42.0, 46.0, 38.0, 60.0, 37.0, 55.0, 45.0, 47.0, 49.0, 43.0, 42.0, 30.0, 30.0, 36.0, 27.0, 31.0, 21.0, 17.0, 17.0, 7.0, 9.0, 11.0, 9.0, 6.0, 6.0, 2.0, 5.0, 0.0, 0.0, 1.0], "bins": [-7.04296875, -6.86529541015625, -6.6876220703125, -6.50994873046875, -6.332275390625, -6.15460205078125, -5.9769287109375, -5.79925537109375, -5.62158203125, -5.44390869140625, -5.2662353515625, -5.08856201171875, -4.910888671875, -4.73321533203125, -4.5555419921875, -4.37786865234375, -4.2001953125, -4.02252197265625, -3.8448486328125, -3.66717529296875, -3.489501953125, -3.31182861328125, -3.1341552734375, -2.95648193359375, -2.77880859375, -2.60113525390625, -2.4234619140625, -2.24578857421875, -2.068115234375, -1.89044189453125, -1.7127685546875, -1.53509521484375, -1.357421875, -1.17974853515625, -1.0020751953125, -0.82440185546875, -0.646728515625, -0.46905517578125, -0.2913818359375, -0.11370849609375, 0.06396484375, 0.24163818359375, 0.4193115234375, 0.59698486328125, 0.774658203125, 0.95233154296875, 1.1300048828125, 1.30767822265625, 1.4853515625, 1.66302490234375, 1.8406982421875, 2.01837158203125, 2.196044921875, 2.37371826171875, 2.5513916015625, 2.72906494140625, 2.90673828125, 3.08441162109375, 3.2620849609375, 3.43975830078125, 3.617431640625, 3.79510498046875, 3.9727783203125, 4.15045166015625, 4.328125]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 4.0, 10.0, 5.0, 16.0, 20.0, 43.0, 38.0, 60.0, 74.0, 160.0, 239.0, 403.0, 883.0, 2469.0, 8697.0, 40676.0, 269411.0, 1614054.0, 1843529.0, 347741.0, 50834.0, 10254.0, 2652.0, 919.0, 435.0, 222.0, 140.0, 87.0, 76.0, 41.0, 34.0, 20.0, 13.0, 9.0, 10.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.390625, -10.0855712890625, -9.780517578125, -9.4754638671875, -9.17041015625, -8.8653564453125, -8.560302734375, -8.2552490234375, -7.9501953125, -7.6451416015625, -7.340087890625, -7.0350341796875, -6.72998046875, -6.4249267578125, -6.119873046875, -5.8148193359375, -5.509765625, -5.2047119140625, -4.899658203125, -4.5946044921875, -4.28955078125, -3.9844970703125, -3.679443359375, -3.3743896484375, -3.0693359375, -2.7642822265625, -2.459228515625, -2.1541748046875, -1.84912109375, -1.5440673828125, -1.239013671875, -0.9339599609375, -0.62890625, -0.3238525390625, -0.018798828125, 0.2862548828125, 0.59130859375, 0.8963623046875, 1.201416015625, 1.5064697265625, 1.8115234375, 2.1165771484375, 2.421630859375, 2.7266845703125, 3.03173828125, 3.3367919921875, 3.641845703125, 3.9468994140625, 4.251953125, 4.5570068359375, 4.862060546875, 5.1671142578125, 5.47216796875, 5.7772216796875, 6.082275390625, 6.3873291015625, 6.6923828125, 6.9974365234375, 7.302490234375, 7.6075439453125, 7.91259765625, 8.2176513671875, 8.522705078125, 8.8277587890625, 9.1328125]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 6.0, 4.0, 6.0, 8.0, 11.0, 11.0, 12.0, 22.0, 32.0, 39.0, 39.0, 61.0, 71.0, 95.0, 123.0, 180.0, 223.0, 293.0, 338.0, 355.0, 383.0, 356.0, 296.0, 258.0, 209.0, 144.0, 125.0, 95.0, 63.0, 50.0, 44.0, 28.0, 26.0, 20.0, 9.0, 9.0, 14.0, 6.0, 5.0, 4.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.3671875, -9.0474853515625, -8.727783203125, -8.4080810546875, -8.08837890625, -7.7686767578125, -7.448974609375, -7.1292724609375, -6.8095703125, -6.4898681640625, -6.170166015625, -5.8504638671875, -5.53076171875, -5.2110595703125, -4.891357421875, -4.5716552734375, -4.251953125, -3.9322509765625, -3.612548828125, -3.2928466796875, -2.97314453125, -2.6534423828125, -2.333740234375, -2.0140380859375, -1.6943359375, -1.3746337890625, -1.054931640625, -0.7352294921875, -0.41552734375, -0.0958251953125, 0.223876953125, 0.5435791015625, 0.86328125, 1.1829833984375, 1.502685546875, 1.8223876953125, 2.14208984375, 2.4617919921875, 2.781494140625, 3.1011962890625, 3.4208984375, 3.7406005859375, 4.060302734375, 4.3800048828125, 4.69970703125, 5.0194091796875, 5.339111328125, 5.6588134765625, 5.978515625, 6.2982177734375, 6.617919921875, 6.9376220703125, 7.25732421875, 7.5770263671875, 7.896728515625, 8.2164306640625, 8.5361328125, 8.8558349609375, 9.175537109375, 9.4952392578125, 9.81494140625, 10.1346435546875, 10.454345703125, 10.7740478515625, 11.09375]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 5.0, 3.0, 6.0, 11.0, 11.0, 24.0, 24.0, 19.0, 31.0, 33.0, 53.0, 50.0, 81.0, 90.0, 131.0, 203.0, 306.0, 582.0, 1989.0, 31191.0, 1715032.0, 2396928.0, 43221.0, 2516.0, 626.0, 322.0, 199.0, 155.0, 101.0, 95.0, 49.0, 45.0, 40.0, 24.0, 26.0, 8.0, 12.0, 15.0, 7.0, 8.0, 4.0, 3.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-31.53125, -30.54736328125, -29.5634765625, -28.57958984375, -27.595703125, -26.61181640625, -25.6279296875, -24.64404296875, -23.66015625, -22.67626953125, -21.6923828125, -20.70849609375, -19.724609375, -18.74072265625, -17.7568359375, -16.77294921875, -15.7890625, -14.80517578125, -13.8212890625, -12.83740234375, -11.853515625, -10.86962890625, -9.8857421875, -8.90185546875, -7.91796875, -6.93408203125, -5.9501953125, -4.96630859375, -3.982421875, -2.99853515625, -2.0146484375, -1.03076171875, -0.046875, 0.93701171875, 1.9208984375, 2.90478515625, 3.888671875, 4.87255859375, 5.8564453125, 6.84033203125, 7.82421875, 8.80810546875, 9.7919921875, 10.77587890625, 11.759765625, 12.74365234375, 13.7275390625, 14.71142578125, 15.6953125, 16.67919921875, 17.6630859375, 18.64697265625, 19.630859375, 20.61474609375, 21.5986328125, 22.58251953125, 23.56640625, 24.55029296875, 25.5341796875, 26.51806640625, 27.501953125, 28.48583984375, 29.4697265625, 30.45361328125, 31.4375]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 7.0, 21.0, 62.0, 127.0, 180.0, 238.0, 201.0, 108.0, 48.0, 14.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-113.86643981933594, -110.5593490600586, -107.25226593017578, -103.94517517089844, -100.6380844116211, -97.33099365234375, -94.02391052246094, -90.7168197631836, -87.40972900390625, -84.1026382446289, -80.7955551147461, -77.48846435546875, -74.1813735961914, -70.87428283691406, -67.56719970703125, -64.2601089477539, -60.95302200317383, -57.64593505859375, -54.338844299316406, -51.03175735473633, -47.724666595458984, -44.417579650878906, -41.11048889160156, -37.803401947021484, -34.496315002441406, -31.189226150512695, -27.882137298583984, -24.575050354003906, -21.267959594726562, -17.960872650146484, -14.653783798217773, -11.346694946289062, -8.039604187011719, -4.732515335083008, -1.425426959991455, 1.8816614151000977, 5.188750267028809, 8.495838165283203, 11.802927017211914, 15.110015869140625, 18.417104721069336, 21.724193572998047, 25.031282424926758, 28.33837127685547, 31.645458221435547, 34.952545166015625, 38.25963592529297, 41.56672668457031, 44.87381362915039, 48.18090057373047, 51.48799133300781, 54.79507827758789, 58.102169036865234, 61.40925598144531, 64.71634674072266, 68.0234375, 71.33052062988281, 74.63761138916016, 77.94469451904297, 81.25178527832031, 84.55887603759766, 87.865966796875, 91.17304992675781, 94.48014068603516, 97.7872314453125]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 5.0, 7.0, 8.0, 7.0, 3.0, 14.0, 12.0, 19.0, 12.0, 14.0, 15.0, 18.0, 21.0, 20.0, 23.0, 25.0, 27.0, 28.0, 39.0, 36.0, 36.0, 37.0, 33.0, 26.0, 38.0, 38.0, 31.0, 31.0, 37.0, 28.0, 32.0, 31.0, 30.0, 29.0, 36.0, 19.0, 14.0, 20.0, 16.0, 16.0, 12.0, 13.0, 8.0, 8.0, 8.0, 5.0, 2.0, 5.0, 6.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-31.427268981933594, -30.416793823242188, -29.406320571899414, -28.39584732055664, -27.385372161865234, -26.374897003173828, -25.364423751831055, -24.35395050048828, -23.343475341796875, -22.33300018310547, -21.322526931762695, -20.312053680419922, -19.301578521728516, -18.29110336303711, -17.280630111694336, -16.270156860351562, -15.259681701660156, -14.249207496643066, -13.238733291625977, -12.228259086608887, -11.217784881591797, -10.207310676574707, -9.196836471557617, -8.186362266540527, -7.1758880615234375, -6.165413856506348, -5.154939651489258, -4.144465446472168, -3.133991241455078, -2.1235170364379883, -1.1130428314208984, -0.1025686264038086, 0.9079055786132812, 1.918379783630371, 2.928853988647461, 3.939328193664551, 4.949802398681641, 5.9602766036987305, 6.97075080871582, 7.98122501373291, 8.99169921875, 10.00217342376709, 11.01264762878418, 12.02312183380127, 13.03359603881836, 14.04407024383545, 15.054544448852539, 16.065017700195312, 17.07549285888672, 18.085968017578125, 19.0964412689209, 20.106914520263672, 21.117389678955078, 22.127864837646484, 23.138338088989258, 24.14881134033203, 25.159286499023438, 26.169761657714844, 27.180234909057617, 28.19070816040039, 29.201183319091797, 30.211658477783203, 31.222131729125977, 32.23260498046875, 33.243080139160156]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 4.0, 6.0, 5.0, 8.0, 6.0, 7.0, 14.0, 19.0, 19.0, 20.0, 20.0, 31.0, 24.0, 33.0, 27.0, 38.0, 35.0, 42.0, 40.0, 22.0, 47.0, 53.0, 48.0, 46.0, 46.0, 32.0, 41.0, 36.0, 35.0, 27.0, 22.0, 28.0, 17.0, 16.0, 15.0, 14.0, 5.0, 12.0, 9.0, 6.0, 7.0, 8.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-5.58203125, -5.423583984375, -5.26513671875, -5.106689453125, -4.9482421875, -4.789794921875, -4.63134765625, -4.472900390625, -4.314453125, -4.156005859375, -3.99755859375, -3.839111328125, -3.6806640625, -3.522216796875, -3.36376953125, -3.205322265625, -3.046875, -2.888427734375, -2.72998046875, -2.571533203125, -2.4130859375, -2.254638671875, -2.09619140625, -1.937744140625, -1.779296875, -1.620849609375, -1.46240234375, -1.303955078125, -1.1455078125, -0.987060546875, -0.82861328125, -0.670166015625, -0.51171875, -0.353271484375, -0.19482421875, -0.036376953125, 0.1220703125, 0.280517578125, 0.43896484375, 0.597412109375, 0.755859375, 0.914306640625, 1.07275390625, 1.231201171875, 1.3896484375, 1.548095703125, 1.70654296875, 1.864990234375, 2.0234375, 2.181884765625, 2.34033203125, 2.498779296875, 2.6572265625, 2.815673828125, 2.97412109375, 3.132568359375, 3.291015625, 3.449462890625, 3.60791015625, 3.766357421875, 3.9248046875, 4.083251953125, 4.24169921875, 4.400146484375, 4.55859375]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 4.0, 7.0, 5.0, 11.0, 9.0, 14.0, 23.0, 42.0, 57.0, 93.0, 118.0, 186.0, 304.0, 434.0, 668.0, 981.0, 1514.0, 2301.0, 3716.0, 5816.0, 9174.0, 14550.0, 23764.0, 38818.0, 64106.0, 108326.0, 172740.0, 206605.0, 153586.0, 94259.0, 56385.0, 34092.0, 20881.0, 12889.0, 7888.0, 5053.0, 3183.0, 2083.0, 1214.0, 850.0, 604.0, 365.0, 251.0, 183.0, 103.0, 92.0, 58.0, 40.0, 31.0, 30.0, 21.0, 10.0, 8.0, 7.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.465576171875, -0.4491615295410156, -0.43274688720703125, -0.4163322448730469, -0.3999176025390625, -0.3835029602050781, -0.36708831787109375, -0.3506736755371094, -0.334259033203125, -0.3178443908691406, -0.30142974853515625, -0.2850151062011719, -0.2686004638671875, -0.2521858215332031, -0.23577117919921875, -0.21935653686523438, -0.20294189453125, -0.18652725219726562, -0.17011260986328125, -0.15369796752929688, -0.1372833251953125, -0.12086868286132812, -0.10445404052734375, -0.08803939819335938, -0.071624755859375, -0.055210113525390625, -0.03879547119140625, -0.022380828857421875, -0.0059661865234375, 0.010448455810546875, 0.02686309814453125, 0.043277740478515625, 0.0596923828125, 0.07610702514648438, 0.09252166748046875, 0.10893630981445312, 0.1253509521484375, 0.14176559448242188, 0.15818023681640625, 0.17459487915039062, 0.191009521484375, 0.20742416381835938, 0.22383880615234375, 0.24025344848632812, 0.2566680908203125, 0.2730827331542969, 0.28949737548828125, 0.3059120178222656, 0.32232666015625, 0.3387413024902344, 0.35515594482421875, 0.3715705871582031, 0.3879852294921875, 0.4043998718261719, 0.42081451416015625, 0.4372291564941406, 0.453643798828125, 0.4700584411621094, 0.48647308349609375, 0.5028877258300781, 0.5193023681640625, 0.5357170104980469, 0.5521316528320312, 0.5685462951660156, 0.5849609375]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 5.0, 5.0, 1.0, 4.0, 8.0, 6.0, 10.0, 12.0, 19.0, 18.0, 12.0, 14.0, 17.0, 19.0, 28.0, 31.0, 27.0, 33.0, 33.0, 34.0, 44.0, 36.0, 42.0, 35.0, 1051.0, 38.0, 29.0, 42.0, 27.0, 36.0, 40.0, 27.0, 32.0, 25.0, 25.0, 22.0, 24.0, 13.0, 18.0, 9.0, 8.0, 11.0, 5.0, 11.0, 9.0, 3.0, 9.0, 8.0, 5.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0], "bins": [-3.048828125, -2.9586181640625, -2.868408203125, -2.7781982421875, -2.68798828125, -2.5977783203125, -2.507568359375, -2.4173583984375, -2.3271484375, -2.2369384765625, -2.146728515625, -2.0565185546875, -1.96630859375, -1.8760986328125, -1.785888671875, -1.6956787109375, -1.60546875, -1.5152587890625, -1.425048828125, -1.3348388671875, -1.24462890625, -1.1544189453125, -1.064208984375, -0.9739990234375, -0.8837890625, -0.7935791015625, -0.703369140625, -0.6131591796875, -0.52294921875, -0.4327392578125, -0.342529296875, -0.2523193359375, -0.162109375, -0.0718994140625, 0.018310546875, 0.1085205078125, 0.19873046875, 0.2889404296875, 0.379150390625, 0.4693603515625, 0.5595703125, 0.6497802734375, 0.739990234375, 0.8302001953125, 0.92041015625, 1.0106201171875, 1.100830078125, 1.1910400390625, 1.28125, 1.3714599609375, 1.461669921875, 1.5518798828125, 1.64208984375, 1.7322998046875, 1.822509765625, 1.9127197265625, 2.0029296875, 2.0931396484375, 2.183349609375, 2.2735595703125, 2.36376953125, 2.4539794921875, 2.544189453125, 2.6343994140625, 2.724609375]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 8.0, 5.0, 10.0, 21.0, 26.0, 39.0, 72.0, 96.0, 149.0, 226.0, 392.0, 596.0, 898.0, 1557.0, 2419.0, 4046.0, 6470.0, 10974.0, 18801.0, 32905.0, 57234.0, 100145.0, 160500.0, 1250996.0, 175967.0, 115314.0, 66711.0, 37681.0, 21650.0, 12277.0, 7381.0, 4411.0, 2591.0, 1672.0, 989.0, 659.0, 433.0, 277.0, 158.0, 135.0, 73.0, 66.0, 40.0, 25.0, 16.0, 14.0, 4.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42626953125, -0.4127922058105469, -0.39931488037109375, -0.3858375549316406, -0.3723602294921875, -0.3588829040527344, -0.34540557861328125, -0.3319282531738281, -0.318450927734375, -0.3049736022949219, -0.29149627685546875, -0.2780189514160156, -0.2645416259765625, -0.2510643005371094, -0.23758697509765625, -0.22410964965820312, -0.21063232421875, -0.19715499877929688, -0.18367767333984375, -0.17020034790039062, -0.1567230224609375, -0.14324569702148438, -0.12976837158203125, -0.11629104614257812, -0.102813720703125, -0.08933639526367188, -0.07585906982421875, -0.062381744384765625, -0.0489044189453125, -0.035427093505859375, -0.02194976806640625, -0.008472442626953125, 0.0050048828125, 0.018482208251953125, 0.03195953369140625, 0.045436859130859375, 0.0589141845703125, 0.07239151000976562, 0.08586883544921875, 0.09934616088867188, 0.112823486328125, 0.12630081176757812, 0.13977813720703125, 0.15325546264648438, 0.1667327880859375, 0.18021011352539062, 0.19368743896484375, 0.20716476440429688, 0.22064208984375, 0.23411941528320312, 0.24759674072265625, 0.2610740661621094, 0.2745513916015625, 0.2880287170410156, 0.30150604248046875, 0.3149833679199219, 0.328460693359375, 0.3419380187988281, 0.35541534423828125, 0.3688926696777344, 0.3823699951171875, 0.3958473205566406, 0.40932464599609375, 0.4228019714355469, 0.436279296875]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 6.0, 10.0, 8.0, 10.0, 19.0, 19.0, 15.0, 24.0, 29.0, 34.0, 37.0, 40.0, 59.0, 71.0, 71.0, 70.0, 60.0, 70.0, 57.0, 59.0, 44.0, 41.0, 34.0, 30.0, 16.0, 13.0, 12.0, 12.0, 9.0, 8.0, 1.0, 6.0, 4.0, 0.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013179779052734375, -0.001270294189453125, -0.0012226104736328125, -0.0011749267578125, -0.0011272430419921875, -0.001079559326171875, -0.0010318756103515625, -0.00098419189453125, -0.0009365081787109375, -0.000888824462890625, -0.0008411407470703125, -0.00079345703125, -0.0007457733154296875, -0.000698089599609375, -0.0006504058837890625, -0.00060272216796875, -0.0005550384521484375, -0.000507354736328125, -0.0004596710205078125, -0.0004119873046875, -0.0003643035888671875, -0.000316619873046875, -0.0002689361572265625, -0.00022125244140625, -0.0001735687255859375, -0.000125885009765625, -7.82012939453125e-05, -3.0517578125e-05, 1.71661376953125e-05, 6.4849853515625e-05, 0.0001125335693359375, 0.00016021728515625, 0.0002079010009765625, 0.000255584716796875, 0.0003032684326171875, 0.0003509521484375, 0.0003986358642578125, 0.000446319580078125, 0.0004940032958984375, 0.00054168701171875, 0.0005893707275390625, 0.000637054443359375, 0.0006847381591796875, 0.000732421875, 0.0007801055908203125, 0.000827789306640625, 0.0008754730224609375, 0.00092315673828125, 0.0009708404541015625, 0.001018524169921875, 0.0010662078857421875, 0.0011138916015625, 0.0011615753173828125, 0.001209259033203125, 0.0012569427490234375, 0.00130462646484375, 0.0013523101806640625, 0.001399993896484375, 0.0014476776123046875, 0.001495361328125, 0.0015430450439453125, 0.001590728759765625, 0.0016384124755859375, 0.00168609619140625, 0.0017337799072265625]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 5.0, 5.0, 9.0, 9.0, 11.0, 12.0, 24.0, 31.0, 29.0, 48.0, 66.0, 89.0, 140.0, 287.0, 648.0, 4401.0, 991029.0, 49730.0, 1054.0, 346.0, 176.0, 115.0, 66.0, 55.0, 38.0, 25.0, 20.0, 15.0, 18.0, 23.0, 6.0, 4.0, 7.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0338134765625, -0.03286623954772949, -0.031919002532958984, -0.030971765518188477, -0.03002452850341797, -0.02907729148864746, -0.028130054473876953, -0.027182817459106445, -0.026235580444335938, -0.02528834342956543, -0.024341106414794922, -0.023393869400024414, -0.022446632385253906, -0.0214993953704834, -0.02055215835571289, -0.019604921340942383, -0.018657684326171875, -0.017710447311401367, -0.01676321029663086, -0.01581597328186035, -0.014868736267089844, -0.013921499252319336, -0.012974262237548828, -0.01202702522277832, -0.011079788208007812, -0.010132551193237305, -0.009185314178466797, -0.008238077163696289, -0.007290840148925781, -0.0063436031341552734, -0.005396366119384766, -0.004449129104614258, -0.00350189208984375, -0.002554655075073242, -0.0016074180603027344, -0.0006601810455322266, 0.00028705596923828125, 0.001234292984008789, 0.002181529998779297, 0.0031287670135498047, 0.0040760040283203125, 0.00502324104309082, 0.005970478057861328, 0.006917715072631836, 0.007864952087402344, 0.008812189102172852, 0.00975942611694336, 0.010706663131713867, 0.011653900146484375, 0.012601137161254883, 0.01354837417602539, 0.014495611190795898, 0.015442848205566406, 0.016390085220336914, 0.017337322235107422, 0.01828455924987793, 0.019231796264648438, 0.020179033279418945, 0.021126270294189453, 0.02207350730895996, 0.02302074432373047, 0.023967981338500977, 0.024915218353271484, 0.025862455368041992, 0.0268096923828125]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 40.0, 784.0, 188.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.014264358207583427, -0.013971385546028614, -0.013678411953151226, -0.013385439291596413, -0.0130924666300416, -0.012799493037164211, -0.012506520375609398, -0.01221354678273201, -0.011920574121177197, -0.011627601459622383, -0.011334627866744995, -0.011041655205190182, -0.010748682543635368, -0.01045570895075798, -0.010162736289203167, -0.009869763627648354, -0.009576790034770966, -0.009283817373216152, -0.008990843780338764, -0.00869787111878395, -0.008404898457229137, -0.00811192486435175, -0.007818952202796936, -0.007525979075580835, -0.007233006879687309, -0.006940033752471209, -0.006647061090916395, -0.0063540879637002945, -0.006061114836484194, -0.005768141709268093, -0.00547516904771328, -0.005182195920497179, -0.004889222327619791, -0.00459624920040369, -0.004303276538848877, -0.004010303411632776, -0.0037173302844166756, -0.0034243573900312185, -0.0031313844956457615, -0.002838411368429661, -0.0025454384740442038, -0.0022524655796587467, -0.001959492452442646, -0.001666519558057189, -0.0013735465472564101, -0.0010805735364556313, -0.0007876006420701742, -0.0004946275148540735, -0.00020165462046861649, 9.131836122833192e-05, 0.00038429134292528033, 0.0006772642955183983, 0.0009702373063191772, 0.001263210317119956, 0.001556183211505413, 0.0018491563387215137, 0.002142129233106971, 0.002435102127492428, 0.0027280752547085285, 0.0030210481490939856, 0.0033140210434794426, 0.0036069941706955433, 0.0038999670650810003, 0.004192939959466457, 0.004485913086682558]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 6.0, 5.0, 5.0, 4.0, 4.0, 3.0, 6.0, 10.0, 15.0, 13.0, 20.0, 10.0, 22.0, 22.0, 29.0, 27.0, 30.0, 30.0, 27.0, 46.0, 41.0, 46.0, 43.0, 50.0, 44.0, 34.0, 44.0, 43.0, 33.0, 27.0, 27.0, 29.0, 27.0, 30.0, 22.0, 22.0, 19.0, 15.0, 14.0, 7.0, 10.0, 5.0, 10.0, 12.0, 3.0, 4.0, 6.0, 3.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0], "bins": [-0.0006848573684692383, -0.0006638104096055031, -0.0006427634507417679, -0.0006217164918780327, -0.0006006695330142975, -0.0005796225741505623, -0.0005585756152868271, -0.0005375286564230919, -0.0005164816975593567, -0.0004954347386956215, -0.0004743877798318863, -0.0004533408209681511, -0.0004322938621044159, -0.0004112469032406807, -0.0003901999443769455, -0.0003691529855132103, -0.0003481060266494751, -0.0003270590677857399, -0.0003060121089220047, -0.0002849651500582695, -0.0002639181911945343, -0.0002428712323307991, -0.0002218242734670639, -0.0002007773146033287, -0.0001797303557395935, -0.0001586833968758583, -0.0001376364380121231, -0.00011658947914838791, -9.554252028465271e-05, -7.449556142091751e-05, -5.344860255718231e-05, -3.240164369344711e-05, -1.1354684829711914e-05, 9.692274034023285e-06, 3.0739232897758484e-05, 5.178619176149368e-05, 7.283315062522888e-05, 9.388010948896408e-05, 0.00011492706835269928, 0.00013597402721643448, 0.00015702098608016968, 0.00017806794494390488, 0.00019911490380764008, 0.00022016186267137527, 0.00024120882153511047, 0.00026225578039884567, 0.00028330273926258087, 0.00030434969812631607, 0.00032539665699005127, 0.00034644361585378647, 0.00036749057471752167, 0.00038853753358125687, 0.00040958449244499207, 0.00043063145130872726, 0.00045167841017246246, 0.00047272536903619766, 0.0004937723278999329, 0.0005148192867636681, 0.0005358662456274033, 0.0005569132044911385, 0.0005779601633548737, 0.0005990071222186089, 0.0006200540810823441, 0.0006411010399460793, 0.0006621479988098145]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 4.0, 6.0, 5.0, 8.0, 6.0, 7.0, 14.0, 19.0, 19.0, 20.0, 20.0, 31.0, 24.0, 33.0, 27.0, 38.0, 35.0, 42.0, 40.0, 22.0, 47.0, 53.0, 48.0, 46.0, 46.0, 33.0, 40.0, 36.0, 35.0, 27.0, 22.0, 28.0, 17.0, 16.0, 15.0, 14.0, 5.0, 12.0, 9.0, 6.0, 7.0, 8.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-5.58203125, -5.423583984375, -5.26513671875, -5.106689453125, -4.9482421875, -4.789794921875, -4.63134765625, -4.472900390625, -4.314453125, -4.156005859375, -3.99755859375, -3.839111328125, -3.6806640625, -3.522216796875, -3.36376953125, -3.205322265625, -3.046875, -2.888427734375, -2.72998046875, -2.571533203125, -2.4130859375, -2.254638671875, -2.09619140625, -1.937744140625, -1.779296875, -1.620849609375, -1.46240234375, -1.303955078125, -1.1455078125, -0.987060546875, -0.82861328125, -0.670166015625, -0.51171875, -0.353271484375, -0.19482421875, -0.036376953125, 0.1220703125, 0.280517578125, 0.43896484375, 0.597412109375, 0.755859375, 0.914306640625, 1.07275390625, 1.231201171875, 1.3896484375, 1.548095703125, 1.70654296875, 1.864990234375, 2.0234375, 2.181884765625, 2.34033203125, 2.498779296875, 2.6572265625, 2.815673828125, 2.97412109375, 3.132568359375, 3.291015625, 3.449462890625, 3.60791015625, 3.766357421875, 3.9248046875, 4.083251953125, 4.24169921875, 4.400146484375, 4.55859375]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 3.0, 11.0, 12.0, 21.0, 47.0, 66.0, 127.0, 223.0, 446.0, 841.0, 1689.0, 3837.0, 9132.0, 24038.0, 65107.0, 198823.0, 446316.0, 194737.0, 63346.0, 23446.0, 9019.0, 3762.0, 1711.0, 869.0, 442.0, 203.0, 121.0, 64.0, 43.0, 20.0, 6.0, 12.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.57421875, -5.41259765625, -5.2509765625, -5.08935546875, -4.927734375, -4.76611328125, -4.6044921875, -4.44287109375, -4.28125, -4.11962890625, -3.9580078125, -3.79638671875, -3.634765625, -3.47314453125, -3.3115234375, -3.14990234375, -2.98828125, -2.82666015625, -2.6650390625, -2.50341796875, -2.341796875, -2.18017578125, -2.0185546875, -1.85693359375, -1.6953125, -1.53369140625, -1.3720703125, -1.21044921875, -1.048828125, -0.88720703125, -0.7255859375, -0.56396484375, -0.40234375, -0.24072265625, -0.0791015625, 0.08251953125, 0.244140625, 0.40576171875, 0.5673828125, 0.72900390625, 0.890625, 1.05224609375, 1.2138671875, 1.37548828125, 1.537109375, 1.69873046875, 1.8603515625, 2.02197265625, 2.18359375, 2.34521484375, 2.5068359375, 2.66845703125, 2.830078125, 2.99169921875, 3.1533203125, 3.31494140625, 3.4765625, 3.63818359375, 3.7998046875, 3.96142578125, 4.123046875, 4.28466796875, 4.4462890625, 4.60791015625, 4.76953125]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 1.0, 4.0, 7.0, 11.0, 11.0, 18.0, 21.0, 21.0, 25.0, 37.0, 42.0, 52.0, 58.0, 61.0, 91.0, 245.0, 1743.0, 148.0, 85.0, 63.0, 56.0, 47.0, 43.0, 34.0, 37.0, 20.0, 13.0, 11.0, 14.0, 12.0, 6.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.453125, -27.57421875, -26.6953125, -25.81640625, -24.9375, -24.05859375, -23.1796875, -22.30078125, -21.421875, -20.54296875, -19.6640625, -18.78515625, -17.90625, -17.02734375, -16.1484375, -15.26953125, -14.390625, -13.51171875, -12.6328125, -11.75390625, -10.875, -9.99609375, -9.1171875, -8.23828125, -7.359375, -6.48046875, -5.6015625, -4.72265625, -3.84375, -2.96484375, -2.0859375, -1.20703125, -0.328125, 0.55078125, 1.4296875, 2.30859375, 3.1875, 4.06640625, 4.9453125, 5.82421875, 6.703125, 7.58203125, 8.4609375, 9.33984375, 10.21875, 11.09765625, 11.9765625, 12.85546875, 13.734375, 14.61328125, 15.4921875, 16.37109375, 17.25, 18.12890625, 19.0078125, 19.88671875, 20.765625, 21.64453125, 22.5234375, 23.40234375, 24.28125, 25.16015625, 26.0390625, 26.91796875, 27.796875]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 3.0, 3.0, 2.0, 1.0, 4.0, 2.0, 2.0, 3.0, 5.0, 10.0, 15.0, 17.0, 20.0, 18.0, 27.0, 51.0, 73.0, 108.0, 157.0, 224.0, 322.0, 836.0, 6477.0, 3099538.0, 35060.0, 1429.0, 440.0, 264.0, 185.0, 127.0, 76.0, 50.0, 34.0, 31.0, 22.0, 21.0, 16.0, 11.0, 4.0, 7.0, 2.0, 5.0, 4.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.125, -57.197265625, -55.26953125, -53.341796875, -51.4140625, -49.486328125, -47.55859375, -45.630859375, -43.703125, -41.775390625, -39.84765625, -37.919921875, -35.9921875, -34.064453125, -32.13671875, -30.208984375, -28.28125, -26.353515625, -24.42578125, -22.498046875, -20.5703125, -18.642578125, -16.71484375, -14.787109375, -12.859375, -10.931640625, -9.00390625, -7.076171875, -5.1484375, -3.220703125, -1.29296875, 0.634765625, 2.5625, 4.490234375, 6.41796875, 8.345703125, 10.2734375, 12.201171875, 14.12890625, 16.056640625, 17.984375, 19.912109375, 21.83984375, 23.767578125, 25.6953125, 27.623046875, 29.55078125, 31.478515625, 33.40625, 35.333984375, 37.26171875, 39.189453125, 41.1171875, 43.044921875, 44.97265625, 46.900390625, 48.828125, 50.755859375, 52.68359375, 54.611328125, 56.5390625, 58.466796875, 60.39453125, 62.322265625, 64.25]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 12.0, 209.0, 664.0, 127.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.230323791503906, -39.09013366699219, -34.9499397277832, -30.809749603271484, -26.669557571411133, -22.52936553955078, -18.389175415039062, -14.248983383178711, -10.10879135131836, -5.968599796295166, -1.8284082412719727, 2.3117828369140625, 6.451974868774414, 10.592166900634766, 14.732357025146484, 18.872549057006836, 23.012741088867188, 27.15293312072754, 31.29312515258789, 35.43331527709961, 39.573509216308594, 43.71369934082031, 47.85388946533203, 51.99407958984375, 56.134273529052734, 60.27446365356445, 64.41465759277344, 68.55484771728516, 72.69503784179688, 76.83523559570312, 80.97541809082031, 85.11561584472656, 89.25581359863281, 93.39600372314453, 97.53619384765625, 101.6763916015625, 105.81658172607422, 109.95677185058594, 114.09696197509766, 118.23715209960938, 122.37734985351562, 126.51753997802734, 130.65773010253906, 134.7979278564453, 138.9381103515625, 143.07830810546875, 147.218505859375, 151.3586883544922, 155.49887084960938, 159.63906860351562, 163.7792510986328, 167.91944885253906, 172.05963134765625, 176.1998291015625, 180.34002685546875, 184.48020935058594, 188.6204071044922, 192.76060485839844, 196.90078735351562, 201.04098510742188, 205.18116760253906, 209.3213653564453, 213.4615478515625, 217.60174560546875, 221.741943359375]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 6.0, 2.0, 9.0, 11.0, 8.0, 14.0, 22.0, 16.0, 33.0, 25.0, 27.0, 28.0, 28.0, 34.0, 36.0, 43.0, 43.0, 47.0, 33.0, 46.0, 44.0, 37.0, 31.0, 32.0, 41.0, 34.0, 29.0, 35.0, 26.0, 33.0, 24.0, 13.0, 15.0, 25.0, 7.0, 19.0, 12.0, 6.0, 14.0, 6.0, 4.0, 4.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-51.82158660888672, -50.33015060424805, -48.838714599609375, -47.3472785949707, -45.85584259033203, -44.364402770996094, -42.87297058105469, -41.38153076171875, -39.89009475708008, -38.398658752441406, -36.907222747802734, -35.41578674316406, -33.92435073852539, -32.43291473388672, -30.941476821899414, -29.45003890991211, -27.95860481262207, -26.4671688079834, -24.975732803344727, -23.484294891357422, -21.99285888671875, -20.501422882080078, -19.009986877441406, -17.518550872802734, -16.027114868164062, -14.53567886352539, -13.044241905212402, -11.55280590057373, -10.061368942260742, -8.56993293762207, -7.078496932983398, -5.58705997467041, -4.095623016357422, -2.604186534881592, -1.1127502918243408, 0.37868595123291016, 1.8701224327087402, 3.3615589141845703, 4.852994918823242, 6.3444318771362305, 7.835867881774902, 9.327303886413574, 10.818740844726562, 12.310176849365234, 13.801612854003906, 15.293049812316895, 16.78448486328125, 18.275922775268555, 19.767358779907227, 21.2587947845459, 22.75023078918457, 24.241668701171875, 25.733104705810547, 27.22454071044922, 28.71597671508789, 30.207412719726562, 31.698848724365234, 33.190284729003906, 34.68172073364258, 36.17315673828125, 37.66459274291992, 39.156028747558594, 40.64746856689453, 42.1389045715332, 43.630340576171875]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 5.0, 3.0, 6.0, 3.0, 3.0, 6.0, 7.0, 10.0, 10.0, 13.0, 15.0, 11.0, 17.0, 32.0, 26.0, 19.0, 26.0, 34.0, 33.0, 30.0, 27.0, 31.0, 44.0, 42.0, 41.0, 43.0, 36.0, 51.0, 32.0, 38.0, 38.0, 24.0, 32.0, 26.0, 17.0, 40.0, 23.0, 14.0, 14.0, 17.0, 9.0, 11.0, 7.0, 10.0, 8.0, 6.0, 6.0, 2.0, 6.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0], "bins": [-5.05859375, -4.90625, -4.75390625, -4.6015625, -4.44921875, -4.296875, -4.14453125, -3.9921875, -3.83984375, -3.6875, -3.53515625, -3.3828125, -3.23046875, -3.078125, -2.92578125, -2.7734375, -2.62109375, -2.46875, -2.31640625, -2.1640625, -2.01171875, -1.859375, -1.70703125, -1.5546875, -1.40234375, -1.25, -1.09765625, -0.9453125, -0.79296875, -0.640625, -0.48828125, -0.3359375, -0.18359375, -0.03125, 0.12109375, 0.2734375, 0.42578125, 0.578125, 0.73046875, 0.8828125, 1.03515625, 1.1875, 1.33984375, 1.4921875, 1.64453125, 1.796875, 1.94921875, 2.1015625, 2.25390625, 2.40625, 2.55859375, 2.7109375, 2.86328125, 3.015625, 3.16796875, 3.3203125, 3.47265625, 3.625, 3.77734375, 3.9296875, 4.08203125, 4.234375, 4.38671875, 4.5390625, 4.69140625]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 6.0, 8.0, 6.0, 10.0, 13.0, 12.0, 13.0, 17.0, 18.0, 20.0, 26.0, 28.0, 33.0, 43.0, 61.0, 127.0, 301.0, 1261.0, 9090.0, 251236.0, 3392004.0, 523228.0, 14308.0, 1616.0, 327.0, 129.0, 69.0, 39.0, 30.0, 41.0, 24.0, 17.0, 21.0, 18.0, 17.0, 12.0, 12.0, 4.0, 5.0, 9.0, 5.0, 5.0, 6.0, 3.0, 4.0, 0.0, 1.0, 2.0, 3.0], "bins": [-22.21875, -21.594482421875, -20.97021484375, -20.345947265625, -19.7216796875, -19.097412109375, -18.47314453125, -17.848876953125, -17.224609375, -16.600341796875, -15.97607421875, -15.351806640625, -14.7275390625, -14.103271484375, -13.47900390625, -12.854736328125, -12.23046875, -11.606201171875, -10.98193359375, -10.357666015625, -9.7333984375, -9.109130859375, -8.48486328125, -7.860595703125, -7.236328125, -6.612060546875, -5.98779296875, -5.363525390625, -4.7392578125, -4.114990234375, -3.49072265625, -2.866455078125, -2.2421875, -1.617919921875, -0.99365234375, -0.369384765625, 0.2548828125, 0.879150390625, 1.50341796875, 2.127685546875, 2.751953125, 3.376220703125, 4.00048828125, 4.624755859375, 5.2490234375, 5.873291015625, 6.49755859375, 7.121826171875, 7.74609375, 8.370361328125, 8.99462890625, 9.618896484375, 10.2431640625, 10.867431640625, 11.49169921875, 12.115966796875, 12.740234375, 13.364501953125, 13.98876953125, 14.613037109375, 15.2373046875, 15.861572265625, 16.48583984375, 17.110107421875, 17.734375]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 2.0, 4.0, 6.0, 12.0, 10.0, 12.0, 14.0, 22.0, 22.0, 35.0, 39.0, 66.0, 60.0, 89.0, 112.0, 165.0, 190.0, 234.0, 314.0, 332.0, 386.0, 328.0, 351.0, 293.0, 213.0, 170.0, 124.0, 113.0, 79.0, 66.0, 49.0, 46.0, 20.0, 19.0, 28.0, 8.0, 10.0, 7.0, 5.0, 6.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.8203125, -9.52001953125, -9.2197265625, -8.91943359375, -8.619140625, -8.31884765625, -8.0185546875, -7.71826171875, -7.41796875, -7.11767578125, -6.8173828125, -6.51708984375, -6.216796875, -5.91650390625, -5.6162109375, -5.31591796875, -5.015625, -4.71533203125, -4.4150390625, -4.11474609375, -3.814453125, -3.51416015625, -3.2138671875, -2.91357421875, -2.61328125, -2.31298828125, -2.0126953125, -1.71240234375, -1.412109375, -1.11181640625, -0.8115234375, -0.51123046875, -0.2109375, 0.08935546875, 0.3896484375, 0.68994140625, 0.990234375, 1.29052734375, 1.5908203125, 1.89111328125, 2.19140625, 2.49169921875, 2.7919921875, 3.09228515625, 3.392578125, 3.69287109375, 3.9931640625, 4.29345703125, 4.59375, 4.89404296875, 5.1943359375, 5.49462890625, 5.794921875, 6.09521484375, 6.3955078125, 6.69580078125, 6.99609375, 7.29638671875, 7.5966796875, 7.89697265625, 8.197265625, 8.49755859375, 8.7978515625, 9.09814453125, 9.3984375]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 5.0, 8.0, 6.0, 10.0, 13.0, 21.0, 35.0, 35.0, 49.0, 78.0, 98.0, 184.0, 220.0, 373.0, 1203.0, 16497.0, 2940529.0, 1224989.0, 7964.0, 899.0, 352.0, 183.0, 146.0, 110.0, 69.0, 57.0, 40.0, 27.0, 22.0, 22.0, 11.0, 10.0, 12.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-47.09375, -45.74462890625, -44.3955078125, -43.04638671875, -41.697265625, -40.34814453125, -38.9990234375, -37.64990234375, -36.30078125, -34.95166015625, -33.6025390625, -32.25341796875, -30.904296875, -29.55517578125, -28.2060546875, -26.85693359375, -25.5078125, -24.15869140625, -22.8095703125, -21.46044921875, -20.111328125, -18.76220703125, -17.4130859375, -16.06396484375, -14.71484375, -13.36572265625, -12.0166015625, -10.66748046875, -9.318359375, -7.96923828125, -6.6201171875, -5.27099609375, -3.921875, -2.57275390625, -1.2236328125, 0.12548828125, 1.474609375, 2.82373046875, 4.1728515625, 5.52197265625, 6.87109375, 8.22021484375, 9.5693359375, 10.91845703125, 12.267578125, 13.61669921875, 14.9658203125, 16.31494140625, 17.6640625, 19.01318359375, 20.3623046875, 21.71142578125, 23.060546875, 24.40966796875, 25.7587890625, 27.10791015625, 28.45703125, 29.80615234375, 31.1552734375, 32.50439453125, 33.853515625, 35.20263671875, 36.5517578125, 37.90087890625, 39.25]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 7.0, 128.0, 475.0, 359.0, 48.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.47235107421875, -97.2499008178711, -89.02745056152344, -80.80499267578125, -72.5825424194336, -64.36009216308594, -56.137638092041016, -47.915184020996094, -39.69273376464844, -31.47028160095215, -23.24782943725586, -15.02537727355957, -6.802925109863281, 1.419525146484375, 9.641979217529297, 17.86443328857422, 26.086883544921875, 34.30933380126953, 42.53178787231445, 50.754241943359375, 58.97669219970703, 67.19914245605469, 75.42160034179688, 83.64405059814453, 91.86650085449219, 100.08895111083984, 108.3114013671875, 116.53385925292969, 124.75630950927734, 132.978759765625, 141.2012176513672, 149.42367553710938, 157.64614868164062, 165.8686065673828, 174.09104919433594, 182.31350708007812, 190.53594970703125, 198.75840759277344, 206.98086547851562, 215.20330810546875, 223.42576599121094, 231.64822387695312, 239.87066650390625, 248.09312438964844, 256.3155822753906, 264.53802490234375, 272.7604675292969, 280.9829406738281, 289.20538330078125, 297.4278259277344, 305.6502990722656, 313.87274169921875, 322.0951843261719, 330.317626953125, 338.54010009765625, 346.7625427246094, 354.9849853515625, 363.2074279785156, 371.4299011230469, 379.65234375, 387.8747863769531, 396.09722900390625, 404.3197021484375, 412.5421447753906, 420.7646179199219]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 7.0, 5.0, 9.0, 6.0, 13.0, 15.0, 14.0, 16.0, 25.0, 20.0, 30.0, 32.0, 34.0, 20.0, 28.0, 28.0, 39.0, 44.0, 41.0, 50.0, 33.0, 43.0, 33.0, 40.0, 33.0, 32.0, 39.0, 34.0, 29.0, 29.0, 31.0, 18.0, 30.0, 19.0, 12.0, 18.0, 12.0, 11.0, 5.0, 4.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-35.222694396972656, -34.116905212402344, -33.01111602783203, -31.90532875061035, -30.79953956604004, -29.693750381469727, -28.587963104248047, -27.482173919677734, -26.376384735107422, -25.27059555053711, -24.164806365966797, -23.059019088745117, -21.953229904174805, -20.847440719604492, -19.741653442382812, -18.6358642578125, -17.530075073242188, -16.424285888671875, -15.318497657775879, -14.212709426879883, -13.10692024230957, -12.001131057739258, -10.895342826843262, -9.789554595947266, -8.683765411376953, -7.577976703643799, -6.4721879959106445, -5.36639928817749, -4.260610580444336, -3.1548218727111816, -2.0490331649780273, -0.943244457244873, 0.16254425048828125, 1.2683329582214355, 2.37412166595459, 3.479910373687744, 4.585699081420898, 5.691487789154053, 6.797276496887207, 7.903065204620361, 9.008853912353516, 10.114643096923828, 11.220431327819824, 12.32621955871582, 13.432008743286133, 14.537797927856445, 15.643586158752441, 16.749374389648438, 17.85516357421875, 18.960952758789062, 20.066741943359375, 21.172529220581055, 22.278318405151367, 23.38410758972168, 24.48989486694336, 25.595684051513672, 26.701473236083984, 27.807262420654297, 28.91305160522461, 30.01883888244629, 31.1246280670166, 32.23041534423828, 33.336204528808594, 34.441993713378906, 35.54778289794922]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 5.0, 4.0, 7.0, 7.0, 12.0, 9.0, 20.0, 13.0, 21.0, 15.0, 28.0, 25.0, 22.0, 23.0, 36.0, 36.0, 41.0, 32.0, 41.0, 40.0, 44.0, 40.0, 40.0, 44.0, 34.0, 31.0, 30.0, 38.0, 32.0, 25.0, 28.0, 25.0, 27.0, 21.0, 19.0, 18.0, 9.0, 10.0, 11.0, 6.0, 9.0, 6.0, 5.0, 2.0, 4.0, 2.0, 4.0, 1.0, 0.0, 2.0, 3.0, 1.0], "bins": [-5.16796875, -5.01397705078125, -4.8599853515625, -4.70599365234375, -4.552001953125, -4.39801025390625, -4.2440185546875, -4.09002685546875, -3.93603515625, -3.78204345703125, -3.6280517578125, -3.47406005859375, -3.320068359375, -3.16607666015625, -3.0120849609375, -2.85809326171875, -2.7041015625, -2.55010986328125, -2.3961181640625, -2.24212646484375, -2.088134765625, -1.93414306640625, -1.7801513671875, -1.62615966796875, -1.47216796875, -1.31817626953125, -1.1641845703125, -1.01019287109375, -0.856201171875, -0.70220947265625, -0.5482177734375, -0.39422607421875, -0.240234375, -0.08624267578125, 0.0677490234375, 0.22174072265625, 0.375732421875, 0.52972412109375, 0.6837158203125, 0.83770751953125, 0.99169921875, 1.14569091796875, 1.2996826171875, 1.45367431640625, 1.607666015625, 1.76165771484375, 1.9156494140625, 2.06964111328125, 2.2236328125, 2.37762451171875, 2.5316162109375, 2.68560791015625, 2.839599609375, 2.99359130859375, 3.1475830078125, 3.30157470703125, 3.45556640625, 3.60955810546875, 3.7635498046875, 3.91754150390625, 4.071533203125, 4.22552490234375, 4.3795166015625, 4.53350830078125, 4.6875]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 3.0, 9.0, 16.0, 15.0, 25.0, 38.0, 58.0, 62.0, 96.0, 166.0, 277.0, 400.0, 564.0, 816.0, 1176.0, 1828.0, 2758.0, 4018.0, 5982.0, 9073.0, 13774.0, 21112.0, 33150.0, 52093.0, 83904.0, 132541.0, 181890.0, 173309.0, 120179.0, 75695.0, 47215.0, 29601.0, 19209.0, 12653.0, 8187.0, 5388.0, 3657.0, 2435.0, 1693.0, 1134.0, 787.0, 471.0, 399.0, 216.0, 154.0, 125.0, 68.0, 49.0, 32.0, 14.0, 19.0, 12.0, 11.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.491455078125, -0.4755439758300781, -0.45963287353515625, -0.4437217712402344, -0.4278106689453125, -0.4118995666503906, -0.39598846435546875, -0.3800773620605469, -0.364166259765625, -0.3482551574707031, -0.33234405517578125, -0.3164329528808594, -0.3005218505859375, -0.2846107482910156, -0.26869964599609375, -0.2527885437011719, -0.23687744140625, -0.22096633911132812, -0.20505523681640625, -0.18914413452148438, -0.1732330322265625, -0.15732192993164062, -0.14141082763671875, -0.12549972534179688, -0.109588623046875, -0.09367752075195312, -0.07776641845703125, -0.061855316162109375, -0.0459442138671875, -0.030033111572265625, -0.01412200927734375, 0.001789093017578125, 0.0177001953125, 0.033611297607421875, 0.04952239990234375, 0.06543350219726562, 0.0813446044921875, 0.09725570678710938, 0.11316680908203125, 0.12907791137695312, 0.144989013671875, 0.16090011596679688, 0.17681121826171875, 0.19272232055664062, 0.2086334228515625, 0.22454452514648438, 0.24045562744140625, 0.2563667297363281, 0.27227783203125, 0.2881889343261719, 0.30410003662109375, 0.3200111389160156, 0.3359222412109375, 0.3518333435058594, 0.36774444580078125, 0.3836555480957031, 0.399566650390625, 0.4154777526855469, 0.43138885498046875, 0.4472999572753906, 0.4632110595703125, 0.4791221618652344, 0.49503326416015625, 0.5109443664550781, 0.52685546875]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 6.0, 7.0, 12.0, 17.0, 16.0, 19.0, 23.0, 20.0, 23.0, 21.0, 26.0, 32.0, 41.0, 32.0, 35.0, 48.0, 51.0, 53.0, 1063.0, 43.0, 51.0, 41.0, 44.0, 20.0, 45.0, 34.0, 38.0, 22.0, 20.0, 21.0, 17.0, 16.0, 17.0, 12.0, 6.0, 11.0, 8.0, 7.0, 7.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.453125, -3.344146728515625, -3.23516845703125, -3.126190185546875, -3.0172119140625, -2.908233642578125, -2.79925537109375, -2.690277099609375, -2.581298828125, -2.472320556640625, -2.36334228515625, -2.254364013671875, -2.1453857421875, -2.036407470703125, -1.92742919921875, -1.818450927734375, -1.70947265625, -1.600494384765625, -1.49151611328125, -1.382537841796875, -1.2735595703125, -1.164581298828125, -1.05560302734375, -0.946624755859375, -0.837646484375, -0.728668212890625, -0.61968994140625, -0.510711669921875, -0.4017333984375, -0.292755126953125, -0.18377685546875, -0.074798583984375, 0.0341796875, 0.143157958984375, 0.25213623046875, 0.361114501953125, 0.4700927734375, 0.579071044921875, 0.68804931640625, 0.797027587890625, 0.906005859375, 1.014984130859375, 1.12396240234375, 1.232940673828125, 1.3419189453125, 1.450897216796875, 1.55987548828125, 1.668853759765625, 1.77783203125, 1.886810302734375, 1.99578857421875, 2.104766845703125, 2.2137451171875, 2.322723388671875, 2.43170166015625, 2.540679931640625, 2.649658203125, 2.758636474609375, 2.86761474609375, 2.976593017578125, 3.0855712890625, 3.194549560546875, 3.30352783203125, 3.412506103515625, 3.521484375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 4.0, 14.0, 18.0, 17.0, 40.0, 48.0, 102.0, 132.0, 229.0, 363.0, 586.0, 939.0, 1574.0, 2737.0, 4522.0, 8306.0, 14920.0, 27737.0, 51879.0, 98144.0, 171215.0, 1274580.0, 190162.0, 115288.0, 61453.0, 32133.0, 17371.0, 9712.0, 5328.0, 3112.0, 1782.0, 1014.0, 608.0, 386.0, 229.0, 167.0, 106.0, 53.0, 42.0, 32.0, 18.0, 15.0, 8.0, 4.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.54638671875, -0.530609130859375, -0.51483154296875, -0.499053955078125, -0.4832763671875, -0.467498779296875, -0.45172119140625, -0.435943603515625, -0.420166015625, -0.404388427734375, -0.38861083984375, -0.372833251953125, -0.3570556640625, -0.341278076171875, -0.32550048828125, -0.309722900390625, -0.2939453125, -0.278167724609375, -0.26239013671875, -0.246612548828125, -0.2308349609375, -0.215057373046875, -0.19927978515625, -0.183502197265625, -0.167724609375, -0.151947021484375, -0.13616943359375, -0.120391845703125, -0.1046142578125, -0.088836669921875, -0.07305908203125, -0.057281494140625, -0.04150390625, -0.025726318359375, -0.00994873046875, 0.005828857421875, 0.0216064453125, 0.037384033203125, 0.05316162109375, 0.068939208984375, 0.084716796875, 0.100494384765625, 0.11627197265625, 0.132049560546875, 0.1478271484375, 0.163604736328125, 0.17938232421875, 0.195159912109375, 0.2109375, 0.226715087890625, 0.24249267578125, 0.258270263671875, 0.2740478515625, 0.289825439453125, 0.30560302734375, 0.321380615234375, 0.337158203125, 0.352935791015625, 0.36871337890625, 0.384490966796875, 0.4002685546875, 0.416046142578125, 0.43182373046875, 0.447601318359375, 0.46337890625]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 3.0, 4.0, 8.0, 6.0, 6.0, 8.0, 9.0, 14.0, 18.0, 27.0, 24.0, 25.0, 32.0, 23.0, 44.0, 39.0, 42.0, 61.0, 51.0, 38.0, 44.0, 52.0, 47.0, 50.0, 38.0, 30.0, 41.0, 38.0, 26.0, 26.0, 24.0, 26.0, 12.0, 17.0, 3.0, 14.0, 8.0, 6.0, 6.0, 4.0, 7.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0009899139404296875, -0.0009552240371704102, -0.0009205341339111328, -0.0008858442306518555, -0.0008511543273925781, -0.0008164644241333008, -0.0007817745208740234, -0.0007470846176147461, -0.0007123947143554688, -0.0006777048110961914, -0.0006430149078369141, -0.0006083250045776367, -0.0005736351013183594, -0.000538945198059082, -0.0005042552947998047, -0.00046956539154052734, -0.00043487548828125, -0.00040018558502197266, -0.0003654956817626953, -0.00033080577850341797, -0.0002961158752441406, -0.0002614259719848633, -0.00022673606872558594, -0.0001920461654663086, -0.00015735626220703125, -0.0001226663589477539, -8.797645568847656e-05, -5.328655242919922e-05, -1.8596649169921875e-05, 1.609325408935547e-05, 5.078315734863281e-05, 8.547306060791016e-05, 0.0001201629638671875, 0.00015485286712646484, 0.0001895427703857422, 0.00022423267364501953, 0.0002589225769042969, 0.0002936124801635742, 0.00032830238342285156, 0.0003629922866821289, 0.00039768218994140625, 0.0004323720932006836, 0.00046706199645996094, 0.0005017518997192383, 0.0005364418029785156, 0.000571131706237793, 0.0006058216094970703, 0.0006405115127563477, 0.000675201416015625, 0.0007098913192749023, 0.0007445812225341797, 0.000779271125793457, 0.0008139610290527344, 0.0008486509323120117, 0.0008833408355712891, 0.0009180307388305664, 0.0009527206420898438, 0.000987410545349121, 0.0010221004486083984, 0.0010567903518676758, 0.0010914802551269531, 0.0011261701583862305, 0.0011608600616455078, 0.0011955499649047852, 0.0012302398681640625]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 5.0, 6.0, 7.0, 16.0, 13.0, 13.0, 23.0, 19.0, 25.0, 41.0, 49.0, 56.0, 75.0, 107.0, 162.0, 296.0, 733.0, 4219.0, 798189.0, 241150.0, 1930.0, 582.0, 275.0, 136.0, 94.0, 60.0, 63.0, 35.0, 47.0, 21.0, 24.0, 18.0, 11.0, 14.0, 11.0, 10.0, 0.0, 6.0, 5.0, 4.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.0264129638671875, -0.025676250457763672, -0.024939537048339844, -0.024202823638916016, -0.023466110229492188, -0.02272939682006836, -0.02199268341064453, -0.021255970001220703, -0.020519256591796875, -0.019782543182373047, -0.01904582977294922, -0.01830911636352539, -0.017572402954101562, -0.016835689544677734, -0.016098976135253906, -0.015362262725830078, -0.01462554931640625, -0.013888835906982422, -0.013152122497558594, -0.012415409088134766, -0.011678695678710938, -0.01094198226928711, -0.010205268859863281, -0.009468555450439453, -0.008731842041015625, -0.007995128631591797, -0.007258415222167969, -0.006521701812744141, -0.0057849884033203125, -0.005048274993896484, -0.004311561584472656, -0.003574848175048828, -0.002838134765625, -0.002101421356201172, -0.0013647079467773438, -0.0006279945373535156, 0.0001087188720703125, 0.0008454322814941406, 0.0015821456909179688, 0.002318859100341797, 0.003055572509765625, 0.003792285919189453, 0.004528999328613281, 0.005265712738037109, 0.0060024261474609375, 0.006739139556884766, 0.007475852966308594, 0.008212566375732422, 0.00894927978515625, 0.009685993194580078, 0.010422706604003906, 0.011159420013427734, 0.011896133422851562, 0.01263284683227539, 0.013369560241699219, 0.014106273651123047, 0.014842987060546875, 0.015579700469970703, 0.01631641387939453, 0.01705312728881836, 0.017789840698242188, 0.018526554107666016, 0.019263267517089844, 0.019999980926513672, 0.0207366943359375]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 7.0, 13.0, 23.0, 60.0, 124.0, 146.0, 195.0, 172.0, 128.0, 84.0, 27.0, 15.0, 8.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.001208073110319674, -0.0011610151268541813, -0.0011139571433886886, -0.0010668991599231958, -0.0010198410600423813, -0.0009727830765768886, -0.0009257250931113958, -0.0008786671096459031, -0.0008316090679727495, -0.0007845510845072567, -0.0007374930428341031, -0.0006904350593686104, -0.0006433770759031177, -0.000596319034229964, -0.0005492610507644713, -0.0005022030090913177, -0.00045514502562582493, -0.00040808701305650175, -0.00036102900048717856, -0.00031397101702168584, -0.00026691300445236266, -0.00021985499188303947, -0.00017279700841754675, -0.00012573899584822357, -7.868098327890038e-05, -3.162297798553482e-05, 1.543502730783075e-05, 6.24930253252387e-05, 0.00010955103789456189, 0.00015660905046388507, 0.0002036670339293778, 0.000250725046498701, 0.000297783175483346, 0.00034484118805266917, 0.00039189920062199235, 0.0004389571840874851, 0.00048601519665680826, 0.0005330732092261314, 0.0005801311926916242, 0.0006271891761571169, 0.0006742472178302705, 0.0007213052012957633, 0.0007683632429689169, 0.0008154212264344096, 0.0008624792098999023, 0.000909537251573056, 0.0009565952350385487, 0.0010036532767117023, 0.001050711260177195, 0.0010977692436426878, 0.0011448272271081805, 0.0011918852105736732, 0.0012389433104544878, 0.0012860012939199805, 0.0013330592773854733, 0.001380117260850966, 0.0014271752443164587, 0.0014742332277819514, 0.0015212912112474442, 0.0015683493111282587, 0.0016154072945937514, 0.0016624652780592442, 0.0017095232615247369, 0.0017565812449902296, 0.0018036393448710442]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 3.0, 4.0, 5.0, 3.0, 12.0, 13.0, 11.0, 23.0, 18.0, 29.0, 22.0, 30.0, 30.0, 28.0, 31.0, 47.0, 38.0, 50.0, 41.0, 37.0, 35.0, 37.0, 35.0, 37.0, 35.0, 46.0, 27.0, 35.0, 33.0, 35.0, 24.0, 21.0, 20.0, 13.0, 18.0, 9.0, 17.0, 15.0, 7.0, 4.0, 3.0, 4.0, 3.0, 3.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000590980052947998, -0.0005714157596230507, -0.0005518514662981033, -0.000532287172973156, -0.0005127228796482086, -0.0004931585863232613, -0.0004735942929983139, -0.00045402999967336655, -0.0004344657063484192, -0.00041490141302347183, -0.0003953371196985245, -0.0003757728263735771, -0.00035620853304862976, -0.0003366442397236824, -0.00031707994639873505, -0.0002975156530737877, -0.00027795135974884033, -0.000258387066423893, -0.00023882277309894562, -0.00021925847977399826, -0.0001996941864490509, -0.00018012989312410355, -0.0001605655997991562, -0.00014100130647420883, -0.00012143701314926147, -0.00010187271982431412, -8.230842649936676e-05, -6.27441331744194e-05, -4.3179839849472046e-05, -2.361554652452469e-05, -4.0512531995773315e-06, 1.5513040125370026e-05, 3.507733345031738e-05, 5.464162677526474e-05, 7.42059201002121e-05, 9.377021342515945e-05, 0.00011333450675010681, 0.00013289880007505417, 0.00015246309340000153, 0.00017202738672494888, 0.00019159168004989624, 0.0002111559733748436, 0.00023072026669979095, 0.0002502845600247383, 0.00026984885334968567, 0.000289413146674633, 0.0003089774399995804, 0.00032854173332452774, 0.0003481060266494751, 0.00036767031997442245, 0.0003872346132993698, 0.00040679890662431717, 0.0004263631999492645, 0.0004459274932742119, 0.00046549178659915924, 0.0004850560799241066, 0.000504620373249054, 0.0005241846665740013, 0.0005437489598989487, 0.000563313253223896, 0.0005828775465488434, 0.0006024418398737907, 0.0006220061331987381, 0.0006415704265236855, 0.0006611347198486328]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 5.0, 4.0, 7.0, 7.0, 12.0, 9.0, 20.0, 13.0, 21.0, 15.0, 28.0, 25.0, 22.0, 23.0, 36.0, 36.0, 41.0, 32.0, 41.0, 40.0, 44.0, 40.0, 40.0, 44.0, 34.0, 31.0, 30.0, 38.0, 32.0, 25.0, 28.0, 25.0, 27.0, 21.0, 19.0, 18.0, 9.0, 10.0, 11.0, 6.0, 9.0, 6.0, 5.0, 2.0, 4.0, 2.0, 4.0, 1.0, 0.0, 2.0, 3.0, 1.0], "bins": [-5.16796875, -5.01397705078125, -4.8599853515625, -4.70599365234375, -4.552001953125, -4.39801025390625, -4.2440185546875, -4.09002685546875, -3.93603515625, -3.78204345703125, -3.6280517578125, -3.47406005859375, -3.320068359375, -3.16607666015625, -3.0120849609375, -2.85809326171875, -2.7041015625, -2.55010986328125, -2.3961181640625, -2.24212646484375, -2.088134765625, -1.93414306640625, -1.7801513671875, -1.62615966796875, -1.47216796875, -1.31817626953125, -1.1641845703125, -1.01019287109375, -0.856201171875, -0.70220947265625, -0.5482177734375, -0.39422607421875, -0.240234375, -0.08624267578125, 0.0677490234375, 0.22174072265625, 0.375732421875, 0.52972412109375, 0.6837158203125, 0.83770751953125, 0.99169921875, 1.14569091796875, 1.2996826171875, 1.45367431640625, 1.607666015625, 1.76165771484375, 1.9156494140625, 2.06964111328125, 2.2236328125, 2.37762451171875, 2.5316162109375, 2.68560791015625, 2.839599609375, 2.99359130859375, 3.1475830078125, 3.30157470703125, 3.45556640625, 3.60955810546875, 3.7635498046875, 3.91754150390625, 4.071533203125, 4.22552490234375, 4.3795166015625, 4.53350830078125, 4.6875]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 7.0, 8.0, 6.0, 16.0, 24.0, 30.0, 43.0, 56.0, 102.0, 148.0, 201.0, 320.0, 543.0, 909.0, 1535.0, 2619.0, 4830.0, 9181.0, 17613.0, 34573.0, 71833.0, 156811.0, 348403.0, 212714.0, 93598.0, 44808.0, 22052.0, 11497.0, 6004.0, 3341.0, 1827.0, 1061.0, 646.0, 416.0, 290.0, 146.0, 98.0, 77.0, 44.0, 38.0, 29.0, 21.0, 9.0, 11.0, 5.0, 8.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.00390625, -3.881378173828125, -3.75885009765625, -3.636322021484375, -3.5137939453125, -3.391265869140625, -3.26873779296875, -3.146209716796875, -3.023681640625, -2.901153564453125, -2.77862548828125, -2.656097412109375, -2.5335693359375, -2.411041259765625, -2.28851318359375, -2.165985107421875, -2.04345703125, -1.920928955078125, -1.79840087890625, -1.675872802734375, -1.5533447265625, -1.430816650390625, -1.30828857421875, -1.185760498046875, -1.063232421875, -0.940704345703125, -0.81817626953125, -0.695648193359375, -0.5731201171875, -0.450592041015625, -0.32806396484375, -0.205535888671875, -0.0830078125, 0.039520263671875, 0.16204833984375, 0.284576416015625, 0.4071044921875, 0.529632568359375, 0.65216064453125, 0.774688720703125, 0.897216796875, 1.019744873046875, 1.14227294921875, 1.264801025390625, 1.3873291015625, 1.509857177734375, 1.63238525390625, 1.754913330078125, 1.87744140625, 1.999969482421875, 2.12249755859375, 2.245025634765625, 2.3675537109375, 2.490081787109375, 2.61260986328125, 2.735137939453125, 2.857666015625, 2.980194091796875, 3.10272216796875, 3.225250244140625, 3.3477783203125, 3.470306396484375, 3.59283447265625, 3.715362548828125, 3.837890625]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 2.0, 2.0, 5.0, 3.0, 7.0, 13.0, 7.0, 13.0, 18.0, 22.0, 19.0, 23.0, 33.0, 28.0, 38.0, 40.0, 33.0, 54.0, 47.0, 68.0, 106.0, 292.0, 1524.0, 162.0, 93.0, 61.0, 45.0, 40.0, 35.0, 32.0, 21.0, 25.0, 22.0, 18.0, 25.0, 15.0, 14.0, 14.0, 9.0, 10.0, 8.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0], "bins": [-19.5625, -18.990478515625, -18.41845703125, -17.846435546875, -17.2744140625, -16.702392578125, -16.13037109375, -15.558349609375, -14.986328125, -14.414306640625, -13.84228515625, -13.270263671875, -12.6982421875, -12.126220703125, -11.55419921875, -10.982177734375, -10.41015625, -9.838134765625, -9.26611328125, -8.694091796875, -8.1220703125, -7.550048828125, -6.97802734375, -6.406005859375, -5.833984375, -5.261962890625, -4.68994140625, -4.117919921875, -3.5458984375, -2.973876953125, -2.40185546875, -1.829833984375, -1.2578125, -0.685791015625, -0.11376953125, 0.458251953125, 1.0302734375, 1.602294921875, 2.17431640625, 2.746337890625, 3.318359375, 3.890380859375, 4.46240234375, 5.034423828125, 5.6064453125, 6.178466796875, 6.75048828125, 7.322509765625, 7.89453125, 8.466552734375, 9.03857421875, 9.610595703125, 10.1826171875, 10.754638671875, 11.32666015625, 11.898681640625, 12.470703125, 13.042724609375, 13.61474609375, 14.186767578125, 14.7587890625, 15.330810546875, 15.90283203125, 16.474853515625, 17.046875]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 7.0, 1.0, 1.0, 6.0, 9.0, 22.0, 42.0, 58.0, 68.0, 116.0, 192.0, 341.0, 743.0, 11755.0, 3127015.0, 3925.0, 627.0, 297.0, 175.0, 106.0, 69.0, 64.0, 25.0, 19.0, 16.0, 6.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.75, -70.275390625, -67.80078125, -65.326171875, -62.8515625, -60.376953125, -57.90234375, -55.427734375, -52.953125, -50.478515625, -48.00390625, -45.529296875, -43.0546875, -40.580078125, -38.10546875, -35.630859375, -33.15625, -30.681640625, -28.20703125, -25.732421875, -23.2578125, -20.783203125, -18.30859375, -15.833984375, -13.359375, -10.884765625, -8.41015625, -5.935546875, -3.4609375, -0.986328125, 1.48828125, 3.962890625, 6.4375, 8.912109375, 11.38671875, 13.861328125, 16.3359375, 18.810546875, 21.28515625, 23.759765625, 26.234375, 28.708984375, 31.18359375, 33.658203125, 36.1328125, 38.607421875, 41.08203125, 43.556640625, 46.03125, 48.505859375, 50.98046875, 53.455078125, 55.9296875, 58.404296875, 60.87890625, 63.353515625, 65.828125, 68.302734375, 70.77734375, 73.251953125, 75.7265625, 78.201171875, 80.67578125, 83.150390625, 85.625]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 12.0, 152.0, 398.0, 355.0, 80.0, 16.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.663169860839844, -44.051605224609375, -41.440040588378906, -38.82847595214844, -36.21691131591797, -33.6053466796875, -30.993785858154297, -28.382221221923828, -25.77065658569336, -23.15909194946289, -20.547527313232422, -17.935964584350586, -15.324399948120117, -12.712835311889648, -10.101271629333496, -7.489707946777344, -4.878143310546875, -2.2665791511535645, 0.3449850082397461, 2.9565491676330566, 5.568113327026367, 8.179677963256836, 10.791241645812988, 13.40280532836914, 16.01436996459961, 18.625934600830078, 21.237499237060547, 23.849061965942383, 26.46062660217285, 29.07219123840332, 31.683753967285156, 34.295318603515625, 36.90687561035156, 39.51844024658203, 42.1300048828125, 44.74156951904297, 47.35313415527344, 49.964698791503906, 52.57625961303711, 55.18782424926758, 57.79938888549805, 60.410953521728516, 63.022518157958984, 65.63407897949219, 68.24564361572266, 70.85720825195312, 73.4687728881836, 76.08033752441406, 78.69190216064453, 81.303466796875, 83.91503143310547, 86.52659606933594, 89.1381607055664, 91.74972534179688, 94.36128997802734, 96.97285461425781, 99.58441162109375, 102.19597625732422, 104.80754089355469, 107.41910552978516, 110.03067016601562, 112.6422348022461, 115.25379943847656, 117.8653564453125, 120.4769287109375]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 11.0, 4.0, 6.0, 12.0, 17.0, 17.0, 38.0, 34.0, 36.0, 23.0, 38.0, 41.0, 52.0, 41.0, 49.0, 53.0, 43.0, 33.0, 39.0, 50.0, 44.0, 55.0, 37.0, 28.0, 33.0, 28.0, 30.0, 15.0, 19.0, 12.0, 13.0, 4.0, 15.0, 10.0, 7.0, 3.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-62.79033660888672, -60.953773498535156, -59.11720657348633, -57.280643463134766, -55.4440803527832, -53.607513427734375, -51.77095031738281, -49.93438720703125, -48.09782409667969, -46.261260986328125, -44.4246940612793, -42.588130950927734, -40.75156784057617, -38.915000915527344, -37.07843780517578, -35.24187469482422, -33.405311584472656, -31.56874656677246, -29.7321834564209, -27.895618438720703, -26.05905532836914, -24.222490310668945, -22.38592529296875, -20.549362182617188, -18.71279525756836, -16.876230239868164, -15.039667129516602, -13.203102111816406, -11.366539001464844, -9.529973983764648, -7.6934099197387695, -5.856845855712891, -4.020282745361328, -2.183718681335449, -0.3471543788909912, 1.4894099235534668, 3.3259739875793457, 5.162538528442383, 6.999102592468262, 8.83566665649414, 10.67223072052002, 12.508794784545898, 14.345358848571777, 16.181922912597656, 18.01848793029785, 19.855052947998047, 21.69161605834961, 23.528179168701172, 25.364744186401367, 27.201309204101562, 29.037872314453125, 30.87443733215332, 32.711002349853516, 34.54756546020508, 36.38412857055664, 38.22069549560547, 40.05725860595703, 41.893821716308594, 43.73038864135742, 45.566951751708984, 47.40351486206055, 49.240081787109375, 51.07664489746094, 52.9132080078125, 54.74977111816406]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 5.0, 4.0, 14.0, 7.0, 8.0, 11.0, 18.0, 18.0, 15.0, 19.0, 28.0, 26.0, 28.0, 35.0, 44.0, 36.0, 28.0, 31.0, 40.0, 48.0, 37.0, 41.0, 45.0, 39.0, 35.0, 33.0, 32.0, 25.0, 40.0, 28.0, 26.0, 26.0, 18.0, 19.0, 20.0, 12.0, 10.0, 7.0, 10.0, 6.0, 6.0, 4.0, 7.0, 1.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-5.3359375, -5.1685791015625, -5.001220703125, -4.8338623046875, -4.66650390625, -4.4991455078125, -4.331787109375, -4.1644287109375, -3.9970703125, -3.8297119140625, -3.662353515625, -3.4949951171875, -3.32763671875, -3.1602783203125, -2.992919921875, -2.8255615234375, -2.658203125, -2.4908447265625, -2.323486328125, -2.1561279296875, -1.98876953125, -1.8214111328125, -1.654052734375, -1.4866943359375, -1.3193359375, -1.1519775390625, -0.984619140625, -0.8172607421875, -0.64990234375, -0.4825439453125, -0.315185546875, -0.1478271484375, 0.01953125, 0.1868896484375, 0.354248046875, 0.5216064453125, 0.68896484375, 0.8563232421875, 1.023681640625, 1.1910400390625, 1.3583984375, 1.5257568359375, 1.693115234375, 1.8604736328125, 2.02783203125, 2.1951904296875, 2.362548828125, 2.5299072265625, 2.697265625, 2.8646240234375, 3.031982421875, 3.1993408203125, 3.36669921875, 3.5340576171875, 3.701416015625, 3.8687744140625, 4.0361328125, 4.2034912109375, 4.370849609375, 4.5382080078125, 4.70556640625, 4.8729248046875, 5.040283203125, 5.2076416015625, 5.375]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 8.0, 6.0, 10.0, 12.0, 9.0, 16.0, 20.0, 19.0, 24.0, 33.0, 25.0, 49.0, 78.0, 149.0, 344.0, 1195.0, 6902.0, 114360.0, 2591100.0, 1431799.0, 43076.0, 3619.0, 769.0, 250.0, 116.0, 56.0, 36.0, 34.0, 23.0, 26.0, 21.0, 14.0, 19.0, 14.0, 8.0, 10.0, 3.0, 5.0, 7.0, 2.0, 4.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-19.328125, -18.721435546875, -18.11474609375, -17.508056640625, -16.9013671875, -16.294677734375, -15.68798828125, -15.081298828125, -14.474609375, -13.867919921875, -13.26123046875, -12.654541015625, -12.0478515625, -11.441162109375, -10.83447265625, -10.227783203125, -9.62109375, -9.014404296875, -8.40771484375, -7.801025390625, -7.1943359375, -6.587646484375, -5.98095703125, -5.374267578125, -4.767578125, -4.160888671875, -3.55419921875, -2.947509765625, -2.3408203125, -1.734130859375, -1.12744140625, -0.520751953125, 0.0859375, 0.692626953125, 1.29931640625, 1.906005859375, 2.5126953125, 3.119384765625, 3.72607421875, 4.332763671875, 4.939453125, 5.546142578125, 6.15283203125, 6.759521484375, 7.3662109375, 7.972900390625, 8.57958984375, 9.186279296875, 9.79296875, 10.399658203125, 11.00634765625, 11.613037109375, 12.2197265625, 12.826416015625, 13.43310546875, 14.039794921875, 14.646484375, 15.253173828125, 15.85986328125, 16.466552734375, 17.0732421875, 17.679931640625, 18.28662109375, 18.893310546875, 19.5]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 7.0, 4.0, 9.0, 15.0, 20.0, 13.0, 24.0, 33.0, 43.0, 55.0, 87.0, 90.0, 140.0, 179.0, 229.0, 276.0, 367.0, 387.0, 379.0, 381.0, 304.0, 237.0, 174.0, 156.0, 94.0, 95.0, 59.0, 54.0, 40.0, 34.0, 30.0, 16.0, 14.0, 9.0, 4.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.296875, -9.966064453125, -9.63525390625, -9.304443359375, -8.9736328125, -8.642822265625, -8.31201171875, -7.981201171875, -7.650390625, -7.319580078125, -6.98876953125, -6.657958984375, -6.3271484375, -5.996337890625, -5.66552734375, -5.334716796875, -5.00390625, -4.673095703125, -4.34228515625, -4.011474609375, -3.6806640625, -3.349853515625, -3.01904296875, -2.688232421875, -2.357421875, -2.026611328125, -1.69580078125, -1.364990234375, -1.0341796875, -0.703369140625, -0.37255859375, -0.041748046875, 0.2890625, 0.619873046875, 0.95068359375, 1.281494140625, 1.6123046875, 1.943115234375, 2.27392578125, 2.604736328125, 2.935546875, 3.266357421875, 3.59716796875, 3.927978515625, 4.2587890625, 4.589599609375, 4.92041015625, 5.251220703125, 5.58203125, 5.912841796875, 6.24365234375, 6.574462890625, 6.9052734375, 7.236083984375, 7.56689453125, 7.897705078125, 8.228515625, 8.559326171875, 8.89013671875, 9.220947265625, 9.5517578125, 9.882568359375, 10.21337890625, 10.544189453125, 10.875]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 0.0, 5.0, 6.0, 4.0, 6.0, 4.0, 11.0, 19.0, 17.0, 34.0, 43.0, 43.0, 53.0, 69.0, 101.0, 103.0, 155.0, 171.0, 232.0, 299.0, 579.0, 2046.0, 45833.0, 3377302.0, 754412.0, 10101.0, 1034.0, 398.0, 268.0, 214.0, 123.0, 110.0, 100.0, 90.0, 58.0, 45.0, 47.0, 38.0, 27.0, 15.0, 12.0, 17.0, 10.0, 13.0, 8.0, 6.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-38.75, -37.603515625, -36.45703125, -35.310546875, -34.1640625, -33.017578125, -31.87109375, -30.724609375, -29.578125, -28.431640625, -27.28515625, -26.138671875, -24.9921875, -23.845703125, -22.69921875, -21.552734375, -20.40625, -19.259765625, -18.11328125, -16.966796875, -15.8203125, -14.673828125, -13.52734375, -12.380859375, -11.234375, -10.087890625, -8.94140625, -7.794921875, -6.6484375, -5.501953125, -4.35546875, -3.208984375, -2.0625, -0.916015625, 0.23046875, 1.376953125, 2.5234375, 3.669921875, 4.81640625, 5.962890625, 7.109375, 8.255859375, 9.40234375, 10.548828125, 11.6953125, 12.841796875, 13.98828125, 15.134765625, 16.28125, 17.427734375, 18.57421875, 19.720703125, 20.8671875, 22.013671875, 23.16015625, 24.306640625, 25.453125, 26.599609375, 27.74609375, 28.892578125, 30.0390625, 31.185546875, 32.33203125, 33.478515625, 34.625]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 17.0, 182.0, 455.0, 311.0, 48.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-266.1879577636719, -259.6512145996094, -253.11444091796875, -246.57769775390625, -240.0409393310547, -233.50418090820312, -226.96742248535156, -220.4306640625, -213.8939208984375, -207.35716247558594, -200.82040405273438, -194.28366088867188, -187.7469024658203, -181.21014404296875, -174.6733856201172, -168.13662719726562, -161.59986877441406, -155.0631103515625, -148.52635192871094, -141.98959350585938, -135.45285034179688, -128.9160919189453, -122.37933349609375, -115.84257507324219, -109.30582427978516, -102.7690658569336, -96.23231506347656, -89.695556640625, -83.15879821777344, -76.6220474243164, -70.08528900146484, -63.54853439331055, -57.01176452636719, -50.47500991821289, -43.938255310058594, -37.40149688720703, -30.864742279052734, -24.327987670898438, -17.791229248046875, -11.254474639892578, -4.717720031738281, 1.819035530090332, 8.355791091918945, 14.892547607421875, 21.429302215576172, 27.96605682373047, 34.50281524658203, 41.03956985473633, 47.576324462890625, 54.11307907104492, 60.64983367919922, 67.18659210205078, 73.72334289550781, 80.26010131835938, 86.79685974121094, 93.3336181640625, 99.87036895751953, 106.4071273803711, 112.94387817382812, 119.48063659667969, 126.01739501953125, 132.55413818359375, 139.09091186523438, 145.62765502929688, 152.16441345214844]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 7.0, 4.0, 11.0, 2.0, 9.0, 12.0, 11.0, 14.0, 20.0, 23.0, 15.0, 24.0, 33.0, 35.0, 32.0, 35.0, 36.0, 33.0, 37.0, 35.0, 33.0, 33.0, 38.0, 49.0, 29.0, 40.0, 30.0, 30.0, 42.0, 33.0, 27.0, 32.0, 23.0, 19.0, 16.0, 16.0, 17.0, 21.0, 10.0, 10.0, 10.0, 2.0, 3.0, 6.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-32.9398193359375, -31.855924606323242, -30.772029876708984, -29.688135147094727, -28.60424041748047, -27.52034568786621, -26.436450958251953, -25.352556228637695, -24.268661499023438, -23.18476676940918, -22.100872039794922, -21.016977310180664, -19.933082580566406, -18.84918785095215, -17.76529312133789, -16.681398391723633, -15.597503662109375, -14.513608932495117, -13.42971420288086, -12.345819473266602, -11.261924743652344, -10.178030014038086, -9.094135284423828, -8.01024055480957, -6.9263458251953125, -5.842451095581055, -4.758556365966797, -3.674661636352539, -2.5907669067382812, -1.5068721771240234, -0.4229774475097656, 0.6609172821044922, 1.74481201171875, 2.828706741333008, 3.9126014709472656, 4.996496200561523, 6.080390930175781, 7.164285659790039, 8.248180389404297, 9.332075119018555, 10.415969848632812, 11.49986457824707, 12.583759307861328, 13.667654037475586, 14.751548767089844, 15.835443496704102, 16.91933822631836, 18.003232955932617, 19.087127685546875, 20.171022415161133, 21.25491714477539, 22.33881187438965, 23.422706604003906, 24.506601333618164, 25.590496063232422, 26.67439079284668, 27.758285522460938, 28.842180252075195, 29.926074981689453, 31.00996971130371, 32.09386444091797, 33.177757263183594, 34.261653900146484, 35.345550537109375, 36.429443359375]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 5.0, 3.0, 4.0, 5.0, 8.0, 13.0, 17.0, 9.0, 17.0, 17.0, 21.0, 21.0, 39.0, 26.0, 21.0, 35.0, 43.0, 41.0, 39.0, 42.0, 48.0, 36.0, 45.0, 34.0, 46.0, 51.0, 37.0, 36.0, 29.0, 25.0, 29.0, 22.0, 26.0, 26.0, 22.0, 13.0, 14.0, 5.0, 7.0, 6.0, 5.0, 5.0, 4.0, 4.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.1875, -5.01373291015625, -4.8399658203125, -4.66619873046875, -4.492431640625, -4.31866455078125, -4.1448974609375, -3.97113037109375, -3.79736328125, -3.62359619140625, -3.4498291015625, -3.27606201171875, -3.102294921875, -2.92852783203125, -2.7547607421875, -2.58099365234375, -2.4072265625, -2.23345947265625, -2.0596923828125, -1.88592529296875, -1.712158203125, -1.53839111328125, -1.3646240234375, -1.19085693359375, -1.01708984375, -0.84332275390625, -0.6695556640625, -0.49578857421875, -0.322021484375, -0.14825439453125, 0.0255126953125, 0.19927978515625, 0.373046875, 0.54681396484375, 0.7205810546875, 0.89434814453125, 1.068115234375, 1.24188232421875, 1.4156494140625, 1.58941650390625, 1.76318359375, 1.93695068359375, 2.1107177734375, 2.28448486328125, 2.458251953125, 2.63201904296875, 2.8057861328125, 2.97955322265625, 3.1533203125, 3.32708740234375, 3.5008544921875, 3.67462158203125, 3.848388671875, 4.02215576171875, 4.1959228515625, 4.36968994140625, 4.54345703125, 4.71722412109375, 4.8909912109375, 5.06475830078125, 5.238525390625, 5.41229248046875, 5.5860595703125, 5.75982666015625, 5.93359375]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 12.0, 10.0, 22.0, 23.0, 32.0, 76.0, 118.0, 136.0, 212.0, 357.0, 509.0, 734.0, 1085.0, 1716.0, 2566.0, 3966.0, 6466.0, 10201.0, 16058.0, 26370.0, 43636.0, 71987.0, 118230.0, 178845.0, 196265.0, 141779.0, 88579.0, 52734.0, 32201.0, 19699.0, 12395.0, 7534.0, 4905.0, 3084.0, 2109.0, 1289.0, 864.0, 582.0, 379.0, 242.0, 168.0, 135.0, 82.0, 62.0, 40.0, 30.0, 11.0, 12.0, 5.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.60791015625, -0.589599609375, -0.5712890625, -0.552978515625, -0.53466796875, -0.516357421875, -0.498046875, -0.479736328125, -0.46142578125, -0.443115234375, -0.4248046875, -0.406494140625, -0.38818359375, -0.369873046875, -0.3515625, -0.333251953125, -0.31494140625, -0.296630859375, -0.2783203125, -0.260009765625, -0.24169921875, -0.223388671875, -0.205078125, -0.186767578125, -0.16845703125, -0.150146484375, -0.1318359375, -0.113525390625, -0.09521484375, -0.076904296875, -0.05859375, -0.040283203125, -0.02197265625, -0.003662109375, 0.0146484375, 0.032958984375, 0.05126953125, 0.069580078125, 0.087890625, 0.106201171875, 0.12451171875, 0.142822265625, 0.1611328125, 0.179443359375, 0.19775390625, 0.216064453125, 0.234375, 0.252685546875, 0.27099609375, 0.289306640625, 0.3076171875, 0.325927734375, 0.34423828125, 0.362548828125, 0.380859375, 0.399169921875, 0.41748046875, 0.435791015625, 0.4541015625, 0.472412109375, 0.49072265625, 0.509033203125, 0.52734375, 0.545654296875, 0.56396484375]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 5.0, 9.0, 7.0, 10.0, 13.0, 17.0, 16.0, 20.0, 24.0, 35.0, 37.0, 39.0, 41.0, 37.0, 60.0, 59.0, 42.0, 1083.0, 60.0, 54.0, 58.0, 44.0, 40.0, 36.0, 25.0, 33.0, 24.0, 21.0, 12.0, 22.0, 17.0, 10.0, 3.0, 11.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.966796875, -3.828643798828125, -3.69049072265625, -3.552337646484375, -3.4141845703125, -3.276031494140625, -3.13787841796875, -2.999725341796875, -2.861572265625, -2.723419189453125, -2.58526611328125, -2.447113037109375, -2.3089599609375, -2.170806884765625, -2.03265380859375, -1.894500732421875, -1.75634765625, -1.618194580078125, -1.48004150390625, -1.341888427734375, -1.2037353515625, -1.065582275390625, -0.92742919921875, -0.789276123046875, -0.651123046875, -0.512969970703125, -0.37481689453125, -0.236663818359375, -0.0985107421875, 0.039642333984375, 0.17779541015625, 0.315948486328125, 0.4541015625, 0.592254638671875, 0.73040771484375, 0.868560791015625, 1.0067138671875, 1.144866943359375, 1.28302001953125, 1.421173095703125, 1.559326171875, 1.697479248046875, 1.83563232421875, 1.973785400390625, 2.1119384765625, 2.250091552734375, 2.38824462890625, 2.526397705078125, 2.66455078125, 2.802703857421875, 2.94085693359375, 3.079010009765625, 3.2171630859375, 3.355316162109375, 3.49346923828125, 3.631622314453125, 3.769775390625, 3.907928466796875, 4.04608154296875, 4.184234619140625, 4.3223876953125, 4.460540771484375, 4.59869384765625, 4.736846923828125, 4.875]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 3.0, 6.0, 15.0, 17.0, 28.0, 54.0, 63.0, 83.0, 153.0, 233.0, 349.0, 511.0, 787.0, 1240.0, 1900.0, 3017.0, 4819.0, 7949.0, 13199.0, 21750.0, 37568.0, 64881.0, 109205.0, 168257.0, 1248974.0, 161056.0, 102894.0, 60427.0, 34760.0, 20695.0, 12102.0, 7580.0, 4587.0, 2909.0, 1778.0, 1170.0, 725.0, 464.0, 292.0, 206.0, 145.0, 85.0, 56.0, 39.0, 37.0, 23.0, 17.0, 7.0, 6.0, 5.0, 2.0, 3.0, 1.0, 4.0, 1.0, 0.0, 2.0], "bins": [-0.449462890625, -0.4351654052734375, -0.420867919921875, -0.4065704345703125, -0.39227294921875, -0.3779754638671875, -0.363677978515625, -0.3493804931640625, -0.3350830078125, -0.3207855224609375, -0.306488037109375, -0.2921905517578125, -0.27789306640625, -0.2635955810546875, -0.249298095703125, -0.2350006103515625, -0.220703125, -0.2064056396484375, -0.192108154296875, -0.1778106689453125, -0.16351318359375, -0.1492156982421875, -0.134918212890625, -0.1206207275390625, -0.1063232421875, -0.0920257568359375, -0.077728271484375, -0.0634307861328125, -0.04913330078125, -0.0348358154296875, -0.020538330078125, -0.0062408447265625, 0.008056640625, 0.0223541259765625, 0.036651611328125, 0.0509490966796875, 0.06524658203125, 0.0795440673828125, 0.093841552734375, 0.1081390380859375, 0.1224365234375, 0.1367340087890625, 0.151031494140625, 0.1653289794921875, 0.17962646484375, 0.1939239501953125, 0.208221435546875, 0.2225189208984375, 0.23681640625, 0.2511138916015625, 0.265411376953125, 0.2797088623046875, 0.29400634765625, 0.3083038330078125, 0.322601318359375, 0.3368988037109375, 0.3511962890625, 0.3654937744140625, 0.379791259765625, 0.3940887451171875, 0.40838623046875, 0.4226837158203125, 0.436981201171875, 0.4512786865234375, 0.465576171875]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 7.0, 9.0, 9.0, 8.0, 7.0, 13.0, 18.0, 24.0, 21.0, 20.0, 36.0, 27.0, 34.0, 40.0, 60.0, 52.0, 39.0, 56.0, 48.0, 65.0, 44.0, 54.0, 43.0, 43.0, 34.0, 38.0, 27.0, 24.0, 22.0, 16.0, 16.0, 13.0, 8.0, 3.0, 7.0, 3.0, 6.0, 0.0, 3.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014190673828125, -0.0013776421546936035, -0.001336216926574707, -0.0012947916984558105, -0.001253366470336914, -0.0012119412422180176, -0.001170516014099121, -0.0011290907859802246, -0.0010876655578613281, -0.0010462403297424316, -0.0010048151016235352, -0.0009633898735046387, -0.0009219646453857422, -0.0008805394172668457, -0.0008391141891479492, -0.0007976889610290527, -0.0007562637329101562, -0.0007148385047912598, -0.0006734132766723633, -0.0006319880485534668, -0.0005905628204345703, -0.0005491375923156738, -0.0005077123641967773, -0.00046628713607788086, -0.0004248619079589844, -0.0003834366798400879, -0.0003420114517211914, -0.0003005862236022949, -0.00025916099548339844, -0.00021773576736450195, -0.00017631053924560547, -0.00013488531112670898, -9.34600830078125e-05, -5.2034854888916016e-05, -1.0609626770019531e-05, 3.081560134887695e-05, 7.224082946777344e-05, 0.00011366605758666992, 0.0001550912857055664, 0.0001965165138244629, 0.00023794174194335938, 0.00027936697006225586, 0.00032079219818115234, 0.00036221742630004883, 0.0004036426544189453, 0.0004450678825378418, 0.0004864931106567383, 0.0005279183387756348, 0.0005693435668945312, 0.0006107687950134277, 0.0006521940231323242, 0.0006936192512512207, 0.0007350444793701172, 0.0007764697074890137, 0.0008178949356079102, 0.0008593201637268066, 0.0009007453918457031, 0.0009421706199645996, 0.000983595848083496, 0.0010250210762023926, 0.001066446304321289, 0.0011078715324401855, 0.001149296760559082, 0.0011907219886779785, 0.001232147216796875]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 3.0, 4.0, 0.0, 3.0, 8.0, 5.0, 8.0, 14.0, 16.0, 14.0, 25.0, 25.0, 34.0, 45.0, 44.0, 64.0, 102.0, 168.0, 298.0, 762.0, 8681.0, 1004566.0, 31722.0, 959.0, 361.0, 156.0, 116.0, 68.0, 56.0, 60.0, 34.0, 32.0, 23.0, 25.0, 15.0, 4.0, 11.0, 7.0, 6.0, 3.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0263214111328125, -0.025432348251342773, -0.024543285369873047, -0.02365422248840332, -0.022765159606933594, -0.021876096725463867, -0.02098703384399414, -0.020097970962524414, -0.019208908081054688, -0.01831984519958496, -0.017430782318115234, -0.016541719436645508, -0.01565265655517578, -0.014763593673706055, -0.013874530792236328, -0.012985467910766602, -0.012096405029296875, -0.011207342147827148, -0.010318279266357422, -0.009429216384887695, -0.008540153503417969, -0.007651090621948242, -0.006762027740478516, -0.005872964859008789, -0.0049839019775390625, -0.004094839096069336, -0.0032057762145996094, -0.002316713333129883, -0.0014276504516601562, -0.0005385875701904297, 0.0003504753112792969, 0.0012395381927490234, 0.00212860107421875, 0.0030176639556884766, 0.003906726837158203, 0.00479578971862793, 0.005684852600097656, 0.006573915481567383, 0.007462978363037109, 0.008352041244506836, 0.009241104125976562, 0.010130167007446289, 0.011019229888916016, 0.011908292770385742, 0.012797355651855469, 0.013686418533325195, 0.014575481414794922, 0.015464544296264648, 0.016353607177734375, 0.0172426700592041, 0.018131732940673828, 0.019020795822143555, 0.01990985870361328, 0.020798921585083008, 0.021687984466552734, 0.02257704734802246, 0.023466110229492188, 0.024355173110961914, 0.02524423599243164, 0.026133298873901367, 0.027022361755371094, 0.02791142463684082, 0.028800487518310547, 0.029689550399780273, 0.03057861328125]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 43.0, 242.0, 519.0, 175.0, 29.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005974913015961647, -0.005827170796692371, -0.005679429043084383, -0.005531686823815107, -0.005383944604545832, -0.005236202850937843, -0.005088460631668568, -0.004940718412399292, -0.004792976193130016, -0.004645233973860741, -0.004497492220252752, -0.004349750000983477, -0.004202007781714201, -0.004054266028106213, -0.003906523808836937, -0.0037587815895676613, -0.003611039835959673, -0.003463297849521041, -0.0033155556302517653, -0.0031678136438131332, -0.0030200714245438576, -0.0028723294381052256, -0.0027245874516665936, -0.002576845232397318, -0.002429103245958686, -0.002281361259520054, -0.002133619040250778, -0.001985877053812146, -0.0018381349509581923, -0.0016903928481042385, -0.0015426508616656065, -0.0013949087588116527, -0.0012471671216189861, -0.0010994250187650323, -0.0009516829741187394, -0.0008039409294724464, -0.0006561988266184926, -0.0005084567237645388, -0.00036071467911824584, -0.00021297263447195292, -6.523053161799908e-05, 8.25115421321243e-05, 0.00023025361588224769, 0.00037799568963237107, 0.0005257377633824944, 0.0006734798662364483, 0.0008212219108827412, 0.0009689639555290341, 0.001116706058382988, 0.0012644481612369418, 0.0014121902640908957, 0.0015599322505295277, 0.0017076743533834815, 0.0018554164562374353, 0.0020031584426760674, 0.002150900661945343, 0.002298642648383975, 0.002446384634822607, 0.0025941268540918827, 0.0027418688405305147, 0.0028896108269691467, 0.0030373530462384224, 0.0031850950326770544, 0.0033328370191156864, 0.003480579238384962]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 2.0, 6.0, 5.0, 7.0, 11.0, 7.0, 14.0, 9.0, 17.0, 22.0, 11.0, 16.0, 17.0, 19.0, 29.0, 21.0, 30.0, 34.0, 28.0, 44.0, 30.0, 42.0, 45.0, 47.0, 31.0, 47.0, 36.0, 20.0, 36.0, 43.0, 39.0, 20.0, 27.0, 20.0, 17.0, 10.0, 21.0, 13.0, 18.0, 14.0, 13.0, 14.0, 11.0, 6.0, 10.0, 6.0, 3.0, 4.0, 2.0, 5.0, 4.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.0006487369537353516, -0.0006285011768341064, -0.0006082653999328613, -0.0005880296230316162, -0.0005677938461303711, -0.000547558069229126, -0.0005273222923278809, -0.0005070865154266357, -0.0004868507385253906, -0.0004666149616241455, -0.0004463791847229004, -0.0004261434078216553, -0.00040590763092041016, -0.00038567185401916504, -0.0003654360771179199, -0.0003452003002166748, -0.0003249645233154297, -0.00030472874641418457, -0.00028449296951293945, -0.00026425719261169434, -0.00024402141571044922, -0.0002237856388092041, -0.00020354986190795898, -0.00018331408500671387, -0.00016307830810546875, -0.00014284253120422363, -0.00012260675430297852, -0.0001023709774017334, -8.213520050048828e-05, -6.189942359924316e-05, -4.166364669799805e-05, -2.142786979675293e-05, -1.1920928955078125e-06, 1.9043684005737305e-05, 3.927946090698242e-05, 5.951523780822754e-05, 7.975101470947266e-05, 9.998679161071777e-05, 0.00012022256851196289, 0.000140458345413208, 0.00016069412231445312, 0.00018092989921569824, 0.00020116567611694336, 0.00022140145301818848, 0.0002416372299194336, 0.0002618730068206787, 0.00028210878372192383, 0.00030234456062316895, 0.00032258033752441406, 0.0003428161144256592, 0.0003630518913269043, 0.0003832876682281494, 0.00040352344512939453, 0.00042375922203063965, 0.00044399499893188477, 0.0004642307758331299, 0.000484466552734375, 0.0005047023296356201, 0.0005249381065368652, 0.0005451738834381104, 0.0005654096603393555, 0.0005856454372406006, 0.0006058812141418457, 0.0006261169910430908, 0.0006463527679443359]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 5.0, 3.0, 4.0, 5.0, 7.0, 14.0, 17.0, 9.0, 17.0, 17.0, 21.0, 21.0, 39.0, 26.0, 21.0, 35.0, 43.0, 41.0, 39.0, 42.0, 48.0, 36.0, 45.0, 34.0, 46.0, 51.0, 37.0, 36.0, 29.0, 25.0, 29.0, 22.0, 26.0, 26.0, 22.0, 13.0, 14.0, 5.0, 7.0, 6.0, 5.0, 5.0, 4.0, 4.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.1875, -5.01373291015625, -4.8399658203125, -4.66619873046875, -4.492431640625, -4.31866455078125, -4.1448974609375, -3.97113037109375, -3.79736328125, -3.62359619140625, -3.4498291015625, -3.27606201171875, -3.102294921875, -2.92852783203125, -2.7547607421875, -2.58099365234375, -2.4072265625, -2.23345947265625, -2.0596923828125, -1.88592529296875, -1.712158203125, -1.53839111328125, -1.3646240234375, -1.19085693359375, -1.01708984375, -0.84332275390625, -0.6695556640625, -0.49578857421875, -0.322021484375, -0.14825439453125, 0.0255126953125, 0.19927978515625, 0.373046875, 0.54681396484375, 0.7205810546875, 0.89434814453125, 1.068115234375, 1.24188232421875, 1.4156494140625, 1.58941650390625, 1.76318359375, 1.93695068359375, 2.1107177734375, 2.28448486328125, 2.458251953125, 2.63201904296875, 2.8057861328125, 2.97955322265625, 3.1533203125, 3.32708740234375, 3.5008544921875, 3.67462158203125, 3.848388671875, 4.02215576171875, 4.1959228515625, 4.36968994140625, 4.54345703125, 4.71722412109375, 4.8909912109375, 5.06475830078125, 5.238525390625, 5.41229248046875, 5.5860595703125, 5.75982666015625, 5.93359375]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 3.0, 7.0, 13.0, 12.0, 22.0, 29.0, 47.0, 65.0, 104.0, 180.0, 242.0, 412.0, 669.0, 1108.0, 1879.0, 3377.0, 6690.0, 14267.0, 32613.0, 85138.0, 259348.0, 410895.0, 140871.0, 50002.0, 20394.0, 9419.0, 4557.0, 2483.0, 1441.0, 842.0, 478.0, 345.0, 213.0, 133.0, 94.0, 56.0, 38.0, 18.0, 18.0, 15.0, 9.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.41796875, -5.2684326171875, -5.118896484375, -4.9693603515625, -4.81982421875, -4.6702880859375, -4.520751953125, -4.3712158203125, -4.2216796875, -4.0721435546875, -3.922607421875, -3.7730712890625, -3.62353515625, -3.4739990234375, -3.324462890625, -3.1749267578125, -3.025390625, -2.8758544921875, -2.726318359375, -2.5767822265625, -2.42724609375, -2.2777099609375, -2.128173828125, -1.9786376953125, -1.8291015625, -1.6795654296875, -1.530029296875, -1.3804931640625, -1.23095703125, -1.0814208984375, -0.931884765625, -0.7823486328125, -0.6328125, -0.4832763671875, -0.333740234375, -0.1842041015625, -0.03466796875, 0.1148681640625, 0.264404296875, 0.4139404296875, 0.5634765625, 0.7130126953125, 0.862548828125, 1.0120849609375, 1.16162109375, 1.3111572265625, 1.460693359375, 1.6102294921875, 1.759765625, 1.9093017578125, 2.058837890625, 2.2083740234375, 2.35791015625, 2.5074462890625, 2.656982421875, 2.8065185546875, 2.9560546875, 3.1055908203125, 3.255126953125, 3.4046630859375, 3.55419921875, 3.7037353515625, 3.853271484375, 4.0028076171875, 4.15234375]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 5.0, 3.0, 4.0, 6.0, 4.0, 9.0, 9.0, 10.0, 15.0, 17.0, 22.0, 22.0, 27.0, 36.0, 29.0, 38.0, 40.0, 39.0, 35.0, 53.0, 119.0, 356.0, 1525.0, 141.0, 77.0, 62.0, 49.0, 38.0, 44.0, 33.0, 39.0, 27.0, 26.0, 17.0, 12.0, 16.0, 10.0, 7.0, 8.0, 2.0, 3.0, 6.0, 4.0, 1.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-21.71875, -21.099853515625, -20.48095703125, -19.862060546875, -19.2431640625, -18.624267578125, -18.00537109375, -17.386474609375, -16.767578125, -16.148681640625, -15.52978515625, -14.910888671875, -14.2919921875, -13.673095703125, -13.05419921875, -12.435302734375, -11.81640625, -11.197509765625, -10.57861328125, -9.959716796875, -9.3408203125, -8.721923828125, -8.10302734375, -7.484130859375, -6.865234375, -6.246337890625, -5.62744140625, -5.008544921875, -4.3896484375, -3.770751953125, -3.15185546875, -2.532958984375, -1.9140625, -1.295166015625, -0.67626953125, -0.057373046875, 0.5615234375, 1.180419921875, 1.79931640625, 2.418212890625, 3.037109375, 3.656005859375, 4.27490234375, 4.893798828125, 5.5126953125, 6.131591796875, 6.75048828125, 7.369384765625, 7.98828125, 8.607177734375, 9.22607421875, 9.844970703125, 10.4638671875, 11.082763671875, 11.70166015625, 12.320556640625, 12.939453125, 13.558349609375, 14.17724609375, 14.796142578125, 15.4150390625, 16.033935546875, 16.65283203125, 17.271728515625, 17.890625]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 5.0, 11.0, 10.0, 12.0, 13.0, 23.0, 41.0, 59.0, 77.0, 138.0, 165.0, 252.0, 433.0, 905.0, 25391.0, 3110114.0, 6305.0, 608.0, 333.0, 253.0, 159.0, 130.0, 68.0, 53.0, 37.0, 33.0, 18.0, 16.0, 18.0, 10.0, 7.0, 1.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-67.1875, -65.173828125, -63.16015625, -61.146484375, -59.1328125, -57.119140625, -55.10546875, -53.091796875, -51.078125, -49.064453125, -47.05078125, -45.037109375, -43.0234375, -41.009765625, -38.99609375, -36.982421875, -34.96875, -32.955078125, -30.94140625, -28.927734375, -26.9140625, -24.900390625, -22.88671875, -20.873046875, -18.859375, -16.845703125, -14.83203125, -12.818359375, -10.8046875, -8.791015625, -6.77734375, -4.763671875, -2.75, -0.736328125, 1.27734375, 3.291015625, 5.3046875, 7.318359375, 9.33203125, 11.345703125, 13.359375, 15.373046875, 17.38671875, 19.400390625, 21.4140625, 23.427734375, 25.44140625, 27.455078125, 29.46875, 31.482421875, 33.49609375, 35.509765625, 37.5234375, 39.537109375, 41.55078125, 43.564453125, 45.578125, 47.591796875, 49.60546875, 51.619140625, 53.6328125, 55.646484375, 57.66015625, 59.673828125, 61.6875]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 19.0, 134.0, 450.0, 313.0, 88.0, 11.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-148.3781280517578, -145.7188720703125, -143.0596160888672, -140.40037536621094, -137.74111938476562, -135.0818634033203, -132.422607421875, -129.7633514404297, -127.1041030883789, -124.4448471069336, -121.78559875488281, -119.1263427734375, -116.46709442138672, -113.8078384399414, -111.14859008789062, -108.48933410644531, -105.830078125, -103.17082214355469, -100.5115737915039, -97.8523178100586, -95.19306945800781, -92.5338134765625, -89.87455749511719, -87.2153091430664, -84.55606079101562, -81.89680480957031, -79.23755645751953, -76.57830047607422, -73.91905212402344, -71.25979614257812, -68.60054016113281, -65.94129180908203, -63.28203582763672, -60.62278366088867, -57.963531494140625, -55.30427551269531, -52.645023345947266, -49.98577117919922, -47.32651901245117, -44.667266845703125, -42.00801086425781, -39.348758697509766, -36.68950653076172, -34.030250549316406, -31.37099838256836, -28.711746215820312, -26.052494049072266, -23.393239974975586, -20.733989715576172, -18.074737548828125, -15.415483474731445, -12.756231307983398, -10.096978187561035, -7.437725067138672, -4.778472900390625, -2.1192188262939453, 0.5400333404541016, 3.1992862224578857, 5.85853910446167, 8.517791748046875, 11.177044868469238, 13.836297988891602, 16.49555015563965, 19.154804229736328, 21.814056396484375]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 1.0, 7.0, 8.0, 3.0, 5.0, 7.0, 8.0, 13.0, 13.0, 23.0, 17.0, 22.0, 25.0, 23.0, 21.0, 21.0, 27.0, 31.0, 23.0, 30.0, 32.0, 42.0, 42.0, 37.0, 46.0, 31.0, 38.0, 28.0, 44.0, 34.0, 35.0, 37.0, 30.0, 21.0, 27.0, 22.0, 23.0, 24.0, 20.0, 12.0, 12.0, 6.0, 5.0, 4.0, 6.0, 6.0, 2.0, 5.0, 2.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.33206558227539, -47.75941467285156, -46.18675994873047, -44.61410903930664, -43.04145812988281, -41.46880340576172, -39.89615249633789, -38.32350158691406, -36.75084686279297, -35.17819595336914, -33.60554122924805, -32.03289031982422, -30.460237503051758, -28.887584686279297, -27.31493377685547, -25.742280960083008, -24.169628143310547, -22.596975326538086, -21.024322509765625, -19.451671600341797, -17.879018783569336, -16.306365966796875, -14.73371410369873, -13.161062240600586, -11.588409423828125, -10.015756607055664, -8.44310474395752, -6.870452404022217, -5.297800064086914, -3.7251477241516113, -2.1524953842163086, -0.5798435211181641, 0.9928092956542969, 2.5654616355895996, 4.138113975524902, 5.710766315460205, 7.283418655395508, 8.856071472167969, 10.428723335266113, 12.001375198364258, 13.574028015136719, 15.14668083190918, 16.71933364868164, 18.29198455810547, 19.86463737487793, 21.43729019165039, 23.00994110107422, 24.58259391784668, 26.15524673461914, 27.7278995513916, 29.300552368164062, 30.87320327758789, 32.44585418701172, 34.01850891113281, 35.59115982055664, 37.16381072998047, 38.73646545410156, 40.30911636352539, 41.881771087646484, 43.45442199707031, 45.027076721191406, 46.599727630615234, 48.17237854003906, 49.745033264160156, 51.317684173583984]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 7.0, 11.0, 10.0, 6.0, 13.0, 19.0, 13.0, 16.0, 15.0, 23.0, 20.0, 33.0, 32.0, 35.0, 40.0, 31.0, 44.0, 44.0, 34.0, 42.0, 41.0, 50.0, 37.0, 41.0, 31.0, 38.0, 32.0, 28.0, 27.0, 34.0, 21.0, 21.0, 26.0, 21.0, 11.0, 10.0, 8.0, 10.0, 4.0, 5.0, 7.0, 3.0, 2.0, 2.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.078125, -4.8988037109375, -4.719482421875, -4.5401611328125, -4.36083984375, -4.1815185546875, -4.002197265625, -3.8228759765625, -3.6435546875, -3.4642333984375, -3.284912109375, -3.1055908203125, -2.92626953125, -2.7469482421875, -2.567626953125, -2.3883056640625, -2.208984375, -2.0296630859375, -1.850341796875, -1.6710205078125, -1.49169921875, -1.3123779296875, -1.133056640625, -0.9537353515625, -0.7744140625, -0.5950927734375, -0.415771484375, -0.2364501953125, -0.05712890625, 0.1221923828125, 0.301513671875, 0.4808349609375, 0.66015625, 0.8394775390625, 1.018798828125, 1.1981201171875, 1.37744140625, 1.5567626953125, 1.736083984375, 1.9154052734375, 2.0947265625, 2.2740478515625, 2.453369140625, 2.6326904296875, 2.81201171875, 2.9913330078125, 3.170654296875, 3.3499755859375, 3.529296875, 3.7086181640625, 3.887939453125, 4.0672607421875, 4.24658203125, 4.4259033203125, 4.605224609375, 4.7845458984375, 4.9638671875, 5.1431884765625, 5.322509765625, 5.5018310546875, 5.68115234375, 5.8604736328125, 6.039794921875, 6.2191162109375, 6.3984375]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 5.0, 7.0, 14.0, 9.0, 14.0, 11.0, 15.0, 22.0, 23.0, 35.0, 63.0, 82.0, 138.0, 264.0, 562.0, 1700.0, 8602.0, 87350.0, 1346825.0, 2476472.0, 249408.0, 18166.0, 2871.0, 769.0, 337.0, 176.0, 79.0, 60.0, 36.0, 34.0, 30.0, 27.0, 12.0, 14.0, 11.0, 6.0, 7.0, 5.0, 7.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3046875, -11.8348388671875, -11.364990234375, -10.8951416015625, -10.42529296875, -9.9554443359375, -9.485595703125, -9.0157470703125, -8.5458984375, -8.0760498046875, -7.606201171875, -7.1363525390625, -6.66650390625, -6.1966552734375, -5.726806640625, -5.2569580078125, -4.787109375, -4.3172607421875, -3.847412109375, -3.3775634765625, -2.90771484375, -2.4378662109375, -1.968017578125, -1.4981689453125, -1.0283203125, -0.5584716796875, -0.088623046875, 0.3812255859375, 0.85107421875, 1.3209228515625, 1.790771484375, 2.2606201171875, 2.73046875, 3.2003173828125, 3.670166015625, 4.1400146484375, 4.60986328125, 5.0797119140625, 5.549560546875, 6.0194091796875, 6.4892578125, 6.9591064453125, 7.428955078125, 7.8988037109375, 8.36865234375, 8.8385009765625, 9.308349609375, 9.7781982421875, 10.248046875, 10.7178955078125, 11.187744140625, 11.6575927734375, 12.12744140625, 12.5972900390625, 13.067138671875, 13.5369873046875, 14.0068359375, 14.4766845703125, 14.946533203125, 15.4163818359375, 15.88623046875, 16.3560791015625, 16.825927734375, 17.2957763671875, 17.765625]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 8.0, 6.0, 12.0, 16.0, 22.0, 31.0, 39.0, 61.0, 99.0, 140.0, 204.0, 290.0, 401.0, 509.0, 565.0, 438.0, 375.0, 270.0, 169.0, 124.0, 79.0, 78.0, 38.0, 40.0, 18.0, 13.0, 11.0, 7.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.421875, -14.971435546875, -14.52099609375, -14.070556640625, -13.6201171875, -13.169677734375, -12.71923828125, -12.268798828125, -11.818359375, -11.367919921875, -10.91748046875, -10.467041015625, -10.0166015625, -9.566162109375, -9.11572265625, -8.665283203125, -8.21484375, -7.764404296875, -7.31396484375, -6.863525390625, -6.4130859375, -5.962646484375, -5.51220703125, -5.061767578125, -4.611328125, -4.160888671875, -3.71044921875, -3.260009765625, -2.8095703125, -2.359130859375, -1.90869140625, -1.458251953125, -1.0078125, -0.557373046875, -0.10693359375, 0.343505859375, 0.7939453125, 1.244384765625, 1.69482421875, 2.145263671875, 2.595703125, 3.046142578125, 3.49658203125, 3.947021484375, 4.3974609375, 4.847900390625, 5.29833984375, 5.748779296875, 6.19921875, 6.649658203125, 7.10009765625, 7.550537109375, 8.0009765625, 8.451416015625, 8.90185546875, 9.352294921875, 9.802734375, 10.253173828125, 10.70361328125, 11.154052734375, 11.6044921875, 12.054931640625, 12.50537109375, 12.955810546875, 13.40625]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 7.0, 4.0, 9.0, 7.0, 15.0, 24.0, 28.0, 34.0, 50.0, 78.0, 109.0, 150.0, 189.0, 228.0, 416.0, 908.0, 10629.0, 3589451.0, 587536.0, 2688.0, 614.0, 334.0, 232.0, 142.0, 104.0, 83.0, 58.0, 46.0, 36.0, 20.0, 18.0, 17.0, 13.0, 6.0, 2.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.9375, -46.2744140625, -44.611328125, -42.9482421875, -41.28515625, -39.6220703125, -37.958984375, -36.2958984375, -34.6328125, -32.9697265625, -31.306640625, -29.6435546875, -27.98046875, -26.3173828125, -24.654296875, -22.9912109375, -21.328125, -19.6650390625, -18.001953125, -16.3388671875, -14.67578125, -13.0126953125, -11.349609375, -9.6865234375, -8.0234375, -6.3603515625, -4.697265625, -3.0341796875, -1.37109375, 0.2919921875, 1.955078125, 3.6181640625, 5.28125, 6.9443359375, 8.607421875, 10.2705078125, 11.93359375, 13.5966796875, 15.259765625, 16.9228515625, 18.5859375, 20.2490234375, 21.912109375, 23.5751953125, 25.23828125, 26.9013671875, 28.564453125, 30.2275390625, 31.890625, 33.5537109375, 35.216796875, 36.8798828125, 38.54296875, 40.2060546875, 41.869140625, 43.5322265625, 45.1953125, 46.8583984375, 48.521484375, 50.1845703125, 51.84765625, 53.5107421875, 55.173828125, 56.8369140625, 58.5]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 9.0, 11.0, 33.0, 39.0, 64.0, 102.0, 135.0, 146.0, 162.0, 108.0, 81.0, 52.0, 29.0, 24.0, 10.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.32976150512695, -58.35004806518555, -56.37033462524414, -54.39061737060547, -52.41090393066406, -50.431190490722656, -48.45147705078125, -46.471763610839844, -44.49205017089844, -42.51233673095703, -40.532623291015625, -38.55290985107422, -36.57319259643555, -34.59347915649414, -32.613765716552734, -30.634052276611328, -28.654335021972656, -26.67462158203125, -24.69490623474121, -22.715192794799805, -20.735477447509766, -18.75576400756836, -16.776050567626953, -14.79633617401123, -12.816621780395508, -10.836907386779785, -8.857192993164062, -6.877479553222656, -4.897765159606934, -2.918050765991211, -0.9383373260498047, 1.041377067565918, 3.021087646484375, 5.000802040100098, 6.980515956878662, 8.960229873657227, 10.93994426727295, 12.919658660888672, 14.899372100830078, 16.879085540771484, 18.858800888061523, 20.83851432800293, 22.81822967529297, 24.797943115234375, 26.77765655517578, 28.75737190246582, 30.737085342407227, 32.716800689697266, 34.69651412963867, 36.67622756958008, 38.655941009521484, 40.635658264160156, 42.61537170410156, 44.59508514404297, 46.574798583984375, 48.55451202392578, 50.53422546386719, 52.513938903808594, 54.49365234375, 56.473365783691406, 58.45308303833008, 60.432796478271484, 62.41250991821289, 64.39222717285156, 66.37194061279297]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 1.0, 0.0, 4.0, 2.0, 4.0, 3.0, 7.0, 11.0, 5.0, 2.0, 10.0, 15.0, 11.0, 12.0, 23.0, 11.0, 23.0, 20.0, 19.0, 27.0, 34.0, 25.0, 42.0, 30.0, 36.0, 44.0, 40.0, 38.0, 36.0, 38.0, 45.0, 36.0, 25.0, 31.0, 26.0, 31.0, 25.0, 25.0, 31.0, 21.0, 18.0, 25.0, 19.0, 17.0, 12.0, 8.0, 7.0, 6.0, 13.0, 4.0, 2.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-35.90130615234375, -34.78737258911133, -33.673439025878906, -32.559505462646484, -31.445571899414062, -30.33163833618164, -29.21770477294922, -28.103771209716797, -26.989837646484375, -25.875904083251953, -24.76197052001953, -23.64803695678711, -22.534103393554688, -21.420169830322266, -20.306236267089844, -19.192302703857422, -18.078369140625, -16.964435577392578, -15.850502014160156, -14.736568450927734, -13.622634887695312, -12.50870132446289, -11.394767761230469, -10.280834197998047, -9.166900634765625, -8.052967071533203, -6.939033508300781, -5.825099945068359, -4.7111663818359375, -3.5972328186035156, -2.4832992553710938, -1.3693656921386719, -0.25543212890625, 0.8585014343261719, 1.9724349975585938, 3.0863685607910156, 4.2003021240234375, 5.314235687255859, 6.428169250488281, 7.542102813720703, 8.656036376953125, 9.769969940185547, 10.883903503417969, 11.99783706665039, 13.111770629882812, 14.225704193115234, 15.339637756347656, 16.453571319580078, 17.5675048828125, 18.681438446044922, 19.795372009277344, 20.909305572509766, 22.023239135742188, 23.13717269897461, 24.25110626220703, 25.365039825439453, 26.478973388671875, 27.592906951904297, 28.70684051513672, 29.82077407836914, 30.934707641601562, 32.048641204833984, 33.162574768066406, 34.27650833129883, 35.39044189453125]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 6.0, 6.0, 9.0, 10.0, 10.0, 18.0, 15.0, 21.0, 21.0, 16.0, 30.0, 33.0, 39.0, 43.0, 36.0, 44.0, 55.0, 31.0, 48.0, 47.0, 43.0, 43.0, 44.0, 38.0, 37.0, 33.0, 29.0, 31.0, 30.0, 25.0, 15.0, 18.0, 11.0, 17.0, 15.0, 10.0, 3.0, 3.0, 4.0, 6.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-6.37890625, -6.19329833984375, -6.0076904296875, -5.82208251953125, -5.636474609375, -5.45086669921875, -5.2652587890625, -5.07965087890625, -4.89404296875, -4.70843505859375, -4.5228271484375, -4.33721923828125, -4.151611328125, -3.96600341796875, -3.7803955078125, -3.59478759765625, -3.4091796875, -3.22357177734375, -3.0379638671875, -2.85235595703125, -2.666748046875, -2.48114013671875, -2.2955322265625, -2.10992431640625, -1.92431640625, -1.73870849609375, -1.5531005859375, -1.36749267578125, -1.181884765625, -0.99627685546875, -0.8106689453125, -0.62506103515625, -0.439453125, -0.25384521484375, -0.0682373046875, 0.11737060546875, 0.302978515625, 0.48858642578125, 0.6741943359375, 0.85980224609375, 1.04541015625, 1.23101806640625, 1.4166259765625, 1.60223388671875, 1.787841796875, 1.97344970703125, 2.1590576171875, 2.34466552734375, 2.5302734375, 2.71588134765625, 2.9014892578125, 3.08709716796875, 3.272705078125, 3.45831298828125, 3.6439208984375, 3.82952880859375, 4.01513671875, 4.20074462890625, 4.3863525390625, 4.57196044921875, 4.757568359375, 4.94317626953125, 5.1287841796875, 5.31439208984375, 5.5]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 4.0, 5.0, 8.0, 7.0, 18.0, 14.0, 42.0, 66.0, 116.0, 168.0, 269.0, 430.0, 648.0, 971.0, 1514.0, 2467.0, 3804.0, 6185.0, 10030.0, 15820.0, 25661.0, 43923.0, 74875.0, 131944.0, 198994.0, 201282.0, 135523.0, 78297.0, 45254.0, 26740.0, 16071.0, 10125.0, 6244.0, 4081.0, 2633.0, 1603.0, 959.0, 641.0, 385.0, 260.0, 176.0, 96.0, 60.0, 47.0, 36.0, 27.0, 14.0, 7.0, 8.0, 9.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.64990234375, -0.6302261352539062, -0.6105499267578125, -0.5908737182617188, -0.571197509765625, -0.5515213012695312, -0.5318450927734375, -0.5121688842773438, -0.49249267578125, -0.47281646728515625, -0.4531402587890625, -0.43346405029296875, -0.413787841796875, -0.39411163330078125, -0.3744354248046875, -0.35475921630859375, -0.3350830078125, -0.31540679931640625, -0.2957305908203125, -0.27605438232421875, -0.256378173828125, -0.23670196533203125, -0.2170257568359375, -0.19734954833984375, -0.17767333984375, -0.15799713134765625, -0.1383209228515625, -0.11864471435546875, -0.098968505859375, -0.07929229736328125, -0.0596160888671875, -0.03993988037109375, -0.020263671875, -0.00058746337890625, 0.0190887451171875, 0.03876495361328125, 0.058441162109375, 0.07811737060546875, 0.0977935791015625, 0.11746978759765625, 0.13714599609375, 0.15682220458984375, 0.1764984130859375, 0.19617462158203125, 0.215850830078125, 0.23552703857421875, 0.2552032470703125, 0.27487945556640625, 0.2945556640625, 0.31423187255859375, 0.3339080810546875, 0.35358428955078125, 0.373260498046875, 0.39293670654296875, 0.4126129150390625, 0.43228912353515625, 0.45196533203125, 0.47164154052734375, 0.4913177490234375, 0.5109939575195312, 0.530670166015625, 0.5503463745117188, 0.5700225830078125, 0.5896987915039062, 0.609375]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 9.0, 3.0, 6.0, 7.0, 11.0, 10.0, 16.0, 9.0, 17.0, 17.0, 19.0, 20.0, 25.0, 33.0, 25.0, 35.0, 36.0, 44.0, 40.0, 37.0, 46.0, 1071.0, 42.0, 35.0, 41.0, 37.0, 46.0, 52.0, 26.0, 34.0, 31.0, 17.0, 19.0, 28.0, 19.0, 16.0, 11.0, 11.0, 8.0, 6.0, 5.0, 1.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.486328125, -3.373321533203125, -3.26031494140625, -3.147308349609375, -3.0343017578125, -2.921295166015625, -2.80828857421875, -2.695281982421875, -2.582275390625, -2.469268798828125, -2.35626220703125, -2.243255615234375, -2.1302490234375, -2.017242431640625, -1.90423583984375, -1.791229248046875, -1.67822265625, -1.565216064453125, -1.45220947265625, -1.339202880859375, -1.2261962890625, -1.113189697265625, -1.00018310546875, -0.887176513671875, -0.774169921875, -0.661163330078125, -0.54815673828125, -0.435150146484375, -0.3221435546875, -0.209136962890625, -0.09613037109375, 0.016876220703125, 0.1298828125, 0.242889404296875, 0.35589599609375, 0.468902587890625, 0.5819091796875, 0.694915771484375, 0.80792236328125, 0.920928955078125, 1.033935546875, 1.146942138671875, 1.25994873046875, 1.372955322265625, 1.4859619140625, 1.598968505859375, 1.71197509765625, 1.824981689453125, 1.93798828125, 2.050994873046875, 2.16400146484375, 2.277008056640625, 2.3900146484375, 2.503021240234375, 2.61602783203125, 2.729034423828125, 2.842041015625, 2.955047607421875, 3.06805419921875, 3.181060791015625, 3.2940673828125, 3.407073974609375, 3.52008056640625, 3.633087158203125, 3.74609375]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 9.0, 16.0, 9.0, 16.0, 31.0, 52.0, 60.0, 100.0, 180.0, 237.0, 379.0, 581.0, 926.0, 1429.0, 2287.0, 3602.0, 5656.0, 8895.0, 14733.0, 23058.0, 37627.0, 61702.0, 99101.0, 146528.0, 1223456.0, 159896.0, 115149.0, 72915.0, 44636.0, 27867.0, 16938.0, 10620.0, 6588.0, 4341.0, 2742.0, 1651.0, 1107.0, 699.0, 438.0, 287.0, 214.0, 126.0, 89.0, 57.0, 34.0, 22.0, 17.0, 15.0, 3.0, 7.0, 3.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.414306640625, -0.4012260437011719, -0.38814544677734375, -0.3750648498535156, -0.3619842529296875, -0.3489036560058594, -0.33582305908203125, -0.3227424621582031, -0.309661865234375, -0.2965812683105469, -0.28350067138671875, -0.2704200744628906, -0.2573394775390625, -0.24425888061523438, -0.23117828369140625, -0.21809768676757812, -0.20501708984375, -0.19193649291992188, -0.17885589599609375, -0.16577529907226562, -0.1526947021484375, -0.13961410522460938, -0.12653350830078125, -0.11345291137695312, -0.100372314453125, -0.08729171752929688, -0.07421112060546875, -0.061130523681640625, -0.0480499267578125, -0.034969329833984375, -0.02188873291015625, -0.008808135986328125, 0.0042724609375, 0.017353057861328125, 0.03043365478515625, 0.043514251708984375, 0.0565948486328125, 0.06967544555664062, 0.08275604248046875, 0.09583663940429688, 0.108917236328125, 0.12199783325195312, 0.13507843017578125, 0.14815902709960938, 0.1612396240234375, 0.17432022094726562, 0.18740081787109375, 0.20048141479492188, 0.21356201171875, 0.22664260864257812, 0.23972320556640625, 0.2528038024902344, 0.2658843994140625, 0.2789649963378906, 0.29204559326171875, 0.3051261901855469, 0.318206787109375, 0.3312873840332031, 0.34436798095703125, 0.3574485778808594, 0.3705291748046875, 0.3836097717285156, 0.39669036865234375, 0.4097709655761719, 0.4228515625]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 6.0, 6.0, 2.0, 2.0, 5.0, 8.0, 11.0, 13.0, 18.0, 10.0, 20.0, 17.0, 22.0, 26.0, 49.0, 51.0, 39.0, 43.0, 48.0, 53.0, 54.0, 53.0, 53.0, 60.0, 47.0, 30.0, 54.0, 37.0, 37.0, 34.0, 20.0, 16.0, 6.0, 8.0, 11.0, 8.0, 5.0, 8.0, 3.0, 0.0, 1.0, 0.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0014600753784179688, -0.0014127492904663086, -0.0013654232025146484, -0.0013180971145629883, -0.0012707710266113281, -0.001223444938659668, -0.0011761188507080078, -0.0011287927627563477, -0.0010814666748046875, -0.0010341405868530273, -0.0009868144989013672, -0.000939488410949707, -0.0008921623229980469, -0.0008448362350463867, -0.0007975101470947266, -0.0007501840591430664, -0.0007028579711914062, -0.0006555318832397461, -0.0006082057952880859, -0.0005608797073364258, -0.0005135536193847656, -0.00046622753143310547, -0.0004189014434814453, -0.00037157535552978516, -0.000324249267578125, -0.00027692317962646484, -0.0002295970916748047, -0.00018227100372314453, -0.00013494491577148438, -8.761882781982422e-05, -4.029273986816406e-05, 7.033348083496094e-06, 5.435943603515625e-05, 0.0001016855239868164, 0.00014901161193847656, 0.00019633769989013672, 0.00024366378784179688, 0.00029098987579345703, 0.0003383159637451172, 0.00038564205169677734, 0.0004329681396484375, 0.00048029422760009766, 0.0005276203155517578, 0.000574946403503418, 0.0006222724914550781, 0.0006695985794067383, 0.0007169246673583984, 0.0007642507553100586, 0.0008115768432617188, 0.0008589029312133789, 0.0009062290191650391, 0.0009535551071166992, 0.0010008811950683594, 0.0010482072830200195, 0.0010955333709716797, 0.0011428594589233398, 0.001190185546875, 0.0012375116348266602, 0.0012848377227783203, 0.0013321638107299805, 0.0013794898986816406, 0.0014268159866333008, 0.001474142074584961, 0.001521468162536621, 0.0015687942504882812]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 5.0, 4.0, 3.0, 3.0, 8.0, 2.0, 9.0, 11.0, 6.0, 9.0, 13.0, 19.0, 8.0, 42.0, 44.0, 42.0, 45.0, 82.0, 93.0, 143.0, 190.0, 377.0, 1198.0, 39938.0, 990443.0, 13855.0, 887.0, 347.0, 186.0, 115.0, 84.0, 62.0, 42.0, 55.0, 26.0, 24.0, 18.0, 16.0, 15.0, 24.0, 18.0, 8.0, 9.0, 9.0, 3.0, 6.0, 2.0, 4.0, 1.0, 4.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0], "bins": [-0.0280609130859375, -0.027194976806640625, -0.02632904052734375, -0.025463104248046875, -0.02459716796875, -0.023731231689453125, -0.02286529541015625, -0.021999359130859375, -0.0211334228515625, -0.020267486572265625, -0.01940155029296875, -0.018535614013671875, -0.017669677734375, -0.016803741455078125, -0.01593780517578125, -0.015071868896484375, -0.0142059326171875, -0.013339996337890625, -0.01247406005859375, -0.011608123779296875, -0.0107421875, -0.009876251220703125, -0.00901031494140625, -0.008144378662109375, -0.0072784423828125, -0.006412506103515625, -0.00554656982421875, -0.004680633544921875, -0.003814697265625, -0.002948760986328125, -0.00208282470703125, -0.001216888427734375, -0.0003509521484375, 0.000514984130859375, 0.00138092041015625, 0.002246856689453125, 0.00311279296875, 0.003978729248046875, 0.00484466552734375, 0.005710601806640625, 0.0065765380859375, 0.007442474365234375, 0.00830841064453125, 0.009174346923828125, 0.010040283203125, 0.010906219482421875, 0.01177215576171875, 0.012638092041015625, 0.0135040283203125, 0.014369964599609375, 0.01523590087890625, 0.016101837158203125, 0.0169677734375, 0.017833709716796875, 0.01869964599609375, 0.019565582275390625, 0.0204315185546875, 0.021297454833984375, 0.02216339111328125, 0.023029327392578125, 0.023895263671875, 0.024761199951171875, 0.02562713623046875, 0.026493072509765625, 0.0273590087890625]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 5.0, 189.0, 690.0, 123.0, 6.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0016015776200219989, -0.0013522914377972484, -0.0011030053719878197, -0.0008537191897630692, -0.0006044330075383186, -0.0003551468253135681, -0.00010586075950413942, 0.0001434254227206111, 0.0003927116049453616, 0.0006419977871701121, 0.0008912839111872017, 0.0011405700352042913, 0.0013898562174290419, 0.0016391423996537924, 0.001888428465463221, 0.0021377145312726498, 0.0023870007134974003, 0.002636286895722151, 0.0028855730779469013, 0.003134859260171652, 0.0033841454423964024, 0.003633431624621153, 0.0038827175740152597, 0.004132003523409367, 0.0043812901712954044, 0.004630576353520155, 0.0048798625357449055, 0.005129148717969656, 0.0053784349001944065, 0.005627721082419157, 0.00587700679898262, 0.006126292981207371, 0.006375580094754696, 0.006624866276979446, 0.006874152459204197, 0.0071234386414289474, 0.007372724823653698, 0.0076220110058784485, 0.007871297188103199, 0.00812058337032795, 0.0083698695525527, 0.00861915573477745, 0.008868441917002201, 0.009117728099226952, 0.009367014281451702, 0.009616300463676453, 0.009865586645901203, 0.010114872828125954, 0.01036415807902813, 0.01061344426125288, 0.01086273044347763, 0.011112016625702381, 0.011361302807927132, 0.011610588990151882, 0.011859875172376633, 0.012109161354601383, 0.012358447536826134, 0.012607733719050884, 0.012857019901275635, 0.013106306083500385, 0.013355592265725136, 0.013604878447949886, 0.013854164630174637, 0.014103450812399387, 0.014352736994624138]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 7.0, 1.0, 8.0, 5.0, 10.0, 18.0, 15.0, 18.0, 19.0, 16.0, 28.0, 28.0, 22.0, 31.0, 28.0, 32.0, 43.0, 30.0, 44.0, 47.0, 46.0, 32.0, 35.0, 37.0, 26.0, 40.0, 48.0, 31.0, 32.0, 29.0, 27.0, 23.0, 16.0, 21.0, 13.0, 22.0, 15.0, 14.0, 7.0, 9.0, 6.0, 12.0, 2.0, 4.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0008257627487182617, -0.0008004559203982353, -0.0007751490920782089, -0.0007498422637581825, -0.0007245354354381561, -0.0006992286071181297, -0.0006739217787981033, -0.0006486149504780769, -0.0006233081221580505, -0.0005980012938380241, -0.0005726944655179977, -0.0005473876371979713, -0.000522080808877945, -0.0004967739805579185, -0.00047146715223789215, -0.00044616032391786575, -0.00042085349559783936, -0.00039554666727781296, -0.00037023983895778656, -0.00034493301063776016, -0.00031962618231773376, -0.00029431935399770737, -0.00026901252567768097, -0.00024370569735765457, -0.00021839886903762817, -0.00019309204071760178, -0.00016778521239757538, -0.00014247838407754898, -0.00011717155575752258, -9.186472743749619e-05, -6.655789911746979e-05, -4.125107079744339e-05, -1.5944242477416992e-05, 9.362585842609406e-06, 3.46694141626358e-05, 5.99762424826622e-05, 8.52830708026886e-05, 0.000110589899122715, 0.0001358967274427414, 0.0001612035557627678, 0.0001865103840827942, 0.0002118172124028206, 0.00023712404072284698, 0.0002624308690428734, 0.0002877376973628998, 0.0003130445256829262, 0.0003383513540029526, 0.000363658182322979, 0.00038896501064300537, 0.00041427183896303177, 0.00043957866728305817, 0.00046488549560308456, 0.000490192323923111, 0.0005154991522431374, 0.0005408059805631638, 0.0005661128088831902, 0.0005914196372032166, 0.000616726465523243, 0.0006420332938432693, 0.0006673401221632957, 0.0006926469504833221, 0.0007179537788033485, 0.0007432606071233749, 0.0007685674354434013, 0.0007938742637634277]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 6.0, 6.0, 9.0, 10.0, 10.0, 18.0, 15.0, 21.0, 21.0, 16.0, 30.0, 33.0, 39.0, 42.0, 37.0, 44.0, 55.0, 31.0, 48.0, 46.0, 44.0, 43.0, 44.0, 38.0, 37.0, 33.0, 29.0, 31.0, 30.0, 25.0, 15.0, 18.0, 11.0, 17.0, 15.0, 10.0, 3.0, 3.0, 4.0, 6.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-6.37890625, -6.19329833984375, -6.0076904296875, -5.82208251953125, -5.636474609375, -5.45086669921875, -5.2652587890625, -5.07965087890625, -4.89404296875, -4.70843505859375, -4.5228271484375, -4.33721923828125, -4.151611328125, -3.96600341796875, -3.7803955078125, -3.59478759765625, -3.4091796875, -3.22357177734375, -3.0379638671875, -2.85235595703125, -2.666748046875, -2.48114013671875, -2.2955322265625, -2.10992431640625, -1.92431640625, -1.73870849609375, -1.5531005859375, -1.36749267578125, -1.181884765625, -0.99627685546875, -0.8106689453125, -0.62506103515625, -0.439453125, -0.25384521484375, -0.0682373046875, 0.11737060546875, 0.302978515625, 0.48858642578125, 0.6741943359375, 0.85980224609375, 1.04541015625, 1.23101806640625, 1.4166259765625, 1.60223388671875, 1.787841796875, 1.97344970703125, 2.1590576171875, 2.34466552734375, 2.5302734375, 2.71588134765625, 2.9014892578125, 3.08709716796875, 3.272705078125, 3.45831298828125, 3.6439208984375, 3.82952880859375, 4.01513671875, 4.20074462890625, 4.3863525390625, 4.57196044921875, 4.757568359375, 4.94317626953125, 5.1287841796875, 5.31439208984375, 5.5]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 5.0, 7.0, 5.0, 11.0, 15.0, 16.0, 21.0, 24.0, 42.0, 50.0, 85.0, 130.0, 215.0, 360.0, 648.0, 1269.0, 2455.0, 5580.0, 14137.0, 46979.0, 190790.0, 537777.0, 179607.0, 44225.0, 13539.0, 5296.0, 2459.0, 1218.0, 638.0, 342.0, 211.0, 138.0, 57.0, 57.0, 32.0, 32.0, 21.0, 24.0, 11.0, 5.0, 7.0, 7.0, 6.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-6.22265625, -6.04217529296875, -5.8616943359375, -5.68121337890625, -5.500732421875, -5.32025146484375, -5.1397705078125, -4.95928955078125, -4.77880859375, -4.59832763671875, -4.4178466796875, -4.23736572265625, -4.056884765625, -3.87640380859375, -3.6959228515625, -3.51544189453125, -3.3349609375, -3.15447998046875, -2.9739990234375, -2.79351806640625, -2.613037109375, -2.43255615234375, -2.2520751953125, -2.07159423828125, -1.89111328125, -1.71063232421875, -1.5301513671875, -1.34967041015625, -1.169189453125, -0.98870849609375, -0.8082275390625, -0.62774658203125, -0.447265625, -0.26678466796875, -0.0863037109375, 0.09417724609375, 0.274658203125, 0.45513916015625, 0.6356201171875, 0.81610107421875, 0.99658203125, 1.17706298828125, 1.3575439453125, 1.53802490234375, 1.718505859375, 1.89898681640625, 2.0794677734375, 2.25994873046875, 2.4404296875, 2.62091064453125, 2.8013916015625, 2.98187255859375, 3.162353515625, 3.34283447265625, 3.5233154296875, 3.70379638671875, 3.88427734375, 4.06475830078125, 4.2452392578125, 4.42572021484375, 4.606201171875, 4.78668212890625, 4.9671630859375, 5.14764404296875, 5.328125]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 7.0, 8.0, 8.0, 4.0, 13.0, 17.0, 12.0, 20.0, 18.0, 19.0, 20.0, 33.0, 40.0, 43.0, 32.0, 45.0, 54.0, 93.0, 325.0, 1627.0, 153.0, 58.0, 47.0, 46.0, 47.0, 40.0, 35.0, 25.0, 24.0, 25.0, 23.0, 16.0, 16.0, 13.0, 11.0, 14.0, 12.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-20.0625, -19.419921875, -18.77734375, -18.134765625, -17.4921875, -16.849609375, -16.20703125, -15.564453125, -14.921875, -14.279296875, -13.63671875, -12.994140625, -12.3515625, -11.708984375, -11.06640625, -10.423828125, -9.78125, -9.138671875, -8.49609375, -7.853515625, -7.2109375, -6.568359375, -5.92578125, -5.283203125, -4.640625, -3.998046875, -3.35546875, -2.712890625, -2.0703125, -1.427734375, -0.78515625, -0.142578125, 0.5, 1.142578125, 1.78515625, 2.427734375, 3.0703125, 3.712890625, 4.35546875, 4.998046875, 5.640625, 6.283203125, 6.92578125, 7.568359375, 8.2109375, 8.853515625, 9.49609375, 10.138671875, 10.78125, 11.423828125, 12.06640625, 12.708984375, 13.3515625, 13.994140625, 14.63671875, 15.279296875, 15.921875, 16.564453125, 17.20703125, 17.849609375, 18.4921875, 19.134765625, 19.77734375, 20.419921875, 21.0625]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 4.0, 6.0, 5.0, 24.0, 14.0, 18.0, 31.0, 27.0, 55.0, 61.0, 103.0, 143.0, 214.0, 315.0, 508.0, 1852.0, 126176.0, 3010266.0, 4156.0, 673.0, 317.0, 228.0, 150.0, 99.0, 69.0, 36.0, 40.0, 22.0, 30.0, 16.0, 11.0, 11.0, 9.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-55.0, -53.28955078125, -51.5791015625, -49.86865234375, -48.158203125, -46.44775390625, -44.7373046875, -43.02685546875, -41.31640625, -39.60595703125, -37.8955078125, -36.18505859375, -34.474609375, -32.76416015625, -31.0537109375, -29.34326171875, -27.6328125, -25.92236328125, -24.2119140625, -22.50146484375, -20.791015625, -19.08056640625, -17.3701171875, -15.65966796875, -13.94921875, -12.23876953125, -10.5283203125, -8.81787109375, -7.107421875, -5.39697265625, -3.6865234375, -1.97607421875, -0.265625, 1.44482421875, 3.1552734375, 4.86572265625, 6.576171875, 8.28662109375, 9.9970703125, 11.70751953125, 13.41796875, 15.12841796875, 16.8388671875, 18.54931640625, 20.259765625, 21.97021484375, 23.6806640625, 25.39111328125, 27.1015625, 28.81201171875, 30.5224609375, 32.23291015625, 33.943359375, 35.65380859375, 37.3642578125, 39.07470703125, 40.78515625, 42.49560546875, 44.2060546875, 45.91650390625, 47.626953125, 49.33740234375, 51.0478515625, 52.75830078125, 54.46875]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 103.0, 756.0, 157.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-207.90377807617188, -204.0189971923828, -200.1342010498047, -196.24942016601562, -192.36463928222656, -188.4798583984375, -184.59506225585938, -180.7102813720703, -176.82550048828125, -172.9407196044922, -169.05592346191406, -165.171142578125, -161.28636169433594, -157.40158081054688, -153.51678466796875, -149.6320037841797, -145.74722290039062, -141.86244201660156, -137.97764587402344, -134.09286499023438, -130.2080841064453, -126.32329559326172, -122.43850708007812, -118.55372619628906, -114.66893005371094, -110.78414154052734, -106.89936065673828, -103.01457214355469, -99.12979125976562, -95.24500274658203, -91.36021423339844, -87.47543334960938, -83.59065246582031, -79.70586395263672, -75.82108306884766, -71.93629455566406, -68.051513671875, -64.1667251586914, -60.28194046020508, -56.39715576171875, -52.51237106323242, -48.627586364746094, -44.742801666259766, -40.85801696777344, -36.973228454589844, -33.08844757080078, -29.203659057617188, -25.31887435913086, -21.43408966064453, -17.549304962158203, -13.664519309997559, -9.779733657836914, -5.894948959350586, -2.010164260864258, 1.8746223449707031, 5.759407043457031, 9.64419174194336, 13.528976440429688, 17.413761138916016, 21.298547744750977, 25.183332443237305, 29.068117141723633, 32.952903747558594, 36.83768844604492, 40.72247314453125]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 12.0, 8.0, 14.0, 15.0, 23.0, 15.0, 22.0, 31.0, 37.0, 28.0, 22.0, 44.0, 32.0, 32.0, 48.0, 47.0, 53.0, 38.0, 43.0, 49.0, 45.0, 44.0, 44.0, 43.0, 32.0, 36.0, 18.0, 20.0, 13.0, 15.0, 14.0, 14.0, 4.0, 11.0, 6.0, 8.0, 3.0, 4.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-57.84894943237305, -56.14171600341797, -54.43448257446289, -52.72724914550781, -51.02001953125, -49.31278610229492, -47.605552673339844, -45.898319244384766, -44.19108581542969, -42.48385238647461, -40.77661895751953, -39.06938934326172, -37.36215591430664, -35.65492248535156, -33.947689056396484, -32.240455627441406, -30.533226013183594, -28.825992584228516, -27.11876106262207, -25.411527633666992, -23.704296112060547, -21.99706268310547, -20.28982925415039, -18.582595825195312, -16.875364303588867, -15.168131828308105, -13.460899353027344, -11.753665924072266, -10.046433448791504, -8.339200973510742, -6.631967544555664, -4.924735069274902, -3.2175064086914062, -1.5102736949920654, 0.1969590187072754, 1.9041919708251953, 3.611424446105957, 5.318656921386719, 7.025890350341797, 8.733122825622559, 10.44035530090332, 12.147587776184082, 13.854820251464844, 15.562053680419922, 17.269287109375, 18.976518630981445, 20.683752059936523, 22.39098358154297, 24.098217010498047, 25.805450439453125, 27.51268196105957, 29.21991539001465, 30.927146911621094, 32.63438034057617, 34.34161376953125, 36.04884719848633, 37.756080627441406, 39.463314056396484, 41.17054748535156, 42.877777099609375, 44.58501052856445, 46.29224395751953, 47.99947738647461, 49.70671081542969, 51.4139404296875]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 7.0, 5.0, 10.0, 18.0, 15.0, 13.0, 11.0, 19.0, 27.0, 23.0, 31.0, 52.0, 36.0, 42.0, 35.0, 48.0, 42.0, 48.0, 54.0, 43.0, 34.0, 41.0, 46.0, 41.0, 30.0, 34.0, 19.0, 26.0, 18.0, 24.0, 20.0, 15.0, 17.0, 12.0, 5.0, 11.0, 7.0, 7.0, 5.0, 1.0, 2.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.2109375, -6.019775390625, -5.82861328125, -5.637451171875, -5.4462890625, -5.255126953125, -5.06396484375, -4.872802734375, -4.681640625, -4.490478515625, -4.29931640625, -4.108154296875, -3.9169921875, -3.725830078125, -3.53466796875, -3.343505859375, -3.15234375, -2.961181640625, -2.77001953125, -2.578857421875, -2.3876953125, -2.196533203125, -2.00537109375, -1.814208984375, -1.623046875, -1.431884765625, -1.24072265625, -1.049560546875, -0.8583984375, -0.667236328125, -0.47607421875, -0.284912109375, -0.09375, 0.097412109375, 0.28857421875, 0.479736328125, 0.6708984375, 0.862060546875, 1.05322265625, 1.244384765625, 1.435546875, 1.626708984375, 1.81787109375, 2.009033203125, 2.2001953125, 2.391357421875, 2.58251953125, 2.773681640625, 2.96484375, 3.156005859375, 3.34716796875, 3.538330078125, 3.7294921875, 3.920654296875, 4.11181640625, 4.302978515625, 4.494140625, 4.685302734375, 4.87646484375, 5.067626953125, 5.2587890625, 5.449951171875, 5.64111328125, 5.832275390625, 6.0234375]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 5.0, 4.0, 11.0, 4.0, 14.0, 16.0, 21.0, 25.0, 21.0, 35.0, 50.0, 62.0, 71.0, 87.0, 138.0, 244.0, 472.0, 1233.0, 5151.0, 44448.0, 736769.0, 2841649.0, 525699.0, 31761.0, 4076.0, 1028.0, 419.0, 203.0, 126.0, 90.0, 68.0, 54.0, 49.0, 44.0, 22.0, 30.0, 16.0, 15.0, 17.0, 11.0, 9.0, 7.0, 2.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-15.7890625, -15.31689453125, -14.8447265625, -14.37255859375, -13.900390625, -13.42822265625, -12.9560546875, -12.48388671875, -12.01171875, -11.53955078125, -11.0673828125, -10.59521484375, -10.123046875, -9.65087890625, -9.1787109375, -8.70654296875, -8.234375, -7.76220703125, -7.2900390625, -6.81787109375, -6.345703125, -5.87353515625, -5.4013671875, -4.92919921875, -4.45703125, -3.98486328125, -3.5126953125, -3.04052734375, -2.568359375, -2.09619140625, -1.6240234375, -1.15185546875, -0.6796875, -0.20751953125, 0.2646484375, 0.73681640625, 1.208984375, 1.68115234375, 2.1533203125, 2.62548828125, 3.09765625, 3.56982421875, 4.0419921875, 4.51416015625, 4.986328125, 5.45849609375, 5.9306640625, 6.40283203125, 6.875, 7.34716796875, 7.8193359375, 8.29150390625, 8.763671875, 9.23583984375, 9.7080078125, 10.18017578125, 10.65234375, 11.12451171875, 11.5966796875, 12.06884765625, 12.541015625, 13.01318359375, 13.4853515625, 13.95751953125, 14.4296875]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 3.0, 6.0, 6.0, 4.0, 12.0, 17.0, 27.0, 42.0, 41.0, 57.0, 75.0, 127.0, 171.0, 206.0, 315.0, 405.0, 508.0, 478.0, 435.0, 330.0, 219.0, 178.0, 126.0, 96.0, 54.0, 48.0, 33.0, 17.0, 14.0, 13.0, 6.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.0703125, -12.67529296875, -12.2802734375, -11.88525390625, -11.490234375, -11.09521484375, -10.7001953125, -10.30517578125, -9.91015625, -9.51513671875, -9.1201171875, -8.72509765625, -8.330078125, -7.93505859375, -7.5400390625, -7.14501953125, -6.75, -6.35498046875, -5.9599609375, -5.56494140625, -5.169921875, -4.77490234375, -4.3798828125, -3.98486328125, -3.58984375, -3.19482421875, -2.7998046875, -2.40478515625, -2.009765625, -1.61474609375, -1.2197265625, -0.82470703125, -0.4296875, -0.03466796875, 0.3603515625, 0.75537109375, 1.150390625, 1.54541015625, 1.9404296875, 2.33544921875, 2.73046875, 3.12548828125, 3.5205078125, 3.91552734375, 4.310546875, 4.70556640625, 5.1005859375, 5.49560546875, 5.890625, 6.28564453125, 6.6806640625, 7.07568359375, 7.470703125, 7.86572265625, 8.2607421875, 8.65576171875, 9.05078125, 9.44580078125, 9.8408203125, 10.23583984375, 10.630859375, 11.02587890625, 11.4208984375, 11.81591796875, 12.2109375]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 5.0, 3.0, 5.0, 11.0, 24.0, 40.0, 61.0, 90.0, 118.0, 185.0, 248.0, 335.0, 592.0, 6994.0, 4024997.0, 158139.0, 1025.0, 447.0, 302.0, 206.0, 142.0, 92.0, 77.0, 42.0, 40.0, 22.0, 13.0, 11.0, 5.0, 8.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-69.4375, -67.3154296875, -65.193359375, -63.0712890625, -60.94921875, -58.8271484375, -56.705078125, -54.5830078125, -52.4609375, -50.3388671875, -48.216796875, -46.0947265625, -43.97265625, -41.8505859375, -39.728515625, -37.6064453125, -35.484375, -33.3623046875, -31.240234375, -29.1181640625, -26.99609375, -24.8740234375, -22.751953125, -20.6298828125, -18.5078125, -16.3857421875, -14.263671875, -12.1416015625, -10.01953125, -7.8974609375, -5.775390625, -3.6533203125, -1.53125, 0.5908203125, 2.712890625, 4.8349609375, 6.95703125, 9.0791015625, 11.201171875, 13.3232421875, 15.4453125, 17.5673828125, 19.689453125, 21.8115234375, 23.93359375, 26.0556640625, 28.177734375, 30.2998046875, 32.421875, 34.5439453125, 36.666015625, 38.7880859375, 40.91015625, 43.0322265625, 45.154296875, 47.2763671875, 49.3984375, 51.5205078125, 53.642578125, 55.7646484375, 57.88671875, 60.0087890625, 62.130859375, 64.2529296875, 66.375]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 22.0, 113.0, 277.0, 376.0, 174.0, 42.0, 9.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-240.79660034179688, -235.9137725830078, -231.03094482421875, -226.1481170654297, -221.26528930664062, -216.38246154785156, -211.4996337890625, -206.6168212890625, -201.73397827148438, -196.8511505126953, -191.96832275390625, -187.0854949951172, -182.20266723632812, -177.31983947753906, -172.43701171875, -167.55419921875, -162.67137145996094, -157.78854370117188, -152.9057159423828, -148.02288818359375, -143.1400604248047, -138.25723266601562, -133.37440490722656, -128.4915771484375, -123.60875701904297, -118.7259292602539, -113.84310150146484, -108.96027374267578, -104.07745361328125, -99.19462585449219, -94.31179809570312, -89.42897033691406, -84.54615020751953, -79.66332244873047, -74.7804946899414, -69.89766693115234, -65.01484680175781, -60.132015228271484, -55.24919128417969, -50.366363525390625, -45.48353576660156, -40.6007080078125, -35.71788024902344, -30.83505630493164, -25.952228546142578, -21.069400787353516, -16.186574935913086, -11.303749084472656, -6.420921325683594, -1.5380945205688477, 3.3447322845458984, 8.227559089660645, 13.11038589477539, 17.993213653564453, 22.876039505004883, 27.758865356445312, 32.641693115234375, 37.52452087402344, 42.4073486328125, 47.2901725769043, 52.17300033569336, 57.05582809448242, 61.93865203857422, 66.82147979736328, 71.70430755615234]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 5.0, 2.0, 1.0, 2.0, 4.0, 4.0, 6.0, 6.0, 6.0, 6.0, 11.0, 14.0, 17.0, 11.0, 20.0, 22.0, 18.0, 19.0, 27.0, 19.0, 25.0, 35.0, 32.0, 39.0, 37.0, 36.0, 35.0, 33.0, 32.0, 31.0, 34.0, 44.0, 40.0, 35.0, 33.0, 40.0, 29.0, 29.0, 23.0, 16.0, 18.0, 13.0, 25.0, 11.0, 12.0, 15.0, 12.0, 4.0, 7.0, 3.0, 3.0, 7.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-35.04292297363281, -33.971466064453125, -32.90000915527344, -31.82855224609375, -30.757097244262695, -29.685640335083008, -28.61418342590332, -27.542726516723633, -26.471271514892578, -25.39981460571289, -24.328357696533203, -23.256900787353516, -22.18544578552246, -21.113988876342773, -20.042531967163086, -18.9710750579834, -17.89961814880371, -16.828161239624023, -15.756705284118652, -14.685248374938965, -13.613792419433594, -12.542335510253906, -11.470878601074219, -10.399421691894531, -9.32796573638916, -8.256508827209473, -7.185052871704102, -6.113595962524414, -5.042139530181885, -3.9706830978393555, -2.899226188659668, -1.8277697563171387, -0.7563133239746094, 0.3151432275772095, 1.3865997791290283, 2.4580564498901367, 3.529512882232666, 4.600969314575195, 5.672426223754883, 6.743882656097412, 7.815339088439941, 8.886795997619629, 9.958251953125, 11.029708862304688, 12.101165771484375, 13.172621726989746, 14.244078636169434, 15.315534591674805, 16.386991500854492, 17.45844841003418, 18.529905319213867, 19.601360321044922, 20.67281723022461, 21.744274139404297, 22.815731048583984, 23.887187957763672, 24.95864486694336, 26.030101776123047, 27.101558685302734, 28.173015594482422, 29.244470596313477, 30.315927505493164, 31.38738441467285, 32.458839416503906, 33.530296325683594]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 9.0, 4.0, 6.0, 8.0, 9.0, 8.0, 17.0, 11.0, 14.0, 22.0, 25.0, 25.0, 24.0, 35.0, 31.0, 32.0, 46.0, 34.0, 50.0, 32.0, 35.0, 41.0, 39.0, 38.0, 37.0, 44.0, 28.0, 30.0, 24.0, 30.0, 28.0, 23.0, 18.0, 15.0, 14.0, 23.0, 14.0, 14.0, 12.0, 12.0, 9.0, 2.0, 6.0, 4.0, 5.0, 5.0, 4.0, 4.0, 2.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.859375, -4.6976318359375, -4.535888671875, -4.3741455078125, -4.21240234375, -4.0506591796875, -3.888916015625, -3.7271728515625, -3.5654296875, -3.4036865234375, -3.241943359375, -3.0802001953125, -2.91845703125, -2.7567138671875, -2.594970703125, -2.4332275390625, -2.271484375, -2.1097412109375, -1.947998046875, -1.7862548828125, -1.62451171875, -1.4627685546875, -1.301025390625, -1.1392822265625, -0.9775390625, -0.8157958984375, -0.654052734375, -0.4923095703125, -0.33056640625, -0.1688232421875, -0.007080078125, 0.1546630859375, 0.31640625, 0.4781494140625, 0.639892578125, 0.8016357421875, 0.96337890625, 1.1251220703125, 1.286865234375, 1.4486083984375, 1.6103515625, 1.7720947265625, 1.933837890625, 2.0955810546875, 2.25732421875, 2.4190673828125, 2.580810546875, 2.7425537109375, 2.904296875, 3.0660400390625, 3.227783203125, 3.3895263671875, 3.55126953125, 3.7130126953125, 3.874755859375, 4.0364990234375, 4.1982421875, 4.3599853515625, 4.521728515625, 4.6834716796875, 4.84521484375, 5.0069580078125, 5.168701171875, 5.3304443359375, 5.4921875]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 8.0, 10.0, 14.0, 19.0, 41.0, 57.0, 101.0, 113.0, 166.0, 231.0, 354.0, 569.0, 818.0, 1181.0, 1793.0, 2692.0, 3967.0, 5945.0, 9086.0, 13553.0, 21704.0, 34028.0, 54335.0, 86947.0, 133184.0, 177578.0, 168415.0, 120149.0, 77083.0, 48248.0, 30137.0, 19304.0, 12282.0, 8118.0, 5440.0, 3488.0, 2456.0, 1597.0, 1056.0, 771.0, 516.0, 328.0, 222.0, 148.0, 108.0, 66.0, 43.0, 35.0, 23.0, 15.0, 11.0, 3.0, 5.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.54541015625, -0.5282974243164062, -0.5111846923828125, -0.49407196044921875, -0.476959228515625, -0.45984649658203125, -0.4427337646484375, -0.42562103271484375, -0.40850830078125, -0.39139556884765625, -0.3742828369140625, -0.35717010498046875, -0.340057373046875, -0.32294464111328125, -0.3058319091796875, -0.28871917724609375, -0.2716064453125, -0.25449371337890625, -0.2373809814453125, -0.22026824951171875, -0.203155517578125, -0.18604278564453125, -0.1689300537109375, -0.15181732177734375, -0.13470458984375, -0.11759185791015625, -0.1004791259765625, -0.08336639404296875, -0.066253662109375, -0.04914093017578125, -0.0320281982421875, -0.01491546630859375, 0.002197265625, 0.01930999755859375, 0.0364227294921875, 0.05353546142578125, 0.070648193359375, 0.08776092529296875, 0.1048736572265625, 0.12198638916015625, 0.13909912109375, 0.15621185302734375, 0.1733245849609375, 0.19043731689453125, 0.207550048828125, 0.22466278076171875, 0.2417755126953125, 0.25888824462890625, 0.2760009765625, 0.29311370849609375, 0.3102264404296875, 0.32733917236328125, 0.344451904296875, 0.36156463623046875, 0.3786773681640625, 0.39579010009765625, 0.41290283203125, 0.43001556396484375, 0.4471282958984375, 0.46424102783203125, 0.481353759765625, 0.49846649169921875, 0.5155792236328125, 0.5326919555664062, 0.5498046875]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 2.0, 4.0, 9.0, 8.0, 13.0, 11.0, 7.0, 22.0, 15.0, 22.0, 17.0, 18.0, 31.0, 35.0, 26.0, 41.0, 42.0, 35.0, 42.0, 36.0, 24.0, 1064.0, 41.0, 29.0, 35.0, 37.0, 39.0, 47.0, 43.0, 27.0, 30.0, 22.0, 24.0, 33.0, 17.0, 17.0, 14.0, 12.0, 15.0, 9.0, 6.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0], "bins": [-3.953125, -3.839752197265625, -3.72637939453125, -3.613006591796875, -3.4996337890625, -3.386260986328125, -3.27288818359375, -3.159515380859375, -3.046142578125, -2.932769775390625, -2.81939697265625, -2.706024169921875, -2.5926513671875, -2.479278564453125, -2.36590576171875, -2.252532958984375, -2.13916015625, -2.025787353515625, -1.91241455078125, -1.799041748046875, -1.6856689453125, -1.572296142578125, -1.45892333984375, -1.345550537109375, -1.232177734375, -1.118804931640625, -1.00543212890625, -0.892059326171875, -0.7786865234375, -0.665313720703125, -0.55194091796875, -0.438568115234375, -0.3251953125, -0.211822509765625, -0.09844970703125, 0.014923095703125, 0.1282958984375, 0.241668701171875, 0.35504150390625, 0.468414306640625, 0.581787109375, 0.695159912109375, 0.80853271484375, 0.921905517578125, 1.0352783203125, 1.148651123046875, 1.26202392578125, 1.375396728515625, 1.48876953125, 1.602142333984375, 1.71551513671875, 1.828887939453125, 1.9422607421875, 2.055633544921875, 2.16900634765625, 2.282379150390625, 2.395751953125, 2.509124755859375, 2.62249755859375, 2.735870361328125, 2.8492431640625, 2.962615966796875, 3.07598876953125, 3.189361572265625, 3.302734375]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 6.0, 2.0, 5.0, 12.0, 17.0, 38.0, 33.0, 69.0, 104.0, 152.0, 249.0, 368.0, 558.0, 920.0, 1468.0, 2330.0, 3840.0, 6241.0, 10632.0, 17437.0, 29616.0, 50414.0, 87917.0, 140425.0, 1226280.0, 190720.0, 132013.0, 80833.0, 46950.0, 26997.0, 15782.0, 9542.0, 5852.0, 3560.0, 2112.0, 1352.0, 823.0, 518.0, 327.0, 205.0, 137.0, 102.0, 58.0, 35.0, 33.0, 18.0, 15.0, 9.0, 8.0, 3.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.464111328125, -0.44910430908203125, -0.4340972900390625, -0.41909027099609375, -0.404083251953125, -0.38907623291015625, -0.3740692138671875, -0.35906219482421875, -0.34405517578125, -0.32904815673828125, -0.3140411376953125, -0.29903411865234375, -0.284027099609375, -0.26902008056640625, -0.2540130615234375, -0.23900604248046875, -0.2239990234375, -0.20899200439453125, -0.1939849853515625, -0.17897796630859375, -0.163970947265625, -0.14896392822265625, -0.1339569091796875, -0.11894989013671875, -0.10394287109375, -0.08893585205078125, -0.0739288330078125, -0.05892181396484375, -0.043914794921875, -0.02890777587890625, -0.0139007568359375, 0.00110626220703125, 0.01611328125, 0.03112030029296875, 0.0461273193359375, 0.06113433837890625, 0.076141357421875, 0.09114837646484375, 0.1061553955078125, 0.12116241455078125, 0.13616943359375, 0.15117645263671875, 0.1661834716796875, 0.18119049072265625, 0.196197509765625, 0.21120452880859375, 0.2262115478515625, 0.24121856689453125, 0.2562255859375, 0.27123260498046875, 0.2862396240234375, 0.30124664306640625, 0.316253662109375, 0.33126068115234375, 0.3462677001953125, 0.36127471923828125, 0.37628173828125, 0.39128875732421875, 0.4062957763671875, 0.42130279541015625, 0.436309814453125, 0.45131683349609375, 0.4663238525390625, 0.48133087158203125, 0.496337890625]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 2.0, 2.0, 6.0, 10.0, 11.0, 14.0, 19.0, 25.0, 25.0, 26.0, 38.0, 54.0, 81.0, 71.0, 78.0, 71.0, 89.0, 60.0, 80.0, 51.0, 41.0, 34.0, 32.0, 25.0, 17.0, 15.0, 7.0, 4.0, 5.0, 5.0, 0.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002246856689453125, -0.0021757185459136963, -0.0021045804023742676, -0.002033442258834839, -0.00196230411529541, -0.0018911659717559814, -0.0018200278282165527, -0.001748889684677124, -0.0016777515411376953, -0.0016066133975982666, -0.0015354752540588379, -0.0014643371105194092, -0.0013931989669799805, -0.0013220608234405518, -0.001250922679901123, -0.0011797845363616943, -0.0011086463928222656, -0.001037508249282837, -0.0009663701057434082, -0.0008952319622039795, -0.0008240938186645508, -0.0007529556751251221, -0.0006818175315856934, -0.0006106793880462646, -0.0005395412445068359, -0.0004684031009674072, -0.0003972649574279785, -0.0003261268138885498, -0.0002549886703491211, -0.00018385052680969238, -0.00011271238327026367, -4.157423973083496e-05, 2.956390380859375e-05, 0.00010070204734802246, 0.00017184019088745117, 0.00024297833442687988, 0.0003141164779663086, 0.0003852546215057373, 0.000456392765045166, 0.0005275309085845947, 0.0005986690521240234, 0.0006698071956634521, 0.0007409453392028809, 0.0008120834827423096, 0.0008832216262817383, 0.000954359769821167, 0.0010254979133605957, 0.0010966360569000244, 0.0011677742004394531, 0.0012389123439788818, 0.0013100504875183105, 0.0013811886310577393, 0.001452326774597168, 0.0015234649181365967, 0.0015946030616760254, 0.001665741205215454, 0.0017368793487548828, 0.0018080174922943115, 0.0018791556358337402, 0.001950293779373169, 0.0020214319229125977, 0.0020925700664520264, 0.002163708209991455, 0.002234846353530884, 0.0023059844970703125]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 1.0, 7.0, 4.0, 8.0, 13.0, 14.0, 21.0, 36.0, 38.0, 55.0, 89.0, 140.0, 237.0, 532.0, 11808.0, 1032062.0, 2498.0, 414.0, 198.0, 103.0, 76.0, 58.0, 32.0, 33.0, 23.0, 16.0, 14.0, 11.0, 3.0, 6.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.049835205078125, -0.048295021057128906, -0.04675483703613281, -0.04521465301513672, -0.043674468994140625, -0.04213428497314453, -0.04059410095214844, -0.039053916931152344, -0.03751373291015625, -0.035973548889160156, -0.03443336486816406, -0.03289318084716797, -0.031352996826171875, -0.02981281280517578, -0.028272628784179688, -0.026732444763183594, -0.0251922607421875, -0.023652076721191406, -0.022111892700195312, -0.02057170867919922, -0.019031524658203125, -0.01749134063720703, -0.015951156616210938, -0.014410972595214844, -0.01287078857421875, -0.011330604553222656, -0.009790420532226562, -0.008250236511230469, -0.006710052490234375, -0.005169868469238281, -0.0036296844482421875, -0.0020895004272460938, -0.00054931640625, 0.0009908676147460938, 0.0025310516357421875, 0.004071235656738281, 0.005611419677734375, 0.007151603698730469, 0.008691787719726562, 0.010231971740722656, 0.01177215576171875, 0.013312339782714844, 0.014852523803710938, 0.01639270782470703, 0.017932891845703125, 0.01947307586669922, 0.021013259887695312, 0.022553443908691406, 0.0240936279296875, 0.025633811950683594, 0.027173995971679688, 0.02871417999267578, 0.030254364013671875, 0.03179454803466797, 0.03333473205566406, 0.034874916076660156, 0.03641510009765625, 0.037955284118652344, 0.03949546813964844, 0.04103565216064453, 0.042575836181640625, 0.04411602020263672, 0.04565620422363281, 0.047196388244628906, 0.048736572265625]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 6.0, 6.0, 20.0, 31.0, 69.0, 85.0, 117.0, 156.0, 145.0, 138.0, 89.0, 59.0, 32.0, 29.0, 9.0, 4.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010949239367619157, -0.0010528148850426078, -0.0010107058333232999, -0.0009685968398116529, -0.000926487788092345, -0.0008843787363730371, -0.0008422697428613901, -0.0008001606911420822, -0.0007580516394227743, -0.0007159425877034664, -0.0006738335359841585, -0.0006317245424725115, -0.0005896154907532036, -0.0005475064390338957, -0.0005053974455222487, -0.00046328839380294085, -0.00042117934208363295, -0.00037907029036432505, -0.0003369612677488476, -0.00029485224513337016, -0.00025274319341406226, -0.0002106341562466696, -0.00016852511907927692, -0.00012641609646379948, -8.430704474449158e-05, -4.2198007577098906e-05, -8.897040970623493e-08, 4.2020066757686436e-05, 8.412910392507911e-05, 0.00012623814109247178, 0.00016834717825986445, 0.0002104562008753419, 0.0002525653690099716, 0.0002946744207292795, 0.00033678344334475696, 0.0003788924659602344, 0.0004210015176795423, 0.0004631105693988502, 0.0005052195629104972, 0.0005473286146298051, 0.000589437666349113, 0.0006315467180684209, 0.0006736557697877288, 0.0007157647632993758, 0.0007578738150186837, 0.0007999828667379916, 0.0008420918602496386, 0.0008842009119689465, 0.0009263099636882544, 0.0009684190154075623, 0.0010105280671268702, 0.001052637118846178, 0.001094746170565486, 0.001136855105869472, 0.00117896415758878, 0.0012210732093080878, 0.0012631822610273957, 0.0013052913127467036, 0.0013474003644660115, 0.0013895094161853194, 0.0014316183514893055, 0.0014737274032086134, 0.0015158364549279213, 0.0015579455066472292, 0.001600054558366537]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 9.0, 7.0, 8.0, 9.0, 12.0, 20.0, 12.0, 10.0, 18.0, 17.0, 29.0, 22.0, 21.0, 32.0, 40.0, 39.0, 36.0, 34.0, 31.0, 39.0, 27.0, 47.0, 50.0, 38.0, 40.0, 49.0, 25.0, 35.0, 31.0, 28.0, 27.0, 30.0, 20.0, 13.0, 19.0, 15.0, 17.0, 6.0, 4.0, 4.0, 9.0, 9.0, 2.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007822513580322266, -0.0007548760622739792, -0.0007275007665157318, -0.0007001254707574844, -0.0006727501749992371, -0.0006453748792409897, -0.0006179995834827423, -0.0005906242877244949, -0.0005632489919662476, -0.0005358736962080002, -0.0005084984004497528, -0.00048112310469150543, -0.00045374780893325806, -0.0004263725131750107, -0.0003989972174167633, -0.00037162192165851593, -0.00034424662590026855, -0.0003168713301420212, -0.0002894960343837738, -0.00026212073862552643, -0.00023474544286727905, -0.00020737014710903168, -0.0001799948513507843, -0.00015261955559253693, -0.00012524425983428955, -9.786896407604218e-05, -7.04936683177948e-05, -4.3118372559547424e-05, -1.574307680130005e-05, 1.1632218956947327e-05, 3.90075147151947e-05, 6.638281047344208e-05, 9.375810623168945e-05, 0.00012113340198993683, 0.0001485086977481842, 0.00017588399350643158, 0.00020325928926467896, 0.00023063458502292633, 0.0002580098807811737, 0.0002853851765394211, 0.00031276047229766846, 0.00034013576805591583, 0.0003675110638141632, 0.0003948863595724106, 0.00042226165533065796, 0.00044963695108890533, 0.0004770122468471527, 0.0005043875426054001, 0.0005317628383636475, 0.0005591381341218948, 0.0005865134298801422, 0.0006138887256383896, 0.000641264021396637, 0.0006686393171548843, 0.0006960146129131317, 0.0007233899086713791, 0.0007507652044296265, 0.0007781405001878738, 0.0008055157959461212, 0.0008328910917043686, 0.000860266387462616, 0.0008876416832208633, 0.0009150169789791107, 0.0009423922747373581, 0.0009697675704956055]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 9.0, 4.0, 6.0, 8.0, 9.0, 8.0, 17.0, 11.0, 14.0, 22.0, 25.0, 25.0, 24.0, 35.0, 31.0, 32.0, 46.0, 34.0, 50.0, 32.0, 34.0, 42.0, 39.0, 38.0, 37.0, 44.0, 28.0, 30.0, 24.0, 30.0, 28.0, 23.0, 18.0, 15.0, 14.0, 23.0, 14.0, 14.0, 12.0, 12.0, 9.0, 2.0, 6.0, 4.0, 5.0, 5.0, 4.0, 4.0, 2.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.859375, -4.6976318359375, -4.535888671875, -4.3741455078125, -4.21240234375, -4.0506591796875, -3.888916015625, -3.7271728515625, -3.5654296875, -3.4036865234375, -3.241943359375, -3.0802001953125, -2.91845703125, -2.7567138671875, -2.594970703125, -2.4332275390625, -2.271484375, -2.1097412109375, -1.947998046875, -1.7862548828125, -1.62451171875, -1.4627685546875, -1.301025390625, -1.1392822265625, -0.9775390625, -0.8157958984375, -0.654052734375, -0.4923095703125, -0.33056640625, -0.1688232421875, -0.007080078125, 0.1546630859375, 0.31640625, 0.4781494140625, 0.639892578125, 0.8016357421875, 0.96337890625, 1.1251220703125, 1.286865234375, 1.4486083984375, 1.6103515625, 1.7720947265625, 1.933837890625, 2.0955810546875, 2.25732421875, 2.4190673828125, 2.580810546875, 2.7425537109375, 2.904296875, 3.0660400390625, 3.227783203125, 3.3895263671875, 3.55126953125, 3.7130126953125, 3.874755859375, 4.0364990234375, 4.1982421875, 4.3599853515625, 4.521728515625, 4.6834716796875, 4.84521484375, 5.0069580078125, 5.168701171875, 5.3304443359375, 5.4921875]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 10.0, 9.0, 12.0, 14.0, 25.0, 47.0, 72.0, 116.0, 167.0, 294.0, 542.0, 906.0, 1717.0, 3442.0, 6723.0, 13185.0, 27565.0, 60855.0, 145021.0, 355765.0, 247301.0, 100155.0, 43205.0, 20677.0, 10041.0, 5022.0, 2556.0, 1365.0, 703.0, 410.0, 213.0, 153.0, 94.0, 53.0, 34.0, 22.0, 16.0, 10.0, 4.0, 8.0, 5.0, 5.0, 4.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.4375, -4.30218505859375, -4.1668701171875, -4.03155517578125, -3.896240234375, -3.76092529296875, -3.6256103515625, -3.49029541015625, -3.35498046875, -3.21966552734375, -3.0843505859375, -2.94903564453125, -2.813720703125, -2.67840576171875, -2.5430908203125, -2.40777587890625, -2.2724609375, -2.13714599609375, -2.0018310546875, -1.86651611328125, -1.731201171875, -1.59588623046875, -1.4605712890625, -1.32525634765625, -1.18994140625, -1.05462646484375, -0.9193115234375, -0.78399658203125, -0.648681640625, -0.51336669921875, -0.3780517578125, -0.24273681640625, -0.107421875, 0.02789306640625, 0.1632080078125, 0.29852294921875, 0.433837890625, 0.56915283203125, 0.7044677734375, 0.83978271484375, 0.97509765625, 1.11041259765625, 1.2457275390625, 1.38104248046875, 1.516357421875, 1.65167236328125, 1.7869873046875, 1.92230224609375, 2.0576171875, 2.19293212890625, 2.3282470703125, 2.46356201171875, 2.598876953125, 2.73419189453125, 2.8695068359375, 3.00482177734375, 3.14013671875, 3.27545166015625, 3.4107666015625, 3.54608154296875, 3.681396484375, 3.81671142578125, 3.9520263671875, 4.08734130859375, 4.22265625]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 9.0, 8.0, 8.0, 8.0, 15.0, 21.0, 15.0, 32.0, 34.0, 38.0, 42.0, 29.0, 46.0, 52.0, 77.0, 119.0, 378.0, 1547.0, 127.0, 72.0, 60.0, 39.0, 39.0, 38.0, 37.0, 25.0, 28.0, 23.0, 20.0, 15.0, 13.0, 9.0, 7.0, 9.0, 3.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-25.15625, -24.458251953125, -23.76025390625, -23.062255859375, -22.3642578125, -21.666259765625, -20.96826171875, -20.270263671875, -19.572265625, -18.874267578125, -18.17626953125, -17.478271484375, -16.7802734375, -16.082275390625, -15.38427734375, -14.686279296875, -13.98828125, -13.290283203125, -12.59228515625, -11.894287109375, -11.1962890625, -10.498291015625, -9.80029296875, -9.102294921875, -8.404296875, -7.706298828125, -7.00830078125, -6.310302734375, -5.6123046875, -4.914306640625, -4.21630859375, -3.518310546875, -2.8203125, -2.122314453125, -1.42431640625, -0.726318359375, -0.0283203125, 0.669677734375, 1.36767578125, 2.065673828125, 2.763671875, 3.461669921875, 4.15966796875, 4.857666015625, 5.5556640625, 6.253662109375, 6.95166015625, 7.649658203125, 8.34765625, 9.045654296875, 9.74365234375, 10.441650390625, 11.1396484375, 11.837646484375, 12.53564453125, 13.233642578125, 13.931640625, 14.629638671875, 15.32763671875, 16.025634765625, 16.7236328125, 17.421630859375, 18.11962890625, 18.817626953125, 19.515625]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 7.0, 3.0, 5.0, 9.0, 9.0, 15.0, 15.0, 19.0, 23.0, 39.0, 39.0, 74.0, 81.0, 125.0, 171.0, 253.0, 346.0, 888.0, 10930.0, 3099927.0, 30191.0, 1181.0, 438.0, 251.0, 173.0, 145.0, 82.0, 74.0, 53.0, 44.0, 25.0, 19.0, 13.0, 15.0, 11.0, 8.0, 6.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.9375, -51.20703125, -49.4765625, -47.74609375, -46.015625, -44.28515625, -42.5546875, -40.82421875, -39.09375, -37.36328125, -35.6328125, -33.90234375, -32.171875, -30.44140625, -28.7109375, -26.98046875, -25.25, -23.51953125, -21.7890625, -20.05859375, -18.328125, -16.59765625, -14.8671875, -13.13671875, -11.40625, -9.67578125, -7.9453125, -6.21484375, -4.484375, -2.75390625, -1.0234375, 0.70703125, 2.4375, 4.16796875, 5.8984375, 7.62890625, 9.359375, 11.08984375, 12.8203125, 14.55078125, 16.28125, 18.01171875, 19.7421875, 21.47265625, 23.203125, 24.93359375, 26.6640625, 28.39453125, 30.125, 31.85546875, 33.5859375, 35.31640625, 37.046875, 38.77734375, 40.5078125, 42.23828125, 43.96875, 45.69921875, 47.4296875, 49.16015625, 50.890625, 52.62109375, 54.3515625, 56.08203125, 57.8125]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 25.0, 267.0, 566.0, 147.0, 10.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-155.9264678955078, -152.76657104492188, -149.606689453125, -146.44679260253906, -143.28689575195312, -140.1269989013672, -136.96710205078125, -133.80722045898438, -130.64732360839844, -127.4874267578125, -124.3275375366211, -121.16764831542969, -118.00775146484375, -114.84785461425781, -111.6879653930664, -108.528076171875, -105.36817932128906, -102.20828247070312, -99.04839324951172, -95.88850402832031, -92.72860717773438, -89.56871032714844, -86.40882110595703, -83.24893188476562, -80.08903503417969, -76.92913818359375, -73.76924896240234, -70.60935974121094, -67.449462890625, -64.28956604003906, -61.129676818847656, -57.969783782958984, -54.80989456176758, -51.650001525878906, -48.490108489990234, -45.33021545410156, -42.17032241821289, -39.01042938232422, -35.85053634643555, -32.690643310546875, -29.530750274658203, -26.37085723876953, -23.21096420288086, -20.051071166992188, -16.891178131103516, -13.731285095214844, -10.571392059326172, -7.4114990234375, -4.251605987548828, -1.0917129516601562, 2.0681800842285156, 5.2280731201171875, 8.38796615600586, 11.547859191894531, 14.707752227783203, 17.867645263671875, 21.027538299560547, 24.18743133544922, 27.34732437133789, 30.507217407226562, 33.667110443115234, 36.827003479003906, 39.98689651489258, 43.14678955078125, 46.30668258666992]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 8.0, 4.0, 1.0, 6.0, 7.0, 10.0, 9.0, 15.0, 20.0, 9.0, 15.0, 25.0, 21.0, 35.0, 27.0, 41.0, 35.0, 34.0, 39.0, 34.0, 36.0, 35.0, 36.0, 46.0, 26.0, 41.0, 42.0, 35.0, 34.0, 30.0, 28.0, 37.0, 27.0, 17.0, 17.0, 19.0, 10.0, 21.0, 14.0, 9.0, 10.0, 12.0, 7.0, 3.0, 3.0, 4.0, 2.0, 0.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-41.557090759277344, -40.16460418701172, -38.772117614746094, -37.379634857177734, -35.98714828491211, -34.594661712646484, -33.20217514038086, -31.809690475463867, -30.417205810546875, -29.02471923828125, -27.632234573364258, -26.239748001098633, -24.84726333618164, -23.454776763916016, -22.06229019165039, -20.6698055267334, -19.277318954467773, -17.88483238220215, -16.492347717285156, -15.099861145019531, -13.707376480102539, -12.314889907836914, -10.922404289245605, -9.529918670654297, -8.137433052062988, -6.74494743347168, -5.352461814880371, -3.9599757194519043, -2.5674901008605957, -1.175004482269287, 0.2174816131591797, 1.6099672317504883, 3.002452850341797, 4.3949384689331055, 5.787424087524414, 7.179910182952881, 8.572395324707031, 9.964881896972656, 11.357367515563965, 12.749853134155273, 14.142338752746582, 15.53482437133789, 16.927310943603516, 18.319795608520508, 19.712282180786133, 21.104766845703125, 22.49725341796875, 23.889739990234375, 25.282224655151367, 26.674711227416992, 28.067195892333984, 29.45968246459961, 30.8521671295166, 32.244651794433594, 33.63713836669922, 35.029624938964844, 36.42211151123047, 37.814598083496094, 39.20708465576172, 40.59956741333008, 41.9920539855957, 43.38454055786133, 44.77702713012695, 46.16950988769531, 47.56199645996094]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 0.0, 2.0, 3.0, 7.0, 2.0, 3.0, 3.0, 8.0, 12.0, 12.0, 11.0, 10.0, 13.0, 23.0, 22.0, 22.0, 25.0, 36.0, 40.0, 39.0, 40.0, 36.0, 35.0, 30.0, 48.0, 37.0, 36.0, 36.0, 44.0, 36.0, 38.0, 30.0, 32.0, 25.0, 15.0, 29.0, 21.0, 19.0, 12.0, 25.0, 15.0, 8.0, 12.0, 9.0, 14.0, 2.0, 8.0, 5.0, 1.0, 6.0, 5.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-5.00390625, -4.83209228515625, -4.6602783203125, -4.48846435546875, -4.316650390625, -4.14483642578125, -3.9730224609375, -3.80120849609375, -3.62939453125, -3.45758056640625, -3.2857666015625, -3.11395263671875, -2.942138671875, -2.77032470703125, -2.5985107421875, -2.42669677734375, -2.2548828125, -2.08306884765625, -1.9112548828125, -1.73944091796875, -1.567626953125, -1.39581298828125, -1.2239990234375, -1.05218505859375, -0.88037109375, -0.70855712890625, -0.5367431640625, -0.36492919921875, -0.193115234375, -0.02130126953125, 0.1505126953125, 0.32232666015625, 0.494140625, 0.66595458984375, 0.8377685546875, 1.00958251953125, 1.181396484375, 1.35321044921875, 1.5250244140625, 1.69683837890625, 1.86865234375, 2.04046630859375, 2.2122802734375, 2.38409423828125, 2.555908203125, 2.72772216796875, 2.8995361328125, 3.07135009765625, 3.2431640625, 3.41497802734375, 3.5867919921875, 3.75860595703125, 3.930419921875, 4.10223388671875, 4.2740478515625, 4.44586181640625, 4.61767578125, 4.78948974609375, 4.9613037109375, 5.13311767578125, 5.304931640625, 5.47674560546875, 5.6485595703125, 5.82037353515625, 5.9921875]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 5.0, 8.0, 6.0, 5.0, 14.0, 11.0, 16.0, 11.0, 24.0, 30.0, 25.0, 42.0, 39.0, 70.0, 127.0, 237.0, 568.0, 1657.0, 7861.0, 94360.0, 1989567.0, 2003021.0, 86607.0, 7240.0, 1545.0, 517.0, 231.0, 116.0, 58.0, 49.0, 41.0, 30.0, 21.0, 17.0, 23.0, 13.0, 10.0, 9.0, 8.0, 11.0, 6.0, 5.0, 7.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.8125, -16.232666015625, -15.65283203125, -15.072998046875, -14.4931640625, -13.913330078125, -13.33349609375, -12.753662109375, -12.173828125, -11.593994140625, -11.01416015625, -10.434326171875, -9.8544921875, -9.274658203125, -8.69482421875, -8.114990234375, -7.53515625, -6.955322265625, -6.37548828125, -5.795654296875, -5.2158203125, -4.635986328125, -4.05615234375, -3.476318359375, -2.896484375, -2.316650390625, -1.73681640625, -1.156982421875, -0.5771484375, 0.002685546875, 0.58251953125, 1.162353515625, 1.7421875, 2.322021484375, 2.90185546875, 3.481689453125, 4.0615234375, 4.641357421875, 5.22119140625, 5.801025390625, 6.380859375, 6.960693359375, 7.54052734375, 8.120361328125, 8.7001953125, 9.280029296875, 9.85986328125, 10.439697265625, 11.01953125, 11.599365234375, 12.17919921875, 12.759033203125, 13.3388671875, 13.918701171875, 14.49853515625, 15.078369140625, 15.658203125, 16.238037109375, 16.81787109375, 17.397705078125, 17.9775390625, 18.557373046875, 19.13720703125, 19.717041015625, 20.296875]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 0.0, 3.0, 5.0, 3.0, 6.0, 8.0, 11.0, 16.0, 9.0, 24.0, 33.0, 43.0, 56.0, 67.0, 85.0, 114.0, 119.0, 180.0, 190.0, 273.0, 331.0, 376.0, 415.0, 360.0, 294.0, 254.0, 189.0, 149.0, 121.0, 83.0, 64.0, 45.0, 27.0, 25.0, 26.0, 14.0, 17.0, 12.0, 10.0, 4.0, 2.0, 3.0, 3.0, 3.0, 1.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.578125, -9.2606201171875, -8.943115234375, -8.6256103515625, -8.30810546875, -7.9906005859375, -7.673095703125, -7.3555908203125, -7.0380859375, -6.7205810546875, -6.403076171875, -6.0855712890625, -5.76806640625, -5.4505615234375, -5.133056640625, -4.8155517578125, -4.498046875, -4.1805419921875, -3.863037109375, -3.5455322265625, -3.22802734375, -2.9105224609375, -2.593017578125, -2.2755126953125, -1.9580078125, -1.6405029296875, -1.322998046875, -1.0054931640625, -0.68798828125, -0.3704833984375, -0.052978515625, 0.2645263671875, 0.58203125, 0.8995361328125, 1.217041015625, 1.5345458984375, 1.85205078125, 2.1695556640625, 2.487060546875, 2.8045654296875, 3.1220703125, 3.4395751953125, 3.757080078125, 4.0745849609375, 4.39208984375, 4.7095947265625, 5.027099609375, 5.3446044921875, 5.662109375, 5.9796142578125, 6.297119140625, 6.6146240234375, 6.93212890625, 7.2496337890625, 7.567138671875, 7.8846435546875, 8.2021484375, 8.5196533203125, 8.837158203125, 9.1546630859375, 9.47216796875, 9.7896728515625, 10.107177734375, 10.4246826171875, 10.7421875]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 3.0, 6.0, 3.0, 10.0, 10.0, 21.0, 19.0, 20.0, 43.0, 33.0, 59.0, 69.0, 83.0, 136.0, 176.0, 236.0, 290.0, 419.0, 1103.0, 15217.0, 3177819.0, 989973.0, 6206.0, 761.0, 353.0, 271.0, 202.0, 157.0, 151.0, 102.0, 79.0, 65.0, 44.0, 33.0, 27.0, 22.0, 16.0, 15.0, 7.0, 11.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 2.0], "bins": [-49.375, -47.87353515625, -46.3720703125, -44.87060546875, -43.369140625, -41.86767578125, -40.3662109375, -38.86474609375, -37.36328125, -35.86181640625, -34.3603515625, -32.85888671875, -31.357421875, -29.85595703125, -28.3544921875, -26.85302734375, -25.3515625, -23.85009765625, -22.3486328125, -20.84716796875, -19.345703125, -17.84423828125, -16.3427734375, -14.84130859375, -13.33984375, -11.83837890625, -10.3369140625, -8.83544921875, -7.333984375, -5.83251953125, -4.3310546875, -2.82958984375, -1.328125, 0.17333984375, 1.6748046875, 3.17626953125, 4.677734375, 6.17919921875, 7.6806640625, 9.18212890625, 10.68359375, 12.18505859375, 13.6865234375, 15.18798828125, 16.689453125, 18.19091796875, 19.6923828125, 21.19384765625, 22.6953125, 24.19677734375, 25.6982421875, 27.19970703125, 28.701171875, 30.20263671875, 31.7041015625, 33.20556640625, 34.70703125, 36.20849609375, 37.7099609375, 39.21142578125, 40.712890625, 42.21435546875, 43.7158203125, 45.21728515625, 46.71875]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 6.0, 11.0, 15.0, 23.0, 44.0, 81.0, 90.0, 97.0, 110.0, 111.0, 112.0, 89.0, 68.0, 50.0, 35.0, 27.0, 20.0, 12.0, 3.0, 7.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.89492797851562, -65.3831558227539, -63.87138748168945, -62.359619140625, -60.84785079956055, -59.336082458496094, -57.824310302734375, -56.31254196166992, -54.80077362060547, -53.289005279541016, -51.7772331237793, -50.265464782714844, -48.75369644165039, -47.24192810058594, -45.73015594482422, -44.218387603759766, -42.70661544799805, -41.194847106933594, -39.683074951171875, -38.17130661010742, -36.65953826904297, -35.14776611328125, -33.6359977722168, -32.124229431152344, -30.612459182739258, -29.100688934326172, -27.58892059326172, -26.077150344848633, -24.565380096435547, -23.053611755371094, -21.541841506958008, -20.030071258544922, -18.518306732177734, -17.00653648376465, -15.494768142700195, -13.98299789428711, -12.47122859954834, -10.95945930480957, -9.447689056396484, -7.935919761657715, -6.424150466918945, -4.912381172180176, -3.400611400604248, -1.8888416290283203, -0.3770723342895508, 1.1346969604492188, 2.6464672088623047, 4.158236503601074, 5.670005798339844, 7.181775093078613, 8.693544387817383, 10.205314636230469, 11.717083930969238, 13.228853225708008, 14.740623474121094, 16.252391815185547, 17.764162063598633, 19.27593231201172, 20.787700653076172, 22.299470901489258, 23.811241149902344, 25.323009490966797, 26.834779739379883, 28.34654998779297, 29.858318328857422]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 5.0, 8.0, 6.0, 10.0, 14.0, 19.0, 20.0, 16.0, 22.0, 33.0, 34.0, 26.0, 31.0, 48.0, 38.0, 49.0, 49.0, 36.0, 53.0, 44.0, 45.0, 29.0, 49.0, 42.0, 49.0, 38.0, 22.0, 34.0, 23.0, 23.0, 16.0, 16.0, 17.0, 14.0, 3.0, 6.0, 3.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-42.432861328125, -41.165992736816406, -39.89912414550781, -38.63225555419922, -37.365386962890625, -36.09851837158203, -34.83164978027344, -33.56478500366211, -32.297916412353516, -31.031047821044922, -29.764179229736328, -28.497310638427734, -27.230443954467773, -25.96357536315918, -24.696706771850586, -23.429840087890625, -22.1629695892334, -20.896100997924805, -19.62923240661621, -18.36236572265625, -17.095497131347656, -15.828628540039062, -14.561759948730469, -13.294892311096191, -12.028023719787598, -10.761155128479004, -9.494287490844727, -8.227418899536133, -6.960550785064697, -5.693682670593262, -4.426814079284668, -3.1599464416503906, -1.8930778503417969, -0.6262096166610718, 0.6406586170196533, 1.907526969909668, 3.1743950843811035, 4.441263198852539, 5.708131790161133, 6.97499942779541, 8.241868019104004, 9.508736610412598, 10.775604248046875, 12.042472839355469, 13.309341430664062, 14.57620906829834, 15.843077659606934, 17.10994529724121, 18.376813888549805, 19.6436824798584, 20.910551071166992, 22.177417755126953, 23.444286346435547, 24.71115493774414, 25.978023529052734, 27.244892120361328, 28.511760711669922, 29.778629302978516, 31.04549789428711, 32.3123664855957, 33.5792350769043, 34.846099853515625, 36.11296844482422, 37.37983703613281, 38.646705627441406]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 8.0, 7.0, 4.0, 5.0, 12.0, 13.0, 12.0, 20.0, 20.0, 21.0, 19.0, 23.0, 31.0, 41.0, 32.0, 40.0, 48.0, 48.0, 47.0, 42.0, 39.0, 33.0, 38.0, 38.0, 50.0, 37.0, 39.0, 41.0, 31.0, 17.0, 21.0, 21.0, 16.0, 14.0, 12.0, 19.0, 13.0, 7.0, 4.0, 7.0, 4.0, 6.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.5625, -5.368896484375, -5.17529296875, -4.981689453125, -4.7880859375, -4.594482421875, -4.40087890625, -4.207275390625, -4.013671875, -3.820068359375, -3.62646484375, -3.432861328125, -3.2392578125, -3.045654296875, -2.85205078125, -2.658447265625, -2.46484375, -2.271240234375, -2.07763671875, -1.884033203125, -1.6904296875, -1.496826171875, -1.30322265625, -1.109619140625, -0.916015625, -0.722412109375, -0.52880859375, -0.335205078125, -0.1416015625, 0.052001953125, 0.24560546875, 0.439208984375, 0.6328125, 0.826416015625, 1.02001953125, 1.213623046875, 1.4072265625, 1.600830078125, 1.79443359375, 1.988037109375, 2.181640625, 2.375244140625, 2.56884765625, 2.762451171875, 2.9560546875, 3.149658203125, 3.34326171875, 3.536865234375, 3.73046875, 3.924072265625, 4.11767578125, 4.311279296875, 4.5048828125, 4.698486328125, 4.89208984375, 5.085693359375, 5.279296875, 5.472900390625, 5.66650390625, 5.860107421875, 6.0537109375, 6.247314453125, 6.44091796875, 6.634521484375, 6.828125]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 7.0, 6.0, 10.0, 21.0, 35.0, 47.0, 70.0, 111.0, 176.0, 284.0, 396.0, 537.0, 712.0, 992.0, 1452.0, 1996.0, 2907.0, 4023.0, 5838.0, 8179.0, 11893.0, 16777.0, 25118.0, 37921.0, 56728.0, 85364.0, 123093.0, 159067.0, 151779.0, 114521.0, 77385.0, 51808.0, 34398.0, 22963.0, 15911.0, 10539.0, 7409.0, 5138.0, 3853.0, 2641.0, 1908.0, 1409.0, 978.0, 701.0, 500.0, 331.0, 223.0, 159.0, 100.0, 60.0, 34.0, 21.0, 14.0, 11.0, 7.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.462890625, -0.4479026794433594, -0.43291473388671875, -0.4179267883300781, -0.4029388427734375, -0.3879508972167969, -0.37296295166015625, -0.3579750061035156, -0.342987060546875, -0.3279991149902344, -0.31301116943359375, -0.2980232238769531, -0.2830352783203125, -0.2680473327636719, -0.25305938720703125, -0.23807144165039062, -0.22308349609375, -0.20809555053710938, -0.19310760498046875, -0.17811965942382812, -0.1631317138671875, -0.14814376831054688, -0.13315582275390625, -0.11816787719726562, -0.103179931640625, -0.08819198608398438, -0.07320404052734375, -0.058216094970703125, -0.0432281494140625, -0.028240203857421875, -0.01325225830078125, 0.001735687255859375, 0.0167236328125, 0.031711578369140625, 0.04669952392578125, 0.061687469482421875, 0.0766754150390625, 0.09166336059570312, 0.10665130615234375, 0.12163925170898438, 0.136627197265625, 0.15161514282226562, 0.16660308837890625, 0.18159103393554688, 0.1965789794921875, 0.21156692504882812, 0.22655487060546875, 0.24154281616210938, 0.25653076171875, 0.2715187072753906, 0.28650665283203125, 0.3014945983886719, 0.3164825439453125, 0.3314704895019531, 0.34645843505859375, 0.3614463806152344, 0.376434326171875, 0.3914222717285156, 0.40641021728515625, 0.4213981628417969, 0.4363861083984375, 0.4513740539550781, 0.46636199951171875, 0.4813499450683594, 0.496337890625]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 6.0, 0.0, 5.0, 14.0, 3.0, 13.0, 23.0, 19.0, 11.0, 14.0, 20.0, 22.0, 34.0, 25.0, 30.0, 28.0, 33.0, 46.0, 45.0, 50.0, 39.0, 1068.0, 43.0, 48.0, 33.0, 52.0, 37.0, 26.0, 42.0, 32.0, 25.0, 22.0, 21.0, 23.0, 20.0, 16.0, 9.0, 12.0, 10.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.921875, -3.801544189453125, -3.68121337890625, -3.560882568359375, -3.4405517578125, -3.320220947265625, -3.19989013671875, -3.079559326171875, -2.959228515625, -2.838897705078125, -2.71856689453125, -2.598236083984375, -2.4779052734375, -2.357574462890625, -2.23724365234375, -2.116912841796875, -1.99658203125, -1.876251220703125, -1.75592041015625, -1.635589599609375, -1.5152587890625, -1.394927978515625, -1.27459716796875, -1.154266357421875, -1.033935546875, -0.913604736328125, -0.79327392578125, -0.672943115234375, -0.5526123046875, -0.432281494140625, -0.31195068359375, -0.191619873046875, -0.0712890625, 0.049041748046875, 0.16937255859375, 0.289703369140625, 0.4100341796875, 0.530364990234375, 0.65069580078125, 0.771026611328125, 0.891357421875, 1.011688232421875, 1.13201904296875, 1.252349853515625, 1.3726806640625, 1.493011474609375, 1.61334228515625, 1.733673095703125, 1.85400390625, 1.974334716796875, 2.09466552734375, 2.214996337890625, 2.3353271484375, 2.455657958984375, 2.57598876953125, 2.696319580078125, 2.816650390625, 2.936981201171875, 3.05731201171875, 3.177642822265625, 3.2979736328125, 3.418304443359375, 3.53863525390625, 3.658966064453125, 3.779296875]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 15.0, 5.0, 20.0, 23.0, 35.0, 51.0, 81.0, 135.0, 167.0, 306.0, 461.0, 690.0, 993.0, 1725.0, 2671.0, 4385.0, 6999.0, 11315.0, 18677.0, 31039.0, 51568.0, 86258.0, 134615.0, 1079756.0, 320367.0, 132429.0, 84643.0, 50672.0, 29871.0, 17811.0, 10972.0, 6802.0, 4199.0, 2680.0, 1696.0, 1031.0, 694.0, 442.0, 287.0, 181.0, 123.0, 90.0, 60.0, 35.0, 19.0, 14.0, 12.0, 5.0, 3.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.454833984375, -0.4401512145996094, -0.42546844482421875, -0.4107856750488281, -0.3961029052734375, -0.3814201354980469, -0.36673736572265625, -0.3520545959472656, -0.337371826171875, -0.3226890563964844, -0.30800628662109375, -0.2933235168457031, -0.2786407470703125, -0.2639579772949219, -0.24927520751953125, -0.23459243774414062, -0.21990966796875, -0.20522689819335938, -0.19054412841796875, -0.17586135864257812, -0.1611785888671875, -0.14649581909179688, -0.13181304931640625, -0.11713027954101562, -0.102447509765625, -0.08776473999023438, -0.07308197021484375, -0.058399200439453125, -0.0437164306640625, -0.029033660888671875, -0.01435089111328125, 0.000331878662109375, 0.0150146484375, 0.029697418212890625, 0.04438018798828125, 0.059062957763671875, 0.0737457275390625, 0.08842849731445312, 0.10311126708984375, 0.11779403686523438, 0.132476806640625, 0.14715957641601562, 0.16184234619140625, 0.17652511596679688, 0.1912078857421875, 0.20589065551757812, 0.22057342529296875, 0.23525619506835938, 0.24993896484375, 0.2646217346191406, 0.27930450439453125, 0.2939872741699219, 0.3086700439453125, 0.3233528137207031, 0.33803558349609375, 0.3527183532714844, 0.367401123046875, 0.3820838928222656, 0.39676666259765625, 0.4114494323730469, 0.4261322021484375, 0.4408149719238281, 0.45549774169921875, 0.4701805114746094, 0.48486328125]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 5.0, 3.0, 8.0, 9.0, 15.0, 11.0, 17.0, 24.0, 16.0, 20.0, 35.0, 24.0, 32.0, 44.0, 44.0, 62.0, 51.0, 52.0, 52.0, 71.0, 55.0, 52.0, 40.0, 45.0, 41.0, 29.0, 24.0, 18.0, 20.0, 20.0, 13.0, 6.0, 7.0, 9.0, 9.0, 7.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00136566162109375, -0.0013147294521331787, -0.0012637972831726074, -0.0012128651142120361, -0.0011619329452514648, -0.0011110007762908936, -0.0010600686073303223, -0.001009136438369751, -0.0009582042694091797, -0.0009072721004486084, -0.0008563399314880371, -0.0008054077625274658, -0.0007544755935668945, -0.0007035434246063232, -0.000652611255645752, -0.0006016790866851807, -0.0005507469177246094, -0.0004998147487640381, -0.0004488825798034668, -0.0003979504108428955, -0.0003470182418823242, -0.00029608607292175293, -0.00024515390396118164, -0.00019422173500061035, -0.00014328956604003906, -9.235739707946777e-05, -4.1425228118896484e-05, 9.506940841674805e-06, 6.0439109802246094e-05, 0.00011137127876281738, 0.00016230344772338867, 0.00021323561668395996, 0.00026416778564453125, 0.00031509995460510254, 0.00036603212356567383, 0.0004169642925262451, 0.0004678964614868164, 0.0005188286304473877, 0.000569760799407959, 0.0006206929683685303, 0.0006716251373291016, 0.0007225573062896729, 0.0007734894752502441, 0.0008244216442108154, 0.0008753538131713867, 0.000926285982131958, 0.0009772181510925293, 0.0010281503200531006, 0.0010790824890136719, 0.0011300146579742432, 0.0011809468269348145, 0.0012318789958953857, 0.001282811164855957, 0.0013337433338165283, 0.0013846755027770996, 0.001435607671737671, 0.0014865398406982422, 0.0015374720096588135, 0.0015884041786193848, 0.001639336347579956, 0.0016902685165405273, 0.0017412006855010986, 0.00179213285446167, 0.0018430650234222412, 0.0018939971923828125]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 3.0, 6.0, 5.0, 11.0, 11.0, 9.0, 13.0, 14.0, 17.0, 26.0, 31.0, 33.0, 52.0, 69.0, 82.0, 99.0, 155.0, 261.0, 656.0, 5288.0, 993884.0, 45901.0, 968.0, 341.0, 161.0, 102.0, 80.0, 58.0, 43.0, 29.0, 34.0, 21.0, 28.0, 18.0, 8.0, 10.0, 15.0, 5.0, 6.0, 4.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.039031982421875, -0.037967681884765625, -0.03690338134765625, -0.035839080810546875, -0.0347747802734375, -0.033710479736328125, -0.03264617919921875, -0.031581878662109375, -0.030517578125, -0.029453277587890625, -0.02838897705078125, -0.027324676513671875, -0.0262603759765625, -0.025196075439453125, -0.02413177490234375, -0.023067474365234375, -0.022003173828125, -0.020938873291015625, -0.01987457275390625, -0.018810272216796875, -0.0177459716796875, -0.016681671142578125, -0.01561737060546875, -0.014553070068359375, -0.01348876953125, -0.012424468994140625, -0.01136016845703125, -0.010295867919921875, -0.0092315673828125, -0.008167266845703125, -0.00710296630859375, -0.006038665771484375, -0.004974365234375, -0.003910064697265625, -0.00284576416015625, -0.001781463623046875, -0.0007171630859375, 0.000347137451171875, 0.00141143798828125, 0.002475738525390625, 0.0035400390625, 0.004604339599609375, 0.00566864013671875, 0.006732940673828125, 0.0077972412109375, 0.008861541748046875, 0.00992584228515625, 0.010990142822265625, 0.012054443359375, 0.013118743896484375, 0.01418304443359375, 0.015247344970703125, 0.0163116455078125, 0.017375946044921875, 0.01844024658203125, 0.019504547119140625, 0.02056884765625, 0.021633148193359375, 0.02269744873046875, 0.023761749267578125, 0.0248260498046875, 0.025890350341796875, 0.02695465087890625, 0.028018951416015625, 0.029083251953125]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 9.0, 94.0, 301.0, 422.0, 161.0, 24.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0021073613315820694, -0.0019686666782945395, -0.0018299721414223313, -0.0016912776045501232, -0.0015525829512625933, -0.0014138884143903852, -0.001275193877518177, -0.001136499224230647, -0.000997804687358439, -0.0008591100922785699, -0.0007204154971987009, -0.0005817209603264928, -0.00044302636524662375, -0.0003043317701667547, -0.0001656372332945466, -2.6942638214677572e-05, 0.00011175195686519146, 0.0002504465519450605, 0.00038914111792109907, 0.0005278356838971376, 0.0006665302789770067, 0.0008052248740568757, 0.0009439194109290838, 0.0010826140642166138, 0.0012213086010888219, 0.00136000313796103, 0.00149869779124856, 0.001637392328120768, 0.0017760868649929762, 0.0019147815182805061, 0.0020534759387373924, 0.0021921705920249224, 0.0023308652453124523, 0.0024695598985999823, 0.0026082543190568686, 0.0027469489723443985, 0.0028856436256319284, 0.0030243382789194584, 0.0031630326993763447, 0.0033017273526638746, 0.0034404220059514046, 0.0035791166592389345, 0.003717811079695821, 0.0038565057329833508, 0.003995200153440237, 0.004133895039558411, 0.004272589460015297, 0.004411283880472183, 0.0045499783009290695, 0.004688672721385956, 0.004827367607504129, 0.004966062027961016, 0.005104756448417902, 0.005243451334536076, 0.005382145754992962, 0.005520840175449848, 0.005659535061568022, 0.005798229482024908, 0.005936924368143082, 0.006075618788599968, 0.006214313209056854, 0.006353008095175028, 0.006491702515631914, 0.0066303969360888, 0.006769091822206974]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 4.0, 4.0, 4.0, 5.0, 9.0, 3.0, 9.0, 8.0, 13.0, 15.0, 15.0, 17.0, 22.0, 26.0, 28.0, 26.0, 30.0, 32.0, 39.0, 40.0, 34.0, 39.0, 44.0, 53.0, 46.0, 37.0, 39.0, 40.0, 42.0, 31.0, 27.0, 27.0, 25.0, 29.0, 30.0, 25.0, 18.0, 19.0, 10.0, 9.0, 7.0, 8.0, 7.0, 6.0, 3.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0007494688034057617, -0.0007223617285490036, -0.0006952546536922455, -0.0006681475788354874, -0.0006410405039787292, -0.0006139334291219711, -0.000586826354265213, -0.0005597192794084549, -0.0005326122045516968, -0.0005055051296949387, -0.00047839805483818054, -0.0004512909799814224, -0.0004241839051246643, -0.0003970768302679062, -0.00036996975541114807, -0.00034286268055438995, -0.00031575560569763184, -0.0002886485308408737, -0.0002615414559841156, -0.00023443438112735748, -0.00020732730627059937, -0.00018022023141384125, -0.00015311315655708313, -0.000126006081700325, -9.88990068435669e-05, -7.179193198680878e-05, -4.468485713005066e-05, -1.757778227329254e-05, 9.529292583465576e-06, 3.6636367440223694e-05, 6.374344229698181e-05, 9.085051715373993e-05, 0.00011795759201049805, 0.00014506466686725616, 0.00017217174172401428, 0.0001992788165807724, 0.00022638589143753052, 0.00025349296629428864, 0.00028060004115104675, 0.00030770711600780487, 0.000334814190864563, 0.0003619212657213211, 0.0003890283405780792, 0.00041613541543483734, 0.00044324249029159546, 0.0004703495651483536, 0.0004974566400051117, 0.0005245637148618698, 0.0005516707897186279, 0.000578777864575386, 0.0006058849394321442, 0.0006329920142889023, 0.0006600990891456604, 0.0006872061640024185, 0.0007143132388591766, 0.0007414203137159348, 0.0007685273885726929, 0.000795634463429451, 0.0008227415382862091, 0.0008498486131429672, 0.0008769556879997253, 0.0009040627628564835, 0.0009311698377132416, 0.0009582769125699997, 0.0009853839874267578]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 8.0, 7.0, 4.0, 5.0, 12.0, 13.0, 12.0, 20.0, 20.0, 21.0, 19.0, 23.0, 31.0, 41.0, 32.0, 40.0, 48.0, 48.0, 47.0, 42.0, 39.0, 33.0, 38.0, 38.0, 50.0, 37.0, 39.0, 41.0, 31.0, 17.0, 21.0, 21.0, 16.0, 14.0, 12.0, 19.0, 13.0, 7.0, 4.0, 7.0, 4.0, 6.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.5625, -5.368896484375, -5.17529296875, -4.981689453125, -4.7880859375, -4.594482421875, -4.40087890625, -4.207275390625, -4.013671875, -3.820068359375, -3.62646484375, -3.432861328125, -3.2392578125, -3.045654296875, -2.85205078125, -2.658447265625, -2.46484375, -2.271240234375, -2.07763671875, -1.884033203125, -1.6904296875, -1.496826171875, -1.30322265625, -1.109619140625, -0.916015625, -0.722412109375, -0.52880859375, -0.335205078125, -0.1416015625, 0.052001953125, 0.24560546875, 0.439208984375, 0.6328125, 0.826416015625, 1.02001953125, 1.213623046875, 1.4072265625, 1.600830078125, 1.79443359375, 1.988037109375, 2.181640625, 2.375244140625, 2.56884765625, 2.762451171875, 2.9560546875, 3.149658203125, 3.34326171875, 3.536865234375, 3.73046875, 3.924072265625, 4.11767578125, 4.311279296875, 4.5048828125, 4.698486328125, 4.89208984375, 5.085693359375, 5.279296875, 5.472900390625, 5.66650390625, 5.860107421875, 6.0537109375, 6.247314453125, 6.44091796875, 6.634521484375, 6.828125]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 4.0, 6.0, 10.0, 12.0, 27.0, 18.0, 34.0, 37.0, 39.0, 79.0, 81.0, 111.0, 146.0, 231.0, 394.0, 881.0, 1842.0, 4880.0, 12511.0, 34234.0, 96643.0, 308190.0, 397191.0, 122133.0, 42673.0, 15499.0, 5885.0, 2364.0, 1026.0, 488.0, 265.0, 159.0, 87.0, 87.0, 68.0, 39.0, 44.0, 27.0, 25.0, 18.0, 13.0, 16.0, 12.0, 7.0, 6.0, 4.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-5.796875, -5.61053466796875, -5.4241943359375, -5.23785400390625, -5.051513671875, -4.86517333984375, -4.6788330078125, -4.49249267578125, -4.30615234375, -4.11981201171875, -3.9334716796875, -3.74713134765625, -3.560791015625, -3.37445068359375, -3.1881103515625, -3.00177001953125, -2.8154296875, -2.62908935546875, -2.4427490234375, -2.25640869140625, -2.070068359375, -1.88372802734375, -1.6973876953125, -1.51104736328125, -1.32470703125, -1.13836669921875, -0.9520263671875, -0.76568603515625, -0.579345703125, -0.39300537109375, -0.2066650390625, -0.02032470703125, 0.166015625, 0.35235595703125, 0.5386962890625, 0.72503662109375, 0.911376953125, 1.09771728515625, 1.2840576171875, 1.47039794921875, 1.65673828125, 1.84307861328125, 2.0294189453125, 2.21575927734375, 2.402099609375, 2.58843994140625, 2.7747802734375, 2.96112060546875, 3.1474609375, 3.33380126953125, 3.5201416015625, 3.70648193359375, 3.892822265625, 4.07916259765625, 4.2655029296875, 4.45184326171875, 4.63818359375, 4.82452392578125, 5.0108642578125, 5.19720458984375, 5.383544921875, 5.56988525390625, 5.7562255859375, 5.94256591796875, 6.12890625]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 7.0, 2.0, 1.0, 8.0, 6.0, 8.0, 10.0, 13.0, 11.0, 17.0, 21.0, 22.0, 34.0, 25.0, 37.0, 53.0, 45.0, 61.0, 63.0, 78.0, 345.0, 1576.0, 167.0, 48.0, 70.0, 41.0, 36.0, 35.0, 34.0, 31.0, 17.0, 27.0, 21.0, 17.0, 16.0, 11.0, 11.0, 7.0, 6.0, 2.0, 3.0, 2.0, 3.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-21.65625, -21.00439453125, -20.3525390625, -19.70068359375, -19.048828125, -18.39697265625, -17.7451171875, -17.09326171875, -16.44140625, -15.78955078125, -15.1376953125, -14.48583984375, -13.833984375, -13.18212890625, -12.5302734375, -11.87841796875, -11.2265625, -10.57470703125, -9.9228515625, -9.27099609375, -8.619140625, -7.96728515625, -7.3154296875, -6.66357421875, -6.01171875, -5.35986328125, -4.7080078125, -4.05615234375, -3.404296875, -2.75244140625, -2.1005859375, -1.44873046875, -0.796875, -0.14501953125, 0.5068359375, 1.15869140625, 1.810546875, 2.46240234375, 3.1142578125, 3.76611328125, 4.41796875, 5.06982421875, 5.7216796875, 6.37353515625, 7.025390625, 7.67724609375, 8.3291015625, 8.98095703125, 9.6328125, 10.28466796875, 10.9365234375, 11.58837890625, 12.240234375, 12.89208984375, 13.5439453125, 14.19580078125, 14.84765625, 15.49951171875, 16.1513671875, 16.80322265625, 17.455078125, 18.10693359375, 18.7587890625, 19.41064453125, 20.0625]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 2.0, 3.0, 8.0, 11.0, 5.0, 4.0, 5.0, 5.0, 11.0, 13.0, 12.0, 16.0, 27.0, 29.0, 34.0, 28.0, 48.0, 54.0, 75.0, 106.0, 131.0, 176.0, 320.0, 559.0, 1230.0, 8405.0, 2930686.0, 198406.0, 2968.0, 831.0, 467.0, 280.0, 174.0, 120.0, 100.0, 75.0, 40.0, 55.0, 45.0, 30.0, 22.0, 16.0, 13.0, 14.0, 11.0, 9.0, 11.0, 7.0, 4.0, 6.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-41.09375, -39.759765625, -38.42578125, -37.091796875, -35.7578125, -34.423828125, -33.08984375, -31.755859375, -30.421875, -29.087890625, -27.75390625, -26.419921875, -25.0859375, -23.751953125, -22.41796875, -21.083984375, -19.75, -18.416015625, -17.08203125, -15.748046875, -14.4140625, -13.080078125, -11.74609375, -10.412109375, -9.078125, -7.744140625, -6.41015625, -5.076171875, -3.7421875, -2.408203125, -1.07421875, 0.259765625, 1.59375, 2.927734375, 4.26171875, 5.595703125, 6.9296875, 8.263671875, 9.59765625, 10.931640625, 12.265625, 13.599609375, 14.93359375, 16.267578125, 17.6015625, 18.935546875, 20.26953125, 21.603515625, 22.9375, 24.271484375, 25.60546875, 26.939453125, 28.2734375, 29.607421875, 30.94140625, 32.275390625, 33.609375, 34.943359375, 36.27734375, 37.611328125, 38.9453125, 40.279296875, 41.61328125, 42.947265625, 44.28125]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [2.0, 17.0, 555.0, 435.0, 11.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.344505310058594, -9.471978187561035, -4.599451065063477, 0.27307605743408203, 5.145603179931641, 10.018131256103516, 14.890657424926758, 19.76318359375, 24.635711669921875, 29.50823974609375, 34.380767822265625, 39.253292083740234, 44.12582015991211, 48.998348236083984, 53.870872497558594, 58.74340057373047, 63.615928649902344, 68.48845672607422, 73.3609848022461, 78.23351287841797, 83.10603332519531, 87.97856140136719, 92.85108947753906, 97.72361755371094, 102.59614562988281, 107.46867370605469, 112.34120178222656, 117.21372985839844, 122.08625793457031, 126.95878601074219, 131.83131408691406, 136.70382690429688, 141.57635498046875, 146.44888305664062, 151.3214111328125, 156.19393920898438, 161.06646728515625, 165.93899536132812, 170.8115234375, 175.68405151367188, 180.55657958984375, 185.42910766601562, 190.3016357421875, 195.17416381835938, 200.04669189453125, 204.91921997070312, 209.791748046875, 214.66427612304688, 219.5367889404297, 224.40931701660156, 229.28184509277344, 234.1543731689453, 239.0269012451172, 243.89942932128906, 248.77195739746094, 253.64447021484375, 258.5169982910156, 263.3895263671875, 268.2620544433594, 273.13458251953125, 278.0071105957031, 282.879638671875, 287.7521667480469, 292.62469482421875, 297.4972229003906]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 6.0, 11.0, 9.0, 5.0, 13.0, 13.0, 13.0, 13.0, 21.0, 10.0, 28.0, 23.0, 34.0, 35.0, 29.0, 32.0, 45.0, 37.0, 28.0, 24.0, 37.0, 40.0, 47.0, 35.0, 40.0, 36.0, 40.0, 30.0, 29.0, 30.0, 32.0, 26.0, 20.0, 17.0, 12.0, 18.0, 8.0, 12.0, 12.0, 8.0, 7.0, 8.0, 4.0, 8.0, 3.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-46.500328063964844, -45.11433410644531, -43.72834014892578, -42.342342376708984, -40.95634841918945, -39.57035446166992, -38.184356689453125, -36.798362731933594, -35.41236877441406, -34.02637481689453, -32.640380859375, -31.254383087158203, -29.868389129638672, -28.48239517211914, -27.096399307250977, -25.710403442382812, -24.32440948486328, -22.93841552734375, -21.552419662475586, -20.166423797607422, -18.78042984008789, -17.39443588256836, -16.008440017700195, -14.622445106506348, -13.2364501953125, -11.850455284118652, -10.464460372924805, -9.078465461730957, -7.692470550537109, -6.306475639343262, -4.920480728149414, -3.5344858169555664, -2.1484909057617188, -0.7624959945678711, 0.6234989166259766, 2.009493827819824, 3.395488739013672, 4.7814836502075195, 6.167478561401367, 7.553473472595215, 8.939468383789062, 10.32546329498291, 11.711458206176758, 13.097453117370605, 14.483448028564453, 15.8694429397583, 17.25543785095215, 18.641433715820312, 20.027427673339844, 21.413421630859375, 22.79941749572754, 24.185413360595703, 25.571407318115234, 26.957401275634766, 28.34339714050293, 29.729393005371094, 31.115386962890625, 32.501380920410156, 33.88737487792969, 35.273372650146484, 36.659366607666016, 38.04536056518555, 39.431358337402344, 40.817352294921875, 42.203346252441406]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 5.0, 6.0, 14.0, 11.0, 11.0, 17.0, 19.0, 11.0, 21.0, 33.0, 23.0, 27.0, 49.0, 46.0, 48.0, 36.0, 53.0, 38.0, 47.0, 53.0, 35.0, 43.0, 43.0, 38.0, 33.0, 32.0, 28.0, 27.0, 30.0, 23.0, 17.0, 9.0, 15.0, 14.0, 6.0, 7.0, 7.0, 11.0, 7.0, 1.0, 2.0, 0.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.1171875, -5.9052734375, -5.693359375, -5.4814453125, -5.26953125, -5.0576171875, -4.845703125, -4.6337890625, -4.421875, -4.2099609375, -3.998046875, -3.7861328125, -3.57421875, -3.3623046875, -3.150390625, -2.9384765625, -2.7265625, -2.5146484375, -2.302734375, -2.0908203125, -1.87890625, -1.6669921875, -1.455078125, -1.2431640625, -1.03125, -0.8193359375, -0.607421875, -0.3955078125, -0.18359375, 0.0283203125, 0.240234375, 0.4521484375, 0.6640625, 0.8759765625, 1.087890625, 1.2998046875, 1.51171875, 1.7236328125, 1.935546875, 2.1474609375, 2.359375, 2.5712890625, 2.783203125, 2.9951171875, 3.20703125, 3.4189453125, 3.630859375, 3.8427734375, 4.0546875, 4.2666015625, 4.478515625, 4.6904296875, 4.90234375, 5.1142578125, 5.326171875, 5.5380859375, 5.75, 5.9619140625, 6.173828125, 6.3857421875, 6.59765625, 6.8095703125, 7.021484375, 7.2333984375, 7.4453125]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 1.0, 5.0, 6.0, 8.0, 6.0, 8.0, 22.0, 13.0, 22.0, 23.0, 27.0, 37.0, 46.0, 82.0, 102.0, 171.0, 370.0, 936.0, 3976.0, 48332.0, 1864019.0, 2211957.0, 57651.0, 4502.0, 958.0, 379.0, 188.0, 106.0, 74.0, 53.0, 40.0, 32.0, 29.0, 21.0, 11.0, 16.0, 11.0, 7.0, 6.0, 7.0, 11.0, 6.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.53125, -18.83447265625, -18.1376953125, -17.44091796875, -16.744140625, -16.04736328125, -15.3505859375, -14.65380859375, -13.95703125, -13.26025390625, -12.5634765625, -11.86669921875, -11.169921875, -10.47314453125, -9.7763671875, -9.07958984375, -8.3828125, -7.68603515625, -6.9892578125, -6.29248046875, -5.595703125, -4.89892578125, -4.2021484375, -3.50537109375, -2.80859375, -2.11181640625, -1.4150390625, -0.71826171875, -0.021484375, 0.67529296875, 1.3720703125, 2.06884765625, 2.765625, 3.46240234375, 4.1591796875, 4.85595703125, 5.552734375, 6.24951171875, 6.9462890625, 7.64306640625, 8.33984375, 9.03662109375, 9.7333984375, 10.43017578125, 11.126953125, 11.82373046875, 12.5205078125, 13.21728515625, 13.9140625, 14.61083984375, 15.3076171875, 16.00439453125, 16.701171875, 17.39794921875, 18.0947265625, 18.79150390625, 19.48828125, 20.18505859375, 20.8818359375, 21.57861328125, 22.275390625, 22.97216796875, 23.6689453125, 24.36572265625, 25.0625]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 3.0, 6.0, 5.0, 6.0, 7.0, 8.0, 11.0, 18.0, 25.0, 31.0, 41.0, 46.0, 84.0, 99.0, 132.0, 200.0, 278.0, 279.0, 405.0, 441.0, 381.0, 369.0, 302.0, 234.0, 147.0, 116.0, 104.0, 68.0, 48.0, 43.0, 35.0, 24.0, 22.0, 11.0, 10.0, 2.0, 3.0, 7.0, 6.0, 6.0, 4.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.6640625, -11.3092041015625, -10.954345703125, -10.5994873046875, -10.24462890625, -9.8897705078125, -9.534912109375, -9.1800537109375, -8.8251953125, -8.4703369140625, -8.115478515625, -7.7606201171875, -7.40576171875, -7.0509033203125, -6.696044921875, -6.3411865234375, -5.986328125, -5.6314697265625, -5.276611328125, -4.9217529296875, -4.56689453125, -4.2120361328125, -3.857177734375, -3.5023193359375, -3.1474609375, -2.7926025390625, -2.437744140625, -2.0828857421875, -1.72802734375, -1.3731689453125, -1.018310546875, -0.6634521484375, -0.30859375, 0.0462646484375, 0.401123046875, 0.7559814453125, 1.11083984375, 1.4656982421875, 1.820556640625, 2.1754150390625, 2.5302734375, 2.8851318359375, 3.239990234375, 3.5948486328125, 3.94970703125, 4.3045654296875, 4.659423828125, 5.0142822265625, 5.369140625, 5.7239990234375, 6.078857421875, 6.4337158203125, 6.78857421875, 7.1434326171875, 7.498291015625, 7.8531494140625, 8.2080078125, 8.5628662109375, 8.917724609375, 9.2725830078125, 9.62744140625, 9.9822998046875, 10.337158203125, 10.6920166015625, 11.046875]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 7.0, 5.0, 5.0, 4.0, 5.0, 3.0, 12.0, 8.0, 17.0, 30.0, 28.0, 46.0, 69.0, 88.0, 103.0, 146.0, 165.0, 229.0, 356.0, 798.0, 7545.0, 1395960.0, 2775578.0, 10612.0, 986.0, 430.0, 283.0, 209.0, 152.0, 108.0, 87.0, 44.0, 49.0, 28.0, 26.0, 19.0, 10.0, 14.0, 5.0, 6.0, 1.0, 3.0, 5.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-59.03125, -57.13037109375, -55.2294921875, -53.32861328125, -51.427734375, -49.52685546875, -47.6259765625, -45.72509765625, -43.82421875, -41.92333984375, -40.0224609375, -38.12158203125, -36.220703125, -34.31982421875, -32.4189453125, -30.51806640625, -28.6171875, -26.71630859375, -24.8154296875, -22.91455078125, -21.013671875, -19.11279296875, -17.2119140625, -15.31103515625, -13.41015625, -11.50927734375, -9.6083984375, -7.70751953125, -5.806640625, -3.90576171875, -2.0048828125, -0.10400390625, 1.796875, 3.69775390625, 5.5986328125, 7.49951171875, 9.400390625, 11.30126953125, 13.2021484375, 15.10302734375, 17.00390625, 18.90478515625, 20.8056640625, 22.70654296875, 24.607421875, 26.50830078125, 28.4091796875, 30.31005859375, 32.2109375, 34.11181640625, 36.0126953125, 37.91357421875, 39.814453125, 41.71533203125, 43.6162109375, 45.51708984375, 47.41796875, 49.31884765625, 51.2197265625, 53.12060546875, 55.021484375, 56.92236328125, 58.8232421875, 60.72412109375, 62.625]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 6.0, 7.0, 7.0, 17.0, 30.0, 69.0, 71.0, 99.0, 132.0, 125.0, 138.0, 107.0, 82.0, 53.0, 24.0, 11.0, 14.0, 10.0, 7.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.42529296875, -65.57601165771484, -63.72673034667969, -61.87744903564453, -60.02817153930664, -58.178890228271484, -56.32960891723633, -54.48032760620117, -52.63105010986328, -50.781768798828125, -48.93248748779297, -47.08320617675781, -45.23392868041992, -43.384647369384766, -41.53536605834961, -39.68608474731445, -37.8368034362793, -35.98752212524414, -34.138240814208984, -32.288963317871094, -30.439682006835938, -28.59040069580078, -26.741119384765625, -24.89183807373047, -23.042558670043945, -21.19327735900879, -19.343997955322266, -17.49471664428711, -15.64543628692627, -13.79615592956543, -11.946874618530273, -10.097594261169434, -8.248313903808594, -6.399033546447754, -4.549752712249756, -2.700471878051758, -0.851191520690918, 0.9980888366699219, 2.847370147705078, 4.696650505065918, 6.545930862426758, 8.395211219787598, 10.244491577148438, 12.093772888183594, 13.943053245544434, 15.792333602905273, 17.64161491394043, 19.490894317626953, 21.34017562866211, 23.189456939697266, 25.03873634338379, 26.888017654418945, 28.73729705810547, 30.586578369140625, 32.43585968017578, 34.28514099121094, 36.134422302246094, 37.98370361328125, 39.832984924316406, 41.68226623535156, 43.53154373168945, 45.38082504272461, 47.230106353759766, 49.07938766479492, 50.92866516113281]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 1.0, 7.0, 5.0, 9.0, 3.0, 13.0, 13.0, 17.0, 16.0, 16.0, 12.0, 23.0, 22.0, 27.0, 38.0, 35.0, 40.0, 38.0, 29.0, 37.0, 42.0, 49.0, 44.0, 33.0, 41.0, 35.0, 32.0, 31.0, 26.0, 28.0, 24.0, 28.0, 25.0, 22.0, 22.0, 10.0, 12.0, 14.0, 7.0, 14.0, 11.0, 13.0, 8.0, 8.0, 4.0, 3.0, 5.0, 2.0, 3.0, 3.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0], "bins": [-37.36811828613281, -36.15095520019531, -34.93379211425781, -33.71662902832031, -32.49946594238281, -31.282304763793945, -30.065143585205078, -28.847980499267578, -27.630817413330078, -26.413654327392578, -25.196491241455078, -23.97933006286621, -22.76216697692871, -21.54500389099121, -20.327842712402344, -19.110679626464844, -17.893516540527344, -16.676353454589844, -15.45919132232666, -14.242029190063477, -13.024866104125977, -11.807703018188477, -10.590540885925293, -9.37337875366211, -8.15621566772461, -6.939053058624268, -5.721890449523926, -4.504727840423584, -3.287565231323242, -2.0704026222229004, -0.8532400131225586, 0.363922119140625, 1.581085205078125, 2.798247814178467, 4.015410423278809, 5.23257303237915, 6.449735641479492, 7.666898250579834, 8.884060859680176, 10.10122299194336, 11.31838607788086, 12.53554916381836, 13.752711296081543, 14.969873428344727, 16.187036514282227, 17.404199600219727, 18.621360778808594, 19.838523864746094, 21.055686950683594, 22.272850036621094, 23.490013122558594, 24.70717430114746, 25.92433738708496, 27.14150047302246, 28.358661651611328, 29.575824737548828, 30.792987823486328, 32.01015090942383, 33.22731399536133, 34.44447708129883, 35.66163635253906, 36.87879943847656, 38.09596252441406, 39.31312561035156, 40.53028869628906]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 3.0, 4.0, 7.0, 12.0, 14.0, 12.0, 10.0, 17.0, 20.0, 21.0, 26.0, 28.0, 33.0, 49.0, 41.0, 47.0, 42.0, 54.0, 45.0, 45.0, 42.0, 44.0, 43.0, 40.0, 40.0, 27.0, 44.0, 23.0, 31.0, 21.0, 25.0, 15.0, 13.0, 15.0, 11.0, 9.0, 13.0, 5.0, 3.0, 2.0, 3.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.015625, -5.790283203125, -5.56494140625, -5.339599609375, -5.1142578125, -4.888916015625, -4.66357421875, -4.438232421875, -4.212890625, -3.987548828125, -3.76220703125, -3.536865234375, -3.3115234375, -3.086181640625, -2.86083984375, -2.635498046875, -2.41015625, -2.184814453125, -1.95947265625, -1.734130859375, -1.5087890625, -1.283447265625, -1.05810546875, -0.832763671875, -0.607421875, -0.382080078125, -0.15673828125, 0.068603515625, 0.2939453125, 0.519287109375, 0.74462890625, 0.969970703125, 1.1953125, 1.420654296875, 1.64599609375, 1.871337890625, 2.0966796875, 2.322021484375, 2.54736328125, 2.772705078125, 2.998046875, 3.223388671875, 3.44873046875, 3.674072265625, 3.8994140625, 4.124755859375, 4.35009765625, 4.575439453125, 4.80078125, 5.026123046875, 5.25146484375, 5.476806640625, 5.7021484375, 5.927490234375, 6.15283203125, 6.378173828125, 6.603515625, 6.828857421875, 7.05419921875, 7.279541015625, 7.5048828125, 7.730224609375, 7.95556640625, 8.180908203125, 8.40625]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 5.0, 4.0, 6.0, 18.0, 22.0, 51.0, 61.0, 74.0, 101.0, 172.0, 268.0, 400.0, 574.0, 934.0, 1418.0, 2021.0, 3301.0, 5314.0, 8177.0, 13258.0, 21158.0, 36297.0, 61375.0, 105485.0, 168471.0, 210565.0, 161880.0, 100259.0, 57931.0, 34395.0, 20320.0, 12428.0, 7862.0, 4960.0, 3126.0, 2036.0, 1295.0, 869.0, 526.0, 378.0, 242.0, 164.0, 114.0, 75.0, 62.0, 36.0, 19.0, 18.0, 14.0, 9.0, 4.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.671875, -0.6511688232421875, -0.630462646484375, -0.6097564697265625, -0.58905029296875, -0.5683441162109375, -0.547637939453125, -0.5269317626953125, -0.5062255859375, -0.4855194091796875, -0.464813232421875, -0.4441070556640625, -0.42340087890625, -0.4026947021484375, -0.381988525390625, -0.3612823486328125, -0.340576171875, -0.3198699951171875, -0.299163818359375, -0.2784576416015625, -0.25775146484375, -0.2370452880859375, -0.216339111328125, -0.1956329345703125, -0.1749267578125, -0.1542205810546875, -0.133514404296875, -0.1128082275390625, -0.09210205078125, -0.0713958740234375, -0.050689697265625, -0.0299835205078125, -0.00927734375, 0.0114288330078125, 0.032135009765625, 0.0528411865234375, 0.07354736328125, 0.0942535400390625, 0.114959716796875, 0.1356658935546875, 0.1563720703125, 0.1770782470703125, 0.197784423828125, 0.2184906005859375, 0.23919677734375, 0.2599029541015625, 0.280609130859375, 0.3013153076171875, 0.322021484375, 0.3427276611328125, 0.363433837890625, 0.3841400146484375, 0.40484619140625, 0.4255523681640625, 0.446258544921875, 0.4669647216796875, 0.4876708984375, 0.5083770751953125, 0.529083251953125, 0.5497894287109375, 0.57049560546875, 0.5912017822265625, 0.611907958984375, 0.6326141357421875, 0.6533203125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 1.0, 7.0, 3.0, 6.0, 11.0, 8.0, 20.0, 13.0, 24.0, 19.0, 19.0, 19.0, 30.0, 40.0, 26.0, 41.0, 38.0, 44.0, 54.0, 48.0, 1066.0, 50.0, 48.0, 44.0, 35.0, 44.0, 31.0, 31.0, 24.0, 28.0, 30.0, 23.0, 21.0, 17.0, 9.0, 9.0, 9.0, 15.0, 4.0, 9.0, 1.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.62109375, -4.475830078125, -4.33056640625, -4.185302734375, -4.0400390625, -3.894775390625, -3.74951171875, -3.604248046875, -3.458984375, -3.313720703125, -3.16845703125, -3.023193359375, -2.8779296875, -2.732666015625, -2.58740234375, -2.442138671875, -2.296875, -2.151611328125, -2.00634765625, -1.861083984375, -1.7158203125, -1.570556640625, -1.42529296875, -1.280029296875, -1.134765625, -0.989501953125, -0.84423828125, -0.698974609375, -0.5537109375, -0.408447265625, -0.26318359375, -0.117919921875, 0.02734375, 0.172607421875, 0.31787109375, 0.463134765625, 0.6083984375, 0.753662109375, 0.89892578125, 1.044189453125, 1.189453125, 1.334716796875, 1.47998046875, 1.625244140625, 1.7705078125, 1.915771484375, 2.06103515625, 2.206298828125, 2.3515625, 2.496826171875, 2.64208984375, 2.787353515625, 2.9326171875, 3.077880859375, 3.22314453125, 3.368408203125, 3.513671875, 3.658935546875, 3.80419921875, 3.949462890625, 4.0947265625, 4.239990234375, 4.38525390625, 4.530517578125, 4.67578125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 4.0, 10.0, 7.0, 10.0, 17.0, 19.0, 30.0, 53.0, 84.0, 106.0, 194.0, 286.0, 480.0, 770.0, 1167.0, 1929.0, 3120.0, 5204.0, 8387.0, 14107.0, 23947.0, 40967.0, 72757.0, 124250.0, 180960.0, 1243686.0, 151337.0, 94182.0, 53911.0, 30426.0, 17659.0, 10658.0, 6270.0, 3860.0, 2400.0, 1405.0, 924.0, 577.0, 357.0, 215.0, 121.0, 101.0, 69.0, 37.0, 31.0, 18.0, 11.0, 9.0, 2.0, 2.0, 4.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.49951171875, -0.482421875, -0.46533203125, -0.4482421875, -0.43115234375, -0.4140625, -0.39697265625, -0.3798828125, -0.36279296875, -0.345703125, -0.32861328125, -0.3115234375, -0.29443359375, -0.27734375, -0.26025390625, -0.2431640625, -0.22607421875, -0.208984375, -0.19189453125, -0.1748046875, -0.15771484375, -0.140625, -0.12353515625, -0.1064453125, -0.08935546875, -0.072265625, -0.05517578125, -0.0380859375, -0.02099609375, -0.00390625, 0.01318359375, 0.0302734375, 0.04736328125, 0.064453125, 0.08154296875, 0.0986328125, 0.11572265625, 0.1328125, 0.14990234375, 0.1669921875, 0.18408203125, 0.201171875, 0.21826171875, 0.2353515625, 0.25244140625, 0.26953125, 0.28662109375, 0.3037109375, 0.32080078125, 0.337890625, 0.35498046875, 0.3720703125, 0.38916015625, 0.40625, 0.42333984375, 0.4404296875, 0.45751953125, 0.474609375, 0.49169921875, 0.5087890625, 0.52587890625, 0.54296875, 0.56005859375, 0.5771484375, 0.59423828125]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 7.0, 5.0, 0.0, 5.0, 8.0, 11.0, 9.0, 13.0, 22.0, 15.0, 13.0, 27.0, 24.0, 37.0, 26.0, 39.0, 50.0, 38.0, 44.0, 51.0, 52.0, 60.0, 61.0, 47.0, 44.0, 45.0, 32.0, 29.0, 23.0, 35.0, 23.0, 19.0, 20.0, 13.0, 4.0, 9.0, 9.0, 7.0, 5.0, 6.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0021762847900390625, -0.0021111667156219482, -0.002046048641204834, -0.0019809305667877197, -0.0019158124923706055, -0.0018506944179534912, -0.001785576343536377, -0.0017204582691192627, -0.0016553401947021484, -0.0015902221202850342, -0.00152510404586792, -0.0014599859714508057, -0.0013948678970336914, -0.0013297498226165771, -0.0012646317481994629, -0.0011995136737823486, -0.0011343955993652344, -0.0010692775249481201, -0.0010041594505310059, -0.0009390413761138916, -0.0008739233016967773, -0.0008088052272796631, -0.0007436871528625488, -0.0006785690784454346, -0.0006134510040283203, -0.0005483329296112061, -0.0004832148551940918, -0.00041809678077697754, -0.0003529787063598633, -0.000287860631942749, -0.00022274255752563477, -0.0001576244831085205, -9.250640869140625e-05, -2.7388334274291992e-05, 3.7729740142822266e-05, 0.00010284781455993652, 0.00016796588897705078, 0.00023308396339416504, 0.0002982020378112793, 0.00036332011222839355, 0.0004284381866455078, 0.0004935562610626221, 0.0005586743354797363, 0.0006237924098968506, 0.0006889104843139648, 0.0007540285587310791, 0.0008191466331481934, 0.0008842647075653076, 0.0009493827819824219, 0.0010145008563995361, 0.0010796189308166504, 0.0011447370052337646, 0.001209855079650879, 0.0012749731540679932, 0.0013400912284851074, 0.0014052093029022217, 0.001470327377319336, 0.0015354454517364502, 0.0016005635261535645, 0.0016656816005706787, 0.001730799674987793, 0.0017959177494049072, 0.0018610358238220215, 0.0019261538982391357, 0.00199127197265625]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 7.0, 3.0, 8.0, 1.0, 19.0, 13.0, 12.0, 22.0, 27.0, 29.0, 36.0, 47.0, 57.0, 69.0, 84.0, 133.0, 199.0, 396.0, 1247.0, 106157.0, 935313.0, 3277.0, 566.0, 224.0, 152.0, 100.0, 67.0, 56.0, 50.0, 34.0, 28.0, 24.0, 23.0, 19.0, 10.0, 10.0, 7.0, 7.0, 5.0, 7.0, 8.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.042572021484375, -0.04116249084472656, -0.039752960205078125, -0.03834342956542969, -0.03693389892578125, -0.03552436828613281, -0.034114837646484375, -0.03270530700683594, -0.0312957763671875, -0.029886245727539062, -0.028476715087890625, -0.027067184448242188, -0.02565765380859375, -0.024248123168945312, -0.022838592529296875, -0.021429061889648438, -0.02001953125, -0.018610000610351562, -0.017200469970703125, -0.015790939331054688, -0.01438140869140625, -0.012971878051757812, -0.011562347412109375, -0.010152816772460938, -0.0087432861328125, -0.0073337554931640625, -0.005924224853515625, -0.0045146942138671875, -0.00310516357421875, -0.0016956329345703125, -0.000286102294921875, 0.0011234283447265625, 0.002532958984375, 0.0039424896240234375, 0.005352020263671875, 0.0067615509033203125, 0.00817108154296875, 0.009580612182617188, 0.010990142822265625, 0.012399673461914062, 0.0138092041015625, 0.015218734741210938, 0.016628265380859375, 0.018037796020507812, 0.01944732666015625, 0.020856857299804688, 0.022266387939453125, 0.023675918579101562, 0.02508544921875, 0.026494979858398438, 0.027904510498046875, 0.029314041137695312, 0.03072357177734375, 0.03213310241699219, 0.033542633056640625, 0.03495216369628906, 0.0363616943359375, 0.03777122497558594, 0.039180755615234375, 0.04059028625488281, 0.04199981689453125, 0.04340934753417969, 0.044818878173828125, 0.04622840881347656, 0.047637939453125]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 182.0, 793.0, 41.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02585594728589058, -0.025371214374899864, -0.02488648146390915, -0.024401746690273285, -0.02391701377928257, -0.023432280868291855, -0.02294754795730114, -0.022462815046310425, -0.02197808027267456, -0.021493347361683846, -0.02100861445069313, -0.020523879677057266, -0.02003914676606655, -0.019554413855075836, -0.01906968094408512, -0.018584948033094406, -0.018100213259458542, -0.017615480348467827, -0.017130747437477112, -0.016646012663841248, -0.016161279752850533, -0.015676546841859818, -0.015191813930869102, -0.014707080088555813, -0.014222348108887672, -0.013737615197896957, -0.013252881355583668, -0.012768148444592953, -0.012283414602279663, -0.011798681691288948, -0.011313948780298233, -0.010829214937984943, -0.010344480164349079, -0.009859747253358364, -0.009375013411045074, -0.00889028050005436, -0.00840554665774107, -0.007920813746750355, -0.007436080370098352, -0.00695134699344635, -0.006466613616794348, -0.005981880240142345, -0.005497146863490343, -0.005012413486838341, -0.004527680575847626, -0.004042946733534336, -0.003558213822543621, -0.0030734804458916187, -0.0025887470692396164, -0.002104013692587614, -0.0016192804323509336, -0.001134547172114253, -0.0006498137954622507, -0.00016508041881024837, 0.0003196527250111103, 0.0008043861016631126, 0.001289119478315115, 0.0017738528549671173, 0.0022585862316191196, 0.0027433193754404783, 0.0032280527520924807, 0.003712786128744483, 0.004197519272565842, 0.004682252649217844, 0.005166986025869846]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 3.0, 3.0, 0.0, 5.0, 6.0, 6.0, 4.0, 7.0, 10.0, 10.0, 14.0, 18.0, 13.0, 25.0, 25.0, 24.0, 27.0, 24.0, 38.0, 25.0, 36.0, 33.0, 38.0, 38.0, 34.0, 37.0, 38.0, 55.0, 37.0, 32.0, 33.0, 43.0, 25.0, 31.0, 24.0, 36.0, 18.0, 22.0, 16.0, 26.0, 11.0, 13.0, 11.0, 7.0, 7.0, 2.0, 6.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011115670204162598, -0.001074160449206829, -0.0010367538779973984, -0.0009993473067879677, -0.000961940735578537, -0.0009245341643691063, -0.0008871275931596756, -0.0008497210219502449, -0.0008123144507408142, -0.0007749078795313835, -0.0007375013083219528, -0.0007000947371125221, -0.0006626881659030914, -0.0006252815946936607, -0.00058787502348423, -0.0005504684522747993, -0.0005130618810653687, -0.00047565530985593796, -0.00043824873864650726, -0.00040084216743707657, -0.0003634355962276459, -0.0003260290250182152, -0.0002886224538087845, -0.0002512158825993538, -0.0002138093113899231, -0.0001764027401804924, -0.0001389961689710617, -0.00010158959776163101, -6.418302655220032e-05, -2.6776455342769623e-05, 1.0630115866661072e-05, 4.8036687076091766e-05, 8.544325828552246e-05, 0.00012284982949495316, 0.00016025640070438385, 0.00019766297191381454, 0.00023506954312324524, 0.00027247611433267593, 0.00030988268554210663, 0.0003472892567515373, 0.000384695827960968, 0.0004221023991703987, 0.0004595089703798294, 0.0004969155415892601, 0.0005343221127986908, 0.0005717286840081215, 0.0006091352552175522, 0.0006465418264269829, 0.0006839483976364136, 0.0007213549688458443, 0.000758761540055275, 0.0007961681112647057, 0.0008335746824741364, 0.000870981253683567, 0.0009083878248929977, 0.0009457943961024284, 0.0009832009673118591, 0.0010206075385212898, 0.0010580141097307205, 0.0010954206809401512, 0.001132827252149582, 0.0011702338233590126, 0.0012076403945684433, 0.001245046965777874, 0.0012824535369873047]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 3.0, 4.0, 7.0, 12.0, 14.0, 12.0, 10.0, 17.0, 20.0, 21.0, 26.0, 28.0, 33.0, 49.0, 41.0, 47.0, 42.0, 54.0, 45.0, 45.0, 42.0, 44.0, 43.0, 40.0, 40.0, 27.0, 44.0, 23.0, 30.0, 22.0, 25.0, 15.0, 13.0, 15.0, 11.0, 9.0, 13.0, 5.0, 3.0, 2.0, 3.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.015625, -5.790283203125, -5.56494140625, -5.339599609375, -5.1142578125, -4.888916015625, -4.66357421875, -4.438232421875, -4.212890625, -3.987548828125, -3.76220703125, -3.536865234375, -3.3115234375, -3.086181640625, -2.86083984375, -2.635498046875, -2.41015625, -2.184814453125, -1.95947265625, -1.734130859375, -1.5087890625, -1.283447265625, -1.05810546875, -0.832763671875, -0.607421875, -0.382080078125, -0.15673828125, 0.068603515625, 0.2939453125, 0.519287109375, 0.74462890625, 0.969970703125, 1.1953125, 1.420654296875, 1.64599609375, 1.871337890625, 2.0966796875, 2.322021484375, 2.54736328125, 2.772705078125, 2.998046875, 3.223388671875, 3.44873046875, 3.674072265625, 3.8994140625, 4.124755859375, 4.35009765625, 4.575439453125, 4.80078125, 5.026123046875, 5.25146484375, 5.476806640625, 5.7021484375, 5.927490234375, 6.15283203125, 6.378173828125, 6.603515625, 6.828857421875, 7.05419921875, 7.279541015625, 7.5048828125, 7.730224609375, 7.95556640625, 8.180908203125, 8.40625]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 5.0, 9.0, 11.0, 19.0, 20.0, 23.0, 24.0, 42.0, 68.0, 76.0, 93.0, 150.0, 231.0, 369.0, 693.0, 1752.0, 7802.0, 50992.0, 613109.0, 331673.0, 32864.0, 5533.0, 1381.0, 578.0, 312.0, 231.0, 117.0, 90.0, 68.0, 57.0, 43.0, 19.0, 25.0, 16.0, 18.0, 15.0, 8.0, 3.0, 2.0, 4.0, 3.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.125, -10.7113037109375, -10.297607421875, -9.8839111328125, -9.47021484375, -9.0565185546875, -8.642822265625, -8.2291259765625, -7.8154296875, -7.4017333984375, -6.988037109375, -6.5743408203125, -6.16064453125, -5.7469482421875, -5.333251953125, -4.9195556640625, -4.505859375, -4.0921630859375, -3.678466796875, -3.2647705078125, -2.85107421875, -2.4373779296875, -2.023681640625, -1.6099853515625, -1.1962890625, -0.7825927734375, -0.368896484375, 0.0447998046875, 0.45849609375, 0.8721923828125, 1.285888671875, 1.6995849609375, 2.11328125, 2.5269775390625, 2.940673828125, 3.3543701171875, 3.76806640625, 4.1817626953125, 4.595458984375, 5.0091552734375, 5.4228515625, 5.8365478515625, 6.250244140625, 6.6639404296875, 7.07763671875, 7.4913330078125, 7.905029296875, 8.3187255859375, 8.732421875, 9.1461181640625, 9.559814453125, 9.9735107421875, 10.38720703125, 10.8009033203125, 11.214599609375, 11.6282958984375, 12.0419921875, 12.4556884765625, 12.869384765625, 13.2830810546875, 13.69677734375, 14.1104736328125, 14.524169921875, 14.9378662109375, 15.3515625]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 6.0, 6.0, 10.0, 5.0, 17.0, 12.0, 17.0, 24.0, 25.0, 29.0, 37.0, 38.0, 49.0, 45.0, 63.0, 96.0, 1690.0, 362.0, 91.0, 64.0, 62.0, 55.0, 42.0, 26.0, 39.0, 28.0, 35.0, 21.0, 9.0, 13.0, 8.0, 6.0, 9.0, 6.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.5625, -28.663818359375, -27.76513671875, -26.866455078125, -25.9677734375, -25.069091796875, -24.17041015625, -23.271728515625, -22.373046875, -21.474365234375, -20.57568359375, -19.677001953125, -18.7783203125, -17.879638671875, -16.98095703125, -16.082275390625, -15.18359375, -14.284912109375, -13.38623046875, -12.487548828125, -11.5888671875, -10.690185546875, -9.79150390625, -8.892822265625, -7.994140625, -7.095458984375, -6.19677734375, -5.298095703125, -4.3994140625, -3.500732421875, -2.60205078125, -1.703369140625, -0.8046875, 0.093994140625, 0.99267578125, 1.891357421875, 2.7900390625, 3.688720703125, 4.58740234375, 5.486083984375, 6.384765625, 7.283447265625, 8.18212890625, 9.080810546875, 9.9794921875, 10.878173828125, 11.77685546875, 12.675537109375, 13.57421875, 14.472900390625, 15.37158203125, 16.270263671875, 17.1689453125, 18.067626953125, 18.96630859375, 19.864990234375, 20.763671875, 21.662353515625, 22.56103515625, 23.459716796875, 24.3583984375, 25.257080078125, 26.15576171875, 27.054443359375, 27.953125]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 6.0, 6.0, 9.0, 7.0, 12.0, 12.0, 19.0, 36.0, 39.0, 42.0, 36.0, 69.0, 102.0, 180.0, 377.0, 972.0, 209224.0, 2932270.0, 1332.0, 371.0, 180.0, 110.0, 69.0, 48.0, 37.0, 32.0, 27.0, 21.0, 13.0, 16.0, 9.0, 10.0, 6.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.75, -82.0244140625, -79.298828125, -76.5732421875, -73.84765625, -71.1220703125, -68.396484375, -65.6708984375, -62.9453125, -60.2197265625, -57.494140625, -54.7685546875, -52.04296875, -49.3173828125, -46.591796875, -43.8662109375, -41.140625, -38.4150390625, -35.689453125, -32.9638671875, -30.23828125, -27.5126953125, -24.787109375, -22.0615234375, -19.3359375, -16.6103515625, -13.884765625, -11.1591796875, -8.43359375, -5.7080078125, -2.982421875, -0.2568359375, 2.46875, 5.1943359375, 7.919921875, 10.6455078125, 13.37109375, 16.0966796875, 18.822265625, 21.5478515625, 24.2734375, 26.9990234375, 29.724609375, 32.4501953125, 35.17578125, 37.9013671875, 40.626953125, 43.3525390625, 46.078125, 48.8037109375, 51.529296875, 54.2548828125, 56.98046875, 59.7060546875, 62.431640625, 65.1572265625, 67.8828125, 70.6083984375, 73.333984375, 76.0595703125, 78.78515625, 81.5107421875, 84.236328125, 86.9619140625, 89.6875]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 8.0, 301.0, 645.0, 62.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-79.72957611083984, -75.79257202148438, -71.8555679321289, -67.91856384277344, -63.9815673828125, -60.04456329345703, -56.10755920410156, -52.170555114746094, -48.23355484008789, -44.29655075073242, -40.35955047607422, -36.42254638671875, -32.48554229736328, -28.548542022705078, -24.61153793334961, -20.674535751342773, -16.737533569335938, -12.800531387329102, -8.86352825164795, -4.926525115966797, -0.9895229339599609, 2.947479248046875, 6.884483337402344, 10.82148551940918, 14.758487701416016, 18.69548988342285, 22.632492065429688, 26.569496154785156, 30.506498336791992, 34.44350051879883, 38.3805046081543, 42.3175048828125, 46.25450134277344, 50.191505432128906, 54.12850570678711, 58.06550979614258, 62.00251007080078, 65.93951416015625, 69.87651824951172, 73.81352233886719, 77.75051879882812, 81.6875228881836, 85.62452697753906, 89.5615234375, 93.49852752685547, 97.43553161621094, 101.3725357055664, 105.30953979492188, 109.24654388427734, 113.18354797363281, 117.12055206298828, 121.05755615234375, 124.99455261230469, 128.93154907226562, 132.86856079101562, 136.80555725097656, 140.74256896972656, 144.6795654296875, 148.6165771484375, 152.55357360839844, 156.49058532714844, 160.42758178710938, 164.36459350585938, 168.3015899658203, 172.23858642578125]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 1.0, 8.0, 3.0, 6.0, 1.0, 12.0, 8.0, 15.0, 13.0, 11.0, 23.0, 15.0, 16.0, 20.0, 16.0, 33.0, 31.0, 28.0, 45.0, 41.0, 38.0, 46.0, 36.0, 48.0, 40.0, 36.0, 40.0, 36.0, 43.0, 39.0, 35.0, 30.0, 26.0, 25.0, 21.0, 21.0, 20.0, 12.0, 11.0, 14.0, 9.0, 9.0, 10.0, 4.0, 4.0, 2.0, 1.0, 0.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-64.33148956298828, -62.33515167236328, -60.33881759643555, -58.34247970581055, -56.34614181518555, -54.34980773925781, -52.35346984863281, -50.35713195800781, -48.36079406738281, -46.36445617675781, -44.36812210083008, -42.37178421020508, -40.37544631958008, -38.379112243652344, -36.382774353027344, -34.386436462402344, -32.39010238647461, -30.393766403198242, -28.397428512573242, -26.401092529296875, -24.404754638671875, -22.408418655395508, -20.41208267211914, -18.41574478149414, -16.419408798217773, -14.42307186126709, -12.426734924316406, -10.430398941040039, -8.434062004089355, -6.437725067138672, -4.441389083862305, -2.445052146911621, -0.4487152099609375, 1.547621488571167, 3.5439581871032715, 5.540294647216797, 7.5366315841674805, 9.532968521118164, 11.529304504394531, 13.525641441345215, 15.521978378295898, 17.518314361572266, 19.514652252197266, 21.510988235473633, 23.50732421875, 25.503662109375, 27.499998092651367, 29.496334075927734, 31.492671966552734, 33.489009857177734, 35.48534393310547, 37.48168182373047, 39.47801971435547, 41.47435760498047, 43.4706916809082, 45.4670295715332, 47.46336364746094, 49.45970153808594, 51.45603561401367, 53.45237350463867, 55.44871139526367, 57.445045471191406, 59.441383361816406, 61.437721252441406, 63.434059143066406]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 8.0, 10.0, 13.0, 9.0, 6.0, 12.0, 22.0, 17.0, 24.0, 22.0, 34.0, 36.0, 43.0, 40.0, 46.0, 47.0, 67.0, 43.0, 38.0, 38.0, 43.0, 47.0, 49.0, 32.0, 46.0, 33.0, 28.0, 24.0, 18.0, 14.0, 23.0, 18.0, 12.0, 11.0, 8.0, 5.0, 4.0, 5.0, 3.0, 1.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.75390625, -6.50726318359375, -6.2606201171875, -6.01397705078125, -5.767333984375, -5.52069091796875, -5.2740478515625, -5.02740478515625, -4.78076171875, -4.53411865234375, -4.2874755859375, -4.04083251953125, -3.794189453125, -3.54754638671875, -3.3009033203125, -3.05426025390625, -2.8076171875, -2.56097412109375, -2.3143310546875, -2.06768798828125, -1.821044921875, -1.57440185546875, -1.3277587890625, -1.08111572265625, -0.83447265625, -0.58782958984375, -0.3411865234375, -0.09454345703125, 0.152099609375, 0.39874267578125, 0.6453857421875, 0.89202880859375, 1.138671875, 1.38531494140625, 1.6319580078125, 1.87860107421875, 2.125244140625, 2.37188720703125, 2.6185302734375, 2.86517333984375, 3.11181640625, 3.35845947265625, 3.6051025390625, 3.85174560546875, 4.098388671875, 4.34503173828125, 4.5916748046875, 4.83831787109375, 5.0849609375, 5.33160400390625, 5.5782470703125, 5.82489013671875, 6.071533203125, 6.31817626953125, 6.5648193359375, 6.81146240234375, 7.05810546875, 7.30474853515625, 7.5513916015625, 7.79803466796875, 8.044677734375, 8.29132080078125, 8.5379638671875, 8.78460693359375, 9.03125]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 10.0, 3.0, 10.0, 12.0, 10.0, 12.0, 29.0, 28.0, 38.0, 59.0, 71.0, 86.0, 141.0, 241.0, 430.0, 791.0, 1642.0, 4181.0, 13449.0, 54486.0, 276945.0, 1096710.0, 1739725.0, 783709.0, 172009.0, 34212.0, 9132.0, 3059.0, 1318.0, 673.0, 360.0, 219.0, 133.0, 94.0, 75.0, 54.0, 41.0, 24.0, 20.0, 13.0, 9.0, 7.0, 10.0, 4.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8828125, -8.5802001953125, -8.277587890625, -7.9749755859375, -7.67236328125, -7.3697509765625, -7.067138671875, -6.7645263671875, -6.4619140625, -6.1593017578125, -5.856689453125, -5.5540771484375, -5.25146484375, -4.9488525390625, -4.646240234375, -4.3436279296875, -4.041015625, -3.7384033203125, -3.435791015625, -3.1331787109375, -2.83056640625, -2.5279541015625, -2.225341796875, -1.9227294921875, -1.6201171875, -1.3175048828125, -1.014892578125, -0.7122802734375, -0.40966796875, -0.1070556640625, 0.195556640625, 0.4981689453125, 0.80078125, 1.1033935546875, 1.406005859375, 1.7086181640625, 2.01123046875, 2.3138427734375, 2.616455078125, 2.9190673828125, 3.2216796875, 3.5242919921875, 3.826904296875, 4.1295166015625, 4.43212890625, 4.7347412109375, 5.037353515625, 5.3399658203125, 5.642578125, 5.9451904296875, 6.247802734375, 6.5504150390625, 6.85302734375, 7.1556396484375, 7.458251953125, 7.7608642578125, 8.0634765625, 8.3660888671875, 8.668701171875, 8.9713134765625, 9.27392578125, 9.5765380859375, 9.879150390625, 10.1817626953125, 10.484375]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 4.0, 2.0, 11.0, 6.0, 16.0, 9.0, 16.0, 19.0, 29.0, 39.0, 51.0, 50.0, 77.0, 103.0, 136.0, 158.0, 216.0, 237.0, 306.0, 351.0, 364.0, 372.0, 302.0, 255.0, 207.0, 157.0, 134.0, 93.0, 75.0, 65.0, 48.0, 37.0, 22.0, 26.0, 21.0, 15.0, 14.0, 6.0, 2.0, 3.0, 3.0, 6.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.640625, -10.3017578125, -9.962890625, -9.6240234375, -9.28515625, -8.9462890625, -8.607421875, -8.2685546875, -7.9296875, -7.5908203125, -7.251953125, -6.9130859375, -6.57421875, -6.2353515625, -5.896484375, -5.5576171875, -5.21875, -4.8798828125, -4.541015625, -4.2021484375, -3.86328125, -3.5244140625, -3.185546875, -2.8466796875, -2.5078125, -2.1689453125, -1.830078125, -1.4912109375, -1.15234375, -0.8134765625, -0.474609375, -0.1357421875, 0.203125, 0.5419921875, 0.880859375, 1.2197265625, 1.55859375, 1.8974609375, 2.236328125, 2.5751953125, 2.9140625, 3.2529296875, 3.591796875, 3.9306640625, 4.26953125, 4.6083984375, 4.947265625, 5.2861328125, 5.625, 5.9638671875, 6.302734375, 6.6416015625, 6.98046875, 7.3193359375, 7.658203125, 7.9970703125, 8.3359375, 8.6748046875, 9.013671875, 9.3525390625, 9.69140625, 10.0302734375, 10.369140625, 10.7080078125, 11.046875]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 7.0, 4.0, 5.0, 11.0, 7.0, 17.0, 25.0, 36.0, 41.0, 59.0, 69.0, 101.0, 106.0, 151.0, 196.0, 269.0, 412.0, 650.0, 1584.0, 8180.0, 284062.0, 3791264.0, 98890.0, 4994.0, 1185.0, 589.0, 349.0, 261.0, 203.0, 133.0, 102.0, 79.0, 55.0, 50.0, 31.0, 31.0, 19.0, 11.0, 13.0, 9.0, 6.0, 5.0, 3.0, 3.0, 3.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-42.28125, -40.9755859375, -39.669921875, -38.3642578125, -37.05859375, -35.7529296875, -34.447265625, -33.1416015625, -31.8359375, -30.5302734375, -29.224609375, -27.9189453125, -26.61328125, -25.3076171875, -24.001953125, -22.6962890625, -21.390625, -20.0849609375, -18.779296875, -17.4736328125, -16.16796875, -14.8623046875, -13.556640625, -12.2509765625, -10.9453125, -9.6396484375, -8.333984375, -7.0283203125, -5.72265625, -4.4169921875, -3.111328125, -1.8056640625, -0.5, 0.8056640625, 2.111328125, 3.4169921875, 4.72265625, 6.0283203125, 7.333984375, 8.6396484375, 9.9453125, 11.2509765625, 12.556640625, 13.8623046875, 15.16796875, 16.4736328125, 17.779296875, 19.0849609375, 20.390625, 21.6962890625, 23.001953125, 24.3076171875, 25.61328125, 26.9189453125, 28.224609375, 29.5302734375, 30.8359375, 32.1416015625, 33.447265625, 34.7529296875, 36.05859375, 37.3642578125, 38.669921875, 39.9755859375, 41.28125]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 33.0, 653.0, 324.0, 7.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-216.59719848632812, -202.88308715820312, -189.1689910888672, -175.4548797607422, -161.74078369140625, -148.02667236328125, -134.31256103515625, -120.59845733642578, -106.88435363769531, -93.17024993896484, -79.45614624023438, -65.74203491210938, -52.027931213378906, -38.31382751464844, -24.599716186523438, -10.885612487792969, 2.8284912109375, 16.5425968170166, 30.256702423095703, 43.97080993652344, 57.684913635253906, 71.39901733398438, 85.11312866210938, 98.82723236083984, 112.54133605957031, 126.25543975830078, 139.96954345703125, 153.68365478515625, 167.39776611328125, 181.1118621826172, 194.8259735107422, 208.54006958007812, 222.25421142578125, 235.96832275390625, 249.6824188232422, 263.39654541015625, 277.1106262207031, 290.8247375488281, 304.5388488769531, 318.2529602050781, 331.967041015625, 345.68115234375, 359.395263671875, 373.109375, 386.8234558105469, 400.5375671386719, 414.2516784667969, 427.9657897949219, 441.6799011230469, 455.3940124511719, 469.1081237792969, 482.82220458984375, 496.53631591796875, 510.25042724609375, 523.9645385742188, 537.6786499023438, 551.3927612304688, 565.1068725585938, 578.8209838867188, 592.5350952148438, 606.2492065429688, 619.9632568359375, 633.6773681640625, 647.3914794921875, 661.1055908203125]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 5.0, 8.0, 10.0, 8.0, 11.0, 20.0, 16.0, 13.0, 32.0, 31.0, 26.0, 38.0, 36.0, 43.0, 31.0, 31.0, 40.0, 48.0, 39.0, 47.0, 42.0, 37.0, 40.0, 40.0, 38.0, 37.0, 34.0, 28.0, 27.0, 33.0, 15.0, 18.0, 19.0, 11.0, 10.0, 8.0, 9.0, 4.0, 5.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.46484375, -45.00541687011719, -43.545989990234375, -42.08656311035156, -40.627140045166016, -39.1677131652832, -37.70828628540039, -36.24885940551758, -34.78943634033203, -33.33000946044922, -31.87058448791504, -30.411157608032227, -28.951732635498047, -27.492305755615234, -26.032878875732422, -24.57345199584961, -23.114025115966797, -21.654598236083984, -20.195173263549805, -18.735746383666992, -17.276321411132812, -15.81689453125, -14.357467651367188, -12.898041725158691, -11.438615798950195, -9.9791898727417, -8.519763946533203, -7.060337066650391, -5.6009111404418945, -4.141485214233398, -2.682058334350586, -1.2226324081420898, 0.23679351806640625, 1.6962196826934814, 3.1556458473205566, 4.615072250366211, 6.074498176574707, 7.533924102783203, 8.993350982666016, 10.452776908874512, 11.912202835083008, 13.371628761291504, 14.8310546875, 16.290481567382812, 17.749908447265625, 19.209333419799805, 20.668760299682617, 22.128185272216797, 23.58761215209961, 25.047039031982422, 26.5064640045166, 27.965890884399414, 29.425315856933594, 30.884742736816406, 32.34416961669922, 33.80359649658203, 35.263023376464844, 36.722450256347656, 38.18187713623047, 39.64130401611328, 41.10072708129883, 42.56015396118164, 44.01958084106445, 45.479007720947266, 46.93843078613281]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 6.0, 6.0, 6.0, 4.0, 10.0, 7.0, 16.0, 16.0, 16.0, 26.0, 23.0, 22.0, 26.0, 36.0, 38.0, 42.0, 36.0, 38.0, 34.0, 50.0, 45.0, 40.0, 39.0, 56.0, 37.0, 41.0, 30.0, 35.0, 32.0, 27.0, 25.0, 25.0, 18.0, 13.0, 24.0, 15.0, 10.0, 10.0, 9.0, 8.0, 3.0, 5.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.7265625, -5.5003662109375, -5.274169921875, -5.0479736328125, -4.82177734375, -4.5955810546875, -4.369384765625, -4.1431884765625, -3.9169921875, -3.6907958984375, -3.464599609375, -3.2384033203125, -3.01220703125, -2.7860107421875, -2.559814453125, -2.3336181640625, -2.107421875, -1.8812255859375, -1.655029296875, -1.4288330078125, -1.20263671875, -0.9764404296875, -0.750244140625, -0.5240478515625, -0.2978515625, -0.0716552734375, 0.154541015625, 0.3807373046875, 0.60693359375, 0.8331298828125, 1.059326171875, 1.2855224609375, 1.51171875, 1.7379150390625, 1.964111328125, 2.1903076171875, 2.41650390625, 2.6427001953125, 2.868896484375, 3.0950927734375, 3.3212890625, 3.5474853515625, 3.773681640625, 3.9998779296875, 4.22607421875, 4.4522705078125, 4.678466796875, 4.9046630859375, 5.130859375, 5.3570556640625, 5.583251953125, 5.8094482421875, 6.03564453125, 6.2618408203125, 6.488037109375, 6.7142333984375, 6.9404296875, 7.1666259765625, 7.392822265625, 7.6190185546875, 7.84521484375, 8.0714111328125, 8.297607421875, 8.5238037109375, 8.75]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 8.0, 12.0, 23.0, 22.0, 26.0, 58.0, 85.0, 129.0, 206.0, 325.0, 449.0, 706.0, 1072.0, 1676.0, 2563.0, 4139.0, 6613.0, 10863.0, 17681.0, 30513.0, 53833.0, 95654.0, 159567.0, 214839.0, 180435.0, 112505.0, 63993.0, 36039.0, 21010.0, 12751.0, 7570.0, 4723.0, 2979.0, 1973.0, 1262.0, 746.0, 494.0, 345.0, 245.0, 148.0, 89.0, 53.0, 48.0, 29.0, 25.0, 11.0, 13.0, 4.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.73486328125, -0.7123565673828125, -0.689849853515625, -0.6673431396484375, -0.64483642578125, -0.6223297119140625, -0.599822998046875, -0.5773162841796875, -0.5548095703125, -0.5323028564453125, -0.509796142578125, -0.4872894287109375, -0.46478271484375, -0.4422760009765625, -0.419769287109375, -0.3972625732421875, -0.374755859375, -0.3522491455078125, -0.329742431640625, -0.3072357177734375, -0.28472900390625, -0.2622222900390625, -0.239715576171875, -0.2172088623046875, -0.1947021484375, -0.1721954345703125, -0.149688720703125, -0.1271820068359375, -0.10467529296875, -0.0821685791015625, -0.059661865234375, -0.0371551513671875, -0.0146484375, 0.0078582763671875, 0.030364990234375, 0.0528717041015625, 0.07537841796875, 0.0978851318359375, 0.120391845703125, 0.1428985595703125, 0.1654052734375, 0.1879119873046875, 0.210418701171875, 0.2329254150390625, 0.25543212890625, 0.2779388427734375, 0.300445556640625, 0.3229522705078125, 0.345458984375, 0.3679656982421875, 0.390472412109375, 0.4129791259765625, 0.43548583984375, 0.4579925537109375, 0.480499267578125, 0.5030059814453125, 0.5255126953125, 0.5480194091796875, 0.570526123046875, 0.5930328369140625, 0.61553955078125, 0.6380462646484375, 0.660552978515625, 0.6830596923828125, 0.70556640625]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 7.0, 4.0, 3.0, 8.0, 6.0, 8.0, 7.0, 15.0, 13.0, 22.0, 25.0, 22.0, 19.0, 24.0, 24.0, 37.0, 23.0, 29.0, 27.0, 31.0, 40.0, 46.0, 47.0, 1057.0, 43.0, 30.0, 49.0, 36.0, 29.0, 33.0, 22.0, 26.0, 16.0, 16.0, 25.0, 27.0, 22.0, 14.0, 14.0, 14.0, 13.0, 14.0, 12.0, 8.0, 12.0, 2.0, 1.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-3.673828125, -3.548919677734375, -3.42401123046875, -3.299102783203125, -3.1741943359375, -3.049285888671875, -2.92437744140625, -2.799468994140625, -2.674560546875, -2.549652099609375, -2.42474365234375, -2.299835205078125, -2.1749267578125, -2.050018310546875, -1.92510986328125, -1.800201416015625, -1.67529296875, -1.550384521484375, -1.42547607421875, -1.300567626953125, -1.1756591796875, -1.050750732421875, -0.92584228515625, -0.800933837890625, -0.676025390625, -0.551116943359375, -0.42620849609375, -0.301300048828125, -0.1763916015625, -0.051483154296875, 0.07342529296875, 0.198333740234375, 0.3232421875, 0.448150634765625, 0.57305908203125, 0.697967529296875, 0.8228759765625, 0.947784423828125, 1.07269287109375, 1.197601318359375, 1.322509765625, 1.447418212890625, 1.57232666015625, 1.697235107421875, 1.8221435546875, 1.947052001953125, 2.07196044921875, 2.196868896484375, 2.32177734375, 2.446685791015625, 2.57159423828125, 2.696502685546875, 2.8214111328125, 2.946319580078125, 3.07122802734375, 3.196136474609375, 3.321044921875, 3.445953369140625, 3.57086181640625, 3.695770263671875, 3.8206787109375, 3.945587158203125, 4.07049560546875, 4.195404052734375, 4.3203125]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 13.0, 8.0, 13.0, 20.0, 30.0, 53.0, 67.0, 105.0, 151.0, 246.0, 387.0, 580.0, 926.0, 1494.0, 2436.0, 3777.0, 6408.0, 10459.0, 17803.0, 29360.0, 49761.0, 83978.0, 133937.0, 705676.0, 707085.0, 133901.0, 84462.0, 49728.0, 29329.0, 17530.0, 10634.0, 6394.0, 3798.0, 2377.0, 1533.0, 960.0, 658.0, 352.0, 224.0, 160.0, 98.0, 82.0, 46.0, 35.0, 15.0, 19.0, 10.0, 4.0, 6.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.5478515625, -0.530731201171875, -0.51361083984375, -0.496490478515625, -0.4793701171875, -0.462249755859375, -0.44512939453125, -0.428009033203125, -0.410888671875, -0.393768310546875, -0.37664794921875, -0.359527587890625, -0.3424072265625, -0.325286865234375, -0.30816650390625, -0.291046142578125, -0.27392578125, -0.256805419921875, -0.23968505859375, -0.222564697265625, -0.2054443359375, -0.188323974609375, -0.17120361328125, -0.154083251953125, -0.136962890625, -0.119842529296875, -0.10272216796875, -0.085601806640625, -0.0684814453125, -0.051361083984375, -0.03424072265625, -0.017120361328125, 0.0, 0.017120361328125, 0.03424072265625, 0.051361083984375, 0.0684814453125, 0.085601806640625, 0.10272216796875, 0.119842529296875, 0.136962890625, 0.154083251953125, 0.17120361328125, 0.188323974609375, 0.2054443359375, 0.222564697265625, 0.23968505859375, 0.256805419921875, 0.27392578125, 0.291046142578125, 0.30816650390625, 0.325286865234375, 0.3424072265625, 0.359527587890625, 0.37664794921875, 0.393768310546875, 0.410888671875, 0.428009033203125, 0.44512939453125, 0.462249755859375, 0.4793701171875, 0.496490478515625, 0.51361083984375, 0.530731201171875, 0.5478515625]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 1.0, 5.0, 4.0, 4.0, 5.0, 5.0, 6.0, 14.0, 13.0, 15.0, 28.0, 19.0, 28.0, 33.0, 27.0, 37.0, 41.0, 42.0, 59.0, 49.0, 72.0, 51.0, 48.0, 56.0, 55.0, 47.0, 40.0, 35.0, 23.0, 29.0, 19.0, 21.0, 18.0, 19.0, 9.0, 7.0, 6.0, 6.0, 4.0, 1.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0020427703857421875, -0.0019805431365966797, -0.0019183158874511719, -0.001856088638305664, -0.0017938613891601562, -0.0017316341400146484, -0.0016694068908691406, -0.0016071796417236328, -0.001544952392578125, -0.0014827251434326172, -0.0014204978942871094, -0.0013582706451416016, -0.0012960433959960938, -0.001233816146850586, -0.0011715888977050781, -0.0011093616485595703, -0.0010471343994140625, -0.0009849071502685547, -0.0009226799011230469, -0.0008604526519775391, -0.0007982254028320312, -0.0007359981536865234, -0.0006737709045410156, -0.0006115436553955078, -0.00054931640625, -0.0004870891571044922, -0.0004248619079589844, -0.00036263465881347656, -0.00030040740966796875, -0.00023818016052246094, -0.00017595291137695312, -0.00011372566223144531, -5.14984130859375e-05, 1.0728836059570312e-05, 7.295608520507812e-05, 0.00013518333435058594, 0.00019741058349609375, 0.00025963783264160156, 0.0003218650817871094, 0.0003840923309326172, 0.000446319580078125, 0.0005085468292236328, 0.0005707740783691406, 0.0006330013275146484, 0.0006952285766601562, 0.0007574558258056641, 0.0008196830749511719, 0.0008819103240966797, 0.0009441375732421875, 0.0010063648223876953, 0.0010685920715332031, 0.001130819320678711, 0.0011930465698242188, 0.0012552738189697266, 0.0013175010681152344, 0.0013797283172607422, 0.00144195556640625, 0.0015041828155517578, 0.0015664100646972656, 0.0016286373138427734, 0.0016908645629882812, 0.001753091812133789, 0.0018153190612792969, 0.0018775463104248047, 0.0019397735595703125]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 5.0, 2.0, 6.0, 9.0, 8.0, 13.0, 18.0, 23.0, 22.0, 36.0, 43.0, 45.0, 70.0, 96.0, 108.0, 145.0, 297.0, 700.0, 8399.0, 1027585.0, 9316.0, 677.0, 299.0, 157.0, 104.0, 71.0, 66.0, 39.0, 44.0, 34.0, 25.0, 19.0, 19.0, 10.0, 14.0, 6.0, 7.0, 3.0, 5.0, 3.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.041107177734375, -0.03980255126953125, -0.0384979248046875, -0.03719329833984375, -0.035888671875, -0.03458404541015625, -0.0332794189453125, -0.03197479248046875, -0.030670166015625, -0.02936553955078125, -0.0280609130859375, -0.02675628662109375, -0.02545166015625, -0.02414703369140625, -0.0228424072265625, -0.02153778076171875, -0.020233154296875, -0.01892852783203125, -0.0176239013671875, -0.01631927490234375, -0.0150146484375, -0.01371002197265625, -0.0124053955078125, -0.01110076904296875, -0.009796142578125, -0.00849151611328125, -0.0071868896484375, -0.00588226318359375, -0.00457763671875, -0.00327301025390625, -0.0019683837890625, -0.00066375732421875, 0.000640869140625, 0.00194549560546875, 0.0032501220703125, 0.00455474853515625, 0.005859375, 0.00716400146484375, 0.0084686279296875, 0.00977325439453125, 0.011077880859375, 0.01238250732421875, 0.0136871337890625, 0.01499176025390625, 0.01629638671875, 0.01760101318359375, 0.0189056396484375, 0.02021026611328125, 0.021514892578125, 0.02281951904296875, 0.0241241455078125, 0.02542877197265625, 0.0267333984375, 0.02803802490234375, 0.0293426513671875, 0.03064727783203125, 0.031951904296875, 0.03325653076171875, 0.0345611572265625, 0.03586578369140625, 0.03717041015625, 0.03847503662109375, 0.0397796630859375, 0.04108428955078125, 0.042388916015625]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 81.0, 933.0, 3.0], "bins": [-0.04052910581231117, -0.039878811687231064, -0.039228521287441254, -0.038578227162361145, -0.037927933037281036, -0.03727763891220093, -0.03662734851241112, -0.03597705438733101, -0.0353267602622509, -0.03467646613717079, -0.03402617573738098, -0.03337588161230087, -0.032725587487220764, -0.032075293362140656, -0.031425002962350845, -0.030774708837270737, -0.030124416574835777, -0.029474124312400818, -0.02882383018732071, -0.02817353792488575, -0.02752324379980564, -0.026872951537370682, -0.026222657412290573, -0.025572365149855614, -0.024922072887420654, -0.024271780624985695, -0.023621486499905586, -0.022971194237470627, -0.022320900112390518, -0.02167060784995556, -0.02102031372487545, -0.02037002146244049, -0.019719725474715233, -0.019069433212280273, -0.018419139087200165, -0.017768846824765205, -0.017118552699685097, -0.016468260437250137, -0.01581796631217003, -0.01516767404973507, -0.01451738178730011, -0.013867088593542576, -0.013216795399785042, -0.012566502206027508, -0.011916209012269974, -0.011265916749835014, -0.01061562355607748, -0.009965330362319946, -0.009315037168562412, -0.008664743974804878, -0.008014450781047344, -0.0073641580529510975, -0.0067138648591935635, -0.0060635716654360294, -0.005413278937339783, -0.004762985743582249, -0.004112692084163427, -0.0034623988904058933, -0.002812105929479003, -0.0021618129685521126, -0.0015115197747945786, -0.0008612265810370445, -0.00021093362011015415, 0.0004393593408167362, 0.0010896524181589484]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 1.0, 1.0, 3.0, 4.0, 8.0, 7.0, 11.0, 13.0, 21.0, 17.0, 22.0, 30.0, 35.0, 39.0, 38.0, 44.0, 47.0, 50.0, 57.0, 50.0, 64.0, 57.0, 45.0, 60.0, 49.0, 38.0, 28.0, 38.0, 33.0, 22.0, 18.0, 12.0, 14.0, 7.0, 9.0, 8.0, 1.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010290741920471191, -0.0009841816499829292, -0.0009392891079187393, -0.0008943965658545494, -0.0008495040237903595, -0.0008046114817261696, -0.0007597189396619797, -0.0007148263975977898, -0.0006699338555335999, -0.0006250413134694099, -0.00058014877140522, -0.0005352562293410301, -0.0004903636872768402, -0.0004454711452126503, -0.0004005786031484604, -0.0003556860610842705, -0.00031079351902008057, -0.00026590097695589066, -0.00022100843489170074, -0.00017611589282751083, -0.00013122335076332092, -8.633080869913101e-05, -4.14382666349411e-05, 3.45427542924881e-06, 4.834681749343872e-05, 9.323935955762863e-05, 0.00013813190162181854, 0.00018302444368600845, 0.00022791698575019836, 0.0002728095278143883, 0.0003177020698785782, 0.0003625946119427681, 0.000407487154006958, 0.0004523796960711479, 0.0004972722381353378, 0.0005421647801995277, 0.0005870573222637177, 0.0006319498643279076, 0.0006768424063920975, 0.0007217349484562874, 0.0007666274905204773, 0.0008115200325846672, 0.0008564125746488571, 0.000901305116713047, 0.0009461976587772369, 0.0009910902008414268, 0.0010359827429056168, 0.0010808752849698067, 0.0011257678270339966, 0.0011706603690981865, 0.0012155529111623764, 0.0012604454532265663, 0.0013053379952907562, 0.0013502305373549461, 0.001395123079419136, 0.001440015621483326, 0.0014849081635475159, 0.0015298007056117058, 0.0015746932476758957, 0.0016195857897400856, 0.0016644783318042755, 0.0017093708738684654, 0.0017542634159326553, 0.0017991559579968452, 0.0018440485000610352]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 6.0, 6.0, 6.0, 4.0, 10.0, 7.0, 16.0, 16.0, 16.0, 26.0, 23.0, 22.0, 26.0, 36.0, 38.0, 42.0, 36.0, 38.0, 34.0, 50.0, 45.0, 40.0, 39.0, 56.0, 37.0, 41.0, 30.0, 35.0, 32.0, 27.0, 25.0, 25.0, 18.0, 13.0, 24.0, 15.0, 10.0, 10.0, 9.0, 8.0, 3.0, 5.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.7265625, -5.5003662109375, -5.274169921875, -5.0479736328125, -4.82177734375, -4.5955810546875, -4.369384765625, -4.1431884765625, -3.9169921875, -3.6907958984375, -3.464599609375, -3.2384033203125, -3.01220703125, -2.7860107421875, -2.559814453125, -2.3336181640625, -2.107421875, -1.8812255859375, -1.655029296875, -1.4288330078125, -1.20263671875, -0.9764404296875, -0.750244140625, -0.5240478515625, -0.2978515625, -0.0716552734375, 0.154541015625, 0.3807373046875, 0.60693359375, 0.8331298828125, 1.059326171875, 1.2855224609375, 1.51171875, 1.7379150390625, 1.964111328125, 2.1903076171875, 2.41650390625, 2.6427001953125, 2.868896484375, 3.0950927734375, 3.3212890625, 3.5474853515625, 3.773681640625, 3.9998779296875, 4.22607421875, 4.4522705078125, 4.678466796875, 4.9046630859375, 5.130859375, 5.3570556640625, 5.583251953125, 5.8094482421875, 6.03564453125, 6.2618408203125, 6.488037109375, 6.7142333984375, 6.9404296875, 7.1666259765625, 7.392822265625, 7.6190185546875, 7.84521484375, 8.0714111328125, 8.297607421875, 8.5238037109375, 8.75]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 7.0, 5.0, 8.0, 7.0, 10.0, 17.0, 23.0, 33.0, 42.0, 71.0, 104.0, 187.0, 385.0, 792.0, 1730.0, 3687.0, 8240.0, 19321.0, 48010.0, 126838.0, 359294.0, 306131.0, 103758.0, 40123.0, 16592.0, 7082.0, 3063.0, 1468.0, 695.0, 356.0, 163.0, 105.0, 55.0, 35.0, 33.0, 25.0, 20.0, 16.0, 4.0, 9.0, 5.0, 3.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.51953125, -5.30645751953125, -5.0933837890625, -4.88031005859375, -4.667236328125, -4.45416259765625, -4.2410888671875, -4.02801513671875, -3.81494140625, -3.60186767578125, -3.3887939453125, -3.17572021484375, -2.962646484375, -2.74957275390625, -2.5364990234375, -2.32342529296875, -2.1103515625, -1.89727783203125, -1.6842041015625, -1.47113037109375, -1.258056640625, -1.04498291015625, -0.8319091796875, -0.61883544921875, -0.40576171875, -0.19268798828125, 0.0203857421875, 0.23345947265625, 0.446533203125, 0.65960693359375, 0.8726806640625, 1.08575439453125, 1.298828125, 1.51190185546875, 1.7249755859375, 1.93804931640625, 2.151123046875, 2.36419677734375, 2.5772705078125, 2.79034423828125, 3.00341796875, 3.21649169921875, 3.4295654296875, 3.64263916015625, 3.855712890625, 4.06878662109375, 4.2818603515625, 4.49493408203125, 4.7080078125, 4.92108154296875, 5.1341552734375, 5.34722900390625, 5.560302734375, 5.77337646484375, 5.9864501953125, 6.19952392578125, 6.41259765625, 6.62567138671875, 6.8387451171875, 7.05181884765625, 7.264892578125, 7.47796630859375, 7.6910400390625, 7.90411376953125, 8.1171875]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 3.0, 4.0, 13.0, 9.0, 11.0, 17.0, 15.0, 16.0, 18.0, 15.0, 30.0, 32.0, 28.0, 42.0, 29.0, 41.0, 58.0, 55.0, 95.0, 354.0, 1555.0, 146.0, 75.0, 48.0, 42.0, 35.0, 32.0, 27.0, 25.0, 29.0, 19.0, 21.0, 26.0, 15.0, 13.0, 8.0, 9.0, 11.0, 8.0, 4.0, 3.0, 5.0, 6.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.6875, -20.945068359375, -20.20263671875, -19.460205078125, -18.7177734375, -17.975341796875, -17.23291015625, -16.490478515625, -15.748046875, -15.005615234375, -14.26318359375, -13.520751953125, -12.7783203125, -12.035888671875, -11.29345703125, -10.551025390625, -9.80859375, -9.066162109375, -8.32373046875, -7.581298828125, -6.8388671875, -6.096435546875, -5.35400390625, -4.611572265625, -3.869140625, -3.126708984375, -2.38427734375, -1.641845703125, -0.8994140625, -0.156982421875, 0.58544921875, 1.327880859375, 2.0703125, 2.812744140625, 3.55517578125, 4.297607421875, 5.0400390625, 5.782470703125, 6.52490234375, 7.267333984375, 8.009765625, 8.752197265625, 9.49462890625, 10.237060546875, 10.9794921875, 11.721923828125, 12.46435546875, 13.206787109375, 13.94921875, 14.691650390625, 15.43408203125, 16.176513671875, 16.9189453125, 17.661376953125, 18.40380859375, 19.146240234375, 19.888671875, 20.631103515625, 21.37353515625, 22.115966796875, 22.8583984375, 23.600830078125, 24.34326171875, 25.085693359375, 25.828125]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 5.0, 3.0, 4.0, 12.0, 11.0, 13.0, 11.0, 17.0, 11.0, 25.0, 40.0, 58.0, 36.0, 70.0, 89.0, 98.0, 139.0, 206.0, 317.0, 572.0, 2041.0, 55736.0, 3009269.0, 72689.0, 2437.0, 594.0, 342.0, 204.0, 133.0, 99.0, 99.0, 75.0, 53.0, 44.0, 24.0, 29.0, 24.0, 16.0, 12.0, 14.0, 11.0, 7.0, 5.0, 4.0, 4.0, 5.0, 0.0, 3.0, 3.0, 1.0, 1.0], "bins": [-42.78125, -41.5771484375, -40.373046875, -39.1689453125, -37.96484375, -36.7607421875, -35.556640625, -34.3525390625, -33.1484375, -31.9443359375, -30.740234375, -29.5361328125, -28.33203125, -27.1279296875, -25.923828125, -24.7197265625, -23.515625, -22.3115234375, -21.107421875, -19.9033203125, -18.69921875, -17.4951171875, -16.291015625, -15.0869140625, -13.8828125, -12.6787109375, -11.474609375, -10.2705078125, -9.06640625, -7.8623046875, -6.658203125, -5.4541015625, -4.25, -3.0458984375, -1.841796875, -0.6376953125, 0.56640625, 1.7705078125, 2.974609375, 4.1787109375, 5.3828125, 6.5869140625, 7.791015625, 8.9951171875, 10.19921875, 11.4033203125, 12.607421875, 13.8115234375, 15.015625, 16.2197265625, 17.423828125, 18.6279296875, 19.83203125, 21.0361328125, 22.240234375, 23.4443359375, 24.6484375, 25.8525390625, 27.056640625, 28.2607421875, 29.46484375, 30.6689453125, 31.873046875, 33.0771484375, 34.28125]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 26.0, 101.0, 260.0, 353.0, 207.0, 49.0, 13.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.6065902709961, -62.23388671875, -59.861183166503906, -57.48847579956055, -55.11577224731445, -52.74306869506836, -50.370361328125, -47.997657775878906, -45.62495422363281, -43.25225067138672, -40.879547119140625, -38.506839752197266, -36.13413619995117, -33.76143264770508, -31.38872718811035, -29.016021728515625, -26.64331817626953, -24.270614624023438, -21.89790916442871, -19.525203704833984, -17.15250015258789, -14.77979564666748, -12.40709114074707, -10.034385681152344, -7.66168212890625, -5.28897762298584, -2.9162731170654297, -0.5435686111450195, 1.8291358947753906, 4.201840400695801, 6.574544906616211, 8.947250366210938, 11.319953918457031, 13.692658424377441, 16.06536293029785, 18.438068389892578, 20.810771942138672, 23.183475494384766, 25.556180953979492, 27.92888641357422, 30.301589965820312, 32.674293518066406, 35.0469970703125, 37.41970443725586, 39.79240798950195, 42.16511154174805, 44.537818908691406, 46.9105224609375, 49.283226013183594, 51.65592956542969, 54.02863311767578, 56.40134048461914, 58.774044036865234, 61.14674758911133, 63.51945495605469, 65.89215850830078, 68.26486206054688, 70.63756561279297, 73.01026916503906, 75.38297271728516, 77.75567626953125, 80.12838745117188, 82.50109100341797, 84.87379455566406, 87.24649810791016]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 9.0, 3.0, 7.0, 8.0, 12.0, 13.0, 12.0, 14.0, 16.0, 22.0, 34.0, 28.0, 33.0, 25.0, 29.0, 31.0, 36.0, 42.0, 32.0, 42.0, 50.0, 49.0, 54.0, 38.0, 34.0, 38.0, 33.0, 29.0, 23.0, 29.0, 27.0, 23.0, 13.0, 12.0, 21.0, 15.0, 15.0, 9.0, 8.0, 5.0, 10.0, 4.0, 6.0, 7.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.220550537109375, -52.39317321777344, -50.5657958984375, -48.73841857910156, -46.911041259765625, -45.08366394042969, -43.25628662109375, -41.42890930175781, -39.601531982421875, -37.77415466308594, -35.94677734375, -34.11940002441406, -32.292022705078125, -30.464645385742188, -28.63726806640625, -26.809890747070312, -24.982513427734375, -23.155136108398438, -21.3277587890625, -19.500381469726562, -17.673004150390625, -15.845626831054688, -14.01824951171875, -12.190872192382812, -10.363494873046875, -8.536117553710938, -6.708740234375, -4.8813629150390625, -3.053985595703125, -1.2266082763671875, 0.60076904296875, 2.4281463623046875, 4.255523681640625, 6.0829010009765625, 7.9102783203125, 9.737655639648438, 11.565032958984375, 13.392410278320312, 15.21978759765625, 17.047164916992188, 18.874542236328125, 20.701919555664062, 22.529296875, 24.356674194335938, 26.184051513671875, 28.011428833007812, 29.83880615234375, 31.666183471679688, 33.493560791015625, 35.32093811035156, 37.1483154296875, 38.97569274902344, 40.803070068359375, 42.63044738769531, 44.45782470703125, 46.28520202636719, 48.112579345703125, 49.93995666503906, 51.767333984375, 53.59471130371094, 55.422088623046875, 57.24946594238281, 59.07684326171875, 60.90422058105469, 62.731597900390625]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 0.0, 5.0, 7.0, 10.0, 13.0, 10.0, 19.0, 17.0, 13.0, 21.0, 21.0, 28.0, 29.0, 24.0, 35.0, 35.0, 37.0, 44.0, 41.0, 34.0, 45.0, 41.0, 44.0, 29.0, 45.0, 40.0, 32.0, 41.0, 27.0, 31.0, 22.0, 21.0, 19.0, 17.0, 16.0, 13.0, 14.0, 15.0, 13.0, 8.0, 6.0, 6.0, 5.0, 3.0, 5.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.18359375, -5.96685791015625, -5.7501220703125, -5.53338623046875, -5.316650390625, -5.09991455078125, -4.8831787109375, -4.66644287109375, -4.44970703125, -4.23297119140625, -4.0162353515625, -3.79949951171875, -3.582763671875, -3.36602783203125, -3.1492919921875, -2.93255615234375, -2.7158203125, -2.49908447265625, -2.2823486328125, -2.06561279296875, -1.848876953125, -1.63214111328125, -1.4154052734375, -1.19866943359375, -0.98193359375, -0.76519775390625, -0.5484619140625, -0.33172607421875, -0.114990234375, 0.10174560546875, 0.3184814453125, 0.53521728515625, 0.751953125, 0.96868896484375, 1.1854248046875, 1.40216064453125, 1.618896484375, 1.83563232421875, 2.0523681640625, 2.26910400390625, 2.48583984375, 2.70257568359375, 2.9193115234375, 3.13604736328125, 3.352783203125, 3.56951904296875, 3.7862548828125, 4.00299072265625, 4.2197265625, 4.43646240234375, 4.6531982421875, 4.86993408203125, 5.086669921875, 5.30340576171875, 5.5201416015625, 5.73687744140625, 5.95361328125, 6.17034912109375, 6.3870849609375, 6.60382080078125, 6.820556640625, 7.03729248046875, 7.2540283203125, 7.47076416015625, 7.6875]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 4.0, 5.0, 12.0, 7.0, 7.0, 14.0, 14.0, 20.0, 28.0, 24.0, 37.0, 48.0, 60.0, 74.0, 113.0, 205.0, 529.0, 2011.0, 13904.0, 263128.0, 3124957.0, 754130.0, 30108.0, 3364.0, 747.0, 236.0, 113.0, 68.0, 62.0, 52.0, 33.0, 35.0, 27.0, 13.0, 21.0, 14.0, 12.0, 9.0, 8.0, 13.0, 5.0, 3.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.640625, -17.966552734375, -17.29248046875, -16.618408203125, -15.9443359375, -15.270263671875, -14.59619140625, -13.922119140625, -13.248046875, -12.573974609375, -11.89990234375, -11.225830078125, -10.5517578125, -9.877685546875, -9.20361328125, -8.529541015625, -7.85546875, -7.181396484375, -6.50732421875, -5.833251953125, -5.1591796875, -4.485107421875, -3.81103515625, -3.136962890625, -2.462890625, -1.788818359375, -1.11474609375, -0.440673828125, 0.2333984375, 0.907470703125, 1.58154296875, 2.255615234375, 2.9296875, 3.603759765625, 4.27783203125, 4.951904296875, 5.6259765625, 6.300048828125, 6.97412109375, 7.648193359375, 8.322265625, 8.996337890625, 9.67041015625, 10.344482421875, 11.0185546875, 11.692626953125, 12.36669921875, 13.040771484375, 13.71484375, 14.388916015625, 15.06298828125, 15.737060546875, 16.4111328125, 17.085205078125, 17.75927734375, 18.433349609375, 19.107421875, 19.781494140625, 20.45556640625, 21.129638671875, 21.8037109375, 22.477783203125, 23.15185546875, 23.825927734375, 24.5]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 7.0, 4.0, 7.0, 4.0, 14.0, 14.0, 13.0, 20.0, 45.0, 63.0, 69.0, 121.0, 152.0, 210.0, 302.0, 444.0, 513.0, 508.0, 434.0, 348.0, 229.0, 175.0, 128.0, 90.0, 55.0, 32.0, 21.0, 17.0, 8.0, 9.0, 8.0, 8.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-17.359375, -16.9046630859375, -16.449951171875, -15.9952392578125, -15.54052734375, -15.0858154296875, -14.631103515625, -14.1763916015625, -13.7216796875, -13.2669677734375, -12.812255859375, -12.3575439453125, -11.90283203125, -11.4481201171875, -10.993408203125, -10.5386962890625, -10.083984375, -9.6292724609375, -9.174560546875, -8.7198486328125, -8.26513671875, -7.8104248046875, -7.355712890625, -6.9010009765625, -6.4462890625, -5.9915771484375, -5.536865234375, -5.0821533203125, -4.62744140625, -4.1727294921875, -3.718017578125, -3.2633056640625, -2.80859375, -2.3538818359375, -1.899169921875, -1.4444580078125, -0.98974609375, -0.5350341796875, -0.080322265625, 0.3743896484375, 0.8291015625, 1.2838134765625, 1.738525390625, 2.1932373046875, 2.64794921875, 3.1026611328125, 3.557373046875, 4.0120849609375, 4.466796875, 4.9215087890625, 5.376220703125, 5.8309326171875, 6.28564453125, 6.7403564453125, 7.195068359375, 7.6497802734375, 8.1044921875, 8.5592041015625, 9.013916015625, 9.4686279296875, 9.92333984375, 10.3780517578125, 10.832763671875, 11.2874755859375, 11.7421875]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 5.0, 9.0, 10.0, 15.0, 14.0, 24.0, 34.0, 43.0, 70.0, 103.0, 108.0, 163.0, 236.0, 390.0, 1060.0, 7882.0, 501194.0, 3648209.0, 30850.0, 2257.0, 564.0, 284.0, 213.0, 152.0, 106.0, 80.0, 50.0, 46.0, 32.0, 27.0, 16.0, 9.0, 9.0, 11.0, 7.0, 0.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.84375, -49.103515625, -47.36328125, -45.623046875, -43.8828125, -42.142578125, -40.40234375, -38.662109375, -36.921875, -35.181640625, -33.44140625, -31.701171875, -29.9609375, -28.220703125, -26.48046875, -24.740234375, -23.0, -21.259765625, -19.51953125, -17.779296875, -16.0390625, -14.298828125, -12.55859375, -10.818359375, -9.078125, -7.337890625, -5.59765625, -3.857421875, -2.1171875, -0.376953125, 1.36328125, 3.103515625, 4.84375, 6.583984375, 8.32421875, 10.064453125, 11.8046875, 13.544921875, 15.28515625, 17.025390625, 18.765625, 20.505859375, 22.24609375, 23.986328125, 25.7265625, 27.466796875, 29.20703125, 30.947265625, 32.6875, 34.427734375, 36.16796875, 37.908203125, 39.6484375, 41.388671875, 43.12890625, 44.869140625, 46.609375, 48.349609375, 50.08984375, 51.830078125, 53.5703125, 55.310546875, 57.05078125, 58.791015625, 60.53125]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 10.0, 35.0, 103.0, 265.0, 325.0, 182.0, 58.0, 30.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.02708053588867, -42.880699157714844, -38.73431396484375, -34.58793258666992, -30.44154930114746, -26.295166015625, -22.148784637451172, -18.00240135192871, -13.85601806640625, -9.709634780883789, -5.5632524490356445, -1.4168701171875, 2.729513168334961, 6.875896453857422, 11.02227783203125, 15.168661117553711, 19.315044403076172, 23.461427688598633, 27.607810974121094, 31.754192352294922, 35.90057373046875, 40.046958923339844, 44.19334030151367, 48.3397216796875, 52.486106872558594, 56.63248825073242, 60.778873443603516, 64.92525482177734, 69.07164001464844, 73.218017578125, 77.3644027709961, 81.51078796386719, 85.65716552734375, 89.80355072021484, 93.9499282836914, 98.0963134765625, 102.2426986694336, 106.38908386230469, 110.53546142578125, 114.68184661865234, 118.82823181152344, 122.97461700439453, 127.1209945678711, 131.2673797607422, 135.41375732421875, 139.56015014648438, 143.70652770996094, 147.8529052734375, 151.99929809570312, 156.1456756591797, 160.2920684814453, 164.43844604492188, 168.58482360839844, 172.73121643066406, 176.87759399414062, 181.0239715576172, 185.17034912109375, 189.3167266845703, 193.46311950683594, 197.6094970703125, 201.75587463378906, 205.9022674560547, 210.04864501953125, 214.1950225830078, 218.34141540527344]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 1.0, 3.0, 2.0, 7.0, 6.0, 9.0, 8.0, 13.0, 16.0, 19.0, 13.0, 26.0, 22.0, 15.0, 36.0, 32.0, 31.0, 42.0, 41.0, 42.0, 44.0, 51.0, 44.0, 47.0, 42.0, 42.0, 39.0, 31.0, 37.0, 29.0, 31.0, 31.0, 29.0, 19.0, 14.0, 28.0, 9.0, 12.0, 11.0, 10.0, 7.0, 2.0, 3.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0], "bins": [-52.600250244140625, -51.14336013793945, -49.68647003173828, -48.229583740234375, -46.7726936340332, -45.31580352783203, -43.85891342163086, -42.40202331542969, -40.94513702392578, -39.48824691772461, -38.03135681152344, -36.57447052001953, -35.11758041381836, -33.66069030761719, -32.203800201416016, -30.746910095214844, -29.290019989013672, -27.8331298828125, -26.37624168395996, -24.91935157775879, -23.46246337890625, -22.005573272705078, -20.548683166503906, -19.091793060302734, -17.634904861450195, -16.178014755249023, -14.721126556396484, -13.264236450195312, -11.807347297668457, -10.350458145141602, -8.89356803894043, -7.436678886413574, -5.979789733886719, -4.522900581359863, -3.0660109519958496, -1.609121322631836, -0.15223217010498047, 1.304656982421875, 2.761547088623047, 4.218436241149902, 5.675325393676758, 7.132214546203613, 8.589103698730469, 10.04599380493164, 11.502882957458496, 12.959772109985352, 14.416662216186523, 15.873551368713379, 17.330440521240234, 18.787330627441406, 20.244218826293945, 21.701108932495117, 23.157997131347656, 24.614887237548828, 26.07177734375, 27.528667449951172, 28.98555564880371, 30.442445755004883, 31.899333953857422, 33.356224060058594, 34.813114166259766, 36.27000427246094, 37.726890563964844, 39.183780670166016, 40.64067077636719]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 4.0, 5.0, 6.0, 8.0, 7.0, 7.0, 14.0, 6.0, 19.0, 19.0, 22.0, 30.0, 23.0, 28.0, 35.0, 34.0, 28.0, 43.0, 44.0, 45.0, 50.0, 34.0, 39.0, 51.0, 45.0, 42.0, 36.0, 38.0, 25.0, 36.0, 22.0, 17.0, 27.0, 17.0, 20.0, 13.0, 16.0, 12.0, 10.0, 9.0, 7.0, 7.0, 3.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.90625, -5.67919921875, -5.4521484375, -5.22509765625, -4.998046875, -4.77099609375, -4.5439453125, -4.31689453125, -4.08984375, -3.86279296875, -3.6357421875, -3.40869140625, -3.181640625, -2.95458984375, -2.7275390625, -2.50048828125, -2.2734375, -2.04638671875, -1.8193359375, -1.59228515625, -1.365234375, -1.13818359375, -0.9111328125, -0.68408203125, -0.45703125, -0.22998046875, -0.0029296875, 0.22412109375, 0.451171875, 0.67822265625, 0.9052734375, 1.13232421875, 1.359375, 1.58642578125, 1.8134765625, 2.04052734375, 2.267578125, 2.49462890625, 2.7216796875, 2.94873046875, 3.17578125, 3.40283203125, 3.6298828125, 3.85693359375, 4.083984375, 4.31103515625, 4.5380859375, 4.76513671875, 4.9921875, 5.21923828125, 5.4462890625, 5.67333984375, 5.900390625, 6.12744140625, 6.3544921875, 6.58154296875, 6.80859375, 7.03564453125, 7.2626953125, 7.48974609375, 7.716796875, 7.94384765625, 8.1708984375, 8.39794921875, 8.625]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 12.0, 8.0, 19.0, 12.0, 31.0, 47.0, 52.0, 93.0, 155.0, 229.0, 383.0, 573.0, 940.0, 1468.0, 2466.0, 3911.0, 6358.0, 10199.0, 17185.0, 28968.0, 51658.0, 92597.0, 159173.0, 219792.0, 185749.0, 113812.0, 64163.0, 35810.0, 20633.0, 12248.0, 7546.0, 4582.0, 2901.0, 1728.0, 1153.0, 698.0, 445.0, 246.0, 156.0, 123.0, 71.0, 49.0, 36.0, 27.0, 18.0, 9.0, 9.0, 9.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.80712890625, -0.7831649780273438, -0.7592010498046875, -0.7352371215820312, -0.711273193359375, -0.6873092651367188, -0.6633453369140625, -0.6393814086914062, -0.61541748046875, -0.5914535522460938, -0.5674896240234375, -0.5435256958007812, -0.519561767578125, -0.49559783935546875, -0.4716339111328125, -0.44766998291015625, -0.4237060546875, -0.39974212646484375, -0.3757781982421875, -0.35181427001953125, -0.327850341796875, -0.30388641357421875, -0.2799224853515625, -0.25595855712890625, -0.23199462890625, -0.20803070068359375, -0.1840667724609375, -0.16010284423828125, -0.136138916015625, -0.11217498779296875, -0.0882110595703125, -0.06424713134765625, -0.040283203125, -0.01631927490234375, 0.0076446533203125, 0.03160858154296875, 0.055572509765625, 0.07953643798828125, 0.1035003662109375, 0.12746429443359375, 0.15142822265625, 0.17539215087890625, 0.1993560791015625, 0.22332000732421875, 0.247283935546875, 0.27124786376953125, 0.2952117919921875, 0.31917572021484375, 0.3431396484375, 0.36710357666015625, 0.3910675048828125, 0.41503143310546875, 0.438995361328125, 0.46295928955078125, 0.4869232177734375, 0.5108871459960938, 0.53485107421875, 0.5588150024414062, 0.5827789306640625, 0.6067428588867188, 0.630706787109375, 0.6546707153320312, 0.6786346435546875, 0.7025985717773438, 0.7265625]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 6.0, 5.0, 5.0, 8.0, 9.0, 8.0, 8.0, 10.0, 19.0, 19.0, 16.0, 20.0, 35.0, 24.0, 28.0, 29.0, 30.0, 32.0, 39.0, 46.0, 38.0, 36.0, 1069.0, 44.0, 47.0, 32.0, 41.0, 37.0, 35.0, 33.0, 30.0, 27.0, 22.0, 17.0, 24.0, 17.0, 16.0, 13.0, 11.0, 12.0, 8.0, 4.0, 0.0, 10.0, 5.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0625, -3.928466796875, -3.79443359375, -3.660400390625, -3.5263671875, -3.392333984375, -3.25830078125, -3.124267578125, -2.990234375, -2.856201171875, -2.72216796875, -2.588134765625, -2.4541015625, -2.320068359375, -2.18603515625, -2.052001953125, -1.91796875, -1.783935546875, -1.64990234375, -1.515869140625, -1.3818359375, -1.247802734375, -1.11376953125, -0.979736328125, -0.845703125, -0.711669921875, -0.57763671875, -0.443603515625, -0.3095703125, -0.175537109375, -0.04150390625, 0.092529296875, 0.2265625, 0.360595703125, 0.49462890625, 0.628662109375, 0.7626953125, 0.896728515625, 1.03076171875, 1.164794921875, 1.298828125, 1.432861328125, 1.56689453125, 1.700927734375, 1.8349609375, 1.968994140625, 2.10302734375, 2.237060546875, 2.37109375, 2.505126953125, 2.63916015625, 2.773193359375, 2.9072265625, 3.041259765625, 3.17529296875, 3.309326171875, 3.443359375, 3.577392578125, 3.71142578125, 3.845458984375, 3.9794921875, 4.113525390625, 4.24755859375, 4.381591796875, 4.515625]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 4.0, 8.0, 7.0, 11.0, 17.0, 29.0, 45.0, 85.0, 108.0, 184.0, 287.0, 457.0, 728.0, 1139.0, 1902.0, 3311.0, 5415.0, 9505.0, 15895.0, 28452.0, 50556.0, 89947.0, 149172.0, 1247166.0, 188347.0, 129085.0, 75740.0, 42388.0, 23697.0, 13713.0, 7901.0, 4721.0, 2794.0, 1665.0, 1051.0, 605.0, 385.0, 217.0, 142.0, 87.0, 61.0, 41.0, 18.0, 15.0, 15.0, 5.0, 10.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.65625, -0.6362686157226562, -0.6162872314453125, -0.5963058471679688, -0.576324462890625, -0.5563430786132812, -0.5363616943359375, -0.5163803100585938, -0.49639892578125, -0.47641754150390625, -0.4564361572265625, -0.43645477294921875, -0.416473388671875, -0.39649200439453125, -0.3765106201171875, -0.35652923583984375, -0.3365478515625, -0.31656646728515625, -0.2965850830078125, -0.27660369873046875, -0.256622314453125, -0.23664093017578125, -0.2166595458984375, -0.19667816162109375, -0.17669677734375, -0.15671539306640625, -0.1367340087890625, -0.11675262451171875, -0.096771240234375, -0.07678985595703125, -0.0568084716796875, -0.03682708740234375, -0.016845703125, 0.00313568115234375, 0.0231170654296875, 0.04309844970703125, 0.063079833984375, 0.08306121826171875, 0.1030426025390625, 0.12302398681640625, 0.14300537109375, 0.16298675537109375, 0.1829681396484375, 0.20294952392578125, 0.222930908203125, 0.24291229248046875, 0.2628936767578125, 0.28287506103515625, 0.3028564453125, 0.32283782958984375, 0.3428192138671875, 0.36280059814453125, 0.382781982421875, 0.40276336669921875, 0.4227447509765625, 0.44272613525390625, 0.46270751953125, 0.48268890380859375, 0.5026702880859375, 0.5226516723632812, 0.542633056640625, 0.5626144409179688, 0.5825958251953125, 0.6025772094726562, 0.62255859375]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 3.0, 2.0, 10.0, 7.0, 10.0, 15.0, 14.0, 25.0, 12.0, 27.0, 38.0, 39.0, 36.0, 44.0, 66.0, 60.0, 69.0, 55.0, 60.0, 60.0, 51.0, 48.0, 40.0, 43.0, 33.0, 27.0, 15.0, 26.0, 13.0, 13.0, 4.0, 5.0, 8.0, 5.0, 5.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0024585723876953125, -0.0023823678493499756, -0.0023061633110046387, -0.0022299587726593018, -0.002153754234313965, -0.002077549695968628, -0.002001345157623291, -0.001925140619277954, -0.0018489360809326172, -0.0017727315425872803, -0.0016965270042419434, -0.0016203224658966064, -0.0015441179275512695, -0.0014679133892059326, -0.0013917088508605957, -0.0013155043125152588, -0.0012392997741699219, -0.001163095235824585, -0.001086890697479248, -0.0010106861591339111, -0.0009344816207885742, -0.0008582770824432373, -0.0007820725440979004, -0.0007058680057525635, -0.0006296634674072266, -0.0005534589290618896, -0.00047725439071655273, -0.0004010498523712158, -0.0003248453140258789, -0.000248640775680542, -0.00017243623733520508, -9.623169898986816e-05, -2.002716064453125e-05, 5.6177377700805664e-05, 0.00013238191604614258, 0.0002085864543914795, 0.0002847909927368164, 0.0003609955310821533, 0.00043720006942749023, 0.0005134046077728271, 0.0005896091461181641, 0.000665813684463501, 0.0007420182228088379, 0.0008182227611541748, 0.0008944272994995117, 0.0009706318378448486, 0.0010468363761901855, 0.0011230409145355225, 0.0011992454528808594, 0.0012754499912261963, 0.0013516545295715332, 0.0014278590679168701, 0.001504063606262207, 0.001580268144607544, 0.0016564726829528809, 0.0017326772212982178, 0.0018088817596435547, 0.0018850862979888916, 0.0019612908363342285, 0.0020374953746795654, 0.0021136999130249023, 0.0021899044513702393, 0.002266108989715576, 0.002342313528060913, 0.00241851806640625]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 6.0, 4.0, 4.0, 10.0, 6.0, 11.0, 13.0, 19.0, 25.0, 29.0, 36.0, 43.0, 61.0, 74.0, 105.0, 151.0, 241.0, 444.0, 1569.0, 355416.0, 686915.0, 2077.0, 464.0, 238.0, 141.0, 100.0, 82.0, 50.0, 51.0, 41.0, 24.0, 24.0, 12.0, 18.0, 13.0, 10.0, 3.0, 0.0, 7.0, 7.0, 4.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.043853759765625, -0.04239463806152344, -0.040935516357421875, -0.03947639465332031, -0.03801727294921875, -0.03655815124511719, -0.035099029541015625, -0.03363990783691406, -0.0321807861328125, -0.030721664428710938, -0.029262542724609375, -0.027803421020507812, -0.02634429931640625, -0.024885177612304688, -0.023426055908203125, -0.021966934204101562, -0.0205078125, -0.019048690795898438, -0.017589569091796875, -0.016130447387695312, -0.01467132568359375, -0.013212203979492188, -0.011753082275390625, -0.010293960571289062, -0.0088348388671875, -0.0073757171630859375, -0.005916595458984375, -0.0044574737548828125, -0.00299835205078125, -0.0015392303466796875, -8.0108642578125e-05, 0.0013790130615234375, 0.002838134765625, 0.0042972564697265625, 0.005756378173828125, 0.0072154998779296875, 0.00867462158203125, 0.010133743286132812, 0.011592864990234375, 0.013051986694335938, 0.0145111083984375, 0.015970230102539062, 0.017429351806640625, 0.018888473510742188, 0.02034759521484375, 0.021806716918945312, 0.023265838623046875, 0.024724960327148438, 0.02618408203125, 0.027643203735351562, 0.029102325439453125, 0.030561447143554688, 0.03202056884765625, 0.03347969055175781, 0.034938812255859375, 0.03639793395996094, 0.0378570556640625, 0.03931617736816406, 0.040775299072265625, 0.04223442077636719, 0.04369354248046875, 0.04515266418457031, 0.046611785888671875, 0.04807090759277344, 0.049530029296875]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 213.0, 798.0, 5.0], "bins": [-0.04439961910247803, -0.04368560016155243, -0.04297157749533653, -0.042257558554410934, -0.041543539613485336, -0.04082952067255974, -0.04011549800634384, -0.03940147906541824, -0.038687460124492645, -0.03797344118356705, -0.03725941851735115, -0.03654539957642555, -0.035831380635499954, -0.035117361694574356, -0.03440333902835846, -0.03368932008743286, -0.03297530114650726, -0.032261282205581665, -0.03154725953936577, -0.03083324059844017, -0.030119221657514572, -0.029405200853943825, -0.028691181913018227, -0.02797716110944748, -0.027263140305876732, -0.026549119502305984, -0.025835100561380386, -0.02512107975780964, -0.02440706081688404, -0.023693040013313293, -0.022979021072387695, -0.022265000268816948, -0.02155098132789135, -0.020836960524320602, -0.020122941583395004, -0.019408920779824257, -0.01869490183889866, -0.01798088103532791, -0.017266862094402313, -0.016552841290831566, -0.015838822349905968, -0.015124802477657795, -0.014410782605409622, -0.01369676273316145, -0.012982742860913277, -0.012268722988665104, -0.011554703116416931, -0.010840682312846184, -0.010126662440598011, -0.009412642568349838, -0.008698622696101665, -0.007984602823853493, -0.00727058295160532, -0.006556563079357147, -0.005842542741447687, -0.005128522869199514, -0.004414502531290054, -0.0037004826590418816, -0.002986462786793709, -0.0022724426817148924, -0.0015584228094667196, -0.0008444029372185469, -0.00013038283213973045, 0.0005836370401084423, 0.0012976567959412932]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 6.0, 5.0, 9.0, 27.0, 15.0, 22.0, 20.0, 20.0, 37.0, 31.0, 38.0, 39.0, 42.0, 42.0, 62.0, 63.0, 53.0, 57.0, 42.0, 54.0, 43.0, 48.0, 32.0, 38.0, 34.0, 24.0, 23.0, 23.0, 19.0, 14.0, 4.0, 8.0, 8.0, 7.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012828707695007324, -0.001228678971529007, -0.0011744871735572815, -0.001120295375585556, -0.0010661035776138306, -0.001011911779642105, -0.0009577199816703796, -0.0009035281836986542, -0.0008493363857269287, -0.0007951445877552032, -0.0007409527897834778, -0.0006867609918117523, -0.0006325691938400269, -0.0005783773958683014, -0.0005241855978965759, -0.00046999379992485046, -0.000415802001953125, -0.00036161020398139954, -0.00030741840600967407, -0.0002532266080379486, -0.00019903481006622314, -0.00014484301209449768, -9.065121412277222e-05, -3.645941615104675e-05, 1.773238182067871e-05, 7.192417979240417e-05, 0.00012611597776412964, 0.0001803077757358551, 0.00023449957370758057, 0.00028869137167930603, 0.0003428831696510315, 0.00039707496762275696, 0.0004512667655944824, 0.0005054585635662079, 0.0005596503615379333, 0.0006138421595096588, 0.0006680339574813843, 0.0007222257554531097, 0.0007764175534248352, 0.0008306093513965607, 0.0008848011493682861, 0.0009389929473400116, 0.000993184745311737, 0.0010473765432834625, 0.001101568341255188, 0.0011557601392269135, 0.001209951937198639, 0.0012641437351703644, 0.0013183355331420898, 0.0013725273311138153, 0.0014267191290855408, 0.0014809109270572662, 0.0015351027250289917, 0.0015892945230007172, 0.0016434863209724426, 0.001697678118944168, 0.0017518699169158936, 0.001806061714887619, 0.0018602535128593445, 0.00191444531083107, 0.0019686371088027954, 0.002022828906774521, 0.0020770207047462463, 0.002131212502717972, 0.0021854043006896973]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 4.0, 5.0, 6.0, 8.0, 7.0, 7.0, 14.0, 6.0, 19.0, 19.0, 22.0, 30.0, 23.0, 28.0, 35.0, 34.0, 28.0, 44.0, 43.0, 45.0, 50.0, 34.0, 39.0, 51.0, 45.0, 42.0, 36.0, 38.0, 25.0, 36.0, 22.0, 17.0, 27.0, 17.0, 20.0, 13.0, 16.0, 12.0, 10.0, 9.0, 7.0, 7.0, 3.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.90625, -5.67919921875, -5.4521484375, -5.22509765625, -4.998046875, -4.77099609375, -4.5439453125, -4.31689453125, -4.08984375, -3.86279296875, -3.6357421875, -3.40869140625, -3.181640625, -2.95458984375, -2.7275390625, -2.50048828125, -2.2734375, -2.04638671875, -1.8193359375, -1.59228515625, -1.365234375, -1.13818359375, -0.9111328125, -0.68408203125, -0.45703125, -0.22998046875, -0.0029296875, 0.22412109375, 0.451171875, 0.67822265625, 0.9052734375, 1.13232421875, 1.359375, 1.58642578125, 1.8134765625, 2.04052734375, 2.267578125, 2.49462890625, 2.7216796875, 2.94873046875, 3.17578125, 3.40283203125, 3.6298828125, 3.85693359375, 4.083984375, 4.31103515625, 4.5380859375, 4.76513671875, 4.9921875, 5.21923828125, 5.4462890625, 5.67333984375, 5.900390625, 6.12744140625, 6.3544921875, 6.58154296875, 6.80859375, 7.03564453125, 7.2626953125, 7.48974609375, 7.716796875, 7.94384765625, 8.1708984375, 8.39794921875, 8.625]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 5.0, 5.0, 5.0, 9.0, 7.0, 15.0, 15.0, 15.0, 27.0, 36.0, 39.0, 69.0, 63.0, 97.0, 149.0, 188.0, 295.0, 580.0, 1715.0, 7404.0, 51257.0, 535983.0, 401552.0, 40016.0, 6077.0, 1405.0, 528.0, 281.0, 184.0, 152.0, 102.0, 51.0, 55.0, 40.0, 34.0, 23.0, 22.0, 13.0, 12.0, 12.0, 9.0, 4.0, 4.0, 3.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.5859375, -11.1392822265625, -10.692626953125, -10.2459716796875, -9.79931640625, -9.3526611328125, -8.906005859375, -8.4593505859375, -8.0126953125, -7.5660400390625, -7.119384765625, -6.6727294921875, -6.22607421875, -5.7794189453125, -5.332763671875, -4.8861083984375, -4.439453125, -3.9927978515625, -3.546142578125, -3.0994873046875, -2.65283203125, -2.2061767578125, -1.759521484375, -1.3128662109375, -0.8662109375, -0.4195556640625, 0.027099609375, 0.4737548828125, 0.92041015625, 1.3670654296875, 1.813720703125, 2.2603759765625, 2.70703125, 3.1536865234375, 3.600341796875, 4.0469970703125, 4.49365234375, 4.9403076171875, 5.386962890625, 5.8336181640625, 6.2802734375, 6.7269287109375, 7.173583984375, 7.6202392578125, 8.06689453125, 8.5135498046875, 8.960205078125, 9.4068603515625, 9.853515625, 10.3001708984375, 10.746826171875, 11.1934814453125, 11.64013671875, 12.0867919921875, 12.533447265625, 12.9801025390625, 13.4267578125, 13.8734130859375, 14.320068359375, 14.7667236328125, 15.21337890625, 15.6600341796875, 16.106689453125, 16.5533447265625, 17.0]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 1.0, 2.0, 3.0, 6.0, 4.0, 5.0, 7.0, 17.0, 9.0, 12.0, 29.0, 22.0, 24.0, 25.0, 32.0, 54.0, 52.0, 34.0, 69.0, 121.0, 412.0, 1548.0, 135.0, 66.0, 56.0, 42.0, 50.0, 41.0, 31.0, 31.0, 21.0, 27.0, 10.0, 12.0, 11.0, 8.0, 9.0, 9.0, 3.0, 2.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.734375, -28.88720703125, -28.0400390625, -27.19287109375, -26.345703125, -25.49853515625, -24.6513671875, -23.80419921875, -22.95703125, -22.10986328125, -21.2626953125, -20.41552734375, -19.568359375, -18.72119140625, -17.8740234375, -17.02685546875, -16.1796875, -15.33251953125, -14.4853515625, -13.63818359375, -12.791015625, -11.94384765625, -11.0966796875, -10.24951171875, -9.40234375, -8.55517578125, -7.7080078125, -6.86083984375, -6.013671875, -5.16650390625, -4.3193359375, -3.47216796875, -2.625, -1.77783203125, -0.9306640625, -0.08349609375, 0.763671875, 1.61083984375, 2.4580078125, 3.30517578125, 4.15234375, 4.99951171875, 5.8466796875, 6.69384765625, 7.541015625, 8.38818359375, 9.2353515625, 10.08251953125, 10.9296875, 11.77685546875, 12.6240234375, 13.47119140625, 14.318359375, 15.16552734375, 16.0126953125, 16.85986328125, 17.70703125, 18.55419921875, 19.4013671875, 20.24853515625, 21.095703125, 21.94287109375, 22.7900390625, 23.63720703125, 24.484375]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 4.0, 10.0, 10.0, 12.0, 11.0, 13.0, 12.0, 30.0, 37.0, 34.0, 60.0, 90.0, 105.0, 181.0, 360.0, 929.0, 16013.0, 3109074.0, 16727.0, 1005.0, 360.0, 165.0, 143.0, 75.0, 60.0, 34.0, 36.0, 25.0, 28.0, 9.0, 16.0, 11.0, 8.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.75, -52.8291015625, -50.908203125, -48.9873046875, -47.06640625, -45.1455078125, -43.224609375, -41.3037109375, -39.3828125, -37.4619140625, -35.541015625, -33.6201171875, -31.69921875, -29.7783203125, -27.857421875, -25.9365234375, -24.015625, -22.0947265625, -20.173828125, -18.2529296875, -16.33203125, -14.4111328125, -12.490234375, -10.5693359375, -8.6484375, -6.7275390625, -4.806640625, -2.8857421875, -0.96484375, 0.9560546875, 2.876953125, 4.7978515625, 6.71875, 8.6396484375, 10.560546875, 12.4814453125, 14.40234375, 16.3232421875, 18.244140625, 20.1650390625, 22.0859375, 24.0068359375, 25.927734375, 27.8486328125, 29.76953125, 31.6904296875, 33.611328125, 35.5322265625, 37.453125, 39.3740234375, 41.294921875, 43.2158203125, 45.13671875, 47.0576171875, 48.978515625, 50.8994140625, 52.8203125, 54.7412109375, 56.662109375, 58.5830078125, 60.50390625, 62.4248046875, 64.345703125, 66.2666015625, 68.1875]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 7.0, 50.0, 128.0, 271.0, 330.0, 147.0, 67.0, 13.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-88.9830551147461, -87.17090606689453, -85.3587646484375, -83.54661560058594, -81.73446655273438, -79.92231750488281, -78.11016845703125, -76.29802703857422, -74.48587799072266, -72.6737289428711, -70.86158752441406, -69.0494384765625, -67.23728942871094, -65.42514038085938, -63.61299514770508, -61.80084991455078, -59.98870086669922, -58.176551818847656, -56.36440658569336, -54.55226135253906, -52.7401123046875, -50.92796325683594, -49.11581802368164, -47.303672790527344, -45.49152374267578, -43.67937469482422, -41.86722946166992, -40.055084228515625, -38.24293518066406, -36.4307861328125, -34.6186408996582, -32.806495666503906, -30.99434471130371, -29.18219757080078, -27.37005043029785, -25.557903289794922, -23.745756149291992, -21.933609008789062, -20.121461868286133, -18.309314727783203, -16.497167587280273, -14.685020446777344, -12.872873306274414, -11.060726165771484, -9.248579025268555, -7.436431884765625, -5.624284744262695, -3.8121376037597656, -1.999990463256836, -0.18784332275390625, 1.6243038177490234, 3.436450958251953, 5.248598098754883, 7.0607452392578125, 8.872892379760742, 10.685039520263672, 12.497186660766602, 14.309333801269531, 16.12148094177246, 17.93362808227539, 19.74577522277832, 21.55792236328125, 23.37006950378418, 25.18221664428711, 26.99436378479004]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 10.0, 9.0, 7.0, 6.0, 10.0, 12.0, 11.0, 13.0, 32.0, 26.0, 27.0, 28.0, 23.0, 31.0, 27.0, 50.0, 39.0, 40.0, 38.0, 50.0, 48.0, 40.0, 42.0, 40.0, 44.0, 37.0, 37.0, 34.0, 33.0, 23.0, 23.0, 21.0, 17.0, 8.0, 4.0, 11.0, 10.0, 10.0, 8.0, 7.0, 5.0, 4.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-53.07486343383789, -51.349910736083984, -49.624961853027344, -47.90000915527344, -46.17505645751953, -44.450103759765625, -42.72515106201172, -41.00020217895508, -39.27524948120117, -37.550296783447266, -35.825347900390625, -34.10039520263672, -32.37544250488281, -30.650489807128906, -28.925539016723633, -27.20058822631836, -25.475635528564453, -23.750682830810547, -22.025732040405273, -20.30078125, -18.575828552246094, -16.850875854492188, -15.125925064086914, -13.400973320007324, -11.676021575927734, -9.951069831848145, -8.226118087768555, -6.501166343688965, -4.776214599609375, -3.051262855529785, -1.3263111114501953, 0.39864063262939453, 2.1235885620117188, 3.8485403060913086, 5.573492050170898, 7.298443794250488, 9.023395538330078, 10.748347282409668, 12.473299026489258, 14.198250770568848, 15.923202514648438, 17.648155212402344, 19.373106002807617, 21.09805679321289, 22.823009490966797, 24.547962188720703, 26.272912979125977, 27.99786376953125, 29.722816467285156, 31.447769165039062, 33.17272186279297, 34.89767074584961, 36.622623443603516, 38.34757614135742, 40.07252502441406, 41.79747772216797, 43.522430419921875, 45.24738311767578, 46.97233581542969, 48.69728469848633, 50.422237396240234, 52.14719009399414, 53.87213897705078, 55.59709167480469, 57.322044372558594]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 6.0, 6.0, 8.0, 5.0, 11.0, 6.0, 12.0, 12.0, 25.0, 13.0, 22.0, 27.0, 23.0, 34.0, 29.0, 30.0, 22.0, 36.0, 52.0, 51.0, 34.0, 44.0, 35.0, 32.0, 55.0, 41.0, 36.0, 29.0, 28.0, 27.0, 24.0, 31.0, 20.0, 22.0, 25.0, 14.0, 12.0, 11.0, 12.0, 8.0, 8.0, 7.0, 5.0, 3.0, 4.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.1484375, -5.92938232421875, -5.7103271484375, -5.49127197265625, -5.272216796875, -5.05316162109375, -4.8341064453125, -4.61505126953125, -4.39599609375, -4.17694091796875, -3.9578857421875, -3.73883056640625, -3.519775390625, -3.30072021484375, -3.0816650390625, -2.86260986328125, -2.6435546875, -2.42449951171875, -2.2054443359375, -1.98638916015625, -1.767333984375, -1.54827880859375, -1.3292236328125, -1.11016845703125, -0.89111328125, -0.67205810546875, -0.4530029296875, -0.23394775390625, -0.014892578125, 0.20416259765625, 0.4232177734375, 0.64227294921875, 0.861328125, 1.08038330078125, 1.2994384765625, 1.51849365234375, 1.737548828125, 1.95660400390625, 2.1756591796875, 2.39471435546875, 2.61376953125, 2.83282470703125, 3.0518798828125, 3.27093505859375, 3.489990234375, 3.70904541015625, 3.9281005859375, 4.14715576171875, 4.3662109375, 4.58526611328125, 4.8043212890625, 5.02337646484375, 5.242431640625, 5.46148681640625, 5.6805419921875, 5.89959716796875, 6.11865234375, 6.33770751953125, 6.5567626953125, 6.77581787109375, 6.994873046875, 7.21392822265625, 7.4329833984375, 7.65203857421875, 7.87109375]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 0.0, 2.0, 3.0, 7.0, 3.0, 7.0, 7.0, 11.0, 10.0, 12.0, 10.0, 13.0, 17.0, 28.0, 21.0, 34.0, 46.0, 68.0, 112.0, 187.0, 349.0, 758.0, 1833.0, 5411.0, 22313.0, 174529.0, 1666558.0, 2043763.0, 239519.0, 28119.0, 6404.0, 2155.0, 926.0, 420.0, 200.0, 107.0, 75.0, 48.0, 40.0, 31.0, 24.0, 16.0, 19.0, 13.0, 11.0, 11.0, 13.0, 4.0, 4.0, 5.0, 4.0, 2.0, 2.0, 2.0, 5.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-14.4453125, -13.9483642578125, -13.451416015625, -12.9544677734375, -12.45751953125, -11.9605712890625, -11.463623046875, -10.9666748046875, -10.4697265625, -9.9727783203125, -9.475830078125, -8.9788818359375, -8.48193359375, -7.9849853515625, -7.488037109375, -6.9910888671875, -6.494140625, -5.9971923828125, -5.500244140625, -5.0032958984375, -4.50634765625, -4.0093994140625, -3.512451171875, -3.0155029296875, -2.5185546875, -2.0216064453125, -1.524658203125, -1.0277099609375, -0.53076171875, -0.0338134765625, 0.463134765625, 0.9600830078125, 1.45703125, 1.9539794921875, 2.450927734375, 2.9478759765625, 3.44482421875, 3.9417724609375, 4.438720703125, 4.9356689453125, 5.4326171875, 5.9295654296875, 6.426513671875, 6.9234619140625, 7.42041015625, 7.9173583984375, 8.414306640625, 8.9112548828125, 9.408203125, 9.9051513671875, 10.402099609375, 10.8990478515625, 11.39599609375, 11.8929443359375, 12.389892578125, 12.8868408203125, 13.3837890625, 13.8807373046875, 14.377685546875, 14.8746337890625, 15.37158203125, 15.8685302734375, 16.365478515625, 16.8624267578125, 17.359375]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 2.0, 5.0, 6.0, 8.0, 8.0, 10.0, 13.0, 19.0, 18.0, 19.0, 31.0, 47.0, 74.0, 81.0, 126.0, 187.0, 234.0, 285.0, 369.0, 429.0, 464.0, 400.0, 328.0, 261.0, 178.0, 102.0, 94.0, 66.0, 54.0, 35.0, 36.0, 19.0, 20.0, 8.0, 10.0, 11.0, 9.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.921875, -12.543701171875, -12.16552734375, -11.787353515625, -11.4091796875, -11.031005859375, -10.65283203125, -10.274658203125, -9.896484375, -9.518310546875, -9.14013671875, -8.761962890625, -8.3837890625, -8.005615234375, -7.62744140625, -7.249267578125, -6.87109375, -6.492919921875, -6.11474609375, -5.736572265625, -5.3583984375, -4.980224609375, -4.60205078125, -4.223876953125, -3.845703125, -3.467529296875, -3.08935546875, -2.711181640625, -2.3330078125, -1.954833984375, -1.57666015625, -1.198486328125, -0.8203125, -0.442138671875, -0.06396484375, 0.314208984375, 0.6923828125, 1.070556640625, 1.44873046875, 1.826904296875, 2.205078125, 2.583251953125, 2.96142578125, 3.339599609375, 3.7177734375, 4.095947265625, 4.47412109375, 4.852294921875, 5.23046875, 5.608642578125, 5.98681640625, 6.364990234375, 6.7431640625, 7.121337890625, 7.49951171875, 7.877685546875, 8.255859375, 8.634033203125, 9.01220703125, 9.390380859375, 9.7685546875, 10.146728515625, 10.52490234375, 10.903076171875, 11.28125]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 7.0, 4.0, 3.0, 4.0, 6.0, 10.0, 12.0, 20.0, 29.0, 26.0, 21.0, 43.0, 60.0, 61.0, 72.0, 108.0, 150.0, 191.0, 352.0, 629.0, 1605.0, 5716.0, 35793.0, 758829.0, 3246655.0, 126089.0, 12580.0, 2791.0, 988.0, 450.0, 264.0, 178.0, 117.0, 93.0, 72.0, 46.0, 46.0, 47.0, 18.0, 27.0, 13.0, 17.0, 19.0, 10.0, 5.0, 3.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-30.125, -29.12890625, -28.1328125, -27.13671875, -26.140625, -25.14453125, -24.1484375, -23.15234375, -22.15625, -21.16015625, -20.1640625, -19.16796875, -18.171875, -17.17578125, -16.1796875, -15.18359375, -14.1875, -13.19140625, -12.1953125, -11.19921875, -10.203125, -9.20703125, -8.2109375, -7.21484375, -6.21875, -5.22265625, -4.2265625, -3.23046875, -2.234375, -1.23828125, -0.2421875, 0.75390625, 1.75, 2.74609375, 3.7421875, 4.73828125, 5.734375, 6.73046875, 7.7265625, 8.72265625, 9.71875, 10.71484375, 11.7109375, 12.70703125, 13.703125, 14.69921875, 15.6953125, 16.69140625, 17.6875, 18.68359375, 19.6796875, 20.67578125, 21.671875, 22.66796875, 23.6640625, 24.66015625, 25.65625, 26.65234375, 27.6484375, 28.64453125, 29.640625, 30.63671875, 31.6328125, 32.62890625, 33.625]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 10.0, 60.0, 212.0, 369.0, 256.0, 82.0, 21.0, 8.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-257.1615295410156, -251.8807373046875, -246.59996032714844, -241.3191680908203, -236.0383758544922, -230.75759887695312, -225.476806640625, -220.19601440429688, -214.9152374267578, -209.6344451904297, -204.35366821289062, -199.0728759765625, -193.79208374023438, -188.5113067626953, -183.2305145263672, -177.94973754882812, -172.6689453125, -167.38815307617188, -162.1073760986328, -156.8265838623047, -151.54579162597656, -146.2650146484375, -140.98422241210938, -135.70343017578125, -130.42263793945312, -125.14185333251953, -119.8610610961914, -114.58027648925781, -109.29949188232422, -104.01870727539062, -98.7379150390625, -93.4571304321289, -88.17633819580078, -82.89555358886719, -77.61476135253906, -72.33397674560547, -67.05319213867188, -61.772403717041016, -56.491615295410156, -51.21083068847656, -45.9300422668457, -40.649253845214844, -35.36846923828125, -30.08768081665039, -24.806894302368164, -19.526107788085938, -14.245319366455078, -8.964534759521484, -3.683746337890625, 1.5970406532287598, 6.8778276443481445, 12.158615112304688, 17.439401626586914, 22.72018814086914, 28.0009765625, 33.281761169433594, 38.56254959106445, 43.84333801269531, 49.124122619628906, 54.404911041259766, 59.685699462890625, 64.96648406982422, 70.24726867675781, 75.52806091308594, 80.80884552001953]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 0.0, 3.0, 3.0, 2.0, 7.0, 6.0, 12.0, 5.0, 11.0, 10.0, 25.0, 10.0, 19.0, 30.0, 21.0, 31.0, 25.0, 28.0, 42.0, 36.0, 34.0, 42.0, 43.0, 49.0, 39.0, 48.0, 50.0, 33.0, 30.0, 30.0, 35.0, 35.0, 30.0, 26.0, 25.0, 18.0, 25.0, 17.0, 12.0, 13.0, 9.0, 6.0, 13.0, 3.0, 4.0, 6.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-45.03558349609375, -43.67991256713867, -42.32424545288086, -40.96857452392578, -39.61290740966797, -38.25723648071289, -36.90156555175781, -35.5458984375, -34.19023132324219, -32.83456039428711, -31.478893280029297, -30.12322235107422, -28.767555236816406, -27.411884307861328, -26.056215286254883, -24.700546264648438, -23.34487533569336, -21.989206314086914, -20.63353729248047, -19.27786636352539, -17.922199249267578, -16.5665283203125, -15.210859298706055, -13.85519027709961, -12.499521255493164, -11.143852233886719, -9.788183212280273, -8.432513236999512, -7.076844215393066, -5.721175193786621, -4.365505218505859, -3.009836196899414, -1.6541671752929688, -0.29849791526794434, 1.05717134475708, 2.4128408432006836, 3.768509864807129, 5.124178886413574, 6.479848861694336, 7.835517883300781, 9.191186904907227, 10.546855926513672, 11.902524948120117, 13.258194923400879, 14.613863945007324, 15.96953296661377, 17.32520294189453, 18.680871963500977, 20.036540985107422, 21.392210006713867, 22.747879028320312, 24.10354995727539, 25.459217071533203, 26.81488800048828, 28.170557022094727, 29.526226043701172, 30.881895065307617, 32.23756408691406, 33.59323501586914, 34.94890213012695, 36.30457305908203, 37.660240173339844, 39.01591110229492, 40.37158203125, 41.72724914550781]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 5.0, 1.0, 3.0, 5.0, 1.0, 2.0, 7.0, 5.0, 6.0, 11.0, 16.0, 13.0, 14.0, 15.0, 13.0, 11.0, 26.0, 29.0, 35.0, 32.0, 24.0, 22.0, 36.0, 42.0, 42.0, 32.0, 36.0, 46.0, 44.0, 44.0, 43.0, 31.0, 26.0, 30.0, 28.0, 32.0, 29.0, 22.0, 21.0, 23.0, 18.0, 11.0, 14.0, 13.0, 12.0, 7.0, 7.0, 11.0, 5.0, 4.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6875, -6.46820068359375, -6.2489013671875, -6.02960205078125, -5.810302734375, -5.59100341796875, -5.3717041015625, -5.15240478515625, -4.93310546875, -4.71380615234375, -4.4945068359375, -4.27520751953125, -4.055908203125, -3.83660888671875, -3.6173095703125, -3.39801025390625, -3.1787109375, -2.95941162109375, -2.7401123046875, -2.52081298828125, -2.301513671875, -2.08221435546875, -1.8629150390625, -1.64361572265625, -1.42431640625, -1.20501708984375, -0.9857177734375, -0.76641845703125, -0.547119140625, -0.32781982421875, -0.1085205078125, 0.11077880859375, 0.330078125, 0.54937744140625, 0.7686767578125, 0.98797607421875, 1.207275390625, 1.42657470703125, 1.6458740234375, 1.86517333984375, 2.08447265625, 2.30377197265625, 2.5230712890625, 2.74237060546875, 2.961669921875, 3.18096923828125, 3.4002685546875, 3.61956787109375, 3.8388671875, 4.05816650390625, 4.2774658203125, 4.49676513671875, 4.716064453125, 4.93536376953125, 5.1546630859375, 5.37396240234375, 5.59326171875, 5.81256103515625, 6.0318603515625, 6.25115966796875, 6.470458984375, 6.68975830078125, 6.9090576171875, 7.12835693359375, 7.34765625]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 11.0, 9.0, 19.0, 29.0, 25.0, 70.0, 80.0, 164.0, 233.0, 329.0, 542.0, 760.0, 1159.0, 1938.0, 2978.0, 4572.0, 7404.0, 11886.0, 19448.0, 32753.0, 55997.0, 95774.0, 155651.0, 205569.0, 174882.0, 112565.0, 65476.0, 38301.0, 22909.0, 13771.0, 8497.0, 5249.0, 3334.0, 2173.0, 1411.0, 904.0, 564.0, 359.0, 257.0, 167.0, 110.0, 67.0, 59.0, 29.0, 26.0, 15.0, 12.0, 5.0, 7.0, 2.0, 1.0, 3.0, 1.0, 3.0], "bins": [-0.79638671875, -0.7727203369140625, -0.749053955078125, -0.7253875732421875, -0.70172119140625, -0.6780548095703125, -0.654388427734375, -0.6307220458984375, -0.6070556640625, -0.5833892822265625, -0.559722900390625, -0.5360565185546875, -0.51239013671875, -0.4887237548828125, -0.465057373046875, -0.4413909912109375, -0.417724609375, -0.3940582275390625, -0.370391845703125, -0.3467254638671875, -0.32305908203125, -0.2993927001953125, -0.275726318359375, -0.2520599365234375, -0.2283935546875, -0.2047271728515625, -0.181060791015625, -0.1573944091796875, -0.13372802734375, -0.1100616455078125, -0.086395263671875, -0.0627288818359375, -0.0390625, -0.0153961181640625, 0.008270263671875, 0.0319366455078125, 0.05560302734375, 0.0792694091796875, 0.102935791015625, 0.1266021728515625, 0.1502685546875, 0.1739349365234375, 0.197601318359375, 0.2212677001953125, 0.24493408203125, 0.2686004638671875, 0.292266845703125, 0.3159332275390625, 0.339599609375, 0.3632659912109375, 0.386932373046875, 0.4105987548828125, 0.43426513671875, 0.4579315185546875, 0.481597900390625, 0.5052642822265625, 0.5289306640625, 0.5525970458984375, 0.576263427734375, 0.5999298095703125, 0.62359619140625, 0.6472625732421875, 0.670928955078125, 0.6945953369140625, 0.71826171875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 4.0, 2.0, 4.0, 6.0, 9.0, 9.0, 11.0, 9.0, 7.0, 10.0, 19.0, 25.0, 31.0, 17.0, 28.0, 26.0, 47.0, 36.0, 36.0, 40.0, 42.0, 31.0, 44.0, 1060.0, 42.0, 47.0, 33.0, 34.0, 35.0, 31.0, 43.0, 32.0, 26.0, 21.0, 25.0, 16.0, 23.0, 16.0, 10.0, 6.0, 8.0, 6.0, 7.0, 6.0, 4.0, 3.0, 2.0, 4.0, 0.0, 3.0, 0.0, 2.0, 1.0], "bins": [-5.1015625, -4.9530029296875, -4.804443359375, -4.6558837890625, -4.50732421875, -4.3587646484375, -4.210205078125, -4.0616455078125, -3.9130859375, -3.7645263671875, -3.615966796875, -3.4674072265625, -3.31884765625, -3.1702880859375, -3.021728515625, -2.8731689453125, -2.724609375, -2.5760498046875, -2.427490234375, -2.2789306640625, -2.13037109375, -1.9818115234375, -1.833251953125, -1.6846923828125, -1.5361328125, -1.3875732421875, -1.239013671875, -1.0904541015625, -0.94189453125, -0.7933349609375, -0.644775390625, -0.4962158203125, -0.34765625, -0.1990966796875, -0.050537109375, 0.0980224609375, 0.24658203125, 0.3951416015625, 0.543701171875, 0.6922607421875, 0.8408203125, 0.9893798828125, 1.137939453125, 1.2864990234375, 1.43505859375, 1.5836181640625, 1.732177734375, 1.8807373046875, 2.029296875, 2.1778564453125, 2.326416015625, 2.4749755859375, 2.62353515625, 2.7720947265625, 2.920654296875, 3.0692138671875, 3.2177734375, 3.3663330078125, 3.514892578125, 3.6634521484375, 3.81201171875, 3.9605712890625, 4.109130859375, 4.2576904296875, 4.40625]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 6.0, 12.0, 7.0, 22.0, 21.0, 32.0, 49.0, 79.0, 115.0, 183.0, 238.0, 449.0, 675.0, 1034.0, 1648.0, 2682.0, 4442.0, 6896.0, 11138.0, 18353.0, 29077.0, 47974.0, 78086.0, 121352.0, 164438.0, 1221834.0, 139396.0, 94849.0, 58394.0, 35932.0, 21861.0, 13284.0, 8499.0, 5203.0, 3225.0, 2033.0, 1263.0, 779.0, 567.0, 356.0, 212.0, 149.0, 93.0, 61.0, 46.0, 35.0, 18.0, 15.0, 4.0, 10.0, 2.0, 4.0, 2.0, 2.0, 0.0, 3.0], "bins": [-0.59375, -0.57586669921875, -0.5579833984375, -0.54010009765625, -0.522216796875, -0.50433349609375, -0.4864501953125, -0.46856689453125, -0.45068359375, -0.43280029296875, -0.4149169921875, -0.39703369140625, -0.379150390625, -0.36126708984375, -0.3433837890625, -0.32550048828125, -0.3076171875, -0.28973388671875, -0.2718505859375, -0.25396728515625, -0.236083984375, -0.21820068359375, -0.2003173828125, -0.18243408203125, -0.16455078125, -0.14666748046875, -0.1287841796875, -0.11090087890625, -0.093017578125, -0.07513427734375, -0.0572509765625, -0.03936767578125, -0.021484375, -0.00360107421875, 0.0142822265625, 0.03216552734375, 0.050048828125, 0.06793212890625, 0.0858154296875, 0.10369873046875, 0.12158203125, 0.13946533203125, 0.1573486328125, 0.17523193359375, 0.193115234375, 0.21099853515625, 0.2288818359375, 0.24676513671875, 0.2646484375, 0.28253173828125, 0.3004150390625, 0.31829833984375, 0.336181640625, 0.35406494140625, 0.3719482421875, 0.38983154296875, 0.40771484375, 0.42559814453125, 0.4434814453125, 0.46136474609375, 0.479248046875, 0.49713134765625, 0.5150146484375, 0.53289794921875, 0.55078125]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 3.0, 3.0, 6.0, 6.0, 4.0, 4.0, 7.0, 13.0, 22.0, 16.0, 17.0, 15.0, 20.0, 27.0, 29.0, 43.0, 38.0, 50.0, 37.0, 49.0, 50.0, 54.0, 48.0, 40.0, 50.0, 39.0, 41.0, 37.0, 34.0, 34.0, 32.0, 21.0, 17.0, 15.0, 10.0, 14.0, 16.0, 16.0, 6.0, 5.0, 6.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0017518997192382812, -0.001692935824394226, -0.001633971929550171, -0.0015750080347061157, -0.0015160441398620605, -0.0014570802450180054, -0.0013981163501739502, -0.001339152455329895, -0.0012801885604858398, -0.0012212246656417847, -0.0011622607707977295, -0.0011032968759536743, -0.0010443329811096191, -0.000985369086265564, -0.0009264051914215088, -0.0008674412965774536, -0.0008084774017333984, -0.0007495135068893433, -0.0006905496120452881, -0.0006315857172012329, -0.0005726218223571777, -0.0005136579275131226, -0.0004546940326690674, -0.0003957301378250122, -0.00033676624298095703, -0.00027780234813690186, -0.00021883845329284668, -0.0001598745584487915, -0.00010091066360473633, -4.194676876068115e-05, 1.7017126083374023e-05, 7.59810209274292e-05, 0.00013494491577148438, 0.00019390881061553955, 0.0002528727054595947, 0.0003118366003036499, 0.0003708004951477051, 0.00042976438999176025, 0.0004887282848358154, 0.0005476921796798706, 0.0006066560745239258, 0.000665619969367981, 0.0007245838642120361, 0.0007835477590560913, 0.0008425116539001465, 0.0009014755487442017, 0.0009604394435882568, 0.001019403338432312, 0.0010783672332763672, 0.0011373311281204224, 0.0011962950229644775, 0.0012552589178085327, 0.0013142228126525879, 0.001373186707496643, 0.0014321506023406982, 0.0014911144971847534, 0.0015500783920288086, 0.0016090422868728638, 0.001668006181716919, 0.0017269700765609741, 0.0017859339714050293, 0.0018448978662490845, 0.0019038617610931396, 0.001962825655937195, 0.00202178955078125]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 3.0, 6.0, 7.0, 5.0, 13.0, 19.0, 14.0, 17.0, 20.0, 30.0, 27.0, 31.0, 58.0, 68.0, 86.0, 123.0, 155.0, 223.0, 450.0, 1180.0, 65527.0, 972343.0, 6360.0, 682.0, 337.0, 199.0, 126.0, 93.0, 63.0, 53.0, 52.0, 34.0, 31.0, 24.0, 16.0, 18.0, 10.0, 14.0, 8.0, 4.0, 6.0, 5.0, 4.0, 3.0, 2.0, 5.0, 1.0, 3.0, 2.0], "bins": [-0.044769287109375, -0.043535709381103516, -0.04230213165283203, -0.04106855392456055, -0.03983497619628906, -0.03860139846801758, -0.037367820739746094, -0.03613424301147461, -0.034900665283203125, -0.03366708755493164, -0.032433509826660156, -0.031199932098388672, -0.029966354370117188, -0.028732776641845703, -0.02749919891357422, -0.026265621185302734, -0.02503204345703125, -0.023798465728759766, -0.02256488800048828, -0.021331310272216797, -0.020097732543945312, -0.018864154815673828, -0.017630577087402344, -0.01639699935913086, -0.015163421630859375, -0.01392984390258789, -0.012696266174316406, -0.011462688446044922, -0.010229110717773438, -0.008995532989501953, -0.007761955261230469, -0.006528377532958984, -0.0052947998046875, -0.004061222076416016, -0.0028276443481445312, -0.0015940666198730469, -0.0003604888916015625, 0.0008730888366699219, 0.0021066665649414062, 0.0033402442932128906, 0.004573822021484375, 0.005807399749755859, 0.007040977478027344, 0.008274555206298828, 0.009508132934570312, 0.010741710662841797, 0.011975288391113281, 0.013208866119384766, 0.01444244384765625, 0.015676021575927734, 0.01690959930419922, 0.018143177032470703, 0.019376754760742188, 0.020610332489013672, 0.021843910217285156, 0.02307748794555664, 0.024311065673828125, 0.02554464340209961, 0.026778221130371094, 0.028011798858642578, 0.029245376586914062, 0.030478954315185547, 0.03171253204345703, 0.032946109771728516, 0.0341796875]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 14.0, 36.0, 60.0, 184.0, 279.0, 260.0, 136.0, 28.0, 8.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0051488433964550495, -0.00503904465585947, -0.004929245915263891, -0.004819447174668312, -0.00470964889973402, -0.004599850159138441, -0.004490051418542862, -0.004380252677947283, -0.004270453937351704, -0.0041606551967561245, -0.004050856456160545, -0.0039410581812262535, -0.0038312592078000307, -0.003721460700035095, -0.003611661959439516, -0.003501863218843937, -0.0033920647110790014, -0.0032822659704834223, -0.003172467462718487, -0.0030626687221229076, -0.0029528699815273285, -0.0028430712409317493, -0.002733272733166814, -0.0026234739925712347, -0.002513675484806299, -0.00240387674421072, -0.0022940782364457846, -0.0021842794958502054, -0.0020744807552546263, -0.0019646822474896908, -0.0018548835068941116, -0.0017450847662985325, -0.0016352861421182752, -0.0015254875179380178, -0.0014156887773424387, -0.0013058901531621814, -0.001196091528981924, -0.001086292788386345, -0.0009764941642060876, -0.0008666954818181694, -0.0007568967994302511, -0.0006470981170423329, -0.0005372994346544147, -0.00042750081047415733, -0.0003177021280862391, -0.00020790344569832087, -9.810482151806355e-05, 1.1693860869854689e-05, 0.00012149254325777292, 0.00023129121109377593, 0.00034108987892977893, 0.0004508885322138667, 0.0005606872146017849, 0.0006704858969897032, 0.0007802845211699605, 0.0008900832035578787, 0.000999881885945797, 0.0011096805101260543, 0.0012194792507216334, 0.0013292778749018908, 0.00143907661549747, 0.0015488752396777272, 0.0016586738638579845, 0.0017684726044535637, 0.001878271228633821]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 3.0, 7.0, 5.0, 10.0, 9.0, 11.0, 17.0, 30.0, 23.0, 16.0, 31.0, 32.0, 37.0, 50.0, 43.0, 51.0, 44.0, 61.0, 51.0, 51.0, 43.0, 44.0, 51.0, 43.0, 31.0, 32.0, 29.0, 22.0, 19.0, 26.0, 22.0, 9.0, 7.0, 8.0, 11.0, 9.0, 4.0, 4.0, 2.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012853741645812988, -0.0012443633750081062, -0.0012033525854349136, -0.001162341795861721, -0.0011213310062885284, -0.0010803202167153358, -0.0010393094271421432, -0.0009982986375689507, -0.0009572878479957581, -0.0009162770584225655, -0.0008752662688493729, -0.0008342554792761803, -0.0007932446897029877, -0.0007522339001297951, -0.0007112231105566025, -0.0006702123209834099, -0.0006292015314102173, -0.0005881907418370247, -0.0005471799522638321, -0.0005061691626906395, -0.0004651583731174469, -0.0004241475835442543, -0.0003831367939710617, -0.0003421260043978691, -0.0003011152148246765, -0.0002601044252514839, -0.00021909363567829132, -0.00017808284610509872, -0.00013707205653190613, -9.606126695871353e-05, -5.5050477385520935e-05, -1.4039687812328339e-05, 2.6971101760864258e-05, 6.798189133405685e-05, 0.00010899268090724945, 0.00015000347048044205, 0.00019101426005363464, 0.00023202504962682724, 0.00027303583920001984, 0.00031404662877321243, 0.00035505741834640503, 0.0003960682079195976, 0.0004370789974927902, 0.0004780897870659828, 0.0005191005766391754, 0.000560111366212368, 0.0006011221557855606, 0.0006421329453587532, 0.0006831437349319458, 0.0007241545245051384, 0.000765165314078331, 0.0008061761036515236, 0.0008471868932247162, 0.0008881976827979088, 0.0009292084723711014, 0.000970219261944294, 0.0010112300515174866, 0.0010522408410906792, 0.0010932516306638718, 0.0011342624202370644, 0.001175273209810257, 0.0012162839993834496, 0.0012572947889566422, 0.0012983055785298347, 0.0013393163681030273]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 5.0, 1.0, 3.0, 5.0, 1.0, 2.0, 7.0, 5.0, 6.0, 11.0, 16.0, 13.0, 14.0, 15.0, 13.0, 11.0, 26.0, 29.0, 35.0, 32.0, 24.0, 22.0, 36.0, 42.0, 41.0, 33.0, 36.0, 46.0, 44.0, 44.0, 43.0, 31.0, 26.0, 30.0, 28.0, 32.0, 29.0, 22.0, 21.0, 23.0, 18.0, 11.0, 14.0, 13.0, 12.0, 7.0, 7.0, 11.0, 5.0, 4.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6875, -6.46820068359375, -6.2489013671875, -6.02960205078125, -5.810302734375, -5.59100341796875, -5.3717041015625, -5.15240478515625, -4.93310546875, -4.71380615234375, -4.4945068359375, -4.27520751953125, -4.055908203125, -3.83660888671875, -3.6173095703125, -3.39801025390625, -3.1787109375, -2.95941162109375, -2.7401123046875, -2.52081298828125, -2.301513671875, -2.08221435546875, -1.8629150390625, -1.64361572265625, -1.42431640625, -1.20501708984375, -0.9857177734375, -0.76641845703125, -0.547119140625, -0.32781982421875, -0.1085205078125, 0.11077880859375, 0.330078125, 0.54937744140625, 0.7686767578125, 0.98797607421875, 1.207275390625, 1.42657470703125, 1.6458740234375, 1.86517333984375, 2.08447265625, 2.30377197265625, 2.5230712890625, 2.74237060546875, 2.961669921875, 3.18096923828125, 3.4002685546875, 3.61956787109375, 3.8388671875, 4.05816650390625, 4.2774658203125, 4.49676513671875, 4.716064453125, 4.93536376953125, 5.1546630859375, 5.37396240234375, 5.59326171875, 5.81256103515625, 6.0318603515625, 6.25115966796875, 6.470458984375, 6.68975830078125, 6.9090576171875, 7.12835693359375, 7.34765625]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 6.0, 1.0, 5.0, 9.0, 3.0, 5.0, 12.0, 9.0, 9.0, 24.0, 26.0, 30.0, 45.0, 38.0, 74.0, 61.0, 109.0, 147.0, 209.0, 275.0, 322.0, 422.0, 650.0, 1187.0, 3344.0, 15247.0, 97061.0, 814068.0, 93484.0, 14709.0, 3355.0, 1117.0, 651.0, 426.0, 314.0, 279.0, 212.0, 154.0, 111.0, 84.0, 69.0, 41.0, 27.0, 34.0, 21.0, 18.0, 14.0, 14.0, 8.0, 7.0, 7.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.90625, -16.351806640625, -15.79736328125, -15.242919921875, -14.6884765625, -14.134033203125, -13.57958984375, -13.025146484375, -12.470703125, -11.916259765625, -11.36181640625, -10.807373046875, -10.2529296875, -9.698486328125, -9.14404296875, -8.589599609375, -8.03515625, -7.480712890625, -6.92626953125, -6.371826171875, -5.8173828125, -5.262939453125, -4.70849609375, -4.154052734375, -3.599609375, -3.045166015625, -2.49072265625, -1.936279296875, -1.3818359375, -0.827392578125, -0.27294921875, 0.281494140625, 0.8359375, 1.390380859375, 1.94482421875, 2.499267578125, 3.0537109375, 3.608154296875, 4.16259765625, 4.717041015625, 5.271484375, 5.825927734375, 6.38037109375, 6.934814453125, 7.4892578125, 8.043701171875, 8.59814453125, 9.152587890625, 9.70703125, 10.261474609375, 10.81591796875, 11.370361328125, 11.9248046875, 12.479248046875, 13.03369140625, 13.588134765625, 14.142578125, 14.697021484375, 15.25146484375, 15.805908203125, 16.3603515625, 16.914794921875, 17.46923828125, 18.023681640625, 18.578125]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 3.0, 1.0, 2.0, 5.0, 8.0, 6.0, 5.0, 4.0, 10.0, 9.0, 18.0, 17.0, 22.0, 11.0, 15.0, 26.0, 24.0, 32.0, 34.0, 35.0, 53.0, 46.0, 52.0, 103.0, 245.0, 1639.0, 131.0, 71.0, 58.0, 48.0, 42.0, 28.0, 42.0, 31.0, 21.0, 30.0, 19.0, 26.0, 15.0, 11.0, 15.0, 14.0, 11.0, 7.0, 2.0, 6.0, 1.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.015625, -20.2724609375, -19.529296875, -18.7861328125, -18.04296875, -17.2998046875, -16.556640625, -15.8134765625, -15.0703125, -14.3271484375, -13.583984375, -12.8408203125, -12.09765625, -11.3544921875, -10.611328125, -9.8681640625, -9.125, -8.3818359375, -7.638671875, -6.8955078125, -6.15234375, -5.4091796875, -4.666015625, -3.9228515625, -3.1796875, -2.4365234375, -1.693359375, -0.9501953125, -0.20703125, 0.5361328125, 1.279296875, 2.0224609375, 2.765625, 3.5087890625, 4.251953125, 4.9951171875, 5.73828125, 6.4814453125, 7.224609375, 7.9677734375, 8.7109375, 9.4541015625, 10.197265625, 10.9404296875, 11.68359375, 12.4267578125, 13.169921875, 13.9130859375, 14.65625, 15.3994140625, 16.142578125, 16.8857421875, 17.62890625, 18.3720703125, 19.115234375, 19.8583984375, 20.6015625, 21.3447265625, 22.087890625, 22.8310546875, 23.57421875, 24.3173828125, 25.060546875, 25.8037109375, 26.546875]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 6.0, 3.0, 4.0, 5.0, 6.0, 9.0, 14.0, 18.0, 16.0, 20.0, 23.0, 26.0, 33.0, 35.0, 45.0, 59.0, 80.0, 112.0, 196.0, 354.0, 998.0, 8473.0, 3081142.0, 50944.0, 1787.0, 517.0, 235.0, 137.0, 90.0, 63.0, 44.0, 35.0, 29.0, 17.0, 23.0, 24.0, 19.0, 18.0, 11.0, 7.0, 9.0, 2.0, 7.0, 9.0, 3.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-74.625, -72.4736328125, -70.322265625, -68.1708984375, -66.01953125, -63.8681640625, -61.716796875, -59.5654296875, -57.4140625, -55.2626953125, -53.111328125, -50.9599609375, -48.80859375, -46.6572265625, -44.505859375, -42.3544921875, -40.203125, -38.0517578125, -35.900390625, -33.7490234375, -31.59765625, -29.4462890625, -27.294921875, -25.1435546875, -22.9921875, -20.8408203125, -18.689453125, -16.5380859375, -14.38671875, -12.2353515625, -10.083984375, -7.9326171875, -5.78125, -3.6298828125, -1.478515625, 0.6728515625, 2.82421875, 4.9755859375, 7.126953125, 9.2783203125, 11.4296875, 13.5810546875, 15.732421875, 17.8837890625, 20.03515625, 22.1865234375, 24.337890625, 26.4892578125, 28.640625, 30.7919921875, 32.943359375, 35.0947265625, 37.24609375, 39.3974609375, 41.548828125, 43.7001953125, 45.8515625, 48.0029296875, 50.154296875, 52.3056640625, 54.45703125, 56.6083984375, 58.759765625, 60.9111328125, 63.0625]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 243.0, 601.0, 160.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-123.7018814086914, -120.00689697265625, -116.3119125366211, -112.61692810058594, -108.92194366455078, -105.22695922851562, -101.53197479248047, -97.83699035644531, -94.14200592041016, -90.447021484375, -86.75203704833984, -83.05705261230469, -79.36206817626953, -75.66708374023438, -71.97209930419922, -68.27711486816406, -64.58212280273438, -60.88713836669922, -57.19215393066406, -53.497169494628906, -49.80218505859375, -46.107200622558594, -42.41221618652344, -38.71723175048828, -35.022247314453125, -31.32726287841797, -27.632278442382812, -23.937294006347656, -20.2423095703125, -16.54732322692871, -12.852338790893555, -9.157354354858398, -5.462371826171875, -1.7673871517181396, 1.9275975227355957, 5.62258243560791, 9.317566871643066, 13.012552261352539, 16.707536697387695, 20.40252113342285, 24.097505569458008, 27.792490005493164, 31.48747444152832, 35.18246078491211, 38.877445220947266, 42.57242965698242, 46.26741409301758, 49.962398529052734, 53.65738296508789, 57.35236740112305, 61.0473518371582, 64.74234008789062, 68.43732452392578, 72.13230895996094, 75.8272933959961, 79.52227783203125, 83.2172622680664, 86.91224670410156, 90.60723114013672, 94.30221557617188, 97.99720001220703, 101.69218444824219, 105.38716888427734, 109.0821533203125, 112.77713775634766]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 6.0, 1.0, 0.0, 5.0, 2.0, 4.0, 2.0, 7.0, 6.0, 8.0, 8.0, 8.0, 10.0, 21.0, 14.0, 28.0, 20.0, 29.0, 27.0, 24.0, 40.0, 39.0, 37.0, 34.0, 43.0, 45.0, 30.0, 42.0, 40.0, 51.0, 31.0, 45.0, 33.0, 33.0, 31.0, 15.0, 22.0, 17.0, 13.0, 24.0, 13.0, 20.0, 12.0, 13.0, 4.0, 14.0, 6.0, 4.0, 10.0, 5.0, 2.0, 1.0, 2.0, 5.0, 1.0, 1.0, 2.0, 4.0], "bins": [-58.57500076293945, -56.92686080932617, -55.27872085571289, -53.63058090209961, -51.98244094848633, -50.33430099487305, -48.6861572265625, -47.03801727294922, -45.38987731933594, -43.741737365722656, -42.093597412109375, -40.445457458496094, -38.79731750488281, -37.14917755126953, -35.50103759765625, -33.85289764404297, -32.20475769042969, -30.556617736816406, -28.908477783203125, -27.260337829589844, -25.612197875976562, -23.96405792236328, -22.315916061401367, -20.667776107788086, -19.019636154174805, -17.371496200561523, -15.723356246948242, -14.075215339660645, -12.427075386047363, -10.778935432434082, -9.130794525146484, -7.482654571533203, -5.8345184326171875, -4.186378479003906, -2.538238048553467, -0.8900976181030273, 0.7580423355102539, 2.406182289123535, 4.054323196411133, 5.702463150024414, 7.350603103637695, 8.998743057250977, 10.646883010864258, 12.295023918151855, 13.943163871765137, 15.591303825378418, 17.239444732666016, 18.887584686279297, 20.535724639892578, 22.18386459350586, 23.83200454711914, 25.480144500732422, 27.128284454345703, 28.776424407958984, 30.4245662689209, 32.07270812988281, 33.720848083496094, 35.368988037109375, 37.017127990722656, 38.66526794433594, 40.31340789794922, 41.9615478515625, 43.60968780517578, 45.25782775878906, 46.905967712402344]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 4.0, 5.0, 7.0, 8.0, 6.0, 8.0, 12.0, 11.0, 13.0, 20.0, 26.0, 22.0, 21.0, 26.0, 30.0, 31.0, 34.0, 20.0, 29.0, 38.0, 38.0, 32.0, 40.0, 46.0, 39.0, 33.0, 36.0, 34.0, 28.0, 39.0, 38.0, 23.0, 28.0, 21.0, 24.0, 18.0, 14.0, 15.0, 13.0, 16.0, 11.0, 11.0, 7.0, 6.0, 7.0, 5.0, 2.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.7578125, -6.5355224609375, -6.313232421875, -6.0909423828125, -5.86865234375, -5.6463623046875, -5.424072265625, -5.2017822265625, -4.9794921875, -4.7572021484375, -4.534912109375, -4.3126220703125, -4.09033203125, -3.8680419921875, -3.645751953125, -3.4234619140625, -3.201171875, -2.9788818359375, -2.756591796875, -2.5343017578125, -2.31201171875, -2.0897216796875, -1.867431640625, -1.6451416015625, -1.4228515625, -1.2005615234375, -0.978271484375, -0.7559814453125, -0.53369140625, -0.3114013671875, -0.089111328125, 0.1331787109375, 0.35546875, 0.5777587890625, 0.800048828125, 1.0223388671875, 1.24462890625, 1.4669189453125, 1.689208984375, 1.9114990234375, 2.1337890625, 2.3560791015625, 2.578369140625, 2.8006591796875, 3.02294921875, 3.2452392578125, 3.467529296875, 3.6898193359375, 3.912109375, 4.1343994140625, 4.356689453125, 4.5789794921875, 4.80126953125, 5.0235595703125, 5.245849609375, 5.4681396484375, 5.6904296875, 5.9127197265625, 6.135009765625, 6.3572998046875, 6.57958984375, 6.8018798828125, 7.024169921875, 7.2464599609375, 7.46875]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 8.0, 9.0, 6.0, 15.0, 17.0, 24.0, 28.0, 25.0, 57.0, 73.0, 91.0, 135.0, 182.0, 276.0, 428.0, 696.0, 1214.0, 2447.0, 5449.0, 16746.0, 79677.0, 576468.0, 2175978.0, 1130890.0, 159325.0, 28361.0, 8315.0, 3280.0, 1594.0, 845.0, 504.0, 327.0, 222.0, 129.0, 114.0, 87.0, 61.0, 34.0, 35.0, 29.0, 19.0, 22.0, 9.0, 6.0, 10.0, 5.0, 5.0, 3.0, 5.0, 4.0, 0.0, 1.0, 1.0], "bins": [-14.1953125, -13.77392578125, -13.3525390625, -12.93115234375, -12.509765625, -12.08837890625, -11.6669921875, -11.24560546875, -10.82421875, -10.40283203125, -9.9814453125, -9.56005859375, -9.138671875, -8.71728515625, -8.2958984375, -7.87451171875, -7.453125, -7.03173828125, -6.6103515625, -6.18896484375, -5.767578125, -5.34619140625, -4.9248046875, -4.50341796875, -4.08203125, -3.66064453125, -3.2392578125, -2.81787109375, -2.396484375, -1.97509765625, -1.5537109375, -1.13232421875, -0.7109375, -0.28955078125, 0.1318359375, 0.55322265625, 0.974609375, 1.39599609375, 1.8173828125, 2.23876953125, 2.66015625, 3.08154296875, 3.5029296875, 3.92431640625, 4.345703125, 4.76708984375, 5.1884765625, 5.60986328125, 6.03125, 6.45263671875, 6.8740234375, 7.29541015625, 7.716796875, 8.13818359375, 8.5595703125, 8.98095703125, 9.40234375, 9.82373046875, 10.2451171875, 10.66650390625, 11.087890625, 11.50927734375, 11.9306640625, 12.35205078125, 12.7734375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 3.0, 4.0, 5.0, 8.0, 5.0, 23.0, 22.0, 47.0, 62.0, 92.0, 138.0, 188.0, 300.0, 434.0, 525.0, 589.0, 465.0, 367.0, 262.0, 160.0, 94.0, 69.0, 54.0, 46.0, 43.0, 16.0, 9.0, 11.0, 7.0, 5.0, 11.0, 6.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.59375, -16.1220703125, -15.650390625, -15.1787109375, -14.70703125, -14.2353515625, -13.763671875, -13.2919921875, -12.8203125, -12.3486328125, -11.876953125, -11.4052734375, -10.93359375, -10.4619140625, -9.990234375, -9.5185546875, -9.046875, -8.5751953125, -8.103515625, -7.6318359375, -7.16015625, -6.6884765625, -6.216796875, -5.7451171875, -5.2734375, -4.8017578125, -4.330078125, -3.8583984375, -3.38671875, -2.9150390625, -2.443359375, -1.9716796875, -1.5, -1.0283203125, -0.556640625, -0.0849609375, 0.38671875, 0.8583984375, 1.330078125, 1.8017578125, 2.2734375, 2.7451171875, 3.216796875, 3.6884765625, 4.16015625, 4.6318359375, 5.103515625, 5.5751953125, 6.046875, 6.5185546875, 6.990234375, 7.4619140625, 7.93359375, 8.4052734375, 8.876953125, 9.3486328125, 9.8203125, 10.2919921875, 10.763671875, 11.2353515625, 11.70703125, 12.1787109375, 12.650390625, 13.1220703125, 13.59375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 8.0, 11.0, 5.0, 8.0, 14.0, 15.0, 20.0, 31.0, 42.0, 50.0, 104.0, 132.0, 204.0, 355.0, 822.0, 2317.0, 12765.0, 290510.0, 3752640.0, 122810.0, 8224.0, 1714.0, 668.0, 310.0, 191.0, 113.0, 70.0, 32.0, 38.0, 19.0, 16.0, 11.0, 9.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-45.875, -44.541015625, -43.20703125, -41.873046875, -40.5390625, -39.205078125, -37.87109375, -36.537109375, -35.203125, -33.869140625, -32.53515625, -31.201171875, -29.8671875, -28.533203125, -27.19921875, -25.865234375, -24.53125, -23.197265625, -21.86328125, -20.529296875, -19.1953125, -17.861328125, -16.52734375, -15.193359375, -13.859375, -12.525390625, -11.19140625, -9.857421875, -8.5234375, -7.189453125, -5.85546875, -4.521484375, -3.1875, -1.853515625, -0.51953125, 0.814453125, 2.1484375, 3.482421875, 4.81640625, 6.150390625, 7.484375, 8.818359375, 10.15234375, 11.486328125, 12.8203125, 14.154296875, 15.48828125, 16.822265625, 18.15625, 19.490234375, 20.82421875, 22.158203125, 23.4921875, 24.826171875, 26.16015625, 27.494140625, 28.828125, 30.162109375, 31.49609375, 32.830078125, 34.1640625, 35.498046875, 36.83203125, 38.166015625, 39.5]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 15.0, 716.0, 286.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-367.4073181152344, -350.5296630859375, -333.6520080566406, -316.77435302734375, -299.8966979980469, -283.01904296875, -266.141357421875, -249.2637176513672, -232.3860626220703, -215.50840759277344, -198.63075256347656, -181.75308227539062, -164.87542724609375, -147.99777221679688, -131.1201171875, -114.24246215820312, -97.36480712890625, -80.48715209960938, -63.609493255615234, -46.731834411621094, -29.85417938232422, -12.976524353027344, 3.9011383056640625, 20.778793334960938, 37.65644836425781, 54.53410339355469, 71.41175842285156, 88.28942108154297, 105.16707611083984, 122.04473114013672, 138.92239379882812, 155.800048828125, 172.67767333984375, 189.55532836914062, 206.4329833984375, 223.31063842773438, 240.18829345703125, 257.0659484863281, 273.943603515625, 290.8212890625, 307.69891357421875, 324.5765686035156, 341.4542236328125, 358.3318786621094, 375.20953369140625, 392.0871887207031, 408.96484375, 425.842529296875, 442.7201843261719, 459.59783935546875, 476.4754943847656, 493.3531494140625, 510.2308044433594, 527.1084594726562, 543.9861450195312, 560.86376953125, 577.741455078125, 594.619140625, 611.4967651367188, 628.3744506835938, 645.2520751953125, 662.1297607421875, 679.0073852539062, 695.8850708007812, 712.7626953125]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 2.0, 4.0, 7.0, 8.0, 5.0, 8.0, 8.0, 14.0, 20.0, 12.0, 17.0, 20.0, 24.0, 29.0, 30.0, 34.0, 47.0, 34.0, 34.0, 30.0, 32.0, 50.0, 38.0, 34.0, 44.0, 45.0, 34.0, 44.0, 39.0, 33.0, 29.0, 31.0, 29.0, 26.0, 17.0, 22.0, 9.0, 8.0, 10.0, 7.0, 9.0, 11.0, 4.0, 8.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.06842041015625, -38.75014114379883, -37.431861877441406, -36.113582611083984, -34.79530334472656, -33.47702407836914, -32.15874481201172, -30.840465545654297, -29.522186279296875, -28.203907012939453, -26.88562774658203, -25.56734848022461, -24.249069213867188, -22.930789947509766, -21.612510681152344, -20.294231414794922, -18.9759521484375, -17.657672882080078, -16.339393615722656, -15.021114349365234, -13.702835083007812, -12.38455581665039, -11.066276550292969, -9.747997283935547, -8.429718017578125, -7.111438751220703, -5.793159484863281, -4.474880218505859, -3.1566009521484375, -1.8383216857910156, -0.5200424194335938, 0.7982368469238281, 2.11651611328125, 3.434795379638672, 4.753074645996094, 6.071353912353516, 7.3896331787109375, 8.70791244506836, 10.026191711425781, 11.344470977783203, 12.662750244140625, 13.981029510498047, 15.299308776855469, 16.61758804321289, 17.935867309570312, 19.254146575927734, 20.572425842285156, 21.890705108642578, 23.208984375, 24.527263641357422, 25.845542907714844, 27.163822174072266, 28.482101440429688, 29.80038070678711, 31.11865997314453, 32.43693923950195, 33.755218505859375, 35.0734977722168, 36.39177703857422, 37.71005630493164, 39.02833557128906, 40.346614837646484, 41.664894104003906, 42.98317337036133, 44.30145263671875]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 5.0, 4.0, 9.0, 6.0, 8.0, 10.0, 7.0, 9.0, 13.0, 24.0, 21.0, 30.0, 20.0, 21.0, 35.0, 33.0, 20.0, 28.0, 37.0, 33.0, 40.0, 31.0, 38.0, 44.0, 52.0, 34.0, 35.0, 41.0, 36.0, 26.0, 29.0, 32.0, 32.0, 26.0, 17.0, 22.0, 12.0, 13.0, 13.0, 17.0, 6.0, 9.0, 8.0, 0.0, 8.0, 3.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-7.98828125, -7.74749755859375, -7.5067138671875, -7.26593017578125, -7.025146484375, -6.78436279296875, -6.5435791015625, -6.30279541015625, -6.06201171875, -5.82122802734375, -5.5804443359375, -5.33966064453125, -5.098876953125, -4.85809326171875, -4.6173095703125, -4.37652587890625, -4.1357421875, -3.89495849609375, -3.6541748046875, -3.41339111328125, -3.172607421875, -2.93182373046875, -2.6910400390625, -2.45025634765625, -2.20947265625, -1.96868896484375, -1.7279052734375, -1.48712158203125, -1.246337890625, -1.00555419921875, -0.7647705078125, -0.52398681640625, -0.283203125, -0.04241943359375, 0.1983642578125, 0.43914794921875, 0.679931640625, 0.92071533203125, 1.1614990234375, 1.40228271484375, 1.64306640625, 1.88385009765625, 2.1246337890625, 2.36541748046875, 2.606201171875, 2.84698486328125, 3.0877685546875, 3.32855224609375, 3.5693359375, 3.81011962890625, 4.0509033203125, 4.29168701171875, 4.532470703125, 4.77325439453125, 5.0140380859375, 5.25482177734375, 5.49560546875, 5.73638916015625, 5.9771728515625, 6.21795654296875, 6.458740234375, 6.69952392578125, 6.9403076171875, 7.18109130859375, 7.421875]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 3.0, 8.0, 13.0, 11.0, 25.0, 35.0, 55.0, 87.0, 112.0, 173.0, 273.0, 388.0, 578.0, 807.0, 1263.0, 1872.0, 2897.0, 4359.0, 6648.0, 10513.0, 16537.0, 27490.0, 45789.0, 77779.0, 125617.0, 180698.0, 187633.0, 138032.0, 86117.0, 51082.0, 30249.0, 18225.0, 11575.0, 7461.0, 4786.0, 3103.0, 2069.0, 1436.0, 905.0, 598.0, 422.0, 270.0, 185.0, 126.0, 102.0, 53.0, 34.0, 23.0, 16.0, 12.0, 7.0, 3.0, 4.0, 0.0, 1.0, 1.0, 4.0], "bins": [-0.78369140625, -0.7600173950195312, -0.7363433837890625, -0.7126693725585938, -0.688995361328125, -0.6653213500976562, -0.6416473388671875, -0.6179733276367188, -0.59429931640625, -0.5706253051757812, -0.5469512939453125, -0.5232772827148438, -0.499603271484375, -0.47592926025390625, -0.4522552490234375, -0.42858123779296875, -0.4049072265625, -0.38123321533203125, -0.3575592041015625, -0.33388519287109375, -0.310211181640625, -0.28653717041015625, -0.2628631591796875, -0.23918914794921875, -0.21551513671875, -0.19184112548828125, -0.1681671142578125, -0.14449310302734375, -0.120819091796875, -0.09714508056640625, -0.0734710693359375, -0.04979705810546875, -0.026123046875, -0.00244903564453125, 0.0212249755859375, 0.04489898681640625, 0.068572998046875, 0.09224700927734375, 0.1159210205078125, 0.13959503173828125, 0.16326904296875, 0.18694305419921875, 0.2106170654296875, 0.23429107666015625, 0.257965087890625, 0.28163909912109375, 0.3053131103515625, 0.32898712158203125, 0.3526611328125, 0.37633514404296875, 0.4000091552734375, 0.42368316650390625, 0.447357177734375, 0.47103118896484375, 0.4947052001953125, 0.5183792114257812, 0.54205322265625, 0.5657272338867188, 0.5894012451171875, 0.6130752563476562, 0.636749267578125, 0.6604232788085938, 0.6840972900390625, 0.7077713012695312, 0.7314453125]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 5.0, 2.0, 8.0, 9.0, 4.0, 6.0, 12.0, 15.0, 13.0, 17.0, 19.0, 18.0, 22.0, 29.0, 37.0, 27.0, 37.0, 35.0, 36.0, 34.0, 32.0, 27.0, 30.0, 1058.0, 48.0, 45.0, 43.0, 29.0, 31.0, 32.0, 22.0, 25.0, 22.0, 39.0, 12.0, 20.0, 16.0, 16.0, 13.0, 16.0, 10.0, 14.0, 12.0, 7.0, 8.0, 7.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0], "bins": [-5.09765625, -4.94769287109375, -4.7977294921875, -4.64776611328125, -4.497802734375, -4.34783935546875, -4.1978759765625, -4.04791259765625, -3.89794921875, -3.74798583984375, -3.5980224609375, -3.44805908203125, -3.298095703125, -3.14813232421875, -2.9981689453125, -2.84820556640625, -2.6982421875, -2.54827880859375, -2.3983154296875, -2.24835205078125, -2.098388671875, -1.94842529296875, -1.7984619140625, -1.64849853515625, -1.49853515625, -1.34857177734375, -1.1986083984375, -1.04864501953125, -0.898681640625, -0.74871826171875, -0.5987548828125, -0.44879150390625, -0.298828125, -0.14886474609375, 0.0010986328125, 0.15106201171875, 0.301025390625, 0.45098876953125, 0.6009521484375, 0.75091552734375, 0.90087890625, 1.05084228515625, 1.2008056640625, 1.35076904296875, 1.500732421875, 1.65069580078125, 1.8006591796875, 1.95062255859375, 2.1005859375, 2.25054931640625, 2.4005126953125, 2.55047607421875, 2.700439453125, 2.85040283203125, 3.0003662109375, 3.15032958984375, 3.30029296875, 3.45025634765625, 3.6002197265625, 3.75018310546875, 3.900146484375, 4.05010986328125, 4.2000732421875, 4.35003662109375, 4.5]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 5.0, 7.0, 10.0, 14.0, 20.0, 37.0, 49.0, 76.0, 140.0, 241.0, 399.0, 676.0, 1133.0, 2069.0, 3348.0, 6072.0, 10639.0, 18910.0, 34426.0, 62684.0, 114473.0, 185902.0, 1267125.0, 168168.0, 99536.0, 54339.0, 29228.0, 15987.0, 9276.0, 5073.0, 3015.0, 1668.0, 983.0, 542.0, 336.0, 195.0, 135.0, 79.0, 44.0, 29.0, 15.0, 14.0, 13.0, 4.0, 2.0, 3.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64697265625, -0.6224441528320312, -0.5979156494140625, -0.5733871459960938, -0.548858642578125, -0.5243301391601562, -0.4998016357421875, -0.47527313232421875, -0.45074462890625, -0.42621612548828125, -0.4016876220703125, -0.37715911865234375, -0.352630615234375, -0.32810211181640625, -0.3035736083984375, -0.27904510498046875, -0.2545166015625, -0.22998809814453125, -0.2054595947265625, -0.18093109130859375, -0.156402587890625, -0.13187408447265625, -0.1073455810546875, -0.08281707763671875, -0.05828857421875, -0.03376007080078125, -0.0092315673828125, 0.01529693603515625, 0.039825439453125, 0.06435394287109375, 0.0888824462890625, 0.11341094970703125, 0.137939453125, 0.16246795654296875, 0.1869964599609375, 0.21152496337890625, 0.236053466796875, 0.26058197021484375, 0.2851104736328125, 0.30963897705078125, 0.33416748046875, 0.35869598388671875, 0.3832244873046875, 0.40775299072265625, 0.432281494140625, 0.45680999755859375, 0.4813385009765625, 0.5058670043945312, 0.5303955078125, 0.5549240112304688, 0.5794525146484375, 0.6039810180664062, 0.628509521484375, 0.6530380249023438, 0.6775665283203125, 0.7020950317382812, 0.72662353515625, 0.7511520385742188, 0.7756805419921875, 0.8002090454101562, 0.824737548828125, 0.8492660522460938, 0.8737945556640625, 0.8983230590820312, 0.9228515625]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 3.0, 0.0, 4.0, 7.0, 4.0, 3.0, 8.0, 10.0, 13.0, 22.0, 12.0, 21.0, 26.0, 25.0, 31.0, 51.0, 43.0, 34.0, 52.0, 58.0, 64.0, 51.0, 56.0, 53.0, 48.0, 44.0, 52.0, 30.0, 28.0, 28.0, 22.0, 18.0, 17.0, 13.0, 12.0, 11.0, 8.0, 10.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.0026569366455078125, -0.0025802552700042725, -0.0025035738945007324, -0.0024268925189971924, -0.0023502111434936523, -0.0022735297679901123, -0.0021968483924865723, -0.0021201670169830322, -0.002043485641479492, -0.001966804265975952, -0.0018901228904724121, -0.001813441514968872, -0.001736760139465332, -0.001660078763961792, -0.001583397388458252, -0.001506716012954712, -0.0014300346374511719, -0.0013533532619476318, -0.0012766718864440918, -0.0011999905109405518, -0.0011233091354370117, -0.0010466277599334717, -0.0009699463844299316, -0.0008932650089263916, -0.0008165836334228516, -0.0007399022579193115, -0.0006632208824157715, -0.0005865395069122314, -0.0005098581314086914, -0.00043317675590515137, -0.00035649538040161133, -0.0002798140048980713, -0.00020313262939453125, -0.0001264512538909912, -4.976987838745117e-05, 2.6911497116088867e-05, 0.0001035928726196289, 0.00018027424812316895, 0.000256955623626709, 0.000333636999130249, 0.00041031837463378906, 0.0004869997501373291, 0.0005636811256408691, 0.0006403625011444092, 0.0007170438766479492, 0.0007937252521514893, 0.0008704066276550293, 0.0009470880031585693, 0.0010237693786621094, 0.0011004507541656494, 0.0011771321296691895, 0.0012538135051727295, 0.0013304948806762695, 0.0014071762561798096, 0.0014838576316833496, 0.0015605390071868896, 0.0016372203826904297, 0.0017139017581939697, 0.0017905831336975098, 0.0018672645092010498, 0.0019439458847045898, 0.00202062726020813, 0.00209730863571167, 0.00217399001121521, 0.00225067138671875]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 2.0, 1.0, 0.0, 5.0, 4.0, 5.0, 4.0, 5.0, 12.0, 17.0, 22.0, 20.0, 30.0, 51.0, 59.0, 61.0, 79.0, 123.0, 207.0, 364.0, 721.0, 13790.0, 1022870.0, 8244.0, 686.0, 406.0, 192.0, 140.0, 94.0, 83.0, 61.0, 38.0, 37.0, 31.0, 19.0, 16.0, 15.0, 10.0, 9.0, 3.0, 7.0, 4.0, 3.0, 4.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.04779052734375, -0.04616832733154297, -0.04454612731933594, -0.042923927307128906, -0.041301727294921875, -0.039679527282714844, -0.03805732727050781, -0.03643512725830078, -0.03481292724609375, -0.03319072723388672, -0.03156852722167969, -0.029946327209472656, -0.028324127197265625, -0.026701927185058594, -0.025079727172851562, -0.02345752716064453, -0.0218353271484375, -0.02021312713623047, -0.018590927124023438, -0.016968727111816406, -0.015346527099609375, -0.013724327087402344, -0.012102127075195312, -0.010479927062988281, -0.00885772705078125, -0.007235527038574219, -0.0056133270263671875, -0.003991127014160156, -0.002368927001953125, -0.0007467269897460938, 0.0008754730224609375, 0.0024976730346679688, 0.004119873046875, 0.005742073059082031, 0.0073642730712890625, 0.008986473083496094, 0.010608673095703125, 0.012230873107910156, 0.013853073120117188, 0.015475273132324219, 0.01709747314453125, 0.01871967315673828, 0.020341873168945312, 0.021964073181152344, 0.023586273193359375, 0.025208473205566406, 0.026830673217773438, 0.02845287322998047, 0.0300750732421875, 0.03169727325439453, 0.03331947326660156, 0.034941673278808594, 0.036563873291015625, 0.038186073303222656, 0.03980827331542969, 0.04143047332763672, 0.04305267333984375, 0.04467487335205078, 0.04629707336425781, 0.047919273376464844, 0.049541473388671875, 0.051163673400878906, 0.05278587341308594, 0.05440807342529297, 0.0560302734375]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 384.0, 629.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03326241672039032, -0.032689839601516724, -0.03211726248264313, -0.03154468536376953, -0.030972106382250786, -0.03039952926337719, -0.029826950281858444, -0.029254373162984848, -0.028681796044111252, -0.028109218925237656, -0.02753664180636406, -0.026964062824845314, -0.026391485705971718, -0.02581890858709812, -0.025246329605579376, -0.02467375248670578, -0.024101175367832184, -0.023528598248958588, -0.02295602113008499, -0.022383442148566246, -0.02181086502969265, -0.021238287910819054, -0.020665708929300308, -0.020093131810426712, -0.019520554691553116, -0.01894797757267952, -0.018375400453805923, -0.017802821472287178, -0.017230244353413582, -0.016657667234539986, -0.01608508825302124, -0.015512511134147644, -0.014939934015274048, -0.014367356896400452, -0.01379477884620428, -0.01322220079600811, -0.012649623677134514, -0.012077046558260918, -0.011504468508064747, -0.010931890457868576, -0.01035931333899498, -0.009786736220121384, -0.009214158169925213, -0.008641580119729042, -0.008069003000855446, -0.007496425416320562, -0.006923847831785679, -0.006351270247250795, -0.005778692662715912, -0.005206115078181028, -0.004633537493646145, -0.004060959909111261, -0.003488382324576378, -0.0029158047400414944, -0.002343227155506611, -0.0017706495709717274, -0.0011980719864368439, -0.0006254944019019604, -5.2916817367076874e-05, 0.0005196607671678066, 0.0010922383517026901, 0.0016648159362375736, 0.002237393520772457, 0.0028099711053073406, 0.003382548689842224]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 0.0, 2.0, 5.0, 5.0, 5.0, 4.0, 2.0, 4.0, 12.0, 9.0, 15.0, 9.0, 19.0, 14.0, 27.0, 24.0, 23.0, 26.0, 26.0, 37.0, 28.0, 42.0, 32.0, 36.0, 51.0, 32.0, 31.0, 34.0, 34.0, 43.0, 31.0, 46.0, 34.0, 32.0, 39.0, 25.0, 24.0, 25.0, 22.0, 14.0, 11.0, 20.0, 13.0, 9.0, 3.0, 4.0, 4.0, 4.0, 7.0, 2.0, 4.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0011951327323913574, -0.0011548642069101334, -0.0011145956814289093, -0.0010743271559476852, -0.0010340586304664612, -0.0009937901049852371, -0.0009535215795040131, -0.000913253054022789, -0.0008729845285415649, -0.0008327160030603409, -0.0007924474775791168, -0.0007521789520978928, -0.0007119104266166687, -0.0006716419011354446, -0.0006313733756542206, -0.0005911048501729965, -0.0005508363246917725, -0.0005105677992105484, -0.00047029927372932434, -0.0004300307482481003, -0.0003897622227668762, -0.00034949369728565216, -0.0003092251718044281, -0.00026895664632320404, -0.00022868812084197998, -0.00018841959536075592, -0.00014815106987953186, -0.0001078825443983078, -6.761401891708374e-05, -2.734549343585968e-05, 1.292303204536438e-05, 5.319155752658844e-05, 9.34600830078125e-05, 0.00013372860848903656, 0.00017399713397026062, 0.00021426565945148468, 0.00025453418493270874, 0.0002948027104139328, 0.00033507123589515686, 0.0003753397613763809, 0.000415608286857605, 0.00045587681233882904, 0.0004961453378200531, 0.0005364138633012772, 0.0005766823887825012, 0.0006169509142637253, 0.0006572194397449493, 0.0006974879652261734, 0.0007377564907073975, 0.0007780250161886215, 0.0008182935416698456, 0.0008585620671510696, 0.0008988305926322937, 0.0009390991181135178, 0.0009793676435947418, 0.0010196361690759659, 0.00105990469455719, 0.001100173220038414, 0.001140441745519638, 0.0011807102710008621, 0.0012209787964820862, 0.0012612473219633102, 0.0013015158474445343, 0.0013417843729257584, 0.0013820528984069824]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 5.0, 4.0, 9.0, 6.0, 8.0, 10.0, 7.0, 9.0, 13.0, 24.0, 21.0, 30.0, 20.0, 21.0, 35.0, 33.0, 20.0, 28.0, 37.0, 33.0, 40.0, 31.0, 38.0, 44.0, 52.0, 34.0, 35.0, 41.0, 36.0, 26.0, 29.0, 32.0, 32.0, 26.0, 17.0, 22.0, 12.0, 13.0, 13.0, 17.0, 6.0, 9.0, 8.0, 0.0, 8.0, 3.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-7.98828125, -7.74749755859375, -7.5067138671875, -7.26593017578125, -7.025146484375, -6.78436279296875, -6.5435791015625, -6.30279541015625, -6.06201171875, -5.82122802734375, -5.5804443359375, -5.33966064453125, -5.098876953125, -4.85809326171875, -4.6173095703125, -4.37652587890625, -4.1357421875, -3.89495849609375, -3.6541748046875, -3.41339111328125, -3.172607421875, -2.93182373046875, -2.6910400390625, -2.45025634765625, -2.20947265625, -1.96868896484375, -1.7279052734375, -1.48712158203125, -1.246337890625, -1.00555419921875, -0.7647705078125, -0.52398681640625, -0.283203125, -0.04241943359375, 0.1983642578125, 0.43914794921875, 0.679931640625, 0.92071533203125, 1.1614990234375, 1.40228271484375, 1.64306640625, 1.88385009765625, 2.1246337890625, 2.36541748046875, 2.606201171875, 2.84698486328125, 3.0877685546875, 3.32855224609375, 3.5693359375, 3.81011962890625, 4.0509033203125, 4.29168701171875, 4.532470703125, 4.77325439453125, 5.0140380859375, 5.25482177734375, 5.49560546875, 5.73638916015625, 5.9771728515625, 6.21795654296875, 6.458740234375, 6.69952392578125, 6.9403076171875, 7.18109130859375, 7.421875]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 6.0, 10.0, 17.0, 21.0, 24.0, 27.0, 33.0, 48.0, 74.0, 63.0, 111.0, 139.0, 211.0, 332.0, 493.0, 843.0, 1348.0, 2466.0, 4636.0, 9339.0, 20285.0, 50197.0, 149602.0, 449801.0, 233637.0, 71506.0, 27493.0, 12309.0, 5860.0, 3127.0, 1719.0, 962.0, 597.0, 333.0, 265.0, 149.0, 127.0, 83.0, 65.0, 43.0, 36.0, 30.0, 23.0, 16.0, 13.0, 10.0, 12.0, 6.0, 8.0, 4.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-10.0, -9.6939697265625, -9.387939453125, -9.0819091796875, -8.77587890625, -8.4698486328125, -8.163818359375, -7.8577880859375, -7.5517578125, -7.2457275390625, -6.939697265625, -6.6336669921875, -6.32763671875, -6.0216064453125, -5.715576171875, -5.4095458984375, -5.103515625, -4.7974853515625, -4.491455078125, -4.1854248046875, -3.87939453125, -3.5733642578125, -3.267333984375, -2.9613037109375, -2.6552734375, -2.3492431640625, -2.043212890625, -1.7371826171875, -1.43115234375, -1.1251220703125, -0.819091796875, -0.5130615234375, -0.20703125, 0.0989990234375, 0.405029296875, 0.7110595703125, 1.01708984375, 1.3231201171875, 1.629150390625, 1.9351806640625, 2.2412109375, 2.5472412109375, 2.853271484375, 3.1593017578125, 3.46533203125, 3.7713623046875, 4.077392578125, 4.3834228515625, 4.689453125, 4.9954833984375, 5.301513671875, 5.6075439453125, 5.91357421875, 6.2196044921875, 6.525634765625, 6.8316650390625, 7.1376953125, 7.4437255859375, 7.749755859375, 8.0557861328125, 8.36181640625, 8.6678466796875, 8.973876953125, 9.2799072265625, 9.5859375]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 5.0, 4.0, 2.0, 6.0, 9.0, 7.0, 9.0, 12.0, 9.0, 14.0, 19.0, 9.0, 21.0, 21.0, 27.0, 25.0, 31.0, 30.0, 32.0, 31.0, 50.0, 60.0, 95.0, 129.0, 1395.0, 350.0, 137.0, 83.0, 63.0, 36.0, 50.0, 39.0, 34.0, 26.0, 34.0, 26.0, 15.0, 18.0, 15.0, 14.0, 13.0, 9.0, 8.0, 10.0, 6.0, 3.0, 5.0, 1.0, 5.0, 5.0, 0.0, 1.0, 2.0, 2.0], "bins": [-23.625, -22.949951171875, -22.27490234375, -21.599853515625, -20.9248046875, -20.249755859375, -19.57470703125, -18.899658203125, -18.224609375, -17.549560546875, -16.87451171875, -16.199462890625, -15.5244140625, -14.849365234375, -14.17431640625, -13.499267578125, -12.82421875, -12.149169921875, -11.47412109375, -10.799072265625, -10.1240234375, -9.448974609375, -8.77392578125, -8.098876953125, -7.423828125, -6.748779296875, -6.07373046875, -5.398681640625, -4.7236328125, -4.048583984375, -3.37353515625, -2.698486328125, -2.0234375, -1.348388671875, -0.67333984375, 0.001708984375, 0.6767578125, 1.351806640625, 2.02685546875, 2.701904296875, 3.376953125, 4.052001953125, 4.72705078125, 5.402099609375, 6.0771484375, 6.752197265625, 7.42724609375, 8.102294921875, 8.77734375, 9.452392578125, 10.12744140625, 10.802490234375, 11.4775390625, 12.152587890625, 12.82763671875, 13.502685546875, 14.177734375, 14.852783203125, 15.52783203125, 16.202880859375, 16.8779296875, 17.552978515625, 18.22802734375, 18.903076171875, 19.578125]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 4.0, 5.0, 3.0, 9.0, 11.0, 18.0, 18.0, 22.0, 26.0, 41.0, 64.0, 73.0, 112.0, 130.0, 187.0, 335.0, 663.0, 2539.0, 29079.0, 2437870.0, 655548.0, 15727.0, 1681.0, 533.0, 278.0, 220.0, 134.0, 81.0, 78.0, 60.0, 31.0, 31.0, 19.0, 22.0, 11.0, 9.0, 13.0, 9.0, 6.0, 4.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.71875, -32.5517578125, -31.384765625, -30.2177734375, -29.05078125, -27.8837890625, -26.716796875, -25.5498046875, -24.3828125, -23.2158203125, -22.048828125, -20.8818359375, -19.71484375, -18.5478515625, -17.380859375, -16.2138671875, -15.046875, -13.8798828125, -12.712890625, -11.5458984375, -10.37890625, -9.2119140625, -8.044921875, -6.8779296875, -5.7109375, -4.5439453125, -3.376953125, -2.2099609375, -1.04296875, 0.1240234375, 1.291015625, 2.4580078125, 3.625, 4.7919921875, 5.958984375, 7.1259765625, 8.29296875, 9.4599609375, 10.626953125, 11.7939453125, 12.9609375, 14.1279296875, 15.294921875, 16.4619140625, 17.62890625, 18.7958984375, 19.962890625, 21.1298828125, 22.296875, 23.4638671875, 24.630859375, 25.7978515625, 26.96484375, 28.1318359375, 29.298828125, 30.4658203125, 31.6328125, 32.7998046875, 33.966796875, 35.1337890625, 36.30078125, 37.4677734375, 38.634765625, 39.8017578125, 40.96875]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 35.0, 796.0, 183.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.10650634765625, -46.885040283203125, -38.663578033447266, -30.442113876342773, -22.22064971923828, -13.999183654785156, -5.777721405029297, 2.4437408447265625, 10.665206909179688, 18.88667106628418, 27.108135223388672, 35.32959747314453, 43.551063537597656, 51.77252960205078, 59.99399185180664, 68.2154541015625, 76.43692016601562, 84.65838623046875, 92.87985229492188, 101.10131072998047, 109.3227767944336, 117.54424285888672, 125.76570129394531, 133.98716735839844, 142.20863342285156, 150.4300994873047, 158.6515655517578, 166.87303161621094, 175.094482421875, 183.31594848632812, 191.53741455078125, 199.75888061523438, 207.98031616210938, 216.2017822265625, 224.42324829101562, 232.64471435546875, 240.86618041992188, 249.087646484375, 257.3091125488281, 265.53057861328125, 273.75201416015625, 281.9734802246094, 290.1949462890625, 298.4164123535156, 306.63787841796875, 314.8593444824219, 323.080810546875, 331.30224609375, 339.52374267578125, 347.7452087402344, 355.9666748046875, 364.1881408691406, 372.40960693359375, 380.6310729980469, 388.8525390625, 397.073974609375, 405.29547119140625, 413.5169372558594, 421.7384033203125, 429.9598693847656, 438.18133544921875, 446.4028015136719, 454.624267578125, 462.845703125, 471.0671691894531]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 4.0, 4.0, 1.0, 6.0, 9.0, 8.0, 7.0, 9.0, 16.0, 22.0, 11.0, 21.0, 20.0, 29.0, 26.0, 31.0, 35.0, 44.0, 37.0, 35.0, 49.0, 52.0, 44.0, 39.0, 52.0, 41.0, 40.0, 39.0, 33.0, 30.0, 29.0, 33.0, 22.0, 19.0, 20.0, 15.0, 14.0, 12.0, 8.0, 9.0, 9.0, 6.0, 5.0, 6.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.40476608276367, -55.64702224731445, -53.88927459716797, -52.13153076171875, -50.373783111572266, -48.61603927612305, -46.85829162597656, -45.100547790527344, -43.342803955078125, -41.585060119628906, -39.82731246948242, -38.0695686340332, -36.31182098388672, -34.5540771484375, -32.79633331298828, -31.038585662841797, -29.280838012695312, -27.52309226989746, -25.76534652709961, -24.00760269165039, -22.249855041503906, -20.492111206054688, -18.734365463256836, -16.976619720458984, -15.218873977661133, -13.461128234863281, -11.70338249206543, -9.945637702941895, -8.187891960144043, -6.430146217346191, -4.672401428222656, -2.9146556854248047, -1.1569061279296875, 0.600839376449585, 2.3585848808288574, 4.116330146789551, 5.874075889587402, 7.631821632385254, 9.389566421508789, 11.14731216430664, 12.905057907104492, 14.662803649902344, 16.420549392700195, 18.178295135498047, 19.936038970947266, 21.69378662109375, 23.45153045654297, 25.20927619934082, 26.967021942138672, 28.724767684936523, 30.482513427734375, 32.240257263183594, 33.99800491333008, 35.7557487487793, 37.51349639892578, 39.271240234375, 41.02898406982422, 42.78672790527344, 44.54447555541992, 46.30221939086914, 48.059967041015625, 49.817710876464844, 51.57545471191406, 53.33320236206055, 55.09095001220703]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 6.0, 4.0, 3.0, 12.0, 9.0, 21.0, 17.0, 19.0, 22.0, 25.0, 29.0, 23.0, 25.0, 33.0, 28.0, 46.0, 38.0, 41.0, 43.0, 43.0, 40.0, 47.0, 44.0, 44.0, 32.0, 27.0, 38.0, 37.0, 28.0, 26.0, 21.0, 33.0, 15.0, 22.0, 16.0, 13.0, 7.0, 6.0, 7.0, 5.0, 3.0, 5.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.2109375, -8.9339599609375, -8.656982421875, -8.3800048828125, -8.10302734375, -7.8260498046875, -7.549072265625, -7.2720947265625, -6.9951171875, -6.7181396484375, -6.441162109375, -6.1641845703125, -5.88720703125, -5.6102294921875, -5.333251953125, -5.0562744140625, -4.779296875, -4.5023193359375, -4.225341796875, -3.9483642578125, -3.67138671875, -3.3944091796875, -3.117431640625, -2.8404541015625, -2.5634765625, -2.2864990234375, -2.009521484375, -1.7325439453125, -1.45556640625, -1.1785888671875, -0.901611328125, -0.6246337890625, -0.34765625, -0.0706787109375, 0.206298828125, 0.4832763671875, 0.76025390625, 1.0372314453125, 1.314208984375, 1.5911865234375, 1.8681640625, 2.1451416015625, 2.422119140625, 2.6990966796875, 2.97607421875, 3.2530517578125, 3.530029296875, 3.8070068359375, 4.083984375, 4.3609619140625, 4.637939453125, 4.9149169921875, 5.19189453125, 5.4688720703125, 5.745849609375, 6.0228271484375, 6.2998046875, 6.5767822265625, 6.853759765625, 7.1307373046875, 7.40771484375, 7.6846923828125, 7.961669921875, 8.2386474609375, 8.515625]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 7.0, 11.0, 6.0, 10.0, 8.0, 13.0, 11.0, 20.0, 12.0, 32.0, 43.0, 57.0, 106.0, 182.0, 334.0, 834.0, 2442.0, 9080.0, 54723.0, 568365.0, 2512924.0, 937964.0, 88965.0, 12972.0, 3087.0, 1043.0, 459.0, 197.0, 125.0, 60.0, 44.0, 32.0, 13.0, 8.0, 11.0, 15.0, 17.0, 11.0, 13.0, 5.0, 7.0, 7.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.515625, -15.0087890625, -14.501953125, -13.9951171875, -13.48828125, -12.9814453125, -12.474609375, -11.9677734375, -11.4609375, -10.9541015625, -10.447265625, -9.9404296875, -9.43359375, -8.9267578125, -8.419921875, -7.9130859375, -7.40625, -6.8994140625, -6.392578125, -5.8857421875, -5.37890625, -4.8720703125, -4.365234375, -3.8583984375, -3.3515625, -2.8447265625, -2.337890625, -1.8310546875, -1.32421875, -0.8173828125, -0.310546875, 0.1962890625, 0.703125, 1.2099609375, 1.716796875, 2.2236328125, 2.73046875, 3.2373046875, 3.744140625, 4.2509765625, 4.7578125, 5.2646484375, 5.771484375, 6.2783203125, 6.78515625, 7.2919921875, 7.798828125, 8.3056640625, 8.8125, 9.3193359375, 9.826171875, 10.3330078125, 10.83984375, 11.3466796875, 11.853515625, 12.3603515625, 12.8671875, 13.3740234375, 13.880859375, 14.3876953125, 14.89453125, 15.4013671875, 15.908203125, 16.4150390625, 16.921875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 9.0, 9.0, 10.0, 16.0, 16.0, 20.0, 33.0, 49.0, 64.0, 82.0, 119.0, 189.0, 310.0, 443.0, 542.0, 541.0, 484.0, 382.0, 236.0, 163.0, 105.0, 72.0, 48.0, 29.0, 25.0, 16.0, 15.0, 11.0, 7.0, 9.0, 3.0, 5.0, 3.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.953125, -15.5233154296875, -15.093505859375, -14.6636962890625, -14.23388671875, -13.8040771484375, -13.374267578125, -12.9444580078125, -12.5146484375, -12.0848388671875, -11.655029296875, -11.2252197265625, -10.79541015625, -10.3656005859375, -9.935791015625, -9.5059814453125, -9.076171875, -8.6463623046875, -8.216552734375, -7.7867431640625, -7.35693359375, -6.9271240234375, -6.497314453125, -6.0675048828125, -5.6376953125, -5.2078857421875, -4.778076171875, -4.3482666015625, -3.91845703125, -3.4886474609375, -3.058837890625, -2.6290283203125, -2.19921875, -1.7694091796875, -1.339599609375, -0.9097900390625, -0.47998046875, -0.0501708984375, 0.379638671875, 0.8094482421875, 1.2392578125, 1.6690673828125, 2.098876953125, 2.5286865234375, 2.95849609375, 3.3883056640625, 3.818115234375, 4.2479248046875, 4.677734375, 5.1075439453125, 5.537353515625, 5.9671630859375, 6.39697265625, 6.8267822265625, 7.256591796875, 7.6864013671875, 8.1162109375, 8.5460205078125, 8.975830078125, 9.4056396484375, 9.83544921875, 10.2652587890625, 10.695068359375, 11.1248779296875, 11.5546875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 4.0, 2.0, 5.0, 6.0, 4.0, 16.0, 24.0, 25.0, 37.0, 36.0, 77.0, 101.0, 189.0, 306.0, 592.0, 1266.0, 3140.0, 10246.0, 48035.0, 394895.0, 3131243.0, 528243.0, 58070.0, 11436.0, 3513.0, 1290.0, 606.0, 326.0, 158.0, 127.0, 73.0, 60.0, 39.0, 20.0, 18.0, 21.0, 11.0, 6.0, 6.0, 9.0, 4.0, 0.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-24.0, -23.324951171875, -22.64990234375, -21.974853515625, -21.2998046875, -20.624755859375, -19.94970703125, -19.274658203125, -18.599609375, -17.924560546875, -17.24951171875, -16.574462890625, -15.8994140625, -15.224365234375, -14.54931640625, -13.874267578125, -13.19921875, -12.524169921875, -11.84912109375, -11.174072265625, -10.4990234375, -9.823974609375, -9.14892578125, -8.473876953125, -7.798828125, -7.123779296875, -6.44873046875, -5.773681640625, -5.0986328125, -4.423583984375, -3.74853515625, -3.073486328125, -2.3984375, -1.723388671875, -1.04833984375, -0.373291015625, 0.3017578125, 0.976806640625, 1.65185546875, 2.326904296875, 3.001953125, 3.677001953125, 4.35205078125, 5.027099609375, 5.7021484375, 6.377197265625, 7.05224609375, 7.727294921875, 8.40234375, 9.077392578125, 9.75244140625, 10.427490234375, 11.1025390625, 11.777587890625, 12.45263671875, 13.127685546875, 13.802734375, 14.477783203125, 15.15283203125, 15.827880859375, 16.5029296875, 17.177978515625, 17.85302734375, 18.528076171875, 19.203125]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 14.0, 148.0, 535.0, 279.0, 35.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-416.5489807128906, -409.1947021484375, -401.84039306640625, -394.4861145019531, -387.1318359375, -379.7775573730469, -372.4232482910156, -365.0689697265625, -357.7146911621094, -350.36041259765625, -343.006103515625, -335.6518249511719, -328.29754638671875, -320.9432678222656, -313.5889587402344, -306.23468017578125, -298.8804016113281, -291.526123046875, -284.17181396484375, -276.8175354003906, -269.4632568359375, -262.1089782714844, -254.7546844482422, -247.400390625, -240.0460968017578, -232.69180297851562, -225.3375244140625, -217.9832305908203, -210.6289520263672, -203.274658203125, -195.92037963867188, -188.5660858154297, -181.21182250976562, -173.85752868652344, -166.5032501220703, -159.14895629882812, -151.794677734375, -144.4403839111328, -137.0861053466797, -129.7318115234375, -122.37751770019531, -115.02323150634766, -107.6689453125, -100.31465911865234, -92.96037292480469, -85.6060791015625, -78.25180053710938, -70.89750671386719, -63.54322814941406, -56.188941955566406, -48.83465576171875, -41.480369567871094, -34.12608337402344, -26.771793365478516, -19.41750717163086, -12.063220977783203, -4.708934783935547, 2.6453518867492676, 9.999638557434082, 17.353925704956055, 24.70821189880371, 32.0625, 39.416786193847656, 46.77107238769531, 54.12535858154297]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 6.0, 6.0, 5.0, 8.0, 7.0, 8.0, 9.0, 18.0, 13.0, 14.0, 19.0, 22.0, 20.0, 29.0, 18.0, 22.0, 32.0, 29.0, 23.0, 40.0, 33.0, 27.0, 39.0, 44.0, 31.0, 38.0, 33.0, 37.0, 33.0, 31.0, 31.0, 34.0, 29.0, 27.0, 22.0, 10.0, 13.0, 25.0, 17.0, 10.0, 15.0, 17.0, 6.0, 10.0, 10.0, 10.0, 6.0, 6.0, 4.0, 5.0, 3.0, 0.0, 2.0, 1.0], "bins": [-40.50442886352539, -39.3116340637207, -38.118839263916016, -36.92604446411133, -35.733253479003906, -34.54045867919922, -33.34766387939453, -32.154869079589844, -30.962074279785156, -29.76927947998047, -28.57648468017578, -27.383691787719727, -26.19089698791504, -24.99810218811035, -23.805309295654297, -22.61251449584961, -21.419719696044922, -20.226924896240234, -19.034130096435547, -17.841337203979492, -16.648542404174805, -15.455747604370117, -14.262953758239746, -13.070159912109375, -11.877365112304688, -10.6845703125, -9.491776466369629, -8.298982620239258, -7.10618782043457, -5.913393497467041, -4.720599174499512, -3.5278053283691406, -2.3350067138671875, -1.1422123908996582, 0.050581932067871094, 1.2433762550354004, 2.4361705780029297, 3.628964900970459, 4.821759223937988, 6.014553070068359, 7.207347869873047, 8.400142669677734, 9.592936515808105, 10.785730361938477, 11.978525161743164, 13.171319961547852, 14.364113807678223, 15.556907653808594, 16.74970245361328, 17.94249725341797, 19.135292053222656, 20.32808494567871, 21.5208797454834, 22.713674545288086, 23.90646743774414, 25.099262237548828, 26.292057037353516, 27.484851837158203, 28.67764663696289, 29.870439529418945, 31.063234329223633, 32.25602722167969, 33.448822021484375, 34.64161682128906, 35.83441162109375]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 6.0, 7.0, 8.0, 11.0, 7.0, 10.0, 23.0, 18.0, 15.0, 30.0, 27.0, 23.0, 30.0, 28.0, 38.0, 42.0, 44.0, 44.0, 36.0, 49.0, 47.0, 43.0, 36.0, 42.0, 45.0, 33.0, 31.0, 29.0, 27.0, 19.0, 19.0, 15.0, 19.0, 25.0, 21.0, 9.0, 11.0, 7.0, 5.0, 8.0, 4.0, 4.0, 5.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.84375, -7.566162109375, -7.28857421875, -7.010986328125, -6.7333984375, -6.455810546875, -6.17822265625, -5.900634765625, -5.623046875, -5.345458984375, -5.06787109375, -4.790283203125, -4.5126953125, -4.235107421875, -3.95751953125, -3.679931640625, -3.40234375, -3.124755859375, -2.84716796875, -2.569580078125, -2.2919921875, -2.014404296875, -1.73681640625, -1.459228515625, -1.181640625, -0.904052734375, -0.62646484375, -0.348876953125, -0.0712890625, 0.206298828125, 0.48388671875, 0.761474609375, 1.0390625, 1.316650390625, 1.59423828125, 1.871826171875, 2.1494140625, 2.427001953125, 2.70458984375, 2.982177734375, 3.259765625, 3.537353515625, 3.81494140625, 4.092529296875, 4.3701171875, 4.647705078125, 4.92529296875, 5.202880859375, 5.48046875, 5.758056640625, 6.03564453125, 6.313232421875, 6.5908203125, 6.868408203125, 7.14599609375, 7.423583984375, 7.701171875, 7.978759765625, 8.25634765625, 8.533935546875, 8.8115234375, 9.089111328125, 9.36669921875, 9.644287109375, 9.921875]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 6.0, 4.0, 7.0, 9.0, 16.0, 24.0, 34.0, 46.0, 81.0, 94.0, 144.0, 253.0, 378.0, 598.0, 887.0, 1258.0, 2032.0, 2954.0, 4723.0, 7385.0, 12134.0, 19599.0, 32958.0, 56667.0, 97436.0, 157743.0, 206309.0, 173490.0, 110339.0, 64559.0, 37459.0, 22044.0, 13378.0, 8400.0, 5302.0, 3348.0, 2209.0, 1472.0, 927.0, 657.0, 436.0, 261.0, 158.0, 111.0, 84.0, 46.0, 35.0, 25.0, 10.0, 13.0, 14.0, 2.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.78369140625, -0.757232666015625, -0.73077392578125, -0.704315185546875, -0.6778564453125, -0.651397705078125, -0.62493896484375, -0.598480224609375, -0.572021484375, -0.545562744140625, -0.51910400390625, -0.492645263671875, -0.4661865234375, -0.439727783203125, -0.41326904296875, -0.386810302734375, -0.3603515625, -0.333892822265625, -0.30743408203125, -0.280975341796875, -0.2545166015625, -0.228057861328125, -0.20159912109375, -0.175140380859375, -0.148681640625, -0.122222900390625, -0.09576416015625, -0.069305419921875, -0.0428466796875, -0.016387939453125, 0.01007080078125, 0.036529541015625, 0.06298828125, 0.089447021484375, 0.11590576171875, 0.142364501953125, 0.1688232421875, 0.195281982421875, 0.22174072265625, 0.248199462890625, 0.274658203125, 0.301116943359375, 0.32757568359375, 0.354034423828125, 0.3804931640625, 0.406951904296875, 0.43341064453125, 0.459869384765625, 0.486328125, 0.512786865234375, 0.53924560546875, 0.565704345703125, 0.5921630859375, 0.618621826171875, 0.64508056640625, 0.671539306640625, 0.697998046875, 0.724456787109375, 0.75091552734375, 0.777374267578125, 0.8038330078125, 0.830291748046875, 0.85675048828125, 0.883209228515625, 0.90966796875]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 11.0, 6.0, 7.0, 18.0, 12.0, 9.0, 19.0, 17.0, 17.0, 24.0, 25.0, 35.0, 29.0, 41.0, 33.0, 46.0, 46.0, 56.0, 32.0, 1072.0, 35.0, 39.0, 46.0, 46.0, 34.0, 29.0, 36.0, 36.0, 33.0, 27.0, 20.0, 23.0, 10.0, 11.0, 5.0, 6.0, 6.0, 4.0, 4.0, 3.0, 5.0, 4.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0], "bins": [-6.69140625, -6.50347900390625, -6.3155517578125, -6.12762451171875, -5.939697265625, -5.75177001953125, -5.5638427734375, -5.37591552734375, -5.18798828125, -5.00006103515625, -4.8121337890625, -4.62420654296875, -4.436279296875, -4.24835205078125, -4.0604248046875, -3.87249755859375, -3.6845703125, -3.49664306640625, -3.3087158203125, -3.12078857421875, -2.932861328125, -2.74493408203125, -2.5570068359375, -2.36907958984375, -2.18115234375, -1.99322509765625, -1.8052978515625, -1.61737060546875, -1.429443359375, -1.24151611328125, -1.0535888671875, -0.86566162109375, -0.677734375, -0.48980712890625, -0.3018798828125, -0.11395263671875, 0.073974609375, 0.26190185546875, 0.4498291015625, 0.63775634765625, 0.82568359375, 1.01361083984375, 1.2015380859375, 1.38946533203125, 1.577392578125, 1.76531982421875, 1.9532470703125, 2.14117431640625, 2.3291015625, 2.51702880859375, 2.7049560546875, 2.89288330078125, 3.080810546875, 3.26873779296875, 3.4566650390625, 3.64459228515625, 3.83251953125, 4.02044677734375, 4.2083740234375, 4.39630126953125, 4.584228515625, 4.77215576171875, 4.9600830078125, 5.14801025390625, 5.3359375]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 8.0, 13.0, 16.0, 38.0, 51.0, 57.0, 94.0, 124.0, 238.0, 356.0, 578.0, 903.0, 1482.0, 2397.0, 3818.0, 6278.0, 10220.0, 17161.0, 28718.0, 49309.0, 82967.0, 132525.0, 219667.0, 1187876.0, 138006.0, 87300.0, 51636.0, 29875.0, 17840.0, 10750.0, 6457.0, 3956.0, 2364.0, 1463.0, 873.0, 614.0, 409.0, 260.0, 158.0, 100.0, 48.0, 48.0, 31.0, 16.0, 13.0, 10.0, 6.0, 3.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.634765625, -0.6136398315429688, -0.5925140380859375, -0.5713882446289062, -0.550262451171875, -0.5291366577148438, -0.5080108642578125, -0.48688507080078125, -0.46575927734375, -0.44463348388671875, -0.4235076904296875, -0.40238189697265625, -0.381256103515625, -0.36013031005859375, -0.3390045166015625, -0.31787872314453125, -0.2967529296875, -0.27562713623046875, -0.2545013427734375, -0.23337554931640625, -0.212249755859375, -0.19112396240234375, -0.1699981689453125, -0.14887237548828125, -0.12774658203125, -0.10662078857421875, -0.0854949951171875, -0.06436920166015625, -0.043243408203125, -0.02211761474609375, -0.0009918212890625, 0.02013397216796875, 0.041259765625, 0.06238555908203125, 0.0835113525390625, 0.10463714599609375, 0.125762939453125, 0.14688873291015625, 0.1680145263671875, 0.18914031982421875, 0.21026611328125, 0.23139190673828125, 0.2525177001953125, 0.27364349365234375, 0.294769287109375, 0.31589508056640625, 0.3370208740234375, 0.35814666748046875, 0.3792724609375, 0.40039825439453125, 0.4215240478515625, 0.44264984130859375, 0.463775634765625, 0.48490142822265625, 0.5060272216796875, 0.5271530151367188, 0.54827880859375, 0.5694046020507812, 0.5905303955078125, 0.6116561889648438, 0.632781982421875, 0.6539077758789062, 0.6750335693359375, 0.6961593627929688, 0.71728515625]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 1.0, 4.0, 4.0, 6.0, 9.0, 9.0, 11.0, 14.0, 21.0, 18.0, 22.0, 32.0, 43.0, 38.0, 47.0, 53.0, 54.0, 56.0, 54.0, 66.0, 58.0, 42.0, 42.0, 57.0, 40.0, 30.0, 27.0, 24.0, 23.0, 21.0, 16.0, 18.0, 6.0, 4.0, 6.0, 6.0, 5.0, 6.0, 5.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0026988983154296875, -0.0026188790798187256, -0.0025388598442077637, -0.0024588406085968018, -0.00237882137298584, -0.002298802137374878, -0.002218782901763916, -0.002138763666152954, -0.002058744430541992, -0.0019787251949310303, -0.0018987059593200684, -0.0018186867237091064, -0.0017386674880981445, -0.0016586482524871826, -0.0015786290168762207, -0.0014986097812652588, -0.0014185905456542969, -0.001338571310043335, -0.001258552074432373, -0.0011785328388214111, -0.0010985136032104492, -0.0010184943675994873, -0.0009384751319885254, -0.0008584558963775635, -0.0007784366607666016, -0.0006984174251556396, -0.0006183981895446777, -0.0005383789539337158, -0.0004583597183227539, -0.000378340482711792, -0.0002983212471008301, -0.00021830201148986816, -0.00013828277587890625, -5.8263540267944336e-05, 2.1755695343017578e-05, 0.00010177493095397949, 0.0001817941665649414, 0.0002618134021759033, 0.00034183263778686523, 0.00042185187339782715, 0.0005018711090087891, 0.000581890344619751, 0.0006619095802307129, 0.0007419288158416748, 0.0008219480514526367, 0.0009019672870635986, 0.0009819865226745605, 0.0010620057582855225, 0.0011420249938964844, 0.0012220442295074463, 0.0013020634651184082, 0.0013820827007293701, 0.001462101936340332, 0.001542121171951294, 0.0016221404075622559, 0.0017021596431732178, 0.0017821788787841797, 0.0018621981143951416, 0.0019422173500061035, 0.0020222365856170654, 0.0021022558212280273, 0.0021822750568389893, 0.002262294292449951, 0.002342313528060913, 0.002422332763671875]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 9.0, 5.0, 6.0, 14.0, 11.0, 11.0, 12.0, 22.0, 21.0, 26.0, 34.0, 38.0, 52.0, 72.0, 77.0, 130.0, 168.0, 233.0, 465.0, 1179.0, 88304.0, 951278.0, 4715.0, 625.0, 336.0, 172.0, 134.0, 85.0, 86.0, 55.0, 33.0, 34.0, 23.0, 22.0, 20.0, 13.0, 11.0, 6.0, 7.0, 6.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.044952392578125, -0.043415069580078125, -0.04187774658203125, -0.040340423583984375, -0.0388031005859375, -0.037265777587890625, -0.03572845458984375, -0.034191131591796875, -0.03265380859375, -0.031116485595703125, -0.02957916259765625, -0.028041839599609375, -0.0265045166015625, -0.024967193603515625, -0.02342987060546875, -0.021892547607421875, -0.020355224609375, -0.018817901611328125, -0.01728057861328125, -0.015743255615234375, -0.0142059326171875, -0.012668609619140625, -0.01113128662109375, -0.009593963623046875, -0.008056640625, -0.006519317626953125, -0.00498199462890625, -0.003444671630859375, -0.0019073486328125, -0.000370025634765625, 0.00116729736328125, 0.002704620361328125, 0.004241943359375, 0.005779266357421875, 0.00731658935546875, 0.008853912353515625, 0.0103912353515625, 0.011928558349609375, 0.01346588134765625, 0.015003204345703125, 0.01654052734375, 0.018077850341796875, 0.01961517333984375, 0.021152496337890625, 0.0226898193359375, 0.024227142333984375, 0.02576446533203125, 0.027301788330078125, 0.028839111328125, 0.030376434326171875, 0.03191375732421875, 0.033451080322265625, 0.0349884033203125, 0.036525726318359375, 0.03806304931640625, 0.039600372314453125, 0.0411376953125, 0.042675018310546875, 0.04421234130859375, 0.045749664306640625, 0.0472869873046875, 0.048824310302734375, 0.05036163330078125, 0.051898956298828125, 0.053436279296875]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 434.0, 582.0], "bins": [-0.04661134257912636, -0.04587218165397644, -0.04513302072882652, -0.044393859803676605, -0.04365469887852669, -0.04291553795337677, -0.04217637702822685, -0.041437216103076935, -0.04069805517792702, -0.0399588942527771, -0.03921973332762718, -0.038480572402477264, -0.03774141147732735, -0.03700225055217743, -0.03626308962702751, -0.035523928701877594, -0.034784767776727676, -0.03404560685157776, -0.03330644592642784, -0.032567285001277924, -0.031828124076128006, -0.03108896315097809, -0.03034980222582817, -0.029610641300678253, -0.028871482238173485, -0.028132321313023567, -0.02739316038787365, -0.026653999462723732, -0.025914838537573814, -0.025175677612423897, -0.02443651668727398, -0.02369735576212406, -0.022958194836974144, -0.022219033911824226, -0.02147987298667431, -0.02074071206152439, -0.020001551136374474, -0.019262390211224556, -0.01852322928607464, -0.01778406836092472, -0.017044909298419952, -0.016305748373270035, -0.015566587448120117, -0.0148274265229702, -0.014088265597820282, -0.013349104672670364, -0.012609943747520447, -0.01187078282237053, -0.011131621897220612, -0.010392460972070694, -0.009653300046920776, -0.008914139121770859, -0.008174978196620941, -0.0074358172714710236, -0.006696656811982393, -0.005957495886832476, -0.005218334496021271, -0.004479173570871353, -0.0037400126457214355, -0.0030008519534021616, -0.002261691028252244, -0.0015225301031023264, -0.0007833694107830524, -4.420848563313484e-05, 0.0006949523231014609]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 8.0, 8.0, 13.0, 11.0, 20.0, 19.0, 22.0, 35.0, 36.0, 34.0, 43.0, 44.0, 55.0, 59.0, 52.0, 55.0, 61.0, 53.0, 50.0, 62.0, 38.0, 39.0, 45.0, 27.0, 38.0, 16.0, 18.0, 7.0, 6.0, 14.0, 9.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015953779220581055, -0.0015363981947302818, -0.0014774184674024582, -0.0014184387400746346, -0.001359459012746811, -0.0013004792854189873, -0.0012414995580911636, -0.00118251983076334, -0.0011235401034355164, -0.0010645603761076927, -0.001005580648779869, -0.0009466009214520454, -0.0008876211941242218, -0.0008286414667963982, -0.0007696617394685745, -0.0007106820121407509, -0.0006517022848129272, -0.0005927225574851036, -0.00053374283015728, -0.00047476310282945633, -0.0004157833755016327, -0.00035680364817380905, -0.0002978239208459854, -0.00023884419351816177, -0.00017986446619033813, -0.0001208847388625145, -6.190501153469086e-05, -2.925284206867218e-06, 5.605444312095642e-05, 0.00011503417044878006, 0.0001740138977766037, 0.00023299362510442734, 0.000291973352432251, 0.0003509530797600746, 0.00040993280708789825, 0.0004689125344157219, 0.0005278922617435455, 0.0005868719890713692, 0.0006458517163991928, 0.0007048314437270164, 0.0007638111710548401, 0.0008227908983826637, 0.0008817706257104874, 0.000940750353038311, 0.0009997300803661346, 0.0010587098076939583, 0.001117689535021782, 0.0011766692623496056, 0.0012356489896774292, 0.0012946287170052528, 0.0013536084443330765, 0.0014125881716609001, 0.0014715678989887238, 0.0015305476263165474, 0.001589527353644371, 0.0016485070809721947, 0.0017074868083000183, 0.001766466535627842, 0.0018254462629556656, 0.0018844259902834892, 0.0019434057176113129, 0.0020023854449391365, 0.00206136517226696, 0.0021203448995947838, 0.0021793246269226074]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 6.0, 7.0, 8.0, 11.0, 7.0, 11.0, 22.0, 18.0, 16.0, 29.0, 27.0, 23.0, 31.0, 28.0, 37.0, 42.0, 44.0, 44.0, 36.0, 51.0, 45.0, 43.0, 36.0, 42.0, 45.0, 33.0, 31.0, 29.0, 27.0, 19.0, 19.0, 15.0, 19.0, 25.0, 21.0, 9.0, 11.0, 7.0, 5.0, 8.0, 4.0, 4.0, 5.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.83984375, -7.56231689453125, -7.2847900390625, -7.00726318359375, -6.729736328125, -6.45220947265625, -6.1746826171875, -5.89715576171875, -5.61962890625, -5.34210205078125, -5.0645751953125, -4.78704833984375, -4.509521484375, -4.23199462890625, -3.9544677734375, -3.67694091796875, -3.3994140625, -3.12188720703125, -2.8443603515625, -2.56683349609375, -2.289306640625, -2.01177978515625, -1.7342529296875, -1.45672607421875, -1.17919921875, -0.90167236328125, -0.6241455078125, -0.34661865234375, -0.069091796875, 0.20843505859375, 0.4859619140625, 0.76348876953125, 1.041015625, 1.31854248046875, 1.5960693359375, 1.87359619140625, 2.151123046875, 2.42864990234375, 2.7061767578125, 2.98370361328125, 3.26123046875, 3.53875732421875, 3.8162841796875, 4.09381103515625, 4.371337890625, 4.64886474609375, 4.9263916015625, 5.20391845703125, 5.4814453125, 5.75897216796875, 6.0364990234375, 6.31402587890625, 6.591552734375, 6.86907958984375, 7.1466064453125, 7.42413330078125, 7.70166015625, 7.97918701171875, 8.2567138671875, 8.53424072265625, 8.811767578125, 9.08929443359375, 9.3668212890625, 9.64434814453125, 9.921875]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 8.0, 6.0, 7.0, 12.0, 12.0, 12.0, 13.0, 33.0, 48.0, 57.0, 76.0, 81.0, 130.0, 210.0, 271.0, 421.0, 692.0, 1219.0, 2407.0, 4815.0, 9886.0, 22445.0, 56483.0, 174371.0, 461528.0, 202373.0, 63764.0, 25030.0, 10966.0, 5005.0, 2619.0, 1402.0, 730.0, 457.0, 258.0, 208.0, 113.0, 101.0, 66.0, 63.0, 40.0, 26.0, 34.0, 26.0, 12.0, 6.0, 3.0, 4.0, 6.0, 4.0, 5.0, 1.0, 1.0], "bins": [-12.0625, -11.7232666015625, -11.384033203125, -11.0447998046875, -10.70556640625, -10.3663330078125, -10.027099609375, -9.6878662109375, -9.3486328125, -9.0093994140625, -8.670166015625, -8.3309326171875, -7.99169921875, -7.6524658203125, -7.313232421875, -6.9739990234375, -6.634765625, -6.2955322265625, -5.956298828125, -5.6170654296875, -5.27783203125, -4.9385986328125, -4.599365234375, -4.2601318359375, -3.9208984375, -3.5816650390625, -3.242431640625, -2.9031982421875, -2.56396484375, -2.2247314453125, -1.885498046875, -1.5462646484375, -1.20703125, -0.8677978515625, -0.528564453125, -0.1893310546875, 0.14990234375, 0.4891357421875, 0.828369140625, 1.1676025390625, 1.5068359375, 1.8460693359375, 2.185302734375, 2.5245361328125, 2.86376953125, 3.2030029296875, 3.542236328125, 3.8814697265625, 4.220703125, 4.5599365234375, 4.899169921875, 5.2384033203125, 5.57763671875, 5.9168701171875, 6.256103515625, 6.5953369140625, 6.9345703125, 7.2738037109375, 7.613037109375, 7.9522705078125, 8.29150390625, 8.6307373046875, 8.969970703125, 9.3092041015625, 9.6484375]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 2.0, 1.0, 9.0, 5.0, 2.0, 8.0, 13.0, 15.0, 11.0, 18.0, 18.0, 30.0, 21.0, 32.0, 38.0, 38.0, 43.0, 45.0, 57.0, 100.0, 199.0, 1441.0, 312.0, 135.0, 67.0, 63.0, 48.0, 32.0, 39.0, 35.0, 29.0, 21.0, 19.0, 18.0, 14.0, 18.0, 10.0, 10.0, 11.0, 5.0, 8.0, 3.0, 4.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-25.515625, -24.7607421875, -24.005859375, -23.2509765625, -22.49609375, -21.7412109375, -20.986328125, -20.2314453125, -19.4765625, -18.7216796875, -17.966796875, -17.2119140625, -16.45703125, -15.7021484375, -14.947265625, -14.1923828125, -13.4375, -12.6826171875, -11.927734375, -11.1728515625, -10.41796875, -9.6630859375, -8.908203125, -8.1533203125, -7.3984375, -6.6435546875, -5.888671875, -5.1337890625, -4.37890625, -3.6240234375, -2.869140625, -2.1142578125, -1.359375, -0.6044921875, 0.150390625, 0.9052734375, 1.66015625, 2.4150390625, 3.169921875, 3.9248046875, 4.6796875, 5.4345703125, 6.189453125, 6.9443359375, 7.69921875, 8.4541015625, 9.208984375, 9.9638671875, 10.71875, 11.4736328125, 12.228515625, 12.9833984375, 13.73828125, 14.4931640625, 15.248046875, 16.0029296875, 16.7578125, 17.5126953125, 18.267578125, 19.0224609375, 19.77734375, 20.5322265625, 21.287109375, 22.0419921875, 22.796875]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 0.0, 2.0, 2.0, 7.0, 5.0, 6.0, 11.0, 15.0, 18.0, 18.0, 24.0, 37.0, 40.0, 65.0, 79.0, 108.0, 165.0, 241.0, 469.0, 1397.0, 13736.0, 2174485.0, 942061.0, 10293.0, 1154.0, 431.0, 262.0, 144.0, 131.0, 61.0, 56.0, 41.0, 39.0, 28.0, 21.0, 17.0, 8.0, 13.0, 5.0, 7.0, 4.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.6875, -40.24755859375, -38.8076171875, -37.36767578125, -35.927734375, -34.48779296875, -33.0478515625, -31.60791015625, -30.16796875, -28.72802734375, -27.2880859375, -25.84814453125, -24.408203125, -22.96826171875, -21.5283203125, -20.08837890625, -18.6484375, -17.20849609375, -15.7685546875, -14.32861328125, -12.888671875, -11.44873046875, -10.0087890625, -8.56884765625, -7.12890625, -5.68896484375, -4.2490234375, -2.80908203125, -1.369140625, 0.07080078125, 1.5107421875, 2.95068359375, 4.390625, 5.83056640625, 7.2705078125, 8.71044921875, 10.150390625, 11.59033203125, 13.0302734375, 14.47021484375, 15.91015625, 17.35009765625, 18.7900390625, 20.22998046875, 21.669921875, 23.10986328125, 24.5498046875, 25.98974609375, 27.4296875, 28.86962890625, 30.3095703125, 31.74951171875, 33.189453125, 34.62939453125, 36.0693359375, 37.50927734375, 38.94921875, 40.38916015625, 41.8291015625, 43.26904296875, 44.708984375, 46.14892578125, 47.5888671875, 49.02880859375, 50.46875]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 167.0, 832.0, 17.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-475.1203308105469, -465.277587890625, -455.434814453125, -445.5920715332031, -435.74932861328125, -425.90655517578125, -416.0638122558594, -406.2210693359375, -396.3782958984375, -386.5355529785156, -376.6927795410156, -366.85003662109375, -357.0072937011719, -347.16455078125, -337.32177734375, -327.4790344238281, -317.63629150390625, -307.7935485839844, -297.9507751464844, -288.1080322265625, -278.2652893066406, -268.42254638671875, -258.57977294921875, -248.73703002929688, -238.89427185058594, -229.051513671875, -219.20877075195312, -209.3660125732422, -199.52325439453125, -189.68051147460938, -179.83775329589844, -169.9949951171875, -160.1522216796875, -150.30946350097656, -140.4667205810547, -130.62396240234375, -120.78121185302734, -110.93846130371094, -101.095703125, -91.2529525756836, -81.41020202636719, -71.56745147705078, -61.72469711303711, -51.88194274902344, -42.03919219970703, -32.196441650390625, -22.353687286376953, -12.510932922363281, -2.668182373046875, 7.174570083618164, 17.017322540283203, 26.860074996948242, 36.70282745361328, 46.54557800292969, 56.38833236694336, 66.23108673095703, 76.07383728027344, 85.91658782958984, 95.75933837890625, 105.60209655761719, 115.4448471069336, 125.28759765625, 135.13035583496094, 144.97311401367188, 154.81585693359375]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 8.0, 5.0, 5.0, 6.0, 15.0, 17.0, 13.0, 19.0, 16.0, 20.0, 30.0, 24.0, 30.0, 26.0, 40.0, 30.0, 41.0, 37.0, 30.0, 40.0, 52.0, 36.0, 44.0, 29.0, 28.0, 45.0, 30.0, 35.0, 32.0, 29.0, 37.0, 14.0, 18.0, 23.0, 18.0, 14.0, 8.0, 12.0, 11.0, 3.0, 12.0, 5.0, 4.0, 3.0, 4.0, 0.0, 1.0, 4.0, 0.0, 2.0], "bins": [-61.60636901855469, -59.895355224609375, -58.1843376159668, -56.473323822021484, -54.762306213378906, -53.051292419433594, -51.34027862548828, -49.6292610168457, -47.918243408203125, -46.20722961425781, -44.496212005615234, -42.78519821166992, -41.074180603027344, -39.36316680908203, -37.65215301513672, -35.94113540649414, -34.23012161254883, -32.519107818603516, -30.808090209960938, -29.097076416015625, -27.386058807373047, -25.675045013427734, -23.96402931213379, -22.253013610839844, -20.5419979095459, -18.830982208251953, -17.119966506958008, -15.408951759338379, -13.697936058044434, -11.986920356750488, -10.27590560913086, -8.564889907836914, -6.853874206542969, -5.142858505249023, -3.4318432807922363, -1.7208280563354492, -0.009812355041503906, 1.7012033462524414, 3.4122180938720703, 5.123233795166016, 6.834249496459961, 8.545265197753906, 10.256280899047852, 11.96729564666748, 13.678311347961426, 15.389327049255371, 17.100341796875, 18.811357498168945, 20.52237319946289, 22.233388900756836, 23.94440460205078, 25.655418395996094, 27.366436004638672, 29.077449798583984, 30.78846549987793, 32.499481201171875, 34.21049499511719, 35.9215087890625, 37.63252639770508, 39.34354019165039, 41.05455780029297, 42.76557159423828, 44.476585388183594, 46.18760299682617, 47.89862060546875]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 4.0, 4.0, 4.0, 4.0, 8.0, 9.0, 8.0, 16.0, 21.0, 21.0, 16.0, 25.0, 29.0, 24.0, 27.0, 40.0, 34.0, 37.0, 50.0, 34.0, 49.0, 48.0, 44.0, 45.0, 43.0, 31.0, 42.0, 34.0, 24.0, 24.0, 31.0, 23.0, 19.0, 20.0, 14.0, 19.0, 9.0, 16.0, 17.0, 11.0, 11.0, 5.0, 5.0, 8.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.0703125, -7.784423828125, -7.49853515625, -7.212646484375, -6.9267578125, -6.640869140625, -6.35498046875, -6.069091796875, -5.783203125, -5.497314453125, -5.21142578125, -4.925537109375, -4.6396484375, -4.353759765625, -4.06787109375, -3.781982421875, -3.49609375, -3.210205078125, -2.92431640625, -2.638427734375, -2.3525390625, -2.066650390625, -1.78076171875, -1.494873046875, -1.208984375, -0.923095703125, -0.63720703125, -0.351318359375, -0.0654296875, 0.220458984375, 0.50634765625, 0.792236328125, 1.078125, 1.364013671875, 1.64990234375, 1.935791015625, 2.2216796875, 2.507568359375, 2.79345703125, 3.079345703125, 3.365234375, 3.651123046875, 3.93701171875, 4.222900390625, 4.5087890625, 4.794677734375, 5.08056640625, 5.366455078125, 5.65234375, 5.938232421875, 6.22412109375, 6.510009765625, 6.7958984375, 7.081787109375, 7.36767578125, 7.653564453125, 7.939453125, 8.225341796875, 8.51123046875, 8.797119140625, 9.0830078125, 9.368896484375, 9.65478515625, 9.940673828125, 10.2265625]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 6.0, 4.0, 9.0, 11.0, 15.0, 8.0, 17.0, 15.0, 30.0, 31.0, 52.0, 49.0, 71.0, 95.0, 133.0, 167.0, 256.0, 320.0, 445.0, 1289.0, 4151022.0, 38082.0, 617.0, 411.0, 267.0, 201.0, 179.0, 109.0, 90.0, 62.0, 48.0, 37.0, 21.0, 20.0, 19.0, 21.0, 9.0, 18.0, 5.0, 6.0, 6.0, 4.0, 3.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-140.625, -136.19921875, -131.7734375, -127.34765625, -122.921875, -118.49609375, -114.0703125, -109.64453125, -105.21875, -100.79296875, -96.3671875, -91.94140625, -87.515625, -83.08984375, -78.6640625, -74.23828125, -69.8125, -65.38671875, -60.9609375, -56.53515625, -52.109375, -47.68359375, -43.2578125, -38.83203125, -34.40625, -29.98046875, -25.5546875, -21.12890625, -16.703125, -12.27734375, -7.8515625, -3.42578125, 1.0, 5.42578125, 9.8515625, 14.27734375, 18.703125, 23.12890625, 27.5546875, 31.98046875, 36.40625, 40.83203125, 45.2578125, 49.68359375, 54.109375, 58.53515625, 62.9609375, 67.38671875, 71.8125, 76.23828125, 80.6640625, 85.08984375, 89.515625, 93.94140625, 98.3671875, 102.79296875, 107.21875, 111.64453125, 116.0703125, 120.49609375, 124.921875, 129.34765625, 133.7734375, 138.19921875, 142.625]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 7.0, 4.0, 7.0, 11.0, 13.0, 25.0, 32.0, 36.0, 77.0, 92.0, 158.0, 229.0, 434.0, 698.0, 814.0, 594.0, 354.0, 183.0, 101.0, 70.0, 44.0, 26.0, 19.0, 22.0, 13.0, 2.0, 6.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-23.234375, -22.6427001953125, -22.051025390625, -21.4593505859375, -20.86767578125, -20.2760009765625, -19.684326171875, -19.0926513671875, -18.5009765625, -17.9093017578125, -17.317626953125, -16.7259521484375, -16.13427734375, -15.5426025390625, -14.950927734375, -14.3592529296875, -13.767578125, -13.1759033203125, -12.584228515625, -11.9925537109375, -11.40087890625, -10.8092041015625, -10.217529296875, -9.6258544921875, -9.0341796875, -8.4425048828125, -7.850830078125, -7.2591552734375, -6.66748046875, -6.0758056640625, -5.484130859375, -4.8924560546875, -4.30078125, -3.7091064453125, -3.117431640625, -2.5257568359375, -1.93408203125, -1.3424072265625, -0.750732421875, -0.1590576171875, 0.4326171875, 1.0242919921875, 1.615966796875, 2.2076416015625, 2.79931640625, 3.3909912109375, 3.982666015625, 4.5743408203125, 5.166015625, 5.7576904296875, 6.349365234375, 6.9410400390625, 7.53271484375, 8.1243896484375, 8.716064453125, 9.3077392578125, 9.8994140625, 10.4910888671875, 11.082763671875, 11.6744384765625, 12.26611328125, 12.8577880859375, 13.449462890625, 14.0411376953125, 14.6328125]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 8.0, 9.0, 6.0, 5.0, 11.0, 7.0, 21.0, 28.0, 27.0, 35.0, 39.0, 58.0, 61.0, 147.0, 440.0, 4962.0, 3408358.0, 776647.0, 2627.0, 341.0, 120.0, 70.0, 51.0, 30.0, 32.0, 29.0, 26.0, 23.0, 22.0, 13.0, 9.0, 5.0, 4.0, 2.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.0, -71.5263671875, -69.052734375, -66.5791015625, -64.10546875, -61.6318359375, -59.158203125, -56.6845703125, -54.2109375, -51.7373046875, -49.263671875, -46.7900390625, -44.31640625, -41.8427734375, -39.369140625, -36.8955078125, -34.421875, -31.9482421875, -29.474609375, -27.0009765625, -24.52734375, -22.0537109375, -19.580078125, -17.1064453125, -14.6328125, -12.1591796875, -9.685546875, -7.2119140625, -4.73828125, -2.2646484375, 0.208984375, 2.6826171875, 5.15625, 7.6298828125, 10.103515625, 12.5771484375, 15.05078125, 17.5244140625, 19.998046875, 22.4716796875, 24.9453125, 27.4189453125, 29.892578125, 32.3662109375, 34.83984375, 37.3134765625, 39.787109375, 42.2607421875, 44.734375, 47.2080078125, 49.681640625, 52.1552734375, 54.62890625, 57.1025390625, 59.576171875, 62.0498046875, 64.5234375, 66.9970703125, 69.470703125, 71.9443359375, 74.41796875, 76.8916015625, 79.365234375, 81.8388671875, 84.3125]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 11.0, 113.0, 471.0, 353.0, 58.0, 6.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.155487060546875, -49.82224655151367, -43.48900604248047, -37.15576171875, -30.822521209716797, -24.489280700683594, -18.156036376953125, -11.822795867919922, -5.489555358886719, 0.8436861038208008, 7.17692756652832, 13.510169982910156, 19.84341049194336, 26.176651000976562, 32.50989532470703, 38.843135833740234, 45.17637634277344, 51.50961685180664, 57.842857360839844, 64.17610168457031, 70.50933837890625, 76.84258270263672, 83.17582702636719, 89.50906372070312, 95.8423080444336, 102.17555236816406, 108.5087890625, 114.84203338623047, 121.17527770996094, 127.50851440429688, 133.84176635742188, 140.1750030517578, 146.50823974609375, 152.8414764404297, 159.1747283935547, 165.50796508789062, 171.84120178222656, 178.1744384765625, 184.5076904296875, 190.84092712402344, 197.17416381835938, 203.5074005126953, 209.8406524658203, 216.17388916015625, 222.5071258544922, 228.84036254882812, 235.17361450195312, 241.50685119628906, 247.84010314941406, 254.17333984375, 260.506591796875, 266.83984375, 273.1730651855469, 279.5063171386719, 285.83953857421875, 292.17279052734375, 298.50604248046875, 304.83929443359375, 311.1725158691406, 317.5057678222656, 323.8390197753906, 330.1722412109375, 336.5054931640625, 342.8387451171875, 349.1719665527344]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 5.0, 7.0, 6.0, 13.0, 9.0, 12.0, 9.0, 6.0, 13.0, 27.0, 26.0, 16.0, 19.0, 29.0, 31.0, 34.0, 32.0, 42.0, 48.0, 35.0, 36.0, 46.0, 45.0, 48.0, 48.0, 31.0, 47.0, 37.0, 33.0, 27.0, 33.0, 23.0, 25.0, 24.0, 18.0, 12.0, 15.0, 7.0, 6.0, 6.0, 3.0, 9.0, 2.0, 2.0, 6.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.41960906982422, -42.93485641479492, -41.450103759765625, -39.96535110473633, -38.48059844970703, -36.99584197998047, -35.51108932495117, -34.026336669921875, -32.54158401489258, -31.05683135986328, -29.572078704833984, -28.087324142456055, -26.602571487426758, -25.11781883239746, -23.63306427001953, -22.148311614990234, -20.663558959960938, -19.17880630493164, -17.694053649902344, -16.209299087524414, -14.724546432495117, -13.23979377746582, -11.755040168762207, -10.270286560058594, -8.785533905029297, -7.300780773162842, -5.816027641296387, -4.331274509429932, -2.8465213775634766, -1.3617682456970215, 0.1229848861694336, 1.6077384948730469, 3.0924911499023438, 4.577244281768799, 6.061997413635254, 7.546750545501709, 9.031503677368164, 10.516256332397461, 12.001009941101074, 13.485763549804688, 14.970516204833984, 16.45526885986328, 17.940021514892578, 19.424776077270508, 20.909528732299805, 22.3942813873291, 23.87903594970703, 25.363788604736328, 26.848541259765625, 28.333293914794922, 29.81804656982422, 31.30280113220215, 32.78755187988281, 34.272308349609375, 35.75706100463867, 37.24181365966797, 38.726566314697266, 40.21131896972656, 41.69607162475586, 43.180824279785156, 44.66558074951172, 46.150333404541016, 47.63508605957031, 49.11983871459961, 50.604591369628906]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 4.0, 7.0, 2.0, 4.0, 1.0, 5.0, 6.0, 13.0, 13.0, 4.0, 13.0, 17.0, 29.0, 25.0, 30.0, 30.0, 24.0, 28.0, 29.0, 36.0, 32.0, 30.0, 36.0, 39.0, 46.0, 39.0, 29.0, 37.0, 31.0, 38.0, 42.0, 31.0, 32.0, 23.0, 27.0, 20.0, 24.0, 29.0, 13.0, 8.0, 13.0, 19.0, 12.0, 11.0, 8.0, 5.0, 3.0, 3.0, 0.0, 3.0, 0.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.95703125, -6.71905517578125, -6.4810791015625, -6.24310302734375, -6.005126953125, -5.76715087890625, -5.5291748046875, -5.29119873046875, -5.05322265625, -4.81524658203125, -4.5772705078125, -4.33929443359375, -4.101318359375, -3.86334228515625, -3.6253662109375, -3.38739013671875, -3.1494140625, -2.91143798828125, -2.6734619140625, -2.43548583984375, -2.197509765625, -1.95953369140625, -1.7215576171875, -1.48358154296875, -1.24560546875, -1.00762939453125, -0.7696533203125, -0.53167724609375, -0.293701171875, -0.05572509765625, 0.1822509765625, 0.42022705078125, 0.658203125, 0.89617919921875, 1.1341552734375, 1.37213134765625, 1.610107421875, 1.84808349609375, 2.0860595703125, 2.32403564453125, 2.56201171875, 2.79998779296875, 3.0379638671875, 3.27593994140625, 3.513916015625, 3.75189208984375, 3.9898681640625, 4.22784423828125, 4.4658203125, 4.70379638671875, 4.9417724609375, 5.17974853515625, 5.417724609375, 5.65570068359375, 5.8936767578125, 6.13165283203125, 6.36962890625, 6.60760498046875, 6.8455810546875, 7.08355712890625, 7.321533203125, 7.55950927734375, 7.7974853515625, 8.03546142578125, 8.2734375]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 9.0, 6.0, 5.0, 20.0, 28.0, 41.0, 69.0, 117.0, 141.0, 214.0, 276.0, 388.0, 574.0, 845.0, 1153.0, 1665.0, 2547.0, 3487.0, 5266.0, 7530.0, 11058.0, 16420.0, 25176.0, 38406.0, 60293.0, 94081.0, 138881.0, 172731.0, 154177.0, 108959.0, 70272.0, 45261.0, 29019.0, 19027.0, 12726.0, 8629.0, 5869.0, 3999.0, 2844.0, 1994.0, 1330.0, 861.0, 666.0, 455.0, 335.0, 230.0, 147.0, 128.0, 80.0, 45.0, 21.0, 26.0, 12.0, 8.0, 5.0, 7.0, 6.0, 4.0], "bins": [-0.72705078125, -0.7054595947265625, -0.683868408203125, -0.6622772216796875, -0.64068603515625, -0.6190948486328125, -0.597503662109375, -0.5759124755859375, -0.5543212890625, -0.5327301025390625, -0.511138916015625, -0.4895477294921875, -0.46795654296875, -0.4463653564453125, -0.424774169921875, -0.4031829833984375, -0.381591796875, -0.3600006103515625, -0.338409423828125, -0.3168182373046875, -0.29522705078125, -0.2736358642578125, -0.252044677734375, -0.2304534912109375, -0.2088623046875, -0.1872711181640625, -0.165679931640625, -0.1440887451171875, -0.12249755859375, -0.1009063720703125, -0.079315185546875, -0.0577239990234375, -0.0361328125, -0.0145416259765625, 0.007049560546875, 0.0286407470703125, 0.05023193359375, 0.0718231201171875, 0.093414306640625, 0.1150054931640625, 0.1365966796875, 0.1581878662109375, 0.179779052734375, 0.2013702392578125, 0.22296142578125, 0.2445526123046875, 0.266143798828125, 0.2877349853515625, 0.309326171875, 0.3309173583984375, 0.352508544921875, 0.3740997314453125, 0.39569091796875, 0.4172821044921875, 0.438873291015625, 0.4604644775390625, 0.4820556640625, 0.5036468505859375, 0.525238037109375, 0.5468292236328125, 0.56842041015625, 0.5900115966796875, 0.611602783203125, 0.6331939697265625, 0.65478515625]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 6.0, 2.0, 7.0, 3.0, 6.0, 6.0, 9.0, 12.0, 14.0, 19.0, 22.0, 22.0, 19.0, 27.0, 33.0, 40.0, 30.0, 33.0, 27.0, 56.0, 39.0, 35.0, 27.0, 1065.0, 49.0, 38.0, 31.0, 32.0, 24.0, 29.0, 25.0, 36.0, 25.0, 21.0, 29.0, 25.0, 16.0, 15.0, 8.0, 13.0, 11.0, 11.0, 8.0, 5.0, 9.0, 4.0, 3.0, 0.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 3.0], "bins": [-5.05859375, -4.9036865234375, -4.748779296875, -4.5938720703125, -4.43896484375, -4.2840576171875, -4.129150390625, -3.9742431640625, -3.8193359375, -3.6644287109375, -3.509521484375, -3.3546142578125, -3.19970703125, -3.0447998046875, -2.889892578125, -2.7349853515625, -2.580078125, -2.4251708984375, -2.270263671875, -2.1153564453125, -1.96044921875, -1.8055419921875, -1.650634765625, -1.4957275390625, -1.3408203125, -1.1859130859375, -1.031005859375, -0.8760986328125, -0.72119140625, -0.5662841796875, -0.411376953125, -0.2564697265625, -0.1015625, 0.0533447265625, 0.208251953125, 0.3631591796875, 0.51806640625, 0.6729736328125, 0.827880859375, 0.9827880859375, 1.1376953125, 1.2926025390625, 1.447509765625, 1.6024169921875, 1.75732421875, 1.9122314453125, 2.067138671875, 2.2220458984375, 2.376953125, 2.5318603515625, 2.686767578125, 2.8416748046875, 2.99658203125, 3.1514892578125, 3.306396484375, 3.4613037109375, 3.6162109375, 3.7711181640625, 3.926025390625, 4.0809326171875, 4.23583984375, 4.3907470703125, 4.545654296875, 4.7005615234375, 4.85546875]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 2.0, 8.0, 11.0, 11.0, 15.0, 42.0, 62.0, 97.0, 132.0, 192.0, 301.0, 475.0, 820.0, 1180.0, 1929.0, 3027.0, 4964.0, 7976.0, 13280.0, 21817.0, 35977.0, 59336.0, 97241.0, 147603.0, 1231987.0, 166181.0, 116391.0, 72711.0, 44165.0, 26928.0, 16257.0, 9819.0, 6141.0, 3704.0, 2395.0, 1446.0, 909.0, 581.0, 357.0, 245.0, 144.0, 84.0, 71.0, 47.0, 29.0, 11.0, 13.0, 7.0, 6.0, 5.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.623046875, -0.602752685546875, -0.58245849609375, -0.562164306640625, -0.5418701171875, -0.521575927734375, -0.50128173828125, -0.480987548828125, -0.460693359375, -0.440399169921875, -0.42010498046875, -0.399810791015625, -0.3795166015625, -0.359222412109375, -0.33892822265625, -0.318634033203125, -0.29833984375, -0.278045654296875, -0.25775146484375, -0.237457275390625, -0.2171630859375, -0.196868896484375, -0.17657470703125, -0.156280517578125, -0.135986328125, -0.115692138671875, -0.09539794921875, -0.075103759765625, -0.0548095703125, -0.034515380859375, -0.01422119140625, 0.006072998046875, 0.0263671875, 0.046661376953125, 0.06695556640625, 0.087249755859375, 0.1075439453125, 0.127838134765625, 0.14813232421875, 0.168426513671875, 0.188720703125, 0.209014892578125, 0.22930908203125, 0.249603271484375, 0.2698974609375, 0.290191650390625, 0.31048583984375, 0.330780029296875, 0.35107421875, 0.371368408203125, 0.39166259765625, 0.411956787109375, 0.4322509765625, 0.452545166015625, 0.47283935546875, 0.493133544921875, 0.513427734375, 0.533721923828125, 0.55401611328125, 0.574310302734375, 0.5946044921875, 0.614898681640625, 0.63519287109375, 0.655487060546875, 0.67578125]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 4.0, 8.0, 8.0, 9.0, 5.0, 9.0, 13.0, 17.0, 15.0, 19.0, 27.0, 21.0, 31.0, 41.0, 39.0, 46.0, 73.0, 57.0, 79.0, 53.0, 52.0, 52.0, 50.0, 36.0, 40.0, 38.0, 32.0, 20.0, 22.0, 13.0, 9.0, 8.0, 7.0, 7.0, 10.0, 8.0, 3.0, 5.0, 3.0, 3.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.002193450927734375, -0.0021162331104278564, -0.002039015293121338, -0.0019617974758148193, -0.0018845796585083008, -0.0018073618412017822, -0.0017301440238952637, -0.0016529262065887451, -0.0015757083892822266, -0.001498490571975708, -0.0014212727546691895, -0.001344054937362671, -0.0012668371200561523, -0.0011896193027496338, -0.0011124014854431152, -0.0010351836681365967, -0.0009579658508300781, -0.0008807480335235596, -0.000803530216217041, -0.0007263123989105225, -0.0006490945816040039, -0.0005718767642974854, -0.0004946589469909668, -0.00041744112968444824, -0.0003402233123779297, -0.00026300549507141113, -0.00018578767776489258, -0.00010856986045837402, -3.135204315185547e-05, 4.5865774154663086e-05, 0.00012308359146118164, 0.0002003014087677002, 0.00027751922607421875, 0.0003547370433807373, 0.00043195486068725586, 0.0005091726779937744, 0.000586390495300293, 0.0006636083126068115, 0.0007408261299133301, 0.0008180439472198486, 0.0008952617645263672, 0.0009724795818328857, 0.0010496973991394043, 0.0011269152164459229, 0.0012041330337524414, 0.00128135085105896, 0.0013585686683654785, 0.001435786485671997, 0.0015130043029785156, 0.0015902221202850342, 0.0016674399375915527, 0.0017446577548980713, 0.0018218755722045898, 0.0018990933895111084, 0.001976311206817627, 0.0020535290241241455, 0.002130746841430664, 0.0022079646587371826, 0.002285182476043701, 0.0023624002933502197, 0.0024396181106567383, 0.002516835927963257, 0.0025940537452697754, 0.002671271562576294, 0.0027484893798828125]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 3.0, 7.0, 4.0, 8.0, 10.0, 6.0, 11.0, 21.0, 17.0, 15.0, 24.0, 28.0, 30.0, 50.0, 78.0, 98.0, 154.0, 210.0, 342.0, 641.0, 2834.0, 934348.0, 106747.0, 1268.0, 558.0, 313.0, 189.0, 128.0, 80.0, 67.0, 46.0, 38.0, 36.0, 35.0, 24.0, 15.0, 16.0, 14.0, 12.0, 11.0, 5.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.05303955078125, -0.05151557922363281, -0.049991607666015625, -0.04846763610839844, -0.04694366455078125, -0.04541969299316406, -0.043895721435546875, -0.04237174987792969, -0.0408477783203125, -0.03932380676269531, -0.037799835205078125, -0.03627586364746094, -0.03475189208984375, -0.03322792053222656, -0.031703948974609375, -0.030179977416992188, -0.028656005859375, -0.027132034301757812, -0.025608062744140625, -0.024084091186523438, -0.02256011962890625, -0.021036148071289062, -0.019512176513671875, -0.017988204956054688, -0.0164642333984375, -0.014940261840820312, -0.013416290283203125, -0.011892318725585938, -0.01036834716796875, -0.008844375610351562, -0.007320404052734375, -0.0057964324951171875, -0.0042724609375, -0.0027484893798828125, -0.001224517822265625, 0.0002994537353515625, 0.00182342529296875, 0.0033473968505859375, 0.004871368408203125, 0.0063953399658203125, 0.0079193115234375, 0.009443283081054688, 0.010967254638671875, 0.012491226196289062, 0.01401519775390625, 0.015539169311523438, 0.017063140869140625, 0.018587112426757812, 0.020111083984375, 0.021635055541992188, 0.023159027099609375, 0.024682998657226562, 0.02620697021484375, 0.027730941772460938, 0.029254913330078125, 0.030778884887695312, 0.0323028564453125, 0.03382682800292969, 0.035350799560546875, 0.03687477111816406, 0.03839874267578125, 0.03992271423339844, 0.041446685791015625, 0.04297065734863281, 0.04449462890625]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 15.0, 1003.0], "bins": [-0.06981678307056427, -0.06871691346168518, -0.06761705130338669, -0.0665171816945076, -0.0654173195362091, -0.06431744992733002, -0.06321758031845093, -0.062117718160152435, -0.061017848551273346, -0.059917982667684555, -0.058818116784095764, -0.057718247175216675, -0.056618381291627884, -0.05551851540803909, -0.0544186495244503, -0.05331878364086151, -0.05221891775727272, -0.05111905187368393, -0.05001918599009514, -0.04891931638121605, -0.04781945049762726, -0.04671958461403847, -0.045619718730449677, -0.044519852846860886, -0.043419986963272095, -0.042320121079683304, -0.04122025519609451, -0.040120385587215424, -0.03902051970362663, -0.03792065382003784, -0.03682078793644905, -0.03572092205286026, -0.03462105244398117, -0.03352118656039238, -0.03242132067680359, -0.0313214510679245, -0.03022158518433571, -0.029121719300746918, -0.028021853417158127, -0.026921987533569336, -0.025822117924690247, -0.024722252041101456, -0.023622384294867516, -0.022522518411278725, -0.021422650665044785, -0.020322784781455994, -0.019222918897867203, -0.018123053014278412, -0.017023185268044472, -0.01592331938445568, -0.01482345163822174, -0.01372358575463295, -0.012623718939721584, -0.011523852124810219, -0.010423986241221428, -0.009324119426310062, -0.008224252611398697, -0.007124385796487331, -0.006024519447237253, -0.004924653097987175, -0.0038247862830758095, -0.002724919468164444, -0.0016250531189143658, -0.0005251867696642876, 0.0005746795795857906]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 5.0, 8.0, 15.0, 9.0, 14.0, 35.0, 34.0, 46.0, 54.0, 74.0, 80.0, 81.0, 70.0, 94.0, 73.0, 61.0, 49.0, 43.0, 55.0, 36.0, 23.0, 19.0, 14.0, 9.0, 5.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014673471450805664, -0.0013855146244168282, -0.00130368210375309, -0.0012218495830893517, -0.0011400170624256134, -0.0010581845417618752, -0.0009763520210981369, -0.0008945195004343987, -0.0008126869797706604, -0.0007308544591069221, -0.0006490219384431839, -0.0005671894177794456, -0.0004853568971157074, -0.00040352437645196915, -0.0003216918557882309, -0.00023985933512449265, -0.0001580268144607544, -7.619429379701614e-05, 5.638226866722107e-06, 8.747074753046036e-05, 0.0001693032681941986, 0.00025113578885793686, 0.0003329683095216751, 0.00041480083018541336, 0.0004966333508491516, 0.0005784658715128899, 0.0006602983921766281, 0.0007421309128403664, 0.0008239634335041046, 0.0009057959541678429, 0.0009876284748315811, 0.0010694609954953194, 0.0011512935161590576, 0.0012331260368227959, 0.0013149585574865341, 0.0013967910781502724, 0.0014786235988140106, 0.0015604561194777489, 0.0016422886401414871, 0.0017241211608052254, 0.0018059536814689636, 0.0018877862021327019, 0.00196961872279644, 0.0020514512434601784, 0.0021332837641239166, 0.002215116284787655, 0.002296948805451393, 0.0023787813261151314, 0.0024606138467788696, 0.002542446367442608, 0.002624278888106346, 0.0027061114087700844, 0.0027879439294338226, 0.002869776450097561, 0.002951608970761299, 0.0030334414914250374, 0.0031152740120887756, 0.003197106532752514, 0.003278939053416252, 0.0033607715740799904, 0.0034426040947437286, 0.003524436615407467, 0.003606269136071205, 0.0036881016567349434, 0.0037699341773986816]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 4.0, 7.0, 2.0, 4.0, 1.0, 5.0, 6.0, 14.0, 12.0, 4.0, 13.0, 17.0, 29.0, 25.0, 30.0, 30.0, 24.0, 28.0, 29.0, 36.0, 32.0, 30.0, 36.0, 39.0, 46.0, 39.0, 30.0, 36.0, 31.0, 38.0, 42.0, 31.0, 32.0, 23.0, 27.0, 20.0, 24.0, 29.0, 13.0, 8.0, 13.0, 19.0, 12.0, 11.0, 8.0, 5.0, 3.0, 3.0, 0.0, 3.0, 0.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.95703125, -6.71905517578125, -6.4810791015625, -6.24310302734375, -6.005126953125, -5.76715087890625, -5.5291748046875, -5.29119873046875, -5.05322265625, -4.81524658203125, -4.5772705078125, -4.33929443359375, -4.101318359375, -3.86334228515625, -3.6253662109375, -3.38739013671875, -3.1494140625, -2.91143798828125, -2.6734619140625, -2.43548583984375, -2.197509765625, -1.95953369140625, -1.7215576171875, -1.48358154296875, -1.24560546875, -1.00762939453125, -0.7696533203125, -0.53167724609375, -0.293701171875, -0.05572509765625, 0.1822509765625, 0.42022705078125, 0.658203125, 0.89617919921875, 1.1341552734375, 1.37213134765625, 1.610107421875, 1.84808349609375, 2.0860595703125, 2.32403564453125, 2.56201171875, 2.79998779296875, 3.0379638671875, 3.27593994140625, 3.513916015625, 3.75189208984375, 3.9898681640625, 4.22784423828125, 4.4658203125, 4.70379638671875, 4.9417724609375, 5.17974853515625, 5.417724609375, 5.65570068359375, 5.8936767578125, 6.13165283203125, 6.36962890625, 6.60760498046875, 6.8455810546875, 7.08355712890625, 7.321533203125, 7.55950927734375, 7.7974853515625, 8.03546142578125, 8.2734375]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 4.0, 5.0, 7.0, 5.0, 11.0, 11.0, 19.0, 27.0, 42.0, 41.0, 54.0, 72.0, 82.0, 108.0, 165.0, 189.0, 265.0, 340.0, 415.0, 561.0, 721.0, 1008.0, 1381.0, 2337.0, 5068.0, 15430.0, 62761.0, 278814.0, 487146.0, 140464.0, 32122.0, 8821.0, 3437.0, 1816.0, 1152.0, 863.0, 685.0, 450.0, 383.0, 286.0, 249.0, 185.0, 139.0, 93.0, 74.0, 54.0, 54.0, 41.0, 28.0, 22.0, 15.0, 10.0, 6.0, 6.0, 5.0, 6.0, 4.0, 5.0, 3.0, 0.0, 2.0], "bins": [-12.0390625, -11.654052734375, -11.26904296875, -10.884033203125, -10.4990234375, -10.114013671875, -9.72900390625, -9.343994140625, -8.958984375, -8.573974609375, -8.18896484375, -7.803955078125, -7.4189453125, -7.033935546875, -6.64892578125, -6.263916015625, -5.87890625, -5.493896484375, -5.10888671875, -4.723876953125, -4.3388671875, -3.953857421875, -3.56884765625, -3.183837890625, -2.798828125, -2.413818359375, -2.02880859375, -1.643798828125, -1.2587890625, -0.873779296875, -0.48876953125, -0.103759765625, 0.28125, 0.666259765625, 1.05126953125, 1.436279296875, 1.8212890625, 2.206298828125, 2.59130859375, 2.976318359375, 3.361328125, 3.746337890625, 4.13134765625, 4.516357421875, 4.9013671875, 5.286376953125, 5.67138671875, 6.056396484375, 6.44140625, 6.826416015625, 7.21142578125, 7.596435546875, 7.9814453125, 8.366455078125, 8.75146484375, 9.136474609375, 9.521484375, 9.906494140625, 10.29150390625, 10.676513671875, 11.0615234375, 11.446533203125, 11.83154296875, 12.216552734375, 12.6015625]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 5.0, 2.0, 1.0, 7.0, 6.0, 6.0, 10.0, 10.0, 19.0, 12.0, 20.0, 23.0, 28.0, 21.0, 30.0, 34.0, 42.0, 54.0, 73.0, 89.0, 167.0, 1550.0, 318.0, 84.0, 71.0, 51.0, 37.0, 49.0, 40.0, 37.0, 31.0, 26.0, 11.0, 20.0, 14.0, 13.0, 13.0, 10.0, 6.0, 8.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.953125, -18.216552734375, -17.47998046875, -16.743408203125, -16.0068359375, -15.270263671875, -14.53369140625, -13.797119140625, -13.060546875, -12.323974609375, -11.58740234375, -10.850830078125, -10.1142578125, -9.377685546875, -8.64111328125, -7.904541015625, -7.16796875, -6.431396484375, -5.69482421875, -4.958251953125, -4.2216796875, -3.485107421875, -2.74853515625, -2.011962890625, -1.275390625, -0.538818359375, 0.19775390625, 0.934326171875, 1.6708984375, 2.407470703125, 3.14404296875, 3.880615234375, 4.6171875, 5.353759765625, 6.09033203125, 6.826904296875, 7.5634765625, 8.300048828125, 9.03662109375, 9.773193359375, 10.509765625, 11.246337890625, 11.98291015625, 12.719482421875, 13.4560546875, 14.192626953125, 14.92919921875, 15.665771484375, 16.40234375, 17.138916015625, 17.87548828125, 18.612060546875, 19.3486328125, 20.085205078125, 20.82177734375, 21.558349609375, 22.294921875, 23.031494140625, 23.76806640625, 24.504638671875, 25.2412109375, 25.977783203125, 26.71435546875, 27.450927734375, 28.1875]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 8.0, 3.0, 4.0, 5.0, 10.0, 7.0, 16.0, 14.0, 20.0, 26.0, 32.0, 40.0, 51.0, 74.0, 93.0, 177.0, 239.0, 435.0, 879.0, 3144.0, 2950346.0, 186506.0, 1817.0, 653.0, 339.0, 209.0, 157.0, 86.0, 71.0, 56.0, 43.0, 32.0, 25.0, 20.0, 13.0, 9.0, 12.0, 6.0, 10.0, 5.0, 7.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-64.625, -62.595703125, -60.56640625, -58.537109375, -56.5078125, -54.478515625, -52.44921875, -50.419921875, -48.390625, -46.361328125, -44.33203125, -42.302734375, -40.2734375, -38.244140625, -36.21484375, -34.185546875, -32.15625, -30.126953125, -28.09765625, -26.068359375, -24.0390625, -22.009765625, -19.98046875, -17.951171875, -15.921875, -13.892578125, -11.86328125, -9.833984375, -7.8046875, -5.775390625, -3.74609375, -1.716796875, 0.3125, 2.341796875, 4.37109375, 6.400390625, 8.4296875, 10.458984375, 12.48828125, 14.517578125, 16.546875, 18.576171875, 20.60546875, 22.634765625, 24.6640625, 26.693359375, 28.72265625, 30.751953125, 32.78125, 34.810546875, 36.83984375, 38.869140625, 40.8984375, 42.927734375, 44.95703125, 46.986328125, 49.015625, 51.044921875, 53.07421875, 55.103515625, 57.1328125, 59.162109375, 61.19140625, 63.220703125, 65.25]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 20.0, 511.0, 468.0, 14.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-150.58877563476562, -142.6553955078125, -134.72203063964844, -126.78865051269531, -118.85527801513672, -110.92190551757812, -102.988525390625, -95.0551528930664, -87.12178039550781, -79.18840789794922, -71.25503540039062, -63.3216552734375, -55.388282775878906, -47.45491027832031, -39.52153396606445, -31.588157653808594, -23.65478515625, -15.721410751342773, -7.788036346435547, 0.1453380584716797, 8.078712463378906, 16.0120849609375, 23.94546127319336, 31.87883758544922, 39.81221008300781, 47.745582580566406, 55.678958892822266, 63.612335205078125, 71.54570770263672, 79.47908020019531, 87.41246032714844, 95.34583282470703, 103.27920532226562, 111.21257781982422, 119.14595031738281, 127.07933044433594, 135.0126953125, 142.94607543945312, 150.87945556640625, 158.81283569335938, 166.74620056152344, 174.67958068847656, 182.61294555664062, 190.54632568359375, 198.47970581054688, 206.41307067871094, 214.34645080566406, 222.27981567382812, 230.21319580078125, 238.14657592773438, 246.07994079589844, 254.01332092285156, 261.9466857910156, 269.88006591796875, 277.8134460449219, 285.746826171875, 293.68017578125, 301.6135559082031, 309.54693603515625, 317.48028564453125, 325.4136657714844, 333.3470458984375, 341.2804260253906, 349.21380615234375, 357.1471862792969]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 7.0, 2.0, 6.0, 3.0, 8.0, 2.0, 5.0, 6.0, 7.0, 8.0, 6.0, 17.0, 9.0, 19.0, 22.0, 29.0, 17.0, 17.0, 29.0, 25.0, 35.0, 43.0, 35.0, 33.0, 31.0, 43.0, 47.0, 39.0, 49.0, 33.0, 37.0, 38.0, 30.0, 27.0, 39.0, 29.0, 19.0, 19.0, 26.0, 25.0, 14.0, 12.0, 14.0, 14.0, 7.0, 6.0, 1.0, 11.0, 2.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-50.74373245239258, -49.099422454833984, -47.45511245727539, -45.8108024597168, -44.1664924621582, -42.52218246459961, -40.87786865234375, -39.233558654785156, -37.58924865722656, -35.94493865966797, -34.300628662109375, -32.65631866455078, -31.012008666992188, -29.367698669433594, -27.723386764526367, -26.079076766967773, -24.434768676757812, -22.79045867919922, -21.146148681640625, -19.50183868408203, -17.857528686523438, -16.213218688964844, -14.568906784057617, -12.924596786499023, -11.28028678894043, -9.635976791381836, -7.991666316986084, -6.347355842590332, -4.703045845031738, -3.0587358474731445, -1.4144248962402344, 0.22988510131835938, 1.8741989135742188, 3.5185091495513916, 5.1628193855285645, 6.807129859924316, 8.45143985748291, 10.095749855041504, 11.740060806274414, 13.384370803833008, 15.028680801391602, 16.672990798950195, 18.31730079650879, 19.961612701416016, 21.60592269897461, 23.250232696533203, 24.894542694091797, 26.53885269165039, 28.183162689208984, 29.827472686767578, 31.471782684326172, 33.116092681884766, 34.76040267944336, 36.40471267700195, 38.04902648925781, 39.693336486816406, 41.337646484375, 42.981956481933594, 44.62626647949219, 46.27057647705078, 47.914886474609375, 49.55919647216797, 51.20350646972656, 52.847816467285156, 54.49212646484375]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 2.0, 1.0, 4.0, 4.0, 4.0, 3.0, 6.0, 10.0, 10.0, 13.0, 9.0, 15.0, 16.0, 24.0, 31.0, 25.0, 35.0, 37.0, 34.0, 30.0, 34.0, 43.0, 39.0, 40.0, 44.0, 44.0, 46.0, 43.0, 30.0, 36.0, 33.0, 35.0, 34.0, 28.0, 28.0, 18.0, 18.0, 16.0, 24.0, 12.0, 11.0, 13.0, 6.0, 5.0, 0.0, 6.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-7.8671875, -7.6116943359375, -7.356201171875, -7.1007080078125, -6.84521484375, -6.5897216796875, -6.334228515625, -6.0787353515625, -5.8232421875, -5.5677490234375, -5.312255859375, -5.0567626953125, -4.80126953125, -4.5457763671875, -4.290283203125, -4.0347900390625, -3.779296875, -3.5238037109375, -3.268310546875, -3.0128173828125, -2.75732421875, -2.5018310546875, -2.246337890625, -1.9908447265625, -1.7353515625, -1.4798583984375, -1.224365234375, -0.9688720703125, -0.71337890625, -0.4578857421875, -0.202392578125, 0.0531005859375, 0.30859375, 0.5640869140625, 0.819580078125, 1.0750732421875, 1.33056640625, 1.5860595703125, 1.841552734375, 2.0970458984375, 2.3525390625, 2.6080322265625, 2.863525390625, 3.1190185546875, 3.37451171875, 3.6300048828125, 3.885498046875, 4.1409912109375, 4.396484375, 4.6519775390625, 4.907470703125, 5.1629638671875, 5.41845703125, 5.6739501953125, 5.929443359375, 6.1849365234375, 6.4404296875, 6.6959228515625, 6.951416015625, 7.2069091796875, 7.46240234375, 7.7178955078125, 7.973388671875, 8.2288818359375, 8.484375]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 6.0, 4.0, 9.0, 6.0, 19.0, 20.0, 19.0, 28.0, 31.0, 61.0, 75.0, 95.0, 113.0, 199.0, 282.0, 410.0, 799.0, 1597.0, 4064.0, 15708.0, 115645.0, 1127391.0, 2446965.0, 424266.0, 42893.0, 8102.0, 2574.0, 1117.0, 581.0, 382.0, 225.0, 162.0, 104.0, 95.0, 64.0, 43.0, 38.0, 24.0, 23.0, 16.0, 5.0, 9.0, 7.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 3.0], "bins": [-19.75, -19.20556640625, -18.6611328125, -18.11669921875, -17.572265625, -17.02783203125, -16.4833984375, -15.93896484375, -15.39453125, -14.85009765625, -14.3056640625, -13.76123046875, -13.216796875, -12.67236328125, -12.1279296875, -11.58349609375, -11.0390625, -10.49462890625, -9.9501953125, -9.40576171875, -8.861328125, -8.31689453125, -7.7724609375, -7.22802734375, -6.68359375, -6.13916015625, -5.5947265625, -5.05029296875, -4.505859375, -3.96142578125, -3.4169921875, -2.87255859375, -2.328125, -1.78369140625, -1.2392578125, -0.69482421875, -0.150390625, 0.39404296875, 0.9384765625, 1.48291015625, 2.02734375, 2.57177734375, 3.1162109375, 3.66064453125, 4.205078125, 4.74951171875, 5.2939453125, 5.83837890625, 6.3828125, 6.92724609375, 7.4716796875, 8.01611328125, 8.560546875, 9.10498046875, 9.6494140625, 10.19384765625, 10.73828125, 11.28271484375, 11.8271484375, 12.37158203125, 12.916015625, 13.46044921875, 14.0048828125, 14.54931640625, 15.09375]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 1.0, 5.0, 3.0, 7.0, 10.0, 13.0, 16.0, 33.0, 26.0, 42.0, 55.0, 79.0, 99.0, 113.0, 171.0, 184.0, 295.0, 395.0, 481.0, 538.0, 396.0, 283.0, 177.0, 144.0, 109.0, 96.0, 72.0, 64.0, 44.0, 39.0, 22.0, 12.0, 18.0, 12.0, 9.0, 5.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.75, -12.29541015625, -11.8408203125, -11.38623046875, -10.931640625, -10.47705078125, -10.0224609375, -9.56787109375, -9.11328125, -8.65869140625, -8.2041015625, -7.74951171875, -7.294921875, -6.84033203125, -6.3857421875, -5.93115234375, -5.4765625, -5.02197265625, -4.5673828125, -4.11279296875, -3.658203125, -3.20361328125, -2.7490234375, -2.29443359375, -1.83984375, -1.38525390625, -0.9306640625, -0.47607421875, -0.021484375, 0.43310546875, 0.8876953125, 1.34228515625, 1.796875, 2.25146484375, 2.7060546875, 3.16064453125, 3.615234375, 4.06982421875, 4.5244140625, 4.97900390625, 5.43359375, 5.88818359375, 6.3427734375, 6.79736328125, 7.251953125, 7.70654296875, 8.1611328125, 8.61572265625, 9.0703125, 9.52490234375, 9.9794921875, 10.43408203125, 10.888671875, 11.34326171875, 11.7978515625, 12.25244140625, 12.70703125, 13.16162109375, 13.6162109375, 14.07080078125, 14.525390625, 14.97998046875, 15.4345703125, 15.88916015625, 16.34375]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 5.0, 10.0, 32.0, 32.0, 57.0, 137.0, 300.0, 779.0, 2824.0, 37355.0, 3735650.0, 407688.0, 7108.0, 1399.0, 482.0, 210.0, 98.0, 51.0, 27.0, 12.0, 7.0, 11.0, 6.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-59.78125, -58.197265625, -56.61328125, -55.029296875, -53.4453125, -51.861328125, -50.27734375, -48.693359375, -47.109375, -45.525390625, -43.94140625, -42.357421875, -40.7734375, -39.189453125, -37.60546875, -36.021484375, -34.4375, -32.853515625, -31.26953125, -29.685546875, -28.1015625, -26.517578125, -24.93359375, -23.349609375, -21.765625, -20.181640625, -18.59765625, -17.013671875, -15.4296875, -13.845703125, -12.26171875, -10.677734375, -9.09375, -7.509765625, -5.92578125, -4.341796875, -2.7578125, -1.173828125, 0.41015625, 1.994140625, 3.578125, 5.162109375, 6.74609375, 8.330078125, 9.9140625, 11.498046875, 13.08203125, 14.666015625, 16.25, 17.833984375, 19.41796875, 21.001953125, 22.5859375, 24.169921875, 25.75390625, 27.337890625, 28.921875, 30.505859375, 32.08984375, 33.673828125, 35.2578125, 36.841796875, 38.42578125, 40.009765625, 41.59375]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 3.0, 622.0, 390.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-202.78530883789062, -173.51446533203125, -144.2436065673828, -114.9727554321289, -85.701904296875, -56.431060791015625, -27.160202026367188, 2.11065673828125, 31.381500244140625, 60.65235137939453, 89.92320251464844, 119.19405364990234, 148.46490478515625, 177.73574829101562, 207.00660705566406, 236.2774658203125, 265.5483093261719, 294.81915283203125, 324.09002685546875, 353.3608703613281, 382.6317138671875, 411.9025573730469, 441.17340087890625, 470.44427490234375, 499.7151184082031, 528.9859619140625, 558.2568359375, 587.5276489257812, 616.7985229492188, 646.0693359375, 675.3402099609375, 704.611083984375, 733.8819580078125, 763.15283203125, 792.4236450195312, 821.6945190429688, 850.96533203125, 880.2362060546875, 909.507080078125, 938.7779541015625, 968.0487670898438, 997.3196411132812, 1026.5904541015625, 1055.861328125, 1085.1322021484375, 1114.403076171875, 1143.673828125, 1172.9447021484375, 1202.215576171875, 1231.4864501953125, 1260.75732421875, 1290.028076171875, 1319.2989501953125, 1348.56982421875, 1377.8406982421875, 1407.111572265625, 1436.38232421875, 1465.6531982421875, 1494.924072265625, 1524.19482421875, 1553.4656982421875, 1582.736572265625, 1612.0074462890625, 1641.2783203125, 1670.5491943359375]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 6.0, 9.0, 12.0, 14.0, 6.0, 15.0, 27.0, 24.0, 43.0, 36.0, 45.0, 53.0, 63.0, 59.0, 73.0, 63.0, 74.0, 67.0, 69.0, 45.0, 42.0, 38.0, 35.0, 28.0, 18.0, 18.0, 6.0, 10.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-104.1339111328125, -101.5208740234375, -98.9078369140625, -96.2947998046875, -93.68177032470703, -91.06873321533203, -88.45569610595703, -85.84265899658203, -83.22962188720703, -80.61658477783203, -78.00354766845703, -75.39051818847656, -72.77748107910156, -70.16444396972656, -67.55140686035156, -64.93836975097656, -62.32533645629883, -59.71229934692383, -57.099266052246094, -54.486228942871094, -51.873191833496094, -49.260154724121094, -46.64712142944336, -44.03408432006836, -41.421051025390625, -38.808013916015625, -36.19498062133789, -33.58194351196289, -30.96890640258789, -28.355871200561523, -25.742835998535156, -23.129798889160156, -20.516761779785156, -17.90372657775879, -15.290689468383789, -12.677654266357422, -10.064618110656738, -7.451581954956055, -4.8385467529296875, -2.2255096435546875, 0.3875255584716797, 3.000561475753784, 5.613597393035889, 8.226633071899414, 10.839669227600098, 13.452705383300781, 16.06574058532715, 18.67877769470215, 21.291812896728516, 23.904848098754883, 26.517885208129883, 29.13092041015625, 31.74395751953125, 34.35699462890625, 36.970027923583984, 39.583065032958984, 42.19609832763672, 44.80913543701172, 47.42216873168945, 50.03520584106445, 52.64824295043945, 55.26127624511719, 57.87431335449219, 60.48735046386719, 63.10038757324219]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 1.0, 7.0, 5.0, 11.0, 12.0, 12.0, 12.0, 18.0, 14.0, 21.0, 21.0, 28.0, 26.0, 40.0, 31.0, 30.0, 48.0, 40.0, 42.0, 39.0, 37.0, 34.0, 49.0, 36.0, 45.0, 38.0, 35.0, 29.0, 34.0, 34.0, 25.0, 18.0, 21.0, 24.0, 16.0, 16.0, 10.0, 12.0, 6.0, 5.0, 10.0, 3.0, 6.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.71484375, -6.511962890625, -6.30908203125, -6.106201171875, -5.9033203125, -5.700439453125, -5.49755859375, -5.294677734375, -5.091796875, -4.888916015625, -4.68603515625, -4.483154296875, -4.2802734375, -4.077392578125, -3.87451171875, -3.671630859375, -3.46875, -3.265869140625, -3.06298828125, -2.860107421875, -2.6572265625, -2.454345703125, -2.25146484375, -2.048583984375, -1.845703125, -1.642822265625, -1.43994140625, -1.237060546875, -1.0341796875, -0.831298828125, -0.62841796875, -0.425537109375, -0.22265625, -0.019775390625, 0.18310546875, 0.385986328125, 0.5888671875, 0.791748046875, 0.99462890625, 1.197509765625, 1.400390625, 1.603271484375, 1.80615234375, 2.009033203125, 2.2119140625, 2.414794921875, 2.61767578125, 2.820556640625, 3.0234375, 3.226318359375, 3.42919921875, 3.632080078125, 3.8349609375, 4.037841796875, 4.24072265625, 4.443603515625, 4.646484375, 4.849365234375, 5.05224609375, 5.255126953125, 5.4580078125, 5.660888671875, 5.86376953125, 6.066650390625, 6.26953125]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 5.0, 6.0, 11.0, 17.0, 24.0, 32.0, 47.0, 56.0, 86.0, 99.0, 154.0, 194.0, 267.0, 396.0, 547.0, 742.0, 1071.0, 1499.0, 2202.0, 3214.0, 4439.0, 6701.0, 9730.0, 14893.0, 23005.0, 35586.0, 56628.0, 89718.0, 137319.0, 174507.0, 161472.0, 115445.0, 74067.0, 46677.0, 29179.0, 19043.0, 12535.0, 8514.0, 5563.0, 3842.0, 2591.0, 1834.0, 1343.0, 912.0, 671.0, 465.0, 362.0, 251.0, 167.0, 124.0, 80.0, 70.0, 52.0, 43.0, 16.0, 21.0, 15.0, 6.0, 6.0, 3.0, 4.0, 3.0, 2.0], "bins": [-0.5263671875, -0.5092697143554688, -0.4921722412109375, -0.47507476806640625, -0.457977294921875, -0.44087982177734375, -0.4237823486328125, -0.40668487548828125, -0.38958740234375, -0.37248992919921875, -0.3553924560546875, -0.33829498291015625, -0.321197509765625, -0.30410003662109375, -0.2870025634765625, -0.26990509033203125, -0.2528076171875, -0.23571014404296875, -0.2186126708984375, -0.20151519775390625, -0.184417724609375, -0.16732025146484375, -0.1502227783203125, -0.13312530517578125, -0.11602783203125, -0.09893035888671875, -0.0818328857421875, -0.06473541259765625, -0.047637939453125, -0.03054046630859375, -0.0134429931640625, 0.00365447998046875, 0.020751953125, 0.03784942626953125, 0.0549468994140625, 0.07204437255859375, 0.089141845703125, 0.10623931884765625, 0.1233367919921875, 0.14043426513671875, 0.15753173828125, 0.17462921142578125, 0.1917266845703125, 0.20882415771484375, 0.225921630859375, 0.24301910400390625, 0.2601165771484375, 0.27721405029296875, 0.2943115234375, 0.31140899658203125, 0.3285064697265625, 0.34560394287109375, 0.362701416015625, 0.37979888916015625, 0.3968963623046875, 0.41399383544921875, 0.43109130859375, 0.44818878173828125, 0.4652862548828125, 0.48238372802734375, 0.499481201171875, 0.5165786743164062, 0.5336761474609375, 0.5507736206054688, 0.56787109375]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 2.0, 1.0, 4.0, 5.0, 7.0, 14.0, 8.0, 6.0, 11.0, 16.0, 10.0, 27.0, 22.0, 21.0, 20.0, 27.0, 28.0, 27.0, 34.0, 40.0, 40.0, 34.0, 39.0, 40.0, 1068.0, 34.0, 43.0, 47.0, 32.0, 34.0, 27.0, 38.0, 23.0, 35.0, 27.0, 22.0, 21.0, 22.0, 10.0, 14.0, 11.0, 5.0, 8.0, 5.0, 6.0, 6.0, 6.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.015625, -3.890472412109375, -3.76531982421875, -3.640167236328125, -3.5150146484375, -3.389862060546875, -3.26470947265625, -3.139556884765625, -3.014404296875, -2.889251708984375, -2.76409912109375, -2.638946533203125, -2.5137939453125, -2.388641357421875, -2.26348876953125, -2.138336181640625, -2.01318359375, -1.888031005859375, -1.76287841796875, -1.637725830078125, -1.5125732421875, -1.387420654296875, -1.26226806640625, -1.137115478515625, -1.011962890625, -0.886810302734375, -0.76165771484375, -0.636505126953125, -0.5113525390625, -0.386199951171875, -0.26104736328125, -0.135894775390625, -0.0107421875, 0.114410400390625, 0.23956298828125, 0.364715576171875, 0.4898681640625, 0.615020751953125, 0.74017333984375, 0.865325927734375, 0.990478515625, 1.115631103515625, 1.24078369140625, 1.365936279296875, 1.4910888671875, 1.616241455078125, 1.74139404296875, 1.866546630859375, 1.99169921875, 2.116851806640625, 2.24200439453125, 2.367156982421875, 2.4923095703125, 2.617462158203125, 2.74261474609375, 2.867767333984375, 2.992919921875, 3.118072509765625, 3.24322509765625, 3.368377685546875, 3.4935302734375, 3.618682861328125, 3.74383544921875, 3.868988037109375, 3.994140625]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 14.0, 13.0, 21.0, 33.0, 32.0, 64.0, 124.0, 141.0, 244.0, 407.0, 627.0, 983.0, 1481.0, 2572.0, 3743.0, 6279.0, 9908.0, 15953.0, 27132.0, 45483.0, 77539.0, 126638.0, 182235.0, 1233944.0, 141830.0, 88394.0, 52548.0, 30881.0, 18104.0, 11243.0, 6897.0, 4294.0, 2668.0, 1668.0, 1045.0, 684.0, 444.0, 280.0, 178.0, 111.0, 97.0, 56.0, 38.0, 24.0, 15.0, 8.0, 8.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.54443359375, -0.5274887084960938, -0.5105438232421875, -0.49359893798828125, -0.476654052734375, -0.45970916748046875, -0.4427642822265625, -0.42581939697265625, -0.40887451171875, -0.39192962646484375, -0.3749847412109375, -0.35803985595703125, -0.341094970703125, -0.32415008544921875, -0.3072052001953125, -0.29026031494140625, -0.2733154296875, -0.25637054443359375, -0.2394256591796875, -0.22248077392578125, -0.205535888671875, -0.18859100341796875, -0.1716461181640625, -0.15470123291015625, -0.13775634765625, -0.12081146240234375, -0.1038665771484375, -0.08692169189453125, -0.069976806640625, -0.05303192138671875, -0.0360870361328125, -0.01914215087890625, -0.002197265625, 0.01474761962890625, 0.0316925048828125, 0.04863739013671875, 0.065582275390625, 0.08252716064453125, 0.0994720458984375, 0.11641693115234375, 0.13336181640625, 0.15030670166015625, 0.1672515869140625, 0.18419647216796875, 0.201141357421875, 0.21808624267578125, 0.2350311279296875, 0.25197601318359375, 0.2689208984375, 0.28586578369140625, 0.3028106689453125, 0.31975555419921875, 0.336700439453125, 0.35364532470703125, 0.3705902099609375, 0.38753509521484375, 0.40447998046875, 0.42142486572265625, 0.4383697509765625, 0.45531463623046875, 0.472259521484375, 0.48920440673828125, 0.5061492919921875, 0.5230941772460938, 0.5400390625]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 5.0, 7.0, 6.0, 7.0, 5.0, 12.0, 16.0, 11.0, 19.0, 26.0, 26.0, 31.0, 42.0, 39.0, 40.0, 60.0, 52.0, 54.0, 52.0, 50.0, 55.0, 39.0, 50.0, 37.0, 53.0, 36.0, 22.0, 27.0, 23.0, 13.0, 11.0, 14.0, 13.0, 9.0, 10.0, 5.0, 7.0, 11.0, 4.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.002277374267578125, -0.0022150129079818726, -0.00215265154838562, -0.0020902901887893677, -0.0020279288291931152, -0.001965567469596863, -0.0019032061100006104, -0.001840844750404358, -0.0017784833908081055, -0.001716122031211853, -0.0016537606716156006, -0.0015913993120193481, -0.0015290379524230957, -0.0014666765928268433, -0.0014043152332305908, -0.0013419538736343384, -0.001279592514038086, -0.0012172311544418335, -0.001154869794845581, -0.0010925084352493286, -0.0010301470756530762, -0.0009677857160568237, -0.0009054243564605713, -0.0008430629968643188, -0.0007807016372680664, -0.000718340277671814, -0.0006559789180755615, -0.0005936175584793091, -0.0005312561988830566, -0.0004688948392868042, -0.00040653347969055176, -0.0003441721200942993, -0.0002818107604980469, -0.00021944940090179443, -0.000157088041305542, -9.472668170928955e-05, -3.236532211303711e-05, 2.9996037483215332e-05, 9.235739707946777e-05, 0.00015471875667572021, 0.00021708011627197266, 0.0002794414758682251, 0.00034180283546447754, 0.00040416419506073, 0.0004665255546569824, 0.0005288869142532349, 0.0005912482738494873, 0.0006536096334457397, 0.0007159709930419922, 0.0007783323526382446, 0.0008406937122344971, 0.0009030550718307495, 0.000965416431427002, 0.0010277777910232544, 0.0010901391506195068, 0.0011525005102157593, 0.0012148618698120117, 0.0012772232294082642, 0.0013395845890045166, 0.001401945948600769, 0.0014643073081970215, 0.001526668667793274, 0.0015890300273895264, 0.0016513913869857788, 0.0017137527465820312]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 13.0, 6.0, 11.0, 15.0, 11.0, 17.0, 15.0, 20.0, 35.0, 34.0, 26.0, 41.0, 55.0, 59.0, 103.0, 160.0, 232.0, 328.0, 576.0, 1257.0, 124462.0, 915796.0, 3043.0, 730.0, 425.0, 279.0, 200.0, 134.0, 104.0, 81.0, 50.0, 55.0, 40.0, 27.0, 22.0, 22.0, 15.0, 10.0, 8.0, 19.0, 10.0, 7.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03265380859375, -0.03149557113647461, -0.03033733367919922, -0.029179096221923828, -0.028020858764648438, -0.026862621307373047, -0.025704383850097656, -0.024546146392822266, -0.023387908935546875, -0.022229671478271484, -0.021071434020996094, -0.019913196563720703, -0.018754959106445312, -0.017596721649169922, -0.01643848419189453, -0.01528024673461914, -0.01412200927734375, -0.01296377182006836, -0.011805534362792969, -0.010647296905517578, -0.009489059448242188, -0.008330821990966797, -0.007172584533691406, -0.006014347076416016, -0.004856109619140625, -0.0036978721618652344, -0.0025396347045898438, -0.0013813972473144531, -0.0002231597900390625, 0.0009350776672363281, 0.0020933151245117188, 0.0032515525817871094, 0.0044097900390625, 0.005568027496337891, 0.006726264953613281, 0.007884502410888672, 0.009042739868164062, 0.010200977325439453, 0.011359214782714844, 0.012517452239990234, 0.013675689697265625, 0.014833927154541016, 0.015992164611816406, 0.017150402069091797, 0.018308639526367188, 0.019466876983642578, 0.02062511444091797, 0.02178335189819336, 0.02294158935546875, 0.02409982681274414, 0.02525806427001953, 0.026416301727294922, 0.027574539184570312, 0.028732776641845703, 0.029891014099121094, 0.031049251556396484, 0.032207489013671875, 0.033365726470947266, 0.034523963928222656, 0.03568220138549805, 0.03684043884277344, 0.03799867630004883, 0.03915691375732422, 0.04031515121459961, 0.041473388671875]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 36.0, 491.0, 463.0, 26.0, 0.0, 2.0], "bins": [-0.016192831099033356, -0.01592288166284561, -0.015652932226657867, -0.015382983721792698, -0.015113034285604954, -0.01484308484941721, -0.01457313634455204, -0.014303186908364296, -0.014033237472176552, -0.013763288035988808, -0.013493339531123638, -0.013223390094935894, -0.01295344065874815, -0.012683491222560406, -0.012413542717695236, -0.012143593281507492, -0.011873643845319748, -0.011603694409132004, -0.011333745904266834, -0.01106379646807909, -0.010793847031891346, -0.010523897595703602, -0.010253949090838432, -0.009983999654650688, -0.009714051149785519, -0.009444101713597775, -0.009174153208732605, -0.00890420377254486, -0.008634254336357117, -0.008364304900169373, -0.008094356395304203, -0.007824406959116459, -0.007554457522928715, -0.007284508552402258, -0.007014559116214514, -0.006744610145688057, -0.006474660709500313, -0.006204711738973856, -0.005934762768447399, -0.005664813332259655, -0.005394863896071911, -0.005124914925545454, -0.00485496548935771, -0.004585016518831253, -0.004315067082643509, -0.004045118112117052, -0.0037751689087599516, -0.003505219705402851, -0.0032352707348763943, -0.002965321531519294, -0.0026953723281621933, -0.0024254233576357365, -0.0021554739214479923, -0.0018855248345062137, -0.001615575747564435, -0.0013456265442073345, -0.0010756772244349122, -0.0008057280210778117, -0.0005357788759283721, -0.00026582973077893257, 4.119472578167915e-06, 0.0002740686759352684, 0.0005440177628770471, 0.0008139669662341475, 0.001083916169591248]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 1.0, 4.0, 3.0, 4.0, 7.0, 5.0, 12.0, 17.0, 18.0, 22.0, 23.0, 24.0, 26.0, 20.0, 34.0, 28.0, 40.0, 41.0, 35.0, 38.0, 32.0, 31.0, 34.0, 49.0, 34.0, 43.0, 41.0, 26.0, 36.0, 38.0, 31.0, 25.0, 23.0, 14.0, 15.0, 19.0, 21.0, 15.0, 18.0, 14.0, 6.0, 8.0, 5.0, 7.0, 2.0, 3.0, 1.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009385347366333008, -0.0009065307676792145, -0.0008745267987251282, -0.0008425228297710419, -0.0008105188608169556, -0.0007785148918628693, -0.000746510922908783, -0.0007145069539546967, -0.0006825029850006104, -0.000650499016046524, -0.0006184950470924377, -0.0005864910781383514, -0.0005544871091842651, -0.0005224831402301788, -0.0004904791712760925, -0.0004584752023220062, -0.0004264712333679199, -0.0003944672644138336, -0.0003624632954597473, -0.000330459326505661, -0.0002984553575515747, -0.0002664513885974884, -0.0002344474196434021, -0.0002024434506893158, -0.0001704394817352295, -0.0001384355127811432, -0.00010643154382705688, -7.442757487297058e-05, -4.242360591888428e-05, -1.0419636964797974e-05, 2.158433198928833e-05, 5.3588300943374634e-05, 8.559226989746094e-05, 0.00011759623885154724, 0.00014960020780563354, 0.00018160417675971985, 0.00021360814571380615, 0.00024561211466789246, 0.00027761608362197876, 0.00030962005257606506, 0.00034162402153015137, 0.00037362799048423767, 0.000405631959438324, 0.0004376359283924103, 0.0004696398973464966, 0.0005016438663005829, 0.0005336478352546692, 0.0005656518042087555, 0.0005976557731628418, 0.0006296597421169281, 0.0006616637110710144, 0.0006936676800251007, 0.000725671648979187, 0.0007576756179332733, 0.0007896795868873596, 0.0008216835558414459, 0.0008536875247955322, 0.0008856914937496185, 0.0009176954627037048, 0.0009496994316577911, 0.0009817034006118774, 0.0010137073695659637, 0.00104571133852005, 0.0010777153074741364, 0.0011097192764282227]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 1.0, 7.0, 5.0, 11.0, 12.0, 12.0, 12.0, 18.0, 14.0, 21.0, 21.0, 28.0, 26.0, 40.0, 31.0, 30.0, 48.0, 40.0, 42.0, 39.0, 37.0, 34.0, 49.0, 36.0, 45.0, 38.0, 35.0, 29.0, 34.0, 34.0, 25.0, 18.0, 21.0, 24.0, 16.0, 16.0, 10.0, 12.0, 6.0, 5.0, 10.0, 3.0, 6.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.71484375, -6.511962890625, -6.30908203125, -6.106201171875, -5.9033203125, -5.700439453125, -5.49755859375, -5.294677734375, -5.091796875, -4.888916015625, -4.68603515625, -4.483154296875, -4.2802734375, -4.077392578125, -3.87451171875, -3.671630859375, -3.46875, -3.265869140625, -3.06298828125, -2.860107421875, -2.6572265625, -2.454345703125, -2.25146484375, -2.048583984375, -1.845703125, -1.642822265625, -1.43994140625, -1.237060546875, -1.0341796875, -0.831298828125, -0.62841796875, -0.425537109375, -0.22265625, -0.019775390625, 0.18310546875, 0.385986328125, 0.5888671875, 0.791748046875, 0.99462890625, 1.197509765625, 1.400390625, 1.603271484375, 1.80615234375, 2.009033203125, 2.2119140625, 2.414794921875, 2.61767578125, 2.820556640625, 3.0234375, 3.226318359375, 3.42919921875, 3.632080078125, 3.8349609375, 4.037841796875, 4.24072265625, 4.443603515625, 4.646484375, 4.849365234375, 5.05224609375, 5.255126953125, 5.4580078125, 5.660888671875, 5.86376953125, 6.066650390625, 6.26953125]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 3.0, 7.0, 8.0, 11.0, 14.0, 13.0, 30.0, 44.0, 77.0, 73.0, 122.0, 147.0, 214.0, 330.0, 433.0, 691.0, 966.0, 1443.0, 2307.0, 4471.0, 12410.0, 85021.0, 693562.0, 209815.0, 22257.0, 5865.0, 2879.0, 1703.0, 1150.0, 719.0, 528.0, 373.0, 269.0, 171.0, 120.0, 89.0, 60.0, 40.0, 38.0, 23.0, 19.0, 18.0, 7.0, 9.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-16.53125, -15.992431640625, -15.45361328125, -14.914794921875, -14.3759765625, -13.837158203125, -13.29833984375, -12.759521484375, -12.220703125, -11.681884765625, -11.14306640625, -10.604248046875, -10.0654296875, -9.526611328125, -8.98779296875, -8.448974609375, -7.91015625, -7.371337890625, -6.83251953125, -6.293701171875, -5.7548828125, -5.216064453125, -4.67724609375, -4.138427734375, -3.599609375, -3.060791015625, -2.52197265625, -1.983154296875, -1.4443359375, -0.905517578125, -0.36669921875, 0.172119140625, 0.7109375, 1.249755859375, 1.78857421875, 2.327392578125, 2.8662109375, 3.405029296875, 3.94384765625, 4.482666015625, 5.021484375, 5.560302734375, 6.09912109375, 6.637939453125, 7.1767578125, 7.715576171875, 8.25439453125, 8.793212890625, 9.33203125, 9.870849609375, 10.40966796875, 10.948486328125, 11.4873046875, 12.026123046875, 12.56494140625, 13.103759765625, 13.642578125, 14.181396484375, 14.72021484375, 15.259033203125, 15.7978515625, 16.336669921875, 16.87548828125, 17.414306640625, 17.953125]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 4.0, 5.0, 2.0, 3.0, 3.0, 4.0, 9.0, 12.0, 7.0, 18.0, 14.0, 11.0, 27.0, 23.0, 39.0, 32.0, 38.0, 45.0, 49.0, 60.0, 68.0, 161.0, 1529.0, 348.0, 130.0, 43.0, 47.0, 54.0, 32.0, 27.0, 38.0, 26.0, 18.0, 20.0, 18.0, 16.0, 13.0, 10.0, 8.0, 7.0, 9.0, 3.0, 4.0, 4.0, 2.0, 3.0, 4.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-16.484375, -15.967041015625, -15.44970703125, -14.932373046875, -14.4150390625, -13.897705078125, -13.38037109375, -12.863037109375, -12.345703125, -11.828369140625, -11.31103515625, -10.793701171875, -10.2763671875, -9.759033203125, -9.24169921875, -8.724365234375, -8.20703125, -7.689697265625, -7.17236328125, -6.655029296875, -6.1376953125, -5.620361328125, -5.10302734375, -4.585693359375, -4.068359375, -3.551025390625, -3.03369140625, -2.516357421875, -1.9990234375, -1.481689453125, -0.96435546875, -0.447021484375, 0.0703125, 0.587646484375, 1.10498046875, 1.622314453125, 2.1396484375, 2.656982421875, 3.17431640625, 3.691650390625, 4.208984375, 4.726318359375, 5.24365234375, 5.760986328125, 6.2783203125, 6.795654296875, 7.31298828125, 7.830322265625, 8.34765625, 8.864990234375, 9.38232421875, 9.899658203125, 10.4169921875, 10.934326171875, 11.45166015625, 11.968994140625, 12.486328125, 13.003662109375, 13.52099609375, 14.038330078125, 14.5556640625, 15.072998046875, 15.59033203125, 16.107666015625, 16.625]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 8.0, 5.0, 11.0, 10.0, 11.0, 12.0, 18.0, 32.0, 34.0, 42.0, 52.0, 75.0, 101.0, 117.0, 193.0, 335.0, 636.0, 1933.0, 327576.0, 2809807.0, 2756.0, 738.0, 371.0, 231.0, 169.0, 95.0, 74.0, 53.0, 43.0, 40.0, 26.0, 27.0, 18.0, 12.0, 10.0, 6.0, 7.0, 5.0, 4.0, 2.0, 7.0, 2.0, 1.0, 2.0, 4.0, 2.0], "bins": [-58.5625, -56.9833984375, -55.404296875, -53.8251953125, -52.24609375, -50.6669921875, -49.087890625, -47.5087890625, -45.9296875, -44.3505859375, -42.771484375, -41.1923828125, -39.61328125, -38.0341796875, -36.455078125, -34.8759765625, -33.296875, -31.7177734375, -30.138671875, -28.5595703125, -26.98046875, -25.4013671875, -23.822265625, -22.2431640625, -20.6640625, -19.0849609375, -17.505859375, -15.9267578125, -14.34765625, -12.7685546875, -11.189453125, -9.6103515625, -8.03125, -6.4521484375, -4.873046875, -3.2939453125, -1.71484375, -0.1357421875, 1.443359375, 3.0224609375, 4.6015625, 6.1806640625, 7.759765625, 9.3388671875, 10.91796875, 12.4970703125, 14.076171875, 15.6552734375, 17.234375, 18.8134765625, 20.392578125, 21.9716796875, 23.55078125, 25.1298828125, 26.708984375, 28.2880859375, 29.8671875, 31.4462890625, 33.025390625, 34.6044921875, 36.18359375, 37.7626953125, 39.341796875, 40.9208984375, 42.5]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 12.0, 109.0, 413.0, 391.0, 85.0, 7.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.259794235229492, -21.80027198791504, -17.340749740600586, -12.881227493286133, -8.42170524597168, -3.9621829986572266, 0.49733924865722656, 4.95686149597168, 9.416383743286133, 13.875905990600586, 18.33542823791504, 22.794950485229492, 27.254472732543945, 31.7139949798584, 36.17351531982422, 40.63304138183594, 45.092559814453125, 49.55208206176758, 54.01160430908203, 58.471126556396484, 62.93064880371094, 67.39016723632812, 71.84969329833984, 76.30921936035156, 80.76873779296875, 85.22825622558594, 89.68778228759766, 94.14730834960938, 98.60682678222656, 103.06634521484375, 107.52587127685547, 111.98539733886719, 116.44491577148438, 120.90443420410156, 125.36396026611328, 129.823486328125, 134.2830047607422, 138.74252319335938, 143.20205688476562, 147.6615753173828, 152.12109375, 156.5806121826172, 161.04013061523438, 165.49966430664062, 169.9591827392578, 174.418701171875, 178.87823486328125, 183.33775329589844, 187.79727172851562, 192.2567901611328, 196.71630859375, 201.17584228515625, 205.63536071777344, 210.09487915039062, 214.55441284179688, 219.01393127441406, 223.47344970703125, 227.93296813964844, 232.39248657226562, 236.85202026367188, 241.31153869628906, 245.77105712890625, 250.2305908203125, 254.6901092529297, 259.1496276855469]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 5.0, 6.0, 4.0, 4.0, 10.0, 4.0, 7.0, 12.0, 12.0, 10.0, 25.0, 19.0, 24.0, 26.0, 24.0, 21.0, 32.0, 43.0, 51.0, 34.0, 25.0, 51.0, 48.0, 49.0, 42.0, 28.0, 37.0, 38.0, 38.0, 42.0, 29.0, 26.0, 27.0, 18.0, 17.0, 25.0, 17.0, 11.0, 9.0, 16.0, 6.0, 11.0, 5.0, 3.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0], "bins": [-50.01952362060547, -48.573570251464844, -47.12761688232422, -45.68166732788086, -44.235713958740234, -42.78976058959961, -41.34381103515625, -39.897857666015625, -38.451904296875, -37.005950927734375, -35.55999755859375, -34.11404800415039, -32.668094635009766, -31.22214126586914, -29.77618980407715, -28.330238342285156, -26.88428497314453, -25.438331604003906, -23.992380142211914, -22.546428680419922, -21.100475311279297, -19.654521942138672, -18.20857048034668, -16.762619018554688, -15.316665649414062, -13.870713233947754, -12.424760818481445, -10.978808403015137, -9.532855987548828, -8.08690357208252, -6.640951156616211, -5.194998741149902, -3.7490463256835938, -2.303093910217285, -0.8571414947509766, 0.588810920715332, 2.0347633361816406, 3.480715751647949, 4.926668167114258, 6.372620582580566, 7.818572998046875, 9.264525413513184, 10.710477828979492, 12.1564302444458, 13.60238265991211, 15.048335075378418, 16.494287490844727, 17.94023895263672, 19.386192321777344, 20.83214569091797, 22.27809715270996, 23.724048614501953, 25.170001983642578, 26.615955352783203, 28.061906814575195, 29.507858276367188, 30.953811645507812, 32.39976501464844, 33.84571838378906, 35.29166793823242, 36.73762130737305, 38.18357467651367, 39.62952423095703, 41.075477600097656, 42.52143096923828]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 4.0, 1.0, 4.0, 5.0, 12.0, 8.0, 11.0, 10.0, 17.0, 19.0, 12.0, 20.0, 20.0, 21.0, 21.0, 21.0, 39.0, 45.0, 36.0, 46.0, 28.0, 45.0, 41.0, 33.0, 30.0, 36.0, 39.0, 50.0, 37.0, 33.0, 25.0, 37.0, 24.0, 33.0, 27.0, 12.0, 11.0, 15.0, 18.0, 15.0, 5.0, 5.0, 11.0, 4.0, 5.0, 5.0, 6.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0], "bins": [-6.921875, -6.72161865234375, -6.5213623046875, -6.32110595703125, -6.120849609375, -5.92059326171875, -5.7203369140625, -5.52008056640625, -5.31982421875, -5.11956787109375, -4.9193115234375, -4.71905517578125, -4.518798828125, -4.31854248046875, -4.1182861328125, -3.91802978515625, -3.7177734375, -3.51751708984375, -3.3172607421875, -3.11700439453125, -2.916748046875, -2.71649169921875, -2.5162353515625, -2.31597900390625, -2.11572265625, -1.91546630859375, -1.7152099609375, -1.51495361328125, -1.314697265625, -1.11444091796875, -0.9141845703125, -0.71392822265625, -0.513671875, -0.31341552734375, -0.1131591796875, 0.08709716796875, 0.287353515625, 0.48760986328125, 0.6878662109375, 0.88812255859375, 1.08837890625, 1.28863525390625, 1.4888916015625, 1.68914794921875, 1.889404296875, 2.08966064453125, 2.2899169921875, 2.49017333984375, 2.6904296875, 2.89068603515625, 3.0909423828125, 3.29119873046875, 3.491455078125, 3.69171142578125, 3.8919677734375, 4.09222412109375, 4.29248046875, 4.49273681640625, 4.6929931640625, 4.89324951171875, 5.093505859375, 5.29376220703125, 5.4940185546875, 5.69427490234375, 5.89453125]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 7.0, 2.0, 1.0, 5.0, 10.0, 13.0, 13.0, 15.0, 26.0, 27.0, 47.0, 63.0, 85.0, 77.0, 146.0, 203.0, 324.0, 493.0, 722.0, 1147.0, 1823.0, 3089.0, 5791.0, 12429.0, 33601.0, 152004.0, 782161.0, 1955151.0, 972645.0, 200345.0, 42421.0, 14149.0, 6216.0, 3404.0, 1954.0, 1275.0, 763.0, 492.0, 345.0, 223.0, 150.0, 115.0, 75.0, 69.0, 44.0, 35.0, 20.0, 19.0, 15.0, 15.0, 5.0, 5.0, 8.0, 9.0, 3.0, 2.0, 3.0, 1.0, 1.0], "bins": [-10.3046875, -9.9884033203125, -9.672119140625, -9.3558349609375, -9.03955078125, -8.7232666015625, -8.406982421875, -8.0906982421875, -7.7744140625, -7.4581298828125, -7.141845703125, -6.8255615234375, -6.50927734375, -6.1929931640625, -5.876708984375, -5.5604248046875, -5.244140625, -4.9278564453125, -4.611572265625, -4.2952880859375, -3.97900390625, -3.6627197265625, -3.346435546875, -3.0301513671875, -2.7138671875, -2.3975830078125, -2.081298828125, -1.7650146484375, -1.44873046875, -1.1324462890625, -0.816162109375, -0.4998779296875, -0.18359375, 0.1326904296875, 0.448974609375, 0.7652587890625, 1.08154296875, 1.3978271484375, 1.714111328125, 2.0303955078125, 2.3466796875, 2.6629638671875, 2.979248046875, 3.2955322265625, 3.61181640625, 3.9281005859375, 4.244384765625, 4.5606689453125, 4.876953125, 5.1932373046875, 5.509521484375, 5.8258056640625, 6.14208984375, 6.4583740234375, 6.774658203125, 7.0909423828125, 7.4072265625, 7.7235107421875, 8.039794921875, 8.3560791015625, 8.67236328125, 8.9886474609375, 9.304931640625, 9.6212158203125, 9.9375]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 11.0, 11.0, 24.0, 37.0, 64.0, 156.0, 297.0, 587.0, 972.0, 905.0, 516.0, 260.0, 123.0, 55.0, 30.0, 13.0, 7.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.0625, -25.2451171875, -24.427734375, -23.6103515625, -22.79296875, -21.9755859375, -21.158203125, -20.3408203125, -19.5234375, -18.7060546875, -17.888671875, -17.0712890625, -16.25390625, -15.4365234375, -14.619140625, -13.8017578125, -12.984375, -12.1669921875, -11.349609375, -10.5322265625, -9.71484375, -8.8974609375, -8.080078125, -7.2626953125, -6.4453125, -5.6279296875, -4.810546875, -3.9931640625, -3.17578125, -2.3583984375, -1.541015625, -0.7236328125, 0.09375, 0.9111328125, 1.728515625, 2.5458984375, 3.36328125, 4.1806640625, 4.998046875, 5.8154296875, 6.6328125, 7.4501953125, 8.267578125, 9.0849609375, 9.90234375, 10.7197265625, 11.537109375, 12.3544921875, 13.171875, 13.9892578125, 14.806640625, 15.6240234375, 16.44140625, 17.2587890625, 18.076171875, 18.8935546875, 19.7109375, 20.5283203125, 21.345703125, 22.1630859375, 22.98046875, 23.7978515625, 24.615234375, 25.4326171875, 26.25]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 2.0, 3.0, 3.0, 1.0, 7.0, 5.0, 12.0, 12.0, 19.0, 38.0, 93.0, 220.0, 601.0, 1585.0, 10874.0, 4021423.0, 154766.0, 2977.0, 922.0, 365.0, 152.0, 84.0, 49.0, 29.0, 11.0, 13.0, 5.0, 6.0, 4.0, 2.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-57.59375, -55.88623046875, -54.1787109375, -52.47119140625, -50.763671875, -49.05615234375, -47.3486328125, -45.64111328125, -43.93359375, -42.22607421875, -40.5185546875, -38.81103515625, -37.103515625, -35.39599609375, -33.6884765625, -31.98095703125, -30.2734375, -28.56591796875, -26.8583984375, -25.15087890625, -23.443359375, -21.73583984375, -20.0283203125, -18.32080078125, -16.61328125, -14.90576171875, -13.1982421875, -11.49072265625, -9.783203125, -8.07568359375, -6.3681640625, -4.66064453125, -2.953125, -1.24560546875, 0.4619140625, 2.16943359375, 3.876953125, 5.58447265625, 7.2919921875, 8.99951171875, 10.70703125, 12.41455078125, 14.1220703125, 15.82958984375, 17.537109375, 19.24462890625, 20.9521484375, 22.65966796875, 24.3671875, 26.07470703125, 27.7822265625, 29.48974609375, 31.197265625, 32.90478515625, 34.6123046875, 36.31982421875, 38.02734375, 39.73486328125, 41.4423828125, 43.14990234375, 44.857421875, 46.56494140625, 48.2724609375, 49.97998046875, 51.6875]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 248.0, 761.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-158.84329223632812, -141.57958984375, -124.31590270996094, -107.05220794677734, -89.78851318359375, -72.52481842041016, -55.26112365722656, -37.99742889404297, -20.733734130859375, -3.4700393676757812, 13.793655395507812, 31.057350158691406, 48.321044921875, 65.5847396850586, 82.84843444824219, 100.11212921142578, 117.37582397460938, 134.6395263671875, 151.90321350097656, 169.16690063476562, 186.43060302734375, 203.69430541992188, 220.95799255371094, 238.2216796875, 255.48538208007812, 272.74908447265625, 290.01275634765625, 307.2764587402344, 324.5401611328125, 341.8038635253906, 359.06756591796875, 376.33123779296875, 393.59490966796875, 410.8586120605469, 428.122314453125, 445.385986328125, 462.6496887207031, 479.91339111328125, 497.17706298828125, 514.4407958984375, 531.7044677734375, 548.9681396484375, 566.2318725585938, 583.4955444335938, 600.75927734375, 618.02294921875, 635.28662109375, 652.5503540039062, 669.8140258789062, 687.0776977539062, 704.3414306640625, 721.6051025390625, 738.8687744140625, 756.1325073242188, 773.3961791992188, 790.659912109375, 807.923583984375, 825.187255859375, 842.4509887695312, 859.7146606445312, 876.9783935546875, 894.2420654296875, 911.5057373046875, 928.7694702148438, 946.0331420898438]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 5.0, 6.0, 3.0, 6.0, 8.0, 6.0, 10.0, 12.0, 11.0, 21.0, 17.0, 12.0, 21.0, 29.0, 24.0, 29.0, 33.0, 36.0, 37.0, 49.0, 33.0, 51.0, 37.0, 35.0, 36.0, 45.0, 36.0, 39.0, 36.0, 34.0, 26.0, 35.0, 24.0, 30.0, 23.0, 25.0, 19.0, 15.0, 11.0, 8.0, 8.0, 6.0, 7.0, 5.0, 1.0, 5.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.69012451171875, -43.33840560913086, -41.98668670654297, -40.634971618652344, -39.28325271606445, -37.93153381347656, -36.57981872558594, -35.22809982299805, -33.876380920410156, -32.524662017822266, -31.172945022583008, -29.82122802734375, -28.46950912475586, -27.11779022216797, -25.76607322692871, -24.414356231689453, -23.062637329101562, -21.710918426513672, -20.359201431274414, -19.007484436035156, -17.655765533447266, -16.304046630859375, -14.952329635620117, -13.600611686706543, -12.248893737792969, -10.897175788879395, -9.54545783996582, -8.193739891052246, -6.842021942138672, -5.490303993225098, -4.138586044311523, -2.786868095397949, -1.435150146484375, -0.08343219757080078, 1.2682857513427734, 2.6200037002563477, 3.971721649169922, 5.323439598083496, 6.67515754699707, 8.026875495910645, 9.378593444824219, 10.730311393737793, 12.082029342651367, 13.433747291564941, 14.785465240478516, 16.137184143066406, 17.488901138305664, 18.840618133544922, 20.192337036132812, 21.544055938720703, 22.89577293395996, 24.24748992919922, 25.59920883178711, 26.950927734375, 28.302644729614258, 29.654361724853516, 31.006080627441406, 32.3577995300293, 33.70951843261719, 35.06123352050781, 36.4129524230957, 37.764671325683594, 39.11638641357422, 40.46810531616211, 41.81982421875]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 4.0, 6.0, 6.0, 9.0, 3.0, 11.0, 8.0, 25.0, 12.0, 20.0, 15.0, 20.0, 26.0, 29.0, 41.0, 28.0, 32.0, 29.0, 37.0, 27.0, 41.0, 29.0, 45.0, 49.0, 45.0, 36.0, 34.0, 36.0, 34.0, 30.0, 31.0, 33.0, 13.0, 19.0, 18.0, 15.0, 9.0, 17.0, 13.0, 9.0, 15.0, 6.0, 6.0, 7.0, 12.0, 3.0, 4.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-5.40625, -5.2362060546875, -5.066162109375, -4.8961181640625, -4.72607421875, -4.5560302734375, -4.385986328125, -4.2159423828125, -4.0458984375, -3.8758544921875, -3.705810546875, -3.5357666015625, -3.36572265625, -3.1956787109375, -3.025634765625, -2.8555908203125, -2.685546875, -2.5155029296875, -2.345458984375, -2.1754150390625, -2.00537109375, -1.8353271484375, -1.665283203125, -1.4952392578125, -1.3251953125, -1.1551513671875, -0.985107421875, -0.8150634765625, -0.64501953125, -0.4749755859375, -0.304931640625, -0.1348876953125, 0.03515625, 0.2052001953125, 0.375244140625, 0.5452880859375, 0.71533203125, 0.8853759765625, 1.055419921875, 1.2254638671875, 1.3955078125, 1.5655517578125, 1.735595703125, 1.9056396484375, 2.07568359375, 2.2457275390625, 2.415771484375, 2.5858154296875, 2.755859375, 2.9259033203125, 3.095947265625, 3.2659912109375, 3.43603515625, 3.6060791015625, 3.776123046875, 3.9461669921875, 4.1162109375, 4.2862548828125, 4.456298828125, 4.6263427734375, 4.79638671875, 4.9664306640625, 5.136474609375, 5.3065185546875, 5.4765625]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 9.0, 6.0, 11.0, 15.0, 33.0, 30.0, 41.0, 61.0, 115.0, 170.0, 239.0, 400.0, 578.0, 900.0, 1358.0, 2117.0, 3295.0, 5113.0, 8323.0, 13398.0, 21888.0, 37478.0, 63684.0, 110468.0, 174195.0, 208413.0, 158255.0, 97483.0, 56017.0, 32654.0, 19347.0, 11969.0, 7364.0, 4706.0, 2996.0, 1933.0, 1226.0, 792.0, 512.0, 295.0, 202.0, 151.0, 104.0, 68.0, 54.0, 31.0, 23.0, 21.0, 10.0, 6.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.5849609375, -0.5674362182617188, -0.5499114990234375, -0.5323867797851562, -0.514862060546875, -0.49733734130859375, -0.4798126220703125, -0.46228790283203125, -0.44476318359375, -0.42723846435546875, -0.4097137451171875, -0.39218902587890625, -0.374664306640625, -0.35713958740234375, -0.3396148681640625, -0.32209014892578125, -0.3045654296875, -0.28704071044921875, -0.2695159912109375, -0.25199127197265625, -0.234466552734375, -0.21694183349609375, -0.1994171142578125, -0.18189239501953125, -0.16436767578125, -0.14684295654296875, -0.1293182373046875, -0.11179351806640625, -0.094268798828125, -0.07674407958984375, -0.0592193603515625, -0.04169464111328125, -0.024169921875, -0.00664520263671875, 0.0108795166015625, 0.02840423583984375, 0.045928955078125, 0.06345367431640625, 0.0809783935546875, 0.09850311279296875, 0.11602783203125, 0.13355255126953125, 0.1510772705078125, 0.16860198974609375, 0.186126708984375, 0.20365142822265625, 0.2211761474609375, 0.23870086669921875, 0.2562255859375, 0.27375030517578125, 0.2912750244140625, 0.30879974365234375, 0.326324462890625, 0.34384918212890625, 0.3613739013671875, 0.37889862060546875, 0.39642333984375, 0.41394805908203125, 0.4314727783203125, 0.44899749755859375, 0.466522216796875, 0.48404693603515625, 0.5015716552734375, 0.5190963745117188, 0.53662109375]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 7.0, 2.0, 5.0, 4.0, 7.0, 11.0, 8.0, 7.0, 20.0, 14.0, 17.0, 23.0, 27.0, 26.0, 38.0, 40.0, 33.0, 37.0, 41.0, 53.0, 37.0, 45.0, 1068.0, 28.0, 43.0, 38.0, 44.0, 46.0, 32.0, 40.0, 35.0, 28.0, 20.0, 21.0, 16.0, 13.0, 12.0, 8.0, 7.0, 8.0, 7.0, 5.0, 3.0, 3.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.873046875, -3.748382568359375, -3.62371826171875, -3.499053955078125, -3.3743896484375, -3.249725341796875, -3.12506103515625, -3.000396728515625, -2.875732421875, -2.751068115234375, -2.62640380859375, -2.501739501953125, -2.3770751953125, -2.252410888671875, -2.12774658203125, -2.003082275390625, -1.87841796875, -1.753753662109375, -1.62908935546875, -1.504425048828125, -1.3797607421875, -1.255096435546875, -1.13043212890625, -1.005767822265625, -0.881103515625, -0.756439208984375, -0.63177490234375, -0.507110595703125, -0.3824462890625, -0.257781982421875, -0.13311767578125, -0.008453369140625, 0.1162109375, 0.240875244140625, 0.36553955078125, 0.490203857421875, 0.6148681640625, 0.739532470703125, 0.86419677734375, 0.988861083984375, 1.113525390625, 1.238189697265625, 1.36285400390625, 1.487518310546875, 1.6121826171875, 1.736846923828125, 1.86151123046875, 1.986175537109375, 2.11083984375, 2.235504150390625, 2.36016845703125, 2.484832763671875, 2.6094970703125, 2.734161376953125, 2.85882568359375, 2.983489990234375, 3.108154296875, 3.232818603515625, 3.35748291015625, 3.482147216796875, 3.6068115234375, 3.731475830078125, 3.85614013671875, 3.980804443359375, 4.10546875]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 7.0, 12.0, 14.0, 29.0, 37.0, 41.0, 92.0, 130.0, 200.0, 307.0, 465.0, 694.0, 1161.0, 1758.0, 2693.0, 4369.0, 6996.0, 11272.0, 18432.0, 29416.0, 48043.0, 80177.0, 126483.0, 175785.0, 1221696.0, 137747.0, 88804.0, 54145.0, 32446.0, 20049.0, 12361.0, 7865.0, 4958.0, 3075.0, 1967.0, 1213.0, 786.0, 502.0, 328.0, 189.0, 130.0, 83.0, 72.0, 40.0, 21.0, 11.0, 14.0, 6.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.4462890625, -0.4323883056640625, -0.418487548828125, -0.4045867919921875, -0.39068603515625, -0.3767852783203125, -0.362884521484375, -0.3489837646484375, -0.3350830078125, -0.3211822509765625, -0.307281494140625, -0.2933807373046875, -0.27947998046875, -0.2655792236328125, -0.251678466796875, -0.2377777099609375, -0.223876953125, -0.2099761962890625, -0.196075439453125, -0.1821746826171875, -0.16827392578125, -0.1543731689453125, -0.140472412109375, -0.1265716552734375, -0.1126708984375, -0.0987701416015625, -0.084869384765625, -0.0709686279296875, -0.05706787109375, -0.0431671142578125, -0.029266357421875, -0.0153656005859375, -0.00146484375, 0.0124359130859375, 0.026336669921875, 0.0402374267578125, 0.05413818359375, 0.0680389404296875, 0.081939697265625, 0.0958404541015625, 0.1097412109375, 0.1236419677734375, 0.137542724609375, 0.1514434814453125, 0.16534423828125, 0.1792449951171875, 0.193145751953125, 0.2070465087890625, 0.220947265625, 0.2348480224609375, 0.248748779296875, 0.2626495361328125, 0.27655029296875, 0.2904510498046875, 0.304351806640625, 0.3182525634765625, 0.3321533203125, 0.3460540771484375, 0.359954833984375, 0.3738555908203125, 0.38775634765625, 0.4016571044921875, 0.415557861328125, 0.4294586181640625, 0.443359375]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 3.0, 5.0, 7.0, 7.0, 9.0, 11.0, 11.0, 11.0, 31.0, 32.0, 32.0, 46.0, 36.0, 43.0, 48.0, 55.0, 64.0, 63.0, 71.0, 66.0, 72.0, 53.0, 36.0, 52.0, 31.0, 25.0, 20.0, 12.0, 17.0, 8.0, 7.0, 7.0, 1.0, 3.0, 4.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001407623291015625, -0.0013539493083953857, -0.0013002753257751465, -0.0012466013431549072, -0.001192927360534668, -0.0011392533779144287, -0.0010855793952941895, -0.0010319054126739502, -0.000978231430053711, -0.0009245574474334717, -0.0008708834648132324, -0.0008172094821929932, -0.0007635354995727539, -0.0007098615169525146, -0.0006561875343322754, -0.0006025135517120361, -0.0005488395690917969, -0.0004951655864715576, -0.00044149160385131836, -0.0003878176212310791, -0.00033414363861083984, -0.0002804696559906006, -0.00022679567337036133, -0.00017312169075012207, -0.00011944770812988281, -6.577372550964355e-05, -1.2099742889404297e-05, 4.157423973083496e-05, 9.524822235107422e-05, 0.00014892220497131348, 0.00020259618759155273, 0.000256270170211792, 0.00030994415283203125, 0.0003636181354522705, 0.00041729211807250977, 0.000470966100692749, 0.0005246400833129883, 0.0005783140659332275, 0.0006319880485534668, 0.0006856620311737061, 0.0007393360137939453, 0.0007930099964141846, 0.0008466839790344238, 0.0009003579616546631, 0.0009540319442749023, 0.0010077059268951416, 0.0010613799095153809, 0.0011150538921356201, 0.0011687278747558594, 0.0012224018573760986, 0.0012760758399963379, 0.0013297498226165771, 0.0013834238052368164, 0.0014370977878570557, 0.001490771770477295, 0.0015444457530975342, 0.0015981197357177734, 0.0016517937183380127, 0.001705467700958252, 0.0017591416835784912, 0.0018128156661987305, 0.0018664896488189697, 0.001920163631439209, 0.0019738376140594482, 0.0020275115966796875]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 3.0, 9.0, 10.0, 11.0, 18.0, 28.0, 19.0, 32.0, 45.0, 78.0, 85.0, 141.0, 180.0, 261.0, 422.0, 763.0, 2438.0, 969733.0, 71455.0, 1133.0, 573.0, 344.0, 195.0, 143.0, 114.0, 94.0, 52.0, 43.0, 26.0, 20.0, 24.0, 16.0, 9.0, 11.0, 5.0, 6.0, 8.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.032440185546875, -0.031450748443603516, -0.03046131134033203, -0.029471874237060547, -0.028482437133789062, -0.027493000030517578, -0.026503562927246094, -0.02551412582397461, -0.024524688720703125, -0.02353525161743164, -0.022545814514160156, -0.021556377410888672, -0.020566940307617188, -0.019577503204345703, -0.01858806610107422, -0.017598628997802734, -0.01660919189453125, -0.015619754791259766, -0.014630317687988281, -0.013640880584716797, -0.012651443481445312, -0.011662006378173828, -0.010672569274902344, -0.00968313217163086, -0.008693695068359375, -0.007704257965087891, -0.006714820861816406, -0.005725383758544922, -0.0047359466552734375, -0.003746509552001953, -0.0027570724487304688, -0.0017676353454589844, -0.0007781982421875, 0.00021123886108398438, 0.0012006759643554688, 0.002190113067626953, 0.0031795501708984375, 0.004168987274169922, 0.005158424377441406, 0.006147861480712891, 0.007137298583984375, 0.00812673568725586, 0.009116172790527344, 0.010105609893798828, 0.011095046997070312, 0.012084484100341797, 0.013073921203613281, 0.014063358306884766, 0.01505279541015625, 0.016042232513427734, 0.01703166961669922, 0.018021106719970703, 0.019010543823242188, 0.019999980926513672, 0.020989418029785156, 0.02197885513305664, 0.022968292236328125, 0.02395772933959961, 0.024947166442871094, 0.025936603546142578, 0.026926040649414062, 0.027915477752685547, 0.02890491485595703, 0.029894351959228516, 0.0308837890625]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 43.0, 382.0, 471.0, 99.0, 15.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0022740066051483154, -0.0021412076894193888, -0.002008408773690462, -0.0018756099743768573, -0.0017428110586479306, -0.001610012142919004, -0.0014772133436053991, -0.0013444144278764725, -0.0012116155121475458, -0.0010788165964186192, -0.0009460177388973534, -0.0008132188813760877, -0.000680419965647161, -0.0005476210499182343, -0.0004148221923969686, -0.00028202333487570286, -0.0001492244191467762, -1.6425532521679997e-05, 0.0001163733541034162, 0.0002491722407285124, 0.0003819711273536086, 0.0005147700430825353, 0.000647568900603801, 0.0007803677581250668, 0.0009131666738539934, 0.00104596558958292, 0.0011787645053118467, 0.0013115633046254516, 0.0014443622203543782, 0.0015771611360833049, 0.0017099599353969097, 0.0018427588511258364, 0.0019755582325160503, 0.002108357148244977, 0.0022411560639739037, 0.0023739549797028303, 0.002506753895431757, 0.00263955257833004, 0.0027723514940589666, 0.0029051504097878933, 0.00303794932551682, 0.0031707482412457466, 0.0033035471569746733, 0.0034363460727036, 0.003569144755601883, 0.0037019439041614532, 0.0038347425870597363, 0.003967541269958019, 0.00410034041851759, 0.004233139101415873, 0.004365938249975443, 0.004498736932873726, 0.004631536081433296, 0.004764334764331579, 0.0048971339128911495, 0.0050299325957894325, 0.005162731744349003, 0.005295530427247286, 0.005428329575806856, 0.005561128258705139, 0.0056939274072647095, 0.0058267260901629925, 0.005959525238722563, 0.006092323921620846, 0.006225122604519129]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 6.0, 3.0, 5.0, 3.0, 12.0, 6.0, 12.0, 16.0, 9.0, 11.0, 17.0, 25.0, 31.0, 22.0, 29.0, 36.0, 43.0, 32.0, 55.0, 51.0, 52.0, 35.0, 43.0, 38.0, 37.0, 38.0, 39.0, 42.0, 29.0, 25.0, 35.0, 28.0, 22.0, 24.0, 17.0, 10.0, 20.0, 15.0, 5.0, 7.0, 6.0, 2.0, 8.0, 4.0, 4.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007557868957519531, -0.0007296176627278328, -0.0007034484297037125, -0.0006772791966795921, -0.0006511099636554718, -0.0006249407306313515, -0.0005987714976072311, -0.0005726022645831108, -0.0005464330315589905, -0.0005202637985348701, -0.0004940945655107498, -0.0004679253324866295, -0.00044175609946250916, -0.0004155868664383888, -0.0003894176334142685, -0.00036324840039014816, -0.00033707916736602783, -0.0003109099343419075, -0.00028474070131778717, -0.00025857146829366684, -0.0002324022352695465, -0.00020623300224542618, -0.00018006376922130585, -0.00015389453619718552, -0.00012772530317306519, -0.00010155607014894485, -7.538683712482452e-05, -4.921760410070419e-05, -2.3048371076583862e-05, 3.1208619475364685e-06, 2.92900949716568e-05, 5.545932799577713e-05, 8.162856101989746e-05, 0.00010779779404401779, 0.00013396702706813812, 0.00016013626009225845, 0.00018630549311637878, 0.00021247472614049911, 0.00023864395916461945, 0.0002648131921887398, 0.0002909824252128601, 0.00031715165823698044, 0.00034332089126110077, 0.0003694901242852211, 0.00039565935730934143, 0.00042182859033346176, 0.0004479978233575821, 0.0004741670563817024, 0.0005003362894058228, 0.0005265055224299431, 0.0005526747554540634, 0.0005788439884781837, 0.0006050132215023041, 0.0006311824545264244, 0.0006573516875505447, 0.0006835209205746651, 0.0007096901535987854, 0.0007358593866229057, 0.0007620286196470261, 0.0007881978526711464, 0.0008143670856952667, 0.0008405363187193871, 0.0008667055517435074, 0.0008928747847676277, 0.000919044017791748]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 4.0, 6.0, 6.0, 9.0, 3.0, 11.0, 8.0, 25.0, 12.0, 20.0, 15.0, 20.0, 26.0, 29.0, 41.0, 28.0, 32.0, 29.0, 37.0, 27.0, 41.0, 29.0, 45.0, 49.0, 45.0, 36.0, 34.0, 36.0, 34.0, 30.0, 31.0, 33.0, 13.0, 19.0, 18.0, 15.0, 9.0, 17.0, 13.0, 9.0, 15.0, 6.0, 6.0, 7.0, 12.0, 3.0, 4.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-5.40625, -5.2362060546875, -5.066162109375, -4.8961181640625, -4.72607421875, -4.5560302734375, -4.385986328125, -4.2159423828125, -4.0458984375, -3.8758544921875, -3.705810546875, -3.5357666015625, -3.36572265625, -3.1956787109375, -3.025634765625, -2.8555908203125, -2.685546875, -2.5155029296875, -2.345458984375, -2.1754150390625, -2.00537109375, -1.8353271484375, -1.665283203125, -1.4952392578125, -1.3251953125, -1.1551513671875, -0.985107421875, -0.8150634765625, -0.64501953125, -0.4749755859375, -0.304931640625, -0.1348876953125, 0.03515625, 0.2052001953125, 0.375244140625, 0.5452880859375, 0.71533203125, 0.8853759765625, 1.055419921875, 1.2254638671875, 1.3955078125, 1.5655517578125, 1.735595703125, 1.9056396484375, 2.07568359375, 2.2457275390625, 2.415771484375, 2.5858154296875, 2.755859375, 2.9259033203125, 3.095947265625, 3.2659912109375, 3.43603515625, 3.6060791015625, 3.776123046875, 3.9461669921875, 4.1162109375, 4.2862548828125, 4.456298828125, 4.6263427734375, 4.79638671875, 4.9664306640625, 5.136474609375, 5.3065185546875, 5.4765625]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 5.0, 11.0, 6.0, 8.0, 17.0, 20.0, 34.0, 38.0, 45.0, 58.0, 76.0, 119.0, 159.0, 226.0, 310.0, 436.0, 627.0, 1045.0, 1920.0, 4107.0, 10885.0, 37425.0, 198397.0, 612174.0, 134753.0, 28763.0, 8710.0, 3527.0, 1708.0, 963.0, 570.0, 362.0, 291.0, 175.0, 142.0, 102.0, 84.0, 58.0, 48.0, 29.0, 31.0, 22.0, 19.0, 18.0, 6.0, 6.0, 11.0, 4.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.8046875, -9.492431640625, -9.18017578125, -8.867919921875, -8.5556640625, -8.243408203125, -7.93115234375, -7.618896484375, -7.306640625, -6.994384765625, -6.68212890625, -6.369873046875, -6.0576171875, -5.745361328125, -5.43310546875, -5.120849609375, -4.80859375, -4.496337890625, -4.18408203125, -3.871826171875, -3.5595703125, -3.247314453125, -2.93505859375, -2.622802734375, -2.310546875, -1.998291015625, -1.68603515625, -1.373779296875, -1.0615234375, -0.749267578125, -0.43701171875, -0.124755859375, 0.1875, 0.499755859375, 0.81201171875, 1.124267578125, 1.4365234375, 1.748779296875, 2.06103515625, 2.373291015625, 2.685546875, 2.997802734375, 3.31005859375, 3.622314453125, 3.9345703125, 4.246826171875, 4.55908203125, 4.871337890625, 5.18359375, 5.495849609375, 5.80810546875, 6.120361328125, 6.4326171875, 6.744873046875, 7.05712890625, 7.369384765625, 7.681640625, 7.993896484375, 8.30615234375, 8.618408203125, 8.9306640625, 9.242919921875, 9.55517578125, 9.867431640625, 10.1796875]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 8.0, 5.0, 4.0, 5.0, 8.0, 13.0, 7.0, 23.0, 12.0, 25.0, 22.0, 35.0, 42.0, 59.0, 58.0, 84.0, 132.0, 457.0, 1483.0, 140.0, 89.0, 66.0, 50.0, 49.0, 31.0, 28.0, 24.0, 20.0, 18.0, 14.0, 9.0, 2.0, 8.0, 7.0, 2.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.515625, -15.904296875, -15.29296875, -14.681640625, -14.0703125, -13.458984375, -12.84765625, -12.236328125, -11.625, -11.013671875, -10.40234375, -9.791015625, -9.1796875, -8.568359375, -7.95703125, -7.345703125, -6.734375, -6.123046875, -5.51171875, -4.900390625, -4.2890625, -3.677734375, -3.06640625, -2.455078125, -1.84375, -1.232421875, -0.62109375, -0.009765625, 0.6015625, 1.212890625, 1.82421875, 2.435546875, 3.046875, 3.658203125, 4.26953125, 4.880859375, 5.4921875, 6.103515625, 6.71484375, 7.326171875, 7.9375, 8.548828125, 9.16015625, 9.771484375, 10.3828125, 10.994140625, 11.60546875, 12.216796875, 12.828125, 13.439453125, 14.05078125, 14.662109375, 15.2734375, 15.884765625, 16.49609375, 17.107421875, 17.71875, 18.330078125, 18.94140625, 19.552734375, 20.1640625, 20.775390625, 21.38671875, 21.998046875, 22.609375]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 5.0, 2.0, 5.0, 3.0, 4.0, 3.0, 9.0, 11.0, 15.0, 24.0, 38.0, 47.0, 78.0, 121.0, 196.0, 421.0, 927.0, 10417.0, 3128370.0, 3429.0, 735.0, 318.0, 167.0, 122.0, 67.0, 57.0, 25.0, 33.0, 8.0, 10.0, 9.0, 3.0, 8.0, 7.0, 5.0, 5.0, 2.0, 3.0, 1.0, 1.0, 3.0, 3.0, 2.0], "bins": [-67.625, -65.90771484375, -64.1904296875, -62.47314453125, -60.755859375, -59.03857421875, -57.3212890625, -55.60400390625, -53.88671875, -52.16943359375, -50.4521484375, -48.73486328125, -47.017578125, -45.30029296875, -43.5830078125, -41.86572265625, -40.1484375, -38.43115234375, -36.7138671875, -34.99658203125, -33.279296875, -31.56201171875, -29.8447265625, -28.12744140625, -26.41015625, -24.69287109375, -22.9755859375, -21.25830078125, -19.541015625, -17.82373046875, -16.1064453125, -14.38916015625, -12.671875, -10.95458984375, -9.2373046875, -7.52001953125, -5.802734375, -4.08544921875, -2.3681640625, -0.65087890625, 1.06640625, 2.78369140625, 4.5009765625, 6.21826171875, 7.935546875, 9.65283203125, 11.3701171875, 13.08740234375, 14.8046875, 16.52197265625, 18.2392578125, 19.95654296875, 21.673828125, 23.39111328125, 25.1083984375, 26.82568359375, 28.54296875, 30.26025390625, 31.9775390625, 33.69482421875, 35.412109375, 37.12939453125, 38.8466796875, 40.56396484375, 42.28125]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 10.0, 284.0, 673.0, 44.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-109.14484405517578, -105.12804412841797, -101.11124420166016, -97.09444427490234, -93.07764434814453, -89.06084442138672, -85.0440444946289, -81.0272445678711, -77.01044464111328, -72.99364471435547, -68.97684478759766, -64.96004486083984, -60.94324493408203, -56.92644500732422, -52.909645080566406, -48.892845153808594, -44.87604522705078, -40.85924530029297, -36.842445373535156, -32.825645446777344, -28.80884552001953, -24.79204559326172, -20.775245666503906, -16.758445739746094, -12.741645812988281, -8.724845886230469, -4.708045959472656, -0.6912460327148438, 3.3255538940429688, 7.342353820800781, 11.359153747558594, 15.375953674316406, 19.392745971679688, 23.4095458984375, 27.426345825195312, 31.443145751953125, 35.45994567871094, 39.47674560546875, 43.49354553222656, 47.510345458984375, 51.52714538574219, 55.5439453125, 59.56074523925781, 63.577545166015625, 67.59434509277344, 71.61114501953125, 75.62794494628906, 79.64474487304688, 83.66154479980469, 87.6783447265625, 91.69514465332031, 95.71194458007812, 99.72874450683594, 103.74554443359375, 107.76234436035156, 111.77914428710938, 115.79594421386719, 119.812744140625, 123.82954406738281, 127.84634399414062, 131.86314392089844, 135.87994384765625, 139.89674377441406, 143.91354370117188, 147.9303436279297]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 5.0, 3.0, 6.0, 6.0, 9.0, 16.0, 5.0, 15.0, 12.0, 27.0, 26.0, 33.0, 35.0, 29.0, 33.0, 27.0, 45.0, 30.0, 39.0, 43.0, 47.0, 54.0, 50.0, 37.0, 33.0, 35.0, 44.0, 28.0, 34.0, 35.0, 24.0, 23.0, 18.0, 20.0, 14.0, 12.0, 11.0, 12.0, 7.0, 6.0, 5.0, 4.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-37.24935531616211, -36.01531219482422, -34.78126525878906, -33.547218322753906, -32.313175201416016, -31.079130172729492, -29.84508514404297, -28.611040115356445, -27.376995086669922, -26.1429500579834, -24.908905029296875, -23.67486000061035, -22.440814971923828, -21.206769943237305, -19.97272491455078, -18.738679885864258, -17.504634857177734, -16.27058982849121, -15.036544799804688, -13.802499771118164, -12.56845474243164, -11.334409713745117, -10.100364685058594, -8.86631965637207, -7.632274627685547, -6.398229598999023, -5.1641845703125, -3.9301395416259766, -2.696094512939453, -1.4620494842529297, -0.22800445556640625, 1.0060405731201172, 2.240081787109375, 3.4741268157958984, 4.708171844482422, 5.942216873168945, 7.176261901855469, 8.410306930541992, 9.644351959228516, 10.878396987915039, 12.112442016601562, 13.346487045288086, 14.58053207397461, 15.814577102661133, 17.048622131347656, 18.28266716003418, 19.516712188720703, 20.750757217407227, 21.98480224609375, 23.218847274780273, 24.452892303466797, 25.68693733215332, 26.920982360839844, 28.155027389526367, 29.38907241821289, 30.623117446899414, 31.857162475585938, 33.091209411621094, 34.325252532958984, 35.559295654296875, 36.79334259033203, 38.02738952636719, 39.26143264770508, 40.49547576904297, 41.729522705078125]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 3.0, 3.0, 9.0, 5.0, 8.0, 13.0, 17.0, 12.0, 16.0, 19.0, 14.0, 25.0, 33.0, 46.0, 46.0, 32.0, 43.0, 34.0, 50.0, 43.0, 41.0, 36.0, 43.0, 45.0, 40.0, 36.0, 28.0, 41.0, 29.0, 29.0, 25.0, 18.0, 17.0, 16.0, 22.0, 12.0, 11.0, 13.0, 11.0, 8.0, 3.0, 4.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.50390625, -7.27618408203125, -7.0484619140625, -6.82073974609375, -6.593017578125, -6.36529541015625, -6.1375732421875, -5.90985107421875, -5.68212890625, -5.45440673828125, -5.2266845703125, -4.99896240234375, -4.771240234375, -4.54351806640625, -4.3157958984375, -4.08807373046875, -3.8603515625, -3.63262939453125, -3.4049072265625, -3.17718505859375, -2.949462890625, -2.72174072265625, -2.4940185546875, -2.26629638671875, -2.03857421875, -1.81085205078125, -1.5831298828125, -1.35540771484375, -1.127685546875, -0.89996337890625, -0.6722412109375, -0.44451904296875, -0.216796875, 0.01092529296875, 0.2386474609375, 0.46636962890625, 0.694091796875, 0.92181396484375, 1.1495361328125, 1.37725830078125, 1.60498046875, 1.83270263671875, 2.0604248046875, 2.28814697265625, 2.515869140625, 2.74359130859375, 2.9713134765625, 3.19903564453125, 3.4267578125, 3.65447998046875, 3.8822021484375, 4.10992431640625, 4.337646484375, 4.56536865234375, 4.7930908203125, 5.02081298828125, 5.24853515625, 5.47625732421875, 5.7039794921875, 5.93170166015625, 6.159423828125, 6.38714599609375, 6.6148681640625, 6.84259033203125, 7.0703125]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 12.0, 13.0, 10.0, 19.0, 17.0, 27.0, 36.0, 45.0, 50.0, 65.0, 74.0, 114.0, 153.0, 158.0, 232.0, 391.0, 506.0, 860.0, 1971.0, 10876.0, 842931.0, 3287922.0, 40930.0, 3484.0, 1079.0, 584.0, 473.0, 295.0, 219.0, 161.0, 132.0, 96.0, 65.0, 58.0, 51.0, 44.0, 26.0, 23.0, 18.0, 17.0, 15.0, 12.0, 2.0, 5.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0], "bins": [-43.25, -42.021484375, -40.79296875, -39.564453125, -38.3359375, -37.107421875, -35.87890625, -34.650390625, -33.421875, -32.193359375, -30.96484375, -29.736328125, -28.5078125, -27.279296875, -26.05078125, -24.822265625, -23.59375, -22.365234375, -21.13671875, -19.908203125, -18.6796875, -17.451171875, -16.22265625, -14.994140625, -13.765625, -12.537109375, -11.30859375, -10.080078125, -8.8515625, -7.623046875, -6.39453125, -5.166015625, -3.9375, -2.708984375, -1.48046875, -0.251953125, 0.9765625, 2.205078125, 3.43359375, 4.662109375, 5.890625, 7.119140625, 8.34765625, 9.576171875, 10.8046875, 12.033203125, 13.26171875, 14.490234375, 15.71875, 16.947265625, 18.17578125, 19.404296875, 20.6328125, 21.861328125, 23.08984375, 24.318359375, 25.546875, 26.775390625, 28.00390625, 29.232421875, 30.4609375, 31.689453125, 32.91796875, 34.146484375, 35.375]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 4.0, 5.0, 7.0, 9.0, 11.0, 13.0, 43.0, 73.0, 111.0, 186.0, 399.0, 705.0, 912.0, 696.0, 410.0, 200.0, 113.0, 69.0, 44.0, 25.0, 16.0, 10.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0546875, -11.4390869140625, -10.823486328125, -10.2078857421875, -9.59228515625, -8.9766845703125, -8.361083984375, -7.7454833984375, -7.1298828125, -6.5142822265625, -5.898681640625, -5.2830810546875, -4.66748046875, -4.0518798828125, -3.436279296875, -2.8206787109375, -2.205078125, -1.5894775390625, -0.973876953125, -0.3582763671875, 0.25732421875, 0.8729248046875, 1.488525390625, 2.1041259765625, 2.7197265625, 3.3353271484375, 3.950927734375, 4.5665283203125, 5.18212890625, 5.7977294921875, 6.413330078125, 7.0289306640625, 7.64453125, 8.2601318359375, 8.875732421875, 9.4913330078125, 10.10693359375, 10.7225341796875, 11.338134765625, 11.9537353515625, 12.5693359375, 13.1849365234375, 13.800537109375, 14.4161376953125, 15.03173828125, 15.6473388671875, 16.262939453125, 16.8785400390625, 17.494140625, 18.1097412109375, 18.725341796875, 19.3409423828125, 19.95654296875, 20.5721435546875, 21.187744140625, 21.8033447265625, 22.4189453125, 23.0345458984375, 23.650146484375, 24.2657470703125, 24.88134765625, 25.4969482421875, 26.112548828125, 26.7281494140625, 27.34375]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 2.0, 4.0, 6.0, 8.0, 11.0, 14.0, 43.0, 131.0, 358.0, 1623.0, 11940.0, 528118.0, 3604638.0, 42888.0, 3452.0, 701.0, 197.0, 72.0, 32.0, 24.0, 8.0, 2.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.5625, -24.548828125, -23.53515625, -22.521484375, -21.5078125, -20.494140625, -19.48046875, -18.466796875, -17.453125, -16.439453125, -15.42578125, -14.412109375, -13.3984375, -12.384765625, -11.37109375, -10.357421875, -9.34375, -8.330078125, -7.31640625, -6.302734375, -5.2890625, -4.275390625, -3.26171875, -2.248046875, -1.234375, -0.220703125, 0.79296875, 1.806640625, 2.8203125, 3.833984375, 4.84765625, 5.861328125, 6.875, 7.888671875, 8.90234375, 9.916015625, 10.9296875, 11.943359375, 12.95703125, 13.970703125, 14.984375, 15.998046875, 17.01171875, 18.025390625, 19.0390625, 20.052734375, 21.06640625, 22.080078125, 23.09375, 24.107421875, 25.12109375, 26.134765625, 27.1484375, 28.162109375, 29.17578125, 30.189453125, 31.203125, 32.216796875, 33.23046875, 34.244140625, 35.2578125, 36.271484375, 37.28515625, 38.298828125, 39.3125]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 6.0, 12.0, 15.0, 29.0, 56.0, 85.0, 121.0, 143.0, 152.0, 120.0, 111.0, 71.0, 42.0, 18.0, 13.0, 5.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.779624938964844, -55.160125732421875, -51.54062271118164, -47.92112350463867, -44.30162048339844, -40.68212127685547, -37.0626220703125, -33.44312286376953, -29.823619842529297, -26.204118728637695, -22.584617614746094, -18.965118408203125, -15.345617294311523, -11.726116180419922, -8.106616973876953, -4.487115859985352, -0.86761474609375, 2.7518858909606934, 6.371386528015137, 9.990886688232422, 13.610387802124023, 17.229888916015625, 20.849388122558594, 24.468889236450195, 28.088390350341797, 31.7078914642334, 35.327392578125, 38.94689178466797, 42.56639099121094, 46.18589401245117, 49.80539321899414, 53.424896240234375, 57.044403076171875, 60.663902282714844, 64.28340148925781, 67.90290832519531, 71.52240753173828, 75.14190673828125, 78.76140594482422, 82.38090515136719, 86.00041198730469, 89.61991119384766, 93.23941040039062, 96.85891723632812, 100.4784164428711, 104.09791564941406, 107.71741485595703, 111.3369140625, 114.95641326904297, 118.57591247558594, 122.1954116821289, 125.81491088867188, 129.43441772460938, 133.05392456054688, 136.6734161376953, 140.2929229736328, 143.91241455078125, 147.53192138671875, 151.1514129638672, 154.7709197998047, 158.39041137695312, 162.00991821289062, 165.62942504882812, 169.24891662597656, 172.86842346191406]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 7.0, 10.0, 16.0, 21.0, 17.0, 30.0, 41.0, 34.0, 41.0, 64.0, 47.0, 56.0, 62.0, 61.0, 67.0, 56.0, 48.0, 55.0, 48.0, 45.0, 40.0, 26.0, 24.0, 16.0, 9.0, 25.0, 10.0, 12.0, 4.0, 6.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-60.016571044921875, -58.14812088012695, -56.27967071533203, -54.41122055053711, -52.54277038574219, -50.67432403564453, -48.805870056152344, -46.93742370605469, -45.068973541259766, -43.200523376464844, -41.33207321166992, -39.463623046875, -37.59517288208008, -35.726722717285156, -33.8582763671875, -31.989826202392578, -30.121374130249023, -28.2529239654541, -26.38447380065918, -24.51602554321289, -22.64757537841797, -20.779125213623047, -18.910675048828125, -17.042224884033203, -15.173775672912598, -13.305325508117676, -11.43687629699707, -9.568426132202148, -7.699976444244385, -5.831526756286621, -3.963076591491699, -2.0946273803710938, -0.22617721557617188, 1.6422725915908813, 3.5107223987579346, 5.379172325134277, 7.247622013092041, 9.116071701049805, 10.984521865844727, 12.852971076965332, 14.721421241760254, 16.58987045288086, 18.45832061767578, 20.326770782470703, 22.195220947265625, 24.063671112060547, 25.93212127685547, 27.800569534301758, 29.66901969909668, 31.5374698638916, 33.40591812133789, 35.27436828613281, 37.142818450927734, 39.011268615722656, 40.87971878051758, 42.7481689453125, 44.61661911010742, 46.485069274902344, 48.353519439697266, 50.22196960449219, 52.09041976928711, 53.95886993408203, 55.82731628417969, 57.69576644897461, 59.56421661376953]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 8.0, 15.0, 17.0, 27.0, 31.0, 44.0, 36.0, 67.0, 64.0, 61.0, 70.0, 78.0, 65.0, 74.0, 55.0, 63.0, 51.0, 52.0, 20.0, 19.0, 21.0, 16.0, 12.0, 16.0, 5.0, 7.0, 0.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-103.625, -100.044921875, -96.46484375, -92.884765625, -89.3046875, -85.724609375, -82.14453125, -78.564453125, -74.984375, -71.404296875, -67.82421875, -64.244140625, -60.6640625, -57.083984375, -53.50390625, -49.923828125, -46.34375, -42.763671875, -39.18359375, -35.603515625, -32.0234375, -28.443359375, -24.86328125, -21.283203125, -17.703125, -14.123046875, -10.54296875, -6.962890625, -3.3828125, 0.197265625, 3.77734375, 7.357421875, 10.9375, 14.517578125, 18.09765625, 21.677734375, 25.2578125, 28.837890625, 32.41796875, 35.998046875, 39.578125, 43.158203125, 46.73828125, 50.318359375, 53.8984375, 57.478515625, 61.05859375, 64.638671875, 68.21875, 71.798828125, 75.37890625, 78.958984375, 82.5390625, 86.119140625, 89.69921875, 93.279296875, 96.859375, 100.439453125, 104.01953125, 107.599609375, 111.1796875, 114.759765625, 118.33984375, 121.919921875, 125.5]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 4.0, 7.0, 11.0, 26.0, 30.0, 37.0, 80.0, 105.0, 121.0, 207.0, 307.0, 419.0, 613.0, 959.0, 1490.0, 2099.0, 3121.0, 4675.0, 6947.0, 10388.0, 16115.0, 24456.0, 36770.0, 56150.0, 82494.0, 115557.0, 148673.0, 151944.0, 121640.0, 86611.0, 59772.0, 39523.0, 26443.0, 17159.0, 11186.0, 7300.0, 4989.0, 3261.0, 2257.0, 1498.0, 995.0, 674.0, 442.0, 330.0, 218.0, 141.0, 108.0, 86.0, 42.0, 35.0, 17.0, 14.0, 12.0, 2.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1015625, -3.96051025390625, -3.8194580078125, -3.67840576171875, -3.537353515625, -3.39630126953125, -3.2552490234375, -3.11419677734375, -2.97314453125, -2.83209228515625, -2.6910400390625, -2.54998779296875, -2.408935546875, -2.26788330078125, -2.1268310546875, -1.98577880859375, -1.8447265625, -1.70367431640625, -1.5626220703125, -1.42156982421875, -1.280517578125, -1.13946533203125, -0.9984130859375, -0.85736083984375, -0.71630859375, -0.57525634765625, -0.4342041015625, -0.29315185546875, -0.152099609375, -0.01104736328125, 0.1300048828125, 0.27105712890625, 0.412109375, 0.55316162109375, 0.6942138671875, 0.83526611328125, 0.976318359375, 1.11737060546875, 1.2584228515625, 1.39947509765625, 1.54052734375, 1.68157958984375, 1.8226318359375, 1.96368408203125, 2.104736328125, 2.24578857421875, 2.3868408203125, 2.52789306640625, 2.6689453125, 2.80999755859375, 2.9510498046875, 3.09210205078125, 3.233154296875, 3.37420654296875, 3.5152587890625, 3.65631103515625, 3.79736328125, 3.93841552734375, 4.0794677734375, 4.22052001953125, 4.361572265625, 4.50262451171875, 4.6436767578125, 4.78472900390625, 4.92578125]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 8.0, 10.0, 7.0, 7.0, 13.0, 16.0, 23.0, 26.0, 30.0, 35.0, 31.0, 32.0, 36.0, 35.0, 47.0, 51.0, 60.0, 1079.0, 47.0, 54.0, 50.0, 40.0, 38.0, 39.0, 34.0, 33.0, 24.0, 27.0, 18.0, 17.0, 14.0, 9.0, 7.0, 8.0, 7.0, 6.0, 1.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-58.96875, -57.3046875, -55.640625, -53.9765625, -52.3125, -50.6484375, -48.984375, -47.3203125, -45.65625, -43.9921875, -42.328125, -40.6640625, -39.0, -37.3359375, -35.671875, -34.0078125, -32.34375, -30.6796875, -29.015625, -27.3515625, -25.6875, -24.0234375, -22.359375, -20.6953125, -19.03125, -17.3671875, -15.703125, -14.0390625, -12.375, -10.7109375, -9.046875, -7.3828125, -5.71875, -4.0546875, -2.390625, -0.7265625, 0.9375, 2.6015625, 4.265625, 5.9296875, 7.59375, 9.2578125, 10.921875, 12.5859375, 14.25, 15.9140625, 17.578125, 19.2421875, 20.90625, 22.5703125, 24.234375, 25.8984375, 27.5625, 29.2265625, 30.890625, 32.5546875, 34.21875, 35.8828125, 37.546875, 39.2109375, 40.875, 42.5390625, 44.203125, 45.8671875, 47.53125]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 0.0, 8.0, 17.0, 21.0, 34.0, 56.0, 73.0, 124.0, 184.0, 246.0, 412.0, 571.0, 915.0, 1358.0, 2145.0, 3161.0, 4956.0, 7551.0, 11899.0, 18524.0, 29348.0, 45965.0, 72437.0, 108975.0, 147532.0, 1212034.0, 141241.0, 102002.0, 67003.0, 42992.0, 27010.0, 17129.0, 10892.0, 7036.0, 4635.0, 3057.0, 1918.0, 1240.0, 817.0, 539.0, 369.0, 249.0, 166.0, 109.0, 64.0, 50.0, 24.0, 10.0, 19.0, 7.0, 7.0, 4.0, 2.0, 1.0, 1.0, 2.0], "bins": [-4.9765625, -4.82763671875, -4.6787109375, -4.52978515625, -4.380859375, -4.23193359375, -4.0830078125, -3.93408203125, -3.78515625, -3.63623046875, -3.4873046875, -3.33837890625, -3.189453125, -3.04052734375, -2.8916015625, -2.74267578125, -2.59375, -2.44482421875, -2.2958984375, -2.14697265625, -1.998046875, -1.84912109375, -1.7001953125, -1.55126953125, -1.40234375, -1.25341796875, -1.1044921875, -0.95556640625, -0.806640625, -0.65771484375, -0.5087890625, -0.35986328125, -0.2109375, -0.06201171875, 0.0869140625, 0.23583984375, 0.384765625, 0.53369140625, 0.6826171875, 0.83154296875, 0.98046875, 1.12939453125, 1.2783203125, 1.42724609375, 1.576171875, 1.72509765625, 1.8740234375, 2.02294921875, 2.171875, 2.32080078125, 2.4697265625, 2.61865234375, 2.767578125, 2.91650390625, 3.0654296875, 3.21435546875, 3.36328125, 3.51220703125, 3.6611328125, 3.81005859375, 3.958984375, 4.10791015625, 4.2568359375, 4.40576171875, 4.5546875]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 3.0, 6.0, 3.0, 4.0, 3.0, 8.0, 4.0, 16.0, 13.0, 12.0, 19.0, 20.0, 26.0, 22.0, 26.0, 36.0, 35.0, 44.0, 51.0, 46.0, 58.0, 43.0, 61.0, 50.0, 54.0, 43.0, 39.0, 43.0, 31.0, 27.0, 14.0, 28.0, 18.0, 24.0, 13.0, 12.0, 15.0, 10.0, 10.0, 5.0, 6.0, 2.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03857421875, -0.0370182991027832, -0.035462379455566406, -0.03390645980834961, -0.03235054016113281, -0.030794620513916016, -0.02923870086669922, -0.027682781219482422, -0.026126861572265625, -0.024570941925048828, -0.02301502227783203, -0.021459102630615234, -0.019903182983398438, -0.01834726333618164, -0.016791343688964844, -0.015235424041748047, -0.01367950439453125, -0.012123584747314453, -0.010567665100097656, -0.00901174545288086, -0.0074558258056640625, -0.005899906158447266, -0.004343986511230469, -0.002788066864013672, -0.001232147216796875, 0.0003237724304199219, 0.0018796920776367188, 0.0034356117248535156, 0.0049915313720703125, 0.006547451019287109, 0.008103370666503906, 0.009659290313720703, 0.0112152099609375, 0.012771129608154297, 0.014327049255371094, 0.01588296890258789, 0.017438888549804688, 0.018994808197021484, 0.02055072784423828, 0.022106647491455078, 0.023662567138671875, 0.025218486785888672, 0.02677440643310547, 0.028330326080322266, 0.029886245727539062, 0.03144216537475586, 0.032998085021972656, 0.03455400466918945, 0.03610992431640625, 0.03766584396362305, 0.039221763610839844, 0.04077768325805664, 0.04233360290527344, 0.043889522552490234, 0.04544544219970703, 0.04700136184692383, 0.048557281494140625, 0.05011320114135742, 0.05166912078857422, 0.053225040435791016, 0.05478096008300781, 0.05633687973022461, 0.057892799377441406, 0.0594487190246582, 0.061004638671875]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 4.0, 3.0, 5.0, 6.0, 13.0, 20.0, 17.0, 34.0, 33.0, 71.0, 80.0, 120.0, 164.0, 217.0, 299.0, 448.0, 818.0, 1456.0, 3103.0, 7092.0, 18668.0, 57645.0, 235257.0, 517072.0, 142015.0, 39340.0, 13687.0, 5299.0, 2388.0, 1163.0, 668.0, 389.0, 293.0, 204.0, 132.0, 109.0, 63.0, 56.0, 33.0, 26.0, 21.0, 8.0, 6.0, 9.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.351806640625, -0.34238433837890625, -0.3329620361328125, -0.32353973388671875, -0.314117431640625, -0.30469512939453125, -0.2952728271484375, -0.28585052490234375, -0.27642822265625, -0.26700592041015625, -0.2575836181640625, -0.24816131591796875, -0.238739013671875, -0.22931671142578125, -0.2198944091796875, -0.21047210693359375, -0.2010498046875, -0.19162750244140625, -0.1822052001953125, -0.17278289794921875, -0.163360595703125, -0.15393829345703125, -0.1445159912109375, -0.13509368896484375, -0.12567138671875, -0.11624908447265625, -0.1068267822265625, -0.09740447998046875, -0.087982177734375, -0.07855987548828125, -0.0691375732421875, -0.05971527099609375, -0.05029296875, -0.04087066650390625, -0.0314483642578125, -0.02202606201171875, -0.012603759765625, -0.00318145751953125, 0.0062408447265625, 0.01566314697265625, 0.02508544921875, 0.03450775146484375, 0.0439300537109375, 0.05335235595703125, 0.062774658203125, 0.07219696044921875, 0.0816192626953125, 0.09104156494140625, 0.1004638671875, 0.10988616943359375, 0.1193084716796875, 0.12873077392578125, 0.138153076171875, 0.14757537841796875, 0.1569976806640625, 0.16641998291015625, 0.17584228515625, 0.18526458740234375, 0.1946868896484375, 0.20410919189453125, 0.213531494140625, 0.22295379638671875, 0.2323760986328125, 0.24179840087890625, 0.251220703125]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 4.0, 1.0, 9.0, 4.0, 9.0, 8.0, 12.0, 18.0, 17.0, 21.0, 32.0, 56.0, 59.0, 90.0, 81.0, 93.0, 95.0, 89.0, 73.0, 63.0, 48.0, 25.0, 28.0, 19.0, 9.0, 7.0, 10.0, 9.0, 4.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03601740300655365, -0.03450973704457283, -0.03300207108259201, -0.03149440884590149, -0.02998674288392067, -0.02847907692193985, -0.02697141282260418, -0.02546374872326851, -0.02395608276128769, -0.02244841679930687, -0.0209407526999712, -0.01943308860063553, -0.01792542263865471, -0.01641775667667389, -0.014910092577338219, -0.013402427546679974, -0.011894762516021729, -0.010387097485363483, -0.008879432454705238, -0.007371767424046993, -0.005864102393388748, -0.004356437362730503, -0.002848772332072258, -0.001341107301414013, 0.00016655772924423218, 0.0016742227599024773, 0.0031818877905607224, 0.0046895528212189674, 0.0061972178518772125, 0.007704882882535458, 0.009212547913193703, 0.010720212943851948, 0.012227877974510193, 0.013735543005168438, 0.015243208035826683, 0.016750872135162354, 0.018258538097143173, 0.019766204059123993, 0.021273868158459663, 0.022781532257795334, 0.024289198219776154, 0.025796864181756973, 0.027304528281092644, 0.028812192380428314, 0.030319858342409134, 0.031827524304389954, 0.033335186541080475, 0.034842852503061295, 0.036350518465042114, 0.037858184427022934, 0.039365850389003754, 0.040873512625694275, 0.042381178587675095, 0.043888844549655914, 0.045396506786346436, 0.046904172748327255, 0.048411838710308075, 0.049919504672288895, 0.051427170634269714, 0.052934832870960236, 0.054442498832941055, 0.055950164794921875, 0.057457827031612396, 0.058965492993593216, 0.060473158955574036]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 1.0, 4.0, 2.0, 9.0, 3.0, 11.0, 15.0, 18.0, 18.0, 19.0, 29.0, 22.0, 38.0, 33.0, 35.0, 33.0, 46.0, 30.0, 51.0, 45.0, 41.0, 48.0, 47.0, 32.0, 34.0, 27.0, 40.0, 24.0, 31.0, 31.0, 31.0, 32.0, 23.0, 15.0, 16.0, 18.0, 13.0, 6.0, 4.0, 8.0, 5.0, 6.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.03325134515762329, -0.032247722148895264, -0.031244101002812386, -0.030240479856729507, -0.02923685684800148, -0.028233233839273453, -0.027229612693190575, -0.026225991547107697, -0.02522236853837967, -0.024218745529651642, -0.023215124383568764, -0.022211503237485886, -0.02120788022875786, -0.02020425722002983, -0.019200636073946953, -0.018197014927864075, -0.017193391919136047, -0.01618976891040802, -0.015186147764325142, -0.01418252568691969, -0.013178903609514236, -0.012175281532108784, -0.011171659454703331, -0.010168037377297878, -0.009164415299892426, -0.008160793222486973, -0.00715717114508152, -0.006153549067676067, -0.005149926990270615, -0.004146304912865162, -0.003142682835459709, -0.0021390607580542564, -0.0011354386806488037, -0.00013181660324335098, 0.0008718054741621017, 0.0018754275515675545, 0.002879049628973007, 0.00388267170637846, 0.004886293783783913, 0.005889915861189365, 0.006893537938594818, 0.00789716001600027, 0.008900782093405724, 0.009904404170811176, 0.010908026248216629, 0.011911648325622082, 0.012915270403027534, 0.013918892480432987, 0.01492251455783844, 0.015926137566566467, 0.016929758712649345, 0.017933379858732224, 0.01893700286746025, 0.019940625876188278, 0.020944247022271156, 0.021947868168354034, 0.022951491177082062, 0.02395511418581009, 0.024958735331892967, 0.025962356477975845, 0.026965979486703873, 0.0279696024954319, 0.028973223641514778, 0.029976844787597656, 0.030980467796325684]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 8.0, 15.0, 17.0, 26.0, 30.0, 46.0, 34.0, 67.0, 63.0, 63.0, 70.0, 74.0, 69.0, 74.0, 55.0, 63.0, 50.0, 53.0, 22.0, 18.0, 21.0, 16.0, 12.0, 14.0, 6.0, 8.0, 0.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-103.875, -100.2890625, -96.703125, -93.1171875, -89.53125, -85.9453125, -82.359375, -78.7734375, -75.1875, -71.6015625, -68.015625, -64.4296875, -60.84375, -57.2578125, -53.671875, -50.0859375, -46.5, -42.9140625, -39.328125, -35.7421875, -32.15625, -28.5703125, -24.984375, -21.3984375, -17.8125, -14.2265625, -10.640625, -7.0546875, -3.46875, 0.1171875, 3.703125, 7.2890625, 10.875, 14.4609375, 18.046875, 21.6328125, 25.21875, 28.8046875, 32.390625, 35.9765625, 39.5625, 43.1484375, 46.734375, 50.3203125, 53.90625, 57.4921875, 61.078125, 64.6640625, 68.25, 71.8359375, 75.421875, 79.0078125, 82.59375, 86.1796875, 89.765625, 93.3515625, 96.9375, 100.5234375, 104.109375, 107.6953125, 111.28125, 114.8671875, 118.453125, 122.0390625, 125.625]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 10.0, 8.0, 18.0, 25.0, 35.0, 56.0, 103.0, 177.0, 325.0, 793.0, 1966.0, 5432.0, 23050.0, 257912.0, 687421.0, 56869.0, 9456.0, 2776.0, 1091.0, 462.0, 212.0, 126.0, 82.0, 46.0, 39.0, 19.0, 14.0, 15.0, 8.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.875, -24.9580078125, -24.041015625, -23.1240234375, -22.20703125, -21.2900390625, -20.373046875, -19.4560546875, -18.5390625, -17.6220703125, -16.705078125, -15.7880859375, -14.87109375, -13.9541015625, -13.037109375, -12.1201171875, -11.203125, -10.2861328125, -9.369140625, -8.4521484375, -7.53515625, -6.6181640625, -5.701171875, -4.7841796875, -3.8671875, -2.9501953125, -2.033203125, -1.1162109375, -0.19921875, 0.7177734375, 1.634765625, 2.5517578125, 3.46875, 4.3857421875, 5.302734375, 6.2197265625, 7.13671875, 8.0537109375, 8.970703125, 9.8876953125, 10.8046875, 11.7216796875, 12.638671875, 13.5556640625, 14.47265625, 15.3896484375, 16.306640625, 17.2236328125, 18.140625, 19.0576171875, 19.974609375, 20.8916015625, 21.80859375, 22.7255859375, 23.642578125, 24.5595703125, 25.4765625, 26.3935546875, 27.310546875, 28.2275390625, 29.14453125, 30.0615234375, 30.978515625, 31.8955078125, 32.8125]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 6.0, 8.0, 13.0, 15.0, 18.0, 49.0, 43.0, 50.0, 72.0, 66.0, 87.0, 2125.0, 101.0, 86.0, 57.0, 72.0, 47.0, 37.0, 31.0, 22.0, 14.0, 5.0, 10.0, 4.0, 7.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-140.75, -135.26953125, -129.7890625, -124.30859375, -118.828125, -113.34765625, -107.8671875, -102.38671875, -96.90625, -91.42578125, -85.9453125, -80.46484375, -74.984375, -69.50390625, -64.0234375, -58.54296875, -53.0625, -47.58203125, -42.1015625, -36.62109375, -31.140625, -25.66015625, -20.1796875, -14.69921875, -9.21875, -3.73828125, 1.7421875, 7.22265625, 12.703125, 18.18359375, 23.6640625, 29.14453125, 34.625, 40.10546875, 45.5859375, 51.06640625, 56.546875, 62.02734375, 67.5078125, 72.98828125, 78.46875, 83.94921875, 89.4296875, 94.91015625, 100.390625, 105.87109375, 111.3515625, 116.83203125, 122.3125, 127.79296875, 133.2734375, 138.75390625, 144.234375, 149.71484375, 155.1953125, 160.67578125, 166.15625, 171.63671875, 177.1171875, 182.59765625, 188.078125, 193.55859375, 199.0390625, 204.51953125, 210.0]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 9.0, 7.0, 11.0, 12.0, 22.0, 22.0, 38.0, 53.0, 78.0, 144.0, 215.0, 316.0, 586.0, 1313.0, 3969.0, 34940.0, 2849714.0, 238521.0, 11329.0, 2339.0, 853.0, 443.0, 252.0, 184.0, 104.0, 70.0, 36.0, 36.0, 32.0, 15.0, 13.0, 5.0, 6.0, 3.0, 3.0, 5.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-37.09375, -36.05712890625, -35.0205078125, -33.98388671875, -32.947265625, -31.91064453125, -30.8740234375, -29.83740234375, -28.80078125, -27.76416015625, -26.7275390625, -25.69091796875, -24.654296875, -23.61767578125, -22.5810546875, -21.54443359375, -20.5078125, -19.47119140625, -18.4345703125, -17.39794921875, -16.361328125, -15.32470703125, -14.2880859375, -13.25146484375, -12.21484375, -11.17822265625, -10.1416015625, -9.10498046875, -8.068359375, -7.03173828125, -5.9951171875, -4.95849609375, -3.921875, -2.88525390625, -1.8486328125, -0.81201171875, 0.224609375, 1.26123046875, 2.2978515625, 3.33447265625, 4.37109375, 5.40771484375, 6.4443359375, 7.48095703125, 8.517578125, 9.55419921875, 10.5908203125, 11.62744140625, 12.6640625, 13.70068359375, 14.7373046875, 15.77392578125, 16.810546875, 17.84716796875, 18.8837890625, 19.92041015625, 20.95703125, 21.99365234375, 23.0302734375, 24.06689453125, 25.103515625, 26.14013671875, 27.1767578125, 28.21337890625, 29.25]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 6.0, 4.0, 6.0, 9.0, 15.0, 26.0, 49.0, 91.0, 144.0, 188.0, 152.0, 123.0, 67.0, 44.0, 25.0, 14.0, 10.0, 7.0, 7.0, 2.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.95148468017578, -70.04188537597656, -64.13228607177734, -58.22269058227539, -52.31309509277344, -46.40349578857422, -40.493896484375, -34.58430099487305, -28.674701690673828, -22.765104293823242, -16.855506896972656, -10.945907592773438, -5.036310195922852, 0.8732872009277344, 6.782886505126953, 12.692481994628906, 18.602081298828125, 24.51167869567871, 30.421276092529297, 36.330875396728516, 42.24047088623047, 48.15007019042969, 54.059669494628906, 59.96926498413086, 65.87886047363281, 71.78845977783203, 77.69805908203125, 83.60765075683594, 89.51725006103516, 95.42684936523438, 101.3364486694336, 107.24604797363281, 113.15565490722656, 119.06525421142578, 124.974853515625, 130.8844451904297, 136.79405212402344, 142.70364379882812, 148.61325073242188, 154.52284240722656, 160.43243408203125, 166.34202575683594, 172.2516326904297, 178.16122436523438, 184.07083129882812, 189.9804229736328, 195.8900146484375, 201.79962158203125, 207.709228515625, 213.6188201904297, 219.52842712402344, 225.43801879882812, 231.34762573242188, 237.25721740722656, 243.16680908203125, 249.076416015625, 254.9860076904297, 260.8955993652344, 266.8052062988281, 272.7148132324219, 278.6243896484375, 284.53399658203125, 290.443603515625, 296.3531799316406, 302.2627868652344]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 7.0, 8.0, 6.0, 6.0, 14.0, 11.0, 15.0, 18.0, 33.0, 21.0, 31.0, 45.0, 30.0, 52.0, 44.0, 61.0, 51.0, 52.0, 34.0, 43.0, 55.0, 59.0, 37.0, 32.0, 34.0, 38.0, 29.0, 22.0, 24.0, 17.0, 19.0, 13.0, 7.0, 7.0, 5.0, 5.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-171.99749755859375, -167.3218231201172, -162.6461639404297, -157.97048950195312, -153.29481506347656, -148.619140625, -143.9434814453125, -139.26780700683594, -134.59213256835938, -129.9164581298828, -125.24079132080078, -120.56512451171875, -115.88945007324219, -111.21378326416016, -106.53811645507812, -101.86244201660156, -97.18678283691406, -92.51111602783203, -87.83544158935547, -83.15977478027344, -78.48410034179688, -73.80843353271484, -69.13276672363281, -64.45709228515625, -59.78142547607422, -55.10575485229492, -50.430084228515625, -45.754417419433594, -41.0787467956543, -36.403076171875, -31.727407455444336, -27.051738739013672, -22.376052856445312, -17.700382232666016, -13.024713516235352, -8.349043846130371, -3.6733741760253906, 1.0022964477539062, 5.67796516418457, 10.353633880615234, 15.029304504394531, 19.704975128173828, 24.380643844604492, 29.056312561035156, 33.73198318481445, 38.40765380859375, 43.08332061767578, 47.75899124145508, 52.434661865234375, 57.11033248901367, 61.78600311279297, 66.461669921875, 71.13734436035156, 75.8130111694336, 80.48867797851562, 85.16435241699219, 89.84001922607422, 94.51568603515625, 99.19136047363281, 103.86702728271484, 108.54269409179688, 113.21836853027344, 117.89403533935547, 122.5697021484375, 127.24537658691406]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 1.0, 5.0, 10.0, 9.0, 15.0, 14.0, 14.0, 23.0, 36.0, 48.0, 45.0, 83.0, 134.0, 126.0, 217.0, 271.0, 329.0, 504.0, 709.0, 1110.0, 1040201.0, 1486.0, 913.0, 553.0, 414.0, 333.0, 252.0, 196.0, 131.0, 107.0, 68.0, 39.0, 44.0, 29.0, 21.0, 14.0, 14.0, 13.0, 14.0, 4.0, 1.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.27141571044922, -42.73384094238281, -41.19626235961914, -39.65868377685547, -38.12110900878906, -36.583534240722656, -35.045955657958984, -33.50837707519531, -31.970802307128906, -30.433225631713867, -28.895648956298828, -27.35807228088379, -25.82049560546875, -24.28291893005371, -22.745342254638672, -21.207765579223633, -19.670188903808594, -18.132612228393555, -16.595035552978516, -15.057458877563477, -13.519882202148438, -11.982305526733398, -10.44472885131836, -8.90715217590332, -7.369575500488281, -5.831998825073242, -4.294422149658203, -2.756845474243164, -1.219268798828125, 0.31830787658691406, 1.8558845520019531, 3.393461227416992, 4.931041717529297, 6.468618392944336, 8.006195068359375, 9.543771743774414, 11.081348419189453, 12.618925094604492, 14.156501770019531, 15.69407844543457, 17.23165512084961, 18.76923179626465, 20.306808471679688, 21.844385147094727, 23.381961822509766, 24.919538497924805, 26.457115173339844, 27.994691848754883, 29.532268524169922, 31.06984519958496, 32.607421875, 34.144996643066406, 35.68257522583008, 37.22015380859375, 38.757728576660156, 40.29530334472656, 41.832881927490234, 43.370460510253906, 44.90803527832031, 46.44561004638672, 47.98318862915039, 49.52076721191406, 51.05834197998047, 52.595916748046875, 54.13349533081055]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 4.0, 3.0, 10.0, 8.0, 11.0, 15.0, 14.0, 42.0, 129.0, 58874.0, 51404756.0, 70.0, 25.0, 17.0, 12.0, 13.0, 5.0, 5.0, 5.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4105.43603515625, -3963.91357421875, -3822.390869140625, -3680.868408203125, -3539.345703125, -3397.8232421875, -3256.30078125, -3114.7783203125, -2973.255615234375, -2831.733154296875, -2690.21044921875, -2548.68798828125, -2407.16552734375, -2265.642822265625, -2124.120361328125, -1982.5977783203125, -1841.0751953125, -1699.5526123046875, -1558.030029296875, -1416.507568359375, -1274.9849853515625, -1133.46240234375, -991.9398803710938, -850.4173583984375, -708.894775390625, -567.3721923828125, -425.84967041015625, -284.3271179199219, -142.8045654296875, -1.281982421875, 140.24053955078125, 281.7630615234375, 423.28515625, 564.8077392578125, 706.3302612304688, 847.852783203125, 989.3753662109375, 1130.89794921875, 1272.42041015625, 1413.9429931640625, 1555.465576171875, 1696.9881591796875, 1838.5107421875, 1980.033203125, 2121.5556640625, 2263.078369140625, 2404.600830078125, 2546.12353515625, 2687.64599609375, 2829.16845703125, 2970.691162109375, 3112.213623046875, 3253.736328125, 3395.2587890625, 3536.78125, 3678.3037109375, 3819.826416015625, 3961.348876953125, 4102.87158203125, 4244.39404296875, 4385.91650390625, 4527.439453125, 4668.9619140625, 4810.484375, 4952.0068359375]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 3.0, 2.0, 5.0, 7.0, 3.0, 13.0, 14.0, 20.0, 30.0, 56.0, 69.0, 105.0, 173.0, 231.0, 335.0, 544.0, 744.0, 1151.0, 1702.0, 2766.0, 4484.0, 7494.0, 12205.0, 20552.0, 35215.0, 59953.0, 102384.0, 173379.0, 282466.0, 417777.0, 3201590.0, 959182.0, 382700.0, 251184.0, 152868.0, 90141.0, 52399.0, 30497.0, 18303.0, 10809.0, 6669.0, 4008.0, 2498.0, 1555.0, 1064.0, 716.0, 470.0, 303.0, 190.0, 136.0, 82.0, 57.0, 43.0, 33.0, 17.0, 24.0, 6.0, 8.0, 8.0, 4.0, 3.0], "bins": [-2.1875, -2.1229248046875, -2.058349609375, -1.9937744140625, -1.92919921875, -1.8646240234375, -1.800048828125, -1.7354736328125, -1.6708984375, -1.6063232421875, -1.541748046875, -1.4771728515625, -1.41259765625, -1.3480224609375, -1.283447265625, -1.2188720703125, -1.154296875, -1.0897216796875, -1.025146484375, -0.9605712890625, -0.89599609375, -0.8314208984375, -0.766845703125, -0.7022705078125, -0.6376953125, -0.5731201171875, -0.508544921875, -0.4439697265625, -0.37939453125, -0.3148193359375, -0.250244140625, -0.1856689453125, -0.12109375, -0.0565185546875, 0.008056640625, 0.0726318359375, 0.13720703125, 0.2017822265625, 0.266357421875, 0.3309326171875, 0.3955078125, 0.4600830078125, 0.524658203125, 0.5892333984375, 0.65380859375, 0.7183837890625, 0.782958984375, 0.8475341796875, 0.912109375, 0.9766845703125, 1.041259765625, 1.1058349609375, 1.17041015625, 1.2349853515625, 1.299560546875, 1.3641357421875, 1.4287109375, 1.4932861328125, 1.557861328125, 1.6224365234375, 1.68701171875, 1.7515869140625, 1.816162109375, 1.8807373046875, 1.9453125]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 1.0, 2.0, 7.0, 9.0, 6.0, 11.0, 9.0, 16.0, 19.0, 12.0, 13.0, 20.0, 25.0, 30.0, 37.0, 32.0, 30.0, 29.0, 37.0, 45.0, 37.0, 79.0, 872.0, 185.0, 40.0, 40.0, 44.0, 40.0, 40.0, 30.0, 23.0, 34.0, 22.0, 30.0, 27.0, 22.0, 15.0, 14.0, 12.0, 6.0, 4.0, 2.0, 7.0, 3.0, 7.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-15.890625, -15.418212890625, -14.94580078125, -14.473388671875, -14.0009765625, -13.528564453125, -13.05615234375, -12.583740234375, -12.111328125, -11.638916015625, -11.16650390625, -10.694091796875, -10.2216796875, -9.749267578125, -9.27685546875, -8.804443359375, -8.33203125, -7.859619140625, -7.38720703125, -6.914794921875, -6.4423828125, -5.969970703125, -5.49755859375, -5.025146484375, -4.552734375, -4.080322265625, -3.60791015625, -3.135498046875, -2.6630859375, -2.190673828125, -1.71826171875, -1.245849609375, -0.7734375, -0.301025390625, 0.17138671875, 0.643798828125, 1.1162109375, 1.588623046875, 2.06103515625, 2.533447265625, 3.005859375, 3.478271484375, 3.95068359375, 4.423095703125, 4.8955078125, 5.367919921875, 5.84033203125, 6.312744140625, 6.78515625, 7.257568359375, 7.72998046875, 8.202392578125, 8.6748046875, 9.147216796875, 9.61962890625, 10.092041015625, 10.564453125, 11.036865234375, 11.50927734375, 11.981689453125, 12.4541015625, 12.926513671875, 13.39892578125, 13.871337890625, 14.34375]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 7.0, 4.0, 10.0, 19.0, 19.0, 29.0, 52.0, 98.0, 113.0, 157.0, 244.0, 329.0, 511.0, 728.0, 1161.0, 1728.0, 2584.0, 4076.0, 6352.0, 9838.0, 15993.0, 25672.0, 42560.0, 70405.0, 120168.0, 204843.0, 336487.0, 542774.0, 3613514.0, 497772.0, 317424.0, 191038.0, 112566.0, 66535.0, 39693.0, 24000.0, 15111.0, 9401.0, 5972.0, 3994.0, 2528.0, 1678.0, 1114.0, 734.0, 449.0, 315.0, 223.0, 143.0, 84.0, 56.0, 45.0, 33.0, 21.0, 18.0, 12.0, 4.0, 5.0, 3.0, 0.0, 4.0, 1.0], "bins": [-2.240234375, -2.168975830078125, -2.09771728515625, -2.026458740234375, -1.9552001953125, -1.883941650390625, -1.81268310546875, -1.741424560546875, -1.670166015625, -1.598907470703125, -1.52764892578125, -1.456390380859375, -1.3851318359375, -1.313873291015625, -1.24261474609375, -1.171356201171875, -1.10009765625, -1.028839111328125, -0.95758056640625, -0.886322021484375, -0.8150634765625, -0.743804931640625, -0.67254638671875, -0.601287841796875, -0.530029296875, -0.458770751953125, -0.38751220703125, -0.316253662109375, -0.2449951171875, -0.173736572265625, -0.10247802734375, -0.031219482421875, 0.0400390625, 0.111297607421875, 0.18255615234375, 0.253814697265625, 0.3250732421875, 0.396331787109375, 0.46759033203125, 0.538848876953125, 0.610107421875, 0.681365966796875, 0.75262451171875, 0.823883056640625, 0.8951416015625, 0.966400146484375, 1.03765869140625, 1.108917236328125, 1.18017578125, 1.251434326171875, 1.32269287109375, 1.393951416015625, 1.4652099609375, 1.536468505859375, 1.60772705078125, 1.678985595703125, 1.750244140625, 1.821502685546875, 1.89276123046875, 1.964019775390625, 2.0352783203125, 2.106536865234375, 2.17779541015625, 2.249053955078125, 2.3203125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [4.0, 3.0, 3.0, 1.0, 6.0, 4.0, 3.0, 6.0, 6.0, 10.0, 7.0, 8.0, 14.0, 19.0, 14.0, 14.0, 15.0, 28.0, 28.0, 31.0, 25.0, 32.0, 33.0, 38.0, 37.0, 27.0, 44.0, 161.0, 827.0, 141.0, 39.0, 32.0, 33.0, 47.0, 39.0, 32.0, 23.0, 27.0, 23.0, 29.0, 18.0, 15.0, 19.0, 15.0, 11.0, 9.0, 11.0, 6.0, 4.0, 3.0, 3.0, 6.0, 6.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.671875, -8.3671875, -8.0625, -7.7578125, -7.453125, -7.1484375, -6.84375, -6.5390625, -6.234375, -5.9296875, -5.625, -5.3203125, -5.015625, -4.7109375, -4.40625, -4.1015625, -3.796875, -3.4921875, -3.1875, -2.8828125, -2.578125, -2.2734375, -1.96875, -1.6640625, -1.359375, -1.0546875, -0.75, -0.4453125, -0.140625, 0.1640625, 0.46875, 0.7734375, 1.078125, 1.3828125, 1.6875, 1.9921875, 2.296875, 2.6015625, 2.90625, 3.2109375, 3.515625, 3.8203125, 4.125, 4.4296875, 4.734375, 5.0390625, 5.34375, 5.6484375, 5.953125, 6.2578125, 6.5625, 6.8671875, 7.171875, 7.4765625, 7.78125, 8.0859375, 8.390625, 8.6953125, 9.0, 9.3046875, 9.609375, 9.9140625, 10.21875, 10.5234375, 10.828125]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 0.0, 5.0, 6.0, 9.0, 6.0, 15.0, 20.0, 24.0, 31.0, 33.0, 48.0, 65.0, 89.0, 123.0, 160.0, 187.0, 243.0, 310.0, 455.0, 593.0, 852.0, 1275.0, 1760.0, 2953.0, 5090.0, 9493.0, 20386.0, 54960.0, 196961.0, 5797082.0, 123578.0, 38938.0, 15736.0, 7590.0, 4266.0, 2488.0, 1623.0, 1081.0, 704.0, 514.0, 411.0, 306.0, 225.0, 155.0, 157.0, 94.0, 86.0, 58.0, 52.0, 28.0, 28.0, 18.0, 11.0, 18.0, 9.0, 9.0, 9.0, 9.0, 5.0, 5.0, 3.0], "bins": [-9.6640625, -9.365234375, -9.06640625, -8.767578125, -8.46875, -8.169921875, -7.87109375, -7.572265625, -7.2734375, -6.974609375, -6.67578125, -6.376953125, -6.078125, -5.779296875, -5.48046875, -5.181640625, -4.8828125, -4.583984375, -4.28515625, -3.986328125, -3.6875, -3.388671875, -3.08984375, -2.791015625, -2.4921875, -2.193359375, -1.89453125, -1.595703125, -1.296875, -0.998046875, -0.69921875, -0.400390625, -0.1015625, 0.197265625, 0.49609375, 0.794921875, 1.09375, 1.392578125, 1.69140625, 1.990234375, 2.2890625, 2.587890625, 2.88671875, 3.185546875, 3.484375, 3.783203125, 4.08203125, 4.380859375, 4.6796875, 4.978515625, 5.27734375, 5.576171875, 5.875, 6.173828125, 6.47265625, 6.771484375, 7.0703125, 7.369140625, 7.66796875, 7.966796875, 8.265625, 8.564453125, 8.86328125, 9.162109375, 9.4609375]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 7.0, 4.0, 3.0, 6.0, 11.0, 8.0, 9.0, 15.0, 20.0, 14.0, 31.0, 34.0, 28.0, 42.0, 37.0, 37.0, 36.0, 49.0, 48.0, 153.0, 710.0, 245.0, 57.0, 62.0, 35.0, 48.0, 43.0, 40.0, 37.0, 26.0, 17.0, 25.0, 17.0, 23.0, 10.0, 9.0, 9.0, 7.0, 7.0, 3.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0], "bins": [-9.34375, -9.08819580078125, -8.8326416015625, -8.57708740234375, -8.321533203125, -8.06597900390625, -7.8104248046875, -7.55487060546875, -7.29931640625, -7.04376220703125, -6.7882080078125, -6.53265380859375, -6.277099609375, -6.02154541015625, -5.7659912109375, -5.51043701171875, -5.2548828125, -4.99932861328125, -4.7437744140625, -4.48822021484375, -4.232666015625, -3.97711181640625, -3.7215576171875, -3.46600341796875, -3.21044921875, -2.95489501953125, -2.6993408203125, -2.44378662109375, -2.188232421875, -1.93267822265625, -1.6771240234375, -1.42156982421875, -1.166015625, -0.91046142578125, -0.6549072265625, -0.39935302734375, -0.143798828125, 0.11175537109375, 0.3673095703125, 0.62286376953125, 0.87841796875, 1.13397216796875, 1.3895263671875, 1.64508056640625, 1.900634765625, 2.15618896484375, 2.4117431640625, 2.66729736328125, 2.9228515625, 3.17840576171875, 3.4339599609375, 3.68951416015625, 3.945068359375, 4.20062255859375, 4.4561767578125, 4.71173095703125, 4.96728515625, 5.22283935546875, 5.4783935546875, 5.73394775390625, 5.989501953125, 6.24505615234375, 6.5006103515625, 6.75616455078125, 7.01171875]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 6.0, 23.0, 72.0, 205.0, 383.0, 217.0, 66.0, 22.0, 9.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.21373748779297, -21.60333824157715, -19.992938995361328, -18.382539749145508, -16.772140502929688, -15.161742210388184, -13.551342964172363, -11.940943717956543, -10.330544471740723, -8.720145225524902, -7.109745979309082, -5.49934720993042, -3.8889479637145996, -2.2785491943359375, -0.6681499481201172, 0.9422492980957031, 2.5526485443115234, 4.163047790527344, 5.773447036743164, 7.383845806121826, 8.994245529174805, 10.604643821716309, 12.215043067932129, 13.82544231414795, 15.43584156036377, 17.046239852905273, 18.656639099121094, 20.267038345336914, 21.877437591552734, 23.487836837768555, 25.098236083984375, 26.708635330200195, 28.319034576416016, 29.929433822631836, 31.539833068847656, 33.150230407714844, 34.7606315612793, 36.371028900146484, 37.98143005371094, 39.591827392578125, 41.20222854614258, 42.812625885009766, 44.42302703857422, 46.033424377441406, 47.64382553100586, 49.25422286987305, 50.8646240234375, 52.47502136230469, 54.085418701171875, 55.69581604003906, 57.306217193603516, 58.9166145324707, 60.527015686035156, 62.137413024902344, 63.7478141784668, 65.35821533203125, 66.96861267089844, 68.57901000976562, 70.18940734863281, 71.79981231689453, 73.41020965576172, 75.0206069946289, 76.6310043334961, 78.24140930175781, 79.851806640625]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 4.0, 2.0, 6.0, 7.0, 10.0, 8.0, 14.0, 14.0, 9.0, 17.0, 17.0, 27.0, 42.0, 33.0, 36.0, 28.0, 51.0, 47.0, 41.0, 37.0, 44.0, 40.0, 33.0, 46.0, 48.0, 46.0, 37.0, 32.0, 34.0, 27.0, 27.0, 20.0, 20.0, 20.0, 13.0, 16.0, 8.0, 13.0, 7.0, 8.0, 3.0, 4.0, 0.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.829414367675781, -11.450998306274414, -11.072583198547363, -10.694167137145996, -10.315752029418945, -9.937335968017578, -9.558919906616211, -9.180503845214844, -8.802088737487793, -8.423672676086426, -8.045257568359375, -7.666841506958008, -7.288425922393799, -6.91001033782959, -6.531594276428223, -6.153178691864014, -5.774763107299805, -5.396347522735596, -5.017931938171387, -4.6395158767700195, -4.2611002922058105, -3.8826847076416016, -3.5042688846588135, -3.1258530616760254, -2.7474374771118164, -2.3690218925476074, -1.9906060695648193, -1.6121903657913208, -1.2337746620178223, -0.8553589582443237, -0.4769432544708252, -0.09852743148803711, 0.2798891067504883, 0.6583048105239868, 1.0367205142974854, 1.4151362180709839, 1.7935519218444824, 2.1719675064086914, 2.5503833293914795, 2.9287991523742676, 3.3072147369384766, 3.6856303215026855, 4.0640459060668945, 4.442461967468262, 4.820877552032471, 5.19929313659668, 5.577709197998047, 5.956124782562256, 6.334540367126465, 6.712955951690674, 7.091371536254883, 7.46978759765625, 7.848203182220459, 8.226618766784668, 8.605034828186035, 8.983449935913086, 9.361865997314453, 9.74028205871582, 10.118697166442871, 10.497113227844238, 10.875528335571289, 11.253944396972656, 11.632360458374023, 12.01077651977539, 12.389191627502441]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 7.0, 6.0, 6.0, 14.0, 26.0, 35.0, 50.0, 61.0, 122.0, 206.0, 330.0, 634.0, 1225.0, 2515.0, 5730.0, 15573.0, 63216.0, 3936408.0, 130129.0, 22840.0, 7788.0, 3426.0, 1660.0, 917.0, 488.0, 306.0, 179.0, 115.0, 74.0, 64.0, 33.0, 26.0, 26.0, 14.0, 13.0, 9.0, 7.0, 1.0, 1.0, 5.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51025390625, -0.49111175537109375, -0.4719696044921875, -0.45282745361328125, -0.433685302734375, -0.41454315185546875, -0.3954010009765625, -0.37625885009765625, -0.35711669921875, -0.33797454833984375, -0.3188323974609375, -0.29969024658203125, -0.280548095703125, -0.26140594482421875, -0.2422637939453125, -0.22312164306640625, -0.2039794921875, -0.18483734130859375, -0.1656951904296875, -0.14655303955078125, -0.127410888671875, -0.10826873779296875, -0.0891265869140625, -0.06998443603515625, -0.05084228515625, -0.03170013427734375, -0.0125579833984375, 0.00658416748046875, 0.025726318359375, 0.04486846923828125, 0.0640106201171875, 0.08315277099609375, 0.102294921875, 0.12143707275390625, 0.1405792236328125, 0.15972137451171875, 0.178863525390625, 0.19800567626953125, 0.2171478271484375, 0.23628997802734375, 0.25543212890625, 0.27457427978515625, 0.2937164306640625, 0.31285858154296875, 0.332000732421875, 0.35114288330078125, 0.3702850341796875, 0.38942718505859375, 0.4085693359375, 0.42771148681640625, 0.4468536376953125, 0.46599578857421875, 0.485137939453125, 0.5042800903320312, 0.5234222412109375, 0.5425643920898438, 0.56170654296875, 0.5808486938476562, 0.5999908447265625, 0.6191329956054688, 0.638275146484375, 0.6574172973632812, 0.6765594482421875, 0.6957015991210938, 0.71484375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 1.0, 7.0, 2.0, 4.0, 3.0, 6.0, 8.0, 5.0, 9.0, 14.0, 15.0, 11.0, 76.0, 719.0, 14.0, 11.0, 15.0, 9.0, 12.0, 7.0, 8.0, 5.0, 5.0, 4.0, 6.0, 5.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.059906005859375, -0.05779600143432617, -0.055685997009277344, -0.053575992584228516, -0.05146598815917969, -0.04935598373413086, -0.04724597930908203, -0.0451359748840332, -0.043025970458984375, -0.04091596603393555, -0.03880596160888672, -0.03669595718383789, -0.03458595275878906, -0.032475948333740234, -0.030365943908691406, -0.028255939483642578, -0.02614593505859375, -0.024035930633544922, -0.021925926208496094, -0.019815921783447266, -0.017705917358398438, -0.01559591293334961, -0.013485908508300781, -0.011375904083251953, -0.009265899658203125, -0.007155895233154297, -0.005045890808105469, -0.0029358863830566406, -0.0008258819580078125, 0.0012841224670410156, 0.0033941268920898438, 0.005504131317138672, 0.0076141357421875, 0.009724140167236328, 0.011834144592285156, 0.013944149017333984, 0.016054153442382812, 0.01816415786743164, 0.02027416229248047, 0.022384166717529297, 0.024494171142578125, 0.026604175567626953, 0.02871417999267578, 0.03082418441772461, 0.03293418884277344, 0.035044193267822266, 0.037154197692871094, 0.03926420211791992, 0.04137420654296875, 0.04348421096801758, 0.045594215393066406, 0.047704219818115234, 0.04981422424316406, 0.05192422866821289, 0.05403423309326172, 0.05614423751831055, 0.058254241943359375, 0.0603642463684082, 0.06247425079345703, 0.06458425521850586, 0.06669425964355469, 0.06880426406860352, 0.07091426849365234, 0.07302427291870117, 0.07513427734375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 5.0, 8.0, 19.0, 13.0, 9.0, 22.0, 31.0, 43.0, 63.0, 137.0, 170.0, 308.0, 560.0, 1139.0, 2196.0, 4527.0, 9845.0, 25172.0, 74534.0, 287590.0, 2227527.0, 1267205.0, 199568.0, 56823.0, 20116.0, 8531.0, 3898.0, 1941.0, 969.0, 533.0, 268.0, 174.0, 116.0, 59.0, 39.0, 38.0, 25.0, 20.0, 10.0, 7.0, 7.0, 5.0, 2.0, 1.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.314697265625, -0.3048248291015625, -0.294952392578125, -0.2850799560546875, -0.27520751953125, -0.2653350830078125, -0.255462646484375, -0.2455902099609375, -0.2357177734375, -0.2258453369140625, -0.215972900390625, -0.2061004638671875, -0.19622802734375, -0.1863555908203125, -0.176483154296875, -0.1666107177734375, -0.15673828125, -0.1468658447265625, -0.136993408203125, -0.1271209716796875, -0.11724853515625, -0.1073760986328125, -0.097503662109375, -0.0876312255859375, -0.0777587890625, -0.0678863525390625, -0.058013916015625, -0.0481414794921875, -0.03826904296875, -0.0283966064453125, -0.018524169921875, -0.0086517333984375, 0.001220703125, 0.0110931396484375, 0.020965576171875, 0.0308380126953125, 0.04071044921875, 0.0505828857421875, 0.060455322265625, 0.0703277587890625, 0.0802001953125, 0.0900726318359375, 0.099945068359375, 0.1098175048828125, 0.11968994140625, 0.1295623779296875, 0.139434814453125, 0.1493072509765625, 0.1591796875, 0.1690521240234375, 0.178924560546875, 0.1887969970703125, 0.19866943359375, 0.2085418701171875, 0.218414306640625, 0.2282867431640625, 0.2381591796875, 0.2480316162109375, 0.257904052734375, 0.2677764892578125, 0.27764892578125, 0.2875213623046875, 0.297393798828125, 0.3072662353515625, 0.317138671875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 6.0, 7.0, 3.0, 7.0, 11.0, 13.0, 9.0, 21.0, 27.0, 37.0, 65.0, 60.0, 105.0, 136.0, 206.0, 284.0, 501.0, 866.0, 586.0, 367.0, 211.0, 132.0, 107.0, 107.0, 41.0, 38.0, 25.0, 25.0, 17.0, 14.0, 12.0, 8.0, 6.0, 6.0, 4.0, 2.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.138427734375, -0.13474464416503906, -0.13106155395507812, -0.1273784637451172, -0.12369537353515625, -0.12001228332519531, -0.11632919311523438, -0.11264610290527344, -0.1089630126953125, -0.10527992248535156, -0.10159683227539062, -0.09791374206542969, -0.09423065185546875, -0.09054756164550781, -0.08686447143554688, -0.08318138122558594, -0.079498291015625, -0.07581520080566406, -0.07213211059570312, -0.06844902038574219, -0.06476593017578125, -0.06108283996582031, -0.057399749755859375, -0.05371665954589844, -0.0500335693359375, -0.04635047912597656, -0.042667388916015625, -0.03898429870605469, -0.03530120849609375, -0.03161811828613281, -0.027935028076171875, -0.024251937866210938, -0.02056884765625, -0.016885757446289062, -0.013202667236328125, -0.009519577026367188, -0.00583648681640625, -0.0021533966064453125, 0.001529693603515625, 0.0052127838134765625, 0.0088958740234375, 0.012578964233398438, 0.016262054443359375, 0.019945144653320312, 0.02362823486328125, 0.027311325073242188, 0.030994415283203125, 0.03467750549316406, 0.038360595703125, 0.04204368591308594, 0.045726776123046875, 0.04940986633300781, 0.05309295654296875, 0.05677604675292969, 0.060459136962890625, 0.06414222717285156, 0.0678253173828125, 0.07150840759277344, 0.07519149780273438, 0.07887458801269531, 0.08255767822265625, 0.08624076843261719, 0.08992385864257812, 0.09360694885253906, 0.0972900390625]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 7.0, 8.0, 11.0, 21.0, 56.0, 74.0, 134.0, 160.0, 157.0, 145.0, 90.0, 58.0, 33.0, 12.0, 12.0, 7.0, 4.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5847426652908325, -0.5522713661193848, -0.519800066947937, -0.48732873797416687, -0.4548574388027191, -0.42238613963127136, -0.3899148106575012, -0.35744351148605347, -0.3249722123146057, -0.29250091314315796, -0.2600296139717102, -0.22755828499794006, -0.1950869858264923, -0.16261568665504456, -0.1301443725824356, -0.09767305850982666, -0.0652017593383789, -0.032730452716350555, -0.0002591460943222046, 0.032212160527706146, 0.0646834671497345, 0.09715476632118225, 0.1296260803937912, 0.16209739446640015, 0.1945686936378479, 0.22703999280929565, 0.2595112919807434, 0.29198262095451355, 0.3244539201259613, 0.35692521929740906, 0.3893965482711792, 0.42186784744262695, 0.45433902740478516, 0.4868103265762329, 0.5192816257476807, 0.5517529249191284, 0.5842242240905762, 0.6166955232620239, 0.6491668820381165, 0.6816381812095642, 0.714109480381012, 0.7465807795524597, 0.7790520787239075, 0.8115233778953552, 0.8439947366714478, 0.8764660358428955, 0.9089373350143433, 0.941408634185791, 0.9738799333572388, 1.0063512325286865, 1.0388225317001343, 1.071293830871582, 1.1037651300430298, 1.1362364292144775, 1.1687077283859253, 1.201179027557373, 1.2336504459381104, 1.266121745109558, 1.2985930442810059, 1.3310643434524536, 1.3635356426239014, 1.3960069417953491, 1.4284782409667969, 1.4609496593475342, 1.4934208393096924]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 4.0, 6.0, 7.0, 8.0, 7.0, 12.0, 16.0, 22.0, 24.0, 48.0, 43.0, 54.0, 58.0, 66.0, 64.0, 58.0, 69.0, 58.0, 65.0, 55.0, 45.0, 50.0, 45.0, 35.0, 19.0, 15.0, 12.0, 12.0, 7.0, 7.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6479199528694153, -0.6287246346473694, -0.6095293164253235, -0.5903339982032776, -0.5711386799812317, -0.5519433617591858, -0.5327480435371399, -0.5135527849197388, -0.4943574368953705, -0.4751621186733246, -0.4559668004512787, -0.4367714822292328, -0.4175761938095093, -0.3983808755874634, -0.3791855573654175, -0.3599902391433716, -0.3407949209213257, -0.3215996026992798, -0.3024042844772339, -0.283208966255188, -0.2640136480331421, -0.24481834471225739, -0.22562304139137268, -0.20642772316932678, -0.18723240494728088, -0.16803708672523499, -0.1488417685031891, -0.12964646518230438, -0.11045114696025848, -0.09125582873821259, -0.07206051796674728, -0.05286520719528198, -0.033669888973236084, -0.014474574476480484, 0.004720740020275116, 0.023916054517030716, 0.043111369013786316, 0.062306687235832214, 0.08150199800729752, 0.10069730877876282, 0.11989262700080872, 0.13908794522285461, 0.1582832634449005, 0.17747856676578522, 0.19667388498783112, 0.21586920320987701, 0.23506450653076172, 0.2542598247528076, 0.2734551429748535, 0.2926504611968994, 0.3118457794189453, 0.3310410976409912, 0.3502364158630371, 0.369431734085083, 0.3886270225048065, 0.4078223407268524, 0.4270176589488983, 0.4462129771709442, 0.4654082953929901, 0.484603613615036, 0.5037989020347595, 0.5229942202568054, 0.5421895384788513, 0.5613848567008972, 0.5805801749229431]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 7.0, 3.0, 10.0, 20.0, 32.0, 36.0, 50.0, 78.0, 116.0, 170.0, 231.0, 396.0, 549.0, 892.0, 1339.0, 2325.0, 3405.0, 5680.0, 9469.0, 16380.0, 32045.0, 393414.0, 504835.0, 34300.0, 17039.0, 9819.0, 5926.0, 3606.0, 2193.0, 1440.0, 957.0, 611.0, 395.0, 253.0, 181.0, 113.0, 67.0, 46.0, 37.0, 31.0, 22.0, 11.0, 10.0, 7.0, 7.0, 2.0, 1.0, 5.0], "bins": [-0.47998046875, -0.4673614501953125, -0.454742431640625, -0.4421234130859375, -0.42950439453125, -0.4168853759765625, -0.404266357421875, -0.3916473388671875, -0.3790283203125, -0.3664093017578125, -0.353790283203125, -0.3411712646484375, -0.32855224609375, -0.3159332275390625, -0.303314208984375, -0.2906951904296875, -0.278076171875, -0.2654571533203125, -0.252838134765625, -0.2402191162109375, -0.22760009765625, -0.2149810791015625, -0.202362060546875, -0.1897430419921875, -0.1771240234375, -0.1645050048828125, -0.151885986328125, -0.1392669677734375, -0.12664794921875, -0.1140289306640625, -0.101409912109375, -0.0887908935546875, -0.076171875, -0.0635528564453125, -0.050933837890625, -0.0383148193359375, -0.02569580078125, -0.0130767822265625, -0.000457763671875, 0.0121612548828125, 0.0247802734375, 0.0373992919921875, 0.050018310546875, 0.0626373291015625, 0.07525634765625, 0.0878753662109375, 0.100494384765625, 0.1131134033203125, 0.125732421875, 0.1383514404296875, 0.150970458984375, 0.1635894775390625, 0.17620849609375, 0.1888275146484375, 0.201446533203125, 0.2140655517578125, 0.2266845703125, 0.2393035888671875, 0.251922607421875, 0.2645416259765625, 0.27716064453125, 0.2897796630859375, 0.302398681640625, 0.3150177001953125, 0.32763671875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 7.0, 3.0, 3.0, 3.0, 6.0, 7.0, 8.0, 8.0, 10.0, 18.0, 36.0, 86.0, 242.0, 273.0, 156.0, 43.0, 17.0, 11.0, 11.0, 5.0, 6.0, 7.0, 2.0, 5.0, 9.0, 3.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05657958984375, -0.054511070251464844, -0.05244255065917969, -0.05037403106689453, -0.048305511474609375, -0.04623699188232422, -0.04416847229003906, -0.042099952697753906, -0.04003143310546875, -0.037962913513183594, -0.03589439392089844, -0.03382587432861328, -0.031757354736328125, -0.02968883514404297, -0.027620315551757812, -0.025551795959472656, -0.0234832763671875, -0.021414756774902344, -0.019346237182617188, -0.01727771759033203, -0.015209197998046875, -0.013140678405761719, -0.011072158813476562, -0.009003639221191406, -0.00693511962890625, -0.004866600036621094, -0.0027980804443359375, -0.0007295608520507812, 0.001338958740234375, 0.0034074783325195312, 0.0054759979248046875, 0.007544517517089844, 0.009613037109375, 0.011681556701660156, 0.013750076293945312, 0.01581859588623047, 0.017887115478515625, 0.01995563507080078, 0.022024154663085938, 0.024092674255371094, 0.02616119384765625, 0.028229713439941406, 0.030298233032226562, 0.03236675262451172, 0.034435272216796875, 0.03650379180908203, 0.03857231140136719, 0.040640830993652344, 0.0427093505859375, 0.044777870178222656, 0.04684638977050781, 0.04891490936279297, 0.050983428955078125, 0.05305194854736328, 0.05512046813964844, 0.057188987731933594, 0.05925750732421875, 0.061326026916503906, 0.06339454650878906, 0.06546306610107422, 0.06753158569335938, 0.06960010528564453, 0.07166862487792969, 0.07373714447021484, 0.0758056640625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 2.0, 6.0, 3.0, 4.0, 3.0, 4.0, 10.0, 13.0, 15.0, 19.0, 30.0, 42.0, 61.0, 74.0, 110.0, 172.0, 207.0, 438.0, 692.0, 1354.0, 2852.0, 7290.0, 22240.0, 86954.0, 358226.0, 419511.0, 106588.0, 26522.0, 8336.0, 3242.0, 1497.0, 750.0, 433.0, 266.0, 167.0, 115.0, 82.0, 67.0, 45.0, 32.0, 26.0, 16.0, 12.0, 8.0, 11.0, 6.0, 0.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.434814453125, -0.4198570251464844, -0.40489959716796875, -0.3899421691894531, -0.3749847412109375, -0.3600273132324219, -0.34506988525390625, -0.3301124572753906, -0.315155029296875, -0.3001976013183594, -0.28524017333984375, -0.2702827453613281, -0.2553253173828125, -0.24036788940429688, -0.22541046142578125, -0.21045303344726562, -0.19549560546875, -0.18053817749023438, -0.16558074951171875, -0.15062332153320312, -0.1356658935546875, -0.12070846557617188, -0.10575103759765625, -0.09079360961914062, -0.075836181640625, -0.060878753662109375, -0.04592132568359375, -0.030963897705078125, -0.0160064697265625, -0.001049041748046875, 0.01390838623046875, 0.028865814208984375, 0.0438232421875, 0.058780670166015625, 0.07373809814453125, 0.08869552612304688, 0.1036529541015625, 0.11861038208007812, 0.13356781005859375, 0.14852523803710938, 0.163482666015625, 0.17844009399414062, 0.19339752197265625, 0.20835494995117188, 0.2233123779296875, 0.23826980590820312, 0.25322723388671875, 0.2681846618652344, 0.28314208984375, 0.2980995178222656, 0.31305694580078125, 0.3280143737792969, 0.3429718017578125, 0.3579292297363281, 0.37288665771484375, 0.3878440856933594, 0.402801513671875, 0.4177589416503906, 0.43271636962890625, 0.4476737976074219, 0.4626312255859375, 0.4775886535644531, 0.49254608154296875, 0.5075035095214844, 0.5224609375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 5.0, 6.0, 9.0, 8.0, 8.0, 15.0, 18.0, 17.0, 20.0, 19.0, 27.0, 33.0, 28.0, 41.0, 40.0, 43.0, 45.0, 41.0, 45.0, 41.0, 38.0, 45.0, 34.0, 45.0, 45.0, 33.0, 35.0, 30.0, 26.0, 24.0, 20.0, 17.0, 19.0, 17.0, 14.0, 14.0, 14.0, 5.0, 3.0, 3.0, 3.0, 8.0, 1.0, 4.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.29541015625, -0.28730010986328125, -0.2791900634765625, -0.27108001708984375, -0.262969970703125, -0.25485992431640625, -0.2467498779296875, -0.23863983154296875, -0.23052978515625, -0.22241973876953125, -0.2143096923828125, -0.20619964599609375, -0.198089599609375, -0.18997955322265625, -0.1818695068359375, -0.17375946044921875, -0.1656494140625, -0.15753936767578125, -0.1494293212890625, -0.14131927490234375, -0.133209228515625, -0.12509918212890625, -0.1169891357421875, -0.10887908935546875, -0.10076904296875, -0.09265899658203125, -0.0845489501953125, -0.07643890380859375, -0.068328857421875, -0.06021881103515625, -0.0521087646484375, -0.04399871826171875, -0.035888671875, -0.02777862548828125, -0.0196685791015625, -0.01155853271484375, -0.003448486328125, 0.00466156005859375, 0.0127716064453125, 0.02088165283203125, 0.02899169921875, 0.03710174560546875, 0.0452117919921875, 0.05332183837890625, 0.061431884765625, 0.06954193115234375, 0.0776519775390625, 0.08576202392578125, 0.0938720703125, 0.10198211669921875, 0.1100921630859375, 0.11820220947265625, 0.126312255859375, 0.13442230224609375, 0.1425323486328125, 0.15064239501953125, 0.15875244140625, 0.16686248779296875, 0.1749725341796875, 0.18308258056640625, 0.191192626953125, 0.19930267333984375, 0.2074127197265625, 0.21552276611328125, 0.2236328125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 5.0, 2.0, 9.0, 15.0, 23.0, 41.0, 62.0, 88.0, 173.0, 395.0, 869.0, 2711.0, 12907.0, 393653.0, 616950.0, 15857.0, 2970.0, 967.0, 382.0, 196.0, 110.0, 49.0, 32.0, 14.0, 20.0, 21.0, 7.0, 8.0, 7.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.97314453125, -0.942779541015625, -0.91241455078125, -0.882049560546875, -0.8516845703125, -0.821319580078125, -0.79095458984375, -0.760589599609375, -0.730224609375, -0.699859619140625, -0.66949462890625, -0.639129638671875, -0.6087646484375, -0.578399658203125, -0.54803466796875, -0.517669677734375, -0.4873046875, -0.456939697265625, -0.42657470703125, -0.396209716796875, -0.3658447265625, -0.335479736328125, -0.30511474609375, -0.274749755859375, -0.244384765625, -0.214019775390625, -0.18365478515625, -0.153289794921875, -0.1229248046875, -0.092559814453125, -0.06219482421875, -0.031829833984375, -0.00146484375, 0.028900146484375, 0.05926513671875, 0.089630126953125, 0.1199951171875, 0.150360107421875, 0.18072509765625, 0.211090087890625, 0.241455078125, 0.271820068359375, 0.30218505859375, 0.332550048828125, 0.3629150390625, 0.393280029296875, 0.42364501953125, 0.454010009765625, 0.484375, 0.514739990234375, 0.54510498046875, 0.575469970703125, 0.6058349609375, 0.636199951171875, 0.66656494140625, 0.696929931640625, 0.727294921875, 0.757659912109375, 0.78802490234375, 0.818389892578125, 0.8487548828125, 0.879119873046875, 0.90948486328125, 0.939849853515625, 0.97021484375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 6.0, 7.0, 10.0, 18.0, 31.0, 49.0, 65.0, 90.0, 121.0, 123.0, 119.0, 108.0, 78.0, 58.0, 40.0, 29.0, 16.0, 12.0, 12.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.21540641784668e-05, -5.070120096206665e-05, -4.9248337745666504e-05, -4.779547452926636e-05, -4.634261131286621e-05, -4.4889748096466064e-05, -4.343688488006592e-05, -4.198402166366577e-05, -4.0531158447265625e-05, -3.907829523086548e-05, -3.762543201446533e-05, -3.6172568798065186e-05, -3.471970558166504e-05, -3.326684236526489e-05, -3.1813979148864746e-05, -3.03611159324646e-05, -2.8908252716064453e-05, -2.7455389499664307e-05, -2.600252628326416e-05, -2.4549663066864014e-05, -2.3096799850463867e-05, -2.164393663406372e-05, -2.0191073417663574e-05, -1.8738210201263428e-05, -1.728534698486328e-05, -1.5832483768463135e-05, -1.4379620552062988e-05, -1.2926757335662842e-05, -1.1473894119262695e-05, -1.0021030902862549e-05, -8.568167686462402e-06, -7.115304470062256e-06, -5.662441253662109e-06, -4.209578037261963e-06, -2.7567148208618164e-06, -1.30385160446167e-06, 1.4901161193847656e-07, 1.601874828338623e-06, 3.0547380447387695e-06, 4.507601261138916e-06, 5.9604644775390625e-06, 7.413327693939209e-06, 8.866190910339355e-06, 1.0319054126739502e-05, 1.1771917343139648e-05, 1.3224780559539795e-05, 1.4677643775939941e-05, 1.6130506992340088e-05, 1.7583370208740234e-05, 1.903623342514038e-05, 2.0489096641540527e-05, 2.1941959857940674e-05, 2.339482307434082e-05, 2.4847686290740967e-05, 2.6300549507141113e-05, 2.775341272354126e-05, 2.9206275939941406e-05, 3.065913915634155e-05, 3.21120023727417e-05, 3.3564865589141846e-05, 3.501772880554199e-05, 3.647059202194214e-05, 3.7923455238342285e-05, 3.937631845474243e-05, 4.082918167114258e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 6.0, 9.0, 2.0, 10.0, 10.0, 19.0, 34.0, 72.0, 123.0, 255.0, 674.0, 1686.0, 5718.0, 25476.0, 199966.0, 681319.0, 110207.0, 16544.0, 4109.0, 1329.0, 543.0, 218.0, 93.0, 55.0, 38.0, 22.0, 10.0, 7.0, 2.0, 0.0, 3.0, 6.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.61474609375, -0.598724365234375, -0.58270263671875, -0.566680908203125, -0.5506591796875, -0.534637451171875, -0.51861572265625, -0.502593994140625, -0.486572265625, -0.470550537109375, -0.45452880859375, -0.438507080078125, -0.4224853515625, -0.406463623046875, -0.39044189453125, -0.374420166015625, -0.3583984375, -0.342376708984375, -0.32635498046875, -0.310333251953125, -0.2943115234375, -0.278289794921875, -0.26226806640625, -0.246246337890625, -0.230224609375, -0.214202880859375, -0.19818115234375, -0.182159423828125, -0.1661376953125, -0.150115966796875, -0.13409423828125, -0.118072509765625, -0.10205078125, -0.086029052734375, -0.07000732421875, -0.053985595703125, -0.0379638671875, -0.021942138671875, -0.00592041015625, 0.010101318359375, 0.026123046875, 0.042144775390625, 0.05816650390625, 0.074188232421875, 0.0902099609375, 0.106231689453125, 0.12225341796875, 0.138275146484375, 0.154296875, 0.170318603515625, 0.18634033203125, 0.202362060546875, 0.2183837890625, 0.234405517578125, 0.25042724609375, 0.266448974609375, 0.282470703125, 0.298492431640625, 0.31451416015625, 0.330535888671875, 0.3465576171875, 0.362579345703125, 0.37860107421875, 0.394622802734375, 0.41064453125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 7.0, 4.0, 4.0, 6.0, 5.0, 8.0, 3.0, 6.0, 12.0, 29.0, 26.0, 31.0, 46.0, 40.0, 48.0, 61.0, 54.0, 65.0, 59.0, 73.0, 64.0, 56.0, 43.0, 46.0, 42.0, 43.0, 27.0, 23.0, 18.0, 14.0, 4.0, 9.0, 8.0, 3.0, 7.0, 4.0, 1.0, 5.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.294921875, -0.28591156005859375, -0.2769012451171875, -0.26789093017578125, -0.258880615234375, -0.24987030029296875, -0.2408599853515625, -0.23184967041015625, -0.22283935546875, -0.21382904052734375, -0.2048187255859375, -0.19580841064453125, -0.186798095703125, -0.17778778076171875, -0.1687774658203125, -0.15976715087890625, -0.1507568359375, -0.14174652099609375, -0.1327362060546875, -0.12372589111328125, -0.114715576171875, -0.10570526123046875, -0.0966949462890625, -0.08768463134765625, -0.07867431640625, -0.06966400146484375, -0.0606536865234375, -0.05164337158203125, -0.042633056640625, -0.03362274169921875, -0.0246124267578125, -0.01560211181640625, -0.006591796875, 0.00241851806640625, 0.0114288330078125, 0.02043914794921875, 0.029449462890625, 0.03845977783203125, 0.0474700927734375, 0.05648040771484375, 0.06549072265625, 0.07450103759765625, 0.0835113525390625, 0.09252166748046875, 0.101531982421875, 0.11054229736328125, 0.1195526123046875, 0.12856292724609375, 0.1375732421875, 0.14658355712890625, 0.1555938720703125, 0.16460418701171875, 0.173614501953125, 0.18262481689453125, 0.1916351318359375, 0.20064544677734375, 0.20965576171875, 0.21866607666015625, 0.2276763916015625, 0.23668670654296875, 0.245697021484375, 0.25470733642578125, 0.2637176513671875, 0.27272796630859375, 0.28173828125]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 2.0, 8.0, 11.0, 8.0, 20.0, 53.0, 98.0, 232.0, 290.0, 142.0, 73.0, 21.0, 13.0, 10.0, 5.0, 2.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.161901473999023, -4.965007305145264, -4.768112659454346, -4.571218490600586, -4.374323844909668, -4.177429676055908, -3.9805352687835693, -3.7836408615112305, -3.5867464542388916, -3.3898520469665527, -3.192957639694214, -2.996063232421875, -2.7991690635681152, -2.6022744178771973, -2.4053802490234375, -2.2084858417510986, -2.0115914344787598, -1.814697027206421, -1.617802619934082, -1.4209083318710327, -1.2240139245986938, -1.027119517326355, -0.8302252292633057, -0.6333308219909668, -0.43643641471862793, -0.23954203724861145, -0.04264765977859497, 0.15424668788909912, 0.351141095161438, 0.5480355024337769, 0.7449297904968262, 0.941824197769165, 1.138718605041504, 1.3356130123138428, 1.5325074195861816, 1.729401707649231, 1.9262961149215698, 2.123190402984619, 2.320084810256958, 2.516979217529297, 2.7138736248016357, 2.9107680320739746, 3.1076624393463135, 3.3045568466186523, 3.501451015472412, 3.69834566116333, 3.89523983001709, 4.092134475708008, 4.289028644561768, 4.485922813415527, 4.682817459106445, 4.879711627960205, 5.076606273651123, 5.273500442504883, 5.470395088195801, 5.6672892570495605, 5.86418342590332, 6.06107759475708, 6.257972240447998, 6.454866409301758, 6.651761054992676, 6.8486552238464355, 7.045549392700195, 7.242444038391113, 7.439338684082031]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 4.0, 6.0, 2.0, 7.0, 4.0, 6.0, 10.0, 10.0, 14.0, 14.0, 32.0, 44.0, 66.0, 109.0, 127.0, 131.0, 134.0, 90.0, 53.0, 45.0, 21.0, 10.0, 11.0, 11.0, 9.0, 7.0, 3.0, 2.0, 3.0, 6.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-5.683117866516113, -5.527040958404541, -5.370964050292969, -5.214886665344238, -5.058809757232666, -4.902732849121094, -4.7466559410095215, -4.590579032897949, -4.434501647949219, -4.2784247398376465, -4.122347831726074, -3.966270685195923, -3.8101935386657715, -3.654116630554199, -3.498039722442627, -3.3419625759124756, -3.1858856678009033, -3.029808759689331, -2.8737316131591797, -2.7176547050476074, -2.561577558517456, -2.405500650405884, -2.2494235038757324, -2.09334659576416, -1.9372695684432983, -1.7811925411224365, -1.6251155138015747, -1.469038486480713, -1.3129615783691406, -1.1568844318389893, -1.000807523727417, -0.8447304964065552, -0.6886534690856934, -0.5325764417648315, -0.3764994442462921, -0.22042244672775269, -0.06434541940689087, 0.09173160791397095, 0.247808575630188, 0.4038856029510498, 0.5599626302719116, 0.7160396575927734, 0.8721166849136353, 1.028193712234497, 1.1842706203460693, 1.3403477668762207, 1.496424674987793, 1.6525017023086548, 1.8085787296295166, 1.9646557569503784, 2.1207327842712402, 2.2768096923828125, 2.432886838912964, 2.588963747024536, 2.7450408935546875, 2.9011178016662598, 3.057194709777832, 3.2132716178894043, 3.3693487644195557, 3.525425672531128, 3.6815028190612793, 3.8375797271728516, 3.993656635284424, 4.149733543395996, 4.305810928344727]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 5.0, 10.0, 6.0, 21.0, 37.0, 76.0, 259.0, 1620.0, 20500.0, 4132452.0, 36671.0, 2088.0, 336.0, 125.0, 33.0, 20.0, 8.0, 12.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.02734375, -4.914581298828125, -4.80181884765625, -4.689056396484375, -4.5762939453125, -4.463531494140625, -4.35076904296875, -4.238006591796875, -4.125244140625, -4.012481689453125, -3.89971923828125, -3.786956787109375, -3.6741943359375, -3.561431884765625, -3.44866943359375, -3.335906982421875, -3.22314453125, -3.110382080078125, -2.99761962890625, -2.884857177734375, -2.7720947265625, -2.659332275390625, -2.54656982421875, -2.433807373046875, -2.321044921875, -2.208282470703125, -2.09552001953125, -1.982757568359375, -1.8699951171875, -1.757232666015625, -1.64447021484375, -1.531707763671875, -1.4189453125, -1.306182861328125, -1.19342041015625, -1.080657958984375, -0.9678955078125, -0.855133056640625, -0.74237060546875, -0.629608154296875, -0.516845703125, -0.404083251953125, -0.29132080078125, -0.178558349609375, -0.0657958984375, 0.046966552734375, 0.15972900390625, 0.272491455078125, 0.38525390625, 0.498016357421875, 0.61077880859375, 0.723541259765625, 0.8363037109375, 0.949066162109375, 1.06182861328125, 1.174591064453125, 1.287353515625, 1.400115966796875, 1.51287841796875, 1.625640869140625, 1.7384033203125, 1.851165771484375, 1.96392822265625, 2.076690673828125, 2.189453125]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 5.0, 2.0, 5.0, 5.0, 3.0, 4.0, 4.0, 11.0, 10.0, 14.0, 25.0, 34.0, 80.0, 151.0, 208.0, 190.0, 94.0, 56.0, 27.0, 15.0, 7.0, 7.0, 7.0, 3.0, 15.0, 6.0, 3.0, 3.0, 3.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0684814453125, -0.06632328033447266, -0.06416511535644531, -0.06200695037841797, -0.059848785400390625, -0.05769062042236328, -0.05553245544433594, -0.053374290466308594, -0.05121612548828125, -0.049057960510253906, -0.04689979553222656, -0.04474163055419922, -0.042583465576171875, -0.04042530059814453, -0.03826713562011719, -0.036108970642089844, -0.0339508056640625, -0.031792640686035156, -0.029634475708007812, -0.02747631072998047, -0.025318145751953125, -0.02315998077392578, -0.021001815795898438, -0.018843650817871094, -0.01668548583984375, -0.014527320861816406, -0.012369155883789062, -0.010210990905761719, -0.008052825927734375, -0.005894660949707031, -0.0037364959716796875, -0.0015783309936523438, 0.000579833984375, 0.0027379989624023438, 0.0048961639404296875, 0.007054328918457031, 0.009212493896484375, 0.011370658874511719, 0.013528823852539062, 0.015686988830566406, 0.01784515380859375, 0.020003318786621094, 0.022161483764648438, 0.02431964874267578, 0.026477813720703125, 0.02863597869873047, 0.030794143676757812, 0.032952308654785156, 0.0351104736328125, 0.037268638610839844, 0.03942680358886719, 0.04158496856689453, 0.043743133544921875, 0.04590129852294922, 0.04805946350097656, 0.050217628479003906, 0.05237579345703125, 0.054533958435058594, 0.05669212341308594, 0.05885028839111328, 0.061008453369140625, 0.06316661834716797, 0.06532478332519531, 0.06748294830322266, 0.06964111328125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 7.0, 3.0, 9.0, 11.0, 24.0, 25.0, 33.0, 43.0, 80.0, 100.0, 171.0, 220.0, 397.0, 629.0, 1047.0, 1845.0, 3331.0, 6646.0, 14719.0, 38548.0, 149458.0, 2134174.0, 1639921.0, 137068.0, 36876.0, 14183.0, 6498.0, 3301.0, 1918.0, 1098.0, 665.0, 425.0, 276.0, 175.0, 132.0, 71.0, 51.0, 30.0, 24.0, 19.0, 15.0, 9.0, 8.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5419921875, -0.522613525390625, -0.50323486328125, -0.483856201171875, -0.4644775390625, -0.445098876953125, -0.42572021484375, -0.406341552734375, -0.386962890625, -0.367584228515625, -0.34820556640625, -0.328826904296875, -0.3094482421875, -0.290069580078125, -0.27069091796875, -0.251312255859375, -0.23193359375, -0.212554931640625, -0.19317626953125, -0.173797607421875, -0.1544189453125, -0.135040283203125, -0.11566162109375, -0.096282958984375, -0.076904296875, -0.057525634765625, -0.03814697265625, -0.018768310546875, 0.0006103515625, 0.019989013671875, 0.03936767578125, 0.058746337890625, 0.078125, 0.097503662109375, 0.11688232421875, 0.136260986328125, 0.1556396484375, 0.175018310546875, 0.19439697265625, 0.213775634765625, 0.233154296875, 0.252532958984375, 0.27191162109375, 0.291290283203125, 0.3106689453125, 0.330047607421875, 0.34942626953125, 0.368804931640625, 0.38818359375, 0.407562255859375, 0.42694091796875, 0.446319580078125, 0.4656982421875, 0.485076904296875, 0.50445556640625, 0.523834228515625, 0.543212890625, 0.562591552734375, 0.58197021484375, 0.601348876953125, 0.6207275390625, 0.640106201171875, 0.65948486328125, 0.678863525390625, 0.6982421875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 1.0, 9.0, 10.0, 19.0, 7.0, 19.0, 22.0, 41.0, 92.0, 168.0, 374.0, 1186.0, 1256.0, 408.0, 170.0, 94.0, 67.0, 36.0, 30.0, 20.0, 9.0, 9.0, 7.0, 3.0, 3.0, 2.0, 4.0, 3.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.148193359375, -0.14369773864746094, -0.13920211791992188, -0.1347064971923828, -0.13021087646484375, -0.1257152557373047, -0.12121963500976562, -0.11672401428222656, -0.1122283935546875, -0.10773277282714844, -0.10323715209960938, -0.09874153137207031, -0.09424591064453125, -0.08975028991699219, -0.08525466918945312, -0.08075904846191406, -0.076263427734375, -0.07176780700683594, -0.06727218627929688, -0.06277656555175781, -0.05828094482421875, -0.05378532409667969, -0.049289703369140625, -0.04479408264160156, -0.0402984619140625, -0.03580284118652344, -0.031307220458984375, -0.026811599731445312, -0.02231597900390625, -0.017820358276367188, -0.013324737548828125, -0.008829116821289062, -0.00433349609375, 0.0001621246337890625, 0.004657745361328125, 0.009153366088867188, 0.01364898681640625, 0.018144607543945312, 0.022640228271484375, 0.027135848999023438, 0.0316314697265625, 0.03612709045410156, 0.040622711181640625, 0.04511833190917969, 0.04961395263671875, 0.05410957336425781, 0.058605194091796875, 0.06310081481933594, 0.067596435546875, 0.07209205627441406, 0.07658767700195312, 0.08108329772949219, 0.08557891845703125, 0.09007453918457031, 0.09457015991210938, 0.09906578063964844, 0.1035614013671875, 0.10805702209472656, 0.11255264282226562, 0.11704826354980469, 0.12154388427734375, 0.1260395050048828, 0.13053512573242188, 0.13503074645996094, 0.1395263671875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 30.0, 193.0, 517.0, 209.0, 44.0, 9.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.846590280532837, -1.7603347301483154, -1.674079179763794, -1.5878236293792725, -1.501568078994751, -1.4153125286102295, -1.3290568590164185, -1.242801308631897, -1.1565457582473755, -1.070290207862854, -0.9840346574783325, -0.8977790474891663, -0.8115234971046448, -0.7252679467201233, -0.639012336730957, -0.5527567863464355, -0.46650123596191406, -0.3802456855773926, -0.2939901053905487, -0.20773452520370483, -0.12147897481918335, -0.035223424434661865, 0.051032185554504395, 0.13728773593902588, 0.22354328632354736, 0.30979883670806885, 0.3960544168949127, 0.4823099970817566, 0.5685655474662781, 0.6548210978507996, 0.7410767078399658, 0.8273322582244873, 0.9135878086090088, 0.9998433589935303, 1.0860989093780518, 1.1723544597625732, 1.2586100101470947, 1.3448655605316162, 1.4311212301254272, 1.5173767805099487, 1.6036323308944702, 1.6898878812789917, 1.7761434316635132, 1.8623991012573242, 1.9486546516418457, 2.034910202026367, 2.1211657524108887, 2.20742130279541, 2.2936768531799316, 2.379932403564453, 2.4661879539489746, 2.552443504333496, 2.6386990547180176, 2.724954605102539, 2.8112101554870605, 2.897465705871582, 2.9837212562561035, 3.069976806640625, 3.1562323570251465, 3.242487907409668, 3.3287434577941895, 3.414999008178711, 3.5012545585632324, 3.587510108947754, 3.6737658977508545]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 5.0, 6.0, 5.0, 5.0, 2.0, 4.0, 9.0, 6.0, 7.0, 18.0, 25.0, 35.0, 53.0, 56.0, 91.0, 92.0, 105.0, 115.0, 87.0, 70.0, 59.0, 49.0, 29.0, 19.0, 12.0, 13.0, 7.0, 8.0, 1.0, 0.0, 5.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7490231394767761, -0.7257136702537537, -0.7024042010307312, -0.6790947318077087, -0.6557852029800415, -0.632475733757019, -0.6091662645339966, -0.5858567953109741, -0.5625473260879517, -0.5392378568649292, -0.5159283876419067, -0.4926188886165619, -0.46930941939353943, -0.44599995017051697, -0.4226904511451721, -0.39938098192214966, -0.3760715126991272, -0.35276204347610474, -0.3294525742530823, -0.3061430752277374, -0.28283360600471497, -0.2595241367816925, -0.23621465265750885, -0.2129051685333252, -0.18959569931030273, -0.16628623008728027, -0.14297674596309662, -0.11966726928949356, -0.0963577926158905, -0.07304831594228745, -0.04973883926868439, -0.026429355144500732, -0.003119826316833496, 0.020189650356769562, 0.04349912703037262, 0.06680860370397568, 0.09011808037757874, 0.1134275570511818, 0.13673703372478485, 0.1600465178489685, 0.18335598707199097, 0.20666545629501343, 0.22997494041919708, 0.25328442454338074, 0.2765938937664032, 0.29990336298942566, 0.3232128620147705, 0.34652233123779297, 0.36983180046081543, 0.3931412696838379, 0.41645073890686035, 0.4397602379322052, 0.46306970715522766, 0.4863791763782501, 0.509688675403595, 0.5329981446266174, 0.5563076138496399, 0.5796170830726624, 0.6029265522956848, 0.6262360215187073, 0.6495455503463745, 0.672855019569397, 0.6961644887924194, 0.7194739580154419, 0.7427834272384644]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 6.0, 3.0, 3.0, 1.0, 5.0, 10.0, 13.0, 10.0, 19.0, 20.0, 34.0, 70.0, 128.0, 232.0, 434.0, 893.0, 2066.0, 5991.0, 19687.0, 107792.0, 751037.0, 127605.0, 21783.0, 6471.0, 2279.0, 968.0, 414.0, 239.0, 130.0, 72.0, 43.0, 24.0, 14.0, 7.0, 7.0, 6.0, 8.0, 4.0, 10.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.78369140625, -0.7603225708007812, -0.7369537353515625, -0.7135848999023438, -0.690216064453125, -0.6668472290039062, -0.6434783935546875, -0.6201095581054688, -0.59674072265625, -0.5733718872070312, -0.5500030517578125, -0.5266342163085938, -0.503265380859375, -0.47989654541015625, -0.4565277099609375, -0.43315887451171875, -0.4097900390625, -0.38642120361328125, -0.3630523681640625, -0.33968353271484375, -0.316314697265625, -0.29294586181640625, -0.2695770263671875, -0.24620819091796875, -0.22283935546875, -0.19947052001953125, -0.1761016845703125, -0.15273284912109375, -0.129364013671875, -0.10599517822265625, -0.0826263427734375, -0.05925750732421875, -0.035888671875, -0.01251983642578125, 0.0108489990234375, 0.03421783447265625, 0.057586669921875, 0.08095550537109375, 0.1043243408203125, 0.12769317626953125, 0.15106201171875, 0.17443084716796875, 0.1977996826171875, 0.22116851806640625, 0.244537353515625, 0.26790618896484375, 0.2912750244140625, 0.31464385986328125, 0.3380126953125, 0.36138153076171875, 0.3847503662109375, 0.40811920166015625, 0.431488037109375, 0.45485687255859375, 0.4782257080078125, 0.5015945434570312, 0.52496337890625, 0.5483322143554688, 0.5717010498046875, 0.5950698852539062, 0.618438720703125, 0.6418075561523438, 0.6651763916015625, 0.6885452270507812, 0.7119140625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 6.0, 8.0, 11.0, 9.0, 16.0, 30.0, 71.0, 106.0, 184.0, 198.0, 150.0, 98.0, 48.0, 23.0, 13.0, 4.0, 8.0, 9.0, 7.0, 1.0, 1.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04547119140625, -0.04298686981201172, -0.04050254821777344, -0.038018226623535156, -0.035533905029296875, -0.033049583435058594, -0.030565261840820312, -0.02808094024658203, -0.02559661865234375, -0.02311229705810547, -0.020627975463867188, -0.018143653869628906, -0.015659332275390625, -0.013175010681152344, -0.010690689086914062, -0.008206367492675781, -0.0057220458984375, -0.0032377243041992188, -0.0007534027099609375, 0.0017309188842773438, 0.004215240478515625, 0.006699562072753906, 0.009183883666992188, 0.011668205261230469, 0.01415252685546875, 0.01663684844970703, 0.019121170043945312, 0.021605491638183594, 0.024089813232421875, 0.026574134826660156, 0.029058456420898438, 0.03154277801513672, 0.034027099609375, 0.03651142120361328, 0.03899574279785156, 0.041480064392089844, 0.043964385986328125, 0.046448707580566406, 0.04893302917480469, 0.05141735076904297, 0.05390167236328125, 0.05638599395751953, 0.05887031555175781, 0.061354637145996094, 0.06383895874023438, 0.06632328033447266, 0.06880760192871094, 0.07129192352294922, 0.0737762451171875, 0.07626056671142578, 0.07874488830566406, 0.08122920989990234, 0.08371353149414062, 0.0861978530883789, 0.08868217468261719, 0.09116649627685547, 0.09365081787109375, 0.09613513946533203, 0.09861946105957031, 0.1011037826538086, 0.10358810424804688, 0.10607242584228516, 0.10855674743652344, 0.11104106903076172, 0.113525390625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 6.0, 3.0, 3.0, 4.0, 4.0, 3.0, 6.0, 3.0, 5.0, 5.0, 5.0, 8.0, 9.0, 43.0, 187.0, 2296.0, 356094.0, 685696.0, 3814.0, 255.0, 40.0, 11.0, 2.0, 3.0, 9.0, 4.0, 1.0, 13.0, 4.0, 3.0, 2.0, 6.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.4140625, -2.3506622314453125, -2.287261962890625, -2.2238616943359375, -2.16046142578125, -2.0970611572265625, -2.033660888671875, -1.9702606201171875, -1.9068603515625, -1.8434600830078125, -1.780059814453125, -1.7166595458984375, -1.65325927734375, -1.5898590087890625, -1.526458740234375, -1.4630584716796875, -1.399658203125, -1.3362579345703125, -1.272857666015625, -1.2094573974609375, -1.14605712890625, -1.0826568603515625, -1.019256591796875, -0.9558563232421875, -0.8924560546875, -0.8290557861328125, -0.765655517578125, -0.7022552490234375, -0.63885498046875, -0.5754547119140625, -0.512054443359375, -0.4486541748046875, -0.38525390625, -0.3218536376953125, -0.258453369140625, -0.1950531005859375, -0.13165283203125, -0.0682525634765625, -0.004852294921875, 0.0585479736328125, 0.1219482421875, 0.1853485107421875, 0.248748779296875, 0.3121490478515625, 0.37554931640625, 0.4389495849609375, 0.502349853515625, 0.5657501220703125, 0.629150390625, 0.6925506591796875, 0.755950927734375, 0.8193511962890625, 0.88275146484375, 0.9461517333984375, 1.009552001953125, 1.0729522705078125, 1.1363525390625, 1.1997528076171875, 1.263153076171875, 1.3265533447265625, 1.38995361328125, 1.4533538818359375, 1.516754150390625, 1.5801544189453125, 1.6435546875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 3.0, 2.0, 4.0, 4.0, 8.0, 1.0, 3.0, 7.0, 15.0, 11.0, 13.0, 13.0, 16.0, 22.0, 15.0, 30.0, 32.0, 46.0, 42.0, 34.0, 47.0, 33.0, 38.0, 44.0, 38.0, 31.0, 44.0, 50.0, 36.0, 33.0, 42.0, 36.0, 36.0, 25.0, 23.0, 19.0, 10.0, 18.0, 15.0, 18.0, 10.0, 9.0, 8.0, 5.0, 6.0, 6.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15380859375, -0.14833450317382812, -0.14286041259765625, -0.13738632202148438, -0.1319122314453125, -0.12643814086914062, -0.12096405029296875, -0.11548995971679688, -0.110015869140625, -0.10454177856445312, -0.09906768798828125, -0.09359359741210938, -0.0881195068359375, -0.08264541625976562, -0.07717132568359375, -0.07169723510742188, -0.06622314453125, -0.060749053955078125, -0.05527496337890625, -0.049800872802734375, -0.0443267822265625, -0.038852691650390625, -0.03337860107421875, -0.027904510498046875, -0.022430419921875, -0.016956329345703125, -0.01148223876953125, -0.006008148193359375, -0.0005340576171875, 0.004940032958984375, 0.01041412353515625, 0.015888214111328125, 0.0213623046875, 0.026836395263671875, 0.03231048583984375, 0.037784576416015625, 0.0432586669921875, 0.048732757568359375, 0.05420684814453125, 0.059680938720703125, 0.065155029296875, 0.07062911987304688, 0.07610321044921875, 0.08157730102539062, 0.0870513916015625, 0.09252548217773438, 0.09799957275390625, 0.10347366333007812, 0.10894775390625, 0.11442184448242188, 0.11989593505859375, 0.12537002563476562, 0.1308441162109375, 0.13631820678710938, 0.14179229736328125, 0.14726638793945312, 0.152740478515625, 0.15821456909179688, 0.16368865966796875, 0.16916275024414062, 0.1746368408203125, 0.18011093139648438, 0.18558502197265625, 0.19105911254882812, 0.196533203125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 3.0, 4.0, 1.0, 15.0, 19.0, 84.0, 1540.0, 1046195.0, 611.0, 53.0, 18.0, 2.0, 7.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.546875, -18.0635986328125, -17.580322265625, -17.0970458984375, -16.61376953125, -16.1304931640625, -15.647216796875, -15.1639404296875, -14.6806640625, -14.1973876953125, -13.714111328125, -13.2308349609375, -12.74755859375, -12.2642822265625, -11.781005859375, -11.2977294921875, -10.814453125, -10.3311767578125, -9.847900390625, -9.3646240234375, -8.88134765625, -8.3980712890625, -7.914794921875, -7.4315185546875, -6.9482421875, -6.4649658203125, -5.981689453125, -5.4984130859375, -5.01513671875, -4.5318603515625, -4.048583984375, -3.5653076171875, -3.08203125, -2.5987548828125, -2.115478515625, -1.6322021484375, -1.14892578125, -0.6656494140625, -0.182373046875, 0.3009033203125, 0.7841796875, 1.2674560546875, 1.750732421875, 2.2340087890625, 2.71728515625, 3.2005615234375, 3.683837890625, 4.1671142578125, 4.650390625, 5.1336669921875, 5.616943359375, 6.1002197265625, 6.58349609375, 7.0667724609375, 7.550048828125, 8.0333251953125, 8.5166015625, 8.9998779296875, 9.483154296875, 9.9664306640625, 10.44970703125, 10.9329833984375, 11.416259765625, 11.8995361328125, 12.3828125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 5.0, 8.0, 8.0, 13.0, 10.0, 27.0, 28.0, 61.0, 77.0, 102.0, 118.0, 145.0, 123.0, 85.0, 61.0, 37.0, 28.0, 13.0, 9.0, 9.0, 3.0, 4.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.832050323486328e-05, -7.58785754442215e-05, -7.343664765357971e-05, -7.099471986293793e-05, -6.855279207229614e-05, -6.611086428165436e-05, -6.366893649101257e-05, -6.122700870037079e-05, -5.8785080909729004e-05, -5.634315311908722e-05, -5.3901225328445435e-05, -5.145929753780365e-05, -4.9017369747161865e-05, -4.657544195652008e-05, -4.4133514165878296e-05, -4.169158637523651e-05, -3.9249658584594727e-05, -3.680773079395294e-05, -3.436580300331116e-05, -3.192387521266937e-05, -2.9481947422027588e-05, -2.7040019631385803e-05, -2.459809184074402e-05, -2.2156164050102234e-05, -1.971423625946045e-05, -1.7272308468818665e-05, -1.483038067817688e-05, -1.2388452887535095e-05, -9.94652509689331e-06, -7.504597306251526e-06, -5.062669515609741e-06, -2.6207417249679565e-06, -1.7881393432617188e-07, 2.263113856315613e-06, 4.7050416469573975e-06, 7.146969437599182e-06, 9.588897228240967e-06, 1.2030825018882751e-05, 1.4472752809524536e-05, 1.691468060016632e-05, 1.9356608390808105e-05, 2.179853618144989e-05, 2.4240463972091675e-05, 2.668239176273346e-05, 2.9124319553375244e-05, 3.156624734401703e-05, 3.4008175134658813e-05, 3.64501029253006e-05, 3.889203071594238e-05, 4.133395850658417e-05, 4.377588629722595e-05, 4.621781408786774e-05, 4.865974187850952e-05, 5.1101669669151306e-05, 5.354359745979309e-05, 5.5985525250434875e-05, 5.842745304107666e-05, 6.0869380831718445e-05, 6.331130862236023e-05, 6.575323641300201e-05, 6.81951642036438e-05, 7.063709199428558e-05, 7.307901978492737e-05, 7.552094757556915e-05, 7.796287536621094e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 3.0, 8.0, 13.0, 6.0, 20.0, 11.0, 26.0, 36.0, 50.0, 124.0, 265.0, 718.0, 1908.0, 6035.0, 45918.0, 913218.0, 69709.0, 6758.0, 2118.0, 808.0, 361.0, 153.0, 87.0, 50.0, 46.0, 31.0, 20.0, 17.0, 15.0, 14.0, 6.0, 5.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.87353515625, -0.8288803100585938, -0.7842254638671875, -0.7395706176757812, -0.694915771484375, -0.6502609252929688, -0.6056060791015625, -0.5609512329101562, -0.51629638671875, -0.47164154052734375, -0.4269866943359375, -0.38233184814453125, -0.337677001953125, -0.29302215576171875, -0.2483673095703125, -0.20371246337890625, -0.1590576171875, -0.11440277099609375, -0.0697479248046875, -0.02509307861328125, 0.019561767578125, 0.06421661376953125, 0.1088714599609375, 0.15352630615234375, 0.19818115234375, 0.24283599853515625, 0.2874908447265625, 0.33214569091796875, 0.376800537109375, 0.42145538330078125, 0.4661102294921875, 0.5107650756835938, 0.555419921875, 0.6000747680664062, 0.6447296142578125, 0.6893844604492188, 0.734039306640625, 0.7786941528320312, 0.8233489990234375, 0.8680038452148438, 0.91265869140625, 0.9573135375976562, 1.0019683837890625, 1.0466232299804688, 1.091278076171875, 1.1359329223632812, 1.1805877685546875, 1.2252426147460938, 1.2698974609375, 1.3145523071289062, 1.3592071533203125, 1.4038619995117188, 1.448516845703125, 1.4931716918945312, 1.5378265380859375, 1.5824813842773438, 1.62713623046875, 1.6717910766601562, 1.7164459228515625, 1.7611007690429688, 1.805755615234375, 1.8504104614257812, 1.8950653076171875, 1.9397201538085938, 1.984375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 6.0, 1.0, 5.0, 7.0, 25.0, 64.0, 157.0, 285.0, 267.0, 114.0, 47.0, 6.0, 6.0, 1.0, 3.0, 3.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.54541015625, -0.5109176635742188, -0.4764251708984375, -0.44193267822265625, -0.407440185546875, -0.37294769287109375, -0.3384552001953125, -0.30396270751953125, -0.26947021484375, -0.23497772216796875, -0.2004852294921875, -0.16599273681640625, -0.131500244140625, -0.09700775146484375, -0.0625152587890625, -0.02802276611328125, 0.0064697265625, 0.04096221923828125, 0.0754547119140625, 0.10994720458984375, 0.144439697265625, 0.17893218994140625, 0.2134246826171875, 0.24791717529296875, 0.28240966796875, 0.31690216064453125, 0.3513946533203125, 0.38588714599609375, 0.420379638671875, 0.45487213134765625, 0.4893646240234375, 0.5238571166992188, 0.558349609375, 0.5928421020507812, 0.6273345947265625, 0.6618270874023438, 0.696319580078125, 0.7308120727539062, 0.7653045654296875, 0.7997970581054688, 0.83428955078125, 0.8687820434570312, 0.9032745361328125, 0.9377670288085938, 0.972259521484375, 1.0067520141601562, 1.0412445068359375, 1.0757369995117188, 1.1102294921875, 1.1447219848632812, 1.1792144775390625, 1.2137069702148438, 1.248199462890625, 1.2826919555664062, 1.3171844482421875, 1.3516769409179688, 1.38616943359375, 1.4206619262695312, 1.4551544189453125, 1.4896469116210938, 1.524139404296875, 1.5586318969726562, 1.5931243896484375, 1.6276168823242188, 1.662109375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 14.0, 31.0, 188.0, 387.0, 236.0, 77.0, 32.0, 21.0, 7.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.526920318603516, -8.286758422851562, -8.046595573425293, -7.80643367767334, -7.566271781921387, -7.326109409332275, -7.085947513580322, -6.845785140991211, -6.605623245239258, -6.3654608726501465, -6.125298976898193, -5.885136604309082, -5.644974708557129, -5.404812335968018, -5.1646504402160645, -4.924488067626953, -4.684326171875, -4.444163799285889, -4.2040019035339355, -3.9638397693634033, -3.723677635192871, -3.4835152626037598, -3.2433533668518066, -3.0031909942626953, -2.763028621673584, -2.5228664875030518, -2.2827043533325195, -2.0425422191619873, -1.802380084991455, -1.5622178316116333, -1.322055697441101, -1.0818935632705688, -0.8417315483093262, -0.601569414138794, -0.36140725016593933, -0.12124508619308472, 0.11891704797744751, 0.3590792417526245, 0.5992413759231567, 0.839403510093689, 1.0795656442642212, 1.3197277784347534, 1.5598899126052856, 1.8000521659851074, 2.0402143001556396, 2.280376434326172, 2.520538568496704, 2.7607007026672363, 3.0008628368377686, 3.241024971008301, 3.481187105178833, 3.7213492393493652, 3.9615113735198975, 4.20167350769043, 4.441835880279541, 4.681997776031494, 4.9221601486206055, 5.162322521209717, 5.40248441696167, 5.642646789550781, 5.882808685302734, 6.122971057891846, 6.363132953643799, 6.60329532623291, 6.843457221984863]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 1.0, 2.0, 5.0, 7.0, 9.0, 8.0, 11.0, 20.0, 18.0, 31.0, 34.0, 55.0, 70.0, 65.0, 83.0, 76.0, 67.0, 88.0, 73.0, 63.0, 42.0, 33.0, 42.0, 23.0, 19.0, 18.0, 11.0, 9.0, 5.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.629892110824585, -2.548163890838623, -2.4664359092712402, -2.3847079277038574, -2.3029797077178955, -2.2212514877319336, -2.139523506164551, -2.057795524597168, -1.976067304611206, -1.8943392038345337, -1.8126111030578613, -1.730883002281189, -1.6491549015045166, -1.5674268007278442, -1.4856986999511719, -1.4039705991744995, -1.3222424983978271, -1.2405143976211548, -1.1587862968444824, -1.07705819606781, -0.9953300952911377, -0.9136019945144653, -0.831873893737793, -0.7501457929611206, -0.6684176921844482, -0.5866895914077759, -0.5049614906311035, -0.42323338985443115, -0.3415052890777588, -0.2597771883010864, -0.17804908752441406, -0.0963209867477417, -0.014593124389648438, 0.06713497638702393, 0.1488630771636963, 0.23059117794036865, 0.312319278717041, 0.3940473794937134, 0.47577548027038574, 0.5575035810470581, 0.6392316818237305, 0.7209597826004028, 0.8026878833770752, 0.8844159841537476, 0.9661440849304199, 1.0478721857070923, 1.1296002864837646, 1.211328387260437, 1.2930564880371094, 1.3747845888137817, 1.456512689590454, 1.5382407903671265, 1.6199688911437988, 1.7016969919204712, 1.7834250926971436, 1.865153193473816, 1.9468812942504883, 2.028609275817871, 2.110337495803833, 2.192065715789795, 2.2737936973571777, 2.3555216789245605, 2.4372498989105225, 2.5189781188964844, 2.600706100463867]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 5.0, 4.0, 4.0, 7.0, 10.0, 12.0, 19.0, 13.0, 28.0, 46.0, 44.0, 83.0, 134.0, 188.0, 317.0, 522.0, 938.0, 1934.0, 4007.0, 9714.0, 32197.0, 294030.0, 3717476.0, 99711.0, 19624.0, 6815.0, 2859.0, 1463.0, 788.0, 474.0, 290.0, 182.0, 130.0, 74.0, 42.0, 37.0, 28.0, 9.0, 10.0, 9.0, 6.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.1875, -1.15386962890625, -1.1202392578125, -1.08660888671875, -1.052978515625, -1.01934814453125, -0.9857177734375, -0.95208740234375, -0.91845703125, -0.88482666015625, -0.8511962890625, -0.81756591796875, -0.783935546875, -0.75030517578125, -0.7166748046875, -0.68304443359375, -0.6494140625, -0.61578369140625, -0.5821533203125, -0.54852294921875, -0.514892578125, -0.48126220703125, -0.4476318359375, -0.41400146484375, -0.38037109375, -0.34674072265625, -0.3131103515625, -0.27947998046875, -0.245849609375, -0.21221923828125, -0.1785888671875, -0.14495849609375, -0.111328125, -0.07769775390625, -0.0440673828125, -0.01043701171875, 0.023193359375, 0.05682373046875, 0.0904541015625, 0.12408447265625, 0.15771484375, 0.19134521484375, 0.2249755859375, 0.25860595703125, 0.292236328125, 0.32586669921875, 0.3594970703125, 0.39312744140625, 0.4267578125, 0.46038818359375, 0.4940185546875, 0.52764892578125, 0.561279296875, 0.59490966796875, 0.6285400390625, 0.66217041015625, 0.69580078125, 0.72943115234375, 0.7630615234375, 0.79669189453125, 0.830322265625, 0.86395263671875, 0.8975830078125, 0.93121337890625, 0.96484375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 5.0, 10.0, 7.0, 10.0, 16.0, 26.0, 36.0, 49.0, 46.0, 56.0, 74.0, 93.0, 99.0, 83.0, 79.0, 76.0, 61.0, 49.0, 35.0, 26.0, 12.0, 10.0, 9.0, 9.0, 7.0, 6.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.055877685546875, -0.054355621337890625, -0.05283355712890625, -0.051311492919921875, -0.0497894287109375, -0.048267364501953125, -0.04674530029296875, -0.045223236083984375, -0.043701171875, -0.042179107666015625, -0.04065704345703125, -0.039134979248046875, -0.0376129150390625, -0.036090850830078125, -0.03456878662109375, -0.033046722412109375, -0.031524658203125, -0.030002593994140625, -0.02848052978515625, -0.026958465576171875, -0.0254364013671875, -0.023914337158203125, -0.02239227294921875, -0.020870208740234375, -0.01934814453125, -0.017826080322265625, -0.01630401611328125, -0.014781951904296875, -0.0132598876953125, -0.011737823486328125, -0.01021575927734375, -0.008693695068359375, -0.007171630859375, -0.005649566650390625, -0.00412750244140625, -0.002605438232421875, -0.0010833740234375, 0.000438690185546875, 0.00196075439453125, 0.003482818603515625, 0.0050048828125, 0.006526947021484375, 0.00804901123046875, 0.009571075439453125, 0.0110931396484375, 0.012615203857421875, 0.01413726806640625, 0.015659332275390625, 0.017181396484375, 0.018703460693359375, 0.02022552490234375, 0.021747589111328125, 0.0232696533203125, 0.024791717529296875, 0.02631378173828125, 0.027835845947265625, 0.02935791015625, 0.030879974365234375, 0.03240203857421875, 0.033924102783203125, 0.0354461669921875, 0.036968231201171875, 0.03849029541015625, 0.040012359619140625, 0.041534423828125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 7.0, 1.0, 2.0, 9.0, 2.0, 9.0, 7.0, 13.0, 8.0, 15.0, 10.0, 16.0, 14.0, 24.0, 34.0, 48.0, 82.0, 186.0, 554.0, 3230.0, 33016.0, 3285016.0, 849088.0, 19710.0, 2172.0, 479.0, 162.0, 105.0, 59.0, 44.0, 37.0, 25.0, 13.0, 14.0, 10.0, 5.0, 12.0, 10.0, 4.0, 6.0, 6.0, 9.0, 3.0, 1.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-2.01953125, -1.961669921875, -1.90380859375, -1.845947265625, -1.7880859375, -1.730224609375, -1.67236328125, -1.614501953125, -1.556640625, -1.498779296875, -1.44091796875, -1.383056640625, -1.3251953125, -1.267333984375, -1.20947265625, -1.151611328125, -1.09375, -1.035888671875, -0.97802734375, -0.920166015625, -0.8623046875, -0.804443359375, -0.74658203125, -0.688720703125, -0.630859375, -0.572998046875, -0.51513671875, -0.457275390625, -0.3994140625, -0.341552734375, -0.28369140625, -0.225830078125, -0.16796875, -0.110107421875, -0.05224609375, 0.005615234375, 0.0634765625, 0.121337890625, 0.17919921875, 0.237060546875, 0.294921875, 0.352783203125, 0.41064453125, 0.468505859375, 0.5263671875, 0.584228515625, 0.64208984375, 0.699951171875, 0.7578125, 0.815673828125, 0.87353515625, 0.931396484375, 0.9892578125, 1.047119140625, 1.10498046875, 1.162841796875, 1.220703125, 1.278564453125, 1.33642578125, 1.394287109375, 1.4521484375, 1.510009765625, 1.56787109375, 1.625732421875, 1.68359375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 3.0, 4.0, 5.0, 6.0, 9.0, 11.0, 12.0, 19.0, 30.0, 20.0, 32.0, 49.0, 60.0, 90.0, 161.0, 251.0, 504.0, 1016.0, 784.0, 379.0, 241.0, 114.0, 66.0, 46.0, 38.0, 17.0, 21.0, 18.0, 13.0, 11.0, 13.0, 12.0, 4.0, 5.0, 3.0, 3.0, 4.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10009765625, -0.09705257415771484, -0.09400749206542969, -0.09096240997314453, -0.08791732788085938, -0.08487224578857422, -0.08182716369628906, -0.0787820816040039, -0.07573699951171875, -0.0726919174194336, -0.06964683532714844, -0.06660175323486328, -0.06355667114257812, -0.06051158905029297, -0.05746650695800781, -0.054421424865722656, -0.0513763427734375, -0.048331260681152344, -0.04528617858886719, -0.04224109649658203, -0.039196014404296875, -0.03615093231201172, -0.03310585021972656, -0.030060768127441406, -0.02701568603515625, -0.023970603942871094, -0.020925521850585938, -0.01788043975830078, -0.014835357666015625, -0.011790275573730469, -0.008745193481445312, -0.005700111389160156, -0.002655029296875, 0.00039005279541015625, 0.0034351348876953125, 0.006480216979980469, 0.009525299072265625, 0.012570381164550781, 0.015615463256835938, 0.018660545349121094, 0.02170562744140625, 0.024750709533691406, 0.027795791625976562, 0.03084087371826172, 0.033885955810546875, 0.03693103790283203, 0.03997611999511719, 0.043021202087402344, 0.0460662841796875, 0.049111366271972656, 0.05215644836425781, 0.05520153045654297, 0.058246612548828125, 0.06129169464111328, 0.06433677673339844, 0.0673818588256836, 0.07042694091796875, 0.0734720230102539, 0.07651710510253906, 0.07956218719482422, 0.08260726928710938, 0.08565235137939453, 0.08869743347167969, 0.09174251556396484, 0.09478759765625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 6.0, 13.0, 65.0, 239.0, 405.0, 214.0, 49.0, 16.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.727738857269287, -3.654149293899536, -3.5805599689483643, -3.5069704055786133, -3.4333808422088623, -3.3597915172576904, -3.2862019538879395, -3.2126126289367676, -3.1390230655670166, -3.0654335021972656, -2.9918441772460938, -2.9182546138763428, -2.844665050506592, -2.77107572555542, -2.697486162185669, -2.623896598815918, -2.550307273864746, -2.476717710494995, -2.4031283855438232, -2.3295388221740723, -2.2559492588043213, -2.1823599338531494, -2.1087703704833984, -2.0351810455322266, -1.9615912437438965, -1.888001799583435, -1.814412236213684, -1.7408227920532227, -1.6672333478927612, -1.5936439037322998, -1.5200543403625488, -1.4464648962020874, -1.372875452041626, -1.2992860078811646, -1.2256964445114136, -1.1521070003509521, -1.0785175561904907, -1.0049281120300293, -0.9313385486602783, -0.8577491044998169, -0.7841596603393555, -0.7105701565742493, -0.6369807124137878, -0.5633912086486816, -0.4898017346858978, -0.416212260723114, -0.3426227569580078, -0.2690333127975464, -0.19544380903244019, -0.12185432761907578, -0.048264846205711365, 0.025324642658233643, 0.09891411662101746, 0.17250359058380127, 0.24609309434890747, 0.3196825385093689, 0.3932720422744751, 0.4668615162372589, 0.5404509902000427, 0.6140404939651489, 0.6876299381256104, 0.7612194418907166, 0.8348089456558228, 0.9083983898162842, 0.9819878935813904]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 5.0, 6.0, 6.0, 9.0, 12.0, 17.0, 15.0, 17.0, 32.0, 31.0, 47.0, 57.0, 55.0, 78.0, 64.0, 64.0, 79.0, 61.0, 65.0, 67.0, 54.0, 42.0, 34.0, 22.0, 12.0, 22.0, 11.0, 5.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41616570949554443, -0.39932334423065186, -0.38248100876808167, -0.3656386435031891, -0.3487963080406189, -0.3319539427757263, -0.31511157751083374, -0.29826921224594116, -0.28142687678337097, -0.2645845115184784, -0.2477421760559082, -0.23089981079101562, -0.21405746042728424, -0.19721511006355286, -0.18037274479866028, -0.1635303944349289, -0.1466880440711975, -0.12984569370746613, -0.11300333589315414, -0.09616097807884216, -0.07931862771511078, -0.062476277351379395, -0.04563391953706741, -0.028791561722755432, -0.011949211359024048, 0.004893142729997635, 0.021735496819019318, 0.038577850908041, 0.05542020499706268, 0.07226255536079407, 0.08910491317510605, 0.10594727098941803, 0.12278968095779419, 0.13963203132152557, 0.15647438168525696, 0.17331674695014954, 0.19015909731388092, 0.2070014476776123, 0.22384381294250488, 0.24068616330623627, 0.25752851366996765, 0.27437087893486023, 0.2912132143974304, 0.308055579662323, 0.3248979449272156, 0.34174028038978577, 0.35858264565467834, 0.37542498111724854, 0.3922673463821411, 0.4091097116470337, 0.4259520471096039, 0.44279441237449646, 0.45963674783706665, 0.47647911310195923, 0.4933214783668518, 0.5101638436317444, 0.5270061492919922, 0.5438485145568848, 0.5606908798217773, 0.5775331854820251, 0.5943755507469177, 0.6112179160118103, 0.6280602812767029, 0.6449026465415955, 0.661745011806488]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 2.0, 6.0, 8.0, 9.0, 18.0, 21.0, 29.0, 49.0, 38.0, 55.0, 58.0, 139.0, 1873.0, 491584.0, 552162.0, 2021.0, 161.0, 74.0, 58.0, 35.0, 42.0, 29.0, 22.0, 16.0, 14.0, 8.0, 4.0, 7.0, 7.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.609375, -2.53265380859375, -2.4559326171875, -2.37921142578125, -2.302490234375, -2.22576904296875, -2.1490478515625, -2.07232666015625, -1.99560546875, -1.91888427734375, -1.8421630859375, -1.76544189453125, -1.688720703125, -1.61199951171875, -1.5352783203125, -1.45855712890625, -1.3818359375, -1.30511474609375, -1.2283935546875, -1.15167236328125, -1.074951171875, -0.99822998046875, -0.9215087890625, -0.84478759765625, -0.76806640625, -0.69134521484375, -0.6146240234375, -0.53790283203125, -0.461181640625, -0.38446044921875, -0.3077392578125, -0.23101806640625, -0.154296875, -0.07757568359375, -0.0008544921875, 0.07586669921875, 0.152587890625, 0.22930908203125, 0.3060302734375, 0.38275146484375, 0.45947265625, 0.53619384765625, 0.6129150390625, 0.68963623046875, 0.766357421875, 0.84307861328125, 0.9197998046875, 0.99652099609375, 1.0732421875, 1.14996337890625, 1.2266845703125, 1.30340576171875, 1.380126953125, 1.45684814453125, 1.5335693359375, 1.61029052734375, 1.68701171875, 1.76373291015625, 1.8404541015625, 1.91717529296875, 1.993896484375, 2.07061767578125, 2.1473388671875, 2.22406005859375, 2.30078125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 7.0, 10.0, 21.0, 60.0, 82.0, 126.0, 175.0, 171.0, 134.0, 97.0, 64.0, 34.0, 9.0, 8.0, 5.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.042449951171875, -0.03945016860961914, -0.03645038604736328, -0.03345060348510742, -0.030450820922851562, -0.027451038360595703, -0.024451255798339844, -0.021451473236083984, -0.018451690673828125, -0.015451908111572266, -0.012452125549316406, -0.009452342987060547, -0.0064525604248046875, -0.003452777862548828, -0.00045299530029296875, 0.0025467872619628906, 0.00554656982421875, 0.00854635238647461, 0.011546134948730469, 0.014545917510986328, 0.017545700073242188, 0.020545482635498047, 0.023545265197753906, 0.026545047760009766, 0.029544830322265625, 0.032544612884521484, 0.035544395446777344, 0.0385441780090332, 0.04154396057128906, 0.04454374313354492, 0.04754352569580078, 0.05054330825805664, 0.0535430908203125, 0.05654287338256836, 0.05954265594482422, 0.06254243850708008, 0.06554222106933594, 0.0685420036315918, 0.07154178619384766, 0.07454156875610352, 0.07754135131835938, 0.08054113388061523, 0.0835409164428711, 0.08654069900512695, 0.08954048156738281, 0.09254026412963867, 0.09554004669189453, 0.09853982925415039, 0.10153961181640625, 0.10453939437866211, 0.10753917694091797, 0.11053895950317383, 0.11353874206542969, 0.11653852462768555, 0.1195383071899414, 0.12253808975219727, 0.12553787231445312, 0.12853765487670898, 0.13153743743896484, 0.1345372200012207, 0.13753700256347656, 0.14053678512573242, 0.14353656768798828, 0.14653635025024414, 0.1495361328125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 5.0, 2.0, 11.0, 11.0, 15.0, 15.0, 25.0, 33.0, 36.0, 71.0, 112.0, 158.0, 290.0, 437.0, 871.0, 1783.0, 4181.0, 10585.0, 31701.0, 97359.0, 257470.0, 351644.0, 190408.0, 65949.0, 21622.0, 7532.0, 3170.0, 1309.0, 715.0, 369.0, 238.0, 139.0, 80.0, 70.0, 38.0, 33.0, 17.0, 17.0, 5.0, 8.0, 5.0, 5.0, 4.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.45849609375, -0.4447364807128906, -0.43097686767578125, -0.4172172546386719, -0.4034576416015625, -0.3896980285644531, -0.37593841552734375, -0.3621788024902344, -0.348419189453125, -0.3346595764160156, -0.32089996337890625, -0.3071403503417969, -0.2933807373046875, -0.2796211242675781, -0.26586151123046875, -0.2521018981933594, -0.23834228515625, -0.22458267211914062, -0.21082305908203125, -0.19706344604492188, -0.1833038330078125, -0.16954421997070312, -0.15578460693359375, -0.14202499389648438, -0.128265380859375, -0.11450576782226562, -0.10074615478515625, -0.08698654174804688, -0.0732269287109375, -0.059467315673828125, -0.04570770263671875, -0.031948089599609375, -0.0181884765625, -0.004428863525390625, 0.00933074951171875, 0.023090362548828125, 0.0368499755859375, 0.050609588623046875, 0.06436920166015625, 0.07812881469726562, 0.091888427734375, 0.10564804077148438, 0.11940765380859375, 0.13316726684570312, 0.1469268798828125, 0.16068649291992188, 0.17444610595703125, 0.18820571899414062, 0.20196533203125, 0.21572494506835938, 0.22948455810546875, 0.24324417114257812, 0.2570037841796875, 0.2707633972167969, 0.28452301025390625, 0.2982826232910156, 0.312042236328125, 0.3258018493652344, 0.33956146240234375, 0.3533210754394531, 0.3670806884765625, 0.3808403015136719, 0.39459991455078125, 0.4083595275878906, 0.422119140625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 6.0, 5.0, 3.0, 2.0, 6.0, 3.0, 6.0, 7.0, 13.0, 9.0, 26.0, 19.0, 23.0, 28.0, 36.0, 34.0, 32.0, 43.0, 47.0, 55.0, 47.0, 48.0, 53.0, 46.0, 42.0, 45.0, 43.0, 41.0, 30.0, 40.0, 31.0, 24.0, 16.0, 19.0, 21.0, 12.0, 9.0, 6.0, 11.0, 6.0, 8.0, 2.0, 6.0, 0.0, 5.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.2210693359375, -0.21459579467773438, -0.20812225341796875, -0.20164871215820312, -0.1951751708984375, -0.18870162963867188, -0.18222808837890625, -0.17575454711914062, -0.169281005859375, -0.16280746459960938, -0.15633392333984375, -0.14986038208007812, -0.1433868408203125, -0.13691329956054688, -0.13043975830078125, -0.12396621704101562, -0.11749267578125, -0.11101913452148438, -0.10454559326171875, -0.09807205200195312, -0.0915985107421875, -0.08512496948242188, -0.07865142822265625, -0.07217788696289062, -0.065704345703125, -0.059230804443359375, -0.05275726318359375, -0.046283721923828125, -0.0398101806640625, -0.033336639404296875, -0.02686309814453125, -0.020389556884765625, -0.013916015625, -0.007442474365234375, -0.00096893310546875, 0.005504608154296875, 0.0119781494140625, 0.018451690673828125, 0.02492523193359375, 0.031398773193359375, 0.037872314453125, 0.044345855712890625, 0.05081939697265625, 0.057292938232421875, 0.0637664794921875, 0.07024002075195312, 0.07671356201171875, 0.08318710327148438, 0.08966064453125, 0.09613418579101562, 0.10260772705078125, 0.10908126831054688, 0.1155548095703125, 0.12202835083007812, 0.12850189208984375, 0.13497543334960938, 0.141448974609375, 0.14792251586914062, 0.15439605712890625, 0.16086959838867188, 0.1673431396484375, 0.17381668090820312, 0.18029022216796875, 0.18676376342773438, 0.1932373046875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 3.0, 5.0, 10.0, 3.0, 4.0, 9.0, 8.0, 11.0, 14.0, 18.0, 34.0, 35.0, 63.0, 106.0, 187.0, 329.0, 591.0, 1352.0, 3212.0, 9622.0, 37998.0, 210187.0, 558576.0, 178843.0, 32943.0, 8726.0, 3033.0, 1274.0, 570.0, 322.0, 159.0, 99.0, 56.0, 43.0, 23.0, 37.0, 13.0, 10.0, 10.0, 3.0, 4.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.57275390625, -0.555633544921875, -0.53851318359375, -0.521392822265625, -0.5042724609375, -0.487152099609375, -0.47003173828125, -0.452911376953125, -0.435791015625, -0.418670654296875, -0.40155029296875, -0.384429931640625, -0.3673095703125, -0.350189208984375, -0.33306884765625, -0.315948486328125, -0.298828125, -0.281707763671875, -0.26458740234375, -0.247467041015625, -0.2303466796875, -0.213226318359375, -0.19610595703125, -0.178985595703125, -0.161865234375, -0.144744873046875, -0.12762451171875, -0.110504150390625, -0.0933837890625, -0.076263427734375, -0.05914306640625, -0.042022705078125, -0.02490234375, -0.007781982421875, 0.00933837890625, 0.026458740234375, 0.0435791015625, 0.060699462890625, 0.07781982421875, 0.094940185546875, 0.112060546875, 0.129180908203125, 0.14630126953125, 0.163421630859375, 0.1805419921875, 0.197662353515625, 0.21478271484375, 0.231903076171875, 0.2490234375, 0.266143798828125, 0.28326416015625, 0.300384521484375, 0.3175048828125, 0.334625244140625, 0.35174560546875, 0.368865966796875, 0.385986328125, 0.403106689453125, 0.42022705078125, 0.437347412109375, 0.4544677734375, 0.471588134765625, 0.48870849609375, 0.505828857421875, 0.52294921875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 5.0, 11.0, 9.0, 17.0, 22.0, 40.0, 54.0, 82.0, 120.0, 129.0, 137.0, 114.0, 88.0, 53.0, 42.0, 26.0, 18.0, 14.0, 9.0, 7.0, 1.0, 7.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.508827209472656e-05, -6.214901804924011e-05, -5.920976400375366e-05, -5.627050995826721e-05, -5.333125591278076e-05, -5.039200186729431e-05, -4.745274782180786e-05, -4.451349377632141e-05, -4.157423973083496e-05, -3.863498568534851e-05, -3.569573163986206e-05, -3.275647759437561e-05, -2.981722354888916e-05, -2.687796950340271e-05, -2.393871545791626e-05, -2.099946141242981e-05, -1.806020736694336e-05, -1.512095332145691e-05, -1.2181699275970459e-05, -9.242445230484009e-06, -6.303191184997559e-06, -3.3639371395111084e-06, -4.246830940246582e-07, 2.514570951461792e-06, 5.453824996948242e-06, 8.393079042434692e-06, 1.1332333087921143e-05, 1.4271587133407593e-05, 1.7210841178894043e-05, 2.0150095224380493e-05, 2.3089349269866943e-05, 2.6028603315353394e-05, 2.8967857360839844e-05, 3.1907111406326294e-05, 3.4846365451812744e-05, 3.7785619497299194e-05, 4.0724873542785645e-05, 4.3664127588272095e-05, 4.6603381633758545e-05, 4.9542635679244995e-05, 5.2481889724731445e-05, 5.5421143770217896e-05, 5.8360397815704346e-05, 6.12996518611908e-05, 6.423890590667725e-05, 6.71781599521637e-05, 7.011741399765015e-05, 7.30566680431366e-05, 7.599592208862305e-05, 7.89351761341095e-05, 8.187443017959595e-05, 8.48136842250824e-05, 8.775293827056885e-05, 9.06921923160553e-05, 9.363144636154175e-05, 9.65707004070282e-05, 9.950995445251465e-05, 0.0001024492084980011, 0.00010538846254348755, 0.000108327716588974, 0.00011126697063446045, 0.0001142062246799469, 0.00011714547872543335, 0.0001200847327709198, 0.00012302398681640625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 4.0, 4.0, 2.0, 8.0, 6.0, 15.0, 21.0, 41.0, 46.0, 88.0, 143.0, 228.0, 504.0, 1015.0, 2640.0, 8468.0, 44524.0, 597169.0, 356168.0, 27498.0, 6186.0, 2034.0, 799.0, 406.0, 217.0, 120.0, 68.0, 46.0, 39.0, 17.0, 8.0, 4.0, 6.0, 5.0, 2.0, 6.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.76220703125, -0.7315750122070312, -0.7009429931640625, -0.6703109741210938, -0.639678955078125, -0.6090469360351562, -0.5784149169921875, -0.5477828979492188, -0.51715087890625, -0.48651885986328125, -0.4558868408203125, -0.42525482177734375, -0.394622802734375, -0.36399078369140625, -0.3333587646484375, -0.30272674560546875, -0.2720947265625, -0.24146270751953125, -0.2108306884765625, -0.18019866943359375, -0.149566650390625, -0.11893463134765625, -0.0883026123046875, -0.05767059326171875, -0.02703857421875, 0.00359344482421875, 0.0342254638671875, 0.06485748291015625, 0.095489501953125, 0.12612152099609375, 0.1567535400390625, 0.18738555908203125, 0.218017578125, 0.24864959716796875, 0.2792816162109375, 0.30991363525390625, 0.340545654296875, 0.37117767333984375, 0.4018096923828125, 0.43244171142578125, 0.46307373046875, 0.49370574951171875, 0.5243377685546875, 0.5549697875976562, 0.585601806640625, 0.6162338256835938, 0.6468658447265625, 0.6774978637695312, 0.7081298828125, 0.7387619018554688, 0.7693939208984375, 0.8000259399414062, 0.830657958984375, 0.8612899780273438, 0.8919219970703125, 0.9225540161132812, 0.95318603515625, 0.9838180541992188, 1.0144500732421875, 1.0450820922851562, 1.075714111328125, 1.1063461303710938, 1.1369781494140625, 1.1676101684570312, 1.1982421875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 7.0, 5.0, 4.0, 2.0, 8.0, 15.0, 8.0, 11.0, 19.0, 21.0, 53.0, 76.0, 79.0, 111.0, 132.0, 110.0, 95.0, 83.0, 48.0, 40.0, 21.0, 14.0, 10.0, 9.0, 2.0, 5.0, 3.0, 2.0, 2.0, 1.0, 3.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.443115234375, -0.43135833740234375, -0.4196014404296875, -0.40784454345703125, -0.396087646484375, -0.38433074951171875, -0.3725738525390625, -0.36081695556640625, -0.34906005859375, -0.33730316162109375, -0.3255462646484375, -0.31378936767578125, -0.302032470703125, -0.29027557373046875, -0.2785186767578125, -0.26676177978515625, -0.2550048828125, -0.24324798583984375, -0.2314910888671875, -0.21973419189453125, -0.207977294921875, -0.19622039794921875, -0.1844635009765625, -0.17270660400390625, -0.16094970703125, -0.14919281005859375, -0.1374359130859375, -0.12567901611328125, -0.113922119140625, -0.10216522216796875, -0.0904083251953125, -0.07865142822265625, -0.06689453125, -0.05513763427734375, -0.0433807373046875, -0.03162384033203125, -0.019866943359375, -0.00811004638671875, 0.0036468505859375, 0.01540374755859375, 0.02716064453125, 0.03891754150390625, 0.0506744384765625, 0.06243133544921875, 0.074188232421875, 0.08594512939453125, 0.0977020263671875, 0.10945892333984375, 0.1212158203125, 0.13297271728515625, 0.1447296142578125, 0.15648651123046875, 0.168243408203125, 0.18000030517578125, 0.1917572021484375, 0.20351409912109375, 0.21527099609375, 0.22702789306640625, 0.2387847900390625, 0.25054168701171875, 0.262298583984375, 0.27405548095703125, 0.2858123779296875, 0.29756927490234375, 0.309326171875]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 3.0, 9.0, 12.0, 30.0, 62.0, 189.0, 315.0, 244.0, 104.0, 24.0, 11.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.983085632324219, -5.730259418487549, -5.477432727813721, -5.224606513977051, -4.971779823303223, -4.718953609466553, -4.466127395629883, -4.213300704956055, -3.9604744911193848, -3.7076480388641357, -3.4548215866088867, -3.201995372772217, -2.9491689205169678, -2.6963424682617188, -2.443516254425049, -2.1906898021698, -1.9378633499145508, -1.6850368976593018, -1.4322105646133423, -1.1793842315673828, -0.9265577793121338, -0.6737313270568848, -0.4209049940109253, -0.16807866096496582, 0.0847477912902832, 0.33757418394088745, 0.5904005765914917, 0.843226969242096, 1.0960533618927002, 1.3488798141479492, 1.6017061471939087, 1.8545324802398682, 2.107358932495117, 2.360185384750366, 2.6130118370056152, 2.865838050842285, 3.118664503097534, 3.371490955352783, 3.624317169189453, 3.877143621444702, 4.129970073699951, 4.382796287536621, 4.635622978210449, 4.888449192047119, 5.141275405883789, 5.394102096557617, 5.646928310394287, 5.899754524230957, 6.152581214904785, 6.405407428741455, 6.658234119415283, 6.911060333251953, 7.163887023925781, 7.416713237762451, 7.669539451599121, 7.922366142272949, 8.175191879272461, 8.428018569946289, 8.6808443069458, 8.933670997619629, 9.186497688293457, 9.439323425292969, 9.692150115966797, 9.944976806640625, 10.197803497314453]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 10.0, 25.0, 57.0, 74.0, 99.0, 139.0, 134.0, 139.0, 115.0, 91.0, 63.0, 38.0, 16.0, 10.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6718108654022217, -1.534712314605713, -1.397613763809204, -1.2605152130126953, -1.1234166622161865, -0.9863181114196777, -0.849219560623169, -0.7121210098266602, -0.5750224590301514, -0.4379239082336426, -0.3008253574371338, -0.163726806640625, -0.02662825584411621, 0.11047029495239258, 0.24756884574890137, 0.38466739654541016, 0.521765947341919, 0.6588644981384277, 0.7959630489349365, 0.9330615997314453, 1.070160150527954, 1.207258701324463, 1.3443572521209717, 1.4814558029174805, 1.6185543537139893, 1.755652904510498, 1.8927514553070068, 2.0298500061035156, 2.1669485569000244, 2.304047107696533, 2.441145658493042, 2.578244209289551, 2.7153429985046387, 2.8524415493011475, 2.9895401000976562, 3.126638650894165, 3.263737201690674, 3.4008357524871826, 3.5379343032836914, 3.6750328540802, 3.812131404876709, 3.9492299556732178, 4.086328506469727, 4.223426818847656, 4.360525608062744, 4.497624397277832, 4.634722709655762, 4.771821022033691, 4.908919811248779, 5.046018600463867, 5.183116912841797, 5.320215225219727, 5.4573140144348145, 5.594412803649902, 5.731511116027832, 5.868609428405762, 6.00570821762085, 6.1428070068359375, 6.279905319213867, 6.417003631591797, 6.554102420806885, 6.691201210021973, 6.828299522399902, 6.965397834777832, 7.10249662399292]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 14.0, 22.0, 72.0, 167.0, 691.0, 17208.0, 4157771.0, 16905.0, 775.0, 243.0, 116.0, 79.0, 40.0, 33.0, 39.0, 25.0, 22.0, 16.0, 12.0, 8.0, 5.0, 4.0, 7.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.17578125, -3.02093505859375, -2.8660888671875, -2.71124267578125, -2.556396484375, -2.40155029296875, -2.2467041015625, -2.09185791015625, -1.93701171875, -1.78216552734375, -1.6273193359375, -1.47247314453125, -1.317626953125, -1.16278076171875, -1.0079345703125, -0.85308837890625, -0.6982421875, -0.54339599609375, -0.3885498046875, -0.23370361328125, -0.078857421875, 0.07598876953125, 0.2308349609375, 0.38568115234375, 0.54052734375, 0.69537353515625, 0.8502197265625, 1.00506591796875, 1.159912109375, 1.31475830078125, 1.4696044921875, 1.62445068359375, 1.779296875, 1.93414306640625, 2.0889892578125, 2.24383544921875, 2.398681640625, 2.55352783203125, 2.7083740234375, 2.86322021484375, 3.01806640625, 3.17291259765625, 3.3277587890625, 3.48260498046875, 3.637451171875, 3.79229736328125, 3.9471435546875, 4.10198974609375, 4.2568359375, 4.41168212890625, 4.5665283203125, 4.72137451171875, 4.876220703125, 5.03106689453125, 5.1859130859375, 5.34075927734375, 5.49560546875, 5.65045166015625, 5.8052978515625, 5.96014404296875, 6.114990234375, 6.26983642578125, 6.4246826171875, 6.57952880859375, 6.734375]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 11.0, 16.0, 44.0, 67.0, 99.0, 186.0, 167.0, 157.0, 121.0, 76.0, 33.0, 17.0, 8.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.083984375, -0.07967758178710938, -0.07537078857421875, -0.07106399536132812, -0.0667572021484375, -0.062450408935546875, -0.05814361572265625, -0.053836822509765625, -0.049530029296875, -0.045223236083984375, -0.04091644287109375, -0.036609649658203125, -0.0323028564453125, -0.027996063232421875, -0.02368927001953125, -0.019382476806640625, -0.01507568359375, -0.010768890380859375, -0.00646209716796875, -0.002155303955078125, 0.0021514892578125, 0.006458282470703125, 0.01076507568359375, 0.015071868896484375, 0.019378662109375, 0.023685455322265625, 0.02799224853515625, 0.032299041748046875, 0.0366058349609375, 0.040912628173828125, 0.04521942138671875, 0.049526214599609375, 0.0538330078125, 0.058139801025390625, 0.06244659423828125, 0.06675338745117188, 0.0710601806640625, 0.07536697387695312, 0.07967376708984375, 0.08398056030273438, 0.088287353515625, 0.09259414672851562, 0.09690093994140625, 0.10120773315429688, 0.1055145263671875, 0.10982131958007812, 0.11412811279296875, 0.11843490600585938, 0.12274169921875, 0.12704849243164062, 0.13135528564453125, 0.13566207885742188, 0.1399688720703125, 0.14427566528320312, 0.14858245849609375, 0.15288925170898438, 0.157196044921875, 0.16150283813476562, 0.16580963134765625, 0.17011642456054688, 0.1744232177734375, 0.17873001098632812, 0.18303680419921875, 0.18734359741210938, 0.191650390625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 9.0, 11.0, 9.0, 22.0, 33.0, 66.0, 120.0, 165.0, 343.0, 792.0, 6083.0, 4030038.0, 153601.0, 1913.0, 520.0, 249.0, 148.0, 75.0, 41.0, 27.0, 14.0, 5.0, 5.0, 3.0, 1.0, 0.0, 1.0], "bins": [-8.0546875, -7.889678955078125, -7.72467041015625, -7.559661865234375, -7.3946533203125, -7.229644775390625, -7.06463623046875, -6.899627685546875, -6.734619140625, -6.569610595703125, -6.40460205078125, -6.239593505859375, -6.0745849609375, -5.909576416015625, -5.74456787109375, -5.579559326171875, -5.41455078125, -5.249542236328125, -5.08453369140625, -4.919525146484375, -4.7545166015625, -4.589508056640625, -4.42449951171875, -4.259490966796875, -4.094482421875, -3.929473876953125, -3.76446533203125, -3.599456787109375, -3.4344482421875, -3.269439697265625, -3.10443115234375, -2.939422607421875, -2.7744140625, -2.609405517578125, -2.44439697265625, -2.279388427734375, -2.1143798828125, -1.949371337890625, -1.78436279296875, -1.619354248046875, -1.454345703125, -1.289337158203125, -1.12432861328125, -0.959320068359375, -0.7943115234375, -0.629302978515625, -0.46429443359375, -0.299285888671875, -0.13427734375, 0.030731201171875, 0.19573974609375, 0.360748291015625, 0.5257568359375, 0.690765380859375, 0.85577392578125, 1.020782470703125, 1.185791015625, 1.350799560546875, 1.51580810546875, 1.680816650390625, 1.8458251953125, 2.010833740234375, 2.17584228515625, 2.340850830078125, 2.505859375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 11.0, 10.0, 29.0, 44.0, 120.0, 459.0, 2543.0, 630.0, 151.0, 53.0, 26.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7080078125, -0.6928024291992188, -0.6775970458984375, -0.6623916625976562, -0.647186279296875, -0.6319808959960938, -0.6167755126953125, -0.6015701293945312, -0.58636474609375, -0.5711593627929688, -0.5559539794921875, -0.5407485961914062, -0.525543212890625, -0.5103378295898438, -0.4951324462890625, -0.47992706298828125, -0.4647216796875, -0.44951629638671875, -0.4343109130859375, -0.41910552978515625, -0.403900146484375, -0.38869476318359375, -0.3734893798828125, -0.35828399658203125, -0.34307861328125, -0.32787322998046875, -0.3126678466796875, -0.29746246337890625, -0.282257080078125, -0.26705169677734375, -0.2518463134765625, -0.23664093017578125, -0.221435546875, -0.20623016357421875, -0.1910247802734375, -0.17581939697265625, -0.160614013671875, -0.14540863037109375, -0.1302032470703125, -0.11499786376953125, -0.09979248046875, -0.08458709716796875, -0.0693817138671875, -0.05417633056640625, -0.038970947265625, -0.02376556396484375, -0.0085601806640625, 0.00664520263671875, 0.0218505859375, 0.03705596923828125, 0.0522613525390625, 0.06746673583984375, 0.082672119140625, 0.09787750244140625, 0.1130828857421875, 0.12828826904296875, 0.14349365234375, 0.15869903564453125, 0.1739044189453125, 0.18910980224609375, 0.204315185546875, 0.21952056884765625, 0.2347259521484375, 0.24993133544921875, 0.26513671875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 28.0, 125.0, 452.0, 320.0, 61.0, 14.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.045211791992188, -9.825933456420898, -9.60665512084961, -9.387377738952637, -9.168099403381348, -8.948821067810059, -8.72954273223877, -8.51026439666748, -8.290987014770508, -8.071708679199219, -7.852430820465088, -7.633152484893799, -7.413874626159668, -7.194596290588379, -6.97531795501709, -6.756040096282959, -6.536761283874512, -6.317482948303223, -6.098205089569092, -5.878926753997803, -5.659648895263672, -5.440370559692383, -5.221092224121094, -5.001814365386963, -4.782536506652832, -4.563258171081543, -4.343980312347412, -4.124701976776123, -3.905423879623413, -3.686145782470703, -3.466867685317993, -3.247589588165283, -3.0283114910125732, -2.8090333938598633, -2.5897552967071533, -2.3704771995544434, -2.1511988639831543, -1.9319207668304443, -1.7126426696777344, -1.4933644533157349, -1.274086356163025, -1.054808259010315, -0.8355300426483154, -0.6162519454956055, -0.39697378873825073, -0.177695631980896, 0.041582465171813965, 0.2608606815338135, 0.48013877868652344, 0.6994169354438782, 0.9186950922012329, 1.1379731893539429, 1.3572514057159424, 1.5765295028686523, 1.7958076000213623, 2.0150856971740723, 2.2343640327453613, 2.4536421298980713, 2.6729202270507812, 2.8921985626220703, 3.1114766597747803, 3.3307547569274902, 3.5500328540802, 3.76931095123291, 3.98858904838562]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 8.0, 19.0, 22.0, 41.0, 44.0, 68.0, 70.0, 95.0, 118.0, 106.0, 108.0, 93.0, 63.0, 51.0, 39.0, 24.0, 15.0, 10.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1679043769836426, -1.1115180253982544, -1.0551316738128662, -0.9987452626228333, -0.9423588514328003, -0.8859724998474121, -0.8295861482620239, -0.773199737071991, -0.716813325881958, -0.6604269742965698, -0.6040405631065369, -0.5476542115211487, -0.4912678003311157, -0.43488144874572754, -0.37849506735801697, -0.3221086859703064, -0.2657223343849182, -0.20933595299720764, -0.15294957160949707, -0.09656320512294769, -0.04017682373523712, 0.016209542751312256, 0.07259592413902283, 0.1289823055267334, 0.18536868691444397, 0.24175506830215454, 0.2981414496898651, 0.3545278310775757, 0.41091418266296387, 0.46730056405067444, 0.523686945438385, 0.580073356628418, 0.6364597082138062, 0.6928460597991943, 0.7492324709892273, 0.8056188225746155, 0.8620052337646484, 0.9183915853500366, 0.9747779369354248, 1.0311644077301025, 1.0875507593154907, 1.143937110900879, 1.200323462486267, 1.2567099332809448, 1.313096284866333, 1.3694826364517212, 1.4258689880371094, 1.482255458831787, 1.5386416912078857, 1.595028042793274, 1.651414394378662, 1.7078008651733398, 1.764187216758728, 1.8205735683441162, 1.8769599199295044, 1.9333462715148926, 1.9897327423095703, 2.046119213104248, 2.1025054454803467, 2.1588919162750244, 2.215278148651123, 2.271664619445801, 2.3280510902404785, 2.384437322616577, 2.440823793411255]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 2.0, 2.0, 4.0, 6.0, 10.0, 10.0, 18.0, 9.0, 12.0, 20.0, 38.0, 51.0, 71.0, 127.0, 243.0, 599.0, 1860.0, 11883.0, 250595.0, 734294.0, 42759.0, 4026.0, 995.0, 385.0, 186.0, 107.0, 57.0, 49.0, 29.0, 19.0, 16.0, 9.0, 14.0, 12.0, 11.0, 10.0, 9.0, 1.0, 3.0, 1.0, 5.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.435546875, -1.378662109375, -1.32177734375, -1.264892578125, -1.2080078125, -1.151123046875, -1.09423828125, -1.037353515625, -0.98046875, -0.923583984375, -0.86669921875, -0.809814453125, -0.7529296875, -0.696044921875, -0.63916015625, -0.582275390625, -0.525390625, -0.468505859375, -0.41162109375, -0.354736328125, -0.2978515625, -0.240966796875, -0.18408203125, -0.127197265625, -0.0703125, -0.013427734375, 0.04345703125, 0.100341796875, 0.1572265625, 0.214111328125, 0.27099609375, 0.327880859375, 0.384765625, 0.441650390625, 0.49853515625, 0.555419921875, 0.6123046875, 0.669189453125, 0.72607421875, 0.782958984375, 0.83984375, 0.896728515625, 0.95361328125, 1.010498046875, 1.0673828125, 1.124267578125, 1.18115234375, 1.238037109375, 1.294921875, 1.351806640625, 1.40869140625, 1.465576171875, 1.5224609375, 1.579345703125, 1.63623046875, 1.693115234375, 1.75, 1.806884765625, 1.86376953125, 1.920654296875, 1.9775390625, 2.034423828125, 2.09130859375, 2.148193359375, 2.205078125]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 9.0, 13.0, 23.0, 36.0, 49.0, 82.0, 95.0, 118.0, 119.0, 119.0, 101.0, 85.0, 64.0, 41.0, 20.0, 14.0, 7.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11602783203125, -0.11210155487060547, -0.10817527770996094, -0.1042490005493164, -0.10032272338867188, -0.09639644622802734, -0.09247016906738281, -0.08854389190673828, -0.08461761474609375, -0.08069133758544922, -0.07676506042480469, -0.07283878326416016, -0.06891250610351562, -0.0649862289428711, -0.06105995178222656, -0.05713367462158203, -0.0532073974609375, -0.04928112030029297, -0.04535484313964844, -0.041428565979003906, -0.037502288818359375, -0.033576011657714844, -0.029649734497070312, -0.02572345733642578, -0.02179718017578125, -0.01787090301513672, -0.013944625854492188, -0.010018348693847656, -0.006092071533203125, -0.0021657943725585938, 0.0017604827880859375, 0.005686759948730469, 0.009613037109375, 0.013539314270019531, 0.017465591430664062, 0.021391868591308594, 0.025318145751953125, 0.029244422912597656, 0.03317070007324219, 0.03709697723388672, 0.04102325439453125, 0.04494953155517578, 0.04887580871582031, 0.052802085876464844, 0.056728363037109375, 0.060654640197753906, 0.06458091735839844, 0.06850719451904297, 0.0724334716796875, 0.07635974884033203, 0.08028602600097656, 0.0842123031616211, 0.08813858032226562, 0.09206485748291016, 0.09599113464355469, 0.09991741180419922, 0.10384368896484375, 0.10776996612548828, 0.11169624328613281, 0.11562252044677734, 0.11954879760742188, 0.1234750747680664, 0.12740135192871094, 0.13132762908935547, 0.13525390625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 7.0, 7.0, 3.0, 5.0, 16.0, 21.0, 15.0, 28.0, 36.0, 56.0, 86.0, 119.0, 191.0, 340.0, 612.0, 1216.0, 2620.0, 7358.0, 26284.0, 117106.0, 422931.0, 353565.0, 86005.0, 19475.0, 5851.0, 2275.0, 1008.0, 487.0, 289.0, 176.0, 124.0, 79.0, 45.0, 27.0, 31.0, 18.0, 16.0, 9.0, 10.0, 3.0, 5.0, 0.0, 1.0, 0.0, 5.0, 1.0, 2.0], "bins": [-0.80615234375, -0.784881591796875, -0.76361083984375, -0.742340087890625, -0.7210693359375, -0.699798583984375, -0.67852783203125, -0.657257080078125, -0.635986328125, -0.614715576171875, -0.59344482421875, -0.572174072265625, -0.5509033203125, -0.529632568359375, -0.50836181640625, -0.487091064453125, -0.4658203125, -0.444549560546875, -0.42327880859375, -0.402008056640625, -0.3807373046875, -0.359466552734375, -0.33819580078125, -0.316925048828125, -0.295654296875, -0.274383544921875, -0.25311279296875, -0.231842041015625, -0.2105712890625, -0.189300537109375, -0.16802978515625, -0.146759033203125, -0.12548828125, -0.104217529296875, -0.08294677734375, -0.061676025390625, -0.0404052734375, -0.019134521484375, 0.00213623046875, 0.023406982421875, 0.044677734375, 0.065948486328125, 0.08721923828125, 0.108489990234375, 0.1297607421875, 0.151031494140625, 0.17230224609375, 0.193572998046875, 0.21484375, 0.236114501953125, 0.25738525390625, 0.278656005859375, 0.2999267578125, 0.321197509765625, 0.34246826171875, 0.363739013671875, 0.385009765625, 0.406280517578125, 0.42755126953125, 0.448822021484375, 0.4700927734375, 0.491363525390625, 0.51263427734375, 0.533905029296875, 0.55517578125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 6.0, 13.0, 8.0, 11.0, 14.0, 15.0, 26.0, 25.0, 30.0, 35.0, 36.0, 35.0, 54.0, 56.0, 59.0, 59.0, 59.0, 52.0, 55.0, 55.0, 49.0, 36.0, 39.0, 28.0, 25.0, 29.0, 20.0, 15.0, 17.0, 10.0, 6.0, 8.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.37890625, -0.3684959411621094, -0.35808563232421875, -0.3476753234863281, -0.3372650146484375, -0.3268547058105469, -0.31644439697265625, -0.3060340881347656, -0.295623779296875, -0.2852134704589844, -0.27480316162109375, -0.2643928527832031, -0.2539825439453125, -0.24357223510742188, -0.23316192626953125, -0.22275161743164062, -0.21234130859375, -0.20193099975585938, -0.19152069091796875, -0.18111038208007812, -0.1707000732421875, -0.16028976440429688, -0.14987945556640625, -0.13946914672851562, -0.129058837890625, -0.11864852905273438, -0.10823822021484375, -0.09782791137695312, -0.0874176025390625, -0.07700729370117188, -0.06659698486328125, -0.056186676025390625, -0.0457763671875, -0.035366058349609375, -0.02495574951171875, -0.014545440673828125, -0.0041351318359375, 0.006275177001953125, 0.01668548583984375, 0.027095794677734375, 0.037506103515625, 0.047916412353515625, 0.05832672119140625, 0.06873703002929688, 0.0791473388671875, 0.08955764770507812, 0.09996795654296875, 0.11037826538085938, 0.12078857421875, 0.13119888305664062, 0.14160919189453125, 0.15201950073242188, 0.1624298095703125, 0.17284011840820312, 0.18325042724609375, 0.19366073608398438, 0.204071044921875, 0.21448135375976562, 0.22489166259765625, 0.23530197143554688, 0.2457122802734375, 0.2561225891113281, 0.26653289794921875, 0.2769432067871094, 0.287353515625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 3.0, 5.0, 4.0, 9.0, 9.0, 15.0, 13.0, 26.0, 54.0, 73.0, 105.0, 213.0, 419.0, 1348.0, 6075.0, 68038.0, 928777.0, 36896.0, 4526.0, 1046.0, 382.0, 192.0, 109.0, 73.0, 54.0, 28.0, 17.0, 14.0, 9.0, 10.0, 4.0, 3.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.6630859375, -1.613311767578125, -1.56353759765625, -1.513763427734375, -1.4639892578125, -1.414215087890625, -1.36444091796875, -1.314666748046875, -1.264892578125, -1.215118408203125, -1.16534423828125, -1.115570068359375, -1.0657958984375, -1.016021728515625, -0.96624755859375, -0.916473388671875, -0.86669921875, -0.816925048828125, -0.76715087890625, -0.717376708984375, -0.6676025390625, -0.617828369140625, -0.56805419921875, -0.518280029296875, -0.468505859375, -0.418731689453125, -0.36895751953125, -0.319183349609375, -0.2694091796875, -0.219635009765625, -0.16986083984375, -0.120086669921875, -0.0703125, -0.020538330078125, 0.02923583984375, 0.079010009765625, 0.1287841796875, 0.178558349609375, 0.22833251953125, 0.278106689453125, 0.327880859375, 0.377655029296875, 0.42742919921875, 0.477203369140625, 0.5269775390625, 0.576751708984375, 0.62652587890625, 0.676300048828125, 0.72607421875, 0.775848388671875, 0.82562255859375, 0.875396728515625, 0.9251708984375, 0.974945068359375, 1.02471923828125, 1.074493408203125, 1.124267578125, 1.174041748046875, 1.22381591796875, 1.273590087890625, 1.3233642578125, 1.373138427734375, 1.42291259765625, 1.472686767578125, 1.5224609375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 7.0, 3.0, 2.0, 6.0, 12.0, 22.0, 32.0, 53.0, 57.0, 95.0, 99.0, 134.0, 125.0, 101.0, 83.0, 59.0, 35.0, 28.0, 10.0, 13.0, 12.0, 8.0, 2.0, 5.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.842613220214844e-05, -6.528012454509735e-05, -6.213411688804626e-05, -5.898810923099518e-05, -5.584210157394409e-05, -5.2696093916893005e-05, -4.955008625984192e-05, -4.640407860279083e-05, -4.3258070945739746e-05, -4.011206328868866e-05, -3.696605563163757e-05, -3.382004797458649e-05, -3.06740403175354e-05, -2.7528032660484314e-05, -2.4382025003433228e-05, -2.123601734638214e-05, -1.8090009689331055e-05, -1.4944002032279968e-05, -1.1797994375228882e-05, -8.651986718177795e-06, -5.505979061126709e-06, -2.3599714040756226e-06, 7.860362529754639e-07, 3.93204391002655e-06, 7.078051567077637e-06, 1.0224059224128723e-05, 1.337006688117981e-05, 1.6516074538230896e-05, 1.9662082195281982e-05, 2.280808985233307e-05, 2.5954097509384155e-05, 2.9100105166435242e-05, 3.224611282348633e-05, 3.5392120480537415e-05, 3.85381281375885e-05, 4.168413579463959e-05, 4.4830143451690674e-05, 4.797615110874176e-05, 5.112215876579285e-05, 5.426816642284393e-05, 5.741417407989502e-05, 6.0560181736946106e-05, 6.370618939399719e-05, 6.685219705104828e-05, 6.999820470809937e-05, 7.314421236515045e-05, 7.629022002220154e-05, 7.943622767925262e-05, 8.258223533630371e-05, 8.57282429933548e-05, 8.887425065040588e-05, 9.202025830745697e-05, 9.516626596450806e-05, 9.831227362155914e-05, 0.00010145828127861023, 0.00010460428893566132, 0.0001077502965927124, 0.00011089630424976349, 0.00011404231190681458, 0.00011718831956386566, 0.00012033432722091675, 0.00012348033487796783, 0.00012662634253501892, 0.00012977235019207, 0.0001329183578491211]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 5.0, 6.0, 7.0, 5.0, 17.0, 29.0, 47.0, 68.0, 120.0, 247.0, 645.0, 1671.0, 6345.0, 45543.0, 856796.0, 123088.0, 10011.0, 2335.0, 833.0, 314.0, 171.0, 90.0, 53.0, 39.0, 20.0, 16.0, 9.0, 8.0, 5.0, 3.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2578125, -1.2192840576171875, -1.180755615234375, -1.1422271728515625, -1.10369873046875, -1.0651702880859375, -1.026641845703125, -0.9881134033203125, -0.9495849609375, -0.9110565185546875, -0.872528076171875, -0.8339996337890625, -0.79547119140625, -0.7569427490234375, -0.718414306640625, -0.6798858642578125, -0.641357421875, -0.6028289794921875, -0.564300537109375, -0.5257720947265625, -0.48724365234375, -0.4487152099609375, -0.410186767578125, -0.3716583251953125, -0.3331298828125, -0.2946014404296875, -0.256072998046875, -0.2175445556640625, -0.17901611328125, -0.1404876708984375, -0.101959228515625, -0.0634307861328125, -0.02490234375, 0.0136260986328125, 0.052154541015625, 0.0906829833984375, 0.12921142578125, 0.1677398681640625, 0.206268310546875, 0.2447967529296875, 0.2833251953125, 0.3218536376953125, 0.360382080078125, 0.3989105224609375, 0.43743896484375, 0.4759674072265625, 0.514495849609375, 0.5530242919921875, 0.591552734375, 0.6300811767578125, 0.668609619140625, 0.7071380615234375, 0.74566650390625, 0.7841949462890625, 0.822723388671875, 0.8612518310546875, 0.8997802734375, 0.9383087158203125, 0.976837158203125, 1.0153656005859375, 1.05389404296875, 1.0924224853515625, 1.130950927734375, 1.1694793701171875, 1.2080078125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 7.0, 8.0, 15.0, 14.0, 32.0, 69.0, 83.0, 138.0, 165.0, 153.0, 125.0, 72.0, 52.0, 22.0, 13.0, 8.0, 3.0, 6.0, 6.0, 4.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.430908203125, -0.4154930114746094, -0.40007781982421875, -0.3846626281738281, -0.3692474365234375, -0.3538322448730469, -0.33841705322265625, -0.3230018615722656, -0.307586669921875, -0.2921714782714844, -0.27675628662109375, -0.2613410949707031, -0.2459259033203125, -0.23051071166992188, -0.21509552001953125, -0.19968032836914062, -0.18426513671875, -0.16884994506835938, -0.15343475341796875, -0.13801956176757812, -0.1226043701171875, -0.10718917846679688, -0.09177398681640625, -0.07635879516601562, -0.060943603515625, -0.045528411865234375, -0.03011322021484375, -0.014698028564453125, 0.0007171630859375, 0.016132354736328125, 0.03154754638671875, 0.046962738037109375, 0.0623779296875, 0.07779312133789062, 0.09320831298828125, 0.10862350463867188, 0.1240386962890625, 0.13945388793945312, 0.15486907958984375, 0.17028427124023438, 0.185699462890625, 0.20111465454101562, 0.21652984619140625, 0.23194503784179688, 0.2473602294921875, 0.2627754211425781, 0.27819061279296875, 0.2936058044433594, 0.30902099609375, 0.3244361877441406, 0.33985137939453125, 0.3552665710449219, 0.3706817626953125, 0.3860969543457031, 0.40151214599609375, 0.4169273376464844, 0.432342529296875, 0.4477577209472656, 0.46317291259765625, 0.4785881042480469, 0.4940032958984375, 0.5094184875488281, 0.5248336791992188, 0.5402488708496094, 0.5556640625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 12.0, 46.0, 184.0, 423.0, 250.0, 67.0, 17.0, 10.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.70760726928711, -16.33279037475586, -15.957975387573242, -15.583159446716309, -15.208343505859375, -14.833527565002441, -14.458711624145508, -14.083895683288574, -13.70907974243164, -13.334263801574707, -12.959447860717773, -12.58463191986084, -12.209815979003906, -11.835000038146973, -11.460184097290039, -11.085368156433105, -10.710552215576172, -10.335736274719238, -9.960920333862305, -9.586104393005371, -9.211288452148438, -8.836472511291504, -8.46165657043457, -8.086840629577637, -7.712023735046387, -7.337207794189453, -6.9623918533325195, -6.587575912475586, -6.212759971618652, -5.837944030761719, -5.463128089904785, -5.088312149047852, -4.71349573135376, -4.338679790496826, -3.9638638496398926, -3.589047908782959, -3.2142319679260254, -2.839416027069092, -2.464599847793579, -2.0897839069366455, -1.714967966079712, -1.3401520252227783, -0.9653360247612, -0.5905200242996216, -0.215704083442688, 0.1591118574142456, 0.5339279174804688, 0.9087438583374023, 1.283559799194336, 1.6583757400512695, 2.033191680908203, 2.4080076217651367, 2.7828235626220703, 3.157639503479004, 3.5324556827545166, 3.90727162361145, 4.282087326049805, 4.656903266906738, 5.031719207763672, 5.4065351486206055, 5.781351089477539, 6.156167030334473, 6.530982971191406, 6.90579891204834, 7.280615329742432]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 3.0, 5.0, 14.0, 18.0, 17.0, 31.0, 34.0, 42.0, 46.0, 69.0, 69.0, 62.0, 65.0, 65.0, 82.0, 67.0, 54.0, 59.0, 43.0, 40.0, 34.0, 21.0, 17.0, 6.0, 15.0, 10.0, 7.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.159533977508545, -2.0684778690338135, -1.9774218797683716, -1.8863658905029297, -1.7953099012374878, -1.704253911972046, -1.6131978034973145, -1.5221418142318726, -1.4310858249664307, -1.3400298357009888, -1.2489737272262573, -1.1579177379608154, -1.0668617486953735, -0.9758056998252869, -0.8847496509552002, -0.7936936616897583, -0.7026375532150269, -0.6115815043449402, -0.5205255150794983, -0.4294694662094116, -0.33841344714164734, -0.24735742807388306, -0.1563013792037964, -0.06524538993835449, 0.025810658931732178, 0.11686668545007706, 0.20792271196842194, 0.2989787459373474, 0.3900347650051117, 0.481090784072876, 0.5721468329429626, 0.6632028222084045, 0.7542588710784912, 0.8453149199485779, 0.9363709092140198, 1.0274269580841064, 1.1184829473495483, 1.2095389366149902, 1.3005950450897217, 1.3916510343551636, 1.4827070236206055, 1.5737630128860474, 1.6648191213607788, 1.7558751106262207, 1.8469310998916626, 1.9379870891571045, 2.029043197631836, 2.1200990676879883, 2.211155414581299, 2.3022115230560303, 2.3932673931121826, 2.484323501586914, 2.5753796100616455, 2.666435480117798, 2.7574915885925293, 2.8485474586486816, 2.939603567123413, 3.0306596755981445, 3.121715545654297, 3.2127716541290283, 3.3038277626037598, 3.394883632659912, 3.4859397411346436, 3.576995849609375, 3.6680517196655273]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 11.0, 12.0, 18.0, 32.0, 52.0, 99.0, 295.0, 999.0, 6401.0, 97757.0, 3993691.0, 87454.0, 5839.0, 962.0, 270.0, 118.0, 66.0, 42.0, 28.0, 22.0, 22.0, 19.0, 7.0, 11.0, 14.0, 5.0, 2.0, 4.0, 5.0, 5.0, 4.0, 3.0, 3.0, 3.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.9638671875, -1.8897247314453125, -1.815582275390625, -1.7414398193359375, -1.66729736328125, -1.5931549072265625, -1.519012451171875, -1.4448699951171875, -1.3707275390625, -1.2965850830078125, -1.222442626953125, -1.1483001708984375, -1.07415771484375, -1.0000152587890625, -0.925872802734375, -0.8517303466796875, -0.777587890625, -0.7034454345703125, -0.629302978515625, -0.5551605224609375, -0.48101806640625, -0.4068756103515625, -0.332733154296875, -0.2585906982421875, -0.1844482421875, -0.1103057861328125, -0.036163330078125, 0.0379791259765625, 0.11212158203125, 0.1862640380859375, 0.260406494140625, 0.3345489501953125, 0.40869140625, 0.4828338623046875, 0.556976318359375, 0.6311187744140625, 0.70526123046875, 0.7794036865234375, 0.853546142578125, 0.9276885986328125, 1.0018310546875, 1.0759735107421875, 1.150115966796875, 1.2242584228515625, 1.29840087890625, 1.3725433349609375, 1.446685791015625, 1.5208282470703125, 1.594970703125, 1.6691131591796875, 1.743255615234375, 1.8173980712890625, 1.89154052734375, 1.9656829833984375, 2.039825439453125, 2.1139678955078125, 2.1881103515625, 2.2622528076171875, 2.336395263671875, 2.4105377197265625, 2.48468017578125, 2.5588226318359375, 2.632965087890625, 2.7071075439453125, 2.78125]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 7.0, 6.0, 6.0, 9.0, 14.0, 10.0, 18.0, 15.0, 35.0, 37.0, 42.0, 53.0, 45.0, 51.0, 67.0, 48.0, 68.0, 69.0, 65.0, 74.0, 63.0, 43.0, 27.0, 34.0, 27.0, 17.0, 14.0, 10.0, 9.0, 9.0, 3.0, 8.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.063232421875, -0.06072998046875, -0.0582275390625, -0.05572509765625, -0.05322265625, -0.05072021484375, -0.0482177734375, -0.04571533203125, -0.043212890625, -0.04071044921875, -0.0382080078125, -0.03570556640625, -0.033203125, -0.03070068359375, -0.0281982421875, -0.02569580078125, -0.023193359375, -0.02069091796875, -0.0181884765625, -0.01568603515625, -0.01318359375, -0.01068115234375, -0.0081787109375, -0.00567626953125, -0.003173828125, -0.00067138671875, 0.0018310546875, 0.00433349609375, 0.0068359375, 0.00933837890625, 0.0118408203125, 0.01434326171875, 0.016845703125, 0.01934814453125, 0.0218505859375, 0.02435302734375, 0.02685546875, 0.02935791015625, 0.0318603515625, 0.03436279296875, 0.036865234375, 0.03936767578125, 0.0418701171875, 0.04437255859375, 0.046875, 0.04937744140625, 0.0518798828125, 0.05438232421875, 0.056884765625, 0.05938720703125, 0.0618896484375, 0.06439208984375, 0.06689453125, 0.06939697265625, 0.0718994140625, 0.07440185546875, 0.076904296875, 0.07940673828125, 0.0819091796875, 0.08441162109375, 0.0869140625, 0.08941650390625, 0.0919189453125, 0.09442138671875, 0.096923828125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 5.0, 9.0, 8.0, 14.0, 28.0, 19.0, 38.0, 67.0, 129.0, 238.0, 505.0, 1730.0, 44189.0, 4138750.0, 6616.0, 1036.0, 410.0, 185.0, 105.0, 69.0, 53.0, 27.0, 16.0, 7.0, 10.0, 8.0, 5.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.125, -6.9525146484375, -6.780029296875, -6.6075439453125, -6.43505859375, -6.2625732421875, -6.090087890625, -5.9176025390625, -5.7451171875, -5.5726318359375, -5.400146484375, -5.2276611328125, -5.05517578125, -4.8826904296875, -4.710205078125, -4.5377197265625, -4.365234375, -4.1927490234375, -4.020263671875, -3.8477783203125, -3.67529296875, -3.5028076171875, -3.330322265625, -3.1578369140625, -2.9853515625, -2.8128662109375, -2.640380859375, -2.4678955078125, -2.29541015625, -2.1229248046875, -1.950439453125, -1.7779541015625, -1.60546875, -1.4329833984375, -1.260498046875, -1.0880126953125, -0.91552734375, -0.7430419921875, -0.570556640625, -0.3980712890625, -0.2255859375, -0.0531005859375, 0.119384765625, 0.2918701171875, 0.46435546875, 0.6368408203125, 0.809326171875, 0.9818115234375, 1.154296875, 1.3267822265625, 1.499267578125, 1.6717529296875, 1.84423828125, 2.0167236328125, 2.189208984375, 2.3616943359375, 2.5341796875, 2.7066650390625, 2.879150390625, 3.0516357421875, 3.22412109375, 3.3966064453125, 3.569091796875, 3.7415771484375, 3.9140625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 12.0, 16.0, 17.0, 40.0, 106.0, 252.0, 840.0, 2039.0, 434.0, 161.0, 78.0, 28.0, 21.0, 14.0, 11.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41455078125, -0.4020957946777344, -0.38964080810546875, -0.3771858215332031, -0.3647308349609375, -0.3522758483886719, -0.33982086181640625, -0.3273658752441406, -0.314910888671875, -0.3024559020996094, -0.29000091552734375, -0.2775459289550781, -0.2650909423828125, -0.2526359558105469, -0.24018096923828125, -0.22772598266601562, -0.21527099609375, -0.20281600952148438, -0.19036102294921875, -0.17790603637695312, -0.1654510498046875, -0.15299606323242188, -0.14054107666015625, -0.12808609008789062, -0.115631103515625, -0.10317611694335938, -0.09072113037109375, -0.07826614379882812, -0.0658111572265625, -0.053356170654296875, -0.04090118408203125, -0.028446197509765625, -0.0159912109375, -0.003536224365234375, 0.00891876220703125, 0.021373748779296875, 0.0338287353515625, 0.046283721923828125, 0.05873870849609375, 0.07119369506835938, 0.083648681640625, 0.09610366821289062, 0.10855865478515625, 0.12101364135742188, 0.1334686279296875, 0.14592361450195312, 0.15837860107421875, 0.17083358764648438, 0.18328857421875, 0.19574356079101562, 0.20819854736328125, 0.22065353393554688, 0.2331085205078125, 0.24556350708007812, 0.25801849365234375, 0.2704734802246094, 0.282928466796875, 0.2953834533691406, 0.30783843994140625, 0.3202934265136719, 0.3327484130859375, 0.3452033996582031, 0.35765838623046875, 0.3701133728027344, 0.382568359375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 2.0, 6.0, 16.0, 24.0, 39.0, 105.0, 197.0, 268.0, 182.0, 76.0, 40.0, 19.0, 11.0, 5.0, 6.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7217984199523926, -3.6108174324035645, -3.4998362064361572, -3.388855218887329, -3.277873992919922, -3.1668930053710938, -3.0559120178222656, -2.9449307918548584, -2.833949565887451, -2.722968578338623, -2.611987352371216, -2.5010063648223877, -2.3900251388549805, -2.2790441513061523, -2.168063163757324, -2.057081937789917, -1.9461009502410889, -1.8351198434829712, -1.7241387367248535, -1.6131577491760254, -1.5021765232086182, -1.39119553565979, -1.2802144289016724, -1.1692333221435547, -1.058252215385437, -0.9472711086273193, -0.8362900018692017, -0.7253089547157288, -0.6143278479576111, -0.5033467411994934, -0.3923656940460205, -0.28138458728790283, -0.17040348052978516, -0.059422388672828674, 0.05155870318412781, 0.1625397801399231, 0.27352088689804077, 0.38450199365615845, 0.49548304080963135, 0.606464147567749, 0.7174452543258667, 0.8284263610839844, 0.939407467842102, 1.0503885746002197, 1.1613695621490479, 1.272350788116455, 1.3833317756652832, 1.4943128824234009, 1.6052939891815186, 1.7162750959396362, 1.827256202697754, 1.938237190246582, 2.0492184162139893, 2.1601994037628174, 2.2711806297302246, 2.3821616172790527, 2.493142604827881, 2.604123592376709, 2.715104818344116, 2.8260858058929443, 2.9370670318603516, 3.0480480194091797, 3.159029006958008, 3.270010232925415, 3.3809914588928223]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 5.0, 6.0, 13.0, 15.0, 17.0, 42.0, 36.0, 52.0, 67.0, 79.0, 93.0, 92.0, 67.0, 69.0, 63.0, 63.0, 60.0, 47.0, 34.0, 19.0, 19.0, 14.0, 10.0, 10.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.483320951461792, -1.447756290435791, -1.41219162940979, -1.3766270875930786, -1.3410624265670776, -1.3054977655410767, -1.2699332237243652, -1.2343685626983643, -1.1988039016723633, -1.1632392406463623, -1.1276745796203613, -1.09211003780365, -1.056545376777649, -1.020980715751648, -0.9854161143302917, -0.9498515129089355, -0.9142868518829346, -0.8787221908569336, -0.8431575894355774, -0.8075929880142212, -0.7720283269882202, -0.7364636659622192, -0.700899064540863, -0.6653344631195068, -0.6297698020935059, -0.5942051410675049, -0.5586405396461487, -0.5230759382247925, -0.4875112771987915, -0.4519466459751129, -0.4163820147514343, -0.38081738352775574, -0.34525275230407715, -0.30968812108039856, -0.27412348985671997, -0.23855885863304138, -0.2029942274093628, -0.1674295961856842, -0.13186496496200562, -0.09630033373832703, -0.06073570251464844, -0.02517107129096985, 0.01039355993270874, 0.04595819115638733, 0.08152282238006592, 0.1170874536037445, 0.1526520848274231, 0.18821671605110168, 0.22378134727478027, 0.25934597849845886, 0.29491060972213745, 0.33047524094581604, 0.36603987216949463, 0.4016045033931732, 0.4371691346168518, 0.4727337658405304, 0.508298397064209, 0.54386305809021, 0.5794276595115662, 0.6149922609329224, 0.6505569219589233, 0.6861215829849243, 0.7216861844062805, 0.7572507858276367, 0.7928154468536377]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 2.0, 5.0, 5.0, 3.0, 4.0, 11.0, 8.0, 12.0, 19.0, 26.0, 17.0, 48.0, 53.0, 69.0, 102.0, 159.0, 282.0, 645.0, 1408.0, 4808.0, 25801.0, 259866.0, 649973.0, 89064.0, 11415.0, 2633.0, 978.0, 438.0, 238.0, 145.0, 92.0, 57.0, 51.0, 28.0, 25.0, 20.0, 9.0, 7.0, 10.0, 9.0, 4.0, 5.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.6005859375, -1.552490234375, -1.50439453125, -1.456298828125, -1.408203125, -1.360107421875, -1.31201171875, -1.263916015625, -1.2158203125, -1.167724609375, -1.11962890625, -1.071533203125, -1.0234375, -0.975341796875, -0.92724609375, -0.879150390625, -0.8310546875, -0.782958984375, -0.73486328125, -0.686767578125, -0.638671875, -0.590576171875, -0.54248046875, -0.494384765625, -0.4462890625, -0.398193359375, -0.35009765625, -0.302001953125, -0.25390625, -0.205810546875, -0.15771484375, -0.109619140625, -0.0615234375, -0.013427734375, 0.03466796875, 0.082763671875, 0.130859375, 0.178955078125, 0.22705078125, 0.275146484375, 0.3232421875, 0.371337890625, 0.41943359375, 0.467529296875, 0.515625, 0.563720703125, 0.61181640625, 0.659912109375, 0.7080078125, 0.756103515625, 0.80419921875, 0.852294921875, 0.900390625, 0.948486328125, 0.99658203125, 1.044677734375, 1.0927734375, 1.140869140625, 1.18896484375, 1.237060546875, 1.28515625, 1.333251953125, 1.38134765625, 1.429443359375, 1.4775390625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 2.0, 9.0, 4.0, 13.0, 20.0, 23.0, 49.0, 35.0, 50.0, 68.0, 67.0, 87.0, 87.0, 80.0, 77.0, 72.0, 81.0, 56.0, 32.0, 27.0, 22.0, 17.0, 13.0, 6.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0828857421875, -0.07953834533691406, -0.07619094848632812, -0.07284355163574219, -0.06949615478515625, -0.06614875793457031, -0.06280136108398438, -0.05945396423339844, -0.0561065673828125, -0.05275917053222656, -0.049411773681640625, -0.04606437683105469, -0.04271697998046875, -0.03936958312988281, -0.036022186279296875, -0.03267478942871094, -0.029327392578125, -0.025979995727539062, -0.022632598876953125, -0.019285202026367188, -0.01593780517578125, -0.012590408325195312, -0.009243011474609375, -0.0058956146240234375, -0.0025482177734375, 0.0007991790771484375, 0.004146575927734375, 0.0074939727783203125, 0.01084136962890625, 0.014188766479492188, 0.017536163330078125, 0.020883560180664062, 0.02423095703125, 0.027578353881835938, 0.030925750732421875, 0.03427314758300781, 0.03762054443359375, 0.04096794128417969, 0.044315338134765625, 0.04766273498535156, 0.0510101318359375, 0.05435752868652344, 0.057704925537109375, 0.06105232238769531, 0.06439971923828125, 0.06774711608886719, 0.07109451293945312, 0.07444190979003906, 0.077789306640625, 0.08113670349121094, 0.08448410034179688, 0.08783149719238281, 0.09117889404296875, 0.09452629089355469, 0.09787368774414062, 0.10122108459472656, 0.1045684814453125, 0.10791587829589844, 0.11126327514648438, 0.11461067199707031, 0.11795806884765625, 0.12130546569824219, 0.12465286254882812, 0.12800025939941406, 0.13134765625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 4.0, 3.0, 7.0, 9.0, 10.0, 14.0, 27.0, 26.0, 51.0, 79.0, 119.0, 193.0, 395.0, 672.0, 1467.0, 3077.0, 7522.0, 23439.0, 92933.0, 351050.0, 402935.0, 119214.0, 29475.0, 8960.0, 3500.0, 1543.0, 781.0, 410.0, 229.0, 141.0, 81.0, 57.0, 37.0, 26.0, 23.0, 9.0, 13.0, 8.0, 4.0, 3.0, 3.0, 3.0, 5.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.82177734375, -0.7990036010742188, -0.7762298583984375, -0.7534561157226562, -0.730682373046875, -0.7079086303710938, -0.6851348876953125, -0.6623611450195312, -0.63958740234375, -0.6168136596679688, -0.5940399169921875, -0.5712661743164062, -0.548492431640625, -0.5257186889648438, -0.5029449462890625, -0.48017120361328125, -0.4573974609375, -0.43462371826171875, -0.4118499755859375, -0.38907623291015625, -0.366302490234375, -0.34352874755859375, -0.3207550048828125, -0.29798126220703125, -0.27520751953125, -0.25243377685546875, -0.2296600341796875, -0.20688629150390625, -0.184112548828125, -0.16133880615234375, -0.1385650634765625, -0.11579132080078125, -0.093017578125, -0.07024383544921875, -0.0474700927734375, -0.02469635009765625, -0.001922607421875, 0.02085113525390625, 0.0436248779296875, 0.06639862060546875, 0.08917236328125, 0.11194610595703125, 0.1347198486328125, 0.15749359130859375, 0.180267333984375, 0.20304107666015625, 0.2258148193359375, 0.24858856201171875, 0.2713623046875, 0.29413604736328125, 0.3169097900390625, 0.33968353271484375, 0.362457275390625, 0.38523101806640625, 0.4080047607421875, 0.43077850341796875, 0.45355224609375, 0.47632598876953125, 0.4990997314453125, 0.5218734741210938, 0.544647216796875, 0.5674209594726562, 0.5901947021484375, 0.6129684448242188, 0.6357421875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 3.0, 7.0, 4.0, 6.0, 9.0, 7.0, 10.0, 14.0, 15.0, 18.0, 22.0, 32.0, 33.0, 38.0, 30.0, 34.0, 30.0, 47.0, 43.0, 49.0, 46.0, 49.0, 49.0, 51.0, 31.0, 31.0, 40.0, 35.0, 33.0, 17.0, 28.0, 24.0, 14.0, 19.0, 15.0, 12.0, 11.0, 9.0, 11.0, 8.0, 8.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.307373046875, -0.2979774475097656, -0.28858184814453125, -0.2791862487792969, -0.2697906494140625, -0.2603950500488281, -0.25099945068359375, -0.24160385131835938, -0.232208251953125, -0.22281265258789062, -0.21341705322265625, -0.20402145385742188, -0.1946258544921875, -0.18523025512695312, -0.17583465576171875, -0.16643905639648438, -0.15704345703125, -0.14764785766601562, -0.13825225830078125, -0.12885665893554688, -0.1194610595703125, -0.11006546020507812, -0.10066986083984375, -0.09127426147460938, -0.081878662109375, -0.07248306274414062, -0.06308746337890625, -0.053691864013671875, -0.0442962646484375, -0.034900665283203125, -0.02550506591796875, -0.016109466552734375, -0.0067138671875, 0.002681732177734375, 0.01207733154296875, 0.021472930908203125, 0.0308685302734375, 0.040264129638671875, 0.04965972900390625, 0.059055328369140625, 0.068450927734375, 0.07784652709960938, 0.08724212646484375, 0.09663772583007812, 0.1060333251953125, 0.11542892456054688, 0.12482452392578125, 0.13422012329101562, 0.14361572265625, 0.15301132202148438, 0.16240692138671875, 0.17180252075195312, 0.1811981201171875, 0.19059371948242188, 0.19998931884765625, 0.20938491821289062, 0.218780517578125, 0.22817611694335938, 0.23757171630859375, 0.24696731567382812, 0.2563629150390625, 0.2657585144042969, 0.27515411376953125, 0.2845497131347656, 0.2939453125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 0.0, 3.0, 6.0, 8.0, 4.0, 4.0, 11.0, 14.0, 19.0, 24.0, 57.0, 77.0, 146.0, 279.0, 529.0, 1204.0, 3415.0, 12084.0, 88429.0, 700792.0, 212376.0, 20892.0, 4971.0, 1704.0, 709.0, 326.0, 164.0, 120.0, 53.0, 40.0, 22.0, 17.0, 15.0, 7.0, 10.0, 5.0, 4.0, 3.0, 4.0, 1.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6748046875, -0.6558837890625, -0.636962890625, -0.6180419921875, -0.59912109375, -0.5802001953125, -0.561279296875, -0.5423583984375, -0.5234375, -0.5045166015625, -0.485595703125, -0.4666748046875, -0.44775390625, -0.4288330078125, -0.409912109375, -0.3909912109375, -0.3720703125, -0.3531494140625, -0.334228515625, -0.3153076171875, -0.29638671875, -0.2774658203125, -0.258544921875, -0.2396240234375, -0.220703125, -0.2017822265625, -0.182861328125, -0.1639404296875, -0.14501953125, -0.1260986328125, -0.107177734375, -0.0882568359375, -0.0693359375, -0.0504150390625, -0.031494140625, -0.0125732421875, 0.00634765625, 0.0252685546875, 0.044189453125, 0.0631103515625, 0.08203125, 0.1009521484375, 0.119873046875, 0.1387939453125, 0.15771484375, 0.1766357421875, 0.195556640625, 0.2144775390625, 0.2333984375, 0.2523193359375, 0.271240234375, 0.2901611328125, 0.30908203125, 0.3280029296875, 0.346923828125, 0.3658447265625, 0.384765625, 0.4036865234375, 0.422607421875, 0.4415283203125, 0.46044921875, 0.4793701171875, 0.498291015625, 0.5172119140625, 0.5361328125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 4.0, 11.0, 9.0, 17.0, 16.0, 19.0, 29.0, 31.0, 42.0, 49.0, 64.0, 75.0, 83.0, 104.0, 67.0, 78.0, 54.0, 61.0, 41.0, 36.0, 25.0, 26.0, 11.0, 9.0, 7.0, 11.0, 4.0, 4.0, 3.0, 4.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.210803985595703e-05, -6.0187652707099915e-05, -5.82672655582428e-05, -5.634687840938568e-05, -5.4426491260528564e-05, -5.250610411167145e-05, -5.058571696281433e-05, -4.8665329813957214e-05, -4.67449426651001e-05, -4.482455551624298e-05, -4.2904168367385864e-05, -4.098378121852875e-05, -3.906339406967163e-05, -3.7143006920814514e-05, -3.52226197719574e-05, -3.330223262310028e-05, -3.1381845474243164e-05, -2.9461458325386047e-05, -2.754107117652893e-05, -2.5620684027671814e-05, -2.3700296878814697e-05, -2.177990972995758e-05, -1.9859522581100464e-05, -1.7939135432243347e-05, -1.601874828338623e-05, -1.4098361134529114e-05, -1.2177973985671997e-05, -1.025758683681488e-05, -8.337199687957764e-06, -6.416812539100647e-06, -4.49642539024353e-06, -2.5760382413864136e-06, -6.556510925292969e-07, 1.2647360563278198e-06, 3.1851232051849365e-06, 5.105510354042053e-06, 7.02589750289917e-06, 8.946284651756287e-06, 1.0866671800613403e-05, 1.278705894947052e-05, 1.4707446098327637e-05, 1.6627833247184753e-05, 1.854822039604187e-05, 2.0468607544898987e-05, 2.2388994693756104e-05, 2.430938184261322e-05, 2.6229768991470337e-05, 2.8150156140327454e-05, 3.007054328918457e-05, 3.199093043804169e-05, 3.3911317586898804e-05, 3.583170473575592e-05, 3.775209188461304e-05, 3.9672479033470154e-05, 4.159286618232727e-05, 4.351325333118439e-05, 4.5433640480041504e-05, 4.735402762889862e-05, 4.927441477775574e-05, 5.1194801926612854e-05, 5.311518907546997e-05, 5.503557622432709e-05, 5.6955963373184204e-05, 5.887635052204132e-05, 6.079673767089844e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 2.0, 4.0, 5.0, 11.0, 13.0, 17.0, 12.0, 27.0, 54.0, 82.0, 154.0, 274.0, 586.0, 1381.0, 3486.0, 11839.0, 60879.0, 570322.0, 350703.0, 35644.0, 8227.0, 2725.0, 1065.0, 489.0, 239.0, 107.0, 79.0, 40.0, 30.0, 16.0, 11.0, 9.0, 8.0, 4.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.7109375, -0.6939544677734375, -0.676971435546875, -0.6599884033203125, -0.64300537109375, -0.6260223388671875, -0.609039306640625, -0.5920562744140625, -0.5750732421875, -0.5580902099609375, -0.541107177734375, -0.5241241455078125, -0.50714111328125, -0.4901580810546875, -0.473175048828125, -0.4561920166015625, -0.439208984375, -0.4222259521484375, -0.405242919921875, -0.3882598876953125, -0.37127685546875, -0.3542938232421875, -0.337310791015625, -0.3203277587890625, -0.3033447265625, -0.2863616943359375, -0.269378662109375, -0.2523956298828125, -0.23541259765625, -0.2184295654296875, -0.201446533203125, -0.1844635009765625, -0.16748046875, -0.1504974365234375, -0.133514404296875, -0.1165313720703125, -0.09954833984375, -0.0825653076171875, -0.065582275390625, -0.0485992431640625, -0.0316162109375, -0.0146331787109375, 0.002349853515625, 0.0193328857421875, 0.03631591796875, 0.0532989501953125, 0.070281982421875, 0.0872650146484375, 0.104248046875, 0.1212310791015625, 0.138214111328125, 0.1551971435546875, 0.17218017578125, 0.1891632080078125, 0.206146240234375, 0.2231292724609375, 0.2401123046875, 0.2570953369140625, 0.274078369140625, 0.2910614013671875, 0.30804443359375, 0.3250274658203125, 0.342010498046875, 0.3589935302734375, 0.3759765625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 3.0, 2.0, 8.0, 16.0, 22.0, 19.0, 71.0, 69.0, 84.0, 116.0, 136.0, 119.0, 119.0, 63.0, 47.0, 34.0, 35.0, 8.0, 8.0, 7.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47802734375, -0.4656867980957031, -0.45334625244140625, -0.4410057067871094, -0.4286651611328125, -0.4163246154785156, -0.40398406982421875, -0.3916435241699219, -0.379302978515625, -0.3669624328613281, -0.35462188720703125, -0.3422813415527344, -0.3299407958984375, -0.3176002502441406, -0.30525970458984375, -0.2929191589355469, -0.28057861328125, -0.2682380676269531, -0.25589752197265625, -0.24355697631835938, -0.2312164306640625, -0.21887588500976562, -0.20653533935546875, -0.19419479370117188, -0.181854248046875, -0.16951370239257812, -0.15717315673828125, -0.14483261108398438, -0.1324920654296875, -0.12015151977539062, -0.10781097412109375, -0.09547042846679688, -0.0831298828125, -0.07078933715820312, -0.05844879150390625, -0.046108245849609375, -0.0337677001953125, -0.021427154541015625, -0.00908660888671875, 0.003253936767578125, 0.015594482421875, 0.027935028076171875, 0.04027557373046875, 0.052616119384765625, 0.0649566650390625, 0.07729721069335938, 0.08963775634765625, 0.10197830200195312, 0.11431884765625, 0.12665939331054688, 0.13899993896484375, 0.15134048461914062, 0.1636810302734375, 0.17602157592773438, 0.18836212158203125, 0.20070266723632812, 0.213043212890625, 0.22538375854492188, 0.23772430419921875, 0.2500648498535156, 0.2624053955078125, 0.2747459411621094, 0.28708648681640625, 0.2994270324707031, 0.311767578125]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 7.0, 14.0, 33.0, 80.0, 148.0, 250.0, 246.0, 126.0, 56.0, 28.0, 11.0, 4.0, 1.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.672994136810303, -6.440582275390625, -6.2081708908081055, -5.975759029388428, -5.74334716796875, -5.5109357833862305, -5.278523921966553, -5.046112060546875, -4.8137006759643555, -4.581288814544678, -4.348877429962158, -4.1164655685424805, -3.8840537071228027, -3.651642084121704, -3.4192304611206055, -3.1868185997009277, -2.95440673828125, -2.7219951152801514, -2.4895832538604736, -2.257171630859375, -2.0247597694396973, -1.7923481464385986, -1.5599365234375, -1.3275247812271118, -1.0951130390167236, -0.8627012968063354, -0.630289614200592, -0.39787793159484863, -0.16546618938446045, 0.06694555282592773, 0.29935717582702637, 0.5317689180374146, 0.7641811370849609, 0.9965928792953491, 1.2290046215057373, 1.461416244506836, 1.6938279867172241, 1.9262397289276123, 2.158651351928711, 2.3910632133483887, 2.6234748363494873, 2.855886459350586, 3.0882983207702637, 3.3207099437713623, 3.553121566772461, 3.7855334281921387, 4.017945289611816, 4.250356674194336, 4.482768535614014, 4.715180397033691, 4.947591781616211, 5.180003643035889, 5.412415504455566, 5.644826889038086, 5.877238750457764, 6.109650611877441, 6.342061996459961, 6.574473857879639, 6.806885242462158, 7.039297103881836, 7.271708965301514, 7.504120826721191, 7.736532211303711, 7.968944072723389, 8.201355934143066]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 5.0, 3.0, 2.0, 6.0, 5.0, 8.0, 12.0, 12.0, 15.0, 15.0, 19.0, 28.0, 31.0, 30.0, 33.0, 46.0, 32.0, 48.0, 48.0, 39.0, 37.0, 42.0, 33.0, 37.0, 41.0, 37.0, 38.0, 32.0, 43.0, 30.0, 29.0, 25.0, 20.0, 18.0, 17.0, 19.0, 11.0, 9.0, 16.0, 5.0, 8.0, 5.0, 5.0, 5.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.741559386253357, -1.685322642326355, -1.629085898399353, -1.572849154472351, -1.5166124105453491, -1.4603756666183472, -1.4041389226913452, -1.3479021787643433, -1.2916654348373413, -1.2354286909103394, -1.1791919469833374, -1.1229552030563354, -1.0667184591293335, -1.0104817152023315, -0.9542449712753296, -0.8980082273483276, -0.8417714834213257, -0.7855347394943237, -0.7292979955673218, -0.6730612516403198, -0.6168245077133179, -0.5605877637863159, -0.504351019859314, -0.448114275932312, -0.39187753200531006, -0.3356407880783081, -0.27940404415130615, -0.2231673002243042, -0.16693055629730225, -0.11069381237030029, -0.05445706844329834, 0.0017796754837036133, 0.058016300201416016, 0.11425304412841797, 0.17048978805541992, 0.22672653198242188, 0.28296327590942383, 0.3392000198364258, 0.39543676376342773, 0.4516735076904297, 0.5079102516174316, 0.5641469955444336, 0.6203837394714355, 0.6766204833984375, 0.7328572273254395, 0.7890939712524414, 0.8453307151794434, 0.9015674591064453, 0.9578042030334473, 1.0140409469604492, 1.0702776908874512, 1.1265144348144531, 1.182751178741455, 1.238987922668457, 1.295224666595459, 1.351461410522461, 1.407698154449463, 1.4639348983764648, 1.5201716423034668, 1.5764083862304688, 1.6326451301574707, 1.6888818740844727, 1.7451186180114746, 1.8013553619384766, 1.8575921058654785]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 11.0, 11.0, 22.0, 24.0, 46.0, 78.0, 140.0, 266.0, 552.0, 1502.0, 5666.0, 42920.0, 3859616.0, 265021.0, 13832.0, 2841.0, 872.0, 372.0, 180.0, 97.0, 46.0, 40.0, 18.0, 25.0, 13.0, 13.0, 7.0, 3.0, 8.0, 6.0, 8.0, 3.0, 2.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.5263671875, -1.4621124267578125, -1.397857666015625, -1.3336029052734375, -1.26934814453125, -1.2050933837890625, -1.140838623046875, -1.0765838623046875, -1.0123291015625, -0.9480743408203125, -0.883819580078125, -0.8195648193359375, -0.75531005859375, -0.6910552978515625, -0.626800537109375, -0.5625457763671875, -0.498291015625, -0.4340362548828125, -0.369781494140625, -0.3055267333984375, -0.24127197265625, -0.1770172119140625, -0.112762451171875, -0.0485076904296875, 0.0157470703125, 0.0800018310546875, 0.144256591796875, 0.2085113525390625, 0.27276611328125, 0.3370208740234375, 0.401275634765625, 0.4655303955078125, 0.52978515625, 0.5940399169921875, 0.658294677734375, 0.7225494384765625, 0.78680419921875, 0.8510589599609375, 0.915313720703125, 0.9795684814453125, 1.0438232421875, 1.1080780029296875, 1.172332763671875, 1.2365875244140625, 1.30084228515625, 1.3650970458984375, 1.429351806640625, 1.4936065673828125, 1.557861328125, 1.6221160888671875, 1.686370849609375, 1.7506256103515625, 1.81488037109375, 1.8791351318359375, 1.943389892578125, 2.0076446533203125, 2.0718994140625, 2.1361541748046875, 2.200408935546875, 2.2646636962890625, 2.32891845703125, 2.3931732177734375, 2.457427978515625, 2.5216827392578125, 2.5859375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 7.0, 2.0, 5.0, 9.0, 14.0, 17.0, 25.0, 27.0, 23.0, 65.0, 64.0, 66.0, 63.0, 78.0, 87.0, 71.0, 78.0, 55.0, 59.0, 47.0, 43.0, 21.0, 20.0, 22.0, 9.0, 5.0, 5.0, 8.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0782470703125, -0.07489967346191406, -0.07155227661132812, -0.06820487976074219, -0.06485748291015625, -0.06151008605957031, -0.058162689208984375, -0.05481529235839844, -0.0514678955078125, -0.04812049865722656, -0.044773101806640625, -0.04142570495605469, -0.03807830810546875, -0.03473091125488281, -0.031383514404296875, -0.028036117553710938, -0.024688720703125, -0.021341323852539062, -0.017993927001953125, -0.014646530151367188, -0.01129913330078125, -0.007951736450195312, -0.004604339599609375, -0.0012569427490234375, 0.0020904541015625, 0.0054378509521484375, 0.008785247802734375, 0.012132644653320312, 0.01548004150390625, 0.018827438354492188, 0.022174835205078125, 0.025522232055664062, 0.02886962890625, 0.03221702575683594, 0.035564422607421875, 0.03891181945800781, 0.04225921630859375, 0.04560661315917969, 0.048954010009765625, 0.05230140686035156, 0.0556488037109375, 0.05899620056152344, 0.062343597412109375, 0.06569099426269531, 0.06903839111328125, 0.07238578796386719, 0.07573318481445312, 0.07908058166503906, 0.082427978515625, 0.08577537536621094, 0.08912277221679688, 0.09247016906738281, 0.09581756591796875, 0.09916496276855469, 0.10251235961914062, 0.10585975646972656, 0.1092071533203125, 0.11255455017089844, 0.11590194702148438, 0.11924934387207031, 0.12259674072265625, 0.1259441375732422, 0.12929153442382812, 0.13263893127441406, 0.135986328125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 8.0, 10.0, 17.0, 35.0, 41.0, 83.0, 182.0, 385.0, 1173.0, 6971.0, 1667375.0, 2507908.0, 7943.0, 1321.0, 485.0, 193.0, 84.0, 36.0, 22.0, 10.0, 6.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.220703125, -3.123138427734375, -3.02557373046875, -2.928009033203125, -2.8304443359375, -2.732879638671875, -2.63531494140625, -2.537750244140625, -2.440185546875, -2.342620849609375, -2.24505615234375, -2.147491455078125, -2.0499267578125, -1.952362060546875, -1.85479736328125, -1.757232666015625, -1.65966796875, -1.562103271484375, -1.46453857421875, -1.366973876953125, -1.2694091796875, -1.171844482421875, -1.07427978515625, -0.976715087890625, -0.879150390625, -0.781585693359375, -0.68402099609375, -0.586456298828125, -0.4888916015625, -0.391326904296875, -0.29376220703125, -0.196197509765625, -0.0986328125, -0.001068115234375, 0.09649658203125, 0.194061279296875, 0.2916259765625, 0.389190673828125, 0.48675537109375, 0.584320068359375, 0.681884765625, 0.779449462890625, 0.87701416015625, 0.974578857421875, 1.0721435546875, 1.169708251953125, 1.26727294921875, 1.364837646484375, 1.46240234375, 1.559967041015625, 1.65753173828125, 1.755096435546875, 1.8526611328125, 1.950225830078125, 2.04779052734375, 2.145355224609375, 2.242919921875, 2.340484619140625, 2.43804931640625, 2.535614013671875, 2.6331787109375, 2.730743408203125, 2.82830810546875, 2.925872802734375, 3.0234375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 10.0, 18.0, 28.0, 52.0, 146.0, 461.0, 2084.0, 894.0, 222.0, 87.0, 29.0, 23.0, 10.0, 7.0, 7.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.452880859375, -0.4390411376953125, -0.425201416015625, -0.4113616943359375, -0.39752197265625, -0.3836822509765625, -0.369842529296875, -0.3560028076171875, -0.3421630859375, -0.3283233642578125, -0.314483642578125, -0.3006439208984375, -0.28680419921875, -0.2729644775390625, -0.259124755859375, -0.2452850341796875, -0.2314453125, -0.2176055908203125, -0.203765869140625, -0.1899261474609375, -0.17608642578125, -0.1622467041015625, -0.148406982421875, -0.1345672607421875, -0.1207275390625, -0.1068878173828125, -0.093048095703125, -0.0792083740234375, -0.06536865234375, -0.0515289306640625, -0.037689208984375, -0.0238494873046875, -0.010009765625, 0.0038299560546875, 0.017669677734375, 0.0315093994140625, 0.04534912109375, 0.0591888427734375, 0.073028564453125, 0.0868682861328125, 0.1007080078125, 0.1145477294921875, 0.128387451171875, 0.1422271728515625, 0.15606689453125, 0.1699066162109375, 0.183746337890625, 0.1975860595703125, 0.21142578125, 0.2252655029296875, 0.239105224609375, 0.2529449462890625, 0.26678466796875, 0.2806243896484375, 0.294464111328125, 0.3083038330078125, 0.3221435546875, 0.3359832763671875, 0.349822998046875, 0.3636627197265625, 0.37750244140625, 0.3913421630859375, 0.405181884765625, 0.4190216064453125, 0.432861328125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 14.0, 40.0, 130.0, 396.0, 308.0, 83.0, 21.0, 7.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.397743225097656, -4.250485897064209, -4.10322904586792, -3.9559717178344727, -3.8087146282196045, -3.6614575386047363, -3.514200210571289, -3.366943120956421, -3.2196860313415527, -3.0724289417266846, -2.9251718521118164, -2.777914524078369, -2.630657434463501, -2.483400344848633, -2.3361430168151855, -2.1888859272003174, -2.041628837585449, -1.894371747970581, -1.7471145391464233, -1.5998573303222656, -1.4526002407073975, -1.3053431510925293, -1.1580859422683716, -1.0108287334442139, -0.8635716438293457, -0.7163144946098328, -0.5690573453903198, -0.4218001961708069, -0.27454304695129395, -0.127285897731781, 0.019971251487731934, 0.16722846031188965, 0.3144855499267578, 0.46174269914627075, 0.6089998483657837, 0.7562569975852966, 0.9035141468048096, 1.0507712364196777, 1.1980284452438354, 1.3452856540679932, 1.4925427436828613, 1.6397998332977295, 1.7870570421218872, 1.934314250946045, 2.081571340560913, 2.2288284301757812, 2.3760857582092285, 2.5233428478240967, 2.670599937438965, 2.817857027053833, 2.965114116668701, 3.1123714447021484, 3.2596285343170166, 3.4068856239318848, 3.554142951965332, 3.7014000415802, 3.8486571311950684, 3.9959142208099365, 4.143171310424805, 4.290428638458252, 4.437685966491699, 4.584942817687988, 4.7322001457214355, 4.879457473754883, 5.026714324951172]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 10.0, 8.0, 7.0, 18.0, 10.0, 15.0, 23.0, 23.0, 36.0, 35.0, 59.0, 62.0, 48.0, 64.0, 59.0, 63.0, 75.0, 64.0, 60.0, 50.0, 49.0, 37.0, 27.0, 15.0, 20.0, 11.0, 17.0, 8.0, 4.0, 9.0, 4.0, 9.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8421344757080078, -0.8111727237701416, -0.7802109718322754, -0.7492492198944092, -0.718287467956543, -0.6873257160186768, -0.6563639640808105, -0.6254022121429443, -0.5944404602050781, -0.5634787082672119, -0.5325169563293457, -0.5015552043914795, -0.4705934524536133, -0.43963170051574707, -0.40866991877555847, -0.37770816683769226, -0.34674638509750366, -0.31578463315963745, -0.28482288122177124, -0.25386112928390503, -0.22289936244487762, -0.1919376105070114, -0.160975843667984, -0.1300140917301178, -0.09905233979225159, -0.06809058785438538, -0.03712882846593857, -0.00616706907749176, 0.02479468286037445, 0.05575643479824066, 0.08671820163726807, 0.11767995357513428, 0.1486417055130005, 0.1796034574508667, 0.2105652093887329, 0.24152697622776031, 0.27248871326446533, 0.30345046520233154, 0.33441224694252014, 0.36537399888038635, 0.39633575081825256, 0.4272975027561188, 0.458259254693985, 0.4892210364341736, 0.5201827883720398, 0.551144540309906, 0.5821062922477722, 0.6130680441856384, 0.6440297961235046, 0.6749915480613708, 0.7059532999992371, 0.7369150519371033, 0.7678768038749695, 0.7988385558128357, 0.8298003673553467, 0.8607621192932129, 0.8917238712310791, 0.9226856231689453, 0.9536473751068115, 0.9846091270446777, 1.015570878982544, 1.0465326309204102, 1.0774943828582764, 1.1084561347961426, 1.1394178867340088]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 8.0, 3.0, 10.0, 18.0, 45.0, 73.0, 139.0, 322.0, 796.0, 2472.0, 20680.0, 764890.0, 249036.0, 7604.0, 1450.0, 529.0, 224.0, 104.0, 60.0, 29.0, 20.0, 9.0, 10.0, 4.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.181640625, -2.09002685546875, -1.9984130859375, -1.90679931640625, -1.815185546875, -1.72357177734375, -1.6319580078125, -1.54034423828125, -1.44873046875, -1.35711669921875, -1.2655029296875, -1.17388916015625, -1.082275390625, -0.99066162109375, -0.8990478515625, -0.80743408203125, -0.7158203125, -0.62420654296875, -0.5325927734375, -0.44097900390625, -0.349365234375, -0.25775146484375, -0.1661376953125, -0.07452392578125, 0.01708984375, 0.10870361328125, 0.2003173828125, 0.29193115234375, 0.383544921875, 0.47515869140625, 0.5667724609375, 0.65838623046875, 0.75, 0.84161376953125, 0.9332275390625, 1.02484130859375, 1.116455078125, 1.20806884765625, 1.2996826171875, 1.39129638671875, 1.48291015625, 1.57452392578125, 1.6661376953125, 1.75775146484375, 1.849365234375, 1.94097900390625, 2.0325927734375, 2.12420654296875, 2.2158203125, 2.30743408203125, 2.3990478515625, 2.49066162109375, 2.582275390625, 2.67388916015625, 2.7655029296875, 2.85711669921875, 2.94873046875, 3.04034423828125, 3.1319580078125, 3.22357177734375, 3.315185546875, 3.40679931640625, 3.4984130859375, 3.59002685546875, 3.681640625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 8.0, 7.0, 9.0, 17.0, 25.0, 20.0, 30.0, 33.0, 49.0, 48.0, 63.0, 69.0, 75.0, 72.0, 71.0, 71.0, 65.0, 61.0, 48.0, 39.0, 23.0, 19.0, 27.0, 12.0, 12.0, 10.0, 4.0, 4.0, 4.0, 4.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.087890625, -0.08433341979980469, -0.08077621459960938, -0.07721900939941406, -0.07366180419921875, -0.07010459899902344, -0.06654739379882812, -0.06299018859863281, -0.0594329833984375, -0.05587577819824219, -0.052318572998046875, -0.04876136779785156, -0.04520416259765625, -0.04164695739746094, -0.038089752197265625, -0.03453254699707031, -0.030975341796875, -0.027418136596679688, -0.023860931396484375, -0.020303726196289062, -0.01674652099609375, -0.013189315795898438, -0.009632110595703125, -0.0060749053955078125, -0.0025177001953125, 0.0010395050048828125, 0.004596710205078125, 0.008153915405273438, 0.01171112060546875, 0.015268325805664062, 0.018825531005859375, 0.022382736206054688, 0.02593994140625, 0.029497146606445312, 0.033054351806640625, 0.03661155700683594, 0.04016876220703125, 0.04372596740722656, 0.047283172607421875, 0.05084037780761719, 0.0543975830078125, 0.05795478820800781, 0.061511993408203125, 0.06506919860839844, 0.06862640380859375, 0.07218360900878906, 0.07574081420898438, 0.07929801940917969, 0.082855224609375, 0.08641242980957031, 0.08996963500976562, 0.09352684020996094, 0.09708404541015625, 0.10064125061035156, 0.10419845581054688, 0.10775566101074219, 0.1113128662109375, 0.11487007141113281, 0.11842727661132812, 0.12198448181152344, 0.12554168701171875, 0.12909889221191406, 0.13265609741210938, 0.1362133026123047, 0.1397705078125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 3.0, 7.0, 4.0, 12.0, 10.0, 7.0, 21.0, 24.0, 31.0, 41.0, 68.0, 92.0, 152.0, 254.0, 373.0, 759.0, 1238.0, 2514.0, 5655.0, 15695.0, 58450.0, 260037.0, 477039.0, 167663.0, 38127.0, 11312.0, 4277.0, 2055.0, 1083.0, 575.0, 366.0, 197.0, 130.0, 92.0, 45.0, 40.0, 29.0, 18.0, 12.0, 14.0, 3.0, 12.0, 8.0, 4.0, 2.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.88916015625, -0.8632736206054688, -0.8373870849609375, -0.8115005493164062, -0.785614013671875, -0.7597274780273438, -0.7338409423828125, -0.7079544067382812, -0.68206787109375, -0.6561813354492188, -0.6302947998046875, -0.6044082641601562, -0.578521728515625, -0.5526351928710938, -0.5267486572265625, -0.5008621215820312, -0.4749755859375, -0.44908905029296875, -0.4232025146484375, -0.39731597900390625, -0.371429443359375, -0.34554290771484375, -0.3196563720703125, -0.29376983642578125, -0.26788330078125, -0.24199676513671875, -0.2161102294921875, -0.19022369384765625, -0.164337158203125, -0.13845062255859375, -0.1125640869140625, -0.08667755126953125, -0.060791015625, -0.03490447998046875, -0.0090179443359375, 0.01686859130859375, 0.042755126953125, 0.06864166259765625, 0.0945281982421875, 0.12041473388671875, 0.14630126953125, 0.17218780517578125, 0.1980743408203125, 0.22396087646484375, 0.249847412109375, 0.27573394775390625, 0.3016204833984375, 0.32750701904296875, 0.3533935546875, 0.37928009033203125, 0.4051666259765625, 0.43105316162109375, 0.456939697265625, 0.48282623291015625, 0.5087127685546875, 0.5345993041992188, 0.56048583984375, 0.5863723754882812, 0.6122589111328125, 0.6381454467773438, 0.664031982421875, 0.6899185180664062, 0.7158050537109375, 0.7416915893554688, 0.767578125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 5.0, 1.0, 1.0, 6.0, 10.0, 11.0, 10.0, 11.0, 15.0, 17.0, 20.0, 22.0, 22.0, 21.0, 32.0, 35.0, 40.0, 36.0, 46.0, 43.0, 50.0, 47.0, 38.0, 47.0, 42.0, 46.0, 43.0, 34.0, 38.0, 21.0, 25.0, 28.0, 25.0, 18.0, 15.0, 14.0, 12.0, 12.0, 8.0, 10.0, 9.0, 5.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.423095703125, -0.41040802001953125, -0.3977203369140625, -0.38503265380859375, -0.372344970703125, -0.35965728759765625, -0.3469696044921875, -0.33428192138671875, -0.32159423828125, -0.30890655517578125, -0.2962188720703125, -0.28353118896484375, -0.270843505859375, -0.25815582275390625, -0.2454681396484375, -0.23278045654296875, -0.2200927734375, -0.20740509033203125, -0.1947174072265625, -0.18202972412109375, -0.169342041015625, -0.15665435791015625, -0.1439666748046875, -0.13127899169921875, -0.11859130859375, -0.10590362548828125, -0.0932159423828125, -0.08052825927734375, -0.067840576171875, -0.05515289306640625, -0.0424652099609375, -0.02977752685546875, -0.01708984375, -0.00440216064453125, 0.0082855224609375, 0.02097320556640625, 0.033660888671875, 0.04634857177734375, 0.0590362548828125, 0.07172393798828125, 0.08441162109375, 0.09709930419921875, 0.1097869873046875, 0.12247467041015625, 0.135162353515625, 0.14785003662109375, 0.1605377197265625, 0.17322540283203125, 0.1859130859375, 0.19860076904296875, 0.2112884521484375, 0.22397613525390625, 0.236663818359375, 0.24935150146484375, 0.2620391845703125, 0.27472686767578125, 0.28741455078125, 0.30010223388671875, 0.3127899169921875, 0.32547760009765625, 0.338165283203125, 0.35085296630859375, 0.3635406494140625, 0.37622833251953125, 0.388916015625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 4.0, 4.0, 3.0, 3.0, 8.0, 10.0, 16.0, 24.0, 34.0, 40.0, 93.0, 115.0, 191.0, 264.0, 473.0, 939.0, 2061.0, 5175.0, 16556.0, 78215.0, 430139.0, 415378.0, 73703.0, 15822.0, 4982.0, 2061.0, 951.0, 503.0, 290.0, 167.0, 115.0, 66.0, 40.0, 37.0, 18.0, 19.0, 9.0, 6.0, 4.0, 5.0, 3.0, 6.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.445068359375, -0.4302253723144531, -0.41538238525390625, -0.4005393981933594, -0.3856964111328125, -0.3708534240722656, -0.35601043701171875, -0.3411674499511719, -0.326324462890625, -0.3114814758300781, -0.29663848876953125, -0.2817955017089844, -0.2669525146484375, -0.2521095275878906, -0.23726654052734375, -0.22242355346679688, -0.20758056640625, -0.19273757934570312, -0.17789459228515625, -0.16305160522460938, -0.1482086181640625, -0.13336563110351562, -0.11852264404296875, -0.10367965698242188, -0.088836669921875, -0.07399368286132812, -0.05915069580078125, -0.044307708740234375, -0.0294647216796875, -0.014621734619140625, 0.00022125244140625, 0.015064239501953125, 0.0299072265625, 0.044750213623046875, 0.05959320068359375, 0.07443618774414062, 0.0892791748046875, 0.10412216186523438, 0.11896514892578125, 0.13380813598632812, 0.148651123046875, 0.16349411010742188, 0.17833709716796875, 0.19318008422851562, 0.2080230712890625, 0.22286605834960938, 0.23770904541015625, 0.2525520324707031, 0.26739501953125, 0.2822380065917969, 0.29708099365234375, 0.3119239807128906, 0.3267669677734375, 0.3416099548339844, 0.35645294189453125, 0.3712959289550781, 0.386138916015625, 0.4009819030761719, 0.41582489013671875, 0.4306678771972656, 0.4455108642578125, 0.4603538513183594, 0.47519683837890625, 0.4900398254394531, 0.5048828125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 1.0, 5.0, 10.0, 19.0, 22.0, 37.0, 50.0, 88.0, 119.0, 152.0, 177.0, 119.0, 63.0, 53.0, 33.0, 18.0, 8.0, 11.0, 5.0, 2.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000179290771484375, -0.000174802727997303, -0.00017031468451023102, -0.00016582664102315903, -0.00016133859753608704, -0.00015685055404901505, -0.00015236251056194305, -0.00014787446707487106, -0.00014338642358779907, -0.00013889838010072708, -0.0001344103366136551, -0.0001299222931265831, -0.0001254342496395111, -0.00012094620615243912, -0.00011645816266536713, -0.00011197011917829514, -0.00010748207569122314, -0.00010299403220415115, -9.850598871707916e-05, -9.401794523000717e-05, -8.952990174293518e-05, -8.504185825586319e-05, -8.05538147687912e-05, -7.606577128171921e-05, -7.157772779464722e-05, -6.708968430757523e-05, -6.260164082050323e-05, -5.8113597333431244e-05, -5.362555384635925e-05, -4.913751035928726e-05, -4.464946687221527e-05, -4.016142338514328e-05, -3.567337989807129e-05, -3.11853364109993e-05, -2.6697292923927307e-05, -2.2209249436855316e-05, -1.7721205949783325e-05, -1.3233162462711334e-05, -8.745118975639343e-06, -4.257075488567352e-06, 2.3096799850463867e-07, 4.71901148557663e-06, 9.20705497264862e-06, 1.3695098459720612e-05, 1.8183141946792603e-05, 2.2671185433864594e-05, 2.7159228920936584e-05, 3.1647272408008575e-05, 3.6135315895080566e-05, 4.062335938215256e-05, 4.511140286922455e-05, 4.959944635629654e-05, 5.408748984336853e-05, 5.857553333044052e-05, 6.306357681751251e-05, 6.75516203045845e-05, 7.20396637916565e-05, 7.652770727872849e-05, 8.101575076580048e-05, 8.550379425287247e-05, 8.999183773994446e-05, 9.447988122701645e-05, 9.896792471408844e-05, 0.00010345596820116043, 0.00010794401168823242]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 2.0, 9.0, 6.0, 15.0, 16.0, 33.0, 39.0, 61.0, 106.0, 164.0, 199.0, 398.0, 648.0, 1223.0, 2495.0, 6131.0, 18515.0, 86514.0, 472261.0, 372987.0, 62245.0, 14605.0, 5119.0, 2204.0, 1052.0, 578.0, 318.0, 215.0, 124.0, 74.0, 57.0, 34.0, 37.0, 18.0, 10.0, 10.0, 6.0, 6.0, 2.0, 5.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.477783203125, -0.46369171142578125, -0.4496002197265625, -0.43550872802734375, -0.421417236328125, -0.40732574462890625, -0.3932342529296875, -0.37914276123046875, -0.36505126953125, -0.35095977783203125, -0.3368682861328125, -0.32277679443359375, -0.308685302734375, -0.29459381103515625, -0.2805023193359375, -0.26641082763671875, -0.2523193359375, -0.23822784423828125, -0.2241363525390625, -0.21004486083984375, -0.195953369140625, -0.18186187744140625, -0.1677703857421875, -0.15367889404296875, -0.13958740234375, -0.12549591064453125, -0.1114044189453125, -0.09731292724609375, -0.083221435546875, -0.06912994384765625, -0.0550384521484375, -0.04094696044921875, -0.02685546875, -0.01276397705078125, 0.0013275146484375, 0.01541900634765625, 0.029510498046875, 0.04360198974609375, 0.0576934814453125, 0.07178497314453125, 0.08587646484375, 0.09996795654296875, 0.1140594482421875, 0.12815093994140625, 0.142242431640625, 0.15633392333984375, 0.1704254150390625, 0.18451690673828125, 0.1986083984375, 0.21269989013671875, 0.2267913818359375, 0.24088287353515625, 0.254974365234375, 0.26906585693359375, 0.2831573486328125, 0.29724884033203125, 0.31134033203125, 0.32543182373046875, 0.3395233154296875, 0.35361480712890625, 0.367706298828125, 0.38179779052734375, 0.3958892822265625, 0.40998077392578125, 0.424072265625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 5.0, 4.0, 11.0, 15.0, 12.0, 18.0, 24.0, 32.0, 30.0, 50.0, 57.0, 60.0, 84.0, 77.0, 88.0, 85.0, 71.0, 65.0, 50.0, 27.0, 35.0, 24.0, 22.0, 13.0, 9.0, 6.0, 5.0, 8.0, 6.0, 2.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.32080078125, -0.3119010925292969, -0.30300140380859375, -0.2941017150878906, -0.2852020263671875, -0.2763023376464844, -0.26740264892578125, -0.2585029602050781, -0.249603271484375, -0.24070358276367188, -0.23180389404296875, -0.22290420532226562, -0.2140045166015625, -0.20510482788085938, -0.19620513916015625, -0.18730545043945312, -0.17840576171875, -0.16950607299804688, -0.16060638427734375, -0.15170669555664062, -0.1428070068359375, -0.13390731811523438, -0.12500762939453125, -0.11610794067382812, -0.107208251953125, -0.09830856323242188, -0.08940887451171875, -0.08050918579101562, -0.0716094970703125, -0.06270980834960938, -0.05381011962890625, -0.044910430908203125, -0.0360107421875, -0.027111053466796875, -0.01821136474609375, -0.009311676025390625, -0.0004119873046875, 0.008487701416015625, 0.01738739013671875, 0.026287078857421875, 0.035186767578125, 0.044086456298828125, 0.05298614501953125, 0.061885833740234375, 0.0707855224609375, 0.07968521118164062, 0.08858489990234375, 0.09748458862304688, 0.10638427734375, 0.11528396606445312, 0.12418365478515625, 0.13308334350585938, 0.1419830322265625, 0.15088272094726562, 0.15978240966796875, 0.16868209838867188, 0.177581787109375, 0.18648147583007812, 0.19538116455078125, 0.20428085327148438, 0.2131805419921875, 0.22208023071289062, 0.23097991943359375, 0.23987960815429688, 0.248779296875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 13.0, 12.0, 18.0, 31.0, 47.0, 89.0, 118.0, 184.0, 169.0, 129.0, 84.0, 49.0, 24.0, 15.0, 8.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.82899284362793, -4.634719371795654, -4.440446376800537, -4.246172904968262, -4.0518999099731445, -3.8576266765594482, -3.663353443145752, -3.4690799713134766, -3.2748069763183594, -3.080533742904663, -2.886260509490967, -2.6919872760772705, -2.497714042663574, -2.303440809249878, -2.1091675758361816, -1.9148942232131958, -1.72062087059021, -1.5263476371765137, -1.3320744037628174, -1.137801170349121, -0.94352787733078, -0.7492546439170837, -0.5549813508987427, -0.3607081174850464, -0.1664348840713501, 0.027838364243507385, 0.22211161255836487, 0.41638487577438354, 0.6106581091880798, 0.8049313426017761, 0.9992046356201172, 1.1934778690338135, 1.3877511024475098, 1.582024335861206, 1.7762975692749023, 1.9705708026885986, 2.164844036102295, 2.359117269515991, 2.5533905029296875, 2.747663974761963, 2.94193696975708, 3.1362102031707764, 3.3304834365844727, 3.524756669998169, 3.7190299034118652, 3.9133031368255615, 4.107576370239258, 4.301849842071533, 4.496123313903809, 4.690396785736084, 4.884669780731201, 5.078943252563477, 5.273216247558594, 5.467489719390869, 5.661762714385986, 5.856036186218262, 6.050309181213379, 6.244582653045654, 6.4388556480407715, 6.633129119873047, 6.827402114868164, 7.0216755867004395, 7.215948581695557, 7.410222053527832, 7.604495048522949]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 2.0, 5.0, 2.0, 2.0, 7.0, 17.0, 20.0, 25.0, 25.0, 25.0, 37.0, 55.0, 46.0, 67.0, 65.0, 75.0, 69.0, 66.0, 57.0, 72.0, 53.0, 46.0, 36.0, 39.0, 21.0, 11.0, 17.0, 11.0, 10.0, 3.0, 7.0, 3.0, 2.0, 5.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6068387031555176, -3.4877161979675293, -3.36859393119812, -3.249471426010132, -3.1303491592407227, -3.0112266540527344, -2.892104148864746, -2.772981882095337, -2.6538596153259277, -2.5347371101379395, -2.4156148433685303, -2.296492338180542, -2.177370071411133, -2.0582475662231445, -1.9391251802444458, -1.820002794265747, -1.7008802890777588, -1.58175790309906, -1.4626355171203613, -1.343513011932373, -1.2243907451629639, -1.1052682399749756, -0.9861458539962769, -0.8670234680175781, -0.7479010820388794, -0.6287786960601807, -0.5096563100814819, -0.3905338644981384, -0.2714114785194397, -0.15228909254074097, -0.03316664695739746, 0.08595573902130127, 0.205078125, 0.32420051097869873, 0.44332292675971985, 0.562445342540741, 0.6815677285194397, 0.8006901144981384, 0.9198125600814819, 1.0389349460601807, 1.1580573320388794, 1.2771797180175781, 1.3963021039962769, 1.5154244899749756, 1.6345469951629639, 1.753669261932373, 1.8727917671203613, 1.99191415309906, 2.111036539077759, 2.230159044265747, 2.3492813110351562, 2.4684038162231445, 2.5875260829925537, 2.706648588180542, 2.825770854949951, 2.9448933601379395, 3.0640158653259277, 3.183138370513916, 3.302260637283325, 3.4213831424713135, 3.5405054092407227, 3.659627914428711, 3.778750419616699, 3.8978726863861084, 4.016994953155518]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 7.0, 5.0, 15.0, 20.0, 38.0, 50.0, 106.0, 201.0, 393.0, 888.0, 2274.0, 7070.0, 32631.0, 417693.0, 3606772.0, 104860.0, 14798.0, 3773.0, 1307.0, 573.0, 255.0, 154.0, 84.0, 79.0, 60.0, 42.0, 30.0, 24.0, 10.0, 13.0, 7.0, 12.0, 4.0, 10.0, 4.0, 5.0, 4.0, 7.0, 2.0, 2.0, 3.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0009765625, -0.9516143798828125, -0.902252197265625, -0.8528900146484375, -0.80352783203125, -0.7541656494140625, -0.704803466796875, -0.6554412841796875, -0.6060791015625, -0.5567169189453125, -0.507354736328125, -0.4579925537109375, -0.40863037109375, -0.3592681884765625, -0.309906005859375, -0.2605438232421875, -0.211181640625, -0.1618194580078125, -0.112457275390625, -0.0630950927734375, -0.01373291015625, 0.0356292724609375, 0.084991455078125, 0.1343536376953125, 0.1837158203125, 0.2330780029296875, 0.282440185546875, 0.3318023681640625, 0.38116455078125, 0.4305267333984375, 0.479888916015625, 0.5292510986328125, 0.57861328125, 0.6279754638671875, 0.677337646484375, 0.7266998291015625, 0.77606201171875, 0.8254241943359375, 0.874786376953125, 0.9241485595703125, 0.9735107421875, 1.0228729248046875, 1.072235107421875, 1.1215972900390625, 1.17095947265625, 1.2203216552734375, 1.269683837890625, 1.3190460205078125, 1.368408203125, 1.4177703857421875, 1.467132568359375, 1.5164947509765625, 1.56585693359375, 1.6152191162109375, 1.664581298828125, 1.7139434814453125, 1.7633056640625, 1.8126678466796875, 1.862030029296875, 1.9113922119140625, 1.96075439453125, 2.0101165771484375, 2.059478759765625, 2.1088409423828125, 2.158203125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 6.0, 1.0, 2.0, 8.0, 1.0, 14.0, 6.0, 17.0, 21.0, 33.0, 30.0, 33.0, 45.0, 50.0, 68.0, 60.0, 80.0, 75.0, 65.0, 81.0, 63.0, 64.0, 37.0, 30.0, 31.0, 34.0, 12.0, 10.0, 11.0, 6.0, 2.0, 3.0, 5.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10406494140625, -0.10026073455810547, -0.09645652770996094, -0.0926523208618164, -0.08884811401367188, -0.08504390716552734, -0.08123970031738281, -0.07743549346923828, -0.07363128662109375, -0.06982707977294922, -0.06602287292480469, -0.062218666076660156, -0.058414459228515625, -0.054610252380371094, -0.05080604553222656, -0.04700183868408203, -0.0431976318359375, -0.03939342498779297, -0.03558921813964844, -0.031785011291503906, -0.027980804443359375, -0.024176597595214844, -0.020372390747070312, -0.01656818389892578, -0.01276397705078125, -0.008959770202636719, -0.0051555633544921875, -0.0013513565063476562, 0.002452850341796875, 0.006257057189941406, 0.010061264038085938, 0.013865470886230469, 0.017669677734375, 0.02147388458251953, 0.025278091430664062, 0.029082298278808594, 0.032886505126953125, 0.036690711975097656, 0.04049491882324219, 0.04429912567138672, 0.04810333251953125, 0.05190753936767578, 0.05571174621582031, 0.059515953063964844, 0.06332015991210938, 0.0671243667602539, 0.07092857360839844, 0.07473278045654297, 0.0785369873046875, 0.08234119415283203, 0.08614540100097656, 0.0899496078491211, 0.09375381469726562, 0.09755802154541016, 0.10136222839355469, 0.10516643524169922, 0.10897064208984375, 0.11277484893798828, 0.11657905578613281, 0.12038326263427734, 0.12418746948242188, 0.1279916763305664, 0.13179588317871094, 0.13560009002685547, 0.139404296875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 4.0, 13.0, 12.0, 14.0, 25.0, 61.0, 98.0, 166.0, 452.0, 1361.0, 9178.0, 4036700.0, 140420.0, 4102.0, 987.0, 328.0, 150.0, 80.0, 46.0, 33.0, 18.0, 11.0, 11.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.97265625, -6.801788330078125, -6.63092041015625, -6.460052490234375, -6.2891845703125, -6.118316650390625, -5.94744873046875, -5.776580810546875, -5.605712890625, -5.434844970703125, -5.26397705078125, -5.093109130859375, -4.9222412109375, -4.751373291015625, -4.58050537109375, -4.409637451171875, -4.23876953125, -4.067901611328125, -3.89703369140625, -3.726165771484375, -3.5552978515625, -3.384429931640625, -3.21356201171875, -3.042694091796875, -2.871826171875, -2.700958251953125, -2.53009033203125, -2.359222412109375, -2.1883544921875, -2.017486572265625, -1.84661865234375, -1.675750732421875, -1.5048828125, -1.334014892578125, -1.16314697265625, -0.992279052734375, -0.8214111328125, -0.650543212890625, -0.47967529296875, -0.308807373046875, -0.137939453125, 0.032928466796875, 0.20379638671875, 0.374664306640625, 0.5455322265625, 0.716400146484375, 0.88726806640625, 1.058135986328125, 1.22900390625, 1.399871826171875, 1.57073974609375, 1.741607666015625, 1.9124755859375, 2.083343505859375, 2.25421142578125, 2.425079345703125, 2.595947265625, 2.766815185546875, 2.93768310546875, 3.108551025390625, 3.2794189453125, 3.450286865234375, 3.62115478515625, 3.792022705078125, 3.962890625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 7.0, 20.0, 23.0, 35.0, 79.0, 155.0, 376.0, 1652.0, 1174.0, 300.0, 120.0, 66.0, 23.0, 18.0, 11.0, 6.0, 7.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.351318359375, -0.3304786682128906, -0.30963897705078125, -0.2887992858886719, -0.2679595947265625, -0.24711990356445312, -0.22628021240234375, -0.20544052124023438, -0.184600830078125, -0.16376113891601562, -0.14292144775390625, -0.12208175659179688, -0.1012420654296875, -0.08040237426757812, -0.05956268310546875, -0.038722991943359375, -0.01788330078125, 0.002956390380859375, 0.02379608154296875, 0.044635772705078125, 0.0654754638671875, 0.08631515502929688, 0.10715484619140625, 0.12799453735351562, 0.148834228515625, 0.16967391967773438, 0.19051361083984375, 0.21135330200195312, 0.2321929931640625, 0.2530326843261719, 0.27387237548828125, 0.2947120666503906, 0.3155517578125, 0.3363914489746094, 0.35723114013671875, 0.3780708312988281, 0.3989105224609375, 0.4197502136230469, 0.44058990478515625, 0.4614295959472656, 0.482269287109375, 0.5031089782714844, 0.5239486694335938, 0.5447883605957031, 0.5656280517578125, 0.5864677429199219, 0.6073074340820312, 0.6281471252441406, 0.64898681640625, 0.6698265075683594, 0.6906661987304688, 0.7115058898925781, 0.7323455810546875, 0.7531852722167969, 0.7740249633789062, 0.7948646545410156, 0.815704345703125, 0.8365440368652344, 0.8573837280273438, 0.8782234191894531, 0.8990631103515625, 0.9199028015136719, 0.9407424926757812, 0.9615821838378906, 0.982421875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 7.0, 22.0, 75.0, 255.0, 396.0, 175.0, 45.0, 20.0, 5.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.42778491973877, -8.139674186706543, -7.851562976837158, -7.563452243804932, -7.275341033935547, -6.98723030090332, -6.699119567871094, -6.411008834838867, -6.122897624969482, -5.834786891937256, -5.546675682067871, -5.2585649490356445, -4.970454216003418, -4.682343006134033, -4.394232273101807, -4.106121063232422, -3.8180103302001953, -3.5298993587493896, -3.241788387298584, -2.9536776542663574, -2.6655666828155518, -2.377455711364746, -2.0893449783325195, -1.8012340068817139, -1.5131230354309082, -1.2250120639801025, -0.9369012117385864, -0.6487902998924255, -0.36067938804626465, -0.07256841659545898, 0.21554243564605713, 0.5036532878875732, 0.7917652130126953, 1.079876184463501, 1.367987036705017, 1.6560978889465332, 1.9442088603973389, 2.2323198318481445, 2.520430564880371, 2.8085415363311768, 3.0966525077819824, 3.384763479232788, 3.6728744506835938, 3.9609851837158203, 4.249095916748047, 4.537207126617432, 4.825317859649658, 5.113429069519043, 5.4015398025512695, 5.689650535583496, 5.977761745452881, 6.265872478485107, 6.553983688354492, 6.842094421386719, 7.130205154418945, 7.418315887451172, 7.706427097320557, 7.994537830352783, 8.282649040222168, 8.570759773254395, 8.858870506286621, 9.146982192993164, 9.43509292602539, 9.723203659057617, 10.011314392089844]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 2.0, 5.0, 8.0, 9.0, 13.0, 19.0, 28.0, 32.0, 54.0, 55.0, 81.0, 72.0, 60.0, 86.0, 88.0, 71.0, 73.0, 56.0, 53.0, 33.0, 26.0, 28.0, 19.0, 12.0, 9.0, 5.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9469283819198608, -1.8755866289138794, -1.8042447566986084, -1.732903003692627, -1.661561131477356, -1.5902193784713745, -1.5188775062561035, -1.447535753250122, -1.3761940002441406, -1.3048522472381592, -1.2335103750228882, -1.1621686220169067, -1.0908267498016357, -1.0194849967956543, -0.9481431841850281, -0.8768013715744019, -0.8054594993591309, -0.7341176867485046, -0.6627758741378784, -0.591434121131897, -0.520092248916626, -0.44875046610832214, -0.3774086833000183, -0.3060668706893921, -0.23472505807876587, -0.16338324546813965, -0.09204144775867462, -0.020699650049209595, 0.050642162561416626, 0.12198397517204285, 0.19332575798034668, 0.2646675705909729, 0.33600926399230957, 0.4073510766029358, 0.478692889213562, 0.5500346422195435, 0.6213765144348145, 0.6927182674407959, 0.7640600800514221, 0.8354018926620483, 0.9067437052726746, 0.9780855178833008, 1.0494272708892822, 1.1207691431045532, 1.1921108961105347, 1.2634527683258057, 1.334794521331787, 1.4061362743377686, 1.4774781465530396, 1.548819899559021, 1.620161771774292, 1.6915035247802734, 1.7628453969955444, 1.8341871500015259, 1.9055290222167969, 1.9768707752227783, 2.0482125282287598, 2.119554281234741, 2.1908960342407227, 2.262238025665283, 2.3335797786712646, 2.404921531677246, 2.4762632846832275, 2.547605037689209, 2.6189470291137695]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 8.0, 10.0, 13.0, 13.0, 25.0, 25.0, 41.0, 75.0, 94.0, 202.0, 323.0, 635.0, 1252.0, 3218.0, 12596.0, 105910.0, 661141.0, 231879.0, 22999.0, 4623.0, 1640.0, 792.0, 400.0, 217.0, 137.0, 82.0, 74.0, 33.0, 28.0, 24.0, 15.0, 8.0, 6.0, 6.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.8779296875, -1.8267059326171875, -1.775482177734375, -1.7242584228515625, -1.67303466796875, -1.6218109130859375, -1.570587158203125, -1.5193634033203125, -1.4681396484375, -1.4169158935546875, -1.365692138671875, -1.3144683837890625, -1.26324462890625, -1.2120208740234375, -1.160797119140625, -1.1095733642578125, -1.058349609375, -1.0071258544921875, -0.955902099609375, -0.9046783447265625, -0.85345458984375, -0.8022308349609375, -0.751007080078125, -0.6997833251953125, -0.6485595703125, -0.5973358154296875, -0.546112060546875, -0.4948883056640625, -0.44366455078125, -0.3924407958984375, -0.341217041015625, -0.2899932861328125, -0.23876953125, -0.1875457763671875, -0.136322021484375, -0.0850982666015625, -0.03387451171875, 0.0173492431640625, 0.068572998046875, 0.1197967529296875, 0.1710205078125, 0.2222442626953125, 0.273468017578125, 0.3246917724609375, 0.37591552734375, 0.4271392822265625, 0.478363037109375, 0.5295867919921875, 0.580810546875, 0.6320343017578125, 0.683258056640625, 0.7344818115234375, 0.78570556640625, 0.8369293212890625, 0.888153076171875, 0.9393768310546875, 0.9906005859375, 1.0418243408203125, 1.093048095703125, 1.1442718505859375, 1.19549560546875, 1.2467193603515625, 1.297943115234375, 1.3491668701171875, 1.400390625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 5.0, 12.0, 16.0, 22.0, 32.0, 53.0, 73.0, 96.0, 107.0, 125.0, 108.0, 123.0, 69.0, 62.0, 44.0, 19.0, 16.0, 9.0, 8.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2049560546875, -0.1978168487548828, -0.19067764282226562, -0.18353843688964844, -0.17639923095703125, -0.16926002502441406, -0.16212081909179688, -0.1549816131591797, -0.1478424072265625, -0.1407032012939453, -0.13356399536132812, -0.12642478942871094, -0.11928558349609375, -0.11214637756347656, -0.10500717163085938, -0.09786796569824219, -0.090728759765625, -0.08358955383300781, -0.07645034790039062, -0.06931114196777344, -0.06217193603515625, -0.05503273010253906, -0.047893524169921875, -0.04075431823730469, -0.0336151123046875, -0.026475906372070312, -0.019336700439453125, -0.012197494506835938, -0.00505828857421875, 0.0020809173583984375, 0.009220123291015625, 0.016359329223632812, 0.02349853515625, 0.030637741088867188, 0.037776947021484375, 0.04491615295410156, 0.05205535888671875, 0.05919456481933594, 0.06633377075195312, 0.07347297668457031, 0.0806121826171875, 0.08775138854980469, 0.09489059448242188, 0.10202980041503906, 0.10916900634765625, 0.11630821228027344, 0.12344741821289062, 0.1305866241455078, 0.137725830078125, 0.1448650360107422, 0.15200424194335938, 0.15914344787597656, 0.16628265380859375, 0.17342185974121094, 0.18056106567382812, 0.1877002716064453, 0.1948394775390625, 0.2019786834716797, 0.20911788940429688, 0.21625709533691406, 0.22339630126953125, 0.23053550720214844, 0.23767471313476562, 0.2448139190673828, 0.251953125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 6.0, 5.0, 11.0, 9.0, 24.0, 29.0, 40.0, 31.0, 72.0, 86.0, 133.0, 219.0, 309.0, 546.0, 869.0, 1580.0, 3083.0, 6169.0, 13531.0, 30424.0, 69000.0, 144585.0, 243357.0, 249579.0, 151539.0, 72730.0, 32453.0, 14286.0, 6552.0, 3196.0, 1638.0, 915.0, 568.0, 354.0, 206.0, 140.0, 85.0, 52.0, 36.0, 31.0, 27.0, 14.0, 8.0, 8.0, 8.0, 1.0, 5.0, 9.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.416259765625, -0.40402984619140625, -0.3917999267578125, -0.37957000732421875, -0.367340087890625, -0.35511016845703125, -0.3428802490234375, -0.33065032958984375, -0.31842041015625, -0.30619049072265625, -0.2939605712890625, -0.28173065185546875, -0.269500732421875, -0.25727081298828125, -0.2450408935546875, -0.23281097412109375, -0.2205810546875, -0.20835113525390625, -0.1961212158203125, -0.18389129638671875, -0.171661376953125, -0.15943145751953125, -0.1472015380859375, -0.13497161865234375, -0.12274169921875, -0.11051177978515625, -0.0982818603515625, -0.08605194091796875, -0.073822021484375, -0.06159210205078125, -0.0493621826171875, -0.03713226318359375, -0.02490234375, -0.01267242431640625, -0.0004425048828125, 0.01178741455078125, 0.024017333984375, 0.03624725341796875, 0.0484771728515625, 0.06070709228515625, 0.07293701171875, 0.08516693115234375, 0.0973968505859375, 0.10962677001953125, 0.121856689453125, 0.13408660888671875, 0.1463165283203125, 0.15854644775390625, 0.1707763671875, 0.18300628662109375, 0.1952362060546875, 0.20746612548828125, 0.219696044921875, 0.23192596435546875, 0.2441558837890625, 0.25638580322265625, 0.26861572265625, 0.28084564208984375, 0.2930755615234375, 0.30530548095703125, 0.317535400390625, 0.32976531982421875, 0.3419952392578125, 0.35422515869140625, 0.366455078125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 4.0, 3.0, 6.0, 9.0, 6.0, 6.0, 16.0, 23.0, 22.0, 24.0, 27.0, 32.0, 35.0, 39.0, 36.0, 43.0, 33.0, 45.0, 46.0, 37.0, 55.0, 36.0, 38.0, 50.0, 39.0, 41.0, 35.0, 34.0, 33.0, 29.0, 17.0, 17.0, 11.0, 21.0, 12.0, 10.0, 9.0, 9.0, 3.0, 7.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.417724609375, -0.4046974182128906, -0.39167022705078125, -0.3786430358886719, -0.3656158447265625, -0.3525886535644531, -0.33956146240234375, -0.3265342712402344, -0.313507080078125, -0.3004798889160156, -0.28745269775390625, -0.2744255065917969, -0.2613983154296875, -0.24837112426757812, -0.23534393310546875, -0.22231674194335938, -0.20928955078125, -0.19626235961914062, -0.18323516845703125, -0.17020797729492188, -0.1571807861328125, -0.14415359497070312, -0.13112640380859375, -0.11809921264648438, -0.105072021484375, -0.09204483032226562, -0.07901763916015625, -0.06599044799804688, -0.0529632568359375, -0.039936065673828125, -0.02690887451171875, -0.013881683349609375, -0.0008544921875, 0.012172698974609375, 0.02519989013671875, 0.038227081298828125, 0.0512542724609375, 0.06428146362304688, 0.07730865478515625, 0.09033584594726562, 0.103363037109375, 0.11639022827148438, 0.12941741943359375, 0.14244461059570312, 0.1554718017578125, 0.16849899291992188, 0.18152618408203125, 0.19455337524414062, 0.20758056640625, 0.22060775756835938, 0.23363494873046875, 0.24666213989257812, 0.2596893310546875, 0.2727165222167969, 0.28574371337890625, 0.2987709045410156, 0.311798095703125, 0.3248252868652344, 0.33785247802734375, 0.3508796691894531, 0.3639068603515625, 0.3769340515136719, 0.38996124267578125, 0.4029884338378906, 0.416015625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 11.0, 16.0, 23.0, 51.0, 82.0, 113.0, 243.0, 456.0, 1142.0, 3925.0, 20118.0, 170189.0, 639023.0, 185171.0, 21862.0, 3982.0, 1120.0, 478.0, 242.0, 116.0, 82.0, 42.0, 25.0, 12.0, 15.0, 6.0, 6.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.69873046875, -0.6822967529296875, -0.665863037109375, -0.6494293212890625, -0.63299560546875, -0.6165618896484375, -0.600128173828125, -0.5836944580078125, -0.5672607421875, -0.5508270263671875, -0.534393310546875, -0.5179595947265625, -0.50152587890625, -0.4850921630859375, -0.468658447265625, -0.4522247314453125, -0.435791015625, -0.4193572998046875, -0.402923583984375, -0.3864898681640625, -0.37005615234375, -0.3536224365234375, -0.337188720703125, -0.3207550048828125, -0.3043212890625, -0.2878875732421875, -0.271453857421875, -0.2550201416015625, -0.23858642578125, -0.2221527099609375, -0.205718994140625, -0.1892852783203125, -0.1728515625, -0.1564178466796875, -0.139984130859375, -0.1235504150390625, -0.10711669921875, -0.0906829833984375, -0.074249267578125, -0.0578155517578125, -0.0413818359375, -0.0249481201171875, -0.008514404296875, 0.0079193115234375, 0.02435302734375, 0.0407867431640625, 0.057220458984375, 0.0736541748046875, 0.090087890625, 0.1065216064453125, 0.122955322265625, 0.1393890380859375, 0.15582275390625, 0.1722564697265625, 0.188690185546875, 0.2051239013671875, 0.2215576171875, 0.2379913330078125, 0.254425048828125, 0.2708587646484375, 0.28729248046875, 0.3037261962890625, 0.320159912109375, 0.3365936279296875, 0.35302734375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 2.0, 3.0, 2.0, 6.0, 3.0, 2.0, 7.0, 9.0, 13.0, 13.0, 10.0, 26.0, 21.0, 25.0, 30.0, 41.0, 39.0, 40.0, 52.0, 42.0, 57.0, 61.0, 55.0, 63.0, 52.0, 40.0, 43.0, 42.0, 32.0, 25.0, 17.0, 20.0, 20.0, 18.0, 9.0, 16.0, 11.0, 9.0, 7.0, 4.0, 2.0, 2.0, 4.0, 2.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-4.774332046508789e-05, -4.627928137779236e-05, -4.4815242290496826e-05, -4.3351203203201294e-05, -4.188716411590576e-05, -4.042312502861023e-05, -3.89590859413147e-05, -3.7495046854019165e-05, -3.603100776672363e-05, -3.45669686794281e-05, -3.310292959213257e-05, -3.1638890504837036e-05, -3.0174851417541504e-05, -2.871081233024597e-05, -2.724677324295044e-05, -2.5782734155654907e-05, -2.4318695068359375e-05, -2.2854655981063843e-05, -2.139061689376831e-05, -1.992657780647278e-05, -1.8462538719177246e-05, -1.6998499631881714e-05, -1.553446054458618e-05, -1.407042145729065e-05, -1.2606382369995117e-05, -1.1142343282699585e-05, -9.678304195404053e-06, -8.21426510810852e-06, -6.750226020812988e-06, -5.286186933517456e-06, -3.822147846221924e-06, -2.3581087589263916e-06, -8.940696716308594e-07, 5.699694156646729e-07, 2.034008502960205e-06, 3.4980475902557373e-06, 4.9620866775512695e-06, 6.426125764846802e-06, 7.890164852142334e-06, 9.354203939437866e-06, 1.0818243026733398e-05, 1.228228211402893e-05, 1.3746321201324463e-05, 1.5210360288619995e-05, 1.6674399375915527e-05, 1.813843846321106e-05, 1.9602477550506592e-05, 2.1066516637802124e-05, 2.2530555725097656e-05, 2.399459481239319e-05, 2.545863389968872e-05, 2.6922672986984253e-05, 2.8386712074279785e-05, 2.9850751161575317e-05, 3.131479024887085e-05, 3.277882933616638e-05, 3.4242868423461914e-05, 3.5706907510757446e-05, 3.717094659805298e-05, 3.863498568534851e-05, 4.009902477264404e-05, 4.1563063859939575e-05, 4.302710294723511e-05, 4.449114203453064e-05, 4.595518112182617e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 5.0, 2.0, 5.0, 3.0, 15.0, 20.0, 24.0, 40.0, 51.0, 84.0, 170.0, 295.0, 556.0, 1138.0, 2745.0, 7517.0, 26589.0, 117445.0, 406685.0, 360532.0, 92858.0, 21109.0, 6050.0, 2281.0, 1101.0, 495.0, 298.0, 145.0, 112.0, 62.0, 39.0, 31.0, 22.0, 12.0, 5.0, 7.0, 7.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.36572265625, -0.3552513122558594, -0.34477996826171875, -0.3343086242675781, -0.3238372802734375, -0.3133659362792969, -0.30289459228515625, -0.2924232482910156, -0.281951904296875, -0.2714805603027344, -0.26100921630859375, -0.2505378723144531, -0.2400665283203125, -0.22959518432617188, -0.21912384033203125, -0.20865249633789062, -0.19818115234375, -0.18770980834960938, -0.17723846435546875, -0.16676712036132812, -0.1562957763671875, -0.14582443237304688, -0.13535308837890625, -0.12488174438476562, -0.114410400390625, -0.10393905639648438, -0.09346771240234375, -0.08299636840820312, -0.0725250244140625, -0.062053680419921875, -0.05158233642578125, -0.041110992431640625, -0.0306396484375, -0.020168304443359375, -0.00969696044921875, 0.000774383544921875, 0.0112457275390625, 0.021717071533203125, 0.03218841552734375, 0.042659759521484375, 0.053131103515625, 0.06360244750976562, 0.07407379150390625, 0.08454513549804688, 0.0950164794921875, 0.10548782348632812, 0.11595916748046875, 0.12643051147460938, 0.13690185546875, 0.14737319946289062, 0.15784454345703125, 0.16831588745117188, 0.1787872314453125, 0.18925857543945312, 0.19972991943359375, 0.21020126342773438, 0.220672607421875, 0.23114395141601562, 0.24161529541015625, 0.2520866394042969, 0.2625579833984375, 0.2730293273925781, 0.28350067138671875, 0.2939720153808594, 0.304443359375]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 4.0, 2.0, 4.0, 6.0, 10.0, 15.0, 15.0, 28.0, 24.0, 47.0, 52.0, 64.0, 62.0, 98.0, 78.0, 78.0, 69.0, 74.0, 70.0, 38.0, 39.0, 34.0, 25.0, 18.0, 12.0, 12.0, 9.0, 3.0, 6.0, 6.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2213134765625, -0.21305274963378906, -0.20479202270507812, -0.1965312957763672, -0.18827056884765625, -0.1800098419189453, -0.17174911499023438, -0.16348838806152344, -0.1552276611328125, -0.14696693420410156, -0.13870620727539062, -0.1304454803466797, -0.12218475341796875, -0.11392402648925781, -0.10566329956054688, -0.09740257263183594, -0.089141845703125, -0.08088111877441406, -0.07262039184570312, -0.06435966491699219, -0.05609893798828125, -0.04783821105957031, -0.039577484130859375, -0.03131675720214844, -0.0230560302734375, -0.014795303344726562, -0.006534576416015625, 0.0017261505126953125, 0.00998687744140625, 0.018247604370117188, 0.026508331298828125, 0.03476905822753906, 0.04302978515625, 0.05129051208496094, 0.059551239013671875, 0.06781196594238281, 0.07607269287109375, 0.08433341979980469, 0.09259414672851562, 0.10085487365722656, 0.1091156005859375, 0.11737632751464844, 0.12563705444335938, 0.1338977813720703, 0.14215850830078125, 0.1504192352294922, 0.15867996215820312, 0.16694068908691406, 0.175201416015625, 0.18346214294433594, 0.19172286987304688, 0.1999835968017578, 0.20824432373046875, 0.2165050506591797, 0.22476577758789062, 0.23302650451660156, 0.2412872314453125, 0.24954795837402344, 0.2578086853027344, 0.2660694122314453, 0.27433013916015625, 0.2825908660888672, 0.2908515930175781, 0.29911231994628906, 0.307373046875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 12.0, 12.0, 32.0, 67.0, 90.0, 133.0, 171.0, 186.0, 111.0, 78.0, 53.0, 31.0, 14.0, 8.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.09897232055664, -7.904950141906738, -7.710928440093994, -7.516906261444092, -7.322884559631348, -7.128862380981445, -6.934840202331543, -6.740818023681641, -6.5467963218688965, -6.352774143218994, -6.15875244140625, -5.964730262756348, -5.770708084106445, -5.576686382293701, -5.382664203643799, -5.188642501831055, -4.994620323181152, -4.80059814453125, -4.606576442718506, -4.4125542640686035, -4.218532562255859, -4.024510383605957, -3.8304882049560547, -3.6364662647247314, -3.442444324493408, -3.248422384262085, -3.0544004440307617, -2.8603782653808594, -2.666356325149536, -2.472334384918213, -2.2783122062683105, -2.0842902660369873, -1.890268325805664, -1.6962463855743408, -1.502224326133728, -1.3082022666931152, -1.114180326461792, -0.920158326625824, -0.726136326789856, -0.5321142673492432, -0.3380923271179199, -0.1440703272819519, 0.04995167255401611, 0.24397367238998413, 0.43799567222595215, 0.6320176720619202, 0.8260396718978882, 1.020061731338501, 1.2140836715698242, 1.4081056118011475, 1.6021276712417603, 1.796149730682373, 1.9901716709136963, 2.1841936111450195, 2.378215789794922, 2.572237730026245, 2.7662596702575684, 2.9602816104888916, 3.154303550720215, 3.348325729370117, 3.5423476696014404, 3.7363696098327637, 3.930391788482666, 4.12441349029541, 4.3184356689453125]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 4.0, 10.0, 8.0, 9.0, 16.0, 14.0, 15.0, 19.0, 23.0, 21.0, 24.0, 23.0, 36.0, 49.0, 49.0, 38.0, 42.0, 67.0, 56.0, 55.0, 47.0, 46.0, 42.0, 43.0, 46.0, 31.0, 28.0, 31.0, 13.0, 21.0, 19.0, 9.0, 13.0, 7.0, 12.0, 5.0, 6.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8482842445373535, -2.7652475833892822, -2.682210922241211, -2.5991744995117188, -2.5161378383636475, -2.433101177215576, -2.350064516067505, -2.2670278549194336, -2.1839914321899414, -2.10095477104187, -2.017918109893799, -1.934881567955017, -1.8518450260162354, -1.768808364868164, -1.6857717037200928, -1.6027350425720215, -1.5196983814239502, -1.436661720275879, -1.3536251783370972, -1.2705885171890259, -1.1875519752502441, -1.1045153141021729, -1.0214786529541016, -0.938442051410675, -0.8554054498672485, -0.772368848323822, -0.6893322467803955, -0.6062955856323242, -0.5232589840888977, -0.4402223825454712, -0.3571857511997223, -0.2741491198539734, -0.19111251831054688, -0.10807590186595917, -0.02503928542137146, 0.05799733102321625, 0.14103394746780396, 0.22407054901123047, 0.30710718035697937, 0.39014381170272827, 0.4731804132461548, 0.5562170147895813, 0.6392536163330078, 0.7222902774810791, 0.8053268790245056, 0.8883634805679321, 0.9714001417160034, 1.0544366836547852, 1.1374733448028564, 1.2205100059509277, 1.3035465478897095, 1.3865832090377808, 1.4696197509765625, 1.5526564121246338, 1.635693073272705, 1.7187297344207764, 1.801766276359558, 1.8848029375076294, 1.9678394794464111, 2.0508761405944824, 2.1339128017425537, 2.216949462890625, 2.299985885620117, 2.3830225467681885, 2.4660592079162598]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 5.0, 6.0, 4.0, 14.0, 10.0, 20.0, 30.0, 48.0, 61.0, 108.0, 160.0, 361.0, 793.0, 2220.0, 9289.0, 110831.0, 3991566.0, 68126.0, 7455.0, 1782.0, 632.0, 256.0, 154.0, 104.0, 69.0, 53.0, 26.0, 22.0, 13.0, 16.0, 9.0, 5.0, 13.0, 5.0, 3.0, 5.0, 6.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.7939453125, -1.7308502197265625, -1.667755126953125, -1.6046600341796875, -1.54156494140625, -1.4784698486328125, -1.415374755859375, -1.3522796630859375, -1.2891845703125, -1.2260894775390625, -1.162994384765625, -1.0998992919921875, -1.03680419921875, -0.9737091064453125, -0.910614013671875, -0.8475189208984375, -0.784423828125, -0.7213287353515625, -0.658233642578125, -0.5951385498046875, -0.53204345703125, -0.4689483642578125, -0.405853271484375, -0.3427581787109375, -0.2796630859375, -0.2165679931640625, -0.153472900390625, -0.0903778076171875, -0.02728271484375, 0.0358123779296875, 0.098907470703125, 0.1620025634765625, 0.22509765625, 0.2881927490234375, 0.351287841796875, 0.4143829345703125, 0.47747802734375, 0.5405731201171875, 0.603668212890625, 0.6667633056640625, 0.7298583984375, 0.7929534912109375, 0.856048583984375, 0.9191436767578125, 0.98223876953125, 1.0453338623046875, 1.108428955078125, 1.1715240478515625, 1.234619140625, 1.2977142333984375, 1.360809326171875, 1.4239044189453125, 1.48699951171875, 1.5500946044921875, 1.613189697265625, 1.6762847900390625, 1.7393798828125, 1.8024749755859375, 1.865570068359375, 1.9286651611328125, 1.99176025390625, 2.0548553466796875, 2.117950439453125, 2.1810455322265625, 2.244140625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 4.0, 10.0, 9.0, 17.0, 22.0, 29.0, 28.0, 47.0, 53.0, 80.0, 82.0, 103.0, 98.0, 104.0, 74.0, 69.0, 53.0, 31.0, 32.0, 22.0, 14.0, 6.0, 5.0, 5.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.173828125, -0.1680622100830078, -0.16229629516601562, -0.15653038024902344, -0.15076446533203125, -0.14499855041503906, -0.13923263549804688, -0.1334667205810547, -0.1277008056640625, -0.12193489074707031, -0.11616897583007812, -0.11040306091308594, -0.10463714599609375, -0.09887123107910156, -0.09310531616210938, -0.08733940124511719, -0.081573486328125, -0.07580757141113281, -0.07004165649414062, -0.06427574157714844, -0.05850982666015625, -0.05274391174316406, -0.046977996826171875, -0.04121208190917969, -0.0354461669921875, -0.029680252075195312, -0.023914337158203125, -0.018148422241210938, -0.01238250732421875, -0.0066165924072265625, -0.000850677490234375, 0.0049152374267578125, 0.01068115234375, 0.016447067260742188, 0.022212982177734375, 0.027978897094726562, 0.03374481201171875, 0.03951072692871094, 0.045276641845703125, 0.05104255676269531, 0.0568084716796875, 0.06257438659667969, 0.06834030151367188, 0.07410621643066406, 0.07987213134765625, 0.08563804626464844, 0.09140396118164062, 0.09716987609863281, 0.102935791015625, 0.10870170593261719, 0.11446762084960938, 0.12023353576660156, 0.12599945068359375, 0.13176536560058594, 0.13753128051757812, 0.1432971954345703, 0.1490631103515625, 0.1548290252685547, 0.16059494018554688, 0.16636085510253906, 0.17212677001953125, 0.17789268493652344, 0.18365859985351562, 0.1894245147705078, 0.1951904296875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 3.0, 7.0, 4.0, 11.0, 16.0, 16.0, 41.0, 53.0, 81.0, 116.0, 205.0, 323.0, 651.0, 1190.0, 2380.0, 5614.0, 16154.0, 67340.0, 720778.0, 3170027.0, 165150.0, 28746.0, 8435.0, 3368.0, 1547.0, 797.0, 482.0, 254.0, 201.0, 106.0, 71.0, 40.0, 28.0, 18.0, 14.0, 6.0, 1.0, 7.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.83251953125, -0.8058624267578125, -0.779205322265625, -0.7525482177734375, -0.72589111328125, -0.6992340087890625, -0.672576904296875, -0.6459197998046875, -0.6192626953125, -0.5926055908203125, -0.565948486328125, -0.5392913818359375, -0.51263427734375, -0.4859771728515625, -0.459320068359375, -0.4326629638671875, -0.406005859375, -0.3793487548828125, -0.352691650390625, -0.3260345458984375, -0.29937744140625, -0.2727203369140625, -0.246063232421875, -0.2194061279296875, -0.1927490234375, -0.1660919189453125, -0.139434814453125, -0.1127777099609375, -0.08612060546875, -0.0594635009765625, -0.032806396484375, -0.0061492919921875, 0.0205078125, 0.0471649169921875, 0.073822021484375, 0.1004791259765625, 0.12713623046875, 0.1537933349609375, 0.180450439453125, 0.2071075439453125, 0.2337646484375, 0.2604217529296875, 0.287078857421875, 0.3137359619140625, 0.34039306640625, 0.3670501708984375, 0.393707275390625, 0.4203643798828125, 0.447021484375, 0.4736785888671875, 0.500335693359375, 0.5269927978515625, 0.55364990234375, 0.5803070068359375, 0.606964111328125, 0.6336212158203125, 0.6602783203125, 0.6869354248046875, 0.713592529296875, 0.7402496337890625, 0.76690673828125, 0.7935638427734375, 0.820220947265625, 0.8468780517578125, 0.87353515625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 7.0, 3.0, 3.0, 2.0, 6.0, 9.0, 9.0, 20.0, 27.0, 25.0, 41.0, 74.0, 107.0, 184.0, 500.0, 1233.0, 991.0, 381.0, 186.0, 100.0, 70.0, 35.0, 24.0, 12.0, 9.0, 9.0, 9.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2568359375, -0.24691390991210938, -0.23699188232421875, -0.22706985473632812, -0.2171478271484375, -0.20722579956054688, -0.19730377197265625, -0.18738174438476562, -0.177459716796875, -0.16753768920898438, -0.15761566162109375, -0.14769363403320312, -0.1377716064453125, -0.12784957885742188, -0.11792755126953125, -0.10800552368164062, -0.09808349609375, -0.08816146850585938, -0.07823944091796875, -0.06831741333007812, -0.0583953857421875, -0.048473358154296875, -0.03855133056640625, -0.028629302978515625, -0.018707275390625, -0.008785247802734375, 0.00113677978515625, 0.011058807373046875, 0.0209808349609375, 0.030902862548828125, 0.04082489013671875, 0.050746917724609375, 0.0606689453125, 0.07059097290039062, 0.08051300048828125, 0.09043502807617188, 0.1003570556640625, 0.11027908325195312, 0.12020111083984375, 0.13012313842773438, 0.140045166015625, 0.14996719360351562, 0.15988922119140625, 0.16981124877929688, 0.1797332763671875, 0.18965530395507812, 0.19957733154296875, 0.20949935913085938, 0.21942138671875, 0.22934341430664062, 0.23926544189453125, 0.24918746948242188, 0.2591094970703125, 0.2690315246582031, 0.27895355224609375, 0.2888755798339844, 0.298797607421875, 0.3087196350097656, 0.31864166259765625, 0.3285636901855469, 0.3384857177734375, 0.3484077453613281, 0.35832977294921875, 0.3682518005371094, 0.378173828125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 15.0, 28.0, 106.0, 225.0, 327.0, 206.0, 63.0, 26.0, 7.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.445000648498535, -4.303231716156006, -4.161463260650635, -4.0196943283081055, -3.8779256343841553, -3.736156940460205, -3.594388008117676, -3.4526193141937256, -3.3108506202697754, -3.169081926345825, -3.027313232421875, -2.8855443000793457, -2.7437756061553955, -2.6020069122314453, -2.460237979888916, -2.318469285964966, -2.1767005920410156, -2.0349318981170654, -1.8931630849838257, -1.751394271850586, -1.6096255779266357, -1.4678568840026855, -1.3260880708694458, -1.184319257736206, -1.0425505638122559, -0.9007818102836609, -0.7590130567550659, -0.617244303226471, -0.475475549697876, -0.333706796169281, -0.19193804264068604, -0.050169289112091064, 0.0915989875793457, 0.23336774110794067, 0.37513649463653564, 0.5169052481651306, 0.6586740016937256, 0.8004427552223206, 0.9422115087509155, 1.0839803218841553, 1.2257490158081055, 1.3675177097320557, 1.5092865228652954, 1.6510553359985352, 1.7928240299224854, 1.9345927238464355, 2.076361656188965, 2.218130350112915, 2.3598990440368652, 2.5016677379608154, 2.6434364318847656, 2.785205364227295, 2.926974058151245, 3.0687427520751953, 3.2105116844177246, 3.352280378341675, 3.494049072265625, 3.635817766189575, 3.7775864601135254, 3.9193553924560547, 4.061123847961426, 4.202892780303955, 4.344661712646484, 4.4864301681518555, 4.628199100494385]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 2.0, 8.0, 10.0, 8.0, 10.0, 8.0, 11.0, 17.0, 20.0, 21.0, 25.0, 35.0, 50.0, 28.0, 44.0, 43.0, 55.0, 51.0, 53.0, 49.0, 51.0, 53.0, 40.0, 42.0, 21.0, 34.0, 43.0, 28.0, 28.0, 24.0, 13.0, 14.0, 16.0, 13.0, 12.0, 6.0, 9.0, 2.0, 2.0, 3.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.898186981678009, -0.8695569634437561, -0.840927004814148, -0.812296986579895, -0.7836670279502869, -0.7550370097160339, -0.7264070510864258, -0.6977770328521729, -0.6691470146179199, -0.640516996383667, -0.6118870377540588, -0.5832570195198059, -0.5546270608901978, -0.5259970426559448, -0.4973670542240143, -0.46873706579208374, -0.4401070773601532, -0.41147708892822266, -0.3828471004962921, -0.3542171120643616, -0.32558709383010864, -0.2969571053981781, -0.26832711696624756, -0.23969711363315582, -0.21106712520122528, -0.18243713676929474, -0.153807133436203, -0.12517714500427246, -0.09654714912176132, -0.06791715323925018, -0.03928716480731964, -0.010657161474227905, 0.017972826957702637, 0.046602822840213776, 0.07523281872272491, 0.10386280715465546, 0.1324928104877472, 0.16112279891967773, 0.18975278735160828, 0.2183827906847, 0.24701277911663055, 0.2756427824497223, 0.30427277088165283, 0.3329027593135834, 0.3615327477455139, 0.39016276597976685, 0.418792724609375, 0.44742274284362793, 0.47605273127555847, 0.504682719707489, 0.5333127379417419, 0.5619426965713501, 0.590572714805603, 0.619202733039856, 0.6478326916694641, 0.676462709903717, 0.7050926685333252, 0.7337226867675781, 0.7623526453971863, 0.7909826636314392, 0.8196126222610474, 0.8482426404953003, 0.8768726587295532, 0.9055026173591614, 0.9341326355934143]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 9.0, 13.0, 15.0, 12.0, 28.0, 38.0, 47.0, 77.0, 144.0, 204.0, 403.0, 890.0, 2365.0, 9360.0, 83565.0, 650138.0, 270736.0, 23772.0, 4124.0, 1287.0, 569.0, 298.0, 163.0, 94.0, 67.0, 37.0, 33.0, 20.0, 17.0, 9.0, 7.0, 7.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7568359375, -1.70147705078125, -1.6461181640625, -1.59075927734375, -1.535400390625, -1.48004150390625, -1.4246826171875, -1.36932373046875, -1.31396484375, -1.25860595703125, -1.2032470703125, -1.14788818359375, -1.092529296875, -1.03717041015625, -0.9818115234375, -0.92645263671875, -0.87109375, -0.81573486328125, -0.7603759765625, -0.70501708984375, -0.649658203125, -0.59429931640625, -0.5389404296875, -0.48358154296875, -0.42822265625, -0.37286376953125, -0.3175048828125, -0.26214599609375, -0.206787109375, -0.15142822265625, -0.0960693359375, -0.04071044921875, 0.0146484375, 0.07000732421875, 0.1253662109375, 0.18072509765625, 0.236083984375, 0.29144287109375, 0.3468017578125, 0.40216064453125, 0.45751953125, 0.51287841796875, 0.5682373046875, 0.62359619140625, 0.678955078125, 0.73431396484375, 0.7896728515625, 0.84503173828125, 0.900390625, 0.95574951171875, 1.0111083984375, 1.06646728515625, 1.121826171875, 1.17718505859375, 1.2325439453125, 1.28790283203125, 1.34326171875, 1.39862060546875, 1.4539794921875, 1.50933837890625, 1.564697265625, 1.62005615234375, 1.6754150390625, 1.73077392578125, 1.7861328125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 5.0, 7.0, 10.0, 11.0, 15.0, 30.0, 34.0, 27.0, 51.0, 60.0, 65.0, 67.0, 99.0, 86.0, 75.0, 84.0, 74.0, 54.0, 44.0, 28.0, 25.0, 10.0, 9.0, 9.0, 6.0, 6.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.171875, -0.16636085510253906, -0.16084671020507812, -0.1553325653076172, -0.14981842041015625, -0.1443042755126953, -0.13879013061523438, -0.13327598571777344, -0.1277618408203125, -0.12224769592285156, -0.11673355102539062, -0.11121940612792969, -0.10570526123046875, -0.10019111633300781, -0.09467697143554688, -0.08916282653808594, -0.083648681640625, -0.07813453674316406, -0.07262039184570312, -0.06710624694824219, -0.06159210205078125, -0.05607795715332031, -0.050563812255859375, -0.04504966735839844, -0.0395355224609375, -0.03402137756347656, -0.028507232666015625, -0.022993087768554688, -0.01747894287109375, -0.011964797973632812, -0.006450653076171875, -0.0009365081787109375, 0.00457763671875, 0.010091781616210938, 0.015605926513671875, 0.021120071411132812, 0.02663421630859375, 0.03214836120605469, 0.037662506103515625, 0.04317665100097656, 0.0486907958984375, 0.05420494079589844, 0.059719085693359375, 0.06523323059082031, 0.07074737548828125, 0.07626152038574219, 0.08177566528320312, 0.08728981018066406, 0.092803955078125, 0.09831809997558594, 0.10383224487304688, 0.10934638977050781, 0.11486053466796875, 0.12037467956542969, 0.12588882446289062, 0.13140296936035156, 0.1369171142578125, 0.14243125915527344, 0.14794540405273438, 0.1534595489501953, 0.15897369384765625, 0.1644878387451172, 0.17000198364257812, 0.17551612854003906, 0.1810302734375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 7.0, 5.0, 9.0, 18.0, 30.0, 27.0, 36.0, 59.0, 65.0, 103.0, 173.0, 251.0, 434.0, 749.0, 1231.0, 2253.0, 4637.0, 10041.0, 23398.0, 55715.0, 132140.0, 258491.0, 280749.0, 157550.0, 68349.0, 28108.0, 12118.0, 5424.0, 2621.0, 1500.0, 802.0, 486.0, 305.0, 207.0, 140.0, 93.0, 84.0, 40.0, 29.0, 22.0, 17.0, 12.0, 7.0, 6.0, 5.0, 4.0, 2.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.50830078125, -0.4938240051269531, -0.47934722900390625, -0.4648704528808594, -0.4503936767578125, -0.4359169006347656, -0.42144012451171875, -0.4069633483886719, -0.392486572265625, -0.3780097961425781, -0.36353302001953125, -0.3490562438964844, -0.3345794677734375, -0.3201026916503906, -0.30562591552734375, -0.2911491394042969, -0.27667236328125, -0.2621955871582031, -0.24771881103515625, -0.23324203491210938, -0.2187652587890625, -0.20428848266601562, -0.18981170654296875, -0.17533493041992188, -0.160858154296875, -0.14638137817382812, -0.13190460205078125, -0.11742782592773438, -0.1029510498046875, -0.08847427368164062, -0.07399749755859375, -0.059520721435546875, -0.0450439453125, -0.030567169189453125, -0.01609039306640625, -0.001613616943359375, 0.0128631591796875, 0.027339935302734375, 0.04181671142578125, 0.056293487548828125, 0.070770263671875, 0.08524703979492188, 0.09972381591796875, 0.11420059204101562, 0.1286773681640625, 0.14315414428710938, 0.15763092041015625, 0.17210769653320312, 0.18658447265625, 0.20106124877929688, 0.21553802490234375, 0.23001480102539062, 0.2444915771484375, 0.2589683532714844, 0.27344512939453125, 0.2879219055175781, 0.302398681640625, 0.3168754577636719, 0.33135223388671875, 0.3458290100097656, 0.3603057861328125, 0.3747825622558594, 0.38925933837890625, 0.4037361145019531, 0.418212890625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 2.0, 5.0, 3.0, 5.0, 6.0, 10.0, 13.0, 14.0, 19.0, 26.0, 28.0, 16.0, 35.0, 34.0, 29.0, 33.0, 35.0, 43.0, 42.0, 38.0, 51.0, 47.0, 47.0, 48.0, 43.0, 41.0, 53.0, 34.0, 42.0, 23.0, 28.0, 19.0, 18.0, 16.0, 12.0, 7.0, 15.0, 3.0, 6.0, 6.0, 1.0, 1.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.486083984375, -0.4711265563964844, -0.45616912841796875, -0.4412117004394531, -0.4262542724609375, -0.4112968444824219, -0.39633941650390625, -0.3813819885253906, -0.366424560546875, -0.3514671325683594, -0.33650970458984375, -0.3215522766113281, -0.3065948486328125, -0.2916374206542969, -0.27667999267578125, -0.2617225646972656, -0.24676513671875, -0.23180770874023438, -0.21685028076171875, -0.20189285278320312, -0.1869354248046875, -0.17197799682617188, -0.15702056884765625, -0.14206314086914062, -0.127105712890625, -0.11214828491210938, -0.09719085693359375, -0.08223342895507812, -0.0672760009765625, -0.052318572998046875, -0.03736114501953125, -0.022403717041015625, -0.0074462890625, 0.007511138916015625, 0.02246856689453125, 0.037425994873046875, 0.0523834228515625, 0.06734085083007812, 0.08229827880859375, 0.09725570678710938, 0.112213134765625, 0.12717056274414062, 0.14212799072265625, 0.15708541870117188, 0.1720428466796875, 0.18700027465820312, 0.20195770263671875, 0.21691513061523438, 0.23187255859375, 0.24682998657226562, 0.26178741455078125, 0.2767448425292969, 0.2917022705078125, 0.3066596984863281, 0.32161712646484375, 0.3365745544433594, 0.351531982421875, 0.3664894104003906, 0.38144683837890625, 0.3964042663574219, 0.4113616943359375, 0.4263191223144531, 0.44127655029296875, 0.4562339782714844, 0.47119140625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 7.0, 5.0, 20.0, 30.0, 34.0, 74.0, 146.0, 304.0, 724.0, 2074.0, 9897.0, 96603.0, 697332.0, 217942.0, 18652.0, 3040.0, 925.0, 359.0, 175.0, 89.0, 47.0, 32.0, 16.0, 9.0, 11.0, 4.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6044921875, -0.5841064453125, -0.563720703125, -0.5433349609375, -0.52294921875, -0.5025634765625, -0.482177734375, -0.4617919921875, -0.44140625, -0.4210205078125, -0.400634765625, -0.3802490234375, -0.35986328125, -0.3394775390625, -0.319091796875, -0.2987060546875, -0.2783203125, -0.2579345703125, -0.237548828125, -0.2171630859375, -0.19677734375, -0.1763916015625, -0.156005859375, -0.1356201171875, -0.115234375, -0.0948486328125, -0.074462890625, -0.0540771484375, -0.03369140625, -0.0133056640625, 0.007080078125, 0.0274658203125, 0.0478515625, 0.0682373046875, 0.088623046875, 0.1090087890625, 0.12939453125, 0.1497802734375, 0.170166015625, 0.1905517578125, 0.2109375, 0.2313232421875, 0.251708984375, 0.2720947265625, 0.29248046875, 0.3128662109375, 0.333251953125, 0.3536376953125, 0.3740234375, 0.3944091796875, 0.414794921875, 0.4351806640625, 0.45556640625, 0.4759521484375, 0.496337890625, 0.5167236328125, 0.537109375, 0.5574951171875, 0.577880859375, 0.5982666015625, 0.61865234375, 0.6390380859375, 0.659423828125, 0.6798095703125, 0.7001953125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 4.0, 8.0, 12.0, 17.0, 20.0, 40.0, 59.0, 93.0, 160.0, 175.0, 148.0, 98.0, 57.0, 43.0, 28.0, 18.0, 10.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001691579818725586, -0.00016463827341794968, -0.00016011856496334076, -0.00015559885650873184, -0.00015107914805412292, -0.000146559439599514, -0.0001420397311449051, -0.00013752002269029617, -0.00013300031423568726, -0.00012848060578107834, -0.00012396089732646942, -0.0001194411888718605, -0.00011492148041725159, -0.00011040177196264267, -0.00010588206350803375, -0.00010136235505342484, -9.684264659881592e-05, -9.2322938144207e-05, -8.780322968959808e-05, -8.328352123498917e-05, -7.876381278038025e-05, -7.424410432577133e-05, -6.972439587116241e-05, -6.52046874165535e-05, -6.068497896194458e-05, -5.616527050733566e-05, -5.1645562052726746e-05, -4.712585359811783e-05, -4.260614514350891e-05, -3.8086436688899994e-05, -3.356672823429108e-05, -2.904701977968216e-05, -2.4527311325073242e-05, -2.0007602870464325e-05, -1.5487894415855408e-05, -1.096818596124649e-05, -6.448477506637573e-06, -1.928769052028656e-06, 2.5909394025802612e-06, 7.1106478571891785e-06, 1.1630356311798096e-05, 1.6150064766407013e-05, 2.066977322101593e-05, 2.5189481675624847e-05, 2.9709190130233765e-05, 3.422889858484268e-05, 3.87486070394516e-05, 4.3268315494060516e-05, 4.7788023948669434e-05, 5.230773240327835e-05, 5.682744085788727e-05, 6.134714931249619e-05, 6.58668577671051e-05, 7.038656622171402e-05, 7.490627467632294e-05, 7.942598313093185e-05, 8.394569158554077e-05, 8.846540004014969e-05, 9.29851084947586e-05, 9.750481694936752e-05, 0.00010202452540397644, 0.00010654423385858536, 0.00011106394231319427, 0.00011558365076780319, 0.00012010335922241211]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 9.0, 7.0, 12.0, 16.0, 27.0, 39.0, 83.0, 136.0, 243.0, 511.0, 1157.0, 3107.0, 9344.0, 35465.0, 184332.0, 546782.0, 211012.0, 40221.0, 10286.0, 3356.0, 1257.0, 574.0, 250.0, 132.0, 76.0, 45.0, 29.0, 20.0, 9.0, 8.0, 6.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36865234375, -0.3552665710449219, -0.34188079833984375, -0.3284950256347656, -0.3151092529296875, -0.3017234802246094, -0.28833770751953125, -0.2749519348144531, -0.261566162109375, -0.24818038940429688, -0.23479461669921875, -0.22140884399414062, -0.2080230712890625, -0.19463729858398438, -0.18125152587890625, -0.16786575317382812, -0.15447998046875, -0.14109420776367188, -0.12770843505859375, -0.11432266235351562, -0.1009368896484375, -0.08755111694335938, -0.07416534423828125, -0.060779571533203125, -0.047393798828125, -0.034008026123046875, -0.02062225341796875, -0.007236480712890625, 0.0061492919921875, 0.019535064697265625, 0.03292083740234375, 0.046306610107421875, 0.0596923828125, 0.07307815551757812, 0.08646392822265625, 0.09984970092773438, 0.1132354736328125, 0.12662124633789062, 0.14000701904296875, 0.15339279174804688, 0.166778564453125, 0.18016433715820312, 0.19355010986328125, 0.20693588256835938, 0.2203216552734375, 0.23370742797851562, 0.24709320068359375, 0.2604789733886719, 0.27386474609375, 0.2872505187988281, 0.30063629150390625, 0.3140220642089844, 0.3274078369140625, 0.3407936096191406, 0.35417938232421875, 0.3675651550292969, 0.380950927734375, 0.3943367004394531, 0.40772247314453125, 0.4211082458496094, 0.4344940185546875, 0.4478797912597656, 0.46126556396484375, 0.4746513366699219, 0.488037109375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 2.0, 9.0, 7.0, 7.0, 12.0, 15.0, 30.0, 33.0, 45.0, 48.0, 65.0, 97.0, 108.0, 100.0, 94.0, 85.0, 69.0, 50.0, 37.0, 28.0, 18.0, 10.0, 12.0, 5.0, 4.0, 5.0, 5.0, 3.0, 2.0, 3.0, 0.0, 1.0], "bins": [-0.51416015625, -0.5027713775634766, -0.4913825988769531, -0.4799938201904297, -0.46860504150390625, -0.4572162628173828, -0.4458274841308594, -0.43443870544433594, -0.4230499267578125, -0.41166114807128906, -0.4002723693847656, -0.3888835906982422, -0.37749481201171875, -0.3661060333251953, -0.3547172546386719, -0.34332847595214844, -0.331939697265625, -0.32055091857910156, -0.3091621398925781, -0.2977733612060547, -0.28638458251953125, -0.2749958038330078, -0.2636070251464844, -0.25221824645996094, -0.2408294677734375, -0.22944068908691406, -0.21805191040039062, -0.2066631317138672, -0.19527435302734375, -0.1838855743408203, -0.17249679565429688, -0.16110801696777344, -0.14971923828125, -0.13833045959472656, -0.12694168090820312, -0.11555290222167969, -0.10416412353515625, -0.09277534484863281, -0.08138656616210938, -0.06999778747558594, -0.0586090087890625, -0.04722023010253906, -0.035831451416015625, -0.024442672729492188, -0.01305389404296875, -0.0016651153564453125, 0.009723663330078125, 0.021112442016601562, 0.032501220703125, 0.04388999938964844, 0.055278778076171875, 0.06666755676269531, 0.07805633544921875, 0.08944511413574219, 0.10083389282226562, 0.11222267150878906, 0.1236114501953125, 0.13500022888183594, 0.14638900756835938, 0.1577777862548828, 0.16916656494140625, 0.1805553436279297, 0.19194412231445312, 0.20333290100097656, 0.2147216796875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 6.0, 11.0, 33.0, 73.0, 161.0, 242.0, 237.0, 129.0, 76.0, 28.0, 7.0, 4.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.384471893310547, -12.057840347290039, -11.731209754943848, -11.40457820892334, -11.077946662902832, -10.751315116882324, -10.424684524536133, -10.098052978515625, -9.771421432495117, -9.44478988647461, -9.118159294128418, -8.79152774810791, -8.464896202087402, -8.138264656066895, -7.811634063720703, -7.485002517700195, -7.158371448516846, -6.831740379333496, -6.505108833312988, -6.178477764129639, -5.851846218109131, -5.525215148925781, -5.198583602905273, -4.871952533721924, -4.545321464538574, -4.218690395355225, -3.892058849334717, -3.565427780151367, -3.2387962341308594, -2.9121651649475098, -2.585533857345581, -2.2589025497436523, -1.9322710037231445, -1.6056396961212158, -1.279008388519287, -0.952377200126648, -0.6257458925247192, -0.2991145849227905, 0.027516603469848633, 0.35414791107177734, 0.680779218673706, 1.0074105262756348, 1.3340418338775635, 1.6606730222702026, 1.9873043298721313, 2.3139357566833496, 2.640566825866699, 2.967198133468628, 3.2938294410705566, 3.6204607486724854, 3.947092056274414, 4.273723125457764, 4.6003546714782715, 4.926985740661621, 5.253617286682129, 5.5802483558654785, 5.906879425048828, 6.233510494232178, 6.5601420402526855, 6.886773109436035, 7.213404655456543, 7.540035724639893, 7.866666793823242, 8.19329833984375, 8.519929885864258]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 1.0, 5.0, 8.0, 9.0, 6.0, 11.0, 8.0, 21.0, 27.0, 29.0, 31.0, 32.0, 37.0, 34.0, 42.0, 47.0, 43.0, 41.0, 53.0, 46.0, 45.0, 41.0, 54.0, 48.0, 45.0, 45.0, 20.0, 31.0, 21.0, 19.0, 18.0, 13.0, 18.0, 8.0, 15.0, 6.0, 6.0, 4.0, 5.0, 1.0, 7.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.027097702026367, -2.935706853866577, -2.844316005706787, -2.752925157546997, -2.661534309387207, -2.570143699645996, -2.478752851486206, -2.387362003326416, -2.295971155166626, -2.204580307006836, -2.113189458847046, -2.021798610687256, -1.9304078817367554, -1.8390170335769653, -1.7476263046264648, -1.6562354564666748, -1.5648446083068848, -1.4734537601470947, -1.3820629119873047, -1.2906721830368042, -1.1992813348770142, -1.1078904867172241, -1.0164997577667236, -0.9251089096069336, -0.8337180614471436, -0.7423272132873535, -0.6509364247322083, -0.559545636177063, -0.46815478801727295, -0.3767639696598053, -0.28537315130233765, -0.19398236274719238, -0.10259175300598145, -0.011200934648513794, 0.08018988370895386, 0.1715807020664215, 0.26297152042388916, 0.3543623387813568, 0.44575315713882446, 0.5371439456939697, 0.6285347938537598, 0.7199256420135498, 0.8113164305686951, 0.9027072191238403, 0.9940980672836304, 1.0854889154434204, 1.176879644393921, 1.268270492553711, 1.359661340713501, 1.451052188873291, 1.542443037033081, 1.6338337659835815, 1.7252246141433716, 1.8166154623031616, 1.908006191253662, 1.9993970394134521, 2.090787887573242, 2.1821787357330322, 2.2735695838928223, 2.3649604320526123, 2.4563512802124023, 2.5477418899536133, 2.6391327381134033, 2.7305235862731934, 2.8219144344329834]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 1.0, 1.0, 3.0, 2.0, 7.0, 5.0, 14.0, 18.0, 15.0, 25.0, 38.0, 78.0, 88.0, 128.0, 235.0, 411.0, 894.0, 2292.0, 6879.0, 35716.0, 1520181.0, 2576214.0, 39744.0, 7089.0, 2156.0, 921.0, 393.0, 237.0, 147.0, 102.0, 55.0, 29.0, 28.0, 21.0, 26.0, 21.0, 17.0, 9.0, 5.0, 5.0, 9.0, 4.0, 8.0, 7.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-1.3623046875, -1.3118896484375, -1.261474609375, -1.2110595703125, -1.16064453125, -1.1102294921875, -1.059814453125, -1.0093994140625, -0.958984375, -0.9085693359375, -0.858154296875, -0.8077392578125, -0.75732421875, -0.7069091796875, -0.656494140625, -0.6060791015625, -0.5556640625, -0.5052490234375, -0.454833984375, -0.4044189453125, -0.35400390625, -0.3035888671875, -0.253173828125, -0.2027587890625, -0.15234375, -0.1019287109375, -0.051513671875, -0.0010986328125, 0.04931640625, 0.0997314453125, 0.150146484375, 0.2005615234375, 0.2509765625, 0.3013916015625, 0.351806640625, 0.4022216796875, 0.45263671875, 0.5030517578125, 0.553466796875, 0.6038818359375, 0.654296875, 0.7047119140625, 0.755126953125, 0.8055419921875, 0.85595703125, 0.9063720703125, 0.956787109375, 1.0072021484375, 1.0576171875, 1.1080322265625, 1.158447265625, 1.2088623046875, 1.25927734375, 1.3096923828125, 1.360107421875, 1.4105224609375, 1.4609375, 1.5113525390625, 1.561767578125, 1.6121826171875, 1.66259765625, 1.7130126953125, 1.763427734375, 1.8138427734375, 1.8642578125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 11.0, 11.0, 12.0, 13.0, 16.0, 26.0, 34.0, 45.0, 60.0, 63.0, 69.0, 79.0, 77.0, 77.0, 81.0, 72.0, 61.0, 32.0, 40.0, 42.0, 25.0, 21.0, 15.0, 5.0, 4.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.206787109375, -0.2008342742919922, -0.19488143920898438, -0.18892860412597656, -0.18297576904296875, -0.17702293395996094, -0.17107009887695312, -0.1651172637939453, -0.1591644287109375, -0.1532115936279297, -0.14725875854492188, -0.14130592346191406, -0.13535308837890625, -0.12940025329589844, -0.12344741821289062, -0.11749458312988281, -0.111541748046875, -0.10558891296386719, -0.09963607788085938, -0.09368324279785156, -0.08773040771484375, -0.08177757263183594, -0.07582473754882812, -0.06987190246582031, -0.0639190673828125, -0.05796623229980469, -0.052013397216796875, -0.04606056213378906, -0.04010772705078125, -0.03415489196777344, -0.028202056884765625, -0.022249221801757812, -0.01629638671875, -0.010343551635742188, -0.004390716552734375, 0.0015621185302734375, 0.00751495361328125, 0.013467788696289062, 0.019420623779296875, 0.025373458862304688, 0.0313262939453125, 0.03727912902832031, 0.043231964111328125, 0.04918479919433594, 0.05513763427734375, 0.06109046936035156, 0.06704330444335938, 0.07299613952636719, 0.078948974609375, 0.08490180969238281, 0.09085464477539062, 0.09680747985839844, 0.10276031494140625, 0.10871315002441406, 0.11466598510742188, 0.12061882019042969, 0.1265716552734375, 0.1325244903564453, 0.13847732543945312, 0.14443016052246094, 0.15038299560546875, 0.15633583068847656, 0.16228866577148438, 0.1682415008544922, 0.1741943359375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 5.0, 3.0, 8.0, 15.0, 19.0, 29.0, 47.0, 60.0, 94.0, 141.0, 219.0, 410.0, 790.0, 1706.0, 4411.0, 13292.0, 53741.0, 480828.0, 3385990.0, 205006.0, 32497.0, 8986.0, 3174.0, 1344.0, 606.0, 332.0, 192.0, 131.0, 69.0, 41.0, 26.0, 28.0, 15.0, 8.0, 7.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.99951171875, -0.9695358276367188, -0.9395599365234375, -0.9095840454101562, -0.879608154296875, -0.8496322631835938, -0.8196563720703125, -0.7896804809570312, -0.75970458984375, -0.7297286987304688, -0.6997528076171875, -0.6697769165039062, -0.639801025390625, -0.6098251342773438, -0.5798492431640625, -0.5498733520507812, -0.5198974609375, -0.48992156982421875, -0.4599456787109375, -0.42996978759765625, -0.399993896484375, -0.37001800537109375, -0.3400421142578125, -0.31006622314453125, -0.28009033203125, -0.25011444091796875, -0.2201385498046875, -0.19016265869140625, -0.160186767578125, -0.13021087646484375, -0.1002349853515625, -0.07025909423828125, -0.040283203125, -0.01030731201171875, 0.0196685791015625, 0.04964447021484375, 0.079620361328125, 0.10959625244140625, 0.1395721435546875, 0.16954803466796875, 0.19952392578125, 0.22949981689453125, 0.2594757080078125, 0.28945159912109375, 0.319427490234375, 0.34940338134765625, 0.3793792724609375, 0.40935516357421875, 0.4393310546875, 0.46930694580078125, 0.4992828369140625, 0.5292587280273438, 0.559234619140625, 0.5892105102539062, 0.6191864013671875, 0.6491622924804688, 0.67913818359375, 0.7091140747070312, 0.7390899658203125, 0.7690658569335938, 0.799041748046875, 0.8290176391601562, 0.8589935302734375, 0.8889694213867188, 0.9189453125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 9.0, 8.0, 3.0, 11.0, 11.0, 23.0, 23.0, 45.0, 56.0, 107.0, 195.0, 423.0, 1112.0, 1133.0, 436.0, 204.0, 112.0, 53.0, 38.0, 23.0, 14.0, 15.0, 7.0, 1.0, 1.0, 5.0, 7.0, 0.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43408203125, -0.4213218688964844, -0.40856170654296875, -0.3958015441894531, -0.3830413818359375, -0.3702812194824219, -0.35752105712890625, -0.3447608947753906, -0.332000732421875, -0.3192405700683594, -0.30648040771484375, -0.2937202453613281, -0.2809600830078125, -0.2681999206542969, -0.25543975830078125, -0.24267959594726562, -0.22991943359375, -0.21715927124023438, -0.20439910888671875, -0.19163894653320312, -0.1788787841796875, -0.16611862182617188, -0.15335845947265625, -0.14059829711914062, -0.127838134765625, -0.11507797241210938, -0.10231781005859375, -0.08955764770507812, -0.0767974853515625, -0.06403732299804688, -0.05127716064453125, -0.038516998291015625, -0.0257568359375, -0.012996673583984375, -0.00023651123046875, 0.012523651123046875, 0.0252838134765625, 0.038043975830078125, 0.05080413818359375, 0.06356430053710938, 0.076324462890625, 0.08908462524414062, 0.10184478759765625, 0.11460494995117188, 0.1273651123046875, 0.14012527465820312, 0.15288543701171875, 0.16564559936523438, 0.17840576171875, 0.19116592407226562, 0.20392608642578125, 0.21668624877929688, 0.2294464111328125, 0.24220657348632812, 0.25496673583984375, 0.2677268981933594, 0.280487060546875, 0.2932472229003906, 0.30600738525390625, 0.3187675476074219, 0.3315277099609375, 0.3442878723144531, 0.35704803466796875, 0.3698081970214844, 0.382568359375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 2.0, 4.0, 9.0, 18.0, 41.0, 78.0, 128.0, 177.0, 191.0, 153.0, 99.0, 52.0, 24.0, 12.0, 8.0, 1.0, 2.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.024954795837402, -3.914379358291626, -3.8038036823272705, -3.693228244781494, -3.5826528072357178, -3.4720771312713623, -3.361501693725586, -3.2509260177612305, -3.140350580215454, -3.0297751426696777, -2.9191994667053223, -2.808624029159546, -2.6980485916137695, -2.587472915649414, -2.4768974781036377, -2.3663220405578613, -2.255746364593506, -2.1451709270477295, -2.034595251083374, -1.9240198135375977, -1.8134442567825317, -1.7028687000274658, -1.5922932624816895, -1.4817177057266235, -1.3711423873901367, -1.2605668306350708, -1.1499913930892944, -1.0394158363342285, -0.9288402795791626, -0.8182647824287415, -0.7076892852783203, -0.5971137285232544, -0.4865381717681885, -0.37596264481544495, -0.2653871178627014, -0.15481162071228027, -0.04423609375953674, 0.06633943319320679, 0.17691493034362793, 0.28749048709869385, 0.398065984249115, 0.5086414813995361, 0.619217038154602, 0.7297925353050232, 0.8403680324554443, 0.9509435892105103, 1.0615191459655762, 1.1720945835113525, 1.2826701402664185, 1.3932456970214844, 1.5038211345672607, 1.6143966913223267, 1.7249722480773926, 1.835547685623169, 1.9461232423782349, 2.056698799133301, 2.167274236679077, 2.2778496742248535, 2.388425350189209, 2.4990007877349854, 2.6095762252807617, 2.720151901245117, 2.8307273387908936, 2.94130277633667, 3.0518784523010254]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 2.0, 6.0, 5.0, 14.0, 9.0, 22.0, 28.0, 30.0, 35.0, 39.0, 43.0, 53.0, 56.0, 48.0, 63.0, 59.0, 63.0, 55.0, 62.0, 60.0, 51.0, 42.0, 40.0, 33.0, 19.0, 18.0, 20.0, 11.0, 7.0, 8.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0796396732330322, -1.031628131866455, -0.9836165904998779, -0.9356050491333008, -0.8875934481620789, -0.8395819067955017, -0.7915703654289246, -0.7435587644577026, -0.6955472230911255, -0.6475356817245483, -0.5995241403579712, -0.551512598991394, -0.5035009980201721, -0.45548945665359497, -0.4074779152870178, -0.3594663441181183, -0.3114548325538635, -0.2634432911872864, -0.21543172001838684, -0.1674201786518097, -0.11940862238407135, -0.07139706611633301, -0.02338552474975586, 0.024626046419143677, 0.07263758778572083, 0.12064914405345917, 0.1686607003211975, 0.21667224168777466, 0.2646837830543518, 0.31269535422325134, 0.3607068955898285, 0.408718466758728, 0.4567300081253052, 0.5047415494918823, 0.5527530908584595, 0.6007646322250366, 0.6487762331962585, 0.6967877745628357, 0.7447993159294128, 0.7928109169006348, 0.8408224582672119, 0.8888339996337891, 0.9368455410003662, 0.9848570823669434, 1.0328686237335205, 1.0808801651000977, 1.1288917064666748, 1.1769033670425415, 1.224914789199829, 1.2729263305664062, 1.3209378719329834, 1.3689494132995605, 1.4169609546661377, 1.4649724960327148, 1.512984037399292, 1.5609956979751587, 1.6090072393417358, 1.657018780708313, 1.7050303220748901, 1.7530418634414673, 1.8010534048080444, 1.8490650653839111, 1.8970766067504883, 1.9450881481170654, 1.9930996894836426]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 5.0, 8.0, 6.0, 6.0, 14.0, 21.0, 30.0, 81.0, 171.0, 351.0, 895.0, 3978.0, 42085.0, 829365.0, 160761.0, 8287.0, 1573.0, 490.0, 177.0, 105.0, 58.0, 26.0, 25.0, 11.0, 9.0, 6.0, 6.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.09375, -3.0137939453125, -2.933837890625, -2.8538818359375, -2.77392578125, -2.6939697265625, -2.614013671875, -2.5340576171875, -2.4541015625, -2.3741455078125, -2.294189453125, -2.2142333984375, -2.13427734375, -2.0543212890625, -1.974365234375, -1.8944091796875, -1.814453125, -1.7344970703125, -1.654541015625, -1.5745849609375, -1.49462890625, -1.4146728515625, -1.334716796875, -1.2547607421875, -1.1748046875, -1.0948486328125, -1.014892578125, -0.9349365234375, -0.85498046875, -0.7750244140625, -0.695068359375, -0.6151123046875, -0.53515625, -0.4552001953125, -0.375244140625, -0.2952880859375, -0.21533203125, -0.1353759765625, -0.055419921875, 0.0245361328125, 0.1044921875, 0.1844482421875, 0.264404296875, 0.3443603515625, 0.42431640625, 0.5042724609375, 0.584228515625, 0.6641845703125, 0.744140625, 0.8240966796875, 0.904052734375, 0.9840087890625, 1.06396484375, 1.1439208984375, 1.223876953125, 1.3038330078125, 1.3837890625, 1.4637451171875, 1.543701171875, 1.6236572265625, 1.70361328125, 1.7835693359375, 1.863525390625, 1.9434814453125, 2.0234375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 4.0, 4.0, 12.0, 9.0, 9.0, 18.0, 21.0, 29.0, 36.0, 45.0, 43.0, 50.0, 58.0, 64.0, 76.0, 58.0, 66.0, 52.0, 63.0, 49.0, 43.0, 43.0, 34.0, 16.0, 23.0, 23.0, 15.0, 13.0, 10.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.151611328125, -0.14647293090820312, -0.14133453369140625, -0.13619613647460938, -0.1310577392578125, -0.12591934204101562, -0.12078094482421875, -0.11564254760742188, -0.110504150390625, -0.10536575317382812, -0.10022735595703125, -0.09508895874023438, -0.0899505615234375, -0.08481216430664062, -0.07967376708984375, -0.07453536987304688, -0.06939697265625, -0.06425857543945312, -0.05912017822265625, -0.053981781005859375, -0.0488433837890625, -0.043704986572265625, -0.03856658935546875, -0.033428192138671875, -0.028289794921875, -0.023151397705078125, -0.01801300048828125, -0.012874603271484375, -0.0077362060546875, -0.002597808837890625, 0.00254058837890625, 0.007678985595703125, 0.0128173828125, 0.017955780029296875, 0.02309417724609375, 0.028232574462890625, 0.0333709716796875, 0.038509368896484375, 0.04364776611328125, 0.048786163330078125, 0.053924560546875, 0.059062957763671875, 0.06420135498046875, 0.06933975219726562, 0.0744781494140625, 0.07961654663085938, 0.08475494384765625, 0.08989334106445312, 0.09503173828125, 0.10017013549804688, 0.10530853271484375, 0.11044692993164062, 0.1155853271484375, 0.12072372436523438, 0.12586212158203125, 0.13100051879882812, 0.136138916015625, 0.14127731323242188, 0.14641571044921875, 0.15155410766601562, 0.1566925048828125, 0.16183090209960938, 0.16696929931640625, 0.17210769653320312, 0.17724609375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 5.0, 4.0, 10.0, 7.0, 11.0, 17.0, 18.0, 37.0, 40.0, 56.0, 85.0, 106.0, 152.0, 269.0, 380.0, 622.0, 1118.0, 2135.0, 4391.0, 10197.0, 25462.0, 68735.0, 192506.0, 377285.0, 229317.0, 82264.0, 30556.0, 11846.0, 5099.0, 2536.0, 1281.0, 721.0, 399.0, 265.0, 163.0, 124.0, 92.0, 64.0, 50.0, 38.0, 29.0, 19.0, 16.0, 11.0, 2.0, 7.0, 10.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4580078125, -0.4407806396484375, -0.423553466796875, -0.4063262939453125, -0.38909912109375, -0.3718719482421875, -0.354644775390625, -0.3374176025390625, -0.3201904296875, -0.3029632568359375, -0.285736083984375, -0.2685089111328125, -0.25128173828125, -0.2340545654296875, -0.216827392578125, -0.1996002197265625, -0.182373046875, -0.1651458740234375, -0.147918701171875, -0.1306915283203125, -0.11346435546875, -0.0962371826171875, -0.079010009765625, -0.0617828369140625, -0.0445556640625, -0.0273284912109375, -0.010101318359375, 0.0071258544921875, 0.02435302734375, 0.0415802001953125, 0.058807373046875, 0.0760345458984375, 0.09326171875, 0.1104888916015625, 0.127716064453125, 0.1449432373046875, 0.16217041015625, 0.1793975830078125, 0.196624755859375, 0.2138519287109375, 0.2310791015625, 0.2483062744140625, 0.265533447265625, 0.2827606201171875, 0.29998779296875, 0.3172149658203125, 0.334442138671875, 0.3516693115234375, 0.368896484375, 0.3861236572265625, 0.403350830078125, 0.4205780029296875, 0.43780517578125, 0.4550323486328125, 0.472259521484375, 0.4894866943359375, 0.5067138671875, 0.5239410400390625, 0.541168212890625, 0.5583953857421875, 0.57562255859375, 0.5928497314453125, 0.610076904296875, 0.6273040771484375, 0.64453125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 4.0, 6.0, 5.0, 3.0, 5.0, 7.0, 8.0, 10.0, 12.0, 14.0, 13.0, 18.0, 22.0, 30.0, 23.0, 32.0, 36.0, 40.0, 43.0, 41.0, 44.0, 56.0, 49.0, 42.0, 39.0, 45.0, 50.0, 44.0, 34.0, 29.0, 33.0, 29.0, 21.0, 19.0, 17.0, 14.0, 10.0, 10.0, 13.0, 15.0, 6.0, 5.0, 4.0, 2.0, 6.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.552734375, -0.5361099243164062, -0.5194854736328125, -0.5028610229492188, -0.486236572265625, -0.46961212158203125, -0.4529876708984375, -0.43636322021484375, -0.41973876953125, -0.40311431884765625, -0.3864898681640625, -0.36986541748046875, -0.353240966796875, -0.33661651611328125, -0.3199920654296875, -0.30336761474609375, -0.2867431640625, -0.27011871337890625, -0.2534942626953125, -0.23686981201171875, -0.220245361328125, -0.20362091064453125, -0.1869964599609375, -0.17037200927734375, -0.15374755859375, -0.13712310791015625, -0.1204986572265625, -0.10387420654296875, -0.087249755859375, -0.07062530517578125, -0.0540008544921875, -0.03737640380859375, -0.020751953125, -0.00412750244140625, 0.0124969482421875, 0.02912139892578125, 0.045745849609375, 0.06237030029296875, 0.0789947509765625, 0.09561920166015625, 0.11224365234375, 0.12886810302734375, 0.1454925537109375, 0.16211700439453125, 0.178741455078125, 0.19536590576171875, 0.2119903564453125, 0.22861480712890625, 0.2452392578125, 0.26186370849609375, 0.2784881591796875, 0.29511260986328125, 0.311737060546875, 0.32836151123046875, 0.3449859619140625, 0.36161041259765625, 0.37823486328125, 0.39485931396484375, 0.4114837646484375, 0.42810821533203125, 0.444732666015625, 0.46135711669921875, 0.4779815673828125, 0.49460601806640625, 0.51123046875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 9.0, 13.0, 36.0, 40.0, 75.0, 248.0, 613.0, 2343.0, 17963.0, 639095.0, 373130.0, 12323.0, 1843.0, 462.0, 192.0, 76.0, 43.0, 22.0, 7.0, 9.0, 3.0, 3.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7822265625, -0.7508392333984375, -0.719451904296875, -0.6880645751953125, -0.65667724609375, -0.6252899169921875, -0.593902587890625, -0.5625152587890625, -0.5311279296875, -0.4997406005859375, -0.468353271484375, -0.4369659423828125, -0.40557861328125, -0.3741912841796875, -0.342803955078125, -0.3114166259765625, -0.280029296875, -0.2486419677734375, -0.217254638671875, -0.1858673095703125, -0.15447998046875, -0.1230926513671875, -0.091705322265625, -0.0603179931640625, -0.0289306640625, 0.0024566650390625, 0.033843994140625, 0.0652313232421875, 0.09661865234375, 0.1280059814453125, 0.159393310546875, 0.1907806396484375, 0.22216796875, 0.2535552978515625, 0.284942626953125, 0.3163299560546875, 0.34771728515625, 0.3791046142578125, 0.410491943359375, 0.4418792724609375, 0.4732666015625, 0.5046539306640625, 0.536041259765625, 0.5674285888671875, 0.59881591796875, 0.6302032470703125, 0.661590576171875, 0.6929779052734375, 0.724365234375, 0.7557525634765625, 0.787139892578125, 0.8185272216796875, 0.84991455078125, 0.8813018798828125, 0.912689208984375, 0.9440765380859375, 0.9754638671875, 1.0068511962890625, 1.038238525390625, 1.0696258544921875, 1.10101318359375, 1.1324005126953125, 1.163787841796875, 1.1951751708984375, 1.2265625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 4.0, 0.0, 2.0, 4.0, 1.0, 2.0, 8.0, 7.0, 7.0, 18.0, 12.0, 22.0, 29.0, 40.0, 65.0, 69.0, 103.0, 119.0, 136.0, 114.0, 75.0, 56.0, 37.0, 22.0, 17.0, 9.0, 12.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00010758638381958008, -0.00010449253022670746, -0.00010139867663383484, -9.830482304096222e-05, -9.52109694480896e-05, -9.211711585521698e-05, -8.902326226234436e-05, -8.592940866947174e-05, -8.283555507659912e-05, -7.97417014837265e-05, -7.664784789085388e-05, -7.355399429798126e-05, -7.046014070510864e-05, -6.736628711223602e-05, -6.42724335193634e-05, -6.117857992649078e-05, -5.8084726333618164e-05, -5.4990872740745544e-05, -5.1897019147872925e-05, -4.8803165555000305e-05, -4.5709311962127686e-05, -4.2615458369255066e-05, -3.9521604776382446e-05, -3.642775118350983e-05, -3.333389759063721e-05, -3.0240043997764587e-05, -2.7146190404891968e-05, -2.4052336812019348e-05, -2.095848321914673e-05, -1.786462962627411e-05, -1.477077603340149e-05, -1.167692244052887e-05, -8.58306884765625e-06, -5.48921525478363e-06, -2.3953616619110107e-06, 6.984919309616089e-07, 3.7923455238342285e-06, 6.886199116706848e-06, 9.980052709579468e-06, 1.3073906302452087e-05, 1.6167759895324707e-05, 1.9261613488197327e-05, 2.2355467081069946e-05, 2.5449320673942566e-05, 2.8543174266815186e-05, 3.1637027859687805e-05, 3.4730881452560425e-05, 3.7824735045433044e-05, 4.0918588638305664e-05, 4.4012442231178284e-05, 4.71062958240509e-05, 5.020014941692352e-05, 5.329400300979614e-05, 5.638785660266876e-05, 5.948171019554138e-05, 6.2575563788414e-05, 6.566941738128662e-05, 6.876327097415924e-05, 7.185712456703186e-05, 7.495097815990448e-05, 7.80448317527771e-05, 8.113868534564972e-05, 8.423253893852234e-05, 8.732639253139496e-05, 9.042024612426758e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 10.0, 20.0, 47.0, 87.0, 188.0, 568.0, 3607.0, 134377.0, 898353.0, 9863.0, 959.0, 272.0, 102.0, 58.0, 17.0, 18.0, 6.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.39453125, -1.341278076171875, -1.28802490234375, -1.234771728515625, -1.1815185546875, -1.128265380859375, -1.07501220703125, -1.021759033203125, -0.968505859375, -0.915252685546875, -0.86199951171875, -0.808746337890625, -0.7554931640625, -0.702239990234375, -0.64898681640625, -0.595733642578125, -0.54248046875, -0.489227294921875, -0.43597412109375, -0.382720947265625, -0.3294677734375, -0.276214599609375, -0.22296142578125, -0.169708251953125, -0.116455078125, -0.063201904296875, -0.00994873046875, 0.043304443359375, 0.0965576171875, 0.149810791015625, 0.20306396484375, 0.256317138671875, 0.3095703125, 0.362823486328125, 0.41607666015625, 0.469329833984375, 0.5225830078125, 0.575836181640625, 0.62908935546875, 0.682342529296875, 0.735595703125, 0.788848876953125, 0.84210205078125, 0.895355224609375, 0.9486083984375, 1.001861572265625, 1.05511474609375, 1.108367919921875, 1.16162109375, 1.214874267578125, 1.26812744140625, 1.321380615234375, 1.3746337890625, 1.427886962890625, 1.48114013671875, 1.534393310546875, 1.587646484375, 1.640899658203125, 1.69415283203125, 1.747406005859375, 1.8006591796875, 1.853912353515625, 1.90716552734375, 1.960418701171875, 2.013671875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 5.0, 8.0, 12.0, 18.0, 45.0, 79.0, 174.0, 245.0, 201.0, 103.0, 46.0, 30.0, 11.0, 15.0, 4.0, 6.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6845703125, -0.6588821411132812, -0.6331939697265625, -0.6075057983398438, -0.581817626953125, -0.5561294555664062, -0.5304412841796875, -0.5047531127929688, -0.47906494140625, -0.45337677001953125, -0.4276885986328125, -0.40200042724609375, -0.376312255859375, -0.35062408447265625, -0.3249359130859375, -0.29924774169921875, -0.2735595703125, -0.24787139892578125, -0.2221832275390625, -0.19649505615234375, -0.170806884765625, -0.14511871337890625, -0.1194305419921875, -0.09374237060546875, -0.06805419921875, -0.04236602783203125, -0.0166778564453125, 0.00901031494140625, 0.034698486328125, 0.06038665771484375, 0.0860748291015625, 0.11176300048828125, 0.137451171875, 0.16313934326171875, 0.1888275146484375, 0.21451568603515625, 0.240203857421875, 0.26589202880859375, 0.2915802001953125, 0.31726837158203125, 0.34295654296875, 0.36864471435546875, 0.3943328857421875, 0.42002105712890625, 0.445709228515625, 0.47139739990234375, 0.4970855712890625, 0.5227737426757812, 0.5484619140625, 0.5741500854492188, 0.5998382568359375, 0.6255264282226562, 0.651214599609375, 0.6769027709960938, 0.7025909423828125, 0.7282791137695312, 0.75396728515625, 0.7796554565429688, 0.8053436279296875, 0.8310317993164062, 0.856719970703125, 0.8824081420898438, 0.9080963134765625, 0.9337844848632812, 0.95947265625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 8.0, 23.0, 65.0, 132.0, 273.0, 232.0, 162.0, 70.0, 28.0, 12.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.694255828857422, -16.331281661987305, -15.968308448791504, -15.605334281921387, -15.24236011505127, -14.879386901855469, -14.516412734985352, -14.153438568115234, -13.790464401245117, -13.427490234375, -13.0645170211792, -12.701542854309082, -12.338568687438965, -11.975595474243164, -11.612621307373047, -11.24964714050293, -10.886673927307129, -10.523699760437012, -10.160726547241211, -9.797752380371094, -9.434778213500977, -9.07180404663086, -8.708830833435059, -8.345856666564941, -7.982882976531982, -7.619909286499023, -7.256935119628906, -6.893961429595947, -6.530987739562988, -6.168013572692871, -5.805039882659912, -5.442066192626953, -5.079092025756836, -4.716118335723877, -4.35314416885376, -3.990170478820801, -3.6271965503692627, -3.2642226219177246, -2.9012489318847656, -2.5382750034332275, -2.1753010749816895, -1.8123271465301514, -1.4493533372879028, -1.0863795280456543, -0.7234055995941162, -0.3604316711425781, 0.0025420188903808594, 0.36551594734191895, 0.728489875793457, 1.0914638042449951, 1.4544376134872437, 1.8174114227294922, 2.1803853511810303, 2.5433592796325684, 2.9063329696655273, 3.2693068981170654, 3.6322808265686035, 3.9952547550201416, 4.35822868347168, 4.721202373504639, 5.084176063537598, 5.447150230407715, 5.810123920440674, 6.173097610473633, 6.53607177734375]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 5.0, 4.0, 3.0, 3.0, 10.0, 5.0, 7.0, 4.0, 11.0, 8.0, 24.0, 16.0, 25.0, 29.0, 36.0, 37.0, 21.0, 25.0, 37.0, 38.0, 44.0, 49.0, 46.0, 49.0, 47.0, 56.0, 45.0, 38.0, 42.0, 25.0, 34.0, 23.0, 23.0, 19.0, 22.0, 14.0, 17.0, 11.0, 13.0, 7.0, 9.0, 5.0, 5.0, 2.0, 2.0, 4.0, 3.0, 4.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-2.9814746379852295, -2.891805648803711, -2.8021366596221924, -2.712467670440674, -2.622798442840576, -2.5331294536590576, -2.443460464477539, -2.3537914752960205, -2.264122486114502, -2.1744534969329834, -2.084784507751465, -1.9951153993606567, -1.9054462909698486, -1.81577730178833, -1.7261083126068115, -1.636439323425293, -1.5467700958251953, -1.4571011066436768, -1.3674319982528687, -1.27776300907135, -1.188093900680542, -1.0984249114990234, -1.0087559223175049, -0.9190868735313416, -0.8294178247451782, -0.7397487759590149, -0.6500797271728516, -0.560410737991333, -0.4707416892051697, -0.38107264041900635, -0.2914036512374878, -0.20173460245132446, -0.11206579208374023, -0.022396758198738098, 0.06727227568626404, 0.15694129467010498, 0.2466103434562683, 0.33627939224243164, 0.4259483814239502, 0.5156174302101135, 0.6052864789962769, 0.6949555277824402, 0.7846245765686035, 0.8742935657501221, 0.9639626145362854, 1.0536316633224487, 1.1433006525039673, 1.2329697608947754, 1.322638750076294, 1.4123077392578125, 1.5019768476486206, 1.5916458368301392, 1.6813149452209473, 1.7709839344024658, 1.8606529235839844, 1.950321912765503, 2.0399909019470215, 2.12965989112854, 2.2193288803100586, 2.3089981079101562, 2.398667097091675, 2.4883360862731934, 2.578005075454712, 2.6676740646362305, 2.757343292236328]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 7.0, 8.0, 8.0, 24.0, 32.0, 35.0, 63.0, 140.0, 273.0, 783.0, 2825.0, 20971.0, 3849465.0, 307218.0, 9800.0, 1639.0, 499.0, 198.0, 111.0, 49.0, 42.0, 24.0, 16.0, 16.0, 7.0, 12.0, 2.0, 6.0, 4.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0234375, -1.94512939453125, -1.8668212890625, -1.78851318359375, -1.710205078125, -1.63189697265625, -1.5535888671875, -1.47528076171875, -1.39697265625, -1.31866455078125, -1.2403564453125, -1.16204833984375, -1.083740234375, -1.00543212890625, -0.9271240234375, -0.84881591796875, -0.7705078125, -0.69219970703125, -0.6138916015625, -0.53558349609375, -0.457275390625, -0.37896728515625, -0.3006591796875, -0.22235107421875, -0.14404296875, -0.06573486328125, 0.0125732421875, 0.09088134765625, 0.169189453125, 0.24749755859375, 0.3258056640625, 0.40411376953125, 0.482421875, 0.56072998046875, 0.6390380859375, 0.71734619140625, 0.795654296875, 0.87396240234375, 0.9522705078125, 1.03057861328125, 1.10888671875, 1.18719482421875, 1.2655029296875, 1.34381103515625, 1.422119140625, 1.50042724609375, 1.5787353515625, 1.65704345703125, 1.7353515625, 1.81365966796875, 1.8919677734375, 1.97027587890625, 2.048583984375, 2.12689208984375, 2.2052001953125, 2.28350830078125, 2.36181640625, 2.44012451171875, 2.5184326171875, 2.59674072265625, 2.675048828125, 2.75335693359375, 2.8316650390625, 2.90997314453125, 2.98828125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 2.0, 4.0, 4.0, 3.0, 7.0, 11.0, 9.0, 19.0, 16.0, 18.0, 35.0, 29.0, 40.0, 39.0, 58.0, 47.0, 66.0, 55.0, 58.0, 73.0, 74.0, 56.0, 47.0, 48.0, 41.0, 33.0, 27.0, 15.0, 10.0, 18.0, 15.0, 7.0, 6.0, 6.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.154296875, -0.1488628387451172, -0.14342880249023438, -0.13799476623535156, -0.13256072998046875, -0.12712669372558594, -0.12169265747070312, -0.11625862121582031, -0.1108245849609375, -0.10539054870605469, -0.09995651245117188, -0.09452247619628906, -0.08908843994140625, -0.08365440368652344, -0.07822036743164062, -0.07278633117675781, -0.067352294921875, -0.06191825866699219, -0.056484222412109375, -0.05105018615722656, -0.04561614990234375, -0.04018211364746094, -0.034748077392578125, -0.029314041137695312, -0.0238800048828125, -0.018445968627929688, -0.013011932373046875, -0.0075778961181640625, -0.00214385986328125, 0.0032901763916015625, 0.008724212646484375, 0.014158248901367188, 0.01959228515625, 0.025026321411132812, 0.030460357666015625, 0.03589439392089844, 0.04132843017578125, 0.04676246643066406, 0.052196502685546875, 0.05763053894042969, 0.0630645751953125, 0.06849861145019531, 0.07393264770507812, 0.07936668395996094, 0.08480072021484375, 0.09023475646972656, 0.09566879272460938, 0.10110282897949219, 0.106536865234375, 0.11197090148925781, 0.11740493774414062, 0.12283897399902344, 0.12827301025390625, 0.13370704650878906, 0.13914108276367188, 0.1445751190185547, 0.1500091552734375, 0.1554431915283203, 0.16087722778320312, 0.16631126403808594, 0.17174530029296875, 0.17717933654785156, 0.18261337280273438, 0.1880474090576172, 0.1934814453125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 10.0, 11.0, 9.0, 10.0, 15.0, 32.0, 41.0, 50.0, 61.0, 85.0, 101.0, 206.0, 445.0, 1094.0, 4926.0, 51678.0, 3974024.0, 149846.0, 8785.0, 1690.0, 541.0, 225.0, 113.0, 71.0, 52.0, 52.0, 30.0, 29.0, 8.0, 15.0, 11.0, 5.0, 5.0, 1.0, 4.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.890625, -1.819671630859375, -1.74871826171875, -1.677764892578125, -1.6068115234375, -1.535858154296875, -1.46490478515625, -1.393951416015625, -1.322998046875, -1.252044677734375, -1.18109130859375, -1.110137939453125, -1.0391845703125, -0.968231201171875, -0.89727783203125, -0.826324462890625, -0.75537109375, -0.684417724609375, -0.61346435546875, -0.542510986328125, -0.4715576171875, -0.400604248046875, -0.32965087890625, -0.258697509765625, -0.187744140625, -0.116790771484375, -0.04583740234375, 0.025115966796875, 0.0960693359375, 0.167022705078125, 0.23797607421875, 0.308929443359375, 0.3798828125, 0.450836181640625, 0.52178955078125, 0.592742919921875, 0.6636962890625, 0.734649658203125, 0.80560302734375, 0.876556396484375, 0.947509765625, 1.018463134765625, 1.08941650390625, 1.160369873046875, 1.2313232421875, 1.302276611328125, 1.37322998046875, 1.444183349609375, 1.51513671875, 1.586090087890625, 1.65704345703125, 1.727996826171875, 1.7989501953125, 1.869903564453125, 1.94085693359375, 2.011810302734375, 2.082763671875, 2.153717041015625, 2.22467041015625, 2.295623779296875, 2.3665771484375, 2.437530517578125, 2.50848388671875, 2.579437255859375, 2.650390625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 5.0, 6.0, 8.0, 15.0, 20.0, 46.0, 85.0, 240.0, 1028.0, 2074.0, 331.0, 126.0, 46.0, 16.0, 15.0, 10.0, 4.0, 5.0, 3.0, 3.0, 1.0, 1.0], "bins": [-1.0322265625, -1.0120468139648438, -0.9918670654296875, -0.9716873168945312, -0.951507568359375, -0.9313278198242188, -0.9111480712890625, -0.8909683227539062, -0.87078857421875, -0.8506088256835938, -0.8304290771484375, -0.8102493286132812, -0.790069580078125, -0.7698898315429688, -0.7497100830078125, -0.7295303344726562, -0.7093505859375, -0.6891708374023438, -0.6689910888671875, -0.6488113403320312, -0.628631591796875, -0.6084518432617188, -0.5882720947265625, -0.5680923461914062, -0.54791259765625, -0.5277328491210938, -0.5075531005859375, -0.48737335205078125, -0.467193603515625, -0.44701385498046875, -0.4268341064453125, -0.40665435791015625, -0.386474609375, -0.36629486083984375, -0.3461151123046875, -0.32593536376953125, -0.305755615234375, -0.28557586669921875, -0.2653961181640625, -0.24521636962890625, -0.22503662109375, -0.20485687255859375, -0.1846771240234375, -0.16449737548828125, -0.144317626953125, -0.12413787841796875, -0.1039581298828125, -0.08377838134765625, -0.0635986328125, -0.04341888427734375, -0.0232391357421875, -0.00305938720703125, 0.017120361328125, 0.03730010986328125, 0.0574798583984375, 0.07765960693359375, 0.09783935546875, 0.11801910400390625, 0.1381988525390625, 0.15837860107421875, 0.178558349609375, 0.19873809814453125, 0.2189178466796875, 0.23909759521484375, 0.25927734375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 9.0, 6.0, 33.0, 134.0, 343.0, 276.0, 133.0, 36.0, 11.0, 6.0, 2.0, 7.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.465598106384277, -9.280097007751465, -9.094595909118652, -8.90909481048584, -8.723592758178711, -8.538091659545898, -8.352590560913086, -8.167089462280273, -7.981588363647461, -7.796087265014648, -7.610585689544678, -7.425084590911865, -7.239583492279053, -7.05408239364624, -6.8685808181762695, -6.683079719543457, -6.4975786209106445, -6.312077522277832, -6.126575946807861, -5.941074848175049, -5.755573749542236, -5.570072650909424, -5.384571075439453, -5.199069976806641, -5.01356840133667, -4.828067302703857, -4.642565727233887, -4.457064628601074, -4.271563529968262, -4.086062431335449, -3.9005608558654785, -3.715059757232666, -3.5295586585998535, -3.344057321548462, -3.1585562229156494, -2.973054885864258, -2.7875537872314453, -2.6020524501800537, -2.416551113128662, -2.2310500144958496, -2.045548915863037, -1.860047698020935, -1.674546480178833, -1.4890451431274414, -1.303544044494629, -1.1180427074432373, -0.9325414896011353, -0.7470402717590332, -0.5615389347076416, -0.37603771686553955, -0.1905364692211151, -0.005035221576690674, 0.18046599626541138, 0.3659672141075134, 0.5514684915542603, 0.7369697093963623, 0.9224709272384644, 1.1079721450805664, 1.2934733629226685, 1.4789745807647705, 1.664475917816162, 1.8499770164489746, 2.035478353500366, 2.220979690551758, 2.4064807891845703]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 9.0, 16.0, 18.0, 21.0, 35.0, 53.0, 57.0, 67.0, 68.0, 68.0, 89.0, 81.0, 76.0, 68.0, 71.0, 60.0, 41.0, 28.0, 29.0, 19.0, 11.0, 9.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3186640739440918, -1.2607791423797607, -1.2028943300247192, -1.1450093984603882, -1.0871244668960571, -1.0292396545410156, -0.9713547229766846, -0.9134698510169983, -0.855584979057312, -0.7977001070976257, -0.7398151755332947, -0.6819303035736084, -0.6240454316139221, -0.5661605596542358, -0.5082756280899048, -0.4503907561302185, -0.39250582456588745, -0.3346209228038788, -0.2767360508441925, -0.21885114908218384, -0.16096626222133636, -0.10308137536048889, -0.045196473598480225, 0.012688398361206055, 0.07057330012321472, 0.1284581869840622, 0.18634307384490967, 0.24422797560691833, 0.302112877368927, 0.3599977493286133, 0.41788265109062195, 0.4757675230503082, 0.5336524248123169, 0.5915372967720032, 0.6494222283363342, 0.7073071002960205, 0.7651919722557068, 0.8230768442153931, 0.8809617757797241, 0.9388466477394104, 0.9967315196990967, 1.0546164512634277, 1.1125012636184692, 1.1703861951828003, 1.2282711267471313, 1.2861559391021729, 1.344040870666504, 1.401925802230835, 1.459810733795166, 1.517695665359497, 1.5755804777145386, 1.6334654092788696, 1.6913503408432007, 1.7492351531982422, 1.8071200847625732, 1.8650050163269043, 1.9228898286819458, 1.9807747602462769, 2.0386595726013184, 2.0965445041656494, 2.1544294357299805, 2.2123143672943115, 2.2701992988586426, 2.3280839920043945, 2.3859689235687256]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 4.0, 6.0, 4.0, 9.0, 14.0, 21.0, 30.0, 36.0, 78.0, 172.0, 402.0, 1243.0, 6591.0, 100170.0, 840674.0, 90955.0, 6122.0, 1235.0, 435.0, 156.0, 75.0, 45.0, 39.0, 23.0, 6.0, 5.0, 6.0, 0.0, 5.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9140625, -1.838958740234375, -1.76385498046875, -1.688751220703125, -1.6136474609375, -1.538543701171875, -1.46343994140625, -1.388336181640625, -1.313232421875, -1.238128662109375, -1.16302490234375, -1.087921142578125, -1.0128173828125, -0.937713623046875, -0.86260986328125, -0.787506103515625, -0.71240234375, -0.637298583984375, -0.56219482421875, -0.487091064453125, -0.4119873046875, -0.336883544921875, -0.26177978515625, -0.186676025390625, -0.111572265625, -0.036468505859375, 0.03863525390625, 0.113739013671875, 0.1888427734375, 0.263946533203125, 0.33905029296875, 0.414154052734375, 0.4892578125, 0.564361572265625, 0.63946533203125, 0.714569091796875, 0.7896728515625, 0.864776611328125, 0.93988037109375, 1.014984130859375, 1.090087890625, 1.165191650390625, 1.24029541015625, 1.315399169921875, 1.3905029296875, 1.465606689453125, 1.54071044921875, 1.615814208984375, 1.69091796875, 1.766021728515625, 1.84112548828125, 1.916229248046875, 1.9913330078125, 2.066436767578125, 2.14154052734375, 2.216644287109375, 2.291748046875, 2.366851806640625, 2.44195556640625, 2.517059326171875, 2.5921630859375, 2.667266845703125, 2.74237060546875, 2.817474365234375, 2.892578125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 6.0, 10.0, 15.0, 14.0, 11.0, 23.0, 25.0, 24.0, 34.0, 36.0, 39.0, 49.0, 42.0, 69.0, 61.0, 63.0, 59.0, 60.0, 60.0, 37.0, 47.0, 38.0, 49.0, 33.0, 17.0, 21.0, 12.0, 13.0, 9.0, 13.0, 0.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1739501953125, -0.1684246063232422, -0.16289901733398438, -0.15737342834472656, -0.15184783935546875, -0.14632225036621094, -0.14079666137695312, -0.1352710723876953, -0.1297454833984375, -0.12421989440917969, -0.11869430541992188, -0.11316871643066406, -0.10764312744140625, -0.10211753845214844, -0.09659194946289062, -0.09106636047363281, -0.085540771484375, -0.08001518249511719, -0.07448959350585938, -0.06896400451660156, -0.06343841552734375, -0.05791282653808594, -0.052387237548828125, -0.04686164855957031, -0.0413360595703125, -0.03581047058105469, -0.030284881591796875, -0.024759292602539062, -0.01923370361328125, -0.013708114624023438, -0.008182525634765625, -0.0026569366455078125, 0.00286865234375, 0.008394241333007812, 0.013919830322265625, 0.019445419311523438, 0.02497100830078125, 0.030496597290039062, 0.036022186279296875, 0.04154777526855469, 0.0470733642578125, 0.05259895324707031, 0.058124542236328125, 0.06365013122558594, 0.06917572021484375, 0.07470130920410156, 0.08022689819335938, 0.08575248718261719, 0.091278076171875, 0.09680366516113281, 0.10232925415039062, 0.10785484313964844, 0.11338043212890625, 0.11890602111816406, 0.12443161010742188, 0.1299571990966797, 0.1354827880859375, 0.1410083770751953, 0.14653396606445312, 0.15205955505371094, 0.15758514404296875, 0.16311073303222656, 0.16863632202148438, 0.1741619110107422, 0.1796875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 8.0, 5.0, 7.0, 13.0, 16.0, 33.0, 27.0, 51.0, 92.0, 169.0, 266.0, 542.0, 1238.0, 3119.0, 8604.0, 25745.0, 82736.0, 266937.0, 423069.0, 161054.0, 49475.0, 16092.0, 5412.0, 2031.0, 818.0, 427.0, 222.0, 135.0, 75.0, 46.0, 41.0, 20.0, 10.0, 4.0, 7.0, 5.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.7978515625, -0.7764511108398438, -0.7550506591796875, -0.7336502075195312, -0.712249755859375, -0.6908493041992188, -0.6694488525390625, -0.6480484008789062, -0.62664794921875, -0.6052474975585938, -0.5838470458984375, -0.5624465942382812, -0.541046142578125, -0.5196456909179688, -0.4982452392578125, -0.47684478759765625, -0.4554443359375, -0.43404388427734375, -0.4126434326171875, -0.39124298095703125, -0.369842529296875, -0.34844207763671875, -0.3270416259765625, -0.30564117431640625, -0.28424072265625, -0.26284027099609375, -0.2414398193359375, -0.22003936767578125, -0.198638916015625, -0.17723846435546875, -0.1558380126953125, -0.13443756103515625, -0.113037109375, -0.09163665771484375, -0.0702362060546875, -0.04883575439453125, -0.027435302734375, -0.00603485107421875, 0.0153656005859375, 0.03676605224609375, 0.05816650390625, 0.07956695556640625, 0.1009674072265625, 0.12236785888671875, 0.143768310546875, 0.16516876220703125, 0.1865692138671875, 0.20796966552734375, 0.2293701171875, 0.25077056884765625, 0.2721710205078125, 0.29357147216796875, 0.314971923828125, 0.33637237548828125, 0.3577728271484375, 0.37917327880859375, 0.40057373046875, 0.42197418212890625, 0.4433746337890625, 0.46477508544921875, 0.486175537109375, 0.5075759887695312, 0.5289764404296875, 0.5503768920898438, 0.57177734375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 5.0, 2.0, 2.0, 2.0, 3.0, 3.0, 7.0, 12.0, 22.0, 12.0, 13.0, 17.0, 16.0, 20.0, 25.0, 26.0, 24.0, 34.0, 38.0, 43.0, 46.0, 42.0, 40.0, 41.0, 45.0, 38.0, 44.0, 45.0, 31.0, 39.0, 24.0, 27.0, 32.0, 23.0, 27.0, 24.0, 22.0, 15.0, 13.0, 19.0, 8.0, 8.0, 5.0, 7.0, 4.0, 4.0, 9.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5068359375, -0.4906768798828125, -0.474517822265625, -0.4583587646484375, -0.44219970703125, -0.4260406494140625, -0.409881591796875, -0.3937225341796875, -0.3775634765625, -0.3614044189453125, -0.345245361328125, -0.3290863037109375, -0.31292724609375, -0.2967681884765625, -0.280609130859375, -0.2644500732421875, -0.248291015625, -0.2321319580078125, -0.215972900390625, -0.1998138427734375, -0.18365478515625, -0.1674957275390625, -0.151336669921875, -0.1351776123046875, -0.1190185546875, -0.1028594970703125, -0.086700439453125, -0.0705413818359375, -0.05438232421875, -0.0382232666015625, -0.022064208984375, -0.0059051513671875, 0.01025390625, 0.0264129638671875, 0.042572021484375, 0.0587310791015625, 0.07489013671875, 0.0910491943359375, 0.107208251953125, 0.1233673095703125, 0.1395263671875, 0.1556854248046875, 0.171844482421875, 0.1880035400390625, 0.20416259765625, 0.2203216552734375, 0.236480712890625, 0.2526397705078125, 0.268798828125, 0.2849578857421875, 0.301116943359375, 0.3172760009765625, 0.33343505859375, 0.3495941162109375, 0.365753173828125, 0.3819122314453125, 0.3980712890625, 0.4142303466796875, 0.430389404296875, 0.4465484619140625, 0.46270751953125, 0.4788665771484375, 0.495025634765625, 0.5111846923828125, 0.52734375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 8.0, 12.0, 15.0, 39.0, 52.0, 81.0, 175.0, 375.0, 1071.0, 3442.0, 14639.0, 89250.0, 583425.0, 305159.0, 39949.0, 7593.0, 1955.0, 678.0, 304.0, 155.0, 60.0, 42.0, 33.0, 14.0, 3.0, 5.0, 2.0, 5.0, 4.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.389892578125, -0.3753395080566406, -0.36078643798828125, -0.3462333679199219, -0.3316802978515625, -0.3171272277832031, -0.30257415771484375, -0.2880210876464844, -0.273468017578125, -0.2589149475097656, -0.24436187744140625, -0.22980880737304688, -0.2152557373046875, -0.20070266723632812, -0.18614959716796875, -0.17159652709960938, -0.15704345703125, -0.14249038696289062, -0.12793731689453125, -0.11338424682617188, -0.0988311767578125, -0.08427810668945312, -0.06972503662109375, -0.055171966552734375, -0.040618896484375, -0.026065826416015625, -0.01151275634765625, 0.003040313720703125, 0.0175933837890625, 0.032146453857421875, 0.04669952392578125, 0.061252593994140625, 0.0758056640625, 0.09035873413085938, 0.10491180419921875, 0.11946487426757812, 0.1340179443359375, 0.14857101440429688, 0.16312408447265625, 0.17767715454101562, 0.192230224609375, 0.20678329467773438, 0.22133636474609375, 0.23588943481445312, 0.2504425048828125, 0.2649955749511719, 0.27954864501953125, 0.2941017150878906, 0.30865478515625, 0.3232078552246094, 0.33776092529296875, 0.3523139953613281, 0.3668670654296875, 0.3814201354980469, 0.39597320556640625, 0.4105262756347656, 0.425079345703125, 0.4396324157714844, 0.45418548583984375, 0.4687385559082031, 0.4832916259765625, 0.4978446960449219, 0.5123977661132812, 0.5269508361816406, 0.54150390625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 7.0, 5.0, 9.0, 4.0, 12.0, 14.0, 27.0, 36.0, 49.0, 81.0, 101.0, 114.0, 117.0, 114.0, 87.0, 58.0, 40.0, 26.0, 22.0, 15.0, 16.0, 9.0, 12.0, 2.0, 6.0, 8.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.018182754516602e-05, -8.738785982131958e-05, -8.459389209747314e-05, -8.179992437362671e-05, -7.900595664978027e-05, -7.621198892593384e-05, -7.34180212020874e-05, -7.062405347824097e-05, -6.783008575439453e-05, -6.50361180305481e-05, -6.224215030670166e-05, -5.9448182582855225e-05, -5.665421485900879e-05, -5.3860247135162354e-05, -5.106627941131592e-05, -4.827231168746948e-05, -4.547834396362305e-05, -4.268437623977661e-05, -3.9890408515930176e-05, -3.709644079208374e-05, -3.4302473068237305e-05, -3.150850534439087e-05, -2.8714537620544434e-05, -2.5920569896697998e-05, -2.3126602172851562e-05, -2.0332634449005127e-05, -1.753866672515869e-05, -1.4744699001312256e-05, -1.195073127746582e-05, -9.156763553619385e-06, -6.362795829772949e-06, -3.5688281059265137e-06, -7.748603820800781e-07, 2.0191073417663574e-06, 4.813075065612793e-06, 7.6070427894592285e-06, 1.0401010513305664e-05, 1.31949782371521e-05, 1.5988945960998535e-05, 1.878291368484497e-05, 2.1576881408691406e-05, 2.4370849132537842e-05, 2.7164816856384277e-05, 2.9958784580230713e-05, 3.275275230407715e-05, 3.5546720027923584e-05, 3.834068775177002e-05, 4.1134655475616455e-05, 4.392862319946289e-05, 4.6722590923309326e-05, 4.951655864715576e-05, 5.23105263710022e-05, 5.510449409484863e-05, 5.789846181869507e-05, 6.0692429542541504e-05, 6.348639726638794e-05, 6.628036499023438e-05, 6.907433271408081e-05, 7.186830043792725e-05, 7.466226816177368e-05, 7.745623588562012e-05, 8.025020360946655e-05, 8.304417133331299e-05, 8.583813905715942e-05, 8.863210678100586e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 8.0, 12.0, 8.0, 15.0, 22.0, 33.0, 48.0, 81.0, 112.0, 164.0, 264.0, 624.0, 1396.0, 4335.0, 15932.0, 78986.0, 533136.0, 348029.0, 49147.0, 10807.0, 3043.0, 1132.0, 518.0, 286.0, 147.0, 87.0, 51.0, 32.0, 30.0, 26.0, 13.0, 9.0, 7.0, 7.0, 4.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.399169921875, -0.3853416442871094, -0.37151336669921875, -0.3576850891113281, -0.3438568115234375, -0.3300285339355469, -0.31620025634765625, -0.3023719787597656, -0.288543701171875, -0.2747154235839844, -0.26088714599609375, -0.24705886840820312, -0.2332305908203125, -0.21940231323242188, -0.20557403564453125, -0.19174575805664062, -0.17791748046875, -0.16408920288085938, -0.15026092529296875, -0.13643264770507812, -0.1226043701171875, -0.10877609252929688, -0.09494781494140625, -0.08111953735351562, -0.067291259765625, -0.053462982177734375, -0.03963470458984375, -0.025806427001953125, -0.0119781494140625, 0.001850128173828125, 0.01567840576171875, 0.029506683349609375, 0.0433349609375, 0.057163238525390625, 0.07099151611328125, 0.08481979370117188, 0.0986480712890625, 0.11247634887695312, 0.12630462646484375, 0.14013290405273438, 0.153961181640625, 0.16778945922851562, 0.18161773681640625, 0.19544601440429688, 0.2092742919921875, 0.22310256958007812, 0.23693084716796875, 0.2507591247558594, 0.26458740234375, 0.2784156799316406, 0.29224395751953125, 0.3060722351074219, 0.3199005126953125, 0.3337287902832031, 0.34755706787109375, 0.3613853454589844, 0.375213623046875, 0.3890419006347656, 0.40287017822265625, 0.4166984558105469, 0.4305267333984375, 0.4443550109863281, 0.45818328857421875, 0.4720115661621094, 0.48583984375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 3.0, 2.0, 6.0, 9.0, 8.0, 11.0, 10.0, 10.0, 15.0, 22.0, 35.0, 45.0, 45.0, 71.0, 72.0, 51.0, 95.0, 85.0, 94.0, 71.0, 59.0, 49.0, 28.0, 21.0, 18.0, 23.0, 7.0, 15.0, 8.0, 2.0, 9.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.243896484375, -0.235107421875, -0.226318359375, -0.217529296875, -0.208740234375, -0.199951171875, -0.191162109375, -0.182373046875, -0.173583984375, -0.164794921875, -0.156005859375, -0.147216796875, -0.138427734375, -0.129638671875, -0.120849609375, -0.112060546875, -0.103271484375, -0.094482421875, -0.085693359375, -0.076904296875, -0.068115234375, -0.059326171875, -0.050537109375, -0.041748046875, -0.032958984375, -0.024169921875, -0.015380859375, -0.006591796875, 0.002197265625, 0.010986328125, 0.019775390625, 0.028564453125, 0.037353515625, 0.046142578125, 0.054931640625, 0.063720703125, 0.072509765625, 0.081298828125, 0.090087890625, 0.098876953125, 0.107666015625, 0.116455078125, 0.125244140625, 0.134033203125, 0.142822265625, 0.151611328125, 0.160400390625, 0.169189453125, 0.177978515625, 0.186767578125, 0.195556640625, 0.204345703125, 0.213134765625, 0.221923828125, 0.230712890625, 0.239501953125, 0.248291015625, 0.257080078125, 0.265869140625, 0.274658203125, 0.283447265625, 0.292236328125, 0.301025390625, 0.309814453125, 0.318603515625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 16.0, 60.0, 139.0, 251.0, 247.0, 177.0, 82.0, 20.0, 8.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.825963973999023, -16.469953536987305, -16.11394500732422, -15.7579345703125, -15.401925086975098, -15.045915603637695, -14.689906120300293, -14.33389663696289, -13.977886199951172, -13.62187671661377, -13.265867233276367, -12.909856796264648, -12.553847312927246, -12.197837829589844, -11.841828346252441, -11.485818862915039, -11.129809379577637, -10.773799896240234, -10.417790412902832, -10.06178092956543, -9.705770492553711, -9.349761009216309, -8.993751525878906, -8.637742042541504, -8.281732559204102, -7.925723075866699, -7.569713115692139, -7.213703632354736, -6.857693672180176, -6.501684188842773, -6.145674705505371, -5.789665222167969, -5.433655261993408, -5.077645778656006, -4.721635818481445, -4.365626335144043, -4.009616851806641, -3.65360689163208, -3.2975974082946777, -2.9415876865386963, -2.585577964782715, -2.2295682430267334, -1.8735586404800415, -1.5175490379333496, -1.1615393161773682, -0.8055295944213867, -0.4495201110839844, -0.09351038932800293, 0.2624993324279785, 0.6185089945793152, 0.9745186567306519, 1.3305282592773438, 1.6865379810333252, 2.0425477027893066, 2.398557186126709, 2.7545669078826904, 3.110576629638672, 3.4665863513946533, 3.8225960731506348, 4.178605556488037, 4.534615516662598, 4.890625, 5.246634483337402, 5.602643966674805, 5.958653926849365]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 4.0, 3.0, 4.0, 8.0, 5.0, 9.0, 10.0, 7.0, 21.0, 19.0, 15.0, 29.0, 25.0, 21.0, 38.0, 30.0, 38.0, 43.0, 51.0, 47.0, 48.0, 42.0, 40.0, 52.0, 43.0, 34.0, 42.0, 35.0, 36.0, 27.0, 33.0, 23.0, 23.0, 19.0, 18.0, 15.0, 6.0, 3.0, 12.0, 9.0, 4.0, 5.0, 3.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5132555961608887, -2.428422212600708, -2.3435890674591064, -2.258755683898926, -2.173922300338745, -2.0890889167785645, -2.004255771636963, -1.9194223880767822, -1.8345891237258911, -1.749755859375, -1.6649224758148193, -1.5800892114639282, -1.495255947113037, -1.4104225635528564, -1.3255892992019653, -1.2407560348510742, -1.1559226512908936, -1.0710893869400024, -0.9862560033798218, -0.9014227390289307, -0.8165894150733948, -0.7317560911178589, -0.6469228267669678, -0.5620895028114319, -0.477256178855896, -0.3924228549003601, -0.3075895607471466, -0.2227562665939331, -0.13792294263839722, -0.05308961868286133, 0.031743645668029785, 0.11657696962356567, 0.20141029357910156, 0.28624361753463745, 0.37107691168785095, 0.45591020584106445, 0.5407435297966003, 0.6255768537521362, 0.7104101181030273, 0.7952434420585632, 0.8800767660140991, 0.964910089969635, 1.049743413925171, 1.134576678276062, 1.2194099426269531, 1.3042433261871338, 1.389076590538025, 1.473909854888916, 1.5587432384490967, 1.6435765027999878, 1.7284098863601685, 1.8132431507110596, 1.8980765342712402, 1.9829097986221313, 2.0677430629730225, 2.152576446533203, 2.2374095916748047, 2.3222429752349854, 2.407076120376587, 2.4919095039367676, 2.5767428874969482, 2.661576271057129, 2.7464094161987305, 2.831242799758911, 2.916076183319092]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 6.0, 9.0, 18.0, 28.0, 36.0, 33.0, 53.0, 96.0, 183.0, 351.0, 685.0, 1539.0, 3965.0, 13393.0, 94671.0, 3904053.0, 149659.0, 17776.0, 4545.0, 1660.0, 689.0, 327.0, 188.0, 109.0, 52.0, 42.0, 29.0, 19.0, 14.0, 15.0, 9.0, 8.0, 5.0, 2.0, 5.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.9111328125, -1.854217529296875, -1.79730224609375, -1.740386962890625, -1.6834716796875, -1.626556396484375, -1.56964111328125, -1.512725830078125, -1.455810546875, -1.398895263671875, -1.34197998046875, -1.285064697265625, -1.2281494140625, -1.171234130859375, -1.11431884765625, -1.057403564453125, -1.00048828125, -0.943572998046875, -0.88665771484375, -0.829742431640625, -0.7728271484375, -0.715911865234375, -0.65899658203125, -0.602081298828125, -0.545166015625, -0.488250732421875, -0.43133544921875, -0.374420166015625, -0.3175048828125, -0.260589599609375, -0.20367431640625, -0.146759033203125, -0.08984375, -0.032928466796875, 0.02398681640625, 0.080902099609375, 0.1378173828125, 0.194732666015625, 0.25164794921875, 0.308563232421875, 0.365478515625, 0.422393798828125, 0.47930908203125, 0.536224365234375, 0.5931396484375, 0.650054931640625, 0.70697021484375, 0.763885498046875, 0.82080078125, 0.877716064453125, 0.93463134765625, 0.991546630859375, 1.0484619140625, 1.105377197265625, 1.16229248046875, 1.219207763671875, 1.276123046875, 1.333038330078125, 1.38995361328125, 1.446868896484375, 1.5037841796875, 1.560699462890625, 1.61761474609375, 1.674530029296875, 1.7314453125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 6.0, 9.0, 8.0, 12.0, 12.0, 9.0, 29.0, 26.0, 34.0, 33.0, 35.0, 46.0, 40.0, 41.0, 56.0, 61.0, 53.0, 57.0, 59.0, 55.0, 51.0, 46.0, 38.0, 32.0, 26.0, 28.0, 29.0, 26.0, 11.0, 8.0, 6.0, 9.0, 4.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.1812744140625, -0.1757221221923828, -0.17016983032226562, -0.16461753845214844, -0.15906524658203125, -0.15351295471191406, -0.14796066284179688, -0.1424083709716797, -0.1368560791015625, -0.1313037872314453, -0.12575149536132812, -0.12019920349121094, -0.11464691162109375, -0.10909461975097656, -0.10354232788085938, -0.09799003601074219, -0.092437744140625, -0.08688545227050781, -0.08133316040039062, -0.07578086853027344, -0.07022857666015625, -0.06467628479003906, -0.059123992919921875, -0.05357170104980469, -0.0480194091796875, -0.04246711730957031, -0.036914825439453125, -0.03136253356933594, -0.02581024169921875, -0.020257949829101562, -0.014705657958984375, -0.009153366088867188, -0.00360107421875, 0.0019512176513671875, 0.007503509521484375, 0.013055801391601562, 0.01860809326171875, 0.024160385131835938, 0.029712677001953125, 0.03526496887207031, 0.0408172607421875, 0.04636955261230469, 0.051921844482421875, 0.05747413635253906, 0.06302642822265625, 0.06857872009277344, 0.07413101196289062, 0.07968330383300781, 0.085235595703125, 0.09078788757324219, 0.09634017944335938, 0.10189247131347656, 0.10744476318359375, 0.11299705505371094, 0.11854934692382812, 0.12410163879394531, 0.1296539306640625, 0.1352062225341797, 0.14075851440429688, 0.14631080627441406, 0.15186309814453125, 0.15741539001464844, 0.16296768188476562, 0.1685199737548828, 0.174072265625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 7.0, 8.0, 14.0, 21.0, 43.0, 61.0, 55.0, 106.0, 226.0, 351.0, 681.0, 1580.0, 5380.0, 25150.0, 373403.0, 3707523.0, 65019.0, 9861.0, 2641.0, 980.0, 487.0, 265.0, 159.0, 91.0, 56.0, 41.0, 30.0, 21.0, 10.0, 10.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.333984375, -2.27447509765625, -2.2149658203125, -2.15545654296875, -2.095947265625, -2.03643798828125, -1.9769287109375, -1.91741943359375, -1.85791015625, -1.79840087890625, -1.7388916015625, -1.67938232421875, -1.619873046875, -1.56036376953125, -1.5008544921875, -1.44134521484375, -1.3818359375, -1.32232666015625, -1.2628173828125, -1.20330810546875, -1.143798828125, -1.08428955078125, -1.0247802734375, -0.96527099609375, -0.90576171875, -0.84625244140625, -0.7867431640625, -0.72723388671875, -0.667724609375, -0.60821533203125, -0.5487060546875, -0.48919677734375, -0.4296875, -0.37017822265625, -0.3106689453125, -0.25115966796875, -0.191650390625, -0.13214111328125, -0.0726318359375, -0.01312255859375, 0.04638671875, 0.10589599609375, 0.1654052734375, 0.22491455078125, 0.284423828125, 0.34393310546875, 0.4034423828125, 0.46295166015625, 0.5224609375, 0.58197021484375, 0.6414794921875, 0.70098876953125, 0.760498046875, 0.82000732421875, 0.8795166015625, 0.93902587890625, 0.99853515625, 1.05804443359375, 1.1175537109375, 1.17706298828125, 1.236572265625, 1.29608154296875, 1.3555908203125, 1.41510009765625, 1.474609375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 2.0, 2.0, 6.0, 5.0, 13.0, 14.0, 23.0, 35.0, 74.0, 106.0, 227.0, 781.0, 2061.0, 356.0, 146.0, 73.0, 58.0, 34.0, 14.0, 12.0, 11.0, 4.0, 4.0, 5.0, 4.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39697265625, -0.3812408447265625, -0.365509033203125, -0.3497772216796875, -0.33404541015625, -0.3183135986328125, -0.302581787109375, -0.2868499755859375, -0.2711181640625, -0.2553863525390625, -0.239654541015625, -0.2239227294921875, -0.20819091796875, -0.1924591064453125, -0.176727294921875, -0.1609954833984375, -0.145263671875, -0.1295318603515625, -0.113800048828125, -0.0980682373046875, -0.08233642578125, -0.0666046142578125, -0.050872802734375, -0.0351409912109375, -0.0194091796875, -0.0036773681640625, 0.012054443359375, 0.0277862548828125, 0.04351806640625, 0.0592498779296875, 0.074981689453125, 0.0907135009765625, 0.1064453125, 0.1221771240234375, 0.137908935546875, 0.1536407470703125, 0.16937255859375, 0.1851043701171875, 0.200836181640625, 0.2165679931640625, 0.2322998046875, 0.2480316162109375, 0.263763427734375, 0.2794952392578125, 0.29522705078125, 0.3109588623046875, 0.326690673828125, 0.3424224853515625, 0.358154296875, 0.3738861083984375, 0.389617919921875, 0.4053497314453125, 0.42108154296875, 0.4368133544921875, 0.452545166015625, 0.4682769775390625, 0.4840087890625, 0.4997406005859375, 0.515472412109375, 0.5312042236328125, 0.54693603515625, 0.5626678466796875, 0.578399658203125, 0.5941314697265625, 0.60986328125]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 8.0, 34.0, 103.0, 261.0, 330.0, 181.0, 46.0, 18.0, 5.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.936696529388428, -5.757986068725586, -5.579276084899902, -5.4005656242370605, -5.221855163574219, -5.043145179748535, -4.864434719085693, -4.685724258422852, -4.507014274597168, -4.328303813934326, -4.149593830108643, -3.970883369445801, -3.792172908782959, -3.6134626865386963, -3.4347524642944336, -3.256042003631592, -3.07733154296875, -2.8986213207244873, -2.7199108600616455, -2.541200637817383, -2.362490177154541, -2.1837799549102783, -2.0050697326660156, -1.8263593912124634, -1.6476490497589111, -1.4689387083053589, -1.2902283668518066, -1.111518144607544, -0.9328078031539917, -0.7540974617004395, -0.5753872394561768, -0.3966768980026245, -0.21796703338623047, -0.03925672173500061, 0.13945358991622925, 0.3181638717651367, 0.49687421321868896, 0.6755845546722412, 0.8542947769165039, 1.0330051183700562, 1.2117154598236084, 1.3904258012771606, 1.569136142730713, 1.7478463649749756, 1.9265567064285278, 2.10526704788208, 2.2839772701263428, 2.4626874923706055, 2.6413979530334473, 2.82010817527771, 2.9988186359405518, 3.1775288581848145, 3.3562393188476562, 3.534949541091919, 3.7136597633361816, 3.8923702239990234, 4.071080207824707, 4.249790668487549, 4.428500652313232, 4.607211112976074, 4.785921573638916, 4.964632034301758, 5.143342018127441, 5.322052478790283, 5.500762939453125]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 5.0, 7.0, 8.0, 14.0, 12.0, 10.0, 19.0, 14.0, 31.0, 32.0, 41.0, 35.0, 53.0, 54.0, 48.0, 66.0, 70.0, 55.0, 50.0, 61.0, 62.0, 44.0, 37.0, 35.0, 25.0, 32.0, 26.0, 22.0, 9.0, 4.0, 6.0, 2.0, 6.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4183084964752197, -1.3751988410949707, -1.3320890665054321, -1.288979411125183, -1.245869755744934, -1.2027599811553955, -1.1596503257751465, -1.1165406703948975, -1.0734310150146484, -1.0303213596343994, -0.9872116446495056, -0.9441019296646118, -0.9009922742843628, -0.857882559299469, -0.8147728443145752, -0.7716631889343262, -0.7285534143447876, -0.6854436993598938, -0.6423340439796448, -0.599224328994751, -0.556114673614502, -0.5130049586296082, -0.46989524364471436, -0.42678555846214294, -0.38367587327957153, -0.3405661880970001, -0.2974565029144287, -0.2543467879295349, -0.2112371027469635, -0.1681274175643921, -0.1250177025794983, -0.08190801739692688, -0.03879821300506592, 0.00431147962808609, 0.0474211722612381, 0.0905308723449707, 0.13364055752754211, 0.17675024271011353, 0.21985995769500732, 0.26296964287757874, 0.30607932806015015, 0.34918901324272156, 0.39229869842529297, 0.43540841341018677, 0.4785180985927582, 0.5216277837753296, 0.5647374987602234, 0.6078472137451172, 0.6509568691253662, 0.69406658411026, 0.737176239490509, 0.7802859544754028, 0.8233956098556519, 0.8665053248405457, 0.9096150398254395, 0.9527246952056885, 0.9958344101905823, 1.038944125175476, 1.082053780555725, 1.1251635551452637, 1.1682732105255127, 1.2113828659057617, 1.2544925212860107, 1.2976022958755493, 1.3407119512557983]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 4.0, 2.0, 0.0, 2.0, 8.0, 16.0, 16.0, 18.0, 28.0, 33.0, 41.0, 73.0, 137.0, 209.0, 326.0, 653.0, 1289.0, 2954.0, 8017.0, 25662.0, 93509.0, 315171.0, 402326.0, 141033.0, 38171.0, 11266.0, 4024.0, 1659.0, 820.0, 437.0, 236.0, 148.0, 76.0, 65.0, 31.0, 35.0, 19.0, 11.0, 11.0, 5.0, 8.0, 5.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.97509765625, -0.9404678344726562, -0.9058380126953125, -0.8712081909179688, -0.836578369140625, -0.8019485473632812, -0.7673187255859375, -0.7326889038085938, -0.69805908203125, -0.6634292602539062, -0.6287994384765625, -0.5941696166992188, -0.559539794921875, -0.5249099731445312, -0.4902801513671875, -0.45565032958984375, -0.4210205078125, -0.38639068603515625, -0.3517608642578125, -0.31713104248046875, -0.282501220703125, -0.24787139892578125, -0.2132415771484375, -0.17861175537109375, -0.14398193359375, -0.10935211181640625, -0.0747222900390625, -0.04009246826171875, -0.005462646484375, 0.02916717529296875, 0.0637969970703125, 0.09842681884765625, 0.133056640625, 0.16768646240234375, 0.2023162841796875, 0.23694610595703125, 0.271575927734375, 0.30620574951171875, 0.3408355712890625, 0.37546539306640625, 0.41009521484375, 0.44472503662109375, 0.4793548583984375, 0.5139846801757812, 0.548614501953125, 0.5832443237304688, 0.6178741455078125, 0.6525039672851562, 0.6871337890625, 0.7217636108398438, 0.7563934326171875, 0.7910232543945312, 0.825653076171875, 0.8602828979492188, 0.8949127197265625, 0.9295425415039062, 0.96417236328125, 0.9988021850585938, 1.0334320068359375, 1.0680618286132812, 1.102691650390625, 1.1373214721679688, 1.1719512939453125, 1.2065811157226562, 1.2412109375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 8.0, 9.0, 5.0, 11.0, 12.0, 14.0, 17.0, 29.0, 20.0, 38.0, 44.0, 50.0, 48.0, 55.0, 59.0, 60.0, 59.0, 47.0, 58.0, 48.0, 46.0, 43.0, 47.0, 32.0, 30.0, 33.0, 16.0, 9.0, 20.0, 11.0, 3.0, 9.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.20703125, -0.20101547241210938, -0.19499969482421875, -0.18898391723632812, -0.1829681396484375, -0.17695236206054688, -0.17093658447265625, -0.16492080688476562, -0.158905029296875, -0.15288925170898438, -0.14687347412109375, -0.14085769653320312, -0.1348419189453125, -0.12882614135742188, -0.12281036376953125, -0.11679458618164062, -0.11077880859375, -0.10476303100585938, -0.09874725341796875, -0.09273147583007812, -0.0867156982421875, -0.08069992065429688, -0.07468414306640625, -0.06866836547851562, -0.062652587890625, -0.056636810302734375, -0.05062103271484375, -0.044605255126953125, -0.0385894775390625, -0.032573699951171875, -0.02655792236328125, -0.020542144775390625, -0.0145263671875, -0.008510589599609375, -0.00249481201171875, 0.003520965576171875, 0.0095367431640625, 0.015552520751953125, 0.02156829833984375, 0.027584075927734375, 0.033599853515625, 0.039615631103515625, 0.04563140869140625, 0.051647186279296875, 0.0576629638671875, 0.06367874145507812, 0.06969451904296875, 0.07571029663085938, 0.08172607421875, 0.08774185180664062, 0.09375762939453125, 0.09977340698242188, 0.1057891845703125, 0.11180496215820312, 0.11782073974609375, 0.12383651733398438, 0.129852294921875, 0.13586807250976562, 0.14188385009765625, 0.14789962768554688, 0.1539154052734375, 0.15993118286132812, 0.16594696044921875, 0.17196273803710938, 0.177978515625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 5.0, 3.0, 10.0, 15.0, 27.0, 28.0, 50.0, 73.0, 102.0, 178.0, 263.0, 406.0, 635.0, 1149.0, 2147.0, 4057.0, 8680.0, 19941.0, 48090.0, 114375.0, 242763.0, 298564.0, 174802.0, 75024.0, 31041.0, 13370.0, 6021.0, 2863.0, 1540.0, 871.0, 501.0, 342.0, 202.0, 115.0, 87.0, 62.0, 57.0, 36.0, 23.0, 11.0, 13.0, 7.0, 3.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.64501953125, -0.6267242431640625, -0.608428955078125, -0.5901336669921875, -0.57183837890625, -0.5535430908203125, -0.535247802734375, -0.5169525146484375, -0.4986572265625, -0.4803619384765625, -0.462066650390625, -0.4437713623046875, -0.42547607421875, -0.4071807861328125, -0.388885498046875, -0.3705902099609375, -0.352294921875, -0.3339996337890625, -0.315704345703125, -0.2974090576171875, -0.27911376953125, -0.2608184814453125, -0.242523193359375, -0.2242279052734375, -0.2059326171875, -0.1876373291015625, -0.169342041015625, -0.1510467529296875, -0.13275146484375, -0.1144561767578125, -0.096160888671875, -0.0778656005859375, -0.0595703125, -0.0412750244140625, -0.022979736328125, -0.0046844482421875, 0.01361083984375, 0.0319061279296875, 0.050201416015625, 0.0684967041015625, 0.0867919921875, 0.1050872802734375, 0.123382568359375, 0.1416778564453125, 0.15997314453125, 0.1782684326171875, 0.196563720703125, 0.2148590087890625, 0.233154296875, 0.2514495849609375, 0.269744873046875, 0.2880401611328125, 0.30633544921875, 0.3246307373046875, 0.342926025390625, 0.3612213134765625, 0.3795166015625, 0.3978118896484375, 0.416107177734375, 0.4344024658203125, 0.45269775390625, 0.4709930419921875, 0.489288330078125, 0.5075836181640625, 0.52587890625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 0.0, 4.0, 3.0, 3.0, 9.0, 7.0, 6.0, 6.0, 10.0, 18.0, 22.0, 17.0, 21.0, 28.0, 26.0, 37.0, 45.0, 42.0, 48.0, 36.0, 55.0, 30.0, 36.0, 48.0, 50.0, 43.0, 46.0, 57.0, 29.0, 37.0, 34.0, 24.0, 22.0, 18.0, 18.0, 10.0, 10.0, 14.0, 7.0, 8.0, 7.0, 3.0, 2.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.74267578125, -0.7205734252929688, -0.6984710693359375, -0.6763687133789062, -0.654266357421875, -0.6321640014648438, -0.6100616455078125, -0.5879592895507812, -0.56585693359375, -0.5437545776367188, -0.5216522216796875, -0.49954986572265625, -0.477447509765625, -0.45534515380859375, -0.4332427978515625, -0.41114044189453125, -0.3890380859375, -0.36693572998046875, -0.3448333740234375, -0.32273101806640625, -0.300628662109375, -0.27852630615234375, -0.2564239501953125, -0.23432159423828125, -0.21221923828125, -0.19011688232421875, -0.1680145263671875, -0.14591217041015625, -0.123809814453125, -0.10170745849609375, -0.0796051025390625, -0.05750274658203125, -0.035400390625, -0.01329803466796875, 0.0088043212890625, 0.03090667724609375, 0.053009033203125, 0.07511138916015625, 0.0972137451171875, 0.11931610107421875, 0.14141845703125, 0.16352081298828125, 0.1856231689453125, 0.20772552490234375, 0.229827880859375, 0.25193023681640625, 0.2740325927734375, 0.29613494873046875, 0.3182373046875, 0.34033966064453125, 0.3624420166015625, 0.38454437255859375, 0.406646728515625, 0.42874908447265625, 0.4508514404296875, 0.47295379638671875, 0.49505615234375, 0.5171585083007812, 0.5392608642578125, 0.5613632202148438, 0.583465576171875, 0.6055679321289062, 0.6276702880859375, 0.6497726440429688, 0.671875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 14.0, 10.0, 14.0, 33.0, 78.0, 126.0, 237.0, 518.0, 1349.0, 5303.0, 30098.0, 255831.0, 635507.0, 101238.0, 13732.0, 2859.0, 882.0, 340.0, 176.0, 109.0, 44.0, 23.0, 14.0, 9.0, 5.0, 5.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.64501953125, -0.6244049072265625, -0.603790283203125, -0.5831756591796875, -0.56256103515625, -0.5419464111328125, -0.521331787109375, -0.5007171630859375, -0.4801025390625, -0.4594879150390625, -0.438873291015625, -0.4182586669921875, -0.39764404296875, -0.3770294189453125, -0.356414794921875, -0.3358001708984375, -0.315185546875, -0.2945709228515625, -0.273956298828125, -0.2533416748046875, -0.23272705078125, -0.2121124267578125, -0.191497802734375, -0.1708831787109375, -0.1502685546875, -0.1296539306640625, -0.109039306640625, -0.0884246826171875, -0.06781005859375, -0.0471954345703125, -0.026580810546875, -0.0059661865234375, 0.0146484375, 0.0352630615234375, 0.055877685546875, 0.0764923095703125, 0.09710693359375, 0.1177215576171875, 0.138336181640625, 0.1589508056640625, 0.1795654296875, 0.2001800537109375, 0.220794677734375, 0.2414093017578125, 0.26202392578125, 0.2826385498046875, 0.303253173828125, 0.3238677978515625, 0.344482421875, 0.3650970458984375, 0.385711669921875, 0.4063262939453125, 0.42694091796875, 0.4475555419921875, 0.468170166015625, 0.4887847900390625, 0.5093994140625, 0.5300140380859375, 0.550628662109375, 0.5712432861328125, 0.59185791015625, 0.6124725341796875, 0.633087158203125, 0.6537017822265625, 0.67431640625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 4.0, 4.0, 8.0, 5.0, 5.0, 6.0, 6.0, 12.0, 20.0, 23.0, 23.0, 29.0, 41.0, 53.0, 50.0, 77.0, 57.0, 74.0, 81.0, 86.0, 73.0, 64.0, 42.0, 37.0, 26.0, 24.0, 15.0, 10.0, 13.0, 7.0, 10.0, 5.0, 5.0, 3.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.790327072143555e-05, -7.561780512332916e-05, -7.333233952522278e-05, -7.10468739271164e-05, -6.876140832901001e-05, -6.647594273090363e-05, -6.419047713279724e-05, -6.190501153469086e-05, -5.961954593658447e-05, -5.733408033847809e-05, -5.5048614740371704e-05, -5.276314914226532e-05, -5.0477683544158936e-05, -4.819221794605255e-05, -4.590675234794617e-05, -4.362128674983978e-05, -4.13358211517334e-05, -3.9050355553627014e-05, -3.676488995552063e-05, -3.4479424357414246e-05, -3.219395875930786e-05, -2.9908493161201477e-05, -2.7623027563095093e-05, -2.533756196498871e-05, -2.3052096366882324e-05, -2.076663076877594e-05, -1.8481165170669556e-05, -1.619569957256317e-05, -1.3910233974456787e-05, -1.1624768376350403e-05, -9.339302778244019e-06, -7.053837180137634e-06, -4.76837158203125e-06, -2.4829059839248657e-06, -1.9744038581848145e-07, 2.088025212287903e-06, 4.373490810394287e-06, 6.658956408500671e-06, 8.944422006607056e-06, 1.122988760471344e-05, 1.3515353202819824e-05, 1.580081880092621e-05, 1.8086284399032593e-05, 2.0371749997138977e-05, 2.265721559524536e-05, 2.4942681193351746e-05, 2.722814679145813e-05, 2.9513612389564514e-05, 3.17990779876709e-05, 3.408454358577728e-05, 3.637000918388367e-05, 3.865547478199005e-05, 4.0940940380096436e-05, 4.322640597820282e-05, 4.5511871576309204e-05, 4.779733717441559e-05, 5.008280277252197e-05, 5.236826837062836e-05, 5.465373396873474e-05, 5.6939199566841125e-05, 5.922466516494751e-05, 6.15101307630539e-05, 6.379559636116028e-05, 6.608106195926666e-05, 6.836652755737305e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 3.0, 6.0, 13.0, 14.0, 27.0, 33.0, 67.0, 84.0, 135.0, 238.0, 448.0, 762.0, 1680.0, 3832.0, 9817.0, 27181.0, 80346.0, 246079.0, 402461.0, 182511.0, 59199.0, 20181.0, 7518.0, 2953.0, 1407.0, 695.0, 353.0, 205.0, 113.0, 69.0, 32.0, 39.0, 16.0, 9.0, 7.0, 7.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.338134765625, -0.3266181945800781, -0.31510162353515625, -0.3035850524902344, -0.2920684814453125, -0.2805519104003906, -0.26903533935546875, -0.2575187683105469, -0.246002197265625, -0.23448562622070312, -0.22296905517578125, -0.21145248413085938, -0.1999359130859375, -0.18841934204101562, -0.17690277099609375, -0.16538619995117188, -0.15386962890625, -0.14235305786132812, -0.13083648681640625, -0.11931991577148438, -0.1078033447265625, -0.09628677368164062, -0.08477020263671875, -0.07325363159179688, -0.061737060546875, -0.050220489501953125, -0.03870391845703125, -0.027187347412109375, -0.0156707763671875, -0.004154205322265625, 0.00736236572265625, 0.018878936767578125, 0.0303955078125, 0.041912078857421875, 0.05342864990234375, 0.06494522094726562, 0.0764617919921875, 0.08797836303710938, 0.09949493408203125, 0.11101150512695312, 0.122528076171875, 0.13404464721679688, 0.14556121826171875, 0.15707778930664062, 0.1685943603515625, 0.18011093139648438, 0.19162750244140625, 0.20314407348632812, 0.21466064453125, 0.22617721557617188, 0.23769378662109375, 0.24921035766601562, 0.2607269287109375, 0.2722434997558594, 0.28376007080078125, 0.2952766418457031, 0.306793212890625, 0.3183097839355469, 0.32982635498046875, 0.3413429260253906, 0.3528594970703125, 0.3643760681152344, 0.37589263916015625, 0.3874092102050781, 0.39892578125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 3.0, 4.0, 4.0, 6.0, 6.0, 12.0, 10.0, 21.0, 24.0, 18.0, 19.0, 27.0, 41.0, 41.0, 52.0, 61.0, 68.0, 71.0, 83.0, 74.0, 54.0, 49.0, 42.0, 37.0, 34.0, 25.0, 25.0, 11.0, 21.0, 9.0, 11.0, 6.0, 8.0, 6.0, 2.0, 2.0, 5.0, 10.0, 0.0, 1.0, 8.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.420654296875, -0.4083213806152344, -0.39598846435546875, -0.3836555480957031, -0.3713226318359375, -0.3589897155761719, -0.34665679931640625, -0.3343238830566406, -0.321990966796875, -0.3096580505371094, -0.29732513427734375, -0.2849922180175781, -0.2726593017578125, -0.2603263854980469, -0.24799346923828125, -0.23566055297851562, -0.22332763671875, -0.21099472045898438, -0.19866180419921875, -0.18632888793945312, -0.1739959716796875, -0.16166305541992188, -0.14933013916015625, -0.13699722290039062, -0.124664306640625, -0.11233139038085938, -0.09999847412109375, -0.08766555786132812, -0.0753326416015625, -0.06299972534179688, -0.05066680908203125, -0.038333892822265625, -0.0260009765625, -0.013668060302734375, -0.00133514404296875, 0.010997772216796875, 0.0233306884765625, 0.035663604736328125, 0.04799652099609375, 0.060329437255859375, 0.072662353515625, 0.08499526977539062, 0.09732818603515625, 0.10966110229492188, 0.1219940185546875, 0.13432693481445312, 0.14665985107421875, 0.15899276733398438, 0.17132568359375, 0.18365859985351562, 0.19599151611328125, 0.20832443237304688, 0.2206573486328125, 0.23299026489257812, 0.24532318115234375, 0.2576560974121094, 0.269989013671875, 0.2823219299316406, 0.29465484619140625, 0.3069877624511719, 0.3193206787109375, 0.3316535949707031, 0.34398651123046875, 0.3563194274902344, 0.36865234375]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 7.0, 9.0, 15.0, 18.0, 40.0, 72.0, 130.0, 177.0, 170.0, 152.0, 121.0, 50.0, 20.0, 19.0, 7.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.444522857666016, -16.117935180664062, -15.79134750366211, -15.464759826660156, -15.138172149658203, -14.81158447265625, -14.484996795654297, -14.158409118652344, -13.83182144165039, -13.505233764648438, -13.178646087646484, -12.852058410644531, -12.525470733642578, -12.198883056640625, -11.872295379638672, -11.545707702636719, -11.219120979309082, -10.892533302307129, -10.565945625305176, -10.239357948303223, -9.91277027130127, -9.586182594299316, -9.259594917297363, -8.933008193969727, -8.606420516967773, -8.27983283996582, -7.953245162963867, -7.626657485961914, -7.300069808959961, -6.973482131958008, -6.646894931793213, -6.32030725479126, -5.993719100952148, -5.667131423950195, -5.340543746948242, -5.013956069946289, -4.687368392944336, -4.360780715942383, -4.034193515777588, -3.7076058387756348, -3.3810181617736816, -3.0544304847717285, -2.7278428077697754, -2.4012553691864014, -2.0746676921844482, -1.7480800151824951, -1.4214924573898315, -1.094904899597168, -0.7683172225952148, -0.4417296051979065, -0.11514198780059814, 0.2114456295967102, 0.5380332469940186, 0.8646209239959717, 1.1912084817886353, 1.5177960395812988, 1.844383716583252, 2.170971393585205, 2.497559070587158, 2.8241465091705322, 3.1507341861724854, 3.4773218631744385, 3.8039093017578125, 4.130496978759766, 4.457084655761719]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 4.0, 6.0, 5.0, 12.0, 9.0, 9.0, 15.0, 17.0, 18.0, 20.0, 23.0, 25.0, 38.0, 25.0, 36.0, 42.0, 48.0, 38.0, 55.0, 45.0, 55.0, 54.0, 37.0, 55.0, 38.0, 46.0, 36.0, 35.0, 25.0, 17.0, 33.0, 18.0, 11.0, 15.0, 10.0, 7.0, 9.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.402034759521484, -4.275336265563965, -4.148637294769287, -4.021938800811768, -3.895240068435669, -3.7685413360595703, -3.641842842102051, -3.515144109725952, -3.3884453773498535, -3.261746644973755, -3.1350479125976562, -3.0083494186401367, -2.881650686264038, -2.7549519538879395, -2.62825345993042, -2.5015547275543213, -2.3748559951782227, -2.248157262802124, -2.1214585304260254, -1.9947600364685059, -1.8680613040924072, -1.7413625717163086, -1.6146639585494995, -1.4879653453826904, -1.3612666130065918, -1.2345678806304932, -1.107869267463684, -0.9811705946922302, -0.8544719219207764, -0.7277732491493225, -0.6010745763778687, -0.4743759036064148, -0.34767723083496094, -0.22097855806350708, -0.09427988529205322, 0.032418787479400635, 0.1591174602508545, 0.28581613302230835, 0.4125148057937622, 0.5392134785652161, 0.6659121513366699, 0.7926108241081238, 0.9193094968795776, 1.0460081100463867, 1.1727068424224854, 1.299405574798584, 1.426104187965393, 1.5528028011322021, 1.6795015335083008, 1.8062002658843994, 1.9328988790512085, 2.0595974922180176, 2.186296224594116, 2.312994956970215, 2.4396934509277344, 2.566392183303833, 2.6930909156799316, 2.8197896480560303, 2.946488380432129, 3.0731868743896484, 3.199885606765747, 3.3265843391418457, 3.4532828330993652, 3.579981565475464, 3.7066802978515625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 2.0, 5.0, 11.0, 14.0, 22.0, 25.0, 46.0, 80.0, 134.0, 245.0, 534.0, 1488.0, 4394.0, 18324.0, 139865.0, 3822677.0, 177738.0, 21159.0, 4921.0, 1547.0, 538.0, 225.0, 106.0, 63.0, 41.0, 18.0, 14.0, 9.0, 10.0, 4.0, 5.0, 4.0, 4.0, 3.0, 7.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.41015625, -1.34759521484375, -1.2850341796875, -1.22247314453125, -1.159912109375, -1.09735107421875, -1.0347900390625, -0.97222900390625, -0.90966796875, -0.84710693359375, -0.7845458984375, -0.72198486328125, -0.659423828125, -0.59686279296875, -0.5343017578125, -0.47174072265625, -0.4091796875, -0.34661865234375, -0.2840576171875, -0.22149658203125, -0.158935546875, -0.09637451171875, -0.0338134765625, 0.02874755859375, 0.09130859375, 0.15386962890625, 0.2164306640625, 0.27899169921875, 0.341552734375, 0.40411376953125, 0.4666748046875, 0.52923583984375, 0.591796875, 0.65435791015625, 0.7169189453125, 0.77947998046875, 0.842041015625, 0.90460205078125, 0.9671630859375, 1.02972412109375, 1.09228515625, 1.15484619140625, 1.2174072265625, 1.27996826171875, 1.342529296875, 1.40509033203125, 1.4676513671875, 1.53021240234375, 1.5927734375, 1.65533447265625, 1.7178955078125, 1.78045654296875, 1.843017578125, 1.90557861328125, 1.9681396484375, 2.03070068359375, 2.09326171875, 2.15582275390625, 2.2183837890625, 2.28094482421875, 2.343505859375, 2.40606689453125, 2.4686279296875, 2.53118896484375, 2.59375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 9.0, 9.0, 12.0, 10.0, 16.0, 16.0, 19.0, 21.0, 27.0, 23.0, 36.0, 47.0, 51.0, 48.0, 47.0, 63.0, 42.0, 53.0, 61.0, 47.0, 65.0, 40.0, 36.0, 33.0, 27.0, 30.0, 22.0, 22.0, 11.0, 17.0, 12.0, 7.0, 6.0, 5.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2069091796875, -0.20078468322753906, -0.19466018676757812, -0.1885356903076172, -0.18241119384765625, -0.1762866973876953, -0.17016220092773438, -0.16403770446777344, -0.1579132080078125, -0.15178871154785156, -0.14566421508789062, -0.1395397186279297, -0.13341522216796875, -0.1272907257080078, -0.12116622924804688, -0.11504173278808594, -0.108917236328125, -0.10279273986816406, -0.09666824340820312, -0.09054374694824219, -0.08441925048828125, -0.07829475402832031, -0.07217025756835938, -0.06604576110839844, -0.0599212646484375, -0.05379676818847656, -0.047672271728515625, -0.04154777526855469, -0.03542327880859375, -0.029298782348632812, -0.023174285888671875, -0.017049789428710938, -0.01092529296875, -0.0048007965087890625, 0.001323699951171875, 0.0074481964111328125, 0.01357269287109375, 0.019697189331054688, 0.025821685791015625, 0.03194618225097656, 0.0380706787109375, 0.04419517517089844, 0.050319671630859375, 0.05644416809082031, 0.06256866455078125, 0.06869316101074219, 0.07481765747070312, 0.08094215393066406, 0.087066650390625, 0.09319114685058594, 0.09931564331054688, 0.10544013977050781, 0.11156463623046875, 0.11768913269042969, 0.12381362915039062, 0.12993812561035156, 0.1360626220703125, 0.14218711853027344, 0.14831161499023438, 0.1544361114501953, 0.16056060791015625, 0.1666851043701172, 0.17280960083007812, 0.17893409729003906, 0.18505859375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 2.0, 7.0, 7.0, 6.0, 13.0, 20.0, 20.0, 42.0, 46.0, 73.0, 109.0, 156.0, 251.0, 397.0, 571.0, 975.0, 1679.0, 3200.0, 6563.0, 16481.0, 53374.0, 298933.0, 3394356.0, 328770.0, 56471.0, 17268.0, 6765.0, 3281.0, 1654.0, 1040.0, 587.0, 410.0, 235.0, 168.0, 101.0, 74.0, 52.0, 38.0, 24.0, 19.0, 21.0, 7.0, 5.0, 3.0, 3.0, 2.0, 5.0, 1.0, 0.0, 1.0, 3.0], "bins": [-1.3203125, -1.28314208984375, -1.2459716796875, -1.20880126953125, -1.171630859375, -1.13446044921875, -1.0972900390625, -1.06011962890625, -1.02294921875, -0.98577880859375, -0.9486083984375, -0.91143798828125, -0.874267578125, -0.83709716796875, -0.7999267578125, -0.76275634765625, -0.7255859375, -0.68841552734375, -0.6512451171875, -0.61407470703125, -0.576904296875, -0.53973388671875, -0.5025634765625, -0.46539306640625, -0.42822265625, -0.39105224609375, -0.3538818359375, -0.31671142578125, -0.279541015625, -0.24237060546875, -0.2052001953125, -0.16802978515625, -0.130859375, -0.09368896484375, -0.0565185546875, -0.01934814453125, 0.017822265625, 0.05499267578125, 0.0921630859375, 0.12933349609375, 0.16650390625, 0.20367431640625, 0.2408447265625, 0.27801513671875, 0.315185546875, 0.35235595703125, 0.3895263671875, 0.42669677734375, 0.4638671875, 0.50103759765625, 0.5382080078125, 0.57537841796875, 0.612548828125, 0.64971923828125, 0.6868896484375, 0.72406005859375, 0.76123046875, 0.79840087890625, 0.8355712890625, 0.87274169921875, 0.909912109375, 0.94708251953125, 0.9842529296875, 1.02142333984375, 1.05859375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 7.0, 4.0, 6.0, 9.0, 15.0, 22.0, 35.0, 58.0, 98.0, 202.0, 507.0, 1960.0, 610.0, 232.0, 107.0, 70.0, 34.0, 27.0, 17.0, 15.0, 7.0, 4.0, 8.0, 4.0, 1.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64599609375, -0.6225814819335938, -0.5991668701171875, -0.5757522583007812, -0.552337646484375, -0.5289230346679688, -0.5055084228515625, -0.48209381103515625, -0.45867919921875, -0.43526458740234375, -0.4118499755859375, -0.38843536376953125, -0.365020751953125, -0.34160614013671875, -0.3181915283203125, -0.29477691650390625, -0.2713623046875, -0.24794769287109375, -0.2245330810546875, -0.20111846923828125, -0.177703857421875, -0.15428924560546875, -0.1308746337890625, -0.10746002197265625, -0.08404541015625, -0.06063079833984375, -0.0372161865234375, -0.01380157470703125, 0.009613037109375, 0.03302764892578125, 0.0564422607421875, 0.07985687255859375, 0.103271484375, 0.12668609619140625, 0.1501007080078125, 0.17351531982421875, 0.196929931640625, 0.22034454345703125, 0.2437591552734375, 0.26717376708984375, 0.29058837890625, 0.31400299072265625, 0.3374176025390625, 0.36083221435546875, 0.384246826171875, 0.40766143798828125, 0.4310760498046875, 0.45449066162109375, 0.4779052734375, 0.5013198852539062, 0.5247344970703125, 0.5481491088867188, 0.571563720703125, 0.5949783325195312, 0.6183929443359375, 0.6418075561523438, 0.66522216796875, 0.6886367797851562, 0.7120513916015625, 0.7354660034179688, 0.758880615234375, 0.7822952270507812, 0.8057098388671875, 0.8291244506835938, 0.8525390625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 5.0, 2.0, 8.0, 25.0, 45.0, 104.0, 173.0, 210.0, 186.0, 133.0, 56.0, 35.0, 13.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.316376686096191, -9.11625862121582, -8.91614055633545, -8.716022491455078, -8.515904426574707, -8.315786361694336, -8.115668296813965, -7.915550231933594, -7.715432167053223, -7.515314102172852, -7.3151960372924805, -7.115077972412109, -6.914959907531738, -6.714841842651367, -6.514723777770996, -6.314605712890625, -6.114487648010254, -5.914369583129883, -5.714251518249512, -5.514133453369141, -5.3140153884887695, -5.113897323608398, -4.913779258728027, -4.713661193847656, -4.513542652130127, -4.313424587249756, -4.113306522369385, -3.9131884574890137, -3.7130703926086426, -3.5129523277282715, -3.3128342628479004, -3.1127161979675293, -2.912598133087158, -2.712480068206787, -2.512362003326416, -2.312243938446045, -2.112125873565674, -1.9120076894760132, -1.711889624595642, -1.511771559715271, -1.3116534948349, -1.1115354299545288, -0.9114173650741577, -0.7112992405891418, -0.5111811757087708, -0.3110630512237549, -0.11094498634338379, 0.0891730785369873, 0.2892911434173584, 0.4894092082977295, 0.6895272731781006, 0.8896453976631165, 1.0897634029388428, 1.2898815870285034, 1.4899996519088745, 1.6901177167892456, 1.8902357816696167, 2.0903539657592773, 2.2904720306396484, 2.4905900955200195, 2.6907081604003906, 2.8908262252807617, 3.090944290161133, 3.291062355041504, 3.491180419921875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 5.0, 1.0, 8.0, 9.0, 6.0, 9.0, 10.0, 9.0, 13.0, 16.0, 13.0, 30.0, 24.0, 42.0, 39.0, 37.0, 40.0, 38.0, 41.0, 52.0, 50.0, 60.0, 39.0, 43.0, 57.0, 38.0, 42.0, 40.0, 33.0, 28.0, 26.0, 20.0, 18.0, 14.0, 10.0, 6.0, 7.0, 8.0, 8.0, 7.0, 5.0, 2.0, 0.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.3479976654052734, -2.280540943145752, -2.2130842208862305, -2.145627498626709, -2.0781707763671875, -2.010714054107666, -1.943257451057434, -1.8758007287979126, -1.8083441257476807, -1.7408874034881592, -1.6734306812286377, -1.6059739589691162, -1.5385173559188843, -1.4710606336593628, -1.4036039113998413, -1.3361471891403198, -1.2686904668807983, -1.2012337446212769, -1.1337770223617554, -1.0663204193115234, -0.998863697052002, -0.9314069747924805, -0.863950252532959, -0.7964935302734375, -0.7290368676185608, -0.6615801453590393, -0.5941234827041626, -0.5266667604446411, -0.459210067987442, -0.3917533755302429, -0.32429665327072144, -0.25683996081352234, -0.18938326835632324, -0.12192656844854355, -0.054469868540763855, 0.012986838817596436, 0.08044353127479553, 0.14790022373199463, 0.2153569459915161, 0.2828136384487152, 0.3502703309059143, 0.4177270233631134, 0.4851837158203125, 0.552640438079834, 0.6200971603393555, 0.6875538229942322, 0.7550105452537537, 0.8224672079086304, 0.8899239301681519, 0.9573806524276733, 1.0248373746871948, 1.0922939777374268, 1.1597506999969482, 1.2272074222564697, 1.2946641445159912, 1.3621208667755127, 1.4295775890350342, 1.4970343112945557, 1.5644910335540771, 1.6319477558135986, 1.6994043588638306, 1.766861081123352, 1.8343178033828735, 1.901774525642395, 1.969231128692627]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [5.0, 1.0, 2.0, 2.0, 3.0, 6.0, 10.0, 8.0, 18.0, 26.0, 32.0, 84.0, 138.0, 281.0, 580.0, 1493.0, 3890.0, 12242.0, 44563.0, 172722.0, 422165.0, 281007.0, 78609.0, 20694.0, 6165.0, 2159.0, 880.0, 388.0, 203.0, 84.0, 45.0, 29.0, 17.0, 8.0, 5.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.92626953125, -0.8815383911132812, -0.8368072509765625, -0.7920761108398438, -0.747344970703125, -0.7026138305664062, -0.6578826904296875, -0.6131515502929688, -0.56842041015625, -0.5236892700195312, -0.4789581298828125, -0.43422698974609375, -0.389495849609375, -0.34476470947265625, -0.3000335693359375, -0.25530242919921875, -0.2105712890625, -0.16584014892578125, -0.1211090087890625, -0.07637786865234375, -0.031646728515625, 0.01308441162109375, 0.0578155517578125, 0.10254669189453125, 0.14727783203125, 0.19200897216796875, 0.2367401123046875, 0.28147125244140625, 0.326202392578125, 0.37093353271484375, 0.4156646728515625, 0.46039581298828125, 0.505126953125, 0.5498580932617188, 0.5945892333984375, 0.6393203735351562, 0.684051513671875, 0.7287826538085938, 0.7735137939453125, 0.8182449340820312, 0.86297607421875, 0.9077072143554688, 0.9524383544921875, 0.9971694946289062, 1.041900634765625, 1.0866317749023438, 1.1313629150390625, 1.1760940551757812, 1.2208251953125, 1.2655563354492188, 1.3102874755859375, 1.3550186157226562, 1.399749755859375, 1.4444808959960938, 1.4892120361328125, 1.5339431762695312, 1.57867431640625, 1.6234054565429688, 1.6681365966796875, 1.7128677368164062, 1.757598876953125, 1.8023300170898438, 1.8470611572265625, 1.8917922973632812, 1.9365234375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 5.0, 6.0, 10.0, 9.0, 10.0, 22.0, 18.0, 16.0, 30.0, 36.0, 37.0, 39.0, 57.0, 49.0, 51.0, 62.0, 56.0, 48.0, 65.0, 54.0, 52.0, 41.0, 49.0, 38.0, 32.0, 29.0, 14.0, 14.0, 12.0, 7.0, 13.0, 5.0, 6.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.315673828125, -0.30750274658203125, -0.2993316650390625, -0.29116058349609375, -0.282989501953125, -0.27481842041015625, -0.2666473388671875, -0.25847625732421875, -0.25030517578125, -0.24213409423828125, -0.2339630126953125, -0.22579193115234375, -0.217620849609375, -0.20944976806640625, -0.2012786865234375, -0.19310760498046875, -0.1849365234375, -0.17676544189453125, -0.1685943603515625, -0.16042327880859375, -0.152252197265625, -0.14408111572265625, -0.1359100341796875, -0.12773895263671875, -0.11956787109375, -0.11139678955078125, -0.1032257080078125, -0.09505462646484375, -0.086883544921875, -0.07871246337890625, -0.0705413818359375, -0.06237030029296875, -0.05419921875, -0.04602813720703125, -0.0378570556640625, -0.02968597412109375, -0.021514892578125, -0.01334381103515625, -0.0051727294921875, 0.00299835205078125, 0.01116943359375, 0.01934051513671875, 0.0275115966796875, 0.03568267822265625, 0.043853759765625, 0.05202484130859375, 0.0601959228515625, 0.06836700439453125, 0.0765380859375, 0.08470916748046875, 0.0928802490234375, 0.10105133056640625, 0.109222412109375, 0.11739349365234375, 0.1255645751953125, 0.13373565673828125, 0.14190673828125, 0.15007781982421875, 0.1582489013671875, 0.16641998291015625, 0.174591064453125, 0.18276214599609375, 0.1909332275390625, 0.19910430908203125, 0.207275390625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 7.0, 11.0, 10.0, 23.0, 16.0, 31.0, 45.0, 78.0, 96.0, 159.0, 256.0, 402.0, 610.0, 1158.0, 2028.0, 3846.0, 7894.0, 17072.0, 39619.0, 95452.0, 218615.0, 314615.0, 196789.0, 84295.0, 35041.0, 15334.0, 7058.0, 3562.0, 1904.0, 1018.0, 544.0, 352.0, 217.0, 135.0, 66.0, 65.0, 48.0, 27.0, 16.0, 20.0, 8.0, 5.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.89013671875, -0.8626861572265625, -0.835235595703125, -0.8077850341796875, -0.78033447265625, -0.7528839111328125, -0.725433349609375, -0.6979827880859375, -0.6705322265625, -0.6430816650390625, -0.615631103515625, -0.5881805419921875, -0.56072998046875, -0.5332794189453125, -0.505828857421875, -0.4783782958984375, -0.450927734375, -0.4234771728515625, -0.396026611328125, -0.3685760498046875, -0.34112548828125, -0.3136749267578125, -0.286224365234375, -0.2587738037109375, -0.2313232421875, -0.2038726806640625, -0.176422119140625, -0.1489715576171875, -0.12152099609375, -0.0940704345703125, -0.066619873046875, -0.0391693115234375, -0.01171875, 0.0157318115234375, 0.043182373046875, 0.0706329345703125, 0.09808349609375, 0.1255340576171875, 0.152984619140625, 0.1804351806640625, 0.2078857421875, 0.2353363037109375, 0.262786865234375, 0.2902374267578125, 0.31768798828125, 0.3451385498046875, 0.372589111328125, 0.4000396728515625, 0.427490234375, 0.4549407958984375, 0.482391357421875, 0.5098419189453125, 0.53729248046875, 0.5647430419921875, 0.592193603515625, 0.6196441650390625, 0.6470947265625, 0.6745452880859375, 0.701995849609375, 0.7294464111328125, 0.75689697265625, 0.7843475341796875, 0.811798095703125, 0.8392486572265625, 0.86669921875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 7.0, 6.0, 10.0, 3.0, 13.0, 11.0, 10.0, 12.0, 17.0, 21.0, 18.0, 24.0, 27.0, 19.0, 43.0, 40.0, 48.0, 60.0, 45.0, 39.0, 55.0, 48.0, 37.0, 50.0, 36.0, 41.0, 36.0, 29.0, 25.0, 32.0, 23.0, 20.0, 19.0, 15.0, 15.0, 16.0, 7.0, 10.0, 7.0, 2.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.2734375, -1.2375640869140625, -1.201690673828125, -1.1658172607421875, -1.12994384765625, -1.0940704345703125, -1.058197021484375, -1.0223236083984375, -0.9864501953125, -0.9505767822265625, -0.914703369140625, -0.8788299560546875, -0.84295654296875, -0.8070831298828125, -0.771209716796875, -0.7353363037109375, -0.699462890625, -0.6635894775390625, -0.627716064453125, -0.5918426513671875, -0.55596923828125, -0.5200958251953125, -0.484222412109375, -0.4483489990234375, -0.4124755859375, -0.3766021728515625, -0.340728759765625, -0.3048553466796875, -0.26898193359375, -0.2331085205078125, -0.197235107421875, -0.1613616943359375, -0.12548828125, -0.0896148681640625, -0.053741455078125, -0.0178680419921875, 0.01800537109375, 0.0538787841796875, 0.089752197265625, 0.1256256103515625, 0.1614990234375, 0.1973724365234375, 0.233245849609375, 0.2691192626953125, 0.30499267578125, 0.3408660888671875, 0.376739501953125, 0.4126129150390625, 0.448486328125, 0.4843597412109375, 0.520233154296875, 0.5561065673828125, 0.59197998046875, 0.6278533935546875, 0.663726806640625, 0.6996002197265625, 0.7354736328125, 0.7713470458984375, 0.807220458984375, 0.8430938720703125, 0.87896728515625, 0.9148406982421875, 0.950714111328125, 0.9865875244140625, 1.0224609375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 5.0, 14.0, 4.0, 10.0, 10.0, 19.0, 29.0, 35.0, 50.0, 78.0, 123.0, 173.0, 247.0, 447.0, 778.0, 1644.0, 3974.0, 11085.0, 39030.0, 178669.0, 519276.0, 223564.0, 47630.0, 13135.0, 4435.0, 1892.0, 877.0, 462.0, 297.0, 160.0, 115.0, 80.0, 55.0, 43.0, 29.0, 17.0, 15.0, 16.0, 8.0, 6.0, 7.0, 6.0, 2.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.79296875, -0.76934814453125, -0.7457275390625, -0.72210693359375, -0.698486328125, -0.67486572265625, -0.6512451171875, -0.62762451171875, -0.60400390625, -0.58038330078125, -0.5567626953125, -0.53314208984375, -0.509521484375, -0.48590087890625, -0.4622802734375, -0.43865966796875, -0.4150390625, -0.39141845703125, -0.3677978515625, -0.34417724609375, -0.320556640625, -0.29693603515625, -0.2733154296875, -0.24969482421875, -0.22607421875, -0.20245361328125, -0.1788330078125, -0.15521240234375, -0.131591796875, -0.10797119140625, -0.0843505859375, -0.06072998046875, -0.037109375, -0.01348876953125, 0.0101318359375, 0.03375244140625, 0.057373046875, 0.08099365234375, 0.1046142578125, 0.12823486328125, 0.15185546875, 0.17547607421875, 0.1990966796875, 0.22271728515625, 0.246337890625, 0.26995849609375, 0.2935791015625, 0.31719970703125, 0.3408203125, 0.36444091796875, 0.3880615234375, 0.41168212890625, 0.435302734375, 0.45892333984375, 0.4825439453125, 0.50616455078125, 0.52978515625, 0.55340576171875, 0.5770263671875, 0.60064697265625, 0.624267578125, 0.64788818359375, 0.6715087890625, 0.69512939453125, 0.71875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 6.0, 5.0, 9.0, 11.0, 17.0, 5.0, 24.0, 45.0, 60.0, 75.0, 98.0, 110.0, 109.0, 105.0, 79.0, 72.0, 53.0, 49.0, 26.0, 24.0, 7.0, 4.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00021409988403320312, -0.0002090558409690857, -0.00020401179790496826, -0.00019896775484085083, -0.0001939237117767334, -0.00018887966871261597, -0.00018383562564849854, -0.0001787915825843811, -0.00017374753952026367, -0.00016870349645614624, -0.0001636594533920288, -0.00015861541032791138, -0.00015357136726379395, -0.00014852732419967651, -0.00014348328113555908, -0.00013843923807144165, -0.00013339519500732422, -0.0001283511519432068, -0.00012330710887908936, -0.00011826306581497192, -0.00011321902275085449, -0.00010817497968673706, -0.00010313093662261963, -9.80868935585022e-05, -9.304285049438477e-05, -8.799880743026733e-05, -8.29547643661499e-05, -7.791072130203247e-05, -7.286667823791504e-05, -6.782263517379761e-05, -6.277859210968018e-05, -5.7734549045562744e-05, -5.269050598144531e-05, -4.764646291732788e-05, -4.260241985321045e-05, -3.755837678909302e-05, -3.2514333724975586e-05, -2.7470290660858154e-05, -2.2426247596740723e-05, -1.738220453262329e-05, -1.233816146850586e-05, -7.294118404388428e-06, -2.250075340270996e-06, 2.7939677238464355e-06, 7.838010787963867e-06, 1.2882053852081299e-05, 1.792609691619873e-05, 2.2970139980316162e-05, 2.8014183044433594e-05, 3.3058226108551025e-05, 3.810226917266846e-05, 4.314631223678589e-05, 4.819035530090332e-05, 5.323439836502075e-05, 5.8278441429138184e-05, 6.332248449325562e-05, 6.836652755737305e-05, 7.341057062149048e-05, 7.845461368560791e-05, 8.349865674972534e-05, 8.854269981384277e-05, 9.35867428779602e-05, 9.863078594207764e-05, 0.00010367482900619507, 0.0001087188720703125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 5.0, 6.0, 10.0, 9.0, 10.0, 22.0, 22.0, 37.0, 43.0, 90.0, 108.0, 154.0, 286.0, 503.0, 925.0, 1887.0, 4525.0, 12544.0, 44087.0, 183312.0, 464469.0, 248054.0, 60320.0, 16660.0, 5696.0, 2286.0, 1068.0, 544.0, 295.0, 196.0, 126.0, 70.0, 53.0, 41.0, 28.0, 28.0, 11.0, 13.0, 7.0, 5.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.6083984375, -0.5871353149414062, -0.5658721923828125, -0.5446090698242188, -0.523345947265625, -0.5020828247070312, -0.4808197021484375, -0.45955657958984375, -0.43829345703125, -0.41703033447265625, -0.3957672119140625, -0.37450408935546875, -0.353240966796875, -0.33197784423828125, -0.3107147216796875, -0.28945159912109375, -0.2681884765625, -0.24692535400390625, -0.2256622314453125, -0.20439910888671875, -0.183135986328125, -0.16187286376953125, -0.1406097412109375, -0.11934661865234375, -0.09808349609375, -0.07682037353515625, -0.0555572509765625, -0.03429412841796875, -0.013031005859375, 0.00823211669921875, 0.0294952392578125, 0.05075836181640625, 0.072021484375, 0.09328460693359375, 0.1145477294921875, 0.13581085205078125, 0.157073974609375, 0.17833709716796875, 0.1996002197265625, 0.22086334228515625, 0.24212646484375, 0.26338958740234375, 0.2846527099609375, 0.30591583251953125, 0.327178955078125, 0.34844207763671875, 0.3697052001953125, 0.39096832275390625, 0.4122314453125, 0.43349456787109375, 0.4547576904296875, 0.47602081298828125, 0.497283935546875, 0.5185470581054688, 0.5398101806640625, 0.5610733032226562, 0.58233642578125, 0.6035995483398438, 0.6248626708984375, 0.6461257934570312, 0.667388916015625, 0.6886520385742188, 0.7099151611328125, 0.7311782836914062, 0.75244140625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 4.0, 5.0, 9.0, 7.0, 13.0, 11.0, 13.0, 22.0, 29.0, 22.0, 34.0, 38.0, 44.0, 68.0, 69.0, 67.0, 67.0, 69.0, 71.0, 65.0, 39.0, 45.0, 41.0, 29.0, 19.0, 10.0, 14.0, 12.0, 10.0, 7.0, 7.0, 2.0, 4.0, 7.0, 5.0, 3.0, 5.0, 5.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.74560546875, -0.7225341796875, -0.699462890625, -0.6763916015625, -0.6533203125, -0.6302490234375, -0.607177734375, -0.5841064453125, -0.56103515625, -0.5379638671875, -0.514892578125, -0.4918212890625, -0.46875, -0.4456787109375, -0.422607421875, -0.3995361328125, -0.37646484375, -0.3533935546875, -0.330322265625, -0.3072509765625, -0.2841796875, -0.2611083984375, -0.238037109375, -0.2149658203125, -0.19189453125, -0.1688232421875, -0.145751953125, -0.1226806640625, -0.099609375, -0.0765380859375, -0.053466796875, -0.0303955078125, -0.00732421875, 0.0157470703125, 0.038818359375, 0.0618896484375, 0.0849609375, 0.1080322265625, 0.131103515625, 0.1541748046875, 0.17724609375, 0.2003173828125, 0.223388671875, 0.2464599609375, 0.26953125, 0.2926025390625, 0.315673828125, 0.3387451171875, 0.36181640625, 0.3848876953125, 0.407958984375, 0.4310302734375, 0.4541015625, 0.4771728515625, 0.500244140625, 0.5233154296875, 0.54638671875, 0.5694580078125, 0.592529296875, 0.6156005859375, 0.638671875, 0.6617431640625, 0.684814453125, 0.7078857421875, 0.73095703125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 5.0, 13.0, 9.0, 16.0, 21.0, 23.0, 38.0, 52.0, 58.0, 64.0, 91.0, 110.0, 95.0, 96.0, 75.0, 80.0, 45.0, 29.0, 26.0, 19.0, 13.0, 6.0, 9.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.674462795257568, -7.398504257202148, -7.12254524230957, -6.84658670425415, -6.5706281661987305, -6.2946696281433105, -6.018711090087891, -5.7427520751953125, -5.466793537139893, -5.190834999084473, -4.9148759841918945, -4.638917446136475, -4.362958908081055, -4.087000370025635, -3.8110415935516357, -3.5350828170776367, -3.259124279022217, -2.983165740966797, -2.707206964492798, -2.431248188018799, -2.155289649963379, -1.8793309926986694, -1.60337233543396, -1.3274136781692505, -1.051455020904541, -0.7754963636398315, -0.49953770637512207, -0.2235790491104126, 0.052379608154296875, 0.32833826541900635, 0.6042969226837158, 0.8802555799484253, 1.1562137603759766, 1.432172417640686, 1.7081310749053955, 1.984089732170105, 2.2600483894348145, 2.5360069274902344, 2.8119657039642334, 3.0879244804382324, 3.3638830184936523, 3.6398415565490723, 3.9158003330230713, 4.19175910949707, 4.46771764755249, 4.74367618560791, 5.019635200500488, 5.295593738555908, 5.571552276611328, 5.847510814666748, 6.123469352722168, 6.399428367614746, 6.675386905670166, 6.951345443725586, 7.227304458618164, 7.503262996673584, 7.779221534729004, 8.055180549621582, 8.331138610839844, 8.607097625732422, 8.883056640625, 9.159014701843262, 9.43497371673584, 9.710931777954102, 9.98689079284668]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 5.0, 6.0, 3.0, 4.0, 8.0, 13.0, 15.0, 16.0, 18.0, 28.0, 30.0, 43.0, 42.0, 33.0, 40.0, 47.0, 38.0, 52.0, 51.0, 48.0, 50.0, 51.0, 48.0, 47.0, 31.0, 24.0, 39.0, 25.0, 24.0, 19.0, 27.0, 14.0, 18.0, 16.0, 10.0, 11.0, 2.0, 6.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.42227029800415, -6.211087703704834, -5.999905586242676, -5.788722991943359, -5.577540397644043, -5.366357803344727, -5.155175685882568, -4.943993091583252, -4.7328104972839355, -4.521627902984619, -4.310445785522461, -4.0992631912231445, -3.888080596923828, -3.676898241043091, -3.4657158851623535, -3.254533290863037, -3.0433509349823, -2.8321685791015625, -2.620985984802246, -2.409803628921509, -2.1986210346221924, -1.987438678741455, -1.7762562036514282, -1.5650737285614014, -1.3538912534713745, -1.1427087783813477, -0.9315263032913208, -0.7203438878059387, -0.5091614127159119, -0.2979789972305298, -0.08679652214050293, 0.12438595294952393, 0.3355684280395508, 0.5467509031295776, 0.7579333782196045, 0.9691157937049866, 1.1802983283996582, 1.3914806842803955, 1.6026631593704224, 1.8138456344604492, 2.0250282287597656, 2.236210584640503, 2.4473931789398193, 2.6585755348205566, 2.869758129119873, 3.0809404850006104, 3.2921228408813477, 3.503305435180664, 3.7144877910614014, 3.9256701469421387, 4.136852741241455, 4.3480353355407715, 4.55921745300293, 4.770400047302246, 4.9815826416015625, 5.192765235900879, 5.403947353363037, 5.6151299476623535, 5.826312065124512, 6.037494659423828, 6.2486772537231445, 6.459859848022461, 6.671041965484619, 6.8822245597839355, 7.093407154083252]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 3.0, 4.0, 1.0, 8.0, 6.0, 16.0, 14.0, 30.0, 31.0, 64.0, 86.0, 107.0, 212.0, 317.0, 636.0, 1266.0, 2709.0, 6774.0, 21637.0, 188841.0, 3914834.0, 39646.0, 9733.0, 3685.0, 1679.0, 843.0, 443.0, 246.0, 139.0, 89.0, 67.0, 46.0, 19.0, 11.0, 13.0, 8.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7841796875, -1.726959228515625, -1.66973876953125, -1.612518310546875, -1.5552978515625, -1.498077392578125, -1.44085693359375, -1.383636474609375, -1.326416015625, -1.269195556640625, -1.21197509765625, -1.154754638671875, -1.0975341796875, -1.040313720703125, -0.98309326171875, -0.925872802734375, -0.86865234375, -0.811431884765625, -0.75421142578125, -0.696990966796875, -0.6397705078125, -0.582550048828125, -0.52532958984375, -0.468109130859375, -0.410888671875, -0.353668212890625, -0.29644775390625, -0.239227294921875, -0.1820068359375, -0.124786376953125, -0.06756591796875, -0.010345458984375, 0.046875, 0.104095458984375, 0.16131591796875, 0.218536376953125, 0.2757568359375, 0.332977294921875, 0.39019775390625, 0.447418212890625, 0.504638671875, 0.561859130859375, 0.61907958984375, 0.676300048828125, 0.7335205078125, 0.790740966796875, 0.84796142578125, 0.905181884765625, 0.96240234375, 1.019622802734375, 1.07684326171875, 1.134063720703125, 1.1912841796875, 1.248504638671875, 1.30572509765625, 1.362945556640625, 1.420166015625, 1.477386474609375, 1.53460693359375, 1.591827392578125, 1.6490478515625, 1.706268310546875, 1.76348876953125, 1.820709228515625, 1.8779296875]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 6.0, 1.0, 2.0, 2.0, 2.0, 6.0, 7.0, 7.0, 11.0, 19.0, 25.0, 19.0, 20.0, 37.0, 43.0, 33.0, 43.0, 51.0, 57.0, 45.0, 58.0, 62.0, 58.0, 48.0, 43.0, 64.0, 37.0, 34.0, 32.0, 28.0, 21.0, 19.0, 10.0, 17.0, 19.0, 7.0, 2.0, 3.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.3671875, -0.3572845458984375, -0.347381591796875, -0.3374786376953125, -0.32757568359375, -0.3176727294921875, -0.307769775390625, -0.2978668212890625, -0.2879638671875, -0.2780609130859375, -0.268157958984375, -0.2582550048828125, -0.24835205078125, -0.2384490966796875, -0.228546142578125, -0.2186431884765625, -0.208740234375, -0.1988372802734375, -0.188934326171875, -0.1790313720703125, -0.16912841796875, -0.1592254638671875, -0.149322509765625, -0.1394195556640625, -0.1295166015625, -0.1196136474609375, -0.109710693359375, -0.0998077392578125, -0.08990478515625, -0.0800018310546875, -0.070098876953125, -0.0601959228515625, -0.05029296875, -0.0403900146484375, -0.030487060546875, -0.0205841064453125, -0.01068115234375, -0.0007781982421875, 0.009124755859375, 0.0190277099609375, 0.0289306640625, 0.0388336181640625, 0.048736572265625, 0.0586395263671875, 0.06854248046875, 0.0784454345703125, 0.088348388671875, 0.0982513427734375, 0.108154296875, 0.1180572509765625, 0.127960205078125, 0.1378631591796875, 0.14776611328125, 0.1576690673828125, 0.167572021484375, 0.1774749755859375, 0.1873779296875, 0.1972808837890625, 0.207183837890625, 0.2170867919921875, 0.22698974609375, 0.2368927001953125, 0.246795654296875, 0.2566986083984375, 0.2666015625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 7.0, 8.0, 6.0, 6.0, 8.0, 20.0, 20.0, 30.0, 49.0, 68.0, 86.0, 137.0, 201.0, 347.0, 453.0, 735.0, 1262.0, 2322.0, 4892.0, 12614.0, 51828.0, 3923668.0, 158905.0, 22028.0, 7153.0, 3198.0, 1563.0, 960.0, 606.0, 339.0, 241.0, 167.0, 129.0, 76.0, 43.0, 35.0, 28.0, 13.0, 9.0, 9.0, 8.0, 6.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.626953125, -2.549072265625, -2.47119140625, -2.393310546875, -2.3154296875, -2.237548828125, -2.15966796875, -2.081787109375, -2.00390625, -1.926025390625, -1.84814453125, -1.770263671875, -1.6923828125, -1.614501953125, -1.53662109375, -1.458740234375, -1.380859375, -1.302978515625, -1.22509765625, -1.147216796875, -1.0693359375, -0.991455078125, -0.91357421875, -0.835693359375, -0.7578125, -0.679931640625, -0.60205078125, -0.524169921875, -0.4462890625, -0.368408203125, -0.29052734375, -0.212646484375, -0.134765625, -0.056884765625, 0.02099609375, 0.098876953125, 0.1767578125, 0.254638671875, 0.33251953125, 0.410400390625, 0.48828125, 0.566162109375, 0.64404296875, 0.721923828125, 0.7998046875, 0.877685546875, 0.95556640625, 1.033447265625, 1.111328125, 1.189208984375, 1.26708984375, 1.344970703125, 1.4228515625, 1.500732421875, 1.57861328125, 1.656494140625, 1.734375, 1.812255859375, 1.89013671875, 1.968017578125, 2.0458984375, 2.123779296875, 2.20166015625, 2.279541015625, 2.357421875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 6.0, 2.0, 5.0, 17.0, 25.0, 21.0, 58.0, 196.0, 3425.0, 193.0, 50.0, 28.0, 12.0, 9.0, 6.0, 5.0, 6.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6943359375, -0.6729583740234375, -0.651580810546875, -0.6302032470703125, -0.60882568359375, -0.5874481201171875, -0.566070556640625, -0.5446929931640625, -0.5233154296875, -0.5019378662109375, -0.480560302734375, -0.4591827392578125, -0.43780517578125, -0.4164276123046875, -0.395050048828125, -0.3736724853515625, -0.352294921875, -0.3309173583984375, -0.309539794921875, -0.2881622314453125, -0.26678466796875, -0.2454071044921875, -0.224029541015625, -0.2026519775390625, -0.1812744140625, -0.1598968505859375, -0.138519287109375, -0.1171417236328125, -0.09576416015625, -0.0743865966796875, -0.053009033203125, -0.0316314697265625, -0.01025390625, 0.0111236572265625, 0.032501220703125, 0.0538787841796875, 0.07525634765625, 0.0966339111328125, 0.118011474609375, 0.1393890380859375, 0.1607666015625, 0.1821441650390625, 0.203521728515625, 0.2248992919921875, 0.24627685546875, 0.2676544189453125, 0.289031982421875, 0.3104095458984375, 0.331787109375, 0.3531646728515625, 0.374542236328125, 0.3959197998046875, 0.41729736328125, 0.4386749267578125, 0.460052490234375, 0.4814300537109375, 0.5028076171875, 0.5241851806640625, 0.545562744140625, 0.5669403076171875, 0.58831787109375, 0.6096954345703125, 0.631072998046875, 0.6524505615234375, 0.673828125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 11.0, 30.0, 36.0, 76.0, 156.0, 237.0, 205.0, 133.0, 66.0, 32.0, 13.0, 7.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.628856658935547, -5.503933906555176, -5.379011631011963, -5.254088878631592, -5.129166603088379, -5.004243850708008, -4.879321575164795, -4.754398822784424, -4.629476547241211, -4.50455379486084, -4.379631519317627, -4.254708766937256, -4.129786491394043, -4.004863739013672, -3.87994122505188, -3.755018711090088, -3.630095958709717, -3.505173444747925, -3.380250930786133, -3.255328416824341, -3.130405902862549, -3.0054831504821777, -2.8805606365203857, -2.7556381225585938, -2.6307156085968018, -2.5057930946350098, -2.3808705806732178, -2.255948066711426, -2.1310253143310547, -2.006103038787842, -1.8811802864074707, -1.7562577724456787, -1.6313354969024658, -1.5064129829406738, -1.3814904689788818, -1.2565678358078003, -1.1316453218460083, -1.0067228078842163, -0.8818002343177795, -0.7568776607513428, -0.6319551467895508, -0.5070326328277588, -0.382110059261322, -0.25718751549720764, -0.13226497173309326, -0.0073424577713012695, 0.1175801157951355, 0.24250268936157227, 0.36742520332336426, 0.49234774708747864, 0.617270290851593, 0.7421928644180298, 0.8671153783798218, 0.9920378923416138, 1.1169605255126953, 1.2418830394744873, 1.3668055534362793, 1.4917280673980713, 1.6166505813598633, 1.7415732145309448, 1.8664957284927368, 1.9914182424545288, 2.1163408756256104, 2.2412633895874023, 2.3661859035491943]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 0.0, 5.0, 15.0, 8.0, 13.0, 17.0, 26.0, 18.0, 22.0, 46.0, 35.0, 31.0, 38.0, 41.0, 58.0, 36.0, 44.0, 59.0, 42.0, 44.0, 49.0, 45.0, 34.0, 41.0, 33.0, 34.0, 26.0, 28.0, 17.0, 26.0, 10.0, 11.0, 10.0, 12.0, 9.0, 10.0, 2.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.464925765991211, -1.4220956563949585, -1.379265546798706, -1.3364355564117432, -1.2936054468154907, -1.2507753372192383, -1.2079452276229858, -1.1651151180267334, -1.1222851276397705, -1.079455018043518, -1.0366249084472656, -0.993794858455658, -0.9509648084640503, -0.9081346988677979, -0.8653045892715454, -0.822474479675293, -0.7796443700790405, -0.7368142604827881, -0.6939842104911804, -0.651154100894928, -0.6083240509033203, -0.5654939413070679, -0.5226638317108154, -0.4798337519168854, -0.4370036721229553, -0.39417359232902527, -0.3513435125350952, -0.3085134029388428, -0.2656833231449127, -0.22285324335098267, -0.18002313375473022, -0.13719305396080017, -0.09436297416687012, -0.05153288692235947, -0.008702799677848816, 0.03412729501724243, 0.07695737481117249, 0.11978745460510254, 0.16261756420135498, 0.20544764399528503, 0.2482777237892151, 0.29110780358314514, 0.3339378833770752, 0.37676799297332764, 0.4195980727672577, 0.46242815256118774, 0.5052582621574402, 0.5480883121490479, 0.5909184217453003, 0.6337485313415527, 0.6765785813331604, 0.7194086909294128, 0.7622387409210205, 0.805068850517273, 0.8478989601135254, 0.8907290697097778, 0.9335591197013855, 0.9763892292976379, 1.0192192792892456, 1.062049388885498, 1.1048794984817505, 1.147709608078003, 1.1905395984649658, 1.2333697080612183, 1.2761998176574707]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 6.0, 5.0, 3.0, 12.0, 14.0, 30.0, 52.0, 80.0, 157.0, 281.0, 454.0, 918.0, 1787.0, 3550.0, 7353.0, 15511.0, 33989.0, 73958.0, 148639.0, 240609.0, 238310.0, 147201.0, 72405.0, 33504.0, 15392.0, 7129.0, 3550.0, 1717.0, 869.0, 457.0, 259.0, 151.0, 91.0, 44.0, 30.0, 23.0, 13.0, 3.0, 2.0, 3.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.173828125, -1.13824462890625, -1.1026611328125, -1.06707763671875, -1.031494140625, -0.99591064453125, -0.9603271484375, -0.92474365234375, -0.88916015625, -0.85357666015625, -0.8179931640625, -0.78240966796875, -0.746826171875, -0.71124267578125, -0.6756591796875, -0.64007568359375, -0.6044921875, -0.56890869140625, -0.5333251953125, -0.49774169921875, -0.462158203125, -0.42657470703125, -0.3909912109375, -0.35540771484375, -0.31982421875, -0.28424072265625, -0.2486572265625, -0.21307373046875, -0.177490234375, -0.14190673828125, -0.1063232421875, -0.07073974609375, -0.03515625, 0.00042724609375, 0.0360107421875, 0.07159423828125, 0.107177734375, 0.14276123046875, 0.1783447265625, 0.21392822265625, 0.24951171875, 0.28509521484375, 0.3206787109375, 0.35626220703125, 0.391845703125, 0.42742919921875, 0.4630126953125, 0.49859619140625, 0.5341796875, 0.56976318359375, 0.6053466796875, 0.64093017578125, 0.676513671875, 0.71209716796875, 0.7476806640625, 0.78326416015625, 0.81884765625, 0.85443115234375, 0.8900146484375, 0.92559814453125, 0.961181640625, 0.99676513671875, 1.0323486328125, 1.06793212890625, 1.103515625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 3.0, 7.0, 12.0, 11.0, 14.0, 17.0, 10.0, 27.0, 19.0, 31.0, 32.0, 29.0, 32.0, 49.0, 43.0, 50.0, 41.0, 58.0, 56.0, 52.0, 54.0, 49.0, 45.0, 42.0, 36.0, 27.0, 31.0, 21.0, 24.0, 17.0, 11.0, 13.0, 8.0, 10.0, 6.0, 4.0, 5.0, 5.0, 3.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.4580078125, -0.4446563720703125, -0.431304931640625, -0.4179534912109375, -0.40460205078125, -0.3912506103515625, -0.377899169921875, -0.3645477294921875, -0.3511962890625, -0.3378448486328125, -0.324493408203125, -0.3111419677734375, -0.29779052734375, -0.2844390869140625, -0.271087646484375, -0.2577362060546875, -0.244384765625, -0.2310333251953125, -0.217681884765625, -0.2043304443359375, -0.19097900390625, -0.1776275634765625, -0.164276123046875, -0.1509246826171875, -0.1375732421875, -0.1242218017578125, -0.110870361328125, -0.0975189208984375, -0.08416748046875, -0.0708160400390625, -0.057464599609375, -0.0441131591796875, -0.03076171875, -0.0174102783203125, -0.004058837890625, 0.0092926025390625, 0.02264404296875, 0.0359954833984375, 0.049346923828125, 0.0626983642578125, 0.0760498046875, 0.0894012451171875, 0.102752685546875, 0.1161041259765625, 0.12945556640625, 0.1428070068359375, 0.156158447265625, 0.1695098876953125, 0.182861328125, 0.1962127685546875, 0.209564208984375, 0.2229156494140625, 0.23626708984375, 0.2496185302734375, 0.262969970703125, 0.2763214111328125, 0.2896728515625, 0.3030242919921875, 0.316375732421875, 0.3297271728515625, 0.34307861328125, 0.3564300537109375, 0.369781494140625, 0.3831329345703125, 0.396484375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 6.0, 11.0, 15.0, 18.0, 13.0, 38.0, 42.0, 63.0, 108.0, 191.0, 284.0, 478.0, 799.0, 1413.0, 2912.0, 5714.0, 11717.0, 25127.0, 57290.0, 130340.0, 266453.0, 286366.0, 142855.0, 62615.0, 27816.0, 12799.0, 6214.0, 3078.0, 1620.0, 882.0, 472.0, 305.0, 178.0, 88.0, 71.0, 52.0, 32.0, 23.0, 15.0, 9.0, 6.0, 10.0, 6.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2236328125, -1.184234619140625, -1.14483642578125, -1.105438232421875, -1.0660400390625, -1.026641845703125, -0.98724365234375, -0.947845458984375, -0.908447265625, -0.869049072265625, -0.82965087890625, -0.790252685546875, -0.7508544921875, -0.711456298828125, -0.67205810546875, -0.632659912109375, -0.59326171875, -0.553863525390625, -0.51446533203125, -0.475067138671875, -0.4356689453125, -0.396270751953125, -0.35687255859375, -0.317474365234375, -0.278076171875, -0.238677978515625, -0.19927978515625, -0.159881591796875, -0.1204833984375, -0.081085205078125, -0.04168701171875, -0.002288818359375, 0.037109375, 0.076507568359375, 0.11590576171875, 0.155303955078125, 0.1947021484375, 0.234100341796875, 0.27349853515625, 0.312896728515625, 0.352294921875, 0.391693115234375, 0.43109130859375, 0.470489501953125, 0.5098876953125, 0.549285888671875, 0.58868408203125, 0.628082275390625, 0.66748046875, 0.706878662109375, 0.74627685546875, 0.785675048828125, 0.8250732421875, 0.864471435546875, 0.90386962890625, 0.943267822265625, 0.982666015625, 1.022064208984375, 1.06146240234375, 1.100860595703125, 1.1402587890625, 1.179656982421875, 1.21905517578125, 1.258453369140625, 1.2978515625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 7.0, 8.0, 3.0, 11.0, 7.0, 11.0, 19.0, 17.0, 22.0, 12.0, 21.0, 24.0, 26.0, 26.0, 20.0, 41.0, 35.0, 32.0, 38.0, 44.0, 45.0, 38.0, 53.0, 29.0, 39.0, 53.0, 38.0, 29.0, 28.0, 32.0, 36.0, 25.0, 25.0, 21.0, 13.0, 16.0, 7.0, 16.0, 7.0, 8.0, 5.0, 9.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.2109375, -2.1473541259765625, -2.083770751953125, -2.0201873779296875, -1.95660400390625, -1.8930206298828125, -1.829437255859375, -1.7658538818359375, -1.7022705078125, -1.6386871337890625, -1.575103759765625, -1.5115203857421875, -1.44793701171875, -1.3843536376953125, -1.320770263671875, -1.2571868896484375, -1.193603515625, -1.1300201416015625, -1.066436767578125, -1.0028533935546875, -0.93927001953125, -0.8756866455078125, -0.812103271484375, -0.7485198974609375, -0.6849365234375, -0.6213531494140625, -0.557769775390625, -0.4941864013671875, -0.43060302734375, -0.3670196533203125, -0.303436279296875, -0.2398529052734375, -0.17626953125, -0.1126861572265625, -0.049102783203125, 0.0144805908203125, 0.07806396484375, 0.1416473388671875, 0.205230712890625, 0.2688140869140625, 0.3323974609375, 0.3959808349609375, 0.459564208984375, 0.5231475830078125, 0.58673095703125, 0.6503143310546875, 0.713897705078125, 0.7774810791015625, 0.841064453125, 0.9046478271484375, 0.968231201171875, 1.0318145751953125, 1.09539794921875, 1.1589813232421875, 1.222564697265625, 1.2861480712890625, 1.3497314453125, 1.4133148193359375, 1.476898193359375, 1.5404815673828125, 1.60406494140625, 1.6676483154296875, 1.731231689453125, 1.7948150634765625, 1.8583984375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 8.0, 5.0, 13.0, 20.0, 30.0, 35.0, 71.0, 94.0, 182.0, 320.0, 698.0, 1730.0, 6211.0, 44758.0, 846406.0, 133174.0, 10307.0, 2667.0, 880.0, 408.0, 218.0, 116.0, 72.0, 49.0, 34.0, 16.0, 9.0, 12.0, 3.0, 8.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.498046875, -2.42156982421875, -2.3450927734375, -2.26861572265625, -2.192138671875, -2.11566162109375, -2.0391845703125, -1.96270751953125, -1.88623046875, -1.80975341796875, -1.7332763671875, -1.65679931640625, -1.580322265625, -1.50384521484375, -1.4273681640625, -1.35089111328125, -1.2744140625, -1.19793701171875, -1.1214599609375, -1.04498291015625, -0.968505859375, -0.89202880859375, -0.8155517578125, -0.73907470703125, -0.66259765625, -0.58612060546875, -0.5096435546875, -0.43316650390625, -0.356689453125, -0.28021240234375, -0.2037353515625, -0.12725830078125, -0.05078125, 0.02569580078125, 0.1021728515625, 0.17864990234375, 0.255126953125, 0.33160400390625, 0.4080810546875, 0.48455810546875, 0.56103515625, 0.63751220703125, 0.7139892578125, 0.79046630859375, 0.866943359375, 0.94342041015625, 1.0198974609375, 1.09637451171875, 1.1728515625, 1.24932861328125, 1.3258056640625, 1.40228271484375, 1.478759765625, 1.55523681640625, 1.6317138671875, 1.70819091796875, 1.78466796875, 1.86114501953125, 1.9376220703125, 2.01409912109375, 2.090576171875, 2.16705322265625, 2.2435302734375, 2.32000732421875, 2.396484375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 6.0, 10.0, 4.0, 12.0, 14.0, 14.0, 25.0, 27.0, 22.0, 39.0, 35.0, 54.0, 74.0, 60.0, 73.0, 70.0, 66.0, 70.0, 55.0, 46.0, 52.0, 33.0, 32.0, 15.0, 21.0, 16.0, 16.0, 8.0, 4.0, 5.0, 5.0, 5.0, 1.0, 0.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015234947204589844, -0.00014814548194408417, -0.0001439414918422699, -0.00013973750174045563, -0.00013553351163864136, -0.0001313295215368271, -0.00012712553143501282, -0.00012292154133319855, -0.00011871755123138428, -0.00011451356112957001, -0.00011030957102775574, -0.00010610558092594147, -0.0001019015908241272, -9.769760072231293e-05, -9.349361062049866e-05, -8.928962051868439e-05, -8.508563041687012e-05, -8.088164031505585e-05, -7.667765021324158e-05, -7.247366011142731e-05, -6.826967000961304e-05, -6.406567990779877e-05, -5.98616898059845e-05, -5.565769970417023e-05, -5.145370960235596e-05, -4.724971950054169e-05, -4.304572939872742e-05, -3.884173929691315e-05, -3.463774919509888e-05, -3.0433759093284607e-05, -2.6229768991470337e-05, -2.2025778889656067e-05, -1.7821788787841797e-05, -1.3617798686027527e-05, -9.413808584213257e-06, -5.209818482398987e-06, -1.0058283805847168e-06, 3.1981617212295532e-06, 7.402151823043823e-06, 1.1606141924858093e-05, 1.5810132026672363e-05, 2.0014122128486633e-05, 2.4218112230300903e-05, 2.8422102332115173e-05, 3.262609243392944e-05, 3.683008253574371e-05, 4.1034072637557983e-05, 4.5238062739372253e-05, 4.9442052841186523e-05, 5.3646042943000793e-05, 5.7850033044815063e-05, 6.205402314662933e-05, 6.62580132484436e-05, 7.046200335025787e-05, 7.466599345207214e-05, 7.886998355388641e-05, 8.307397365570068e-05, 8.727796375751495e-05, 9.148195385932922e-05, 9.56859439611435e-05, 9.988993406295776e-05, 0.00010409392416477203, 0.0001082979142665863, 0.00011250190436840057, 0.00011670589447021484]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 5.0, 5.0, 7.0, 10.0, 18.0, 36.0, 51.0, 79.0, 149.0, 335.0, 774.0, 1951.0, 6735.0, 40812.0, 496534.0, 453748.0, 37717.0, 6274.0, 1904.0, 692.0, 353.0, 149.0, 62.0, 60.0, 31.0, 10.0, 11.0, 7.0, 11.0, 3.0, 6.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0], "bins": [-1.6357421875, -1.5845947265625, -1.533447265625, -1.4822998046875, -1.43115234375, -1.3800048828125, -1.328857421875, -1.2777099609375, -1.2265625, -1.1754150390625, -1.124267578125, -1.0731201171875, -1.02197265625, -0.9708251953125, -0.919677734375, -0.8685302734375, -0.8173828125, -0.7662353515625, -0.715087890625, -0.6639404296875, -0.61279296875, -0.5616455078125, -0.510498046875, -0.4593505859375, -0.408203125, -0.3570556640625, -0.305908203125, -0.2547607421875, -0.20361328125, -0.1524658203125, -0.101318359375, -0.0501708984375, 0.0009765625, 0.0521240234375, 0.103271484375, 0.1544189453125, 0.20556640625, 0.2567138671875, 0.307861328125, 0.3590087890625, 0.41015625, 0.4613037109375, 0.512451171875, 0.5635986328125, 0.61474609375, 0.6658935546875, 0.717041015625, 0.7681884765625, 0.8193359375, 0.8704833984375, 0.921630859375, 0.9727783203125, 1.02392578125, 1.0750732421875, 1.126220703125, 1.1773681640625, 1.228515625, 1.2796630859375, 1.330810546875, 1.3819580078125, 1.43310546875, 1.4842529296875, 1.535400390625, 1.5865478515625, 1.6376953125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 7.0, 7.0, 7.0, 17.0, 22.0, 18.0, 41.0, 55.0, 79.0, 120.0, 157.0, 119.0, 109.0, 69.0, 50.0, 46.0, 22.0, 23.0, 5.0, 7.0, 4.0, 3.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.248046875, -2.183563232421875, -2.11907958984375, -2.054595947265625, -1.9901123046875, -1.925628662109375, -1.86114501953125, -1.796661376953125, -1.732177734375, -1.667694091796875, -1.60321044921875, -1.538726806640625, -1.4742431640625, -1.409759521484375, -1.34527587890625, -1.280792236328125, -1.21630859375, -1.151824951171875, -1.08734130859375, -1.022857666015625, -0.9583740234375, -0.893890380859375, -0.82940673828125, -0.764923095703125, -0.700439453125, -0.635955810546875, -0.57147216796875, -0.506988525390625, -0.4425048828125, -0.378021240234375, -0.31353759765625, -0.249053955078125, -0.1845703125, -0.120086669921875, -0.05560302734375, 0.008880615234375, 0.0733642578125, 0.137847900390625, 0.20233154296875, 0.266815185546875, 0.331298828125, 0.395782470703125, 0.46026611328125, 0.524749755859375, 0.5892333984375, 0.653717041015625, 0.71820068359375, 0.782684326171875, 0.84716796875, 0.911651611328125, 0.97613525390625, 1.040618896484375, 1.1051025390625, 1.169586181640625, 1.23406982421875, 1.298553466796875, 1.363037109375, 1.427520751953125, 1.49200439453125, 1.556488037109375, 1.6209716796875, 1.685455322265625, 1.74993896484375, 1.814422607421875, 1.87890625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 12.0, 28.0, 81.0, 177.0, 293.0, 234.0, 147.0, 33.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.814849853515625, -60.18119812011719, -58.54754638671875, -56.91389083862305, -55.28023910522461, -53.64658737182617, -52.012935638427734, -50.37928009033203, -48.745628356933594, -47.111976623535156, -45.47832489013672, -43.844669342041016, -42.21101760864258, -40.57736587524414, -38.9437141418457, -37.31005859375, -35.67640686035156, -34.042755126953125, -32.40910339355469, -30.775449752807617, -29.141796112060547, -27.50814437866211, -25.874492645263672, -24.2408390045166, -22.607189178466797, -20.97353744506836, -19.33988380432129, -17.70623207092285, -16.07257843017578, -14.438926696777344, -12.80527400970459, -11.171621322631836, -9.537967681884766, -7.904314994812012, -6.270662307739258, -4.637010097503662, -3.003357410430908, -1.3697052001953125, 0.2639474868774414, 1.8976001739501953, 3.531252861022949, 5.164905548095703, 6.798558235168457, 8.432210922241211, 10.065862655639648, 11.699515342712402, 13.333168029785156, 14.96682071685791, 16.600473403930664, 18.2341251373291, 19.867778778076172, 21.50143051147461, 23.13508415222168, 24.768735885620117, 26.402389526367188, 28.036041259765625, 29.669692993164062, 31.3033447265625, 32.93699645996094, 34.57065200805664, 36.20430374145508, 37.837955474853516, 39.47160720825195, 41.105262756347656, 42.738914489746094]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 7.0, 6.0, 10.0, 17.0, 7.0, 17.0, 19.0, 22.0, 20.0, 31.0, 34.0, 54.0, 46.0, 26.0, 41.0, 51.0, 38.0, 52.0, 51.0, 43.0, 42.0, 45.0, 51.0, 54.0, 28.0, 30.0, 32.0, 25.0, 24.0, 22.0, 11.0, 15.0, 5.0, 5.0, 8.0, 4.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.628750801086426, -14.241868019104004, -13.854984283447266, -13.468101501464844, -13.081217765808105, -12.694334983825684, -12.307451248168945, -11.920568466186523, -11.533685684204102, -11.14680290222168, -10.759919166564941, -10.37303638458252, -9.986152648925781, -9.59926986694336, -9.212387084960938, -8.8255033493042, -8.438619613647461, -8.051736831665039, -7.664853096008301, -7.277970314025879, -6.891086578369141, -6.504203796386719, -6.117320537567139, -5.730437278747559, -5.3435540199279785, -4.956670761108398, -4.569787502288818, -4.182904243469238, -3.7960212230682373, -3.4091379642486572, -3.0222549438476562, -2.635371685028076, -2.2484893798828125, -1.8616061210632324, -1.474722981452942, -1.0878398418426514, -0.7009565830230713, -0.3140733242034912, 0.07280969619750977, 0.45969295501708984, 0.8465762138366699, 1.23345947265625, 1.6203426122665405, 2.007225751876831, 2.394109010696411, 2.780992269515991, 3.167875289916992, 3.5547585487365723, 3.9416418075561523, 4.328525066375732, 4.7154083251953125, 5.102291107177734, 5.489174842834473, 5.8760576248168945, 6.262940883636475, 6.649824142456055, 7.036707401275635, 7.423590660095215, 7.810473918914795, 8.197357177734375, 8.584239959716797, 8.971123695373535, 9.358006477355957, 9.744890213012695, 10.131772994995117]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 5.0, 3.0, 5.0, 6.0, 13.0, 20.0, 32.0, 28.0, 50.0, 61.0, 100.0, 149.0, 255.0, 503.0, 845.0, 1897.0, 4820.0, 15880.0, 102168.0, 3993789.0, 55338.0, 11278.0, 3625.0, 1527.0, 798.0, 393.0, 230.0, 179.0, 97.0, 59.0, 39.0, 23.0, 14.0, 18.0, 14.0, 4.0, 9.0, 3.0, 2.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.744140625, -2.65936279296875, -2.5745849609375, -2.48980712890625, -2.405029296875, -2.32025146484375, -2.2354736328125, -2.15069580078125, -2.06591796875, -1.98114013671875, -1.8963623046875, -1.81158447265625, -1.726806640625, -1.64202880859375, -1.5572509765625, -1.47247314453125, -1.3876953125, -1.30291748046875, -1.2181396484375, -1.13336181640625, -1.048583984375, -0.96380615234375, -0.8790283203125, -0.79425048828125, -0.70947265625, -0.62469482421875, -0.5399169921875, -0.45513916015625, -0.370361328125, -0.28558349609375, -0.2008056640625, -0.11602783203125, -0.03125, 0.05352783203125, 0.1383056640625, 0.22308349609375, 0.307861328125, 0.39263916015625, 0.4774169921875, 0.56219482421875, 0.64697265625, 0.73175048828125, 0.8165283203125, 0.90130615234375, 0.986083984375, 1.07086181640625, 1.1556396484375, 1.24041748046875, 1.3251953125, 1.40997314453125, 1.4947509765625, 1.57952880859375, 1.664306640625, 1.74908447265625, 1.8338623046875, 1.91864013671875, 2.00341796875, 2.08819580078125, 2.1729736328125, 2.25775146484375, 2.342529296875, 2.42730712890625, 2.5120849609375, 2.59686279296875, 2.681640625]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 3.0, 5.0, 10.0, 11.0, 6.0, 11.0, 17.0, 26.0, 26.0, 22.0, 32.0, 35.0, 45.0, 44.0, 58.0, 66.0, 51.0, 49.0, 66.0, 62.0, 64.0, 35.0, 41.0, 36.0, 30.0, 33.0, 18.0, 16.0, 21.0, 18.0, 12.0, 9.0, 4.0, 5.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.46240234375, -0.44673919677734375, -0.4310760498046875, -0.41541290283203125, -0.399749755859375, -0.38408660888671875, -0.3684234619140625, -0.35276031494140625, -0.33709716796875, -0.32143402099609375, -0.3057708740234375, -0.29010772705078125, -0.274444580078125, -0.25878143310546875, -0.2431182861328125, -0.22745513916015625, -0.2117919921875, -0.19612884521484375, -0.1804656982421875, -0.16480255126953125, -0.149139404296875, -0.13347625732421875, -0.1178131103515625, -0.10214996337890625, -0.08648681640625, -0.07082366943359375, -0.0551605224609375, -0.03949737548828125, -0.023834228515625, -0.00817108154296875, 0.0074920654296875, 0.02315521240234375, 0.038818359375, 0.05448150634765625, 0.0701446533203125, 0.08580780029296875, 0.101470947265625, 0.11713409423828125, 0.1327972412109375, 0.14846038818359375, 0.16412353515625, 0.17978668212890625, 0.1954498291015625, 0.21111297607421875, 0.226776123046875, 0.24243927001953125, 0.2581024169921875, 0.27376556396484375, 0.2894287109375, 0.30509185791015625, 0.3207550048828125, 0.33641815185546875, 0.352081298828125, 0.36774444580078125, 0.3834075927734375, 0.39907073974609375, 0.41473388671875, 0.43039703369140625, 0.4460601806640625, 0.46172332763671875, 0.477386474609375, 0.49304962158203125, 0.5087127685546875, 0.5243759155273438, 0.5400390625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 7.0, 10.0, 5.0, 18.0, 8.0, 14.0, 25.0, 31.0, 38.0, 55.0, 66.0, 95.0, 134.0, 198.0, 288.0, 428.0, 705.0, 1123.0, 1935.0, 3619.0, 7237.0, 17678.0, 59039.0, 3501558.0, 518785.0, 50630.0, 15843.0, 6726.0, 3208.0, 1764.0, 977.0, 626.0, 417.0, 270.0, 201.0, 140.0, 103.0, 68.0, 59.0, 36.0, 24.0, 19.0, 15.0, 16.0, 11.0, 12.0, 7.0, 6.0, 4.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0], "bins": [-2.796875, -2.71197509765625, -2.6270751953125, -2.54217529296875, -2.457275390625, -2.37237548828125, -2.2874755859375, -2.20257568359375, -2.11767578125, -2.03277587890625, -1.9478759765625, -1.86297607421875, -1.778076171875, -1.69317626953125, -1.6082763671875, -1.52337646484375, -1.4384765625, -1.35357666015625, -1.2686767578125, -1.18377685546875, -1.098876953125, -1.01397705078125, -0.9290771484375, -0.84417724609375, -0.75927734375, -0.67437744140625, -0.5894775390625, -0.50457763671875, -0.419677734375, -0.33477783203125, -0.2498779296875, -0.16497802734375, -0.080078125, 0.00482177734375, 0.0897216796875, 0.17462158203125, 0.259521484375, 0.34442138671875, 0.4293212890625, 0.51422119140625, 0.59912109375, 0.68402099609375, 0.7689208984375, 0.85382080078125, 0.938720703125, 1.02362060546875, 1.1085205078125, 1.19342041015625, 1.2783203125, 1.36322021484375, 1.4481201171875, 1.53302001953125, 1.617919921875, 1.70281982421875, 1.7877197265625, 1.87261962890625, 1.95751953125, 2.04241943359375, 2.1273193359375, 2.21221923828125, 2.297119140625, 2.38201904296875, 2.4669189453125, 2.55181884765625, 2.63671875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 5.0, 2.0, 1.0, 4.0, 10.0, 9.0, 19.0, 24.0, 59.0, 132.0, 2568.0, 968.0, 118.0, 58.0, 31.0, 22.0, 16.0, 11.0, 8.0, 5.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.455078125, -1.4227371215820312, -1.3903961181640625, -1.3580551147460938, -1.325714111328125, -1.2933731079101562, -1.2610321044921875, -1.2286911010742188, -1.19635009765625, -1.1640090942382812, -1.1316680908203125, -1.0993270874023438, -1.066986083984375, -1.0346450805664062, -1.0023040771484375, -0.9699630737304688, -0.9376220703125, -0.9052810668945312, -0.8729400634765625, -0.8405990600585938, -0.808258056640625, -0.7759170532226562, -0.7435760498046875, -0.7112350463867188, -0.67889404296875, -0.6465530395507812, -0.6142120361328125, -0.5818710327148438, -0.549530029296875, -0.5171890258789062, -0.4848480224609375, -0.45250701904296875, -0.420166015625, -0.38782501220703125, -0.3554840087890625, -0.32314300537109375, -0.290802001953125, -0.25846099853515625, -0.2261199951171875, -0.19377899169921875, -0.16143798828125, -0.12909698486328125, -0.0967559814453125, -0.06441497802734375, -0.032073974609375, 0.00026702880859375, 0.0326080322265625, 0.06494903564453125, 0.0972900390625, 0.12963104248046875, 0.1619720458984375, 0.19431304931640625, 0.226654052734375, 0.25899505615234375, 0.2913360595703125, 0.32367706298828125, 0.35601806640625, 0.38835906982421875, 0.4207000732421875, 0.45304107666015625, 0.485382080078125, 0.5177230834960938, 0.5500640869140625, 0.5824050903320312, 0.61474609375]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 11.0, 18.0, 36.0, 75.0, 119.0, 160.0, 173.0, 144.0, 102.0, 86.0, 46.0, 17.0, 11.0, 9.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4579567909240723, -2.2746176719665527, -2.091278553009033, -1.9079391956329346, -1.724600076675415, -1.5412609577178955, -1.3579217195510864, -1.1745824813842773, -0.9912433624267578, -0.8079041838645935, -0.6245650053024292, -0.4412258267402649, -0.2578866481781006, -0.07454746961593628, 0.10879170894622803, 0.2921309471130371, 0.47547006607055664, 0.658809244632721, 0.8421484231948853, 1.0254876613616943, 1.2088267803192139, 1.3921658992767334, 1.5755051374435425, 1.7588443756103516, 1.942183494567871, 2.1255226135253906, 2.30886173248291, 2.492201089859009, 2.6755402088165283, 2.858879327774048, 3.0422186851501465, 3.225557804107666, 3.4088964462280273, 3.592235565185547, 3.7755746841430664, 3.958914041519165, 4.1422529220581055, 4.325592517852783, 4.508931636810303, 4.692270755767822, 4.875609874725342, 5.058948993682861, 5.242288112640381, 5.4256272315979, 5.608966827392578, 5.792305946350098, 5.975645065307617, 6.158984184265137, 6.342323303222656, 6.525662422180176, 6.709001541137695, 6.892340660095215, 7.075679779052734, 7.259019374847412, 7.442358493804932, 7.625697612762451, 7.809036731719971, 7.99237585067749, 8.175715446472168, 8.359054565429688, 8.542393684387207, 8.725732803344727, 8.909071922302246, 9.092411041259766, 9.275750160217285]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 4.0, 2.0, 4.0, 9.0, 8.0, 8.0, 8.0, 4.0, 15.0, 16.0, 14.0, 19.0, 24.0, 30.0, 23.0, 31.0, 27.0, 40.0, 30.0, 47.0, 50.0, 41.0, 42.0, 40.0, 41.0, 45.0, 33.0, 43.0, 32.0, 31.0, 23.0, 22.0, 30.0, 29.0, 24.0, 17.0, 15.0, 11.0, 17.0, 14.0, 9.0, 4.0, 6.0, 5.0, 2.0, 6.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.7019164562225342, -1.6513633728027344, -1.6008104085922241, -1.5502574443817139, -1.499704360961914, -1.4491512775421143, -1.398598313331604, -1.3480453491210938, -1.297492265701294, -1.2469391822814941, -1.1963862180709839, -1.1458332538604736, -1.0952801704406738, -1.044727087020874, -0.9941741228103638, -0.9436210989952087, -0.8930680751800537, -0.8425150513648987, -0.7919620275497437, -0.7414090037345886, -0.6908559799194336, -0.6403029561042786, -0.5897499322891235, -0.5391969084739685, -0.4886438846588135, -0.43809086084365845, -0.3875378370285034, -0.3369848132133484, -0.28643178939819336, -0.23587876558303833, -0.1853257417678833, -0.13477271795272827, -0.08421969413757324, -0.03366667032241821, 0.016886353492736816, 0.06743937730789185, 0.11799240112304688, 0.1685454249382019, 0.21909844875335693, 0.26965147256851196, 0.320204496383667, 0.370757520198822, 0.42131054401397705, 0.4718635678291321, 0.5224165916442871, 0.5729696154594421, 0.6235226392745972, 0.6740756630897522, 0.7246286869049072, 0.7751817107200623, 0.8257347345352173, 0.8762877583503723, 0.9268407821655273, 0.9773938059806824, 1.0279468297958374, 1.0784997940063477, 1.1290528774261475, 1.1796059608459473, 1.2301589250564575, 1.2807118892669678, 1.3312649726867676, 1.3818180561065674, 1.4323710203170776, 1.482923984527588, 1.5334770679473877]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 5.0, 5.0, 3.0, 5.0, 9.0, 12.0, 13.0, 20.0, 33.0, 35.0, 52.0, 70.0, 109.0, 155.0, 246.0, 388.0, 545.0, 773.0, 1287.0, 2127.0, 3409.0, 5995.0, 10407.0, 19240.0, 37477.0, 72573.0, 140358.0, 225742.0, 227258.0, 142005.0, 74366.0, 38056.0, 19786.0, 10611.0, 5937.0, 3472.0, 2052.0, 1364.0, 847.0, 522.0, 371.0, 216.0, 186.0, 125.0, 79.0, 46.0, 46.0, 28.0, 19.0, 23.0, 12.0, 11.0, 8.0, 6.0, 6.0, 4.0, 3.0, 6.0], "bins": [-1.25390625, -1.217041015625, -1.18017578125, -1.143310546875, -1.1064453125, -1.069580078125, -1.03271484375, -0.995849609375, -0.958984375, -0.922119140625, -0.88525390625, -0.848388671875, -0.8115234375, -0.774658203125, -0.73779296875, -0.700927734375, -0.6640625, -0.627197265625, -0.59033203125, -0.553466796875, -0.5166015625, -0.479736328125, -0.44287109375, -0.406005859375, -0.369140625, -0.332275390625, -0.29541015625, -0.258544921875, -0.2216796875, -0.184814453125, -0.14794921875, -0.111083984375, -0.07421875, -0.037353515625, -0.00048828125, 0.036376953125, 0.0732421875, 0.110107421875, 0.14697265625, 0.183837890625, 0.220703125, 0.257568359375, 0.29443359375, 0.331298828125, 0.3681640625, 0.405029296875, 0.44189453125, 0.478759765625, 0.515625, 0.552490234375, 0.58935546875, 0.626220703125, 0.6630859375, 0.699951171875, 0.73681640625, 0.773681640625, 0.810546875, 0.847412109375, 0.88427734375, 0.921142578125, 0.9580078125, 0.994873046875, 1.03173828125, 1.068603515625, 1.10546875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 2.0, 1.0, 7.0, 13.0, 11.0, 10.0, 16.0, 22.0, 28.0, 26.0, 39.0, 37.0, 41.0, 48.0, 44.0, 48.0, 58.0, 54.0, 41.0, 74.0, 58.0, 50.0, 50.0, 45.0, 30.0, 25.0, 23.0, 15.0, 19.0, 21.0, 15.0, 12.0, 2.0, 9.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53173828125, -0.5132217407226562, -0.4947052001953125, -0.47618865966796875, -0.457672119140625, -0.43915557861328125, -0.4206390380859375, -0.40212249755859375, -0.38360595703125, -0.36508941650390625, -0.3465728759765625, -0.32805633544921875, -0.309539794921875, -0.29102325439453125, -0.2725067138671875, -0.25399017333984375, -0.2354736328125, -0.21695709228515625, -0.1984405517578125, -0.17992401123046875, -0.161407470703125, -0.14289093017578125, -0.1243743896484375, -0.10585784912109375, -0.08734130859375, -0.06882476806640625, -0.0503082275390625, -0.03179168701171875, -0.013275146484375, 0.00524139404296875, 0.0237579345703125, 0.04227447509765625, 0.060791015625, 0.07930755615234375, 0.0978240966796875, 0.11634063720703125, 0.134857177734375, 0.15337371826171875, 0.1718902587890625, 0.19040679931640625, 0.20892333984375, 0.22743988037109375, 0.2459564208984375, 0.26447296142578125, 0.282989501953125, 0.30150604248046875, 0.3200225830078125, 0.33853912353515625, 0.3570556640625, 0.37557220458984375, 0.3940887451171875, 0.41260528564453125, 0.431121826171875, 0.44963836669921875, 0.4681549072265625, 0.48667144775390625, 0.50518798828125, 0.5237045288085938, 0.5422210693359375, 0.5607376098632812, 0.579254150390625, 0.5977706909179688, 0.6162872314453125, 0.6348037719726562, 0.6533203125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 6.0, 6.0, 8.0, 11.0, 11.0, 18.0, 29.0, 51.0, 46.0, 68.0, 123.0, 217.0, 379.0, 555.0, 1069.0, 2095.0, 4581.0, 11014.0, 31120.0, 101162.0, 336529.0, 381424.0, 119515.0, 35624.0, 12594.0, 5177.0, 2337.0, 1136.0, 619.0, 363.0, 225.0, 148.0, 93.0, 64.0, 39.0, 33.0, 22.0, 11.0, 12.0, 9.0, 5.0, 3.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.24609375, -2.17816162109375, -2.1102294921875, -2.04229736328125, -1.974365234375, -1.90643310546875, -1.8385009765625, -1.77056884765625, -1.70263671875, -1.63470458984375, -1.5667724609375, -1.49884033203125, -1.430908203125, -1.36297607421875, -1.2950439453125, -1.22711181640625, -1.1591796875, -1.09124755859375, -1.0233154296875, -0.95538330078125, -0.887451171875, -0.81951904296875, -0.7515869140625, -0.68365478515625, -0.61572265625, -0.54779052734375, -0.4798583984375, -0.41192626953125, -0.343994140625, -0.27606201171875, -0.2081298828125, -0.14019775390625, -0.072265625, -0.00433349609375, 0.0635986328125, 0.13153076171875, 0.199462890625, 0.26739501953125, 0.3353271484375, 0.40325927734375, 0.47119140625, 0.53912353515625, 0.6070556640625, 0.67498779296875, 0.742919921875, 0.81085205078125, 0.8787841796875, 0.94671630859375, 1.0146484375, 1.08258056640625, 1.1505126953125, 1.21844482421875, 1.286376953125, 1.35430908203125, 1.4222412109375, 1.49017333984375, 1.55810546875, 1.62603759765625, 1.6939697265625, 1.76190185546875, 1.829833984375, 1.89776611328125, 1.9656982421875, 2.03363037109375, 2.1015625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 4.0, 4.0, 8.0, 4.0, 3.0, 8.0, 14.0, 15.0, 15.0, 23.0, 18.0, 32.0, 26.0, 28.0, 33.0, 35.0, 42.0, 43.0, 51.0, 52.0, 49.0, 43.0, 49.0, 40.0, 37.0, 42.0, 26.0, 39.0, 27.0, 36.0, 29.0, 23.0, 19.0, 11.0, 15.0, 12.0, 12.0, 6.0, 7.0, 6.0, 8.0, 6.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.880859375, -2.79632568359375, -2.7117919921875, -2.62725830078125, -2.542724609375, -2.45819091796875, -2.3736572265625, -2.28912353515625, -2.20458984375, -2.12005615234375, -2.0355224609375, -1.95098876953125, -1.866455078125, -1.78192138671875, -1.6973876953125, -1.61285400390625, -1.5283203125, -1.44378662109375, -1.3592529296875, -1.27471923828125, -1.190185546875, -1.10565185546875, -1.0211181640625, -0.93658447265625, -0.85205078125, -0.76751708984375, -0.6829833984375, -0.59844970703125, -0.513916015625, -0.42938232421875, -0.3448486328125, -0.26031494140625, -0.17578125, -0.09124755859375, -0.0067138671875, 0.07781982421875, 0.162353515625, 0.24688720703125, 0.3314208984375, 0.41595458984375, 0.50048828125, 0.58502197265625, 0.6695556640625, 0.75408935546875, 0.838623046875, 0.92315673828125, 1.0076904296875, 1.09222412109375, 1.1767578125, 1.26129150390625, 1.3458251953125, 1.43035888671875, 1.514892578125, 1.59942626953125, 1.6839599609375, 1.76849365234375, 1.85302734375, 1.93756103515625, 2.0220947265625, 2.10662841796875, 2.191162109375, 2.27569580078125, 2.3602294921875, 2.44476318359375, 2.529296875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 1.0, 4.0, 8.0, 12.0, 20.0, 19.0, 23.0, 23.0, 61.0, 67.0, 112.0, 170.0, 265.0, 516.0, 1095.0, 2675.0, 8223.0, 36230.0, 292888.0, 604215.0, 80141.0, 14512.0, 4032.0, 1562.0, 699.0, 384.0, 194.0, 128.0, 76.0, 60.0, 42.0, 26.0, 21.0, 12.0, 10.0, 11.0, 4.0, 2.0, 7.0, 1.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7451171875, -1.687347412109375, -1.62957763671875, -1.571807861328125, -1.5140380859375, -1.456268310546875, -1.39849853515625, -1.340728759765625, -1.282958984375, -1.225189208984375, -1.16741943359375, -1.109649658203125, -1.0518798828125, -0.994110107421875, -0.93634033203125, -0.878570556640625, -0.82080078125, -0.763031005859375, -0.70526123046875, -0.647491455078125, -0.5897216796875, -0.531951904296875, -0.47418212890625, -0.416412353515625, -0.358642578125, -0.300872802734375, -0.24310302734375, -0.185333251953125, -0.1275634765625, -0.069793701171875, -0.01202392578125, 0.045745849609375, 0.103515625, 0.161285400390625, 0.21905517578125, 0.276824951171875, 0.3345947265625, 0.392364501953125, 0.45013427734375, 0.507904052734375, 0.565673828125, 0.623443603515625, 0.68121337890625, 0.738983154296875, 0.7967529296875, 0.854522705078125, 0.91229248046875, 0.970062255859375, 1.02783203125, 1.085601806640625, 1.14337158203125, 1.201141357421875, 1.2589111328125, 1.316680908203125, 1.37445068359375, 1.432220458984375, 1.489990234375, 1.547760009765625, 1.60552978515625, 1.663299560546875, 1.7210693359375, 1.778839111328125, 1.83660888671875, 1.894378662109375, 1.9521484375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 7.0, 5.0, 2.0, 9.0, 11.0, 20.0, 16.0, 16.0, 24.0, 46.0, 37.0, 57.0, 75.0, 65.0, 78.0, 86.0, 87.0, 72.0, 56.0, 48.0, 39.0, 37.0, 26.0, 20.0, 16.0, 10.0, 8.0, 7.0, 8.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.0002117156982421875, -0.0002048984169960022, -0.0001980811357498169, -0.0001912638545036316, -0.0001844465732574463, -0.00017762929201126099, -0.00017081201076507568, -0.00016399472951889038, -0.00015717744827270508, -0.00015036016702651978, -0.00014354288578033447, -0.00013672560453414917, -0.00012990832328796387, -0.00012309104204177856, -0.00011627376079559326, -0.00010945647954940796, -0.00010263919830322266, -9.582191705703735e-05, -8.900463581085205e-05, -8.218735456466675e-05, -7.537007331848145e-05, -6.855279207229614e-05, -6.173551082611084e-05, -5.491822957992554e-05, -4.8100948333740234e-05, -4.128366708755493e-05, -3.446638584136963e-05, -2.7649104595184326e-05, -2.0831823348999023e-05, -1.401454210281372e-05, -7.197260856628418e-06, -3.7997961044311523e-07, 6.4373016357421875e-06, 1.325458288192749e-05, 2.0071864128112793e-05, 2.6889145374298096e-05, 3.37064266204834e-05, 4.05237078666687e-05, 4.7340989112854004e-05, 5.415827035903931e-05, 6.097555160522461e-05, 6.779283285140991e-05, 7.461011409759521e-05, 8.142739534378052e-05, 8.824467658996582e-05, 9.506195783615112e-05, 0.00010187923908233643, 0.00010869652032852173, 0.00011551380157470703, 0.00012233108282089233, 0.00012914836406707764, 0.00013596564531326294, 0.00014278292655944824, 0.00014960020780563354, 0.00015641748905181885, 0.00016323477029800415, 0.00017005205154418945, 0.00017686933279037476, 0.00018368661403656006, 0.00019050389528274536, 0.00019732117652893066, 0.00020413845777511597, 0.00021095573902130127, 0.00021777302026748657, 0.00022459030151367188]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 7.0, 7.0, 7.0, 18.0, 23.0, 26.0, 55.0, 80.0, 139.0, 256.0, 506.0, 1209.0, 3467.0, 14010.0, 112696.0, 735120.0, 156933.0, 17624.0, 3870.0, 1303.0, 540.0, 255.0, 136.0, 69.0, 66.0, 55.0, 26.0, 18.0, 11.0, 4.0, 4.0, 4.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0], "bins": [-2.771484375, -2.704803466796875, -2.63812255859375, -2.571441650390625, -2.5047607421875, -2.438079833984375, -2.37139892578125, -2.304718017578125, -2.238037109375, -2.171356201171875, -2.10467529296875, -2.037994384765625, -1.9713134765625, -1.904632568359375, -1.83795166015625, -1.771270751953125, -1.70458984375, -1.637908935546875, -1.57122802734375, -1.504547119140625, -1.4378662109375, -1.371185302734375, -1.30450439453125, -1.237823486328125, -1.171142578125, -1.104461669921875, -1.03778076171875, -0.971099853515625, -0.9044189453125, -0.837738037109375, -0.77105712890625, -0.704376220703125, -0.6376953125, -0.571014404296875, -0.50433349609375, -0.437652587890625, -0.3709716796875, -0.304290771484375, -0.23760986328125, -0.170928955078125, -0.104248046875, -0.037567138671875, 0.02911376953125, 0.095794677734375, 0.1624755859375, 0.229156494140625, 0.29583740234375, 0.362518310546875, 0.42919921875, 0.495880126953125, 0.56256103515625, 0.629241943359375, 0.6959228515625, 0.762603759765625, 0.82928466796875, 0.895965576171875, 0.962646484375, 1.029327392578125, 1.09600830078125, 1.162689208984375, 1.2293701171875, 1.296051025390625, 1.36273193359375, 1.429412841796875, 1.49609375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 6.0, 1.0, 5.0, 8.0, 7.0, 10.0, 20.0, 16.0, 30.0, 29.0, 39.0, 52.0, 65.0, 53.0, 74.0, 63.0, 83.0, 75.0, 65.0, 51.0, 45.0, 58.0, 35.0, 27.0, 22.0, 22.0, 4.0, 11.0, 4.0, 3.0, 5.0, 4.0, 3.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.4775390625, -1.437042236328125, -1.39654541015625, -1.356048583984375, -1.3155517578125, -1.275054931640625, -1.23455810546875, -1.194061279296875, -1.153564453125, -1.113067626953125, -1.07257080078125, -1.032073974609375, -0.9915771484375, -0.951080322265625, -0.91058349609375, -0.870086669921875, -0.82958984375, -0.789093017578125, -0.74859619140625, -0.708099365234375, -0.6676025390625, -0.627105712890625, -0.58660888671875, -0.546112060546875, -0.505615234375, -0.465118408203125, -0.42462158203125, -0.384124755859375, -0.3436279296875, -0.303131103515625, -0.26263427734375, -0.222137451171875, -0.181640625, -0.141143798828125, -0.10064697265625, -0.060150146484375, -0.0196533203125, 0.020843505859375, 0.06134033203125, 0.101837158203125, 0.142333984375, 0.182830810546875, 0.22332763671875, 0.263824462890625, 0.3043212890625, 0.344818115234375, 0.38531494140625, 0.425811767578125, 0.46630859375, 0.506805419921875, 0.54730224609375, 0.587799072265625, 0.6282958984375, 0.668792724609375, 0.70928955078125, 0.749786376953125, 0.790283203125, 0.830780029296875, 0.87127685546875, 0.911773681640625, 0.9522705078125, 0.992767333984375, 1.03326416015625, 1.073760986328125, 1.1142578125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 19.0, 35.0, 35.0, 49.0, 85.0, 96.0, 113.0, 121.0, 129.0, 103.0, 65.0, 51.0, 36.0, 21.0, 12.0, 11.0, 5.0, 5.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-23.681549072265625, -22.873117446899414, -22.064685821533203, -21.256254196166992, -20.44782257080078, -19.63939094543457, -18.83095932006836, -18.02252769470215, -17.214096069335938, -16.405664443969727, -15.597232818603516, -14.788801193237305, -13.980369567871094, -13.171937942504883, -12.363506317138672, -11.555074691772461, -10.74664306640625, -9.938211441040039, -9.129779815673828, -8.321348190307617, -7.512916564941406, -6.704484939575195, -5.896053314208984, -5.087621688842773, -4.2791900634765625, -3.4707584381103516, -2.6623268127441406, -1.8538951873779297, -1.0454635620117188, -0.2370319366455078, 0.5713996887207031, 1.379831314086914, 2.188264846801758, 2.9966964721679688, 3.8051280975341797, 4.613559722900391, 5.421991348266602, 6.2304229736328125, 7.038854598999023, 7.847286224365234, 8.655717849731445, 9.464149475097656, 10.272581100463867, 11.081012725830078, 11.889444351196289, 12.6978759765625, 13.506307601928711, 14.314739227294922, 15.123170852661133, 15.931602478027344, 16.740034103393555, 17.548465728759766, 18.356897354125977, 19.165328979492188, 19.9737606048584, 20.78219223022461, 21.59062385559082, 22.39905548095703, 23.207487106323242, 24.015918731689453, 24.824350357055664, 25.632781982421875, 26.441213607788086, 27.249645233154297, 28.058076858520508]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 9.0, 3.0, 6.0, 5.0, 13.0, 12.0, 13.0, 23.0, 22.0, 28.0, 33.0, 29.0, 50.0, 35.0, 64.0, 49.0, 62.0, 46.0, 61.0, 57.0, 42.0, 47.0, 44.0, 38.0, 32.0, 40.0, 27.0, 27.0, 21.0, 15.0, 11.0, 13.0, 6.0, 6.0, 4.0, 2.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.115697860717773, -11.647721290588379, -11.179744720458984, -10.71176815032959, -10.243791580200195, -9.7758150100708, -9.307838439941406, -8.839862823486328, -8.371885299682617, -7.903908729553223, -7.435932159423828, -6.967955589294434, -6.499979019165039, -6.0320024490356445, -5.564026355743408, -5.096049785614014, -4.628073692321777, -4.160097122192383, -3.6921205520629883, -3.224144220352173, -2.7561676502227783, -2.288191080093384, -1.8202147483825684, -1.3522381782531738, -0.8842616081237793, -0.41628509759902954, 0.051691412925720215, 0.5196678638458252, 0.9876444339752197, 1.4556210041046143, 1.9235973358154297, 2.391573905944824, 2.8595504760742188, 3.3275270462036133, 3.795503616333008, 4.263480186462402, 4.731456756591797, 5.199433326721191, 5.667409420013428, 6.135385990142822, 6.603362560272217, 7.071339130401611, 7.539315700531006, 8.007291793823242, 8.475268363952637, 8.943244934082031, 9.411221504211426, 9.87919807434082, 10.347174644470215, 10.81515121459961, 11.283127784729004, 11.751104354858398, 12.219080924987793, 12.687057495117188, 13.155033111572266, 13.623010635375977, 14.090986251831055, 14.55896282196045, 15.026939392089844, 15.494915962219238, 15.962892532348633, 16.43086814880371, 16.898845672607422, 17.3668212890625, 17.83479881286621]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 6.0, 10.0, 6.0, 13.0, 28.0, 33.0, 48.0, 98.0, 215.0, 436.0, 965.0, 2446.0, 8300.0, 79308.0, 4080153.0, 15990.0, 3682.0, 1286.0, 603.0, 299.0, 138.0, 89.0, 51.0, 27.0, 22.0, 15.0, 6.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4375, -5.26318359375, -5.0888671875, -4.91455078125, -4.740234375, -4.56591796875, -4.3916015625, -4.21728515625, -4.04296875, -3.86865234375, -3.6943359375, -3.52001953125, -3.345703125, -3.17138671875, -2.9970703125, -2.82275390625, -2.6484375, -2.47412109375, -2.2998046875, -2.12548828125, -1.951171875, -1.77685546875, -1.6025390625, -1.42822265625, -1.25390625, -1.07958984375, -0.9052734375, -0.73095703125, -0.556640625, -0.38232421875, -0.2080078125, -0.03369140625, 0.140625, 0.31494140625, 0.4892578125, 0.66357421875, 0.837890625, 1.01220703125, 1.1865234375, 1.36083984375, 1.53515625, 1.70947265625, 1.8837890625, 2.05810546875, 2.232421875, 2.40673828125, 2.5810546875, 2.75537109375, 2.9296875, 3.10400390625, 3.2783203125, 3.45263671875, 3.626953125, 3.80126953125, 3.9755859375, 4.14990234375, 4.32421875, 4.49853515625, 4.6728515625, 4.84716796875, 5.021484375, 5.19580078125, 5.3701171875, 5.54443359375, 5.71875]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 6.0, 6.0, 13.0, 6.0, 19.0, 21.0, 23.0, 33.0, 45.0, 49.0, 58.0, 58.0, 61.0, 64.0, 66.0, 58.0, 67.0, 57.0, 48.0, 36.0, 38.0, 32.0, 27.0, 19.0, 23.0, 10.0, 11.0, 9.0, 10.0, 3.0, 4.0, 5.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.80517578125, -0.7825088500976562, -0.7598419189453125, -0.7371749877929688, -0.714508056640625, -0.6918411254882812, -0.6691741943359375, -0.6465072631835938, -0.62384033203125, -0.6011734008789062, -0.5785064697265625, -0.5558395385742188, -0.533172607421875, -0.5105056762695312, -0.4878387451171875, -0.46517181396484375, -0.4425048828125, -0.41983795166015625, -0.3971710205078125, -0.37450408935546875, -0.351837158203125, -0.32917022705078125, -0.3065032958984375, -0.28383636474609375, -0.26116943359375, -0.23850250244140625, -0.2158355712890625, -0.19316864013671875, -0.170501708984375, -0.14783477783203125, -0.1251678466796875, -0.10250091552734375, -0.079833984375, -0.05716705322265625, -0.0345001220703125, -0.01183319091796875, 0.010833740234375, 0.03350067138671875, 0.0561676025390625, 0.07883453369140625, 0.10150146484375, 0.12416839599609375, 0.1468353271484375, 0.16950225830078125, 0.192169189453125, 0.21483612060546875, 0.2375030517578125, 0.26016998291015625, 0.2828369140625, 0.30550384521484375, 0.3281707763671875, 0.35083770751953125, 0.373504638671875, 0.39617156982421875, 0.4188385009765625, 0.44150543212890625, 0.46417236328125, 0.48683929443359375, 0.5095062255859375, 0.5321731567382812, 0.554840087890625, 0.5775070190429688, 0.6001739501953125, 0.6228408813476562, 0.6455078125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 7.0, 3.0, 11.0, 18.0, 14.0, 22.0, 23.0, 29.0, 48.0, 80.0, 118.0, 221.0, 359.0, 667.0, 1491.0, 3507.0, 10899.0, 74194.0, 4056017.0, 34471.0, 7016.0, 2555.0, 1167.0, 521.0, 277.0, 189.0, 94.0, 74.0, 53.0, 30.0, 23.0, 12.0, 16.0, 17.0, 8.0, 7.0, 3.0, 5.0, 7.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.5078125, -6.32366943359375, -6.1395263671875, -5.95538330078125, -5.771240234375, -5.58709716796875, -5.4029541015625, -5.21881103515625, -5.03466796875, -4.85052490234375, -4.6663818359375, -4.48223876953125, -4.298095703125, -4.11395263671875, -3.9298095703125, -3.74566650390625, -3.5615234375, -3.37738037109375, -3.1932373046875, -3.00909423828125, -2.824951171875, -2.64080810546875, -2.4566650390625, -2.27252197265625, -2.08837890625, -1.90423583984375, -1.7200927734375, -1.53594970703125, -1.351806640625, -1.16766357421875, -0.9835205078125, -0.79937744140625, -0.615234375, -0.43109130859375, -0.2469482421875, -0.06280517578125, 0.121337890625, 0.30548095703125, 0.4896240234375, 0.67376708984375, 0.85791015625, 1.04205322265625, 1.2261962890625, 1.41033935546875, 1.594482421875, 1.77862548828125, 1.9627685546875, 2.14691162109375, 2.3310546875, 2.51519775390625, 2.6993408203125, 2.88348388671875, 3.067626953125, 3.25177001953125, 3.4359130859375, 3.62005615234375, 3.80419921875, 3.98834228515625, 4.1724853515625, 4.35662841796875, 4.540771484375, 4.72491455078125, 4.9090576171875, 5.09320068359375, 5.27734375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 8.0, 8.0, 10.0, 25.0, 50.0, 117.0, 3643.0, 116.0, 40.0, 23.0, 15.0, 9.0, 6.0, 0.0, 0.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2421875, -1.1952972412109375, -1.148406982421875, -1.1015167236328125, -1.05462646484375, -1.0077362060546875, -0.960845947265625, -0.9139556884765625, -0.8670654296875, -0.8201751708984375, -0.773284912109375, -0.7263946533203125, -0.67950439453125, -0.6326141357421875, -0.585723876953125, -0.5388336181640625, -0.491943359375, -0.4450531005859375, -0.398162841796875, -0.3512725830078125, -0.30438232421875, -0.2574920654296875, -0.210601806640625, -0.1637115478515625, -0.1168212890625, -0.0699310302734375, -0.023040771484375, 0.0238494873046875, 0.07073974609375, 0.1176300048828125, 0.164520263671875, 0.2114105224609375, 0.25830078125, 0.3051910400390625, 0.352081298828125, 0.3989715576171875, 0.44586181640625, 0.4927520751953125, 0.539642333984375, 0.5865325927734375, 0.6334228515625, 0.6803131103515625, 0.727203369140625, 0.7740936279296875, 0.82098388671875, 0.8678741455078125, 0.914764404296875, 0.9616546630859375, 1.008544921875, 1.0554351806640625, 1.102325439453125, 1.1492156982421875, 1.19610595703125, 1.2429962158203125, 1.289886474609375, 1.3367767333984375, 1.3836669921875, 1.4305572509765625, 1.477447509765625, 1.5243377685546875, 1.57122802734375, 1.6181182861328125, 1.665008544921875, 1.7118988037109375, 1.7587890625]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 8.0, 5.0, 16.0, 34.0, 46.0, 61.0, 76.0, 89.0, 105.0, 94.0, 108.0, 90.0, 86.0, 52.0, 44.0, 27.0, 13.0, 11.0, 13.0, 8.0, 5.0, 0.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.702145576477051, -2.5952060222625732, -2.4882664680480957, -2.381326913833618, -2.2743873596191406, -2.167447805404663, -2.0605082511901855, -1.9535688161849976, -1.84662926197052, -1.7396897077560425, -1.632750153541565, -1.525810718536377, -1.4188711643218994, -1.3119316101074219, -1.2049920558929443, -1.0980525016784668, -0.9911129474639893, -0.8841733932495117, -0.7772338390350342, -0.6702943444252014, -0.5633547902107239, -0.45641523599624634, -0.3494757413864136, -0.24253618717193604, -0.1355966329574585, -0.02865709364414215, 0.0782824456691742, 0.18522197008132935, 0.2921615242958069, 0.3991010785102844, 0.5060405731201172, 0.6129801273345947, 0.7199196815490723, 0.8268592357635498, 0.9337987899780273, 1.0407383441925049, 1.1476778984069824, 1.25461745262146, 1.361556887626648, 1.4684964418411255, 1.575435996055603, 1.6823755502700806, 1.789315104484558, 1.896254539489746, 2.0031940937042236, 2.110133647918701, 2.2170732021331787, 2.3240127563476562, 2.430952310562134, 2.5378918647766113, 2.644831418991089, 2.7517709732055664, 2.858710527420044, 2.9656500816345215, 3.07258939743042, 3.1795291900634766, 3.286468505859375, 3.3934080600738525, 3.50034761428833, 3.6072871685028076, 3.714226722717285, 3.8211662769317627, 3.9281058311462402, 4.035045146942139, 4.141984939575195]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 4.0, 3.0, 8.0, 3.0, 11.0, 9.0, 2.0, 18.0, 19.0, 24.0, 18.0, 15.0, 25.0, 41.0, 32.0, 43.0, 39.0, 44.0, 44.0, 54.0, 50.0, 53.0, 43.0, 38.0, 49.0, 33.0, 38.0, 34.0, 28.0, 23.0, 25.0, 27.0, 23.0, 9.0, 17.0, 10.0, 12.0, 9.0, 6.0, 7.0, 3.0, 3.0, 2.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8859353065490723, -1.8234976530075073, -1.7610599994659424, -1.6986223459243774, -1.6361846923828125, -1.5737470388412476, -1.5113093852996826, -1.4488716125488281, -1.3864340782165527, -1.3239964246749878, -1.2615587711334229, -1.199121117591858, -1.136683464050293, -1.074245810508728, -1.011808156967163, -0.9493704438209534, -0.8869327306747437, -0.8244950771331787, -0.7620574235916138, -0.6996197700500488, -0.6371821165084839, -0.574744462966919, -0.5123067498207092, -0.4498690962791443, -0.38743144273757935, -0.3249937891960144, -0.26255613565444946, -0.20011845231056213, -0.1376807987689972, -0.07524314522743225, -0.012805461883544922, 0.04963219165802002, 0.11206984519958496, 0.1745074987411499, 0.23694516718387604, 0.2993828356266022, 0.3618204891681671, 0.42425814270973206, 0.4866958260536194, 0.5491334795951843, 0.6115711331367493, 0.6740087866783142, 0.7364464402198792, 0.7988841533660889, 0.8613218069076538, 0.9237594604492188, 0.9861971139907837, 1.0486347675323486, 1.1110724210739136, 1.1735100746154785, 1.2359477281570435, 1.2983853816986084, 1.3608230352401733, 1.4232606887817383, 1.4856984615325928, 1.5481359958648682, 1.6105737686157227, 1.6730114221572876, 1.7354490756988525, 1.7978867292404175, 1.8603243827819824, 1.9227620363235474, 1.9851996898651123, 2.047637462615967, 2.110074996948242]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 4.0, 9.0, 13.0, 20.0, 26.0, 54.0, 73.0, 111.0, 186.0, 353.0, 696.0, 1361.0, 2774.0, 6229.0, 16640.0, 51943.0, 186105.0, 454966.0, 230451.0, 63044.0, 19902.0, 7367.0, 3111.0, 1440.0, 715.0, 398.0, 214.0, 125.0, 74.0, 56.0, 31.0, 28.0, 12.0, 12.0, 6.0, 3.0, 3.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.087890625, -3.00347900390625, -2.9190673828125, -2.83465576171875, -2.750244140625, -2.66583251953125, -2.5814208984375, -2.49700927734375, -2.41259765625, -2.32818603515625, -2.2437744140625, -2.15936279296875, -2.074951171875, -1.99053955078125, -1.9061279296875, -1.82171630859375, -1.7373046875, -1.65289306640625, -1.5684814453125, -1.48406982421875, -1.399658203125, -1.31524658203125, -1.2308349609375, -1.14642333984375, -1.06201171875, -0.97760009765625, -0.8931884765625, -0.80877685546875, -0.724365234375, -0.63995361328125, -0.5555419921875, -0.47113037109375, -0.38671875, -0.30230712890625, -0.2178955078125, -0.13348388671875, -0.049072265625, 0.03533935546875, 0.1197509765625, 0.20416259765625, 0.28857421875, 0.37298583984375, 0.4573974609375, 0.54180908203125, 0.626220703125, 0.71063232421875, 0.7950439453125, 0.87945556640625, 0.9638671875, 1.04827880859375, 1.1326904296875, 1.21710205078125, 1.301513671875, 1.38592529296875, 1.4703369140625, 1.55474853515625, 1.63916015625, 1.72357177734375, 1.8079833984375, 1.89239501953125, 1.976806640625, 2.06121826171875, 2.1456298828125, 2.23004150390625, 2.314453125]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 3.0, 1.0, 7.0, 6.0, 6.0, 10.0, 17.0, 6.0, 21.0, 13.0, 23.0, 34.0, 33.0, 56.0, 46.0, 53.0, 67.0, 60.0, 51.0, 65.0, 70.0, 50.0, 58.0, 41.0, 30.0, 36.0, 22.0, 27.0, 18.0, 15.0, 10.0, 9.0, 5.0, 9.0, 4.0, 3.0, 5.0, 3.0, 4.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.81494140625, -0.7883682250976562, -0.7617950439453125, -0.7352218627929688, -0.708648681640625, -0.6820755004882812, -0.6555023193359375, -0.6289291381835938, -0.60235595703125, -0.5757827758789062, -0.5492095947265625, -0.5226364135742188, -0.496063232421875, -0.46949005126953125, -0.4429168701171875, -0.41634368896484375, -0.3897705078125, -0.36319732666015625, -0.3366241455078125, -0.31005096435546875, -0.283477783203125, -0.25690460205078125, -0.2303314208984375, -0.20375823974609375, -0.17718505859375, -0.15061187744140625, -0.1240386962890625, -0.09746551513671875, -0.070892333984375, -0.04431915283203125, -0.0177459716796875, 0.00882720947265625, 0.035400390625, 0.06197357177734375, 0.0885467529296875, 0.11511993408203125, 0.141693115234375, 0.16826629638671875, 0.1948394775390625, 0.22141265869140625, 0.24798583984375, 0.27455902099609375, 0.3011322021484375, 0.32770538330078125, 0.354278564453125, 0.38085174560546875, 0.4074249267578125, 0.43399810791015625, 0.4605712890625, 0.48714447021484375, 0.5137176513671875, 0.5402908325195312, 0.566864013671875, 0.5934371948242188, 0.6200103759765625, 0.6465835571289062, 0.67315673828125, 0.6997299194335938, 0.7263031005859375, 0.7528762817382812, 0.779449462890625, 0.8060226440429688, 0.8325958251953125, 0.8591690063476562, 0.8857421875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 8.0, 9.0, 17.0, 23.0, 27.0, 51.0, 68.0, 102.0, 211.0, 453.0, 845.0, 2351.0, 8293.0, 42321.0, 311490.0, 575038.0, 86763.0, 14406.0, 3659.0, 1225.0, 539.0, 274.0, 131.0, 85.0, 39.0, 39.0, 31.0, 19.0, 10.0, 10.0, 9.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-4.12890625, -4.011566162109375, -3.89422607421875, -3.776885986328125, -3.6595458984375, -3.542205810546875, -3.42486572265625, -3.307525634765625, -3.190185546875, -3.072845458984375, -2.95550537109375, -2.838165283203125, -2.7208251953125, -2.603485107421875, -2.48614501953125, -2.368804931640625, -2.25146484375, -2.134124755859375, -2.01678466796875, -1.899444580078125, -1.7821044921875, -1.664764404296875, -1.54742431640625, -1.430084228515625, -1.312744140625, -1.195404052734375, -1.07806396484375, -0.960723876953125, -0.8433837890625, -0.726043701171875, -0.60870361328125, -0.491363525390625, -0.3740234375, -0.256683349609375, -0.13934326171875, -0.022003173828125, 0.0953369140625, 0.212677001953125, 0.33001708984375, 0.447357177734375, 0.564697265625, 0.682037353515625, 0.79937744140625, 0.916717529296875, 1.0340576171875, 1.151397705078125, 1.26873779296875, 1.386077880859375, 1.50341796875, 1.620758056640625, 1.73809814453125, 1.855438232421875, 1.9727783203125, 2.090118408203125, 2.20745849609375, 2.324798583984375, 2.442138671875, 2.559478759765625, 2.67681884765625, 2.794158935546875, 2.9114990234375, 3.028839111328125, 3.14617919921875, 3.263519287109375, 3.380859375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 5.0, 7.0, 15.0, 18.0, 12.0, 16.0, 21.0, 15.0, 34.0, 27.0, 31.0, 42.0, 34.0, 42.0, 55.0, 38.0, 44.0, 42.0, 44.0, 49.0, 37.0, 42.0, 54.0, 41.0, 21.0, 30.0, 32.0, 26.0, 24.0, 24.0, 16.0, 15.0, 15.0, 5.0, 7.0, 3.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.603515625, -3.48968505859375, -3.3758544921875, -3.26202392578125, -3.148193359375, -3.03436279296875, -2.9205322265625, -2.80670166015625, -2.69287109375, -2.57904052734375, -2.4652099609375, -2.35137939453125, -2.237548828125, -2.12371826171875, -2.0098876953125, -1.89605712890625, -1.7822265625, -1.66839599609375, -1.5545654296875, -1.44073486328125, -1.326904296875, -1.21307373046875, -1.0992431640625, -0.98541259765625, -0.87158203125, -0.75775146484375, -0.6439208984375, -0.53009033203125, -0.416259765625, -0.30242919921875, -0.1885986328125, -0.07476806640625, 0.0390625, 0.15289306640625, 0.2667236328125, 0.38055419921875, 0.494384765625, 0.60821533203125, 0.7220458984375, 0.83587646484375, 0.94970703125, 1.06353759765625, 1.1773681640625, 1.29119873046875, 1.405029296875, 1.51885986328125, 1.6326904296875, 1.74652099609375, 1.8603515625, 1.97418212890625, 2.0880126953125, 2.20184326171875, 2.315673828125, 2.42950439453125, 2.5433349609375, 2.65716552734375, 2.77099609375, 2.88482666015625, 2.9986572265625, 3.11248779296875, 3.226318359375, 3.34014892578125, 3.4539794921875, 3.56781005859375, 3.681640625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 3.0, 8.0, 10.0, 10.0, 21.0, 28.0, 64.0, 102.0, 205.0, 463.0, 1336.0, 6669.0, 127401.0, 881579.0, 26203.0, 2945.0, 802.0, 330.0, 151.0, 87.0, 52.0, 24.0, 19.0, 13.0, 13.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-6.42578125, -6.277313232421875, -6.12884521484375, -5.980377197265625, -5.8319091796875, -5.683441162109375, -5.53497314453125, -5.386505126953125, -5.238037109375, -5.089569091796875, -4.94110107421875, -4.792633056640625, -4.6441650390625, -4.495697021484375, -4.34722900390625, -4.198760986328125, -4.05029296875, -3.901824951171875, -3.75335693359375, -3.604888916015625, -3.4564208984375, -3.307952880859375, -3.15948486328125, -3.011016845703125, -2.862548828125, -2.714080810546875, -2.56561279296875, -2.417144775390625, -2.2686767578125, -2.120208740234375, -1.97174072265625, -1.823272705078125, -1.6748046875, -1.526336669921875, -1.37786865234375, -1.229400634765625, -1.0809326171875, -0.932464599609375, -0.78399658203125, -0.635528564453125, -0.487060546875, -0.338592529296875, -0.19012451171875, -0.041656494140625, 0.1068115234375, 0.255279541015625, 0.40374755859375, 0.552215576171875, 0.70068359375, 0.849151611328125, 0.99761962890625, 1.146087646484375, 1.2945556640625, 1.443023681640625, 1.59149169921875, 1.739959716796875, 1.888427734375, 2.036895751953125, 2.18536376953125, 2.333831787109375, 2.4822998046875, 2.630767822265625, 2.77923583984375, 2.927703857421875, 3.076171875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 2.0, 6.0, 2.0, 7.0, 8.0, 8.0, 17.0, 12.0, 28.0, 35.0, 40.0, 52.0, 74.0, 70.0, 77.0, 91.0, 89.0, 75.0, 83.0, 42.0, 37.0, 39.0, 27.0, 17.0, 18.0, 13.0, 7.0, 3.0, 12.0, 1.0, 3.0, 1.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00026607513427734375, -0.0002577193081378937, -0.0002493634819984436, -0.00024100765585899353, -0.00023265182971954346, -0.00022429600358009338, -0.0002159401774406433, -0.00020758435130119324, -0.00019922852516174316, -0.0001908726990222931, -0.00018251687288284302, -0.00017416104674339294, -0.00016580522060394287, -0.0001574493944644928, -0.00014909356832504272, -0.00014073774218559265, -0.00013238191604614258, -0.0001240260899066925, -0.00011567026376724243, -0.00010731443762779236, -9.895861148834229e-05, -9.060278534889221e-05, -8.224695920944214e-05, -7.389113306999207e-05, -6.553530693054199e-05, -5.717948079109192e-05, -4.8823654651641846e-05, -4.046782851219177e-05, -3.21120023727417e-05, -2.3756176233291626e-05, -1.5400350093841553e-05, -7.0445239543914795e-06, 1.3113021850585938e-06, 9.667128324508667e-06, 1.802295446395874e-05, 2.6378780603408813e-05, 3.473460674285889e-05, 4.309043288230896e-05, 5.144625902175903e-05, 5.9802085161209106e-05, 6.815791130065918e-05, 7.651373744010925e-05, 8.486956357955933e-05, 9.32253897190094e-05, 0.00010158121585845947, 0.00010993704199790955, 0.00011829286813735962, 0.0001266486942768097, 0.00013500452041625977, 0.00014336034655570984, 0.0001517161726951599, 0.00016007199883460999, 0.00016842782497406006, 0.00017678365111351013, 0.0001851394772529602, 0.00019349530339241028, 0.00020185112953186035, 0.00021020695567131042, 0.0002185627818107605, 0.00022691860795021057, 0.00023527443408966064, 0.00024363026022911072, 0.0002519860863685608, 0.00026034191250801086, 0.00026869773864746094]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 2.0, 1.0, 1.0, 3.0, 4.0, 9.0, 15.0, 14.0, 22.0, 35.0, 57.0, 90.0, 154.0, 285.0, 535.0, 1312.0, 3756.0, 14158.0, 97156.0, 756302.0, 148900.0, 18400.0, 4364.0, 1574.0, 660.0, 317.0, 175.0, 82.0, 56.0, 38.0, 18.0, 15.0, 17.0, 8.0, 5.0, 2.0, 8.0, 2.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.447265625, -2.36724853515625, -2.2872314453125, -2.20721435546875, -2.127197265625, -2.04718017578125, -1.9671630859375, -1.88714599609375, -1.80712890625, -1.72711181640625, -1.6470947265625, -1.56707763671875, -1.487060546875, -1.40704345703125, -1.3270263671875, -1.24700927734375, -1.1669921875, -1.08697509765625, -1.0069580078125, -0.92694091796875, -0.846923828125, -0.76690673828125, -0.6868896484375, -0.60687255859375, -0.52685546875, -0.44683837890625, -0.3668212890625, -0.28680419921875, -0.206787109375, -0.12677001953125, -0.0467529296875, 0.03326416015625, 0.11328125, 0.19329833984375, 0.2733154296875, 0.35333251953125, 0.433349609375, 0.51336669921875, 0.5933837890625, 0.67340087890625, 0.75341796875, 0.83343505859375, 0.9134521484375, 0.99346923828125, 1.073486328125, 1.15350341796875, 1.2335205078125, 1.31353759765625, 1.3935546875, 1.47357177734375, 1.5535888671875, 1.63360595703125, 1.713623046875, 1.79364013671875, 1.8736572265625, 1.95367431640625, 2.03369140625, 2.11370849609375, 2.1937255859375, 2.27374267578125, 2.353759765625, 2.43377685546875, 2.5137939453125, 2.59381103515625, 2.673828125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 3.0, 4.0, 5.0, 12.0, 10.0, 14.0, 14.0, 19.0, 43.0, 71.0, 108.0, 113.0, 111.0, 126.0, 111.0, 60.0, 50.0, 31.0, 23.0, 18.0, 19.0, 13.0, 4.0, 1.0, 5.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.701171875, -2.612945556640625, -2.52471923828125, -2.436492919921875, -2.3482666015625, -2.260040283203125, -2.17181396484375, -2.083587646484375, -1.995361328125, -1.907135009765625, -1.81890869140625, -1.730682373046875, -1.6424560546875, -1.554229736328125, -1.46600341796875, -1.377777099609375, -1.28955078125, -1.201324462890625, -1.11309814453125, -1.024871826171875, -0.9366455078125, -0.848419189453125, -0.76019287109375, -0.671966552734375, -0.583740234375, -0.495513916015625, -0.40728759765625, -0.319061279296875, -0.2308349609375, -0.142608642578125, -0.05438232421875, 0.033843994140625, 0.1220703125, 0.210296630859375, 0.29852294921875, 0.386749267578125, 0.4749755859375, 0.563201904296875, 0.65142822265625, 0.739654541015625, 0.827880859375, 0.916107177734375, 1.00433349609375, 1.092559814453125, 1.1807861328125, 1.269012451171875, 1.35723876953125, 1.445465087890625, 1.53369140625, 1.621917724609375, 1.71014404296875, 1.798370361328125, 1.8865966796875, 1.974822998046875, 2.06304931640625, 2.151275634765625, 2.239501953125, 2.327728271484375, 2.41595458984375, 2.504180908203125, 2.5924072265625, 2.680633544921875, 2.76885986328125, 2.857086181640625, 2.9453125]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 12.0, 18.0, 29.0, 64.0, 91.0, 126.0, 167.0, 154.0, 118.0, 86.0, 61.0, 28.0, 24.0, 11.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.20188903808594, -38.04933547973633, -36.89678192138672, -35.74422836303711, -34.5916748046875, -33.439125061035156, -32.28656768798828, -31.134017944335938, -29.981464385986328, -28.82891082763672, -27.67635726928711, -26.5238037109375, -25.371252059936523, -24.218698501586914, -23.066144943237305, -21.913593292236328, -20.761037826538086, -19.608484268188477, -18.455930709838867, -17.30337905883789, -16.15082550048828, -14.998271942138672, -13.845718383789062, -12.69316577911377, -11.54061222076416, -10.38805866241455, -9.235506057739258, -8.082952499389648, -6.930399417877197, -5.777846336364746, -4.625292778015137, -3.4727401733398438, -2.3201866149902344, -1.1676334142684937, -0.01508021354675293, 1.1374731063842773, 2.2900261878967285, 3.4425792694091797, 4.595132827758789, 5.747685432434082, 6.900238990783691, 8.0527925491333, 9.205345153808594, 10.357898712158203, 11.510452270507812, 12.663004875183105, 13.815558433532715, 14.968111038208008, 16.120664596557617, 17.273218154907227, 18.425771713256836, 19.578323364257812, 20.730876922607422, 21.88343048095703, 23.03598403930664, 24.18853759765625, 25.34109115600586, 26.49364471435547, 27.646198272705078, 28.798751831054688, 29.951303482055664, 31.103857040405273, 32.25640869140625, 33.40896224975586, 34.56151580810547]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 9.0, 13.0, 11.0, 26.0, 20.0, 31.0, 42.0, 48.0, 60.0, 67.0, 76.0, 71.0, 77.0, 70.0, 66.0, 71.0, 51.0, 47.0, 37.0, 24.0, 18.0, 20.0, 14.0, 11.0, 10.0, 8.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.44010353088379, -18.615272521972656, -17.790443420410156, -16.965612411499023, -16.14078140258789, -15.315950393676758, -14.491120338439941, -13.666290283203125, -12.841459274291992, -12.01662826538086, -11.191798210144043, -10.366968154907227, -9.542137145996094, -8.717306137084961, -7.8924760818481445, -7.06764554977417, -6.242815017700195, -5.417984485626221, -4.593153953552246, -3.7683234214782715, -2.943492889404297, -2.1186623573303223, -1.2938318252563477, -0.46900129318237305, 0.35582923889160156, 1.1806597709655762, 2.005490303039551, 2.8303208351135254, 3.6551513671875, 4.479981899261475, 5.304812431335449, 6.129642963409424, 6.954475402832031, 7.779305934906006, 8.60413646697998, 9.428966522216797, 10.25379753112793, 11.078628540039062, 11.903458595275879, 12.728288650512695, 13.553119659423828, 14.377950668334961, 15.202780723571777, 16.027610778808594, 16.852441787719727, 17.67727279663086, 18.50210189819336, 19.326932907104492, 20.151763916015625, 20.976594924926758, 21.80142593383789, 22.62625503540039, 23.451086044311523, 24.275917053222656, 25.100746154785156, 25.92557716369629, 26.750408172607422, 27.575239181518555, 28.400070190429688, 29.224899291992188, 30.04973030090332, 30.874561309814453, 31.699390411376953, 32.52422332763672, 33.34905242919922]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 8.0, 5.0, 7.0, 9.0, 22.0, 22.0, 38.0, 62.0, 66.0, 117.0, 183.0, 293.0, 473.0, 858.0, 1573.0, 3315.0, 7411.0, 24141.0, 193121.0, 3891738.0, 49593.0, 11909.0, 4640.0, 2078.0, 1057.0, 581.0, 350.0, 200.0, 132.0, 101.0, 52.0, 37.0, 35.0, 18.0, 12.0, 7.0, 8.0, 5.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.111328125, -3.001068115234375, -2.89080810546875, -2.780548095703125, -2.6702880859375, -2.560028076171875, -2.44976806640625, -2.339508056640625, -2.229248046875, -2.118988037109375, -2.00872802734375, -1.898468017578125, -1.7882080078125, -1.677947998046875, -1.56768798828125, -1.457427978515625, -1.34716796875, -1.236907958984375, -1.12664794921875, -1.016387939453125, -0.9061279296875, -0.795867919921875, -0.68560791015625, -0.575347900390625, -0.465087890625, -0.354827880859375, -0.24456787109375, -0.134307861328125, -0.0240478515625, 0.086212158203125, 0.19647216796875, 0.306732177734375, 0.4169921875, 0.527252197265625, 0.63751220703125, 0.747772216796875, 0.8580322265625, 0.968292236328125, 1.07855224609375, 1.188812255859375, 1.299072265625, 1.409332275390625, 1.51959228515625, 1.629852294921875, 1.7401123046875, 1.850372314453125, 1.96063232421875, 2.070892333984375, 2.18115234375, 2.291412353515625, 2.40167236328125, 2.511932373046875, 2.6221923828125, 2.732452392578125, 2.84271240234375, 2.952972412109375, 3.063232421875, 3.173492431640625, 3.28375244140625, 3.394012451171875, 3.5042724609375, 3.614532470703125, 3.72479248046875, 3.835052490234375, 3.9453125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 6.0, 2.0, 9.0, 9.0, 6.0, 14.0, 16.0, 22.0, 28.0, 36.0, 53.0, 69.0, 74.0, 83.0, 92.0, 80.0, 97.0, 89.0, 58.0, 48.0, 33.0, 26.0, 19.0, 14.0, 6.0, 4.0, 4.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.90673828125, -0.8650436401367188, -0.8233489990234375, -0.7816543579101562, -0.739959716796875, -0.6982650756835938, -0.6565704345703125, -0.6148757934570312, -0.57318115234375, -0.5314865112304688, -0.4897918701171875, -0.44809722900390625, -0.406402587890625, -0.36470794677734375, -0.3230133056640625, -0.28131866455078125, -0.2396240234375, -0.19792938232421875, -0.1562347412109375, -0.11454010009765625, -0.072845458984375, -0.03115081787109375, 0.0105438232421875, 0.05223846435546875, 0.09393310546875, 0.13562774658203125, 0.1773223876953125, 0.21901702880859375, 0.260711669921875, 0.30240631103515625, 0.3441009521484375, 0.38579559326171875, 0.427490234375, 0.46918487548828125, 0.5108795166015625, 0.5525741577148438, 0.594268798828125, 0.6359634399414062, 0.6776580810546875, 0.7193527221679688, 0.76104736328125, 0.8027420043945312, 0.8444366455078125, 0.8861312866210938, 0.927825927734375, 0.9695205688476562, 1.0112152099609375, 1.0529098510742188, 1.0946044921875, 1.1362991333007812, 1.1779937744140625, 1.2196884155273438, 1.261383056640625, 1.3030776977539062, 1.3447723388671875, 1.3864669799804688, 1.42816162109375, 1.4698562622070312, 1.5115509033203125, 1.5532455444335938, 1.594940185546875, 1.6366348266601562, 1.6783294677734375, 1.7200241088867188, 1.76171875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 7.0, 6.0, 6.0, 8.0, 13.0, 13.0, 20.0, 23.0, 27.0, 49.0, 76.0, 113.0, 224.0, 471.0, 1274.0, 3894.0, 15794.0, 174937.0, 3943429.0, 42916.0, 7356.0, 2021.0, 776.0, 344.0, 166.0, 88.0, 59.0, 43.0, 45.0, 14.0, 11.0, 12.0, 6.0, 8.0, 7.0, 6.0, 3.0, 4.0, 3.0, 9.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.703125, -7.484619140625, -7.26611328125, -7.047607421875, -6.8291015625, -6.610595703125, -6.39208984375, -6.173583984375, -5.955078125, -5.736572265625, -5.51806640625, -5.299560546875, -5.0810546875, -4.862548828125, -4.64404296875, -4.425537109375, -4.20703125, -3.988525390625, -3.77001953125, -3.551513671875, -3.3330078125, -3.114501953125, -2.89599609375, -2.677490234375, -2.458984375, -2.240478515625, -2.02197265625, -1.803466796875, -1.5849609375, -1.366455078125, -1.14794921875, -0.929443359375, -0.7109375, -0.492431640625, -0.27392578125, -0.055419921875, 0.1630859375, 0.381591796875, 0.60009765625, 0.818603515625, 1.037109375, 1.255615234375, 1.47412109375, 1.692626953125, 1.9111328125, 2.129638671875, 2.34814453125, 2.566650390625, 2.78515625, 3.003662109375, 3.22216796875, 3.440673828125, 3.6591796875, 3.877685546875, 4.09619140625, 4.314697265625, 4.533203125, 4.751708984375, 4.97021484375, 5.188720703125, 5.4072265625, 5.625732421875, 5.84423828125, 6.062744140625, 6.28125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 0.0, 2.0, 5.0, 5.0, 4.0, 4.0, 11.0, 16.0, 20.0, 23.0, 19.0, 29.0, 58.0, 103.0, 238.0, 2845.0, 364.0, 128.0, 68.0, 55.0, 22.0, 20.0, 12.0, 10.0, 3.0, 4.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.234375, -2.1780242919921875, -2.121673583984375, -2.0653228759765625, -2.00897216796875, -1.9526214599609375, -1.896270751953125, -1.8399200439453125, -1.7835693359375, -1.7272186279296875, -1.670867919921875, -1.6145172119140625, -1.55816650390625, -1.5018157958984375, -1.445465087890625, -1.3891143798828125, -1.332763671875, -1.2764129638671875, -1.220062255859375, -1.1637115478515625, -1.10736083984375, -1.0510101318359375, -0.994659423828125, -0.9383087158203125, -0.8819580078125, -0.8256072998046875, -0.769256591796875, -0.7129058837890625, -0.65655517578125, -0.6002044677734375, -0.543853759765625, -0.4875030517578125, -0.43115234375, -0.3748016357421875, -0.318450927734375, -0.2621002197265625, -0.20574951171875, -0.1493988037109375, -0.093048095703125, -0.0366973876953125, 0.0196533203125, 0.0760040283203125, 0.132354736328125, 0.1887054443359375, 0.24505615234375, 0.3014068603515625, 0.357757568359375, 0.4141082763671875, 0.470458984375, 0.5268096923828125, 0.583160400390625, 0.6395111083984375, 0.69586181640625, 0.7522125244140625, 0.808563232421875, 0.8649139404296875, 0.9212646484375, 0.9776153564453125, 1.033966064453125, 1.0903167724609375, 1.14666748046875, 1.2030181884765625, 1.259368896484375, 1.3157196044921875, 1.3720703125]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 0.0, 5.0, 7.0, 9.0, 22.0, 30.0, 48.0, 71.0, 119.0, 134.0, 175.0, 166.0, 100.0, 61.0, 29.0, 14.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-19.355575561523438, -18.96014404296875, -18.56471061706543, -18.169279098510742, -17.773845672607422, -17.378414154052734, -16.982982635498047, -16.587549209594727, -16.19211769104004, -15.796685218811035, -15.401252746582031, -15.005821228027344, -14.61038875579834, -14.214956283569336, -13.819524765014648, -13.424092292785645, -13.02865982055664, -12.633227348327637, -12.237794876098633, -11.842363357543945, -11.446930885314941, -11.051498413085938, -10.65606689453125, -10.260634422302246, -9.865201950073242, -9.469769477844238, -9.074337005615234, -8.678905487060547, -8.283473014831543, -7.888040542602539, -7.492608547210693, -7.097176551818848, -6.7017436027526855, -6.30631160736084, -5.910879135131836, -5.515446662902832, -5.120014667510986, -4.724582672119141, -4.329150199890137, -3.933717966079712, -3.538285732269287, -3.1428534984588623, -2.7474212646484375, -2.3519890308380127, -1.956556797027588, -1.561124563217163, -1.1656923294067383, -0.7702600955963135, -0.37482786178588867, 0.020604372024536133, 0.41603660583496094, 0.8114688396453857, 1.2069010734558105, 1.6023333072662354, 1.9977655410766602, 2.393197774887085, 2.7886300086975098, 3.1840622425079346, 3.5794944763183594, 3.974926710128784, 4.370358943939209, 4.765790939331055, 5.161223411560059, 5.5566558837890625, 5.952087879180908]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 5.0, 2.0, 8.0, 3.0, 6.0, 6.0, 9.0, 14.0, 11.0, 16.0, 18.0, 17.0, 22.0, 16.0, 21.0, 27.0, 30.0, 34.0, 38.0, 39.0, 35.0, 38.0, 36.0, 37.0, 39.0, 42.0, 28.0, 33.0, 37.0, 40.0, 29.0, 28.0, 28.0, 31.0, 23.0, 25.0, 23.0, 9.0, 17.0, 10.0, 13.0, 12.0, 7.0, 12.0, 5.0, 7.0, 3.0, 8.0, 5.0, 5.0, 1.0, 1.0, 1.0, 2.0], "bins": [-5.132979869842529, -4.982744216918945, -4.832508563995361, -4.682272911071777, -4.532036781311035, -4.381801128387451, -4.231565475463867, -4.081329822540283, -3.931094169616699, -3.7808585166931152, -3.6306228637695312, -3.480386972427368, -3.330151319503784, -3.1799156665802, -3.029679775238037, -2.879444122314453, -2.729208469390869, -2.578972816467285, -2.428737163543701, -2.278501272201538, -2.128265619277954, -1.9780299663543701, -1.8277941942214966, -1.677558422088623, -1.527322769165039, -1.377087116241455, -1.2268513441085815, -1.076615571975708, -0.926379919052124, -0.7761442065238953, -0.6259084939956665, -0.47567272186279297, -0.3254365921020508, -0.17520087957382202, -0.02496516704559326, 0.1252705454826355, 0.27550625801086426, 0.425741970539093, 0.5759776830673218, 0.7262134552001953, 0.8764491081237793, 1.0266847610473633, 1.1769205331802368, 1.3271563053131104, 1.4773919582366943, 1.6276276111602783, 1.7778633832931519, 1.9280991554260254, 2.0783348083496094, 2.2285704612731934, 2.3788061141967773, 2.5290420055389404, 2.6792776584625244, 2.8295133113861084, 2.9797492027282715, 3.1299848556518555, 3.2802205085754395, 3.4304561614990234, 3.5806918144226074, 3.7309277057647705, 3.8811633586883545, 4.031399250030518, 4.181634902954102, 4.3318705558776855, 4.4821062088012695]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 7.0, 5.0, 5.0, 6.0, 11.0, 12.0, 28.0, 45.0, 67.0, 128.0, 233.0, 483.0, 954.0, 2349.0, 6205.0, 19068.0, 70910.0, 278839.0, 457058.0, 154811.0, 38938.0, 11451.0, 3979.0, 1544.0, 677.0, 346.0, 175.0, 98.0, 51.0, 25.0, 15.0, 15.0, 3.0, 7.0, 10.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.939453125, -2.842376708984375, -2.74530029296875, -2.648223876953125, -2.5511474609375, -2.454071044921875, -2.35699462890625, -2.259918212890625, -2.162841796875, -2.065765380859375, -1.96868896484375, -1.871612548828125, -1.7745361328125, -1.677459716796875, -1.58038330078125, -1.483306884765625, -1.38623046875, -1.289154052734375, -1.19207763671875, -1.095001220703125, -0.9979248046875, -0.900848388671875, -0.80377197265625, -0.706695556640625, -0.609619140625, -0.512542724609375, -0.41546630859375, -0.318389892578125, -0.2213134765625, -0.124237060546875, -0.02716064453125, 0.069915771484375, 0.1669921875, 0.264068603515625, 0.36114501953125, 0.458221435546875, 0.5552978515625, 0.652374267578125, 0.74945068359375, 0.846527099609375, 0.943603515625, 1.040679931640625, 1.13775634765625, 1.234832763671875, 1.3319091796875, 1.428985595703125, 1.52606201171875, 1.623138427734375, 1.72021484375, 1.817291259765625, 1.91436767578125, 2.011444091796875, 2.1085205078125, 2.205596923828125, 2.30267333984375, 2.399749755859375, 2.496826171875, 2.593902587890625, 2.69097900390625, 2.788055419921875, 2.8851318359375, 2.982208251953125, 3.07928466796875, 3.176361083984375, 3.2734375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 8.0, 4.0, 12.0, 15.0, 15.0, 24.0, 32.0, 51.0, 73.0, 91.0, 97.0, 91.0, 94.0, 85.0, 88.0, 59.0, 49.0, 29.0, 23.0, 22.0, 14.0, 12.0, 4.0, 6.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4013671875, -1.3430633544921875, -1.284759521484375, -1.2264556884765625, -1.16815185546875, -1.1098480224609375, -1.051544189453125, -0.9932403564453125, -0.9349365234375, -0.8766326904296875, -0.818328857421875, -0.7600250244140625, -0.70172119140625, -0.6434173583984375, -0.585113525390625, -0.5268096923828125, -0.468505859375, -0.4102020263671875, -0.351898193359375, -0.2935943603515625, -0.23529052734375, -0.1769866943359375, -0.118682861328125, -0.0603790283203125, -0.0020751953125, 0.0562286376953125, 0.114532470703125, 0.1728363037109375, 0.23114013671875, 0.2894439697265625, 0.347747802734375, 0.4060516357421875, 0.46435546875, 0.5226593017578125, 0.580963134765625, 0.6392669677734375, 0.69757080078125, 0.7558746337890625, 0.814178466796875, 0.8724822998046875, 0.9307861328125, 0.9890899658203125, 1.047393798828125, 1.1056976318359375, 1.16400146484375, 1.2223052978515625, 1.280609130859375, 1.3389129638671875, 1.397216796875, 1.4555206298828125, 1.513824462890625, 1.5721282958984375, 1.63043212890625, 1.6887359619140625, 1.747039794921875, 1.8053436279296875, 1.8636474609375, 1.9219512939453125, 1.980255126953125, 2.0385589599609375, 2.09686279296875, 2.1551666259765625, 2.213470458984375, 2.2717742919921875, 2.330078125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 8.0, 4.0, 15.0, 23.0, 30.0, 57.0, 87.0, 140.0, 278.0, 529.0, 1335.0, 4419.0, 27167.0, 404348.0, 564616.0, 37165.0, 5475.0, 1555.0, 592.0, 282.0, 158.0, 103.0, 62.0, 32.0, 24.0, 14.0, 7.0, 5.0, 7.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.8359375, -6.6409912109375, -6.446044921875, -6.2510986328125, -6.05615234375, -5.8612060546875, -5.666259765625, -5.4713134765625, -5.2763671875, -5.0814208984375, -4.886474609375, -4.6915283203125, -4.49658203125, -4.3016357421875, -4.106689453125, -3.9117431640625, -3.716796875, -3.5218505859375, -3.326904296875, -3.1319580078125, -2.93701171875, -2.7420654296875, -2.547119140625, -2.3521728515625, -2.1572265625, -1.9622802734375, -1.767333984375, -1.5723876953125, -1.37744140625, -1.1824951171875, -0.987548828125, -0.7926025390625, -0.59765625, -0.4027099609375, -0.207763671875, -0.0128173828125, 0.18212890625, 0.3770751953125, 0.572021484375, 0.7669677734375, 0.9619140625, 1.1568603515625, 1.351806640625, 1.5467529296875, 1.74169921875, 1.9366455078125, 2.131591796875, 2.3265380859375, 2.521484375, 2.7164306640625, 2.911376953125, 3.1063232421875, 3.30126953125, 3.4962158203125, 3.691162109375, 3.8861083984375, 4.0810546875, 4.2760009765625, 4.470947265625, 4.6658935546875, 4.86083984375, 5.0557861328125, 5.250732421875, 5.4456787109375, 5.640625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 4.0, 5.0, 11.0, 10.0, 7.0, 14.0, 20.0, 15.0, 24.0, 40.0, 45.0, 39.0, 45.0, 71.0, 62.0, 64.0, 56.0, 61.0, 63.0, 47.0, 50.0, 48.0, 38.0, 34.0, 21.0, 23.0, 26.0, 16.0, 12.0, 9.0, 6.0, 6.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.00390625, -5.79351806640625, -5.5831298828125, -5.37274169921875, -5.162353515625, -4.95196533203125, -4.7415771484375, -4.53118896484375, -4.32080078125, -4.11041259765625, -3.9000244140625, -3.68963623046875, -3.479248046875, -3.26885986328125, -3.0584716796875, -2.84808349609375, -2.6376953125, -2.42730712890625, -2.2169189453125, -2.00653076171875, -1.796142578125, -1.58575439453125, -1.3753662109375, -1.16497802734375, -0.95458984375, -0.74420166015625, -0.5338134765625, -0.32342529296875, -0.113037109375, 0.09735107421875, 0.3077392578125, 0.51812744140625, 0.728515625, 0.93890380859375, 1.1492919921875, 1.35968017578125, 1.570068359375, 1.78045654296875, 1.9908447265625, 2.20123291015625, 2.41162109375, 2.62200927734375, 2.8323974609375, 3.04278564453125, 3.253173828125, 3.46356201171875, 3.6739501953125, 3.88433837890625, 4.0947265625, 4.30511474609375, 4.5155029296875, 4.72589111328125, 4.936279296875, 5.14666748046875, 5.3570556640625, 5.56744384765625, 5.77783203125, 5.98822021484375, 6.1986083984375, 6.40899658203125, 6.619384765625, 6.82977294921875, 7.0401611328125, 7.25054931640625, 7.4609375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 10.0, 9.0, 12.0, 28.0, 39.0, 54.0, 90.0, 197.0, 478.0, 1357.0, 7769.0, 307119.0, 715249.0, 13234.0, 1820.0, 593.0, 230.0, 97.0, 58.0, 40.0, 23.0, 13.0, 11.0, 8.0, 7.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.779296875, -3.665130615234375, -3.55096435546875, -3.436798095703125, -3.3226318359375, -3.208465576171875, -3.09429931640625, -2.980133056640625, -2.865966796875, -2.751800537109375, -2.63763427734375, -2.523468017578125, -2.4093017578125, -2.295135498046875, -2.18096923828125, -2.066802978515625, -1.95263671875, -1.838470458984375, -1.72430419921875, -1.610137939453125, -1.4959716796875, -1.381805419921875, -1.26763916015625, -1.153472900390625, -1.039306640625, -0.925140380859375, -0.81097412109375, -0.696807861328125, -0.5826416015625, -0.468475341796875, -0.35430908203125, -0.240142822265625, -0.1259765625, -0.011810302734375, 0.10235595703125, 0.216522216796875, 0.3306884765625, 0.444854736328125, 0.55902099609375, 0.673187255859375, 0.787353515625, 0.901519775390625, 1.01568603515625, 1.129852294921875, 1.2440185546875, 1.358184814453125, 1.47235107421875, 1.586517333984375, 1.70068359375, 1.814849853515625, 1.92901611328125, 2.043182373046875, 2.1573486328125, 2.271514892578125, 2.38568115234375, 2.499847412109375, 2.614013671875, 2.728179931640625, 2.84234619140625, 2.956512451171875, 3.0706787109375, 3.184844970703125, 3.29901123046875, 3.413177490234375, 3.52734375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 7.0, 5.0, 12.0, 10.0, 20.0, 31.0, 35.0, 36.0, 73.0, 82.0, 98.0, 113.0, 101.0, 83.0, 71.0, 50.0, 46.0, 42.0, 26.0, 15.0, 18.0, 13.0, 5.0, 2.0, 3.0, 3.0, 7.0, 3.0, 2.0], "bins": [-0.00048828125, -0.0004778541624546051, -0.0004674270749092102, -0.0004569999873638153, -0.0004465728998184204, -0.0004361458122730255, -0.0004257187247276306, -0.0004152916371822357, -0.0004048645496368408, -0.0003944374620914459, -0.000384010374546051, -0.00037358328700065613, -0.00036315619945526123, -0.00035272911190986633, -0.00034230202436447144, -0.00033187493681907654, -0.00032144784927368164, -0.00031102076172828674, -0.00030059367418289185, -0.00029016658663749695, -0.00027973949909210205, -0.00026931241154670715, -0.00025888532400131226, -0.00024845823645591736, -0.00023803114891052246, -0.00022760406136512756, -0.00021717697381973267, -0.00020674988627433777, -0.00019632279872894287, -0.00018589571118354797, -0.00017546862363815308, -0.00016504153609275818, -0.00015461444854736328, -0.00014418736100196838, -0.00013376027345657349, -0.0001233331859111786, -0.00011290609836578369, -0.0001024790108203888, -9.20519232749939e-05, -8.1624835729599e-05, -7.11977481842041e-05, -6.0770660638809204e-05, -5.034357309341431e-05, -3.991648554801941e-05, -2.9489398002624512e-05, -1.9062310457229614e-05, -8.635222911834717e-06, 1.7918646335601807e-06, 1.2218952178955078e-05, 2.2646039724349976e-05, 3.307312726974487e-05, 4.350021481513977e-05, 5.392730236053467e-05, 6.435438990592957e-05, 7.478147745132446e-05, 8.520856499671936e-05, 9.563565254211426e-05, 0.00010606274008750916, 0.00011648982763290405, 0.00012691691517829895, 0.00013734400272369385, 0.00014777109026908875, 0.00015819817781448364, 0.00016862526535987854, 0.00017905235290527344]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 3.0, 8.0, 8.0, 13.0, 20.0, 43.0, 71.0, 167.0, 358.0, 962.0, 3451.0, 26764.0, 718476.0, 282798.0, 12024.0, 2125.0, 687.0, 275.0, 142.0, 62.0, 36.0, 18.0, 7.0, 11.0, 3.0, 5.0, 5.0, 0.0, 7.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.51171875, -2.42755126953125, -2.3433837890625, -2.25921630859375, -2.175048828125, -2.09088134765625, -2.0067138671875, -1.92254638671875, -1.83837890625, -1.75421142578125, -1.6700439453125, -1.58587646484375, -1.501708984375, -1.41754150390625, -1.3333740234375, -1.24920654296875, -1.1650390625, -1.08087158203125, -0.9967041015625, -0.91253662109375, -0.828369140625, -0.74420166015625, -0.6600341796875, -0.57586669921875, -0.49169921875, -0.40753173828125, -0.3233642578125, -0.23919677734375, -0.155029296875, -0.07086181640625, 0.0133056640625, 0.09747314453125, 0.181640625, 0.26580810546875, 0.3499755859375, 0.43414306640625, 0.518310546875, 0.60247802734375, 0.6866455078125, 0.77081298828125, 0.85498046875, 0.93914794921875, 1.0233154296875, 1.10748291015625, 1.191650390625, 1.27581787109375, 1.3599853515625, 1.44415283203125, 1.5283203125, 1.61248779296875, 1.6966552734375, 1.78082275390625, 1.864990234375, 1.94915771484375, 2.0333251953125, 2.11749267578125, 2.20166015625, 2.28582763671875, 2.3699951171875, 2.45416259765625, 2.538330078125, 2.62249755859375, 2.7066650390625, 2.79083251953125, 2.875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 6.0, 6.0, 6.0, 15.0, 24.0, 34.0, 46.0, 99.0, 120.0, 145.0, 147.0, 126.0, 73.0, 68.0, 28.0, 30.0, 14.0, 11.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.439453125, -3.341064453125, -3.24267578125, -3.144287109375, -3.0458984375, -2.947509765625, -2.84912109375, -2.750732421875, -2.65234375, -2.553955078125, -2.45556640625, -2.357177734375, -2.2587890625, -2.160400390625, -2.06201171875, -1.963623046875, -1.865234375, -1.766845703125, -1.66845703125, -1.570068359375, -1.4716796875, -1.373291015625, -1.27490234375, -1.176513671875, -1.078125, -0.979736328125, -0.88134765625, -0.782958984375, -0.6845703125, -0.586181640625, -0.48779296875, -0.389404296875, -0.291015625, -0.192626953125, -0.09423828125, 0.004150390625, 0.1025390625, 0.200927734375, 0.29931640625, 0.397705078125, 0.49609375, 0.594482421875, 0.69287109375, 0.791259765625, 0.8896484375, 0.988037109375, 1.08642578125, 1.184814453125, 1.283203125, 1.381591796875, 1.47998046875, 1.578369140625, 1.6767578125, 1.775146484375, 1.87353515625, 1.971923828125, 2.0703125, 2.168701171875, 2.26708984375, 2.365478515625, 2.4638671875, 2.562255859375, 2.66064453125, 2.759033203125, 2.857421875]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 5.0, 10.0, 18.0, 24.0, 45.0, 52.0, 84.0, 105.0, 144.0, 150.0, 106.0, 84.0, 65.0, 38.0, 24.0, 14.0, 7.0, 7.0, 9.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.288166046142578, -22.266162872314453, -21.244159698486328, -20.222156524658203, -19.200153350830078, -18.178150177001953, -17.156147003173828, -16.134143829345703, -15.112140655517578, -14.090137481689453, -13.068134307861328, -12.046131134033203, -11.024127960205078, -10.002124786376953, -8.980121612548828, -7.958118438720703, -6.936115264892578, -5.914112091064453, -4.892108917236328, -3.870105743408203, -2.848102569580078, -1.8260993957519531, -0.8040962219238281, 0.21790695190429688, 1.2399101257324219, 2.261913299560547, 3.283916473388672, 4.305919647216797, 5.327922821044922, 6.349925994873047, 7.371929168701172, 8.393932342529297, 9.415931701660156, 10.437934875488281, 11.459938049316406, 12.481941223144531, 13.503944396972656, 14.525947570800781, 15.547950744628906, 16.56995391845703, 17.591957092285156, 18.61396026611328, 19.635963439941406, 20.65796661376953, 21.679969787597656, 22.70197296142578, 23.723976135253906, 24.74597930908203, 25.767982482910156, 26.78998565673828, 27.811988830566406, 28.83399200439453, 29.855995178222656, 30.87799835205078, 31.900001525878906, 32.92200469970703, 33.944007873535156, 34.96601104736328, 35.988014221191406, 37.01001739501953, 38.032020568847656, 39.05402374267578, 40.076026916503906, 41.09803009033203, 42.120033264160156]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 8.0, 4.0, 6.0, 4.0, 23.0, 22.0, 20.0, 35.0, 41.0, 37.0, 41.0, 70.0, 53.0, 66.0, 83.0, 73.0, 57.0, 58.0, 49.0, 54.0, 41.0, 40.0, 26.0, 17.0, 17.0, 17.0, 12.0, 15.0, 7.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.04898452758789, -41.99481964111328, -40.94065856933594, -39.88649368286133, -38.83232879638672, -37.778167724609375, -36.724002838134766, -35.669837951660156, -34.61567687988281, -33.5615119934082, -32.50735092163086, -31.45318603515625, -30.399023056030273, -29.344860076904297, -28.290695190429688, -27.23653221130371, -26.1823673248291, -25.128204345703125, -24.074039459228516, -23.01987648010254, -21.965713500976562, -20.911548614501953, -19.857385635375977, -18.80322265625, -17.74905776977539, -16.694894790649414, -15.640730857849121, -14.586566925048828, -13.532403945922852, -12.478240013122559, -11.424076080322266, -10.369913101196289, -9.315750122070312, -8.26158618927002, -7.207423210144043, -6.15325927734375, -5.099095821380615, -4.0449323654174805, -2.9907684326171875, -1.9366049766540527, -0.882441520690918, 0.17172205448150635, 1.2258856296539307, 2.2800493240356445, 3.3342127799987793, 4.388376235961914, 5.442540168762207, 6.496703624725342, 7.550867080688477, 8.60503101348877, 9.659193992614746, 10.713357925415039, 11.767520904541016, 12.821684837341309, 13.875848770141602, 14.930011749267578, 15.984175682067871, 17.038339614868164, 18.09250259399414, 19.14666748046875, 20.200830459594727, 21.254993438720703, 22.309158325195312, 23.36332130432129, 24.417484283447266]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 7.0, 3.0, 12.0, 10.0, 11.0, 19.0, 30.0, 29.0, 26.0, 33.0, 80.0, 124.0, 205.0, 417.0, 1140.0, 4761.0, 39581.0, 3667780.0, 456034.0, 19420.0, 3448.0, 741.0, 234.0, 79.0, 34.0, 11.0, 9.0, 4.0, 4.0], "bins": [-9.2421875, -9.067214965820312, -8.892242431640625, -8.717269897460938, -8.54229736328125, -8.367324829101562, -8.192352294921875, -8.017379760742188, -7.8424072265625, -7.6674346923828125, -7.492462158203125, -7.3174896240234375, -7.14251708984375, -6.9675445556640625, -6.792572021484375, -6.6175994873046875, -6.442626953125, -6.2676544189453125, -6.092681884765625, -5.9177093505859375, -5.74273681640625, -5.5677642822265625, -5.392791748046875, -5.2178192138671875, -5.0428466796875, -4.8678741455078125, -4.692901611328125, -4.5179290771484375, -4.34295654296875, -4.1679840087890625, -3.993011474609375, -3.8180389404296875, -3.64306640625, -3.4680938720703125, -3.293121337890625, -3.1181488037109375, -2.94317626953125, -2.7682037353515625, -2.593231201171875, -2.4182586669921875, -2.2432861328125, -2.0683135986328125, -1.893341064453125, -1.7183685302734375, -1.54339599609375, -1.3684234619140625, -1.193450927734375, -1.0184783935546875, -0.843505859375, -0.6685333251953125, -0.493560791015625, -0.3185882568359375, -0.14361572265625, 0.0313568115234375, 0.206329345703125, 0.3813018798828125, 0.5562744140625, 0.7312469482421875, 0.906219482421875, 1.0811920166015625, 1.25616455078125, 1.4311370849609375, 1.606109619140625, 1.7810821533203125, 1.9560546875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 5.0, 18.0, 30.0, 74.0, 124.0, 161.0, 162.0, 135.0, 118.0, 80.0, 40.0, 20.0, 18.0, 12.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.79296875, -4.698089599609375, -4.60321044921875, -4.508331298828125, -4.4134521484375, -4.318572998046875, -4.22369384765625, -4.128814697265625, -4.033935546875, -3.939056396484375, -3.84417724609375, -3.749298095703125, -3.6544189453125, -3.559539794921875, -3.46466064453125, -3.369781494140625, -3.27490234375, -3.180023193359375, -3.08514404296875, -2.990264892578125, -2.8953857421875, -2.800506591796875, -2.70562744140625, -2.610748291015625, -2.515869140625, -2.420989990234375, -2.32611083984375, -2.231231689453125, -2.1363525390625, -2.041473388671875, -1.94659423828125, -1.851715087890625, -1.7568359375, -1.661956787109375, -1.56707763671875, -1.472198486328125, -1.3773193359375, -1.282440185546875, -1.18756103515625, -1.092681884765625, -0.997802734375, -0.902923583984375, -0.80804443359375, -0.713165283203125, -0.6182861328125, -0.523406982421875, -0.42852783203125, -0.333648681640625, -0.23876953125, -0.143890380859375, -0.04901123046875, 0.045867919921875, 0.1407470703125, 0.235626220703125, 0.33050537109375, 0.425384521484375, 0.520263671875, 0.615142822265625, 0.71002197265625, 0.804901123046875, 0.8997802734375, 0.994659423828125, 1.08953857421875, 1.184417724609375, 1.279296875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 4.0, 0.0, 3.0, 2.0, 4.0, 3.0, 4.0, 7.0, 6.0, 7.0, 19.0, 18.0, 23.0, 35.0, 66.0, 85.0, 156.0, 234.0, 410.0, 740.0, 1443.0, 3105.0, 7946.0, 25835.0, 122235.0, 2858786.0, 1062536.0, 80266.0, 18895.0, 6227.0, 2445.0, 1240.0, 662.0, 308.0, 204.0, 96.0, 77.0, 48.0, 31.0, 15.0, 14.0, 9.0, 13.0, 8.0, 5.0, 7.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.421875, -3.314544677734375, -3.20721435546875, -3.099884033203125, -2.9925537109375, -2.885223388671875, -2.77789306640625, -2.670562744140625, -2.563232421875, -2.455902099609375, -2.34857177734375, -2.241241455078125, -2.1339111328125, -2.026580810546875, -1.91925048828125, -1.811920166015625, -1.70458984375, -1.597259521484375, -1.48992919921875, -1.382598876953125, -1.2752685546875, -1.167938232421875, -1.06060791015625, -0.953277587890625, -0.845947265625, -0.738616943359375, -0.63128662109375, -0.523956298828125, -0.4166259765625, -0.309295654296875, -0.20196533203125, -0.094635009765625, 0.0126953125, 0.120025634765625, 0.22735595703125, 0.334686279296875, 0.4420166015625, 0.549346923828125, 0.65667724609375, 0.764007568359375, 0.871337890625, 0.978668212890625, 1.08599853515625, 1.193328857421875, 1.3006591796875, 1.407989501953125, 1.51531982421875, 1.622650146484375, 1.72998046875, 1.837310791015625, 1.94464111328125, 2.051971435546875, 2.1593017578125, 2.266632080078125, 2.37396240234375, 2.481292724609375, 2.588623046875, 2.695953369140625, 2.80328369140625, 2.910614013671875, 3.0179443359375, 3.125274658203125, 3.23260498046875, 3.339935302734375, 3.447265625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 9.0, 3.0, 5.0, 9.0, 20.0, 19.0, 32.0, 48.0, 75.0, 140.0, 292.0, 878.0, 1313.0, 648.0, 219.0, 133.0, 75.0, 48.0, 35.0, 28.0, 13.0, 6.0, 12.0, 4.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.51953125, -5.3680419921875, -5.216552734375, -5.0650634765625, -4.91357421875, -4.7620849609375, -4.610595703125, -4.4591064453125, -4.3076171875, -4.1561279296875, -4.004638671875, -3.8531494140625, -3.70166015625, -3.5501708984375, -3.398681640625, -3.2471923828125, -3.095703125, -2.9442138671875, -2.792724609375, -2.6412353515625, -2.48974609375, -2.3382568359375, -2.186767578125, -2.0352783203125, -1.8837890625, -1.7322998046875, -1.580810546875, -1.4293212890625, -1.27783203125, -1.1263427734375, -0.974853515625, -0.8233642578125, -0.671875, -0.5203857421875, -0.368896484375, -0.2174072265625, -0.06591796875, 0.0855712890625, 0.237060546875, 0.3885498046875, 0.5400390625, 0.6915283203125, 0.843017578125, 0.9945068359375, 1.14599609375, 1.2974853515625, 1.448974609375, 1.6004638671875, 1.751953125, 1.9034423828125, 2.054931640625, 2.2064208984375, 2.35791015625, 2.5093994140625, 2.660888671875, 2.8123779296875, 2.9638671875, 3.1153564453125, 3.266845703125, 3.4183349609375, 3.56982421875, 3.7213134765625, 3.872802734375, 4.0242919921875, 4.17578125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 10.0, 18.0, 39.0, 48.0, 88.0, 109.0, 158.0, 167.0, 143.0, 85.0, 47.0, 30.0, 16.0, 12.0, 9.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.949365615844727, -24.043842315673828, -23.138317108154297, -22.2327938079834, -21.327268600463867, -20.42174530029297, -19.516220092773438, -18.61069679260254, -17.70517349243164, -16.799650192260742, -15.894124984741211, -14.988601684570312, -14.083076477050781, -13.177553176879883, -12.272028923034668, -11.366504669189453, -10.460979461669922, -9.555455207824707, -8.649930953979492, -7.7444071769714355, -6.838882923126221, -5.933358669281006, -5.027834892272949, -4.122310638427734, -3.2167863845825195, -2.3112621307373047, -1.405738115310669, -0.5002140998840332, 0.40531015396118164, 1.3108344078063965, 2.216358184814453, 3.121882438659668, 4.02740478515625, 4.932929039001465, 5.83845329284668, 6.743977069854736, 7.649501323699951, 8.555025100708008, 9.460549354553223, 10.366073608398438, 11.271597862243652, 12.177122116088867, 13.082646369934082, 13.988170623779297, 14.893693923950195, 15.799219131469727, 16.704742431640625, 17.610267639160156, 18.515790939331055, 19.421314239501953, 20.326839447021484, 21.232362747192383, 22.137887954711914, 23.043411254882812, 23.948936462402344, 24.854459762573242, 25.75998306274414, 26.66550636291504, 27.57103157043457, 28.47655487060547, 29.382080078125, 30.2876033782959, 31.193126678466797, 32.09865188598633, 33.00417709350586]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 5.0, 8.0, 17.0, 9.0, 25.0, 35.0, 27.0, 45.0, 52.0, 67.0, 73.0, 79.0, 78.0, 70.0, 72.0, 70.0, 66.0, 52.0, 40.0, 29.0, 32.0, 19.0, 14.0, 7.0, 6.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.357948303222656, -16.51941680908203, -15.68088436126709, -14.842352867126465, -14.003820419311523, -13.165288925170898, -12.326757431030273, -11.488224983215332, -10.64969253540039, -9.811161041259766, -8.972628593444824, -8.1340970993042, -7.295564651489258, -6.457033157348633, -5.61850118637085, -4.779969215393066, -3.9414377212524414, -3.102905750274658, -2.264373779296875, -1.425842046737671, -0.5873100757598877, 0.2512216567993164, 1.0897536277770996, 1.9282855987548828, 2.766817569732666, 3.605349540710449, 4.443881511688232, 5.282413482666016, 6.120944976806641, 6.959476947784424, 7.798008918762207, 8.636541366577148, 9.475072860717773, 10.313604354858398, 11.15213680267334, 11.990668296813965, 12.829200744628906, 13.667732238769531, 14.506263732910156, 15.344796180725098, 16.18332862854004, 17.021860122680664, 17.86039161682129, 18.698925018310547, 19.537456512451172, 20.375988006591797, 21.214519500732422, 22.053050994873047, 22.891582489013672, 23.730113983154297, 24.568645477294922, 25.40717887878418, 26.245710372924805, 27.08424186706543, 27.922773361206055, 28.761306762695312, 29.599838256835938, 30.438369750976562, 31.276901245117188, 32.11543273925781, 32.95396423339844, 33.79249572753906, 34.63103103637695, 35.46956253051758, 36.3080940246582]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 5.0, 8.0, 10.0, 14.0, 21.0, 32.0, 68.0, 94.0, 200.0, 347.0, 773.0, 1685.0, 4210.0, 12335.0, 40486.0, 142520.0, 420188.0, 301727.0, 85617.0, 24863.0, 7997.0, 2886.0, 1271.0, 591.0, 282.0, 134.0, 83.0, 46.0, 23.0, 13.0, 11.0, 9.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.255859375, -2.17169189453125, -2.0875244140625, -2.00335693359375, -1.919189453125, -1.83502197265625, -1.7508544921875, -1.66668701171875, -1.58251953125, -1.49835205078125, -1.4141845703125, -1.33001708984375, -1.245849609375, -1.16168212890625, -1.0775146484375, -0.99334716796875, -0.9091796875, -0.82501220703125, -0.7408447265625, -0.65667724609375, -0.572509765625, -0.48834228515625, -0.4041748046875, -0.32000732421875, -0.23583984375, -0.15167236328125, -0.0675048828125, 0.01666259765625, 0.100830078125, 0.18499755859375, 0.2691650390625, 0.35333251953125, 0.4375, 0.52166748046875, 0.6058349609375, 0.69000244140625, 0.774169921875, 0.85833740234375, 0.9425048828125, 1.02667236328125, 1.11083984375, 1.19500732421875, 1.2791748046875, 1.36334228515625, 1.447509765625, 1.53167724609375, 1.6158447265625, 1.70001220703125, 1.7841796875, 1.86834716796875, 1.9525146484375, 2.03668212890625, 2.120849609375, 2.20501708984375, 2.2891845703125, 2.37335205078125, 2.45751953125, 2.54168701171875, 2.6258544921875, 2.71002197265625, 2.794189453125, 2.87835693359375, 2.9625244140625, 3.04669189453125, 3.130859375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 6.0, 9.0, 10.0, 19.0, 18.0, 30.0, 35.0, 51.0, 57.0, 70.0, 81.0, 95.0, 72.0, 77.0, 82.0, 57.0, 47.0, 42.0, 51.0, 32.0, 17.0, 14.0, 13.0, 8.0, 5.0, 1.0, 4.0, 0.0, 4.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.185546875, -2.1351776123046875, -2.084808349609375, -2.0344390869140625, -1.98406982421875, -1.9337005615234375, -1.883331298828125, -1.8329620361328125, -1.7825927734375, -1.7322235107421875, -1.681854248046875, -1.6314849853515625, -1.58111572265625, -1.5307464599609375, -1.480377197265625, -1.4300079345703125, -1.379638671875, -1.3292694091796875, -1.278900146484375, -1.2285308837890625, -1.17816162109375, -1.1277923583984375, -1.077423095703125, -1.0270538330078125, -0.9766845703125, -0.9263153076171875, -0.875946044921875, -0.8255767822265625, -0.77520751953125, -0.7248382568359375, -0.674468994140625, -0.6240997314453125, -0.57373046875, -0.5233612060546875, -0.472991943359375, -0.4226226806640625, -0.37225341796875, -0.3218841552734375, -0.271514892578125, -0.2211456298828125, -0.1707763671875, -0.1204071044921875, -0.070037841796875, -0.0196685791015625, 0.03070068359375, 0.0810699462890625, 0.131439208984375, 0.1818084716796875, 0.232177734375, 0.2825469970703125, 0.332916259765625, 0.3832855224609375, 0.43365478515625, 0.4840240478515625, 0.534393310546875, 0.5847625732421875, 0.6351318359375, 0.6855010986328125, 0.735870361328125, 0.7862396240234375, 0.83660888671875, 0.8869781494140625, 0.937347412109375, 0.9877166748046875, 1.0380859375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 5.0, 5.0, 6.0, 9.0, 5.0, 19.0, 11.0, 36.0, 44.0, 71.0, 109.0, 192.0, 296.0, 480.0, 900.0, 1733.0, 4454.0, 16596.0, 98496.0, 613986.0, 260254.0, 37232.0, 8168.0, 2659.0, 1217.0, 580.0, 359.0, 223.0, 147.0, 87.0, 75.0, 37.0, 25.0, 13.0, 14.0, 5.0, 5.0, 5.0, 6.0, 0.0, 3.0, 1.0, 1.0], "bins": [-4.9375, -4.816314697265625, -4.69512939453125, -4.573944091796875, -4.4527587890625, -4.331573486328125, -4.21038818359375, -4.089202880859375, -3.968017578125, -3.846832275390625, -3.72564697265625, -3.604461669921875, -3.4832763671875, -3.362091064453125, -3.24090576171875, -3.119720458984375, -2.99853515625, -2.877349853515625, -2.75616455078125, -2.634979248046875, -2.5137939453125, -2.392608642578125, -2.27142333984375, -2.150238037109375, -2.029052734375, -1.907867431640625, -1.78668212890625, -1.665496826171875, -1.5443115234375, -1.423126220703125, -1.30194091796875, -1.180755615234375, -1.0595703125, -0.938385009765625, -0.81719970703125, -0.696014404296875, -0.5748291015625, -0.453643798828125, -0.33245849609375, -0.211273193359375, -0.090087890625, 0.031097412109375, 0.15228271484375, 0.273468017578125, 0.3946533203125, 0.515838623046875, 0.63702392578125, 0.758209228515625, 0.87939453125, 1.000579833984375, 1.12176513671875, 1.242950439453125, 1.3641357421875, 1.485321044921875, 1.60650634765625, 1.727691650390625, 1.848876953125, 1.970062255859375, 2.09124755859375, 2.212432861328125, 2.3336181640625, 2.454803466796875, 2.57598876953125, 2.697174072265625, 2.818359375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 2.0, 3.0, 0.0, 4.0, 9.0, 4.0, 12.0, 11.0, 17.0, 23.0, 32.0, 26.0, 22.0, 27.0, 41.0, 39.0, 37.0, 46.0, 47.0, 36.0, 54.0, 45.0, 44.0, 49.0, 44.0, 45.0, 43.0, 39.0, 24.0, 31.0, 24.0, 13.0, 20.0, 14.0, 10.0, 9.0, 19.0, 8.0, 9.0, 13.0, 1.0, 3.0, 2.0, 0.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.10546875, -4.948486328125, -4.79150390625, -4.634521484375, -4.4775390625, -4.320556640625, -4.16357421875, -4.006591796875, -3.849609375, -3.692626953125, -3.53564453125, -3.378662109375, -3.2216796875, -3.064697265625, -2.90771484375, -2.750732421875, -2.59375, -2.436767578125, -2.27978515625, -2.122802734375, -1.9658203125, -1.808837890625, -1.65185546875, -1.494873046875, -1.337890625, -1.180908203125, -1.02392578125, -0.866943359375, -0.7099609375, -0.552978515625, -0.39599609375, -0.239013671875, -0.08203125, 0.074951171875, 0.23193359375, 0.388916015625, 0.5458984375, 0.702880859375, 0.85986328125, 1.016845703125, 1.173828125, 1.330810546875, 1.48779296875, 1.644775390625, 1.8017578125, 1.958740234375, 2.11572265625, 2.272705078125, 2.4296875, 2.586669921875, 2.74365234375, 2.900634765625, 3.0576171875, 3.214599609375, 3.37158203125, 3.528564453125, 3.685546875, 3.842529296875, 3.99951171875, 4.156494140625, 4.3134765625, 4.470458984375, 4.62744140625, 4.784423828125, 4.94140625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 5.0, 16.0, 26.0, 38.0, 75.0, 147.0, 409.0, 1316.0, 7854.0, 224487.0, 791732.0, 19228.0, 2239.0, 568.0, 201.0, 109.0, 48.0, 26.0, 18.0, 10.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.228515625, -3.134033203125, -3.03955078125, -2.945068359375, -2.8505859375, -2.756103515625, -2.66162109375, -2.567138671875, -2.47265625, -2.378173828125, -2.28369140625, -2.189208984375, -2.0947265625, -2.000244140625, -1.90576171875, -1.811279296875, -1.716796875, -1.622314453125, -1.52783203125, -1.433349609375, -1.3388671875, -1.244384765625, -1.14990234375, -1.055419921875, -0.9609375, -0.866455078125, -0.77197265625, -0.677490234375, -0.5830078125, -0.488525390625, -0.39404296875, -0.299560546875, -0.205078125, -0.110595703125, -0.01611328125, 0.078369140625, 0.1728515625, 0.267333984375, 0.36181640625, 0.456298828125, 0.55078125, 0.645263671875, 0.73974609375, 0.834228515625, 0.9287109375, 1.023193359375, 1.11767578125, 1.212158203125, 1.306640625, 1.401123046875, 1.49560546875, 1.590087890625, 1.6845703125, 1.779052734375, 1.87353515625, 1.968017578125, 2.0625, 2.156982421875, 2.25146484375, 2.345947265625, 2.4404296875, 2.534912109375, 2.62939453125, 2.723876953125, 2.818359375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 6.0, 10.0, 10.0, 11.0, 26.0, 31.0, 45.0, 51.0, 84.0, 96.0, 122.0, 139.0, 107.0, 77.0, 67.0, 41.0, 26.0, 23.0, 12.0, 5.0, 6.0, 2.0, 2.0, 0.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00032973289489746094, -0.00031743571162223816, -0.0003051385283470154, -0.0002928413450717926, -0.0002805441617965698, -0.00026824697852134705, -0.00025594979524612427, -0.0002436526119709015, -0.0002313554286956787, -0.00021905824542045593, -0.00020676106214523315, -0.00019446387887001038, -0.0001821666955947876, -0.00016986951231956482, -0.00015757232904434204, -0.00014527514576911926, -0.00013297796249389648, -0.0001206807792186737, -0.00010838359594345093, -9.608641266822815e-05, -8.378922939300537e-05, -7.149204611778259e-05, -5.9194862842559814e-05, -4.6897679567337036e-05, -3.460049629211426e-05, -2.230331301689148e-05, -1.0006129741668701e-05, 2.291053533554077e-06, 1.4588236808776855e-05, 2.6885420083999634e-05, 3.918260335922241e-05, 5.147978663444519e-05, 6.377696990966797e-05, 7.607415318489075e-05, 8.837133646011353e-05, 0.0001006685197353363, 0.00011296570301055908, 0.00012526288628578186, 0.00013756006956100464, 0.00014985725283622742, 0.0001621544361114502, 0.00017445161938667297, 0.00018674880266189575, 0.00019904598593711853, 0.0002113431692123413, 0.0002236403524875641, 0.00023593753576278687, 0.00024823471903800964, 0.0002605319023132324, 0.0002728290855884552, 0.000285126268863678, 0.00029742345213890076, 0.00030972063541412354, 0.0003220178186893463, 0.0003343150019645691, 0.00034661218523979187, 0.00035890936851501465, 0.0003712065517902374, 0.0003835037350654602, 0.000395800918340683, 0.00040809810161590576, 0.00042039528489112854, 0.0004326924681663513, 0.0004449896514415741, 0.0004572868347167969]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 6.0, 4.0, 13.0, 16.0, 22.0, 25.0, 33.0, 57.0, 60.0, 96.0, 154.0, 280.0, 493.0, 957.0, 2186.0, 6016.0, 23372.0, 148457.0, 667881.0, 162650.0, 24812.0, 6411.0, 2339.0, 973.0, 504.0, 278.0, 165.0, 97.0, 60.0, 32.0, 32.0, 17.0, 13.0, 11.0, 7.0, 11.0, 5.0, 3.0, 2.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.25, -1.20904541015625, -1.1680908203125, -1.12713623046875, -1.086181640625, -1.04522705078125, -1.0042724609375, -0.96331787109375, -0.92236328125, -0.88140869140625, -0.8404541015625, -0.79949951171875, -0.758544921875, -0.71759033203125, -0.6766357421875, -0.63568115234375, -0.5947265625, -0.55377197265625, -0.5128173828125, -0.47186279296875, -0.430908203125, -0.38995361328125, -0.3489990234375, -0.30804443359375, -0.26708984375, -0.22613525390625, -0.1851806640625, -0.14422607421875, -0.103271484375, -0.06231689453125, -0.0213623046875, 0.01959228515625, 0.060546875, 0.10150146484375, 0.1424560546875, 0.18341064453125, 0.224365234375, 0.26531982421875, 0.3062744140625, 0.34722900390625, 0.38818359375, 0.42913818359375, 0.4700927734375, 0.51104736328125, 0.552001953125, 0.59295654296875, 0.6339111328125, 0.67486572265625, 0.7158203125, 0.75677490234375, 0.7977294921875, 0.83868408203125, 0.879638671875, 0.92059326171875, 0.9615478515625, 1.00250244140625, 1.04345703125, 1.08441162109375, 1.1253662109375, 1.16632080078125, 1.207275390625, 1.24822998046875, 1.2891845703125, 1.33013916015625, 1.37109375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 5.0, 1.0, 6.0, 6.0, 7.0, 8.0, 15.0, 15.0, 28.0, 32.0, 43.0, 45.0, 51.0, 63.0, 87.0, 93.0, 75.0, 103.0, 71.0, 61.0, 44.0, 38.0, 33.0, 26.0, 18.0, 13.0, 8.0, 5.0, 4.0, 0.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.12109375, -1.0718994140625, -1.022705078125, -0.9735107421875, -0.92431640625, -0.8751220703125, -0.825927734375, -0.7767333984375, -0.7275390625, -0.6783447265625, -0.629150390625, -0.5799560546875, -0.53076171875, -0.4815673828125, -0.432373046875, -0.3831787109375, -0.333984375, -0.2847900390625, -0.235595703125, -0.1864013671875, -0.13720703125, -0.0880126953125, -0.038818359375, 0.0103759765625, 0.0595703125, 0.1087646484375, 0.157958984375, 0.2071533203125, 0.25634765625, 0.3055419921875, 0.354736328125, 0.4039306640625, 0.453125, 0.5023193359375, 0.551513671875, 0.6007080078125, 0.64990234375, 0.6990966796875, 0.748291015625, 0.7974853515625, 0.8466796875, 0.8958740234375, 0.945068359375, 0.9942626953125, 1.04345703125, 1.0926513671875, 1.141845703125, 1.1910400390625, 1.240234375, 1.2894287109375, 1.338623046875, 1.3878173828125, 1.43701171875, 1.4862060546875, 1.535400390625, 1.5845947265625, 1.6337890625, 1.6829833984375, 1.732177734375, 1.7813720703125, 1.83056640625, 1.8797607421875, 1.928955078125, 1.9781494140625, 2.02734375]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 1.0, 2.0, 3.0, 2.0, 8.0, 2.0, 16.0, 49.0, 126.0, 236.0, 284.0, 160.0, 77.0, 23.0, 9.0, 7.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.383113861083984, -23.91530990600586, -22.447507858276367, -20.979703903198242, -19.51190185546875, -18.044097900390625, -16.5762939453125, -15.108490943908691, -13.640687942504883, -12.172884941101074, -10.705081939697266, -9.23727798461914, -7.769474983215332, -6.301671981811523, -4.833868026733398, -3.36606502532959, -1.8982620239257812, -0.43045878410339355, 1.0373444557189941, 2.505147933959961, 3.9729509353637695, 5.440753936767578, 6.908557891845703, 8.376360893249512, 9.84416389465332, 11.311966896057129, 12.779769897460938, 14.247573852539062, 15.715376853942871, 17.18317985534668, 18.650983810424805, 20.118785858154297, 21.586585998535156, 23.05438995361328, 24.522192001342773, 25.9899959564209, 27.45779800415039, 28.925601959228516, 30.39340591430664, 31.861209869384766, 33.329010009765625, 34.79681396484375, 36.264617919921875, 37.732421875, 39.20022201538086, 40.668025970458984, 42.13582992553711, 43.603633880615234, 45.07143783569336, 46.539241790771484, 48.00704574584961, 49.47484588623047, 50.942649841308594, 52.41045379638672, 53.878257751464844, 55.34606170654297, 56.813865661621094, 58.28166961669922, 59.749473571777344, 61.21727752685547, 62.68507766723633, 64.15287780761719, 65.62068176269531, 67.08848571777344, 68.55628967285156]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 9.0, 7.0, 9.0, 10.0, 16.0, 14.0, 22.0, 27.0, 30.0, 39.0, 47.0, 56.0, 34.0, 51.0, 56.0, 71.0, 68.0, 68.0, 58.0, 39.0, 46.0, 40.0, 27.0, 22.0, 26.0, 24.0, 20.0, 10.0, 8.0, 11.0, 6.0, 11.0, 5.0, 3.0, 2.0, 2.0, 4.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.10374641418457, -19.4123477935791, -18.720947265625, -18.02954864501953, -17.338150024414062, -16.646751403808594, -15.955351829528809, -15.263952255249023, -14.572553634643555, -13.881155014038086, -13.1897554397583, -12.498355865478516, -11.806957244873047, -11.115558624267578, -10.424159049987793, -9.732759475708008, -9.041360855102539, -8.34996223449707, -7.658562660217285, -6.967163562774658, -6.275764465332031, -5.584365367889404, -4.892966270446777, -4.20156717300415, -3.5101680755615234, -2.8187689781188965, -2.1273698806762695, -1.4359707832336426, -0.7445716857910156, -0.05317258834838867, 0.6382265090942383, 1.3296256065368652, 2.021026611328125, 2.712425708770752, 3.403824806213379, 4.095223903656006, 4.786623001098633, 5.47802209854126, 6.169421195983887, 6.860820293426514, 7.552219390869141, 8.24361801147461, 8.935017585754395, 9.62641716003418, 10.317815780639648, 11.009214401245117, 11.700613975524902, 12.392013549804688, 13.083412170410156, 13.774810791015625, 14.46621036529541, 15.157609939575195, 15.849008560180664, 16.540407180786133, 17.231807708740234, 17.923206329345703, 18.614604949951172, 19.30600357055664, 19.99740219116211, 20.68880271911621, 21.38020133972168, 22.07159996032715, 22.76300048828125, 23.45439910888672, 24.145797729492188]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 9.0, 9.0, 15.0, 11.0, 42.0, 71.0, 118.0, 263.0, 788.0, 3068.0, 17658.0, 298147.0, 3796124.0, 66874.0, 8112.0, 1827.0, 581.0, 239.0, 143.0, 61.0, 46.0, 23.0, 9.0, 13.0, 6.0, 9.0, 9.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.92578125, -4.800445556640625, -4.67510986328125, -4.549774169921875, -4.4244384765625, -4.299102783203125, -4.17376708984375, -4.048431396484375, -3.923095703125, -3.797760009765625, -3.67242431640625, -3.547088623046875, -3.4217529296875, -3.296417236328125, -3.17108154296875, -3.045745849609375, -2.92041015625, -2.795074462890625, -2.66973876953125, -2.544403076171875, -2.4190673828125, -2.293731689453125, -2.16839599609375, -2.043060302734375, -1.917724609375, -1.792388916015625, -1.66705322265625, -1.541717529296875, -1.4163818359375, -1.291046142578125, -1.16571044921875, -1.040374755859375, -0.9150390625, -0.789703369140625, -0.66436767578125, -0.539031982421875, -0.4136962890625, -0.288360595703125, -0.16302490234375, -0.037689208984375, 0.087646484375, 0.212982177734375, 0.33831787109375, 0.463653564453125, 0.5889892578125, 0.714324951171875, 0.83966064453125, 0.964996337890625, 1.09033203125, 1.215667724609375, 1.34100341796875, 1.466339111328125, 1.5916748046875, 1.717010498046875, 1.84234619140625, 1.967681884765625, 2.093017578125, 2.218353271484375, 2.34368896484375, 2.469024658203125, 2.5943603515625, 2.719696044921875, 2.84503173828125, 2.970367431640625, 3.095703125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 4.0, 4.0, 11.0, 12.0, 13.0, 25.0, 22.0, 46.0, 66.0, 62.0, 75.0, 75.0, 73.0, 76.0, 80.0, 79.0, 71.0, 45.0, 45.0, 34.0, 35.0, 16.0, 13.0, 7.0, 8.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.77734375, -0.72998046875, -0.6826171875, -0.63525390625, -0.587890625, -0.54052734375, -0.4931640625, -0.44580078125, -0.3984375, -0.35107421875, -0.3037109375, -0.25634765625, -0.208984375, -0.16162109375, -0.1142578125, -0.06689453125, -0.01953125, 0.02783203125, 0.0751953125, 0.12255859375, 0.169921875, 0.21728515625, 0.2646484375, 0.31201171875, 0.359375, 0.40673828125, 0.4541015625, 0.50146484375, 0.548828125, 0.59619140625, 0.6435546875, 0.69091796875, 0.73828125, 0.78564453125, 0.8330078125, 0.88037109375, 0.927734375, 0.97509765625, 1.0224609375, 1.06982421875, 1.1171875, 1.16455078125, 1.2119140625, 1.25927734375, 1.306640625, 1.35400390625, 1.4013671875, 1.44873046875, 1.49609375, 1.54345703125, 1.5908203125, 1.63818359375, 1.685546875, 1.73291015625, 1.7802734375, 1.82763671875, 1.875, 1.92236328125, 1.9697265625, 2.01708984375, 2.064453125, 2.11181640625, 2.1591796875, 2.20654296875, 2.25390625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 8.0, 4.0, 17.0, 19.0, 45.0, 57.0, 98.0, 227.0, 376.0, 895.0, 2244.0, 6189.0, 19964.0, 92019.0, 1591393.0, 2333780.0, 112368.0, 23228.0, 6989.0, 2459.0, 1011.0, 446.0, 199.0, 118.0, 52.0, 27.0, 26.0, 9.0, 10.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.935546875, -2.849334716796875, -2.76312255859375, -2.676910400390625, -2.5906982421875, -2.504486083984375, -2.41827392578125, -2.332061767578125, -2.245849609375, -2.159637451171875, -2.07342529296875, -1.987213134765625, -1.9010009765625, -1.814788818359375, -1.72857666015625, -1.642364501953125, -1.55615234375, -1.469940185546875, -1.38372802734375, -1.297515869140625, -1.2113037109375, -1.125091552734375, -1.03887939453125, -0.952667236328125, -0.866455078125, -0.780242919921875, -0.69403076171875, -0.607818603515625, -0.5216064453125, -0.435394287109375, -0.34918212890625, -0.262969970703125, -0.1767578125, -0.090545654296875, -0.00433349609375, 0.081878662109375, 0.1680908203125, 0.254302978515625, 0.34051513671875, 0.426727294921875, 0.512939453125, 0.599151611328125, 0.68536376953125, 0.771575927734375, 0.8577880859375, 0.944000244140625, 1.03021240234375, 1.116424560546875, 1.20263671875, 1.288848876953125, 1.37506103515625, 1.461273193359375, 1.5474853515625, 1.633697509765625, 1.71990966796875, 1.806121826171875, 1.892333984375, 1.978546142578125, 2.06475830078125, 2.150970458984375, 2.2371826171875, 2.323394775390625, 2.40960693359375, 2.495819091796875, 2.58203125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 9.0, 7.0, 8.0, 9.0, 17.0, 17.0, 33.0, 43.0, 53.0, 104.0, 184.0, 316.0, 612.0, 992.0, 738.0, 378.0, 181.0, 112.0, 74.0, 57.0, 37.0, 22.0, 16.0, 12.0, 10.0, 9.0, 4.0, 5.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.12109375, -3.035797119140625, -2.95050048828125, -2.865203857421875, -2.7799072265625, -2.694610595703125, -2.60931396484375, -2.524017333984375, -2.438720703125, -2.353424072265625, -2.26812744140625, -2.182830810546875, -2.0975341796875, -2.012237548828125, -1.92694091796875, -1.841644287109375, -1.75634765625, -1.671051025390625, -1.58575439453125, -1.500457763671875, -1.4151611328125, -1.329864501953125, -1.24456787109375, -1.159271240234375, -1.073974609375, -0.988677978515625, -0.90338134765625, -0.818084716796875, -0.7327880859375, -0.647491455078125, -0.56219482421875, -0.476898193359375, -0.3916015625, -0.306304931640625, -0.22100830078125, -0.135711669921875, -0.0504150390625, 0.034881591796875, 0.12017822265625, 0.205474853515625, 0.290771484375, 0.376068115234375, 0.46136474609375, 0.546661376953125, 0.6319580078125, 0.717254638671875, 0.80255126953125, 0.887847900390625, 0.97314453125, 1.058441162109375, 1.14373779296875, 1.229034423828125, 1.3143310546875, 1.399627685546875, 1.48492431640625, 1.570220947265625, 1.655517578125, 1.740814208984375, 1.82611083984375, 1.911407470703125, 1.9967041015625, 2.082000732421875, 2.16729736328125, 2.252593994140625, 2.337890625]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 2.0, 6.0, 15.0, 37.0, 80.0, 158.0, 218.0, 187.0, 139.0, 75.0, 37.0, 11.0, 15.0, 4.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.884531021118164, -21.070728302001953, -20.256927490234375, -19.443124771118164, -18.629322052001953, -17.815521240234375, -17.001718521118164, -16.187915802001953, -15.374114990234375, -14.56031322479248, -13.746511459350586, -12.932708740234375, -12.11890697479248, -11.305105209350586, -10.491302490234375, -9.67750072479248, -8.863698959350586, -8.049897193908691, -7.236094951629639, -6.422292709350586, -5.608490943908691, -4.794689178466797, -3.980886936187744, -3.1670846939086914, -2.353282928466797, -1.5394809246063232, -0.7256789207458496, 0.08812308311462402, 0.9019250869750977, 1.7157268524169922, 2.529529094696045, 3.3433313369750977, 4.157131195068359, 4.970932960510254, 5.784735202789307, 6.598537445068359, 7.412339210510254, 8.226140975952148, 9.03994369506836, 9.853745460510254, 10.667547225952148, 11.481348991394043, 12.295150756835938, 13.108953475952148, 13.922755241394043, 14.736557006835938, 15.550359725952148, 16.36416244506836, 17.177963256835938, 17.99176597595215, 18.805566787719727, 19.619369506835938, 20.433170318603516, 21.246973037719727, 22.060775756835938, 22.874576568603516, 23.688379287719727, 24.502182006835938, 25.315982818603516, 26.129785537719727, 26.943588256835938, 27.757389068603516, 28.571191787719727, 29.384994506835938, 30.198795318603516]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 10.0, 4.0, 2.0, 8.0, 9.0, 14.0, 17.0, 17.0, 14.0, 29.0, 22.0, 23.0, 35.0, 32.0, 34.0, 36.0, 34.0, 38.0, 55.0, 56.0, 38.0, 47.0, 45.0, 44.0, 46.0, 42.0, 44.0, 32.0, 22.0, 22.0, 25.0, 20.0, 16.0, 15.0, 14.0, 10.0, 4.0, 8.0, 3.0, 4.0, 2.0, 4.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-11.633718490600586, -11.298864364624023, -10.964011192321777, -10.629157066345215, -10.294302940368652, -9.959449768066406, -9.624595642089844, -9.289741516113281, -8.954887390136719, -8.620033264160156, -8.28518009185791, -7.950325965881348, -7.615471839904785, -7.280618190765381, -6.945764541625977, -6.610910415649414, -6.276057243347168, -5.941203594207764, -5.606349468231201, -5.271495819091797, -4.936641693115234, -4.60178804397583, -4.266934394836426, -3.9320805072784424, -3.597226619720459, -3.2623727321624756, -2.927518844604492, -2.592665195465088, -2.2578113079071045, -1.922957420349121, -1.5881037712097168, -1.2532498836517334, -0.91839599609375, -0.5835421681404114, -0.24868834018707275, 0.0861654281616211, 0.4210193157196045, 0.7558732032775879, 1.0907268524169922, 1.4255807399749756, 1.760434627532959, 2.0952885150909424, 2.430142402648926, 2.76499605178833, 3.0998499393463135, 3.434703826904297, 3.769557476043701, 4.1044111251831055, 4.439265251159668, 4.774118900299072, 5.108973026275635, 5.443826675415039, 5.778680801391602, 6.113534450531006, 6.44838809967041, 6.783242225646973, 7.118095874786377, 7.452949523925781, 7.787803649902344, 8.122657775878906, 8.457510948181152, 8.792365074157715, 9.127218246459961, 9.462072372436523, 9.796926498413086]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 5.0, 1.0, 9.0, 12.0, 26.0, 31.0, 70.0, 92.0, 126.0, 237.0, 368.0, 652.0, 1033.0, 1917.0, 3705.0, 7325.0, 15285.0, 33969.0, 81245.0, 200261.0, 335451.0, 211246.0, 86404.0, 36460.0, 16081.0, 7810.0, 3880.0, 2034.0, 1120.0, 647.0, 412.0, 232.0, 145.0, 107.0, 57.0, 39.0, 22.0, 12.0, 18.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.93359375, -1.879180908203125, -1.82476806640625, -1.770355224609375, -1.7159423828125, -1.661529541015625, -1.60711669921875, -1.552703857421875, -1.498291015625, -1.443878173828125, -1.38946533203125, -1.335052490234375, -1.2806396484375, -1.226226806640625, -1.17181396484375, -1.117401123046875, -1.06298828125, -1.008575439453125, -0.95416259765625, -0.899749755859375, -0.8453369140625, -0.790924072265625, -0.73651123046875, -0.682098388671875, -0.627685546875, -0.573272705078125, -0.51885986328125, -0.464447021484375, -0.4100341796875, -0.355621337890625, -0.30120849609375, -0.246795654296875, -0.1923828125, -0.137969970703125, -0.08355712890625, -0.029144287109375, 0.0252685546875, 0.079681396484375, 0.13409423828125, 0.188507080078125, 0.242919921875, 0.297332763671875, 0.35174560546875, 0.406158447265625, 0.4605712890625, 0.514984130859375, 0.56939697265625, 0.623809814453125, 0.67822265625, 0.732635498046875, 0.78704833984375, 0.841461181640625, 0.8958740234375, 0.950286865234375, 1.00469970703125, 1.059112548828125, 1.113525390625, 1.167938232421875, 1.22235107421875, 1.276763916015625, 1.3311767578125, 1.385589599609375, 1.44000244140625, 1.494415283203125, 1.548828125]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 3.0, 1.0, 3.0, 3.0, 7.0, 6.0, 9.0, 11.0, 11.0, 16.0, 21.0, 14.0, 29.0, 27.0, 37.0, 34.0, 40.0, 37.0, 39.0, 56.0, 52.0, 43.0, 43.0, 55.0, 39.0, 48.0, 36.0, 47.0, 34.0, 36.0, 27.0, 21.0, 25.0, 14.0, 15.0, 18.0, 12.0, 9.0, 4.0, 2.0, 6.0, 4.0, 7.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.78955078125, -0.7596206665039062, -0.7296905517578125, -0.6997604370117188, -0.669830322265625, -0.6399002075195312, -0.6099700927734375, -0.5800399780273438, -0.55010986328125, -0.5201797485351562, -0.4902496337890625, -0.46031951904296875, -0.430389404296875, -0.40045928955078125, -0.3705291748046875, -0.34059906005859375, -0.3106689453125, -0.28073883056640625, -0.2508087158203125, -0.22087860107421875, -0.190948486328125, -0.16101837158203125, -0.1310882568359375, -0.10115814208984375, -0.07122802734375, -0.04129791259765625, -0.0113677978515625, 0.01856231689453125, 0.048492431640625, 0.07842254638671875, 0.1083526611328125, 0.13828277587890625, 0.168212890625, 0.19814300537109375, 0.2280731201171875, 0.25800323486328125, 0.287933349609375, 0.31786346435546875, 0.3477935791015625, 0.37772369384765625, 0.40765380859375, 0.43758392333984375, 0.4675140380859375, 0.49744415283203125, 0.527374267578125, 0.5573043823242188, 0.5872344970703125, 0.6171646118164062, 0.6470947265625, 0.6770248413085938, 0.7069549560546875, 0.7368850708007812, 0.766815185546875, 0.7967453002929688, 0.8266754150390625, 0.8566055297851562, 0.88653564453125, 0.9164657592773438, 0.9463958740234375, 0.9763259887695312, 1.006256103515625, 1.0361862182617188, 1.0661163330078125, 1.0960464477539062, 1.1259765625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 6.0, 8.0, 12.0, 26.0, 30.0, 40.0, 69.0, 129.0, 194.0, 318.0, 602.0, 1172.0, 3033.0, 10941.0, 62688.0, 549819.0, 360921.0, 45024.0, 8691.0, 2532.0, 1041.0, 510.0, 291.0, 159.0, 89.0, 74.0, 47.0, 28.0, 14.0, 14.0, 14.0, 4.0, 7.0, 5.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.82421875, -4.70025634765625, -4.5762939453125, -4.45233154296875, -4.328369140625, -4.20440673828125, -4.0804443359375, -3.95648193359375, -3.83251953125, -3.70855712890625, -3.5845947265625, -3.46063232421875, -3.336669921875, -3.21270751953125, -3.0887451171875, -2.96478271484375, -2.8408203125, -2.71685791015625, -2.5928955078125, -2.46893310546875, -2.344970703125, -2.22100830078125, -2.0970458984375, -1.97308349609375, -1.84912109375, -1.72515869140625, -1.6011962890625, -1.47723388671875, -1.353271484375, -1.22930908203125, -1.1053466796875, -0.98138427734375, -0.857421875, -0.73345947265625, -0.6094970703125, -0.48553466796875, -0.361572265625, -0.23760986328125, -0.1136474609375, 0.01031494140625, 0.13427734375, 0.25823974609375, 0.3822021484375, 0.50616455078125, 0.630126953125, 0.75408935546875, 0.8780517578125, 1.00201416015625, 1.1259765625, 1.24993896484375, 1.3739013671875, 1.49786376953125, 1.621826171875, 1.74578857421875, 1.8697509765625, 1.99371337890625, 2.11767578125, 2.24163818359375, 2.3656005859375, 2.48956298828125, 2.613525390625, 2.73748779296875, 2.8614501953125, 2.98541259765625, 3.109375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 6.0, 3.0, 9.0, 10.0, 12.0, 15.0, 10.0, 16.0, 22.0, 22.0, 27.0, 33.0, 42.0, 36.0, 31.0, 34.0, 36.0, 44.0, 41.0, 41.0, 54.0, 44.0, 30.0, 56.0, 43.0, 38.0, 33.0, 26.0, 25.0, 26.0, 24.0, 14.0, 25.0, 17.0, 12.0, 6.0, 7.0, 6.0, 5.0, 3.0, 7.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.0234375, -3.9017333984375, -3.780029296875, -3.6583251953125, -3.53662109375, -3.4149169921875, -3.293212890625, -3.1715087890625, -3.0498046875, -2.9281005859375, -2.806396484375, -2.6846923828125, -2.56298828125, -2.4412841796875, -2.319580078125, -2.1978759765625, -2.076171875, -1.9544677734375, -1.832763671875, -1.7110595703125, -1.58935546875, -1.4676513671875, -1.345947265625, -1.2242431640625, -1.1025390625, -0.9808349609375, -0.859130859375, -0.7374267578125, -0.61572265625, -0.4940185546875, -0.372314453125, -0.2506103515625, -0.12890625, -0.0072021484375, 0.114501953125, 0.2362060546875, 0.35791015625, 0.4796142578125, 0.601318359375, 0.7230224609375, 0.8447265625, 0.9664306640625, 1.088134765625, 1.2098388671875, 1.33154296875, 1.4532470703125, 1.574951171875, 1.6966552734375, 1.818359375, 1.9400634765625, 2.061767578125, 2.1834716796875, 2.30517578125, 2.4268798828125, 2.548583984375, 2.6702880859375, 2.7919921875, 2.9136962890625, 3.035400390625, 3.1571044921875, 3.27880859375, 3.4005126953125, 3.522216796875, 3.6439208984375, 3.765625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 2.0, 5.0, 5.0, 14.0, 13.0, 20.0, 27.0, 66.0, 97.0, 165.0, 478.0, 1479.0, 9175.0, 255257.0, 757519.0, 20756.0, 2326.0, 633.0, 236.0, 121.0, 60.0, 35.0, 13.0, 13.0, 9.0, 8.0, 3.0, 4.0, 4.0, 2.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.625, -2.543365478515625, -2.46173095703125, -2.380096435546875, -2.2984619140625, -2.216827392578125, -2.13519287109375, -2.053558349609375, -1.971923828125, -1.890289306640625, -1.80865478515625, -1.727020263671875, -1.6453857421875, -1.563751220703125, -1.48211669921875, -1.400482177734375, -1.31884765625, -1.237213134765625, -1.15557861328125, -1.073944091796875, -0.9923095703125, -0.910675048828125, -0.82904052734375, -0.747406005859375, -0.665771484375, -0.584136962890625, -0.50250244140625, -0.420867919921875, -0.3392333984375, -0.257598876953125, -0.17596435546875, -0.094329833984375, -0.0126953125, 0.068939208984375, 0.15057373046875, 0.232208251953125, 0.3138427734375, 0.395477294921875, 0.47711181640625, 0.558746337890625, 0.640380859375, 0.722015380859375, 0.80364990234375, 0.885284423828125, 0.9669189453125, 1.048553466796875, 1.13018798828125, 1.211822509765625, 1.29345703125, 1.375091552734375, 1.45672607421875, 1.538360595703125, 1.6199951171875, 1.701629638671875, 1.78326416015625, 1.864898681640625, 1.946533203125, 2.028167724609375, 2.10980224609375, 2.191436767578125, 2.2730712890625, 2.354705810546875, 2.43634033203125, 2.517974853515625, 2.599609375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 6.0, 4.0, 6.0, 5.0, 9.0, 13.0, 9.0, 13.0, 21.0, 27.0, 27.0, 41.0, 49.0, 52.0, 64.0, 79.0, 94.0, 76.0, 77.0, 63.0, 49.0, 47.0, 31.0, 30.0, 18.0, 24.0, 17.0, 9.0, 11.0, 9.0, 11.0, 4.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00018310546875, -0.00017629563808441162, -0.00016948580741882324, -0.00016267597675323486, -0.00015586614608764648, -0.0001490563154220581, -0.00014224648475646973, -0.00013543665409088135, -0.00012862682342529297, -0.00012181699275970459, -0.00011500716209411621, -0.00010819733142852783, -0.00010138750076293945, -9.457767009735107e-05, -8.77678394317627e-05, -8.095800876617432e-05, -7.414817810058594e-05, -6.733834743499756e-05, -6.052851676940918e-05, -5.37186861038208e-05, -4.690885543823242e-05, -4.009902477264404e-05, -3.3289194107055664e-05, -2.6479363441467285e-05, -1.9669532775878906e-05, -1.2859702110290527e-05, -6.0498714447021484e-06, 7.599592208862305e-07, 7.569789886474609e-06, 1.4379620552062988e-05, 2.1189451217651367e-05, 2.7999281883239746e-05, 3.4809112548828125e-05, 4.1618943214416504e-05, 4.842877388000488e-05, 5.523860454559326e-05, 6.204843521118164e-05, 6.885826587677002e-05, 7.56680965423584e-05, 8.247792720794678e-05, 8.928775787353516e-05, 9.609758853912354e-05, 0.00010290741920471191, 0.00010971724987030029, 0.00011652708053588867, 0.00012333691120147705, 0.00013014674186706543, 0.0001369565725326538, 0.0001437664031982422, 0.00015057623386383057, 0.00015738606452941895, 0.00016419589519500732, 0.0001710057258605957, 0.00017781555652618408, 0.00018462538719177246, 0.00019143521785736084, 0.00019824504852294922, 0.0002050548791885376, 0.00021186470985412598, 0.00021867454051971436, 0.00022548437118530273, 0.0002322942018508911, 0.0002391040325164795, 0.00024591386318206787, 0.00025272369384765625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 4.0, 7.0, 1.0, 3.0, 3.0, 12.0, 17.0, 24.0, 39.0, 54.0, 96.0, 171.0, 371.0, 771.0, 2300.0, 9863.0, 104569.0, 798472.0, 116897.0, 10747.0, 2525.0, 829.0, 374.0, 164.0, 98.0, 69.0, 27.0, 20.0, 10.0, 9.0, 4.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.380859375, -1.326751708984375, -1.27264404296875, -1.218536376953125, -1.1644287109375, -1.110321044921875, -1.05621337890625, -1.002105712890625, -0.947998046875, -0.893890380859375, -0.83978271484375, -0.785675048828125, -0.7315673828125, -0.677459716796875, -0.62335205078125, -0.569244384765625, -0.51513671875, -0.461029052734375, -0.40692138671875, -0.352813720703125, -0.2987060546875, -0.244598388671875, -0.19049072265625, -0.136383056640625, -0.082275390625, -0.028167724609375, 0.02593994140625, 0.080047607421875, 0.1341552734375, 0.188262939453125, 0.24237060546875, 0.296478271484375, 0.3505859375, 0.404693603515625, 0.45880126953125, 0.512908935546875, 0.5670166015625, 0.621124267578125, 0.67523193359375, 0.729339599609375, 0.783447265625, 0.837554931640625, 0.89166259765625, 0.945770263671875, 0.9998779296875, 1.053985595703125, 1.10809326171875, 1.162200927734375, 1.21630859375, 1.270416259765625, 1.32452392578125, 1.378631591796875, 1.4327392578125, 1.486846923828125, 1.54095458984375, 1.595062255859375, 1.649169921875, 1.703277587890625, 1.75738525390625, 1.811492919921875, 1.8656005859375, 1.919708251953125, 1.97381591796875, 2.027923583984375, 2.08203125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 10.0, 10.0, 12.0, 12.0, 23.0, 35.0, 57.0, 65.0, 82.0, 124.0, 106.0, 126.0, 84.0, 77.0, 66.0, 31.0, 31.0, 19.0, 11.0, 10.0, 8.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2578125, -1.205169677734375, -1.15252685546875, -1.099884033203125, -1.0472412109375, -0.994598388671875, -0.94195556640625, -0.889312744140625, -0.836669921875, -0.784027099609375, -0.73138427734375, -0.678741455078125, -0.6260986328125, -0.573455810546875, -0.52081298828125, -0.468170166015625, -0.41552734375, -0.362884521484375, -0.31024169921875, -0.257598876953125, -0.2049560546875, -0.152313232421875, -0.09967041015625, -0.047027587890625, 0.005615234375, 0.058258056640625, 0.11090087890625, 0.163543701171875, 0.2161865234375, 0.268829345703125, 0.32147216796875, 0.374114990234375, 0.4267578125, 0.479400634765625, 0.53204345703125, 0.584686279296875, 0.6373291015625, 0.689971923828125, 0.74261474609375, 0.795257568359375, 0.847900390625, 0.900543212890625, 0.95318603515625, 1.005828857421875, 1.0584716796875, 1.111114501953125, 1.16375732421875, 1.216400146484375, 1.26904296875, 1.321685791015625, 1.37432861328125, 1.426971435546875, 1.4796142578125, 1.532257080078125, 1.58489990234375, 1.637542724609375, 1.690185546875, 1.742828369140625, 1.79547119140625, 1.848114013671875, 1.9007568359375, 1.953399658203125, 2.00604248046875, 2.058685302734375, 2.111328125]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 5.0, 1.0, 2.0, 2.0, 4.0, 10.0, 19.0, 34.0, 90.0, 125.0, 181.0, 217.0, 139.0, 89.0, 42.0, 21.0, 15.0, 6.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-26.67139434814453, -25.722217559814453, -24.773040771484375, -23.823863983154297, -22.87468719482422, -21.92551040649414, -20.976333618164062, -20.027156829833984, -19.077980041503906, -18.128803253173828, -17.17962646484375, -16.230449676513672, -15.281272888183594, -14.332096099853516, -13.382919311523438, -12.43374252319336, -11.484566688537598, -10.53538990020752, -9.586213111877441, -8.637036323547363, -7.687859535217285, -6.738683223724365, -5.789506435394287, -4.840329647064209, -3.891152858734131, -2.9419760704040527, -1.9927994012832642, -1.0436227321624756, -0.09444594383239746, 0.8547306060791016, 1.8039073944091797, 2.753084182739258, 3.702260971069336, 4.651437759399414, 5.600614547729492, 6.54979133605957, 7.498968124389648, 8.448144912719727, 9.397321701049805, 10.346498489379883, 11.295675277709961, 12.244852066040039, 13.194028854370117, 14.143205642700195, 15.092382431030273, 16.04155921936035, 16.99073600769043, 17.939912796020508, 18.889087677001953, 19.83826446533203, 20.78744125366211, 21.736618041992188, 22.685794830322266, 23.634971618652344, 24.584148406982422, 25.5333251953125, 26.482501983642578, 27.431678771972656, 28.380855560302734, 29.330032348632812, 30.27920913696289, 31.22838592529297, 32.17756271362305, 33.126739501953125, 34.0759162902832]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 2.0, 3.0, 2.0, 4.0, 4.0, 6.0, 13.0, 11.0, 11.0, 17.0, 23.0, 21.0, 23.0, 38.0, 35.0, 38.0, 41.0, 50.0, 52.0, 58.0, 70.0, 73.0, 47.0, 45.0, 36.0, 48.0, 36.0, 36.0, 30.0, 26.0, 17.0, 19.0, 16.0, 9.0, 10.0, 6.0, 2.0, 10.0, 2.0, 7.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-19.40782356262207, -18.776329040527344, -18.144834518432617, -17.51333999633789, -16.881847381591797, -16.25035285949707, -15.618858337402344, -14.987363815307617, -14.35586929321289, -13.724374771118164, -13.092881202697754, -12.461386680603027, -11.8298921585083, -11.19839859008789, -10.566904067993164, -9.935409545898438, -9.303915977478027, -8.6724214553833, -8.04092788696289, -7.409433364868164, -6.7779388427734375, -6.146444797515869, -5.514950752258301, -4.883456230163574, -4.251962184906006, -3.6204679012298584, -2.988973617553711, -2.3574795722961426, -1.7259852886199951, -1.0944910049438477, -0.4629969596862793, 0.16849756240844727, 0.7999916076660156, 1.431485891342163, 2.0629801750183105, 2.694474220275879, 3.3259685039520264, 3.957462787628174, 4.588956832885742, 5.220451354980469, 5.851945400238037, 6.4834394454956055, 7.114933967590332, 7.7464280128479, 8.377922058105469, 9.009416580200195, 9.640911102294922, 10.272405624389648, 10.903899192810059, 11.535393714904785, 12.166887283325195, 12.798381805419922, 13.429876327514648, 14.061370849609375, 14.692864418029785, 15.324358940124512, 15.955852508544922, 16.58734703063965, 17.218841552734375, 17.85033416748047, 18.481828689575195, 19.113323211669922, 19.74481773376465, 20.376312255859375, 21.0078067779541]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 7.0, 8.0, 14.0, 42.0, 70.0, 179.0, 353.0, 754.0, 1684.0, 4729.0, 16630.0, 82741.0, 897752.0, 2844768.0, 293385.0, 38509.0, 8663.0, 2440.0, 801.0, 337.0, 147.0, 84.0, 51.0, 29.0, 19.0, 23.0, 14.0, 7.0, 11.0, 6.0, 4.0, 6.0, 7.0, 2.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3583984375, -1.3024749755859375, -1.246551513671875, -1.1906280517578125, -1.13470458984375, -1.0787811279296875, -1.022857666015625, -0.9669342041015625, -0.9110107421875, -0.8550872802734375, -0.799163818359375, -0.7432403564453125, -0.68731689453125, -0.6313934326171875, -0.575469970703125, -0.5195465087890625, -0.463623046875, -0.4076995849609375, -0.351776123046875, -0.2958526611328125, -0.23992919921875, -0.1840057373046875, -0.128082275390625, -0.0721588134765625, -0.0162353515625, 0.0396881103515625, 0.095611572265625, 0.1515350341796875, 0.20745849609375, 0.2633819580078125, 0.319305419921875, 0.3752288818359375, 0.43115234375, 0.4870758056640625, 0.542999267578125, 0.5989227294921875, 0.65484619140625, 0.7107696533203125, 0.766693115234375, 0.8226165771484375, 0.8785400390625, 0.9344635009765625, 0.990386962890625, 1.0463104248046875, 1.10223388671875, 1.1581573486328125, 1.214080810546875, 1.2700042724609375, 1.325927734375, 1.3818511962890625, 1.437774658203125, 1.4936981201171875, 1.54962158203125, 1.6055450439453125, 1.661468505859375, 1.7173919677734375, 1.7733154296875, 1.8292388916015625, 1.885162353515625, 1.9410858154296875, 1.99700927734375, 2.0529327392578125, 2.108856201171875, 2.1647796630859375, 2.220703125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 6.0, 14.0, 25.0, 39.0, 62.0, 90.0, 94.0, 107.0, 133.0, 118.0, 100.0, 74.0, 45.0, 48.0, 23.0, 19.0, 9.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8720703125, -0.8027801513671875, -0.733489990234375, -0.6641998291015625, -0.59490966796875, -0.5256195068359375, -0.456329345703125, -0.3870391845703125, -0.3177490234375, -0.2484588623046875, -0.179168701171875, -0.1098785400390625, -0.04058837890625, 0.0287017822265625, 0.097991943359375, 0.1672821044921875, 0.236572265625, 0.3058624267578125, 0.375152587890625, 0.4444427490234375, 0.51373291015625, 0.5830230712890625, 0.652313232421875, 0.7216033935546875, 0.7908935546875, 0.8601837158203125, 0.929473876953125, 0.9987640380859375, 1.06805419921875, 1.1373443603515625, 1.206634521484375, 1.2759246826171875, 1.34521484375, 1.4145050048828125, 1.483795166015625, 1.5530853271484375, 1.62237548828125, 1.6916656494140625, 1.760955810546875, 1.8302459716796875, 1.8995361328125, 1.9688262939453125, 2.038116455078125, 2.1074066162109375, 2.17669677734375, 2.2459869384765625, 2.315277099609375, 2.3845672607421875, 2.453857421875, 2.5231475830078125, 2.592437744140625, 2.6617279052734375, 2.73101806640625, 2.8003082275390625, 2.869598388671875, 2.9388885498046875, 3.0081787109375, 3.0774688720703125, 3.146759033203125, 3.2160491943359375, 3.28533935546875, 3.3546295166015625, 3.423919677734375, 3.4932098388671875, 3.5625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 4.0, 7.0, 12.0, 17.0, 19.0, 24.0, 27.0, 47.0, 74.0, 112.0, 177.0, 313.0, 546.0, 1276.0, 3117.0, 8342.0, 25436.0, 110009.0, 1156827.0, 2635151.0, 199534.0, 37137.0, 9859.0, 3422.0, 1343.0, 648.0, 315.0, 175.0, 103.0, 62.0, 53.0, 32.0, 18.0, 21.0, 9.0, 5.0, 7.0, 3.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.462890625, -2.394775390625, -2.32666015625, -2.258544921875, -2.1904296875, -2.122314453125, -2.05419921875, -1.986083984375, -1.91796875, -1.849853515625, -1.78173828125, -1.713623046875, -1.6455078125, -1.577392578125, -1.50927734375, -1.441162109375, -1.373046875, -1.304931640625, -1.23681640625, -1.168701171875, -1.1005859375, -1.032470703125, -0.96435546875, -0.896240234375, -0.828125, -0.760009765625, -0.69189453125, -0.623779296875, -0.5556640625, -0.487548828125, -0.41943359375, -0.351318359375, -0.283203125, -0.215087890625, -0.14697265625, -0.078857421875, -0.0107421875, 0.057373046875, 0.12548828125, 0.193603515625, 0.26171875, 0.329833984375, 0.39794921875, 0.466064453125, 0.5341796875, 0.602294921875, 0.67041015625, 0.738525390625, 0.806640625, 0.874755859375, 0.94287109375, 1.010986328125, 1.0791015625, 1.147216796875, 1.21533203125, 1.283447265625, 1.3515625, 1.419677734375, 1.48779296875, 1.555908203125, 1.6240234375, 1.692138671875, 1.76025390625, 1.828369140625, 1.896484375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 2.0, 1.0, 8.0, 2.0, 3.0, 7.0, 6.0, 15.0, 9.0, 14.0, 16.0, 16.0, 18.0, 24.0, 41.0, 68.0, 83.0, 130.0, 183.0, 250.0, 352.0, 592.0, 613.0, 517.0, 340.0, 224.0, 148.0, 94.0, 80.0, 50.0, 45.0, 18.0, 29.0, 24.0, 13.0, 11.0, 6.0, 10.0, 5.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.052734375, -1.982696533203125, -1.91265869140625, -1.842620849609375, -1.7725830078125, -1.702545166015625, -1.63250732421875, -1.562469482421875, -1.492431640625, -1.422393798828125, -1.35235595703125, -1.282318115234375, -1.2122802734375, -1.142242431640625, -1.07220458984375, -1.002166748046875, -0.93212890625, -0.862091064453125, -0.79205322265625, -0.722015380859375, -0.6519775390625, -0.581939697265625, -0.51190185546875, -0.441864013671875, -0.371826171875, -0.301788330078125, -0.23175048828125, -0.161712646484375, -0.0916748046875, -0.021636962890625, 0.04840087890625, 0.118438720703125, 0.1884765625, 0.258514404296875, 0.32855224609375, 0.398590087890625, 0.4686279296875, 0.538665771484375, 0.60870361328125, 0.678741455078125, 0.748779296875, 0.818817138671875, 0.88885498046875, 0.958892822265625, 1.0289306640625, 1.098968505859375, 1.16900634765625, 1.239044189453125, 1.30908203125, 1.379119873046875, 1.44915771484375, 1.519195556640625, 1.5892333984375, 1.659271240234375, 1.72930908203125, 1.799346923828125, 1.869384765625, 1.939422607421875, 2.00946044921875, 2.079498291015625, 2.1495361328125, 2.219573974609375, 2.28961181640625, 2.359649658203125, 2.4296875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 19.0, 45.0, 117.0, 262.0, 327.0, 149.0, 45.0, 14.0, 7.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.65392303466797, -38.202369689941406, -36.75081253051758, -35.29925537109375, -33.84770202636719, -32.396148681640625, -30.944591522216797, -29.4930362701416, -28.041481018066406, -26.58992576599121, -25.138370513916016, -23.68681526184082, -22.235260009765625, -20.78370475769043, -19.332149505615234, -17.88059425354004, -16.429039001464844, -14.977483749389648, -13.525928497314453, -12.074373245239258, -10.622817993164062, -9.171262741088867, -7.719707489013672, -6.268152236938477, -4.816596984863281, -3.365041732788086, -1.9134864807128906, -0.4619312286376953, 0.9896240234375, 2.4411792755126953, 3.8927345275878906, 5.344289779663086, 6.795848846435547, 8.247404098510742, 9.698959350585938, 11.150514602661133, 12.602069854736328, 14.053625106811523, 15.505180358886719, 16.956735610961914, 18.40829086303711, 19.859846115112305, 21.3114013671875, 22.762956619262695, 24.21451187133789, 25.666067123413086, 27.11762237548828, 28.569177627563477, 30.020732879638672, 31.472288131713867, 32.92384338378906, 34.375396728515625, 35.82695388793945, 37.27851104736328, 38.730064392089844, 40.181617736816406, 41.633174896240234, 43.08473205566406, 44.536285400390625, 45.98783874511719, 47.439395904541016, 48.890953063964844, 50.342506408691406, 51.79405975341797, 53.2456169128418]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 6.0, 9.0, 19.0, 23.0, 17.0, 21.0, 28.0, 35.0, 41.0, 48.0, 49.0, 64.0, 85.0, 63.0, 78.0, 62.0, 51.0, 42.0, 61.0, 49.0, 37.0, 29.0, 18.0, 20.0, 9.0, 11.0, 7.0, 6.0, 2.0, 1.0, 6.0, 3.0, 2.0, 0.0, 1.0, 2.0], "bins": [-22.36190414428711, -21.82243537902832, -21.28296661376953, -20.743497848510742, -20.204029083251953, -19.664562225341797, -19.125093460083008, -18.58562469482422, -18.04615592956543, -17.50668716430664, -16.96721839904785, -16.427749633789062, -15.88828182220459, -15.3488130569458, -14.809345245361328, -14.269876480102539, -13.73040771484375, -13.190938949584961, -12.651470184326172, -12.1120023727417, -11.57253360748291, -11.033064842224121, -10.493597030639648, -9.95412826538086, -9.41465950012207, -8.875190734863281, -8.335721969604492, -7.7962541580200195, -7.2567853927612305, -6.717316627502441, -6.1778483390808105, -5.63838005065918, -5.098913192749023, -4.559444427490234, -4.0199761390686035, -3.4805076122283936, -2.9410390853881836, -2.4015705585479736, -1.8621020317077637, -1.3226335048675537, -0.7831649780273438, -0.2436964511871338, 0.29577207565307617, 0.8352406024932861, 1.374709129333496, 1.914177656173706, 2.453646183013916, 2.993114709854126, 3.532583236694336, 4.072052001953125, 4.611520290374756, 5.150988578796387, 5.690457344055176, 6.229926109313965, 6.769394397735596, 7.308862686157227, 7.848331451416016, 8.387800216674805, 8.927268981933594, 9.466736793518066, 10.006205558776855, 10.545674324035645, 11.085142135620117, 11.624610900878906, 12.164079666137695]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 5.0, 11.0, 16.0, 41.0, 54.0, 75.0, 145.0, 228.0, 527.0, 952.0, 2204.0, 4849.0, 11866.0, 28482.0, 68983.0, 154509.0, 275902.0, 260023.0, 136617.0, 59816.0, 25008.0, 10130.0, 4415.0, 1885.0, 845.0, 416.0, 218.0, 141.0, 71.0, 46.0, 25.0, 20.0, 15.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1875, -1.1433868408203125, -1.099273681640625, -1.0551605224609375, -1.01104736328125, -0.9669342041015625, -0.922821044921875, -0.8787078857421875, -0.8345947265625, -0.7904815673828125, -0.746368408203125, -0.7022552490234375, -0.65814208984375, -0.6140289306640625, -0.569915771484375, -0.5258026123046875, -0.481689453125, -0.4375762939453125, -0.393463134765625, -0.3493499755859375, -0.30523681640625, -0.2611236572265625, -0.217010498046875, -0.1728973388671875, -0.1287841796875, -0.0846710205078125, -0.040557861328125, 0.0035552978515625, 0.04766845703125, 0.0917816162109375, 0.135894775390625, 0.1800079345703125, 0.22412109375, 0.2682342529296875, 0.312347412109375, 0.3564605712890625, 0.40057373046875, 0.4446868896484375, 0.488800048828125, 0.5329132080078125, 0.5770263671875, 0.6211395263671875, 0.665252685546875, 0.7093658447265625, 0.75347900390625, 0.7975921630859375, 0.841705322265625, 0.8858184814453125, 0.929931640625, 0.9740447998046875, 1.018157958984375, 1.0622711181640625, 1.10638427734375, 1.1504974365234375, 1.194610595703125, 1.2387237548828125, 1.2828369140625, 1.3269500732421875, 1.371063232421875, 1.4151763916015625, 1.45928955078125, 1.5034027099609375, 1.547515869140625, 1.5916290283203125, 1.6357421875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 1.0, 3.0, 3.0, 6.0, 6.0, 14.0, 19.0, 18.0, 30.0, 25.0, 38.0, 48.0, 49.0, 51.0, 47.0, 46.0, 63.0, 65.0, 54.0, 64.0, 53.0, 46.0, 41.0, 42.0, 27.0, 35.0, 22.0, 26.0, 18.0, 19.0, 6.0, 11.0, 5.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.79736328125, -0.7635116577148438, -0.7296600341796875, -0.6958084106445312, -0.661956787109375, -0.6281051635742188, -0.5942535400390625, -0.5604019165039062, -0.52655029296875, -0.49269866943359375, -0.4588470458984375, -0.42499542236328125, -0.391143798828125, -0.35729217529296875, -0.3234405517578125, -0.28958892822265625, -0.2557373046875, -0.22188568115234375, -0.1880340576171875, -0.15418243408203125, -0.120330810546875, -0.08647918701171875, -0.0526275634765625, -0.01877593994140625, 0.01507568359375, 0.04892730712890625, 0.0827789306640625, 0.11663055419921875, 0.150482177734375, 0.18433380126953125, 0.2181854248046875, 0.25203704833984375, 0.285888671875, 0.31974029541015625, 0.3535919189453125, 0.38744354248046875, 0.421295166015625, 0.45514678955078125, 0.4889984130859375, 0.5228500366210938, 0.55670166015625, 0.5905532836914062, 0.6244049072265625, 0.6582565307617188, 0.692108154296875, 0.7259597778320312, 0.7598114013671875, 0.7936630249023438, 0.8275146484375, 0.8613662719726562, 0.8952178955078125, 0.9290695190429688, 0.962921142578125, 0.9967727661132812, 1.0306243896484375, 1.0644760131835938, 1.09832763671875, 1.1321792602539062, 1.1660308837890625, 1.1998825073242188, 1.233734130859375, 1.2675857543945312, 1.3014373779296875, 1.3352890014648438, 1.369140625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 4.0, 1.0, 5.0, 5.0, 7.0, 8.0, 13.0, 28.0, 20.0, 27.0, 35.0, 58.0, 81.0, 94.0, 164.0, 208.0, 335.0, 451.0, 683.0, 1162.0, 2367.0, 6113.0, 25368.0, 172627.0, 667545.0, 138960.0, 21407.0, 5479.0, 2197.0, 1092.0, 646.0, 393.0, 277.0, 197.0, 121.0, 106.0, 69.0, 42.0, 49.0, 26.0, 30.0, 15.0, 11.0, 8.0, 11.0, 10.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.650390625, -2.557220458984375, -2.46405029296875, -2.370880126953125, -2.2777099609375, -2.184539794921875, -2.09136962890625, -1.998199462890625, -1.905029296875, -1.811859130859375, -1.71868896484375, -1.625518798828125, -1.5323486328125, -1.439178466796875, -1.34600830078125, -1.252838134765625, -1.15966796875, -1.066497802734375, -0.97332763671875, -0.880157470703125, -0.7869873046875, -0.693817138671875, -0.60064697265625, -0.507476806640625, -0.414306640625, -0.321136474609375, -0.22796630859375, -0.134796142578125, -0.0416259765625, 0.051544189453125, 0.14471435546875, 0.237884521484375, 0.3310546875, 0.424224853515625, 0.51739501953125, 0.610565185546875, 0.7037353515625, 0.796905517578125, 0.89007568359375, 0.983245849609375, 1.076416015625, 1.169586181640625, 1.26275634765625, 1.355926513671875, 1.4490966796875, 1.542266845703125, 1.63543701171875, 1.728607177734375, 1.82177734375, 1.914947509765625, 2.00811767578125, 2.101287841796875, 2.1944580078125, 2.287628173828125, 2.38079833984375, 2.473968505859375, 2.567138671875, 2.660308837890625, 2.75347900390625, 2.846649169921875, 2.9398193359375, 3.032989501953125, 3.12615966796875, 3.219329833984375, 3.3125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 5.0, 6.0, 4.0, 7.0, 14.0, 13.0, 16.0, 25.0, 19.0, 39.0, 31.0, 36.0, 49.0, 34.0, 50.0, 56.0, 53.0, 40.0, 59.0, 48.0, 56.0, 34.0, 47.0, 47.0, 27.0, 18.0, 34.0, 22.0, 30.0, 17.0, 13.0, 12.0, 15.0, 7.0, 7.0, 4.0, 0.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.96484375, -3.833251953125, -3.70166015625, -3.570068359375, -3.4384765625, -3.306884765625, -3.17529296875, -3.043701171875, -2.912109375, -2.780517578125, -2.64892578125, -2.517333984375, -2.3857421875, -2.254150390625, -2.12255859375, -1.990966796875, -1.859375, -1.727783203125, -1.59619140625, -1.464599609375, -1.3330078125, -1.201416015625, -1.06982421875, -0.938232421875, -0.806640625, -0.675048828125, -0.54345703125, -0.411865234375, -0.2802734375, -0.148681640625, -0.01708984375, 0.114501953125, 0.24609375, 0.377685546875, 0.50927734375, 0.640869140625, 0.7724609375, 0.904052734375, 1.03564453125, 1.167236328125, 1.298828125, 1.430419921875, 1.56201171875, 1.693603515625, 1.8251953125, 1.956787109375, 2.08837890625, 2.219970703125, 2.3515625, 2.483154296875, 2.61474609375, 2.746337890625, 2.8779296875, 3.009521484375, 3.14111328125, 3.272705078125, 3.404296875, 3.535888671875, 3.66748046875, 3.799072265625, 3.9306640625, 4.062255859375, 4.19384765625, 4.325439453125, 4.45703125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 0.0, 2.0, 4.0, 9.0, 19.0, 19.0, 55.0, 106.0, 355.0, 1277.0, 7377.0, 182769.0, 830307.0, 22913.0, 2486.0, 509.0, 182.0, 82.0, 37.0, 19.0, 9.0, 6.0, 1.0, 4.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7177734375, -1.6546478271484375, -1.591522216796875, -1.5283966064453125, -1.46527099609375, -1.4021453857421875, -1.339019775390625, -1.2758941650390625, -1.2127685546875, -1.1496429443359375, -1.086517333984375, -1.0233917236328125, -0.96026611328125, -0.8971405029296875, -0.834014892578125, -0.7708892822265625, -0.707763671875, -0.6446380615234375, -0.581512451171875, -0.5183868408203125, -0.45526123046875, -0.3921356201171875, -0.329010009765625, -0.2658843994140625, -0.2027587890625, -0.1396331787109375, -0.076507568359375, -0.0133819580078125, 0.04974365234375, 0.1128692626953125, 0.175994873046875, 0.2391204833984375, 0.30224609375, 0.3653717041015625, 0.428497314453125, 0.4916229248046875, 0.55474853515625, 0.6178741455078125, 0.680999755859375, 0.7441253662109375, 0.8072509765625, 0.8703765869140625, 0.933502197265625, 0.9966278076171875, 1.05975341796875, 1.1228790283203125, 1.186004638671875, 1.2491302490234375, 1.312255859375, 1.3753814697265625, 1.438507080078125, 1.5016326904296875, 1.56475830078125, 1.6278839111328125, 1.691009521484375, 1.7541351318359375, 1.8172607421875, 1.8803863525390625, 1.943511962890625, 2.0066375732421875, 2.06976318359375, 2.1328887939453125, 2.196014404296875, 2.2591400146484375, 2.322265625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 8.0, 8.0, 10.0, 10.0, 8.0, 14.0, 23.0, 22.0, 37.0, 36.0, 33.0, 57.0, 63.0, 75.0, 114.0, 90.0, 71.0, 53.0, 56.0, 37.0, 28.0, 33.0, 22.0, 27.0, 17.0, 14.0, 13.0, 7.0, 4.0, 7.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00020265579223632812, -0.0001956634223461151, -0.0001886710524559021, -0.0001816786825656891, -0.00017468631267547607, -0.00016769394278526306, -0.00016070157289505005, -0.00015370920300483704, -0.00014671683311462402, -0.000139724463224411, -0.000132732093334198, -0.00012573972344398499, -0.00011874735355377197, -0.00011175498366355896, -0.00010476261377334595, -9.777024388313293e-05, -9.077787399291992e-05, -8.378550410270691e-05, -7.67931342124939e-05, -6.980076432228088e-05, -6.280839443206787e-05, -5.581602454185486e-05, -4.8823654651641846e-05, -4.183128476142883e-05, -3.483891487121582e-05, -2.7846544981002808e-05, -2.0854175090789795e-05, -1.3861805200576782e-05, -6.8694353103637695e-06, 1.2293457984924316e-07, 7.115304470062256e-06, 1.4107674360275269e-05, 2.110004425048828e-05, 2.8092414140701294e-05, 3.508478403091431e-05, 4.207715392112732e-05, 4.906952381134033e-05, 5.6061893701553345e-05, 6.305426359176636e-05, 7.004663348197937e-05, 7.703900337219238e-05, 8.40313732624054e-05, 9.102374315261841e-05, 9.801611304283142e-05, 0.00010500848293304443, 0.00011200085282325745, 0.00011899322271347046, 0.00012598559260368347, 0.00013297796249389648, 0.0001399703323841095, 0.0001469627022743225, 0.00015395507216453552, 0.00016094744205474854, 0.00016793981194496155, 0.00017493218183517456, 0.00018192455172538757, 0.00018891692161560059, 0.0001959092915058136, 0.0002029016613960266, 0.00020989403128623962, 0.00021688640117645264, 0.00022387877106666565, 0.00023087114095687866, 0.00023786351084709167, 0.0002448558807373047]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 4.0, 7.0, 11.0, 18.0, 27.0, 31.0, 55.0, 73.0, 165.0, 299.0, 582.0, 1403.0, 3548.0, 13446.0, 98406.0, 751780.0, 152901.0, 18415.0, 4359.0, 1579.0, 660.0, 311.0, 173.0, 118.0, 67.0, 46.0, 24.0, 11.0, 13.0, 7.0, 5.0, 3.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.931640625, -0.8978729248046875, -0.864105224609375, -0.8303375244140625, -0.79656982421875, -0.7628021240234375, -0.729034423828125, -0.6952667236328125, -0.6614990234375, -0.6277313232421875, -0.593963623046875, -0.5601959228515625, -0.52642822265625, -0.4926605224609375, -0.458892822265625, -0.4251251220703125, -0.391357421875, -0.3575897216796875, -0.323822021484375, -0.2900543212890625, -0.25628662109375, -0.2225189208984375, -0.188751220703125, -0.1549835205078125, -0.1212158203125, -0.0874481201171875, -0.053680419921875, -0.0199127197265625, 0.01385498046875, 0.0476226806640625, 0.081390380859375, 0.1151580810546875, 0.14892578125, 0.1826934814453125, 0.216461181640625, 0.2502288818359375, 0.28399658203125, 0.3177642822265625, 0.351531982421875, 0.3852996826171875, 0.4190673828125, 0.4528350830078125, 0.486602783203125, 0.5203704833984375, 0.55413818359375, 0.5879058837890625, 0.621673583984375, 0.6554412841796875, 0.689208984375, 0.7229766845703125, 0.756744384765625, 0.7905120849609375, 0.82427978515625, 0.8580474853515625, 0.891815185546875, 0.9255828857421875, 0.9593505859375, 0.9931182861328125, 1.026885986328125, 1.0606536865234375, 1.09442138671875, 1.1281890869140625, 1.161956787109375, 1.1957244873046875, 1.2294921875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 9.0, 7.0, 7.0, 14.0, 18.0, 24.0, 20.0, 33.0, 40.0, 52.0, 72.0, 66.0, 72.0, 83.0, 69.0, 67.0, 66.0, 56.0, 46.0, 44.0, 33.0, 27.0, 19.0, 9.0, 11.0, 11.0, 7.0, 7.0, 3.0, 5.0, 3.0, 2.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69580078125, -0.6655807495117188, -0.6353607177734375, -0.6051406860351562, -0.574920654296875, -0.5447006225585938, -0.5144805908203125, -0.48426055908203125, -0.45404052734375, -0.42382049560546875, -0.3936004638671875, -0.36338043212890625, -0.333160400390625, -0.30294036865234375, -0.2727203369140625, -0.24250030517578125, -0.2122802734375, -0.18206024169921875, -0.1518402099609375, -0.12162017822265625, -0.091400146484375, -0.06118011474609375, -0.0309600830078125, -0.00074005126953125, 0.02947998046875, 0.05970001220703125, 0.0899200439453125, 0.12014007568359375, 0.150360107421875, 0.18058013916015625, 0.2108001708984375, 0.24102020263671875, 0.271240234375, 0.30146026611328125, 0.3316802978515625, 0.36190032958984375, 0.392120361328125, 0.42234039306640625, 0.4525604248046875, 0.48278045654296875, 0.51300048828125, 0.5432205200195312, 0.5734405517578125, 0.6036605834960938, 0.633880615234375, 0.6641006469726562, 0.6943206787109375, 0.7245407104492188, 0.7547607421875, 0.7849807739257812, 0.8152008056640625, 0.8454208374023438, 0.875640869140625, 0.9058609008789062, 0.9360809326171875, 0.9663009643554688, 0.99652099609375, 1.0267410278320312, 1.0569610595703125, 1.0871810913085938, 1.117401123046875, 1.1476211547851562, 1.1778411865234375, 1.2080612182617188, 1.23828125]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 7.0, 3.0, 1.0, 1.0, 2.0, 8.0, 17.0, 26.0, 60.0, 113.0, 199.0, 259.0, 166.0, 87.0, 26.0, 20.0, 10.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.236351013183594, -24.37698745727539, -23.51762580871582, -22.658262252807617, -21.798900604248047, -20.939537048339844, -20.080175399780273, -19.22081184387207, -18.3614501953125, -17.502086639404297, -16.642724990844727, -15.78336238861084, -14.923999786376953, -14.06463623046875, -13.20527458190918, -12.345911026000977, -11.48654842376709, -10.627185821533203, -9.767823219299316, -8.90846061706543, -8.049098014831543, -7.189734935760498, -6.330372333526611, -5.471009731292725, -4.611647129058838, -3.752284526824951, -2.8929219245910645, -2.0335590839385986, -1.174196481704712, -0.3148336410522461, 0.5445289611816406, 1.4038915634155273, 2.263254165649414, 3.122616767883301, 3.9819793701171875, 4.841341972351074, 5.700704574584961, 6.560067653656006, 7.419430255889893, 8.278793334960938, 9.138154983520508, 9.997517585754395, 10.856880187988281, 11.716242790222168, 12.575605392456055, 13.434968948364258, 14.294330596923828, 15.153694152832031, 16.013057708740234, 16.872421264648438, 17.731782913208008, 18.59114646911621, 19.45050811767578, 20.309871673583984, 21.169233322143555, 22.028596878051758, 22.887958526611328, 23.74732208251953, 24.6066837310791, 25.466047286987305, 26.325408935546875, 27.184772491455078, 28.04413414001465, 28.90349769592285, 29.762859344482422]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 1.0, 8.0, 6.0, 4.0, 7.0, 13.0, 18.0, 12.0, 17.0, 16.0, 36.0, 32.0, 31.0, 32.0, 42.0, 32.0, 46.0, 48.0, 70.0, 78.0, 66.0, 58.0, 53.0, 39.0, 30.0, 32.0, 28.0, 29.0, 17.0, 20.0, 14.0, 16.0, 10.0, 15.0, 8.0, 7.0, 4.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-15.957334518432617, -15.446669578552246, -14.936004638671875, -14.425338745117188, -13.914673805236816, -13.404008865356445, -12.893342971801758, -12.382678031921387, -11.872013092041016, -11.361348152160645, -10.850683212280273, -10.340017318725586, -9.829352378845215, -9.318687438964844, -8.808021545410156, -8.297356605529785, -7.786691665649414, -7.276026725769043, -6.765361309051514, -6.254695892333984, -5.744030952453613, -5.233366012573242, -4.722700595855713, -4.212035179138184, -3.7013702392578125, -3.1907050609588623, -2.680039882659912, -2.169374704360962, -1.6587095260620117, -1.1480443477630615, -0.6373791694641113, -0.12671399116516113, 0.38395118713378906, 0.8946163654327393, 1.4052815437316895, 1.9159467220306396, 2.42661190032959, 2.93727707862854, 3.4479422569274902, 3.9586074352264404, 4.469272613525391, 4.979937553405762, 5.490602970123291, 6.00126838684082, 6.511933326721191, 7.0225982666015625, 7.533263683319092, 8.043929100036621, 8.554594039916992, 9.065258979797363, 9.575923919677734, 10.086589813232422, 10.597254753112793, 11.107919692993164, 11.618585586547852, 12.129250526428223, 12.639915466308594, 13.150580406188965, 13.661245346069336, 14.171911239624023, 14.682576179504395, 15.193241119384766, 15.703907012939453, 16.214570999145508, 16.725236892700195]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 6.0, 5.0, 13.0, 25.0, 25.0, 62.0, 152.0, 350.0, 745.0, 1970.0, 5085.0, 14559.0, 49093.0, 230453.0, 1381118.0, 2020275.0, 387480.0, 71666.0, 19997.0, 6809.0, 2533.0, 1030.0, 421.0, 171.0, 104.0, 45.0, 33.0, 14.0, 15.0, 7.0, 8.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.02734375, -0.992095947265625, -0.95684814453125, -0.921600341796875, -0.8863525390625, -0.851104736328125, -0.81585693359375, -0.780609130859375, -0.745361328125, -0.710113525390625, -0.67486572265625, -0.639617919921875, -0.6043701171875, -0.569122314453125, -0.53387451171875, -0.498626708984375, -0.46337890625, -0.428131103515625, -0.39288330078125, -0.357635498046875, -0.3223876953125, -0.287139892578125, -0.25189208984375, -0.216644287109375, -0.181396484375, -0.146148681640625, -0.11090087890625, -0.075653076171875, -0.0404052734375, -0.005157470703125, 0.03009033203125, 0.065338134765625, 0.1005859375, 0.135833740234375, 0.17108154296875, 0.206329345703125, 0.2415771484375, 0.276824951171875, 0.31207275390625, 0.347320556640625, 0.382568359375, 0.417816162109375, 0.45306396484375, 0.488311767578125, 0.5235595703125, 0.558807373046875, 0.59405517578125, 0.629302978515625, 0.66455078125, 0.699798583984375, 0.73504638671875, 0.770294189453125, 0.8055419921875, 0.840789794921875, 0.87603759765625, 0.911285400390625, 0.946533203125, 0.981781005859375, 1.01702880859375, 1.052276611328125, 1.0875244140625, 1.122772216796875, 1.15802001953125, 1.193267822265625, 1.228515625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 3.0, 9.0, 7.0, 3.0, 11.0, 6.0, 20.0, 21.0, 21.0, 20.0, 32.0, 29.0, 27.0, 47.0, 44.0, 40.0, 42.0, 43.0, 43.0, 56.0, 51.0, 47.0, 45.0, 46.0, 34.0, 33.0, 35.0, 37.0, 19.0, 20.0, 20.0, 16.0, 14.0, 14.0, 8.0, 9.0, 11.0, 8.0, 5.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8759765625, -0.8498077392578125, -0.823638916015625, -0.7974700927734375, -0.77130126953125, -0.7451324462890625, -0.718963623046875, -0.6927947998046875, -0.6666259765625, -0.6404571533203125, -0.614288330078125, -0.5881195068359375, -0.56195068359375, -0.5357818603515625, -0.509613037109375, -0.4834442138671875, -0.457275390625, -0.4311065673828125, -0.404937744140625, -0.3787689208984375, -0.35260009765625, -0.3264312744140625, -0.300262451171875, -0.2740936279296875, -0.2479248046875, -0.2217559814453125, -0.195587158203125, -0.1694183349609375, -0.14324951171875, -0.1170806884765625, -0.090911865234375, -0.0647430419921875, -0.03857421875, -0.0124053955078125, 0.013763427734375, 0.0399322509765625, 0.06610107421875, 0.0922698974609375, 0.118438720703125, 0.1446075439453125, 0.1707763671875, 0.1969451904296875, 0.223114013671875, 0.2492828369140625, 0.27545166015625, 0.3016204833984375, 0.327789306640625, 0.3539581298828125, 0.380126953125, 0.4062957763671875, 0.432464599609375, 0.4586334228515625, 0.48480224609375, 0.5109710693359375, 0.537139892578125, 0.5633087158203125, 0.5894775390625, 0.6156463623046875, 0.641815185546875, 0.6679840087890625, 0.69415283203125, 0.7203216552734375, 0.746490478515625, 0.7726593017578125, 0.798828125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 4.0, 6.0, 5.0, 17.0, 12.0, 12.0, 16.0, 32.0, 49.0, 68.0, 152.0, 244.0, 565.0, 1138.0, 3250.0, 9895.0, 39838.0, 241321.0, 2922117.0, 864971.0, 84459.0, 18006.0, 4971.0, 1627.0, 683.0, 346.0, 189.0, 102.0, 56.0, 39.0, 36.0, 21.0, 15.0, 10.0, 3.0, 3.0, 5.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-2.24609375, -2.1865692138671875, -2.127044677734375, -2.0675201416015625, -2.00799560546875, -1.9484710693359375, -1.888946533203125, -1.8294219970703125, -1.7698974609375, -1.7103729248046875, -1.650848388671875, -1.5913238525390625, -1.53179931640625, -1.4722747802734375, -1.412750244140625, -1.3532257080078125, -1.293701171875, -1.2341766357421875, -1.174652099609375, -1.1151275634765625, -1.05560302734375, -0.9960784912109375, -0.936553955078125, -0.8770294189453125, -0.8175048828125, -0.7579803466796875, -0.698455810546875, -0.6389312744140625, -0.57940673828125, -0.5198822021484375, -0.460357666015625, -0.4008331298828125, -0.34130859375, -0.2817840576171875, -0.222259521484375, -0.1627349853515625, -0.10321044921875, -0.0436859130859375, 0.015838623046875, 0.0753631591796875, 0.1348876953125, 0.1944122314453125, 0.253936767578125, 0.3134613037109375, 0.37298583984375, 0.4325103759765625, 0.492034912109375, 0.5515594482421875, 0.611083984375, 0.6706085205078125, 0.730133056640625, 0.7896575927734375, 0.84918212890625, 0.9087066650390625, 0.968231201171875, 1.0277557373046875, 1.0872802734375, 1.1468048095703125, 1.206329345703125, 1.2658538818359375, 1.32537841796875, 1.3849029541015625, 1.444427490234375, 1.5039520263671875, 1.5634765625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 5.0, 4.0, 7.0, 4.0, 8.0, 12.0, 11.0, 8.0, 17.0, 27.0, 43.0, 50.0, 61.0, 87.0, 104.0, 152.0, 223.0, 335.0, 442.0, 563.0, 554.0, 398.0, 279.0, 184.0, 127.0, 92.0, 58.0, 51.0, 39.0, 25.0, 31.0, 21.0, 11.0, 15.0, 6.0, 5.0, 5.0, 2.0, 4.0, 1.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6572265625, -1.601287841796875, -1.54534912109375, -1.489410400390625, -1.4334716796875, -1.377532958984375, -1.32159423828125, -1.265655517578125, -1.209716796875, -1.153778076171875, -1.09783935546875, -1.041900634765625, -0.9859619140625, -0.930023193359375, -0.87408447265625, -0.818145751953125, -0.76220703125, -0.706268310546875, -0.65032958984375, -0.594390869140625, -0.5384521484375, -0.482513427734375, -0.42657470703125, -0.370635986328125, -0.314697265625, -0.258758544921875, -0.20281982421875, -0.146881103515625, -0.0909423828125, -0.035003662109375, 0.02093505859375, 0.076873779296875, 0.1328125, 0.188751220703125, 0.24468994140625, 0.300628662109375, 0.3565673828125, 0.412506103515625, 0.46844482421875, 0.524383544921875, 0.580322265625, 0.636260986328125, 0.69219970703125, 0.748138427734375, 0.8040771484375, 0.860015869140625, 0.91595458984375, 0.971893310546875, 1.02783203125, 1.083770751953125, 1.13970947265625, 1.195648193359375, 1.2515869140625, 1.307525634765625, 1.36346435546875, 1.419403076171875, 1.475341796875, 1.531280517578125, 1.58721923828125, 1.643157958984375, 1.6990966796875, 1.755035400390625, 1.81097412109375, 1.866912841796875, 1.9228515625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 11.0, 17.0, 59.0, 265.0, 383.0, 176.0, 50.0, 21.0, 9.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.37917709350586, -37.024932861328125, -35.670684814453125, -34.31644058227539, -32.962196350097656, -31.607952117919922, -30.253705978393555, -28.899459838867188, -27.545215606689453, -26.19097137451172, -24.83672523498535, -23.482479095458984, -22.12823486328125, -20.773990631103516, -19.41974449157715, -18.06549835205078, -16.711254119873047, -15.357008934020996, -14.002763748168945, -12.648518562316895, -11.294273376464844, -9.940028190612793, -8.585783004760742, -7.231537818908691, -5.877292633056641, -4.52304744720459, -3.168802261352539, -1.8145570755004883, -0.4603118896484375, 0.8939332962036133, 2.248178482055664, 3.602423667907715, 4.956672668457031, 6.310917854309082, 7.665163040161133, 9.019408226013184, 10.373653411865234, 11.727898597717285, 13.082143783569336, 14.436388969421387, 15.790634155273438, 17.144878387451172, 18.49912452697754, 19.853370666503906, 21.20761489868164, 22.561859130859375, 23.916105270385742, 25.27035140991211, 26.624595642089844, 27.978839874267578, 29.333086013793945, 30.687332153320312, 32.04157638549805, 33.39582061767578, 34.75006866455078, 36.104312896728516, 37.45855712890625, 38.812801361083984, 40.16704559326172, 41.52129364013672, 42.87553787231445, 44.22978210449219, 45.58403015136719, 46.93827438354492, 48.292518615722656]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 7.0, 2.0, 6.0, 9.0, 8.0, 12.0, 10.0, 20.0, 23.0, 24.0, 33.0, 35.0, 47.0, 52.0, 52.0, 70.0, 68.0, 50.0, 49.0, 57.0, 57.0, 35.0, 57.0, 39.0, 31.0, 33.0, 29.0, 19.0, 11.0, 21.0, 12.0, 7.0, 7.0, 6.0, 2.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.817249298095703, -14.404088973999023, -13.99092960357666, -13.577770233154297, -13.164609909057617, -12.751449584960938, -12.338290214538574, -11.925130844116211, -11.511970520019531, -11.098810195922852, -10.685650825500488, -10.272491455078125, -9.859331130981445, -9.446170806884766, -9.033011436462402, -8.619852066040039, -8.20669174194336, -7.793531894683838, -7.380372047424316, -6.967212200164795, -6.554052352905273, -6.140892505645752, -5.7277326583862305, -5.314572811126709, -4.9014129638671875, -4.488253116607666, -4.0750932693481445, -3.661933422088623, -3.2487735748291016, -2.83561372756958, -2.4224538803100586, -2.009294033050537, -1.5961341857910156, -1.1829743385314941, -0.7698144912719727, -0.35665464401245117, 0.05650520324707031, 0.4696650505065918, 0.8828248977661133, 1.2959847450256348, 1.7091445922851562, 2.1223044395446777, 2.535464286804199, 2.9486241340637207, 3.361783981323242, 3.7749438285827637, 4.188103675842285, 4.601263523101807, 5.014423370361328, 5.42758321762085, 5.840743064880371, 6.253902912139893, 6.667062759399414, 7.0802226066589355, 7.493382453918457, 7.9065423011779785, 8.3197021484375, 8.73286247253418, 9.146021842956543, 9.559181213378906, 9.972341537475586, 10.385501861572266, 10.798661231994629, 11.211820602416992, 11.624980926513672]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 3.0, 3.0, 3.0, 15.0, 17.0, 28.0, 59.0, 122.0, 238.0, 387.0, 799.0, 1661.0, 3638.0, 8420.0, 20853.0, 52765.0, 135162.0, 300774.0, 300020.0, 134951.0, 52991.0, 20317.0, 8358.0, 3590.0, 1677.0, 847.0, 391.0, 205.0, 105.0, 70.0, 34.0, 18.0, 14.0, 12.0, 4.0, 8.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.630859375, -1.5782470703125, -1.525634765625, -1.4730224609375, -1.42041015625, -1.3677978515625, -1.315185546875, -1.2625732421875, -1.2099609375, -1.1573486328125, -1.104736328125, -1.0521240234375, -0.99951171875, -0.9468994140625, -0.894287109375, -0.8416748046875, -0.7890625, -0.7364501953125, -0.683837890625, -0.6312255859375, -0.57861328125, -0.5260009765625, -0.473388671875, -0.4207763671875, -0.3681640625, -0.3155517578125, -0.262939453125, -0.2103271484375, -0.15771484375, -0.1051025390625, -0.052490234375, 0.0001220703125, 0.052734375, 0.1053466796875, 0.157958984375, 0.2105712890625, 0.26318359375, 0.3157958984375, 0.368408203125, 0.4210205078125, 0.4736328125, 0.5262451171875, 0.578857421875, 0.6314697265625, 0.68408203125, 0.7366943359375, 0.789306640625, 0.8419189453125, 0.89453125, 0.9471435546875, 0.999755859375, 1.0523681640625, 1.10498046875, 1.1575927734375, 1.210205078125, 1.2628173828125, 1.3154296875, 1.3680419921875, 1.420654296875, 1.4732666015625, 1.52587890625, 1.5784912109375, 1.631103515625, 1.6837158203125, 1.736328125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 9.0, 7.0, 10.0, 5.0, 12.0, 17.0, 17.0, 26.0, 19.0, 33.0, 29.0, 17.0, 30.0, 37.0, 45.0, 42.0, 52.0, 53.0, 40.0, 52.0, 52.0, 51.0, 48.0, 38.0, 48.0, 30.0, 33.0, 17.0, 17.0, 22.0, 18.0, 18.0, 8.0, 9.0, 10.0, 8.0, 7.0, 4.0, 3.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.8505859375, -0.8228836059570312, -0.7951812744140625, -0.7674789428710938, -0.739776611328125, -0.7120742797851562, -0.6843719482421875, -0.6566696166992188, -0.62896728515625, -0.6012649536132812, -0.5735626220703125, -0.5458602905273438, -0.518157958984375, -0.49045562744140625, -0.4627532958984375, -0.43505096435546875, -0.4073486328125, -0.37964630126953125, -0.3519439697265625, -0.32424163818359375, -0.296539306640625, -0.26883697509765625, -0.2411346435546875, -0.21343231201171875, -0.18572998046875, -0.15802764892578125, -0.1303253173828125, -0.10262298583984375, -0.074920654296875, -0.04721832275390625, -0.0195159912109375, 0.00818634033203125, 0.035888671875, 0.06359100341796875, 0.0912933349609375, 0.11899566650390625, 0.146697998046875, 0.17440032958984375, 0.2021026611328125, 0.22980499267578125, 0.25750732421875, 0.28520965576171875, 0.3129119873046875, 0.34061431884765625, 0.368316650390625, 0.39601898193359375, 0.4237213134765625, 0.45142364501953125, 0.4791259765625, 0.5068283081054688, 0.5345306396484375, 0.5622329711914062, 0.589935302734375, 0.6176376342773438, 0.6453399658203125, 0.6730422973632812, 0.70074462890625, 0.7284469604492188, 0.7561492919921875, 0.7838516235351562, 0.811553955078125, 0.8392562866210938, 0.8669586181640625, 0.8946609497070312, 0.92236328125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 4.0, 1.0, 5.0, 3.0, 3.0, 7.0, 8.0, 14.0, 24.0, 23.0, 31.0, 46.0, 72.0, 85.0, 133.0, 199.0, 280.0, 465.0, 778.0, 1562.0, 3737.0, 13000.0, 79689.0, 666690.0, 239086.0, 30933.0, 6546.0, 2344.0, 1129.0, 588.0, 333.0, 223.0, 148.0, 102.0, 78.0, 58.0, 32.0, 26.0, 25.0, 19.0, 7.0, 7.0, 4.0, 6.0, 3.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.46875, -3.36285400390625, -3.2569580078125, -3.15106201171875, -3.045166015625, -2.93927001953125, -2.8333740234375, -2.72747802734375, -2.62158203125, -2.51568603515625, -2.4097900390625, -2.30389404296875, -2.197998046875, -2.09210205078125, -1.9862060546875, -1.88031005859375, -1.7744140625, -1.66851806640625, -1.5626220703125, -1.45672607421875, -1.350830078125, -1.24493408203125, -1.1390380859375, -1.03314208984375, -0.92724609375, -0.82135009765625, -0.7154541015625, -0.60955810546875, -0.503662109375, -0.39776611328125, -0.2918701171875, -0.18597412109375, -0.080078125, 0.02581787109375, 0.1317138671875, 0.23760986328125, 0.343505859375, 0.44940185546875, 0.5552978515625, 0.66119384765625, 0.76708984375, 0.87298583984375, 0.9788818359375, 1.08477783203125, 1.190673828125, 1.29656982421875, 1.4024658203125, 1.50836181640625, 1.6142578125, 1.72015380859375, 1.8260498046875, 1.93194580078125, 2.037841796875, 2.14373779296875, 2.2496337890625, 2.35552978515625, 2.46142578125, 2.56732177734375, 2.6732177734375, 2.77911376953125, 2.885009765625, 2.99090576171875, 3.0968017578125, 3.20269775390625, 3.30859375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 6.0, 6.0, 1.0, 10.0, 14.0, 16.0, 17.0, 24.0, 27.0, 35.0, 46.0, 58.0, 65.0, 66.0, 44.0, 55.0, 62.0, 61.0, 62.0, 42.0, 56.0, 46.0, 40.0, 25.0, 24.0, 25.0, 14.0, 9.0, 12.0, 11.0, 1.0, 5.0, 5.0, 7.0, 3.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.56640625, -4.43243408203125, -4.2984619140625, -4.16448974609375, -4.030517578125, -3.89654541015625, -3.7625732421875, -3.62860107421875, -3.49462890625, -3.36065673828125, -3.2266845703125, -3.09271240234375, -2.958740234375, -2.82476806640625, -2.6907958984375, -2.55682373046875, -2.4228515625, -2.28887939453125, -2.1549072265625, -2.02093505859375, -1.886962890625, -1.75299072265625, -1.6190185546875, -1.48504638671875, -1.35107421875, -1.21710205078125, -1.0831298828125, -0.94915771484375, -0.815185546875, -0.68121337890625, -0.5472412109375, -0.41326904296875, -0.279296875, -0.14532470703125, -0.0113525390625, 0.12261962890625, 0.256591796875, 0.39056396484375, 0.5245361328125, 0.65850830078125, 0.79248046875, 0.92645263671875, 1.0604248046875, 1.19439697265625, 1.328369140625, 1.46234130859375, 1.5963134765625, 1.73028564453125, 1.8642578125, 1.99822998046875, 2.1322021484375, 2.26617431640625, 2.400146484375, 2.53411865234375, 2.6680908203125, 2.80206298828125, 2.93603515625, 3.07000732421875, 3.2039794921875, 3.33795166015625, 3.471923828125, 3.60589599609375, 3.7398681640625, 3.87384033203125, 4.0078125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 4.0, 0.0, 5.0, 5.0, 3.0, 3.0, 8.0, 9.0, 8.0, 16.0, 15.0, 29.0, 32.0, 43.0, 67.0, 112.0, 149.0, 262.0, 468.0, 927.0, 1984.0, 5103.0, 17309.0, 79291.0, 539023.0, 319086.0, 62238.0, 14171.0, 4475.0, 1771.0, 763.0, 464.0, 254.0, 119.0, 86.0, 63.0, 64.0, 31.0, 17.0, 22.0, 13.0, 12.0, 9.0, 8.0, 3.0, 4.0, 5.0, 2.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.81689453125, -0.7913055419921875, -0.765716552734375, -0.7401275634765625, -0.71453857421875, -0.6889495849609375, -0.663360595703125, -0.6377716064453125, -0.6121826171875, -0.5865936279296875, -0.561004638671875, -0.5354156494140625, -0.50982666015625, -0.4842376708984375, -0.458648681640625, -0.4330596923828125, -0.407470703125, -0.3818817138671875, -0.356292724609375, -0.3307037353515625, -0.30511474609375, -0.2795257568359375, -0.253936767578125, -0.2283477783203125, -0.2027587890625, -0.1771697998046875, -0.151580810546875, -0.1259918212890625, -0.10040283203125, -0.0748138427734375, -0.049224853515625, -0.0236358642578125, 0.001953125, 0.0275421142578125, 0.053131103515625, 0.0787200927734375, 0.10430908203125, 0.1298980712890625, 0.155487060546875, 0.1810760498046875, 0.2066650390625, 0.2322540283203125, 0.257843017578125, 0.2834320068359375, 0.30902099609375, 0.3346099853515625, 0.360198974609375, 0.3857879638671875, 0.411376953125, 0.4369659423828125, 0.462554931640625, 0.4881439208984375, 0.51373291015625, 0.5393218994140625, 0.564910888671875, 0.5904998779296875, 0.6160888671875, 0.6416778564453125, 0.667266845703125, 0.6928558349609375, 0.71844482421875, 0.7440338134765625, 0.769622802734375, 0.7952117919921875, 0.82080078125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 3.0, 2.0, 0.0, 8.0, 6.0, 10.0, 11.0, 25.0, 25.0, 30.0, 28.0, 52.0, 60.0, 84.0, 96.0, 106.0, 89.0, 84.0, 69.0, 49.0, 35.0, 29.0, 19.0, 15.0, 11.0, 18.0, 12.0, 4.0, 8.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0002582073211669922, -0.00024978071451187134, -0.0002413541078567505, -0.00023292750120162964, -0.0002245008945465088, -0.00021607428789138794, -0.0002076476812362671, -0.00019922107458114624, -0.0001907944679260254, -0.00018236786127090454, -0.0001739412546157837, -0.00016551464796066284, -0.000157088041305542, -0.00014866143465042114, -0.0001402348279953003, -0.00013180822134017944, -0.0001233816146850586, -0.00011495500802993774, -0.0001065284013748169, -9.810179471969604e-05, -8.96751880645752e-05, -8.124858140945435e-05, -7.28219747543335e-05, -6.439536809921265e-05, -5.59687614440918e-05, -4.754215478897095e-05, -3.91155481338501e-05, -3.068894147872925e-05, -2.22623348236084e-05, -1.3835728168487549e-05, -5.409121513366699e-06, 3.0174851417541504e-06, 1.1444091796875e-05, 1.987069845199585e-05, 2.82973051071167e-05, 3.672391176223755e-05, 4.51505184173584e-05, 5.357712507247925e-05, 6.20037317276001e-05, 7.043033838272095e-05, 7.88569450378418e-05, 8.728355169296265e-05, 9.57101583480835e-05, 0.00010413676500320435, 0.0001125633716583252, 0.00012098997831344604, 0.0001294165849685669, 0.00013784319162368774, 0.0001462697982788086, 0.00015469640493392944, 0.0001631230115890503, 0.00017154961824417114, 0.000179976224899292, 0.00018840283155441284, 0.0001968294382095337, 0.00020525604486465454, 0.0002136826515197754, 0.00022210925817489624, 0.0002305358648300171, 0.00023896247148513794, 0.0002473890781402588, 0.00025581568479537964, 0.0002642422914505005, 0.00027266889810562134, 0.0002810955047607422]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 3.0, 4.0, 11.0, 8.0, 13.0, 18.0, 27.0, 38.0, 73.0, 104.0, 200.0, 363.0, 813.0, 1802.0, 5419.0, 25837.0, 236634.0, 688404.0, 72861.0, 10663.0, 2935.0, 1125.0, 533.0, 278.0, 151.0, 87.0, 47.0, 34.0, 18.0, 17.0, 9.0, 7.0, 1.0, 4.0, 6.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.03125, -0.999267578125, -0.96728515625, -0.935302734375, -0.9033203125, -0.871337890625, -0.83935546875, -0.807373046875, -0.775390625, -0.743408203125, -0.71142578125, -0.679443359375, -0.6474609375, -0.615478515625, -0.58349609375, -0.551513671875, -0.51953125, -0.487548828125, -0.45556640625, -0.423583984375, -0.3916015625, -0.359619140625, -0.32763671875, -0.295654296875, -0.263671875, -0.231689453125, -0.19970703125, -0.167724609375, -0.1357421875, -0.103759765625, -0.07177734375, -0.039794921875, -0.0078125, 0.024169921875, 0.05615234375, 0.088134765625, 0.1201171875, 0.152099609375, 0.18408203125, 0.216064453125, 0.248046875, 0.280029296875, 0.31201171875, 0.343994140625, 0.3759765625, 0.407958984375, 0.43994140625, 0.471923828125, 0.50390625, 0.535888671875, 0.56787109375, 0.599853515625, 0.6318359375, 0.663818359375, 0.69580078125, 0.727783203125, 0.759765625, 0.791748046875, 0.82373046875, 0.855712890625, 0.8876953125, 0.919677734375, 0.95166015625, 0.983642578125, 1.015625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 6.0, 10.0, 8.0, 11.0, 15.0, 23.0, 28.0, 46.0, 45.0, 64.0, 80.0, 81.0, 94.0, 93.0, 77.0, 72.0, 57.0, 58.0, 47.0, 27.0, 15.0, 15.0, 10.0, 7.0, 8.0, 6.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1748046875, -1.1439743041992188, -1.1131439208984375, -1.0823135375976562, -1.051483154296875, -1.0206527709960938, -0.9898223876953125, -0.9589920043945312, -0.92816162109375, -0.8973312377929688, -0.8665008544921875, -0.8356704711914062, -0.804840087890625, -0.7740097045898438, -0.7431793212890625, -0.7123489379882812, -0.6815185546875, -0.6506881713867188, -0.6198577880859375, -0.5890274047851562, -0.558197021484375, -0.5273666381835938, -0.4965362548828125, -0.46570587158203125, -0.43487548828125, -0.40404510498046875, -0.3732147216796875, -0.34238433837890625, -0.311553955078125, -0.28072357177734375, -0.2498931884765625, -0.21906280517578125, -0.188232421875, -0.15740203857421875, -0.1265716552734375, -0.09574127197265625, -0.064910888671875, -0.03408050537109375, -0.0032501220703125, 0.02758026123046875, 0.05841064453125, 0.08924102783203125, 0.1200714111328125, 0.15090179443359375, 0.181732177734375, 0.21256256103515625, 0.2433929443359375, 0.27422332763671875, 0.3050537109375, 0.33588409423828125, 0.3667144775390625, 0.39754486083984375, 0.428375244140625, 0.45920562744140625, 0.4900360107421875, 0.5208663940429688, 0.55169677734375, 0.5825271606445312, 0.6133575439453125, 0.6441879272460938, 0.675018310546875, 0.7058486938476562, 0.7366790771484375, 0.7675094604492188, 0.79833984375]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 5.0, 14.0, 35.0, 49.0, 89.0, 143.0, 241.0, 162.0, 97.0, 81.0, 31.0, 17.0, 9.0, 7.0, 4.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-23.46628189086914, -22.787492752075195, -22.10870361328125, -21.429916381835938, -20.751127243041992, -20.072338104248047, -19.3935489654541, -18.714759826660156, -18.035972595214844, -17.3571834564209, -16.678394317626953, -15.999606132507324, -15.320817947387695, -14.64202880859375, -13.963239669799805, -13.284451484680176, -12.60566234588623, -11.926873207092285, -11.248085021972656, -10.569295883178711, -9.890507698059082, -9.211718559265137, -8.532930374145508, -7.8541412353515625, -7.175352573394775, -6.496563911437988, -5.817775249481201, -5.138986587524414, -4.460197448730469, -3.7814090251922607, -3.1026201248168945, -2.4238314628601074, -1.7450428009033203, -1.0662541389465332, -0.38746535778045654, 0.2913234233856201, 0.9701120853424072, 1.6489007472991943, 2.3276896476745605, 3.0064783096313477, 3.6852669715881348, 4.364055633544922, 5.042844295501709, 5.721632957458496, 6.400422096252441, 7.07921028137207, 7.757999420166016, 8.436788558959961, 9.11557674407959, 9.794365882873535, 10.473154067993164, 11.15194320678711, 11.830731391906738, 12.509520530700684, 13.188308715820312, 13.867097854614258, 14.545886993408203, 15.224676132202148, 15.903464317321777, 16.582252502441406, 17.26104164123535, 17.939830780029297, 18.618619918823242, 19.297409057617188, 19.9761962890625]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 2.0, 5.0, 4.0, 11.0, 9.0, 13.0, 7.0, 17.0, 15.0, 13.0, 19.0, 25.0, 23.0, 28.0, 27.0, 35.0, 41.0, 48.0, 72.0, 66.0, 73.0, 64.0, 52.0, 41.0, 30.0, 33.0, 32.0, 27.0, 26.0, 18.0, 23.0, 24.0, 17.0, 9.0, 10.0, 8.0, 6.0, 6.0, 6.0, 7.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.696672439575195, -13.268020629882812, -12.83936882019043, -12.410717964172363, -11.98206615447998, -11.553414344787598, -11.124763488769531, -10.696111679077148, -10.267459869384766, -9.838808059692383, -9.41015625, -8.981505393981934, -8.55285358428955, -8.124201774597168, -7.695550441741943, -7.266899108886719, -6.838247299194336, -6.409595489501953, -5.9809441566467285, -5.552292823791504, -5.123641014099121, -4.694989204406738, -4.266337871551514, -3.83768630027771, -3.4090347290039062, -2.9803831577301025, -2.551731586456299, -2.123080015182495, -1.6944284439086914, -1.2657768726348877, -0.837125301361084, -0.4084737300872803, 0.020178794860839844, 0.44883036613464355, 0.8774819374084473, 1.306133508682251, 1.7347850799560547, 2.1634366512298584, 2.592088222503662, 3.020739793777466, 3.4493913650512695, 3.8780429363250732, 4.306694507598877, 4.735345840454102, 5.163997650146484, 5.592649459838867, 6.021300792694092, 6.449952125549316, 6.878603935241699, 7.307255744934082, 7.735907077789307, 8.164558410644531, 8.593210220336914, 9.021862030029297, 9.45051383972168, 9.879164695739746, 10.307816505432129, 10.736468315124512, 11.165119171142578, 11.593770980834961, 12.022422790527344, 12.451074600219727, 12.87972640991211, 13.308377265930176, 13.737029075622559]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 1.0, 3.0, 7.0, 6.0, 4.0, 13.0, 14.0, 15.0, 14.0, 22.0, 34.0, 53.0, 52.0, 106.0, 158.0, 308.0, 671.0, 1601.0, 4078.0, 13659.0, 63166.0, 447574.0, 2217824.0, 1239799.0, 165566.0, 27650.0, 7213.0, 2532.0, 1015.0, 442.0, 239.0, 147.0, 97.0, 63.0, 34.0, 24.0, 19.0, 15.0, 16.0, 8.0, 9.0, 8.0, 5.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.95068359375, -0.9137802124023438, -0.8768768310546875, -0.8399734497070312, -0.803070068359375, -0.7661666870117188, -0.7292633056640625, -0.6923599243164062, -0.65545654296875, -0.6185531616210938, -0.5816497802734375, -0.5447463989257812, -0.507843017578125, -0.47093963623046875, -0.4340362548828125, -0.39713287353515625, -0.3602294921875, -0.32332611083984375, -0.2864227294921875, -0.24951934814453125, -0.212615966796875, -0.17571258544921875, -0.1388092041015625, -0.10190582275390625, -0.06500244140625, -0.02809906005859375, 0.0088043212890625, 0.04570770263671875, 0.082611083984375, 0.11951446533203125, 0.1564178466796875, 0.19332122802734375, 0.230224609375, 0.26712799072265625, 0.3040313720703125, 0.34093475341796875, 0.377838134765625, 0.41474151611328125, 0.4516448974609375, 0.48854827880859375, 0.52545166015625, 0.5623550415039062, 0.5992584228515625, 0.6361618041992188, 0.673065185546875, 0.7099685668945312, 0.7468719482421875, 0.7837753295898438, 0.8206787109375, 0.8575820922851562, 0.8944854736328125, 0.9313888549804688, 0.968292236328125, 1.0051956176757812, 1.0420989990234375, 1.0790023803710938, 1.11590576171875, 1.1528091430664062, 1.1897125244140625, 1.2266159057617188, 1.263519287109375, 1.3004226684570312, 1.3373260498046875, 1.3742294311523438, 1.4111328125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 5.0, 7.0, 10.0, 8.0, 10.0, 14.0, 12.0, 17.0, 22.0, 25.0, 32.0, 30.0, 32.0, 28.0, 36.0, 30.0, 50.0, 49.0, 50.0, 35.0, 52.0, 52.0, 40.0, 46.0, 33.0, 34.0, 33.0, 34.0, 28.0, 17.0, 24.0, 23.0, 19.0, 14.0, 9.0, 9.0, 9.0, 9.0, 7.0, 3.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.83935546875, -0.814544677734375, -0.78973388671875, -0.764923095703125, -0.7401123046875, -0.715301513671875, -0.69049072265625, -0.665679931640625, -0.640869140625, -0.616058349609375, -0.59124755859375, -0.566436767578125, -0.5416259765625, -0.516815185546875, -0.49200439453125, -0.467193603515625, -0.4423828125, -0.417572021484375, -0.39276123046875, -0.367950439453125, -0.3431396484375, -0.318328857421875, -0.29351806640625, -0.268707275390625, -0.243896484375, -0.219085693359375, -0.19427490234375, -0.169464111328125, -0.1446533203125, -0.119842529296875, -0.09503173828125, -0.070220947265625, -0.04541015625, -0.020599365234375, 0.00421142578125, 0.029022216796875, 0.0538330078125, 0.078643798828125, 0.10345458984375, 0.128265380859375, 0.153076171875, 0.177886962890625, 0.20269775390625, 0.227508544921875, 0.2523193359375, 0.277130126953125, 0.30194091796875, 0.326751708984375, 0.3515625, 0.376373291015625, 0.40118408203125, 0.425994873046875, 0.4508056640625, 0.475616455078125, 0.50042724609375, 0.525238037109375, 0.550048828125, 0.574859619140625, 0.59967041015625, 0.624481201171875, 0.6492919921875, 0.674102783203125, 0.69891357421875, 0.723724365234375, 0.74853515625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 6.0, 6.0, 8.0, 12.0, 23.0, 34.0, 43.0, 100.0, 167.0, 305.0, 583.0, 1236.0, 3579.0, 13651.0, 92051.0, 2492407.0, 1515235.0, 60065.0, 9897.0, 2711.0, 1027.0, 501.0, 257.0, 147.0, 87.0, 49.0, 35.0, 22.0, 11.0, 6.0, 8.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.603515625, -2.531036376953125, -2.45855712890625, -2.386077880859375, -2.3135986328125, -2.241119384765625, -2.16864013671875, -2.096160888671875, -2.023681640625, -1.951202392578125, -1.87872314453125, -1.806243896484375, -1.7337646484375, -1.661285400390625, -1.58880615234375, -1.516326904296875, -1.44384765625, -1.371368408203125, -1.29888916015625, -1.226409912109375, -1.1539306640625, -1.081451416015625, -1.00897216796875, -0.936492919921875, -0.864013671875, -0.791534423828125, -0.71905517578125, -0.646575927734375, -0.5740966796875, -0.501617431640625, -0.42913818359375, -0.356658935546875, -0.2841796875, -0.211700439453125, -0.13922119140625, -0.066741943359375, 0.0057373046875, 0.078216552734375, 0.15069580078125, 0.223175048828125, 0.295654296875, 0.368133544921875, 0.44061279296875, 0.513092041015625, 0.5855712890625, 0.658050537109375, 0.73052978515625, 0.803009033203125, 0.87548828125, 0.947967529296875, 1.02044677734375, 1.092926025390625, 1.1654052734375, 1.237884521484375, 1.31036376953125, 1.382843017578125, 1.455322265625, 1.527801513671875, 1.60028076171875, 1.672760009765625, 1.7452392578125, 1.817718505859375, 1.89019775390625, 1.962677001953125, 2.03515625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 1.0, 8.0, 8.0, 7.0, 15.0, 6.0, 14.0, 21.0, 34.0, 43.0, 58.0, 105.0, 177.0, 288.0, 432.0, 665.0, 722.0, 551.0, 366.0, 220.0, 122.0, 68.0, 52.0, 33.0, 11.0, 16.0, 5.0, 10.0, 3.0, 4.0, 5.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9921875, -1.921417236328125, -1.85064697265625, -1.779876708984375, -1.7091064453125, -1.638336181640625, -1.56756591796875, -1.496795654296875, -1.426025390625, -1.355255126953125, -1.28448486328125, -1.213714599609375, -1.1429443359375, -1.072174072265625, -1.00140380859375, -0.930633544921875, -0.85986328125, -0.789093017578125, -0.71832275390625, -0.647552490234375, -0.5767822265625, -0.506011962890625, -0.43524169921875, -0.364471435546875, -0.293701171875, -0.222930908203125, -0.15216064453125, -0.081390380859375, -0.0106201171875, 0.060150146484375, 0.13092041015625, 0.201690673828125, 0.2724609375, 0.343231201171875, 0.41400146484375, 0.484771728515625, 0.5555419921875, 0.626312255859375, 0.69708251953125, 0.767852783203125, 0.838623046875, 0.909393310546875, 0.98016357421875, 1.050933837890625, 1.1217041015625, 1.192474365234375, 1.26324462890625, 1.334014892578125, 1.40478515625, 1.475555419921875, 1.54632568359375, 1.617095947265625, 1.6878662109375, 1.758636474609375, 1.82940673828125, 1.900177001953125, 1.970947265625, 2.041717529296875, 2.11248779296875, 2.183258056640625, 2.2540283203125, 2.324798583984375, 2.39556884765625, 2.466339111328125, 2.537109375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 4.0, 2.0, 7.0, 11.0, 28.0, 122.0, 342.0, 328.0, 128.0, 14.0, 10.0, 5.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.348331451416016, -27.05377769470215, -25.75922393798828, -24.464670181274414, -23.170116424560547, -21.875564575195312, -20.581010818481445, -19.286457061767578, -17.99190330505371, -16.697349548339844, -15.402795791625977, -14.108242988586426, -12.813689231872559, -11.519135475158691, -10.22458267211914, -8.930028915405273, -7.635475158691406, -6.340921401977539, -5.04636812210083, -3.751814603805542, -2.457261085510254, -1.1627073287963867, 0.13184595108032227, 1.4263992309570312, 2.7209529876708984, 4.015506744384766, 5.310060024261475, 6.604613304138184, 7.899167060852051, 9.193720817565918, 10.488273620605469, 11.782827377319336, 13.077377319335938, 14.371931076049805, 15.666484832763672, 16.96103858947754, 18.255592346191406, 19.55014419555664, 20.844697952270508, 22.139251708984375, 23.433805465698242, 24.72835922241211, 26.022912979125977, 27.317466735839844, 28.612018585205078, 29.906574249267578, 31.201126098632812, 32.49568176269531, 33.79023361206055, 35.08478546142578, 36.37934112548828, 37.673892974853516, 38.968448638916016, 40.26300048828125, 41.55755615234375, 42.852108001708984, 44.14665985107422, 45.44121170043945, 46.73576736450195, 48.03031921386719, 49.32487487792969, 50.61942672729492, 51.91398239135742, 53.208534240722656, 54.503089904785156]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 6.0, 8.0, 8.0, 13.0, 11.0, 23.0, 25.0, 20.0, 34.0, 26.0, 25.0, 42.0, 41.0, 50.0, 40.0, 55.0, 54.0, 52.0, 40.0, 53.0, 48.0, 35.0, 47.0, 39.0, 31.0, 30.0, 25.0, 24.0, 17.0, 19.0, 15.0, 17.0, 12.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.662504196166992, -9.341949462890625, -9.021394729614258, -8.70083999633789, -8.380285263061523, -8.059730529785156, -7.739176273345947, -7.418622016906738, -7.098067283630371, -6.777512550354004, -6.456957817077637, -6.1364030838012695, -5.8158488273620605, -5.495294094085693, -5.174739360809326, -4.854185104370117, -4.533629894256592, -4.213075160980225, -3.8925206661224365, -3.5719659328460693, -3.2514114379882812, -2.930856704711914, -2.610301971435547, -2.289747476577759, -1.9691927433013916, -1.648638129234314, -1.3280835151672363, -1.0075287818908691, -0.6869741678237915, -0.36641955375671387, -0.04586482048034668, 0.2746896743774414, 0.5952444076538086, 0.9157990217208862, 1.2363536357879639, 1.556908369064331, 1.8774629831314087, 2.1980175971984863, 2.5185723304748535, 2.8391268253326416, 3.159681558609009, 3.480236291885376, 3.800790786743164, 4.121345520019531, 4.441900253295898, 4.762454986572266, 5.083009719848633, 5.403563976287842, 5.724118709564209, 6.044673442840576, 6.365228176116943, 6.685782432556152, 7.0063371658325195, 7.326891899108887, 7.647446632385254, 7.968001365661621, 8.288556098937988, 8.609110832214355, 8.929665565490723, 9.25022029876709, 9.570775032043457, 9.891328811645508, 10.211883544921875, 10.532438278198242, 10.85299301147461]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 6.0, 7.0, 12.0, 24.0, 22.0, 53.0, 85.0, 152.0, 231.0, 357.0, 576.0, 975.0, 1622.0, 3056.0, 5716.0, 10755.0, 21035.0, 42981.0, 88185.0, 167579.0, 243458.0, 213388.0, 123941.0, 61940.0, 30112.0, 14929.0, 7741.0, 4125.0, 2280.0, 1268.0, 739.0, 438.0, 300.0, 179.0, 114.0, 65.0, 41.0, 30.0, 15.0, 11.0, 4.0, 3.0, 4.0, 6.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0078125, -0.97393798828125, -0.9400634765625, -0.90618896484375, -0.872314453125, -0.83843994140625, -0.8045654296875, -0.77069091796875, -0.73681640625, -0.70294189453125, -0.6690673828125, -0.63519287109375, -0.601318359375, -0.56744384765625, -0.5335693359375, -0.49969482421875, -0.4658203125, -0.43194580078125, -0.3980712890625, -0.36419677734375, -0.330322265625, -0.29644775390625, -0.2625732421875, -0.22869873046875, -0.19482421875, -0.16094970703125, -0.1270751953125, -0.09320068359375, -0.059326171875, -0.02545166015625, 0.0084228515625, 0.04229736328125, 0.076171875, 0.11004638671875, 0.1439208984375, 0.17779541015625, 0.211669921875, 0.24554443359375, 0.2794189453125, 0.31329345703125, 0.34716796875, 0.38104248046875, 0.4149169921875, 0.44879150390625, 0.482666015625, 0.51654052734375, 0.5504150390625, 0.58428955078125, 0.6181640625, 0.65203857421875, 0.6859130859375, 0.71978759765625, 0.753662109375, 0.78753662109375, 0.8214111328125, 0.85528564453125, 0.88916015625, 0.92303466796875, 0.9569091796875, 0.99078369140625, 1.024658203125, 1.05853271484375, 1.0924072265625, 1.12628173828125, 1.16015625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 0.0, 2.0, 0.0, 5.0, 4.0, 7.0, 7.0, 10.0, 13.0, 10.0, 16.0, 21.0, 25.0, 35.0, 27.0, 37.0, 27.0, 30.0, 40.0, 41.0, 41.0, 43.0, 43.0, 49.0, 51.0, 50.0, 44.0, 48.0, 33.0, 25.0, 27.0, 27.0, 31.0, 24.0, 20.0, 17.0, 11.0, 9.0, 13.0, 7.0, 8.0, 5.0, 9.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.841796875, -0.815704345703125, -0.78961181640625, -0.763519287109375, -0.7374267578125, -0.711334228515625, -0.68524169921875, -0.659149169921875, -0.633056640625, -0.606964111328125, -0.58087158203125, -0.554779052734375, -0.5286865234375, -0.502593994140625, -0.47650146484375, -0.450408935546875, -0.42431640625, -0.398223876953125, -0.37213134765625, -0.346038818359375, -0.3199462890625, -0.293853759765625, -0.26776123046875, -0.241668701171875, -0.215576171875, -0.189483642578125, -0.16339111328125, -0.137298583984375, -0.1112060546875, -0.085113525390625, -0.05902099609375, -0.032928466796875, -0.0068359375, 0.019256591796875, 0.04534912109375, 0.071441650390625, 0.0975341796875, 0.123626708984375, 0.14971923828125, 0.175811767578125, 0.201904296875, 0.227996826171875, 0.25408935546875, 0.280181884765625, 0.3062744140625, 0.332366943359375, 0.35845947265625, 0.384552001953125, 0.41064453125, 0.436737060546875, 0.46282958984375, 0.488922119140625, 0.5150146484375, 0.541107177734375, 0.56719970703125, 0.593292236328125, 0.619384765625, 0.645477294921875, 0.67156982421875, 0.697662353515625, 0.7237548828125, 0.749847412109375, 0.77593994140625, 0.802032470703125, 0.828125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 7.0, 2.0, 4.0, 12.0, 7.0, 13.0, 16.0, 20.0, 28.0, 22.0, 49.0, 95.0, 133.0, 272.0, 541.0, 1332.0, 3918.0, 15196.0, 76798.0, 547081.0, 325421.0, 59617.0, 12322.0, 3379.0, 1162.0, 422.0, 229.0, 137.0, 105.0, 66.0, 40.0, 29.0, 21.0, 14.0, 15.0, 10.0, 9.0, 4.0, 2.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.54296875, -2.46331787109375, -2.3836669921875, -2.30401611328125, -2.224365234375, -2.14471435546875, -2.0650634765625, -1.98541259765625, -1.90576171875, -1.82611083984375, -1.7464599609375, -1.66680908203125, -1.587158203125, -1.50750732421875, -1.4278564453125, -1.34820556640625, -1.2685546875, -1.18890380859375, -1.1092529296875, -1.02960205078125, -0.949951171875, -0.87030029296875, -0.7906494140625, -0.71099853515625, -0.63134765625, -0.55169677734375, -0.4720458984375, -0.39239501953125, -0.312744140625, -0.23309326171875, -0.1534423828125, -0.07379150390625, 0.005859375, 0.08551025390625, 0.1651611328125, 0.24481201171875, 0.324462890625, 0.40411376953125, 0.4837646484375, 0.56341552734375, 0.64306640625, 0.72271728515625, 0.8023681640625, 0.88201904296875, 0.961669921875, 1.04132080078125, 1.1209716796875, 1.20062255859375, 1.2802734375, 1.35992431640625, 1.4395751953125, 1.51922607421875, 1.598876953125, 1.67852783203125, 1.7581787109375, 1.83782958984375, 1.91748046875, 1.99713134765625, 2.0767822265625, 2.15643310546875, 2.236083984375, 2.31573486328125, 2.3953857421875, 2.47503662109375, 2.5546875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 9.0, 5.0, 8.0, 14.0, 13.0, 19.0, 13.0, 26.0, 35.0, 39.0, 46.0, 37.0, 62.0, 52.0, 59.0, 66.0, 62.0, 56.0, 59.0, 52.0, 50.0, 27.0, 35.0, 27.0, 19.0, 20.0, 15.0, 15.0, 11.0, 14.0, 11.0, 4.0, 3.0, 3.0, 3.0, 5.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.1875, -4.071258544921875, -3.95501708984375, -3.838775634765625, -3.7225341796875, -3.606292724609375, -3.49005126953125, -3.373809814453125, -3.257568359375, -3.141326904296875, -3.02508544921875, -2.908843994140625, -2.7926025390625, -2.676361083984375, -2.56011962890625, -2.443878173828125, -2.32763671875, -2.211395263671875, -2.09515380859375, -1.978912353515625, -1.8626708984375, -1.746429443359375, -1.63018798828125, -1.513946533203125, -1.397705078125, -1.281463623046875, -1.16522216796875, -1.048980712890625, -0.9327392578125, -0.816497802734375, -0.70025634765625, -0.584014892578125, -0.4677734375, -0.351531982421875, -0.23529052734375, -0.119049072265625, -0.0028076171875, 0.113433837890625, 0.22967529296875, 0.345916748046875, 0.462158203125, 0.578399658203125, 0.69464111328125, 0.810882568359375, 0.9271240234375, 1.043365478515625, 1.15960693359375, 1.275848388671875, 1.39208984375, 1.508331298828125, 1.62457275390625, 1.740814208984375, 1.8570556640625, 1.973297119140625, 2.08953857421875, 2.205780029296875, 2.322021484375, 2.438262939453125, 2.55450439453125, 2.670745849609375, 2.7869873046875, 2.903228759765625, 3.01947021484375, 3.135711669921875, 3.251953125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 9.0, 13.0, 9.0, 10.0, 23.0, 31.0, 42.0, 68.0, 78.0, 127.0, 222.0, 357.0, 564.0, 1002.0, 1929.0, 3977.0, 8952.0, 22583.0, 62492.0, 182952.0, 512621.0, 160211.0, 54695.0, 19602.0, 8070.0, 3629.0, 1831.0, 988.0, 548.0, 330.0, 209.0, 120.0, 81.0, 66.0, 39.0, 23.0, 21.0, 11.0, 9.0, 5.0, 3.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.591796875, -0.5750961303710938, -0.5583953857421875, -0.5416946411132812, -0.524993896484375, -0.5082931518554688, -0.4915924072265625, -0.47489166259765625, -0.45819091796875, -0.44149017333984375, -0.4247894287109375, -0.40808868408203125, -0.391387939453125, -0.37468719482421875, -0.3579864501953125, -0.34128570556640625, -0.3245849609375, -0.30788421630859375, -0.2911834716796875, -0.27448272705078125, -0.257781982421875, -0.24108123779296875, -0.2243804931640625, -0.20767974853515625, -0.19097900390625, -0.17427825927734375, -0.1575775146484375, -0.14087677001953125, -0.124176025390625, -0.10747528076171875, -0.0907745361328125, -0.07407379150390625, -0.057373046875, -0.04067230224609375, -0.0239715576171875, -0.00727081298828125, 0.009429931640625, 0.02613067626953125, 0.0428314208984375, 0.05953216552734375, 0.07623291015625, 0.09293365478515625, 0.1096343994140625, 0.12633514404296875, 0.143035888671875, 0.15973663330078125, 0.1764373779296875, 0.19313812255859375, 0.2098388671875, 0.22653961181640625, 0.2432403564453125, 0.25994110107421875, 0.276641845703125, 0.29334259033203125, 0.3100433349609375, 0.32674407958984375, 0.34344482421875, 0.36014556884765625, 0.3768463134765625, 0.39354705810546875, 0.410247802734375, 0.42694854736328125, 0.4436492919921875, 0.46035003662109375, 0.47705078125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 0.0, 4.0, 5.0, 11.0, 13.0, 16.0, 42.0, 47.0, 74.0, 126.0, 151.0, 151.0, 120.0, 90.0, 54.0, 35.0, 25.0, 14.0, 6.0, 1.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0003600120544433594, -0.000347677618265152, -0.0003353431820869446, -0.0003230087459087372, -0.0003106743097305298, -0.0002983398735523224, -0.000286005437374115, -0.0002736710011959076, -0.0002613365650177002, -0.0002490021288394928, -0.0002366676926612854, -0.000224333256483078, -0.0002119988203048706, -0.0001996643841266632, -0.0001873299479484558, -0.0001749955117702484, -0.00016266107559204102, -0.00015032663941383362, -0.00013799220323562622, -0.00012565776705741882, -0.00011332333087921143, -0.00010098889470100403, -8.865445852279663e-05, -7.632002234458923e-05, -6.398558616638184e-05, -5.165114998817444e-05, -3.931671380996704e-05, -2.6982277631759644e-05, -1.4647841453552246e-05, -2.3134052753448486e-06, 1.0021030902862549e-05, 2.2355467081069946e-05, 3.4689903259277344e-05, 4.702433943748474e-05, 5.935877561569214e-05, 7.169321179389954e-05, 8.402764797210693e-05, 9.636208415031433e-05, 0.00010869652032852173, 0.00012103095650672913, 0.00013336539268493652, 0.00014569982886314392, 0.00015803426504135132, 0.00017036870121955872, 0.0001827031373977661, 0.0001950375735759735, 0.0002073720097541809, 0.0002197064459323883, 0.0002320408821105957, 0.0002443753182888031, 0.0002567097544670105, 0.0002690441906452179, 0.0002813786268234253, 0.0002937130630016327, 0.0003060474991798401, 0.0003183819353580475, 0.0003307163715362549, 0.0003430508077144623, 0.0003553852438926697, 0.0003677196800708771, 0.00038005411624908447, 0.00039238855242729187, 0.00040472298860549927, 0.00041705742478370667, 0.00042939186096191406]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 5.0, 3.0, 8.0, 9.0, 16.0, 18.0, 31.0, 50.0, 88.0, 174.0, 361.0, 825.0, 2405.0, 8167.0, 37374.0, 219302.0, 642154.0, 109940.0, 19962.0, 4943.0, 1548.0, 571.0, 245.0, 143.0, 78.0, 39.0, 28.0, 26.0, 17.0, 13.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0166015625, -0.9886016845703125, -0.960601806640625, -0.9326019287109375, -0.90460205078125, -0.8766021728515625, -0.848602294921875, -0.8206024169921875, -0.7926025390625, -0.7646026611328125, -0.736602783203125, -0.7086029052734375, -0.68060302734375, -0.6526031494140625, -0.624603271484375, -0.5966033935546875, -0.568603515625, -0.5406036376953125, -0.512603759765625, -0.4846038818359375, -0.45660400390625, -0.4286041259765625, -0.400604248046875, -0.3726043701171875, -0.3446044921875, -0.3166046142578125, -0.288604736328125, -0.2606048583984375, -0.23260498046875, -0.2046051025390625, -0.176605224609375, -0.1486053466796875, -0.12060546875, -0.0926055908203125, -0.064605712890625, -0.0366058349609375, -0.00860595703125, 0.0193939208984375, 0.047393798828125, 0.0753936767578125, 0.1033935546875, 0.1313934326171875, 0.159393310546875, 0.1873931884765625, 0.21539306640625, 0.2433929443359375, 0.271392822265625, 0.2993927001953125, 0.327392578125, 0.3553924560546875, 0.383392333984375, 0.4113922119140625, 0.43939208984375, 0.4673919677734375, 0.495391845703125, 0.5233917236328125, 0.5513916015625, 0.5793914794921875, 0.607391357421875, 0.6353912353515625, 0.66339111328125, 0.6913909912109375, 0.719390869140625, 0.7473907470703125, 0.775390625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 8.0, 3.0, 7.0, 12.0, 7.0, 21.0, 13.0, 23.0, 31.0, 35.0, 51.0, 48.0, 83.0, 66.0, 81.0, 71.0, 71.0, 55.0, 56.0, 46.0, 48.0, 38.0, 34.0, 25.0, 19.0, 11.0, 11.0, 6.0, 8.0, 5.0, 3.0, 5.0, 2.0, 0.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.83837890625, -0.8147430419921875, -0.791107177734375, -0.7674713134765625, -0.74383544921875, -0.7201995849609375, -0.696563720703125, -0.6729278564453125, -0.6492919921875, -0.6256561279296875, -0.602020263671875, -0.5783843994140625, -0.55474853515625, -0.5311126708984375, -0.507476806640625, -0.4838409423828125, -0.460205078125, -0.4365692138671875, -0.412933349609375, -0.3892974853515625, -0.36566162109375, -0.3420257568359375, -0.318389892578125, -0.2947540283203125, -0.2711181640625, -0.2474822998046875, -0.223846435546875, -0.2002105712890625, -0.17657470703125, -0.1529388427734375, -0.129302978515625, -0.1056671142578125, -0.08203125, -0.0583953857421875, -0.034759521484375, -0.0111236572265625, 0.01251220703125, 0.0361480712890625, 0.059783935546875, 0.0834197998046875, 0.1070556640625, 0.1306915283203125, 0.154327392578125, 0.1779632568359375, 0.20159912109375, 0.2252349853515625, 0.248870849609375, 0.2725067138671875, 0.296142578125, 0.3197784423828125, 0.343414306640625, 0.3670501708984375, 0.39068603515625, 0.4143218994140625, 0.437957763671875, 0.4615936279296875, 0.4852294921875, 0.5088653564453125, 0.532501220703125, 0.5561370849609375, 0.57977294921875, 0.6034088134765625, 0.627044677734375, 0.6506805419921875, 0.67431640625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 3.0, 5.0, 10.0, 19.0, 20.0, 38.0, 55.0, 86.0, 129.0, 216.0, 124.0, 100.0, 68.0, 37.0, 22.0, 14.0, 15.0, 10.0, 6.0, 6.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-15.267129898071289, -14.783132553100586, -14.2991361618042, -13.815138816833496, -13.33114242553711, -12.847145080566406, -12.363147735595703, -11.879151344299316, -11.39515495300293, -10.911157608032227, -10.42716121673584, -9.943163871765137, -9.45916748046875, -8.975170135498047, -8.491172790527344, -8.007176399230957, -7.523179054260254, -7.039182186126709, -6.555185317993164, -6.071187973022461, -5.587191581726074, -5.103194236755371, -4.619197368621826, -4.135200500488281, -3.6512036323547363, -3.1672067642211914, -2.6832098960876465, -2.1992127895355225, -1.7152159214019775, -1.2312190532684326, -0.7472219467163086, -0.26322507858276367, 0.22077178955078125, 0.704768717288971, 1.1887656450271606, 1.6727626323699951, 2.15675950050354, 2.640756368637085, 3.124753475189209, 3.608750343322754, 4.092747211456299, 4.576744079589844, 5.060740947723389, 5.544737815856934, 6.028735160827637, 6.512731552124023, 6.996728897094727, 7.4807257652282715, 7.964722633361816, 8.44871997833252, 8.932716369628906, 9.41671371459961, 9.900710105895996, 10.3847074508667, 10.868703842163086, 11.352701187133789, 11.836698532104492, 12.320695877075195, 12.804692268371582, 13.288689613342285, 13.772686004638672, 14.256683349609375, 14.740680694580078, 15.224677085876465, 15.708673477172852]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 5.0, 6.0, 12.0, 8.0, 9.0, 12.0, 17.0, 16.0, 15.0, 19.0, 29.0, 26.0, 41.0, 53.0, 48.0, 65.0, 91.0, 91.0, 79.0, 56.0, 31.0, 43.0, 40.0, 25.0, 32.0, 28.0, 19.0, 11.0, 18.0, 12.0, 15.0, 8.0, 7.0, 4.0, 5.0, 5.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.069927215576172, -14.602636337280273, -14.135345458984375, -13.668054580688477, -13.200763702392578, -12.73347282409668, -12.266181945800781, -11.7988920211792, -11.3316011428833, -10.864310264587402, -10.397019386291504, -9.929728507995605, -9.462437629699707, -8.995147705078125, -8.527856826782227, -8.060565948486328, -7.5932745933532715, -7.125983715057373, -6.658692836761475, -6.191402435302734, -5.724111557006836, -5.2568206787109375, -4.789529800415039, -4.322238922119141, -3.8549482822418213, -3.387657403945923, -2.9203667640686035, -2.453075885772705, -1.9857851266860962, -1.5184943675994873, -1.0512034893035889, -0.5839128494262695, -0.1166219711303711, 0.3506688177585602, 0.8179596066474915, 1.2852504253387451, 1.752541184425354, 2.219831943511963, 2.6871228218078613, 3.1544134616851807, 3.621704339981079, 4.088994979858398, 4.556285858154297, 5.023576736450195, 5.490867614746094, 5.958158493041992, 6.425449371337891, 6.892739772796631, 7.360030651092529, 7.827321529388428, 8.294611930847168, 8.761902809143066, 9.229193687438965, 9.696484565734863, 10.163775444030762, 10.63106632232666, 11.098357200622559, 11.565648078918457, 12.032938957214355, 12.500229835510254, 12.967520713806152, 13.434810638427734, 13.902101516723633, 14.369392395019531, 14.83668327331543]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 5.0, 3.0, 2.0, 4.0, 11.0, 7.0, 15.0, 14.0, 28.0, 42.0, 61.0, 78.0, 143.0, 223.0, 348.0, 602.0, 1115.0, 2324.0, 4762.0, 11598.0, 32795.0, 116644.0, 467103.0, 1492373.0, 1454243.0, 448417.0, 110703.0, 30575.0, 10702.0, 4589.0, 2142.0, 1051.0, 593.0, 363.0, 220.0, 135.0, 74.0, 59.0, 39.0, 28.0, 17.0, 10.0, 7.0, 11.0, 5.0, 5.0, 0.0, 0.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.68408203125, -0.6577529907226562, -0.6314239501953125, -0.6050949096679688, -0.578765869140625, -0.5524368286132812, -0.5261077880859375, -0.49977874755859375, -0.47344970703125, -0.44712066650390625, -0.4207916259765625, -0.39446258544921875, -0.368133544921875, -0.34180450439453125, -0.3154754638671875, -0.28914642333984375, -0.2628173828125, -0.23648834228515625, -0.2101593017578125, -0.18383026123046875, -0.157501220703125, -0.13117218017578125, -0.1048431396484375, -0.07851409912109375, -0.05218505859375, -0.02585601806640625, 0.0004730224609375, 0.02680206298828125, 0.053131103515625, 0.07946014404296875, 0.1057891845703125, 0.13211822509765625, 0.158447265625, 0.18477630615234375, 0.2111053466796875, 0.23743438720703125, 0.263763427734375, 0.29009246826171875, 0.3164215087890625, 0.34275054931640625, 0.36907958984375, 0.39540863037109375, 0.4217376708984375, 0.44806671142578125, 0.474395751953125, 0.5007247924804688, 0.5270538330078125, 0.5533828735351562, 0.5797119140625, 0.6060409545898438, 0.6323699951171875, 0.6586990356445312, 0.685028076171875, 0.7113571166992188, 0.7376861572265625, 0.7640151977539062, 0.79034423828125, 0.8166732788085938, 0.8430023193359375, 0.8693313598632812, 0.895660400390625, 0.9219894409179688, 0.9483184814453125, 0.9746475219726562, 1.0009765625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 5.0, 4.0, 3.0, 5.0, 8.0, 9.0, 8.0, 8.0, 9.0, 15.0, 18.0, 24.0, 27.0, 31.0, 26.0, 34.0, 27.0, 31.0, 29.0, 38.0, 37.0, 39.0, 49.0, 47.0, 43.0, 34.0, 43.0, 50.0, 35.0, 33.0, 26.0, 32.0, 21.0, 24.0, 29.0, 18.0, 13.0, 11.0, 6.0, 12.0, 9.0, 11.0, 4.0, 5.0, 8.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.73193359375, -0.70849609375, -0.68505859375, -0.66162109375, -0.63818359375, -0.61474609375, -0.59130859375, -0.56787109375, -0.54443359375, -0.52099609375, -0.49755859375, -0.47412109375, -0.45068359375, -0.42724609375, -0.40380859375, -0.38037109375, -0.35693359375, -0.33349609375, -0.31005859375, -0.28662109375, -0.26318359375, -0.23974609375, -0.21630859375, -0.19287109375, -0.16943359375, -0.14599609375, -0.12255859375, -0.09912109375, -0.07568359375, -0.05224609375, -0.02880859375, -0.00537109375, 0.01806640625, 0.04150390625, 0.06494140625, 0.08837890625, 0.11181640625, 0.13525390625, 0.15869140625, 0.18212890625, 0.20556640625, 0.22900390625, 0.25244140625, 0.27587890625, 0.29931640625, 0.32275390625, 0.34619140625, 0.36962890625, 0.39306640625, 0.41650390625, 0.43994140625, 0.46337890625, 0.48681640625, 0.51025390625, 0.53369140625, 0.55712890625, 0.58056640625, 0.60400390625, 0.62744140625, 0.65087890625, 0.67431640625, 0.69775390625, 0.72119140625, 0.74462890625, 0.76806640625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 6.0, 3.0, 4.0, 16.0, 20.0, 40.0, 93.0, 164.0, 382.0, 1391.0, 13601.0, 1830684.0, 2330377.0, 15383.0, 1437.0, 356.0, 161.0, 98.0, 41.0, 17.0, 13.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.318359375, -3.180206298828125, -3.04205322265625, -2.903900146484375, -2.7657470703125, -2.627593994140625, -2.48944091796875, -2.351287841796875, -2.213134765625, -2.074981689453125, -1.93682861328125, -1.798675537109375, -1.6605224609375, -1.522369384765625, -1.38421630859375, -1.246063232421875, -1.10791015625, -0.969757080078125, -0.83160400390625, -0.693450927734375, -0.5552978515625, -0.417144775390625, -0.27899169921875, -0.140838623046875, -0.002685546875, 0.135467529296875, 0.27362060546875, 0.411773681640625, 0.5499267578125, 0.688079833984375, 0.82623291015625, 0.964385986328125, 1.1025390625, 1.240692138671875, 1.37884521484375, 1.516998291015625, 1.6551513671875, 1.793304443359375, 1.93145751953125, 2.069610595703125, 2.207763671875, 2.345916748046875, 2.48406982421875, 2.622222900390625, 2.7603759765625, 2.898529052734375, 3.03668212890625, 3.174835205078125, 3.31298828125, 3.451141357421875, 3.58929443359375, 3.727447509765625, 3.8656005859375, 4.003753662109375, 4.14190673828125, 4.280059814453125, 4.418212890625, 4.556365966796875, 4.69451904296875, 4.832672119140625, 4.9708251953125, 5.108978271484375, 5.24713134765625, 5.385284423828125, 5.5234375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 4.0, 7.0, 14.0, 19.0, 38.0, 44.0, 70.0, 161.0, 244.0, 478.0, 777.0, 849.0, 595.0, 355.0, 156.0, 76.0, 73.0, 50.0, 26.0, 10.0, 7.0, 13.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0], "bins": [-4.01171875, -3.926544189453125, -3.84136962890625, -3.756195068359375, -3.6710205078125, -3.585845947265625, -3.50067138671875, -3.415496826171875, -3.330322265625, -3.245147705078125, -3.15997314453125, -3.074798583984375, -2.9896240234375, -2.904449462890625, -2.81927490234375, -2.734100341796875, -2.64892578125, -2.563751220703125, -2.47857666015625, -2.393402099609375, -2.3082275390625, -2.223052978515625, -2.13787841796875, -2.052703857421875, -1.967529296875, -1.882354736328125, -1.79718017578125, -1.712005615234375, -1.6268310546875, -1.541656494140625, -1.45648193359375, -1.371307373046875, -1.2861328125, -1.200958251953125, -1.11578369140625, -1.030609130859375, -0.9454345703125, -0.860260009765625, -0.77508544921875, -0.689910888671875, -0.604736328125, -0.519561767578125, -0.43438720703125, -0.349212646484375, -0.2640380859375, -0.178863525390625, -0.09368896484375, -0.008514404296875, 0.07666015625, 0.161834716796875, 0.24700927734375, 0.332183837890625, 0.4173583984375, 0.502532958984375, 0.58770751953125, 0.672882080078125, 0.758056640625, 0.843231201171875, 0.92840576171875, 1.013580322265625, 1.0987548828125, 1.183929443359375, 1.26910400390625, 1.354278564453125, 1.439453125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 9.0, 14.0, 37.0, 72.0, 208.0, 290.0, 195.0, 106.0, 40.0, 14.0, 8.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.456514358520508, -23.56256675720215, -22.668621063232422, -21.774673461914062, -20.880725860595703, -19.986778259277344, -19.092830657958984, -18.198884963989258, -17.3049373626709, -16.41098976135254, -15.517043113708496, -14.623096466064453, -13.729148864746094, -12.835201263427734, -11.941254615783691, -11.047307968139648, -10.153360366821289, -9.25941276550293, -8.365466117858887, -7.4715189933776855, -6.577571868896484, -5.683624744415283, -4.789677619934082, -3.895730495452881, -3.0017833709716797, -2.1078362464904785, -1.2138891220092773, -0.31994199752807617, 0.574005126953125, 1.4679522514343262, 2.3618993759155273, 3.2558465003967285, 4.149791717529297, 5.043738842010498, 5.937685966491699, 6.8316330909729, 7.725580215454102, 8.619527816772461, 9.513474464416504, 10.407421112060547, 11.301368713378906, 12.195316314697266, 13.089262962341309, 13.983209609985352, 14.877157211303711, 15.77110481262207, 16.665050506591797, 17.558998107910156, 18.452945709228516, 19.346893310546875, 20.240840911865234, 21.13478660583496, 22.02873420715332, 22.92268180847168, 23.816627502441406, 24.710575103759766, 25.604522705078125, 26.498470306396484, 27.392417907714844, 28.28636360168457, 29.18031120300293, 30.07425880432129, 30.968204498291016, 31.862152099609375, 32.756099700927734]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 4.0, 7.0, 4.0, 9.0, 14.0, 11.0, 10.0, 13.0, 17.0, 28.0, 24.0, 15.0, 28.0, 29.0, 24.0, 24.0, 57.0, 47.0, 37.0, 32.0, 43.0, 42.0, 42.0, 43.0, 42.0, 36.0, 46.0, 43.0, 31.0, 28.0, 32.0, 29.0, 25.0, 15.0, 11.0, 5.0, 17.0, 16.0, 6.0, 7.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.94741678237915, -7.677839279174805, -7.408262252807617, -7.1386847496032715, -6.869107246398926, -6.599530220031738, -6.329952716827393, -6.060375213623047, -5.790798187255859, -5.521220684051514, -5.251643657684326, -4.9820661544799805, -4.712488651275635, -4.442911148071289, -4.173334121704102, -3.903756618499756, -3.63417911529541, -3.3646018505096436, -3.095024347305298, -2.8254470825195312, -2.5558695793151855, -2.286292314529419, -2.0167150497436523, -1.7471376657485962, -1.47756028175354, -1.2079828977584839, -0.9384055733680725, -0.6688282489776611, -0.399250864982605, -0.12967348098754883, 0.13990378379821777, 0.4094811677932739, 0.6790590286254883, 0.9486364126205444, 1.2182137966156006, 1.4877910614013672, 1.7573684453964233, 2.0269458293914795, 2.296523094177246, 2.566100597381592, 2.8356778621673584, 3.105255126953125, 3.3748326301574707, 3.6444098949432373, 3.913987159729004, 4.18356466293335, 4.453142166137695, 4.722719192504883, 4.9922966957092285, 5.261874198913574, 5.531451225280762, 5.801028728485107, 6.070606231689453, 6.340183258056641, 6.609760761260986, 6.879338264465332, 7.1489152908325195, 7.418492794036865, 7.688069820404053, 7.957647323608398, 8.227224349975586, 8.49680233001709, 8.766379356384277, 9.035956382751465, 9.305534362792969]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 0.0, 4.0, 1.0, 13.0, 5.0, 18.0, 18.0, 35.0, 77.0, 103.0, 177.0, 266.0, 459.0, 835.0, 1529.0, 2833.0, 5593.0, 11086.0, 23603.0, 49528.0, 105862.0, 214314.0, 282944.0, 182519.0, 87214.0, 40688.0, 19363.0, 9294.0, 4708.0, 2316.0, 1331.0, 735.0, 456.0, 248.0, 131.0, 80.0, 61.0, 43.0, 29.0, 21.0, 5.0, 9.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2978515625, -1.2621688842773438, -1.2264862060546875, -1.1908035278320312, -1.155120849609375, -1.1194381713867188, -1.0837554931640625, -1.0480728149414062, -1.01239013671875, -0.9767074584960938, -0.9410247802734375, -0.9053421020507812, -0.869659423828125, -0.8339767456054688, -0.7982940673828125, -0.7626113891601562, -0.7269287109375, -0.6912460327148438, -0.6555633544921875, -0.6198806762695312, -0.584197998046875, -0.5485153198242188, -0.5128326416015625, -0.47714996337890625, -0.44146728515625, -0.40578460693359375, -0.3701019287109375, -0.33441925048828125, -0.298736572265625, -0.26305389404296875, -0.2273712158203125, -0.19168853759765625, -0.156005859375, -0.12032318115234375, -0.0846405029296875, -0.04895782470703125, -0.013275146484375, 0.02240753173828125, 0.0580902099609375, 0.09377288818359375, 0.12945556640625, 0.16513824462890625, 0.2008209228515625, 0.23650360107421875, 0.272186279296875, 0.30786895751953125, 0.3435516357421875, 0.37923431396484375, 0.4149169921875, 0.45059967041015625, 0.4862823486328125, 0.5219650268554688, 0.557647705078125, 0.5933303833007812, 0.6290130615234375, 0.6646957397460938, 0.70037841796875, 0.7360610961914062, 0.7717437744140625, 0.8074264526367188, 0.843109130859375, 0.8787918090820312, 0.9144744873046875, 0.9501571655273438, 0.98583984375]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 6.0, 3.0, 1.0, 8.0, 2.0, 8.0, 6.0, 10.0, 5.0, 12.0, 15.0, 26.0, 18.0, 23.0, 25.0, 20.0, 35.0, 29.0, 32.0, 38.0, 44.0, 40.0, 42.0, 55.0, 47.0, 46.0, 52.0, 45.0, 28.0, 34.0, 46.0, 35.0, 29.0, 21.0, 21.0, 19.0, 20.0, 13.0, 9.0, 7.0, 7.0, 8.0, 4.0, 4.0, 5.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.93017578125, -0.9033966064453125, -0.876617431640625, -0.8498382568359375, -0.82305908203125, -0.7962799072265625, -0.769500732421875, -0.7427215576171875, -0.7159423828125, -0.6891632080078125, -0.662384033203125, -0.6356048583984375, -0.60882568359375, -0.5820465087890625, -0.555267333984375, -0.5284881591796875, -0.501708984375, -0.4749298095703125, -0.448150634765625, -0.4213714599609375, -0.39459228515625, -0.3678131103515625, -0.341033935546875, -0.3142547607421875, -0.2874755859375, -0.2606964111328125, -0.233917236328125, -0.2071380615234375, -0.18035888671875, -0.1535797119140625, -0.126800537109375, -0.1000213623046875, -0.0732421875, -0.0464630126953125, -0.019683837890625, 0.0070953369140625, 0.03387451171875, 0.0606536865234375, 0.087432861328125, 0.1142120361328125, 0.1409912109375, 0.1677703857421875, 0.194549560546875, 0.2213287353515625, 0.24810791015625, 0.2748870849609375, 0.301666259765625, 0.3284454345703125, 0.355224609375, 0.3820037841796875, 0.408782958984375, 0.4355621337890625, 0.46234130859375, 0.4891204833984375, 0.515899658203125, 0.5426788330078125, 0.5694580078125, 0.5962371826171875, 0.623016357421875, 0.6497955322265625, 0.67657470703125, 0.7033538818359375, 0.730133056640625, 0.7569122314453125, 0.78369140625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 4.0, 5.0, 3.0, 6.0, 5.0, 12.0, 15.0, 15.0, 18.0, 36.0, 45.0, 67.0, 83.0, 150.0, 210.0, 280.0, 439.0, 761.0, 1656.0, 4188.0, 14431.0, 66892.0, 545313.0, 335038.0, 58200.0, 13224.0, 3775.0, 1484.0, 742.0, 477.0, 320.0, 193.0, 126.0, 81.0, 83.0, 45.0, 44.0, 23.0, 19.0, 9.0, 12.0, 7.0, 1.0, 5.0, 4.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.150390625, -2.076141357421875, -2.00189208984375, -1.927642822265625, -1.8533935546875, -1.779144287109375, -1.70489501953125, -1.630645751953125, -1.556396484375, -1.482147216796875, -1.40789794921875, -1.333648681640625, -1.2593994140625, -1.185150146484375, -1.11090087890625, -1.036651611328125, -0.96240234375, -0.888153076171875, -0.81390380859375, -0.739654541015625, -0.6654052734375, -0.591156005859375, -0.51690673828125, -0.442657470703125, -0.368408203125, -0.294158935546875, -0.21990966796875, -0.145660400390625, -0.0714111328125, 0.002838134765625, 0.07708740234375, 0.151336669921875, 0.2255859375, 0.299835205078125, 0.37408447265625, 0.448333740234375, 0.5225830078125, 0.596832275390625, 0.67108154296875, 0.745330810546875, 0.819580078125, 0.893829345703125, 0.96807861328125, 1.042327880859375, 1.1165771484375, 1.190826416015625, 1.26507568359375, 1.339324951171875, 1.41357421875, 1.487823486328125, 1.56207275390625, 1.636322021484375, 1.7105712890625, 1.784820556640625, 1.85906982421875, 1.933319091796875, 2.007568359375, 2.081817626953125, 2.15606689453125, 2.230316162109375, 2.3045654296875, 2.378814697265625, 2.45306396484375, 2.527313232421875, 2.6015625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 2.0, 3.0, 12.0, 8.0, 12.0, 12.0, 12.0, 12.0, 26.0, 26.0, 34.0, 36.0, 42.0, 50.0, 60.0, 63.0, 56.0, 66.0, 54.0, 56.0, 54.0, 51.0, 37.0, 38.0, 29.0, 26.0, 31.0, 20.0, 8.0, 16.0, 10.0, 9.0, 7.0, 2.0, 7.0, 8.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.603515625, -3.481658935546875, -3.35980224609375, -3.237945556640625, -3.1160888671875, -2.994232177734375, -2.87237548828125, -2.750518798828125, -2.628662109375, -2.506805419921875, -2.38494873046875, -2.263092041015625, -2.1412353515625, -2.019378662109375, -1.89752197265625, -1.775665283203125, -1.65380859375, -1.531951904296875, -1.41009521484375, -1.288238525390625, -1.1663818359375, -1.044525146484375, -0.92266845703125, -0.800811767578125, -0.678955078125, -0.557098388671875, -0.43524169921875, -0.313385009765625, -0.1915283203125, -0.069671630859375, 0.05218505859375, 0.174041748046875, 0.2958984375, 0.417755126953125, 0.53961181640625, 0.661468505859375, 0.7833251953125, 0.905181884765625, 1.02703857421875, 1.148895263671875, 1.270751953125, 1.392608642578125, 1.51446533203125, 1.636322021484375, 1.7581787109375, 1.880035400390625, 2.00189208984375, 2.123748779296875, 2.24560546875, 2.367462158203125, 2.48931884765625, 2.611175537109375, 2.7330322265625, 2.854888916015625, 2.97674560546875, 3.098602294921875, 3.220458984375, 3.342315673828125, 3.46417236328125, 3.586029052734375, 3.7078857421875, 3.829742431640625, 3.95159912109375, 4.073455810546875, 4.1953125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 0.0, 6.0, 5.0, 7.0, 10.0, 13.0, 17.0, 24.0, 36.0, 38.0, 82.0, 95.0, 163.0, 233.0, 402.0, 691.0, 1409.0, 2856.0, 6533.0, 16705.0, 47859.0, 171561.0, 615126.0, 123519.0, 37190.0, 13427.0, 5318.0, 2420.0, 1214.0, 622.0, 332.0, 209.0, 122.0, 107.0, 58.0, 45.0, 33.0, 19.0, 9.0, 9.0, 12.0, 8.0, 3.0, 4.0, 4.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.486328125, -0.47083282470703125, -0.4553375244140625, -0.43984222412109375, -0.424346923828125, -0.40885162353515625, -0.3933563232421875, -0.37786102294921875, -0.36236572265625, -0.34687042236328125, -0.3313751220703125, -0.31587982177734375, -0.300384521484375, -0.28488922119140625, -0.2693939208984375, -0.25389862060546875, -0.2384033203125, -0.22290802001953125, -0.2074127197265625, -0.19191741943359375, -0.176422119140625, -0.16092681884765625, -0.1454315185546875, -0.12993621826171875, -0.11444091796875, -0.09894561767578125, -0.0834503173828125, -0.06795501708984375, -0.052459716796875, -0.03696441650390625, -0.0214691162109375, -0.00597381591796875, 0.009521484375, 0.02501678466796875, 0.0405120849609375, 0.05600738525390625, 0.071502685546875, 0.08699798583984375, 0.1024932861328125, 0.11798858642578125, 0.13348388671875, 0.14897918701171875, 0.1644744873046875, 0.17996978759765625, 0.195465087890625, 0.21096038818359375, 0.2264556884765625, 0.24195098876953125, 0.2574462890625, 0.27294158935546875, 0.2884368896484375, 0.30393218994140625, 0.319427490234375, 0.33492279052734375, 0.3504180908203125, 0.36591339111328125, 0.38140869140625, 0.39690399169921875, 0.4123992919921875, 0.42789459228515625, 0.443389892578125, 0.45888519287109375, 0.4743804931640625, 0.48987579345703125, 0.50537109375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 6.0, 6.0, 8.0, 19.0, 15.0, 16.0, 12.0, 24.0, 31.0, 39.0, 41.0, 58.0, 90.0, 92.0, 97.0, 74.0, 73.0, 57.0, 47.0, 30.0, 29.0, 25.0, 24.0, 19.0, 7.0, 16.0, 7.0, 5.0, 8.0, 4.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.0001785755157470703, -0.00017306208610534668, -0.00016754865646362305, -0.00016203522682189941, -0.00015652179718017578, -0.00015100836753845215, -0.00014549493789672852, -0.00013998150825500488, -0.00013446807861328125, -0.00012895464897155762, -0.00012344121932983398, -0.00011792778968811035, -0.00011241436004638672, -0.00010690093040466309, -0.00010138750076293945, -9.587407112121582e-05, -9.036064147949219e-05, -8.484721183776855e-05, -7.933378219604492e-05, -7.382035255432129e-05, -6.830692291259766e-05, -6.279349327087402e-05, -5.728006362915039e-05, -5.176663398742676e-05, -4.6253204345703125e-05, -4.073977470397949e-05, -3.522634506225586e-05, -2.9712915420532227e-05, -2.4199485778808594e-05, -1.868605613708496e-05, -1.3172626495361328e-05, -7.659196853637695e-06, -2.1457672119140625e-06, 3.3676624298095703e-06, 8.881092071533203e-06, 1.4394521713256836e-05, 1.990795135498047e-05, 2.54213809967041e-05, 3.0934810638427734e-05, 3.644824028015137e-05, 4.1961669921875e-05, 4.747509956359863e-05, 5.2988529205322266e-05, 5.85019588470459e-05, 6.401538848876953e-05, 6.952881813049316e-05, 7.50422477722168e-05, 8.055567741394043e-05, 8.606910705566406e-05, 9.15825366973877e-05, 9.709596633911133e-05, 0.00010260939598083496, 0.0001081228256225586, 0.00011363625526428223, 0.00011914968490600586, 0.0001246631145477295, 0.00013017654418945312, 0.00013568997383117676, 0.0001412034034729004, 0.00014671683311462402, 0.00015223026275634766, 0.0001577436923980713, 0.00016325712203979492, 0.00016877055168151855, 0.0001742839813232422]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 6.0, 7.0, 7.0, 4.0, 7.0, 5.0, 25.0, 23.0, 31.0, 67.0, 142.0, 211.0, 370.0, 728.0, 1661.0, 4783.0, 18186.0, 90932.0, 690608.0, 194396.0, 33553.0, 8075.0, 2640.0, 1021.0, 442.0, 242.0, 146.0, 77.0, 54.0, 31.0, 26.0, 11.0, 15.0, 12.0, 11.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.70263671875, -0.6804733276367188, -0.6583099365234375, -0.6361465454101562, -0.613983154296875, -0.5918197631835938, -0.5696563720703125, -0.5474929809570312, -0.52532958984375, -0.5031661987304688, -0.4810028076171875, -0.45883941650390625, -0.436676025390625, -0.41451263427734375, -0.3923492431640625, -0.37018585205078125, -0.3480224609375, -0.32585906982421875, -0.3036956787109375, -0.28153228759765625, -0.259368896484375, -0.23720550537109375, -0.2150421142578125, -0.19287872314453125, -0.17071533203125, -0.14855194091796875, -0.1263885498046875, -0.10422515869140625, -0.082061767578125, -0.05989837646484375, -0.0377349853515625, -0.01557159423828125, 0.006591796875, 0.02875518798828125, 0.0509185791015625, 0.07308197021484375, 0.095245361328125, 0.11740875244140625, 0.1395721435546875, 0.16173553466796875, 0.18389892578125, 0.20606231689453125, 0.2282257080078125, 0.25038909912109375, 0.272552490234375, 0.29471588134765625, 0.3168792724609375, 0.33904266357421875, 0.3612060546875, 0.38336944580078125, 0.4055328369140625, 0.42769622802734375, 0.449859619140625, 0.47202301025390625, 0.4941864013671875, 0.5163497924804688, 0.53851318359375, 0.5606765747070312, 0.5828399658203125, 0.6050033569335938, 0.627166748046875, 0.6493301391601562, 0.6714935302734375, 0.6936569213867188, 0.7158203125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 6.0, 10.0, 13.0, 14.0, 19.0, 26.0, 30.0, 48.0, 60.0, 86.0, 102.0, 110.0, 119.0, 96.0, 85.0, 46.0, 34.0, 38.0, 19.0, 10.0, 10.0, 14.0, 8.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62744140625, -0.5998458862304688, -0.5722503662109375, -0.5446548461914062, -0.517059326171875, -0.48946380615234375, -0.4618682861328125, -0.43427276611328125, -0.40667724609375, -0.37908172607421875, -0.3514862060546875, -0.32389068603515625, -0.296295166015625, -0.26869964599609375, -0.2411041259765625, -0.21350860595703125, -0.1859130859375, -0.15831756591796875, -0.1307220458984375, -0.10312652587890625, -0.075531005859375, -0.04793548583984375, -0.0203399658203125, 0.00725555419921875, 0.03485107421875, 0.06244659423828125, 0.0900421142578125, 0.11763763427734375, 0.145233154296875, 0.17282867431640625, 0.2004241943359375, 0.22801971435546875, 0.255615234375, 0.28321075439453125, 0.3108062744140625, 0.33840179443359375, 0.365997314453125, 0.39359283447265625, 0.4211883544921875, 0.44878387451171875, 0.47637939453125, 0.5039749145507812, 0.5315704345703125, 0.5591659545898438, 0.586761474609375, 0.6143569946289062, 0.6419525146484375, 0.6695480346679688, 0.6971435546875, 0.7247390747070312, 0.7523345947265625, 0.7799301147460938, 0.807525634765625, 0.8351211547851562, 0.8627166748046875, 0.8903121948242188, 0.91790771484375, 0.9455032348632812, 0.9730987548828125, 1.0006942749023438, 1.028289794921875, 1.0558853149414062, 1.0834808349609375, 1.1110763549804688, 1.138671875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 6.0, 9.0, 13.0, 22.0, 50.0, 83.0, 179.0, 282.0, 127.0, 93.0, 50.0, 32.0, 27.0, 8.0, 8.0, 5.0, 2.0, 2.0, 3.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.155160903930664, -19.598899841308594, -19.04263687133789, -18.48637580871582, -17.930112838745117, -17.373851776123047, -16.817588806152344, -16.261327743530273, -15.70506477355957, -15.148802757263184, -14.592540740966797, -14.03627872467041, -13.480016708374023, -12.923754692077637, -12.36749267578125, -11.81123161315918, -11.254969596862793, -10.698707580566406, -10.14244556427002, -9.586183547973633, -9.029921531677246, -8.47365951538086, -7.917397975921631, -7.361135959625244, -6.804873943328857, -6.248611927032471, -5.692349910736084, -5.1360883712768555, -4.579826354980469, -4.023564338684082, -3.4673023223876953, -2.9110403060913086, -2.3547773361206055, -1.7985153198242188, -1.2422534227371216, -0.6859915256500244, -0.1297295093536377, 0.426532506942749, 0.9827942848205566, 1.5390563011169434, 2.09531831741333, 2.651580333709717, 3.2078423500061035, 3.764104127883911, 4.320365905761719, 4.8766279220581055, 5.432889938354492, 5.989151954650879, 6.545413970947266, 7.101675987243652, 7.657938003540039, 8.214200019836426, 8.770462036132812, 9.3267240524292, 9.882986068725586, 10.439247131347656, 10.99551010131836, 11.551772117614746, 12.108034133911133, 12.66429615020752, 13.220558166503906, 13.776820182800293, 14.33308219909668, 14.88934326171875, 15.445605278015137]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 2.0, 1.0, 4.0, 3.0, 1.0, 4.0, 6.0, 6.0, 6.0, 8.0, 16.0, 12.0, 14.0, 21.0, 18.0, 30.0, 18.0, 17.0, 22.0, 27.0, 29.0, 41.0, 48.0, 67.0, 99.0, 77.0, 61.0, 42.0, 32.0, 37.0, 29.0, 22.0, 27.0, 20.0, 21.0, 23.0, 13.0, 17.0, 10.0, 10.0, 8.0, 4.0, 8.0, 4.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 3.0, 2.0, 0.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-9.744348526000977, -9.394092559814453, -9.04383659362793, -8.693581581115723, -8.3433256149292, -7.993069648742676, -7.642813682556152, -7.292558193206787, -6.942302703857422, -6.592046737670898, -6.241791248321533, -5.89153528213501, -5.5412797927856445, -5.191023826599121, -4.840767860412598, -4.490512371063232, -4.140256404876709, -3.7900006771087646, -3.4397449493408203, -3.089488983154297, -2.7392334938049316, -2.388977527618408, -2.038721799850464, -1.6884660720825195, -1.3382103443145752, -0.9879546165466309, -0.6376988291740417, -0.28744304180145264, 0.0628126859664917, 0.41306841373443604, 0.7633242607116699, 1.1135799884796143, 1.4638357162475586, 1.814091444015503, 2.1643471717834473, 2.5146031379699707, 2.864858627319336, 3.2151145935058594, 3.5653703212738037, 3.915626049041748, 4.265881538391113, 4.616137504577637, 4.966392993927002, 5.316648960113525, 5.666904449462891, 6.017160415649414, 6.3674163818359375, 6.717671871185303, 7.067927837371826, 7.41818380355835, 7.768439292907715, 8.118695259094238, 8.468951225280762, 8.819206237792969, 9.169462203979492, 9.519718170166016, 9.869974136352539, 10.220230102539062, 10.570486068725586, 10.920741081237793, 11.270997047424316, 11.62125301361084, 11.971508979797363, 12.32176399230957, 12.672019958496094]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 8.0, 14.0, 20.0, 20.0, 33.0, 51.0, 58.0, 93.0, 152.0, 254.0, 444.0, 760.0, 1389.0, 2724.0, 5713.0, 13580.0, 35936.0, 102796.0, 307497.0, 858521.0, 1485965.0, 888150.0, 319250.0, 106308.0, 38067.0, 14350.0, 5950.0, 2789.0, 1415.0, 796.0, 439.0, 230.0, 156.0, 111.0, 75.0, 59.0, 36.0, 16.0, 9.0, 18.0, 11.0, 2.0, 3.0, 4.0, 6.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.65380859375, -0.63238525390625, -0.6109619140625, -0.58953857421875, -0.568115234375, -0.54669189453125, -0.5252685546875, -0.50384521484375, -0.482421875, -0.46099853515625, -0.4395751953125, -0.41815185546875, -0.396728515625, -0.37530517578125, -0.3538818359375, -0.33245849609375, -0.31103515625, -0.28961181640625, -0.2681884765625, -0.24676513671875, -0.225341796875, -0.20391845703125, -0.1824951171875, -0.16107177734375, -0.1396484375, -0.11822509765625, -0.0968017578125, -0.07537841796875, -0.053955078125, -0.03253173828125, -0.0111083984375, 0.01031494140625, 0.03173828125, 0.05316162109375, 0.0745849609375, 0.09600830078125, 0.117431640625, 0.13885498046875, 0.1602783203125, 0.18170166015625, 0.203125, 0.22454833984375, 0.2459716796875, 0.26739501953125, 0.288818359375, 0.31024169921875, 0.3316650390625, 0.35308837890625, 0.37451171875, 0.39593505859375, 0.4173583984375, 0.43878173828125, 0.460205078125, 0.48162841796875, 0.5030517578125, 0.52447509765625, 0.5458984375, 0.56732177734375, 0.5887451171875, 0.61016845703125, 0.631591796875, 0.65301513671875, 0.6744384765625, 0.69586181640625, 0.71728515625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 0.0, 3.0, 2.0, 2.0, 7.0, 6.0, 3.0, 14.0, 11.0, 9.0, 15.0, 17.0, 25.0, 23.0, 26.0, 36.0, 34.0, 40.0, 43.0, 39.0, 58.0, 53.0, 35.0, 58.0, 43.0, 49.0, 46.0, 46.0, 40.0, 36.0, 30.0, 30.0, 23.0, 24.0, 17.0, 7.0, 14.0, 11.0, 7.0, 6.0, 5.0, 3.0, 2.0, 3.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.0263671875, -0.996856689453125, -0.96734619140625, -0.937835693359375, -0.9083251953125, -0.878814697265625, -0.84930419921875, -0.819793701171875, -0.790283203125, -0.760772705078125, -0.73126220703125, -0.701751708984375, -0.6722412109375, -0.642730712890625, -0.61322021484375, -0.583709716796875, -0.55419921875, -0.524688720703125, -0.49517822265625, -0.465667724609375, -0.4361572265625, -0.406646728515625, -0.37713623046875, -0.347625732421875, -0.318115234375, -0.288604736328125, -0.25909423828125, -0.229583740234375, -0.2000732421875, -0.170562744140625, -0.14105224609375, -0.111541748046875, -0.08203125, -0.052520751953125, -0.02301025390625, 0.006500244140625, 0.0360107421875, 0.065521240234375, 0.09503173828125, 0.124542236328125, 0.154052734375, 0.183563232421875, 0.21307373046875, 0.242584228515625, 0.2720947265625, 0.301605224609375, 0.33111572265625, 0.360626220703125, 0.39013671875, 0.419647216796875, 0.44915771484375, 0.478668212890625, 0.5081787109375, 0.537689208984375, 0.56719970703125, 0.596710205078125, 0.626220703125, 0.655731201171875, 0.68524169921875, 0.714752197265625, 0.7442626953125, 0.773773193359375, 0.80328369140625, 0.832794189453125, 0.8623046875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 6.0, 4.0, 11.0, 11.0, 14.0, 19.0, 31.0, 52.0, 73.0, 136.0, 258.0, 653.0, 2227.0, 12227.0, 174795.0, 3723573.0, 261202.0, 14999.0, 2711.0, 671.0, 273.0, 127.0, 58.0, 46.0, 28.0, 22.0, 12.0, 11.0, 5.0, 9.0, 5.0, 1.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.556640625, -2.46710205078125, -2.3775634765625, -2.28802490234375, -2.198486328125, -2.10894775390625, -2.0194091796875, -1.92987060546875, -1.84033203125, -1.75079345703125, -1.6612548828125, -1.57171630859375, -1.482177734375, -1.39263916015625, -1.3031005859375, -1.21356201171875, -1.1240234375, -1.03448486328125, -0.9449462890625, -0.85540771484375, -0.765869140625, -0.67633056640625, -0.5867919921875, -0.49725341796875, -0.40771484375, -0.31817626953125, -0.2286376953125, -0.13909912109375, -0.049560546875, 0.03997802734375, 0.1295166015625, 0.21905517578125, 0.30859375, 0.39813232421875, 0.4876708984375, 0.57720947265625, 0.666748046875, 0.75628662109375, 0.8458251953125, 0.93536376953125, 1.02490234375, 1.11444091796875, 1.2039794921875, 1.29351806640625, 1.383056640625, 1.47259521484375, 1.5621337890625, 1.65167236328125, 1.7412109375, 1.83074951171875, 1.9202880859375, 2.00982666015625, 2.099365234375, 2.18890380859375, 2.2784423828125, 2.36798095703125, 2.45751953125, 2.54705810546875, 2.6365966796875, 2.72613525390625, 2.815673828125, 2.90521240234375, 2.9947509765625, 3.08428955078125, 3.173828125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 6.0, 5.0, 5.0, 9.0, 4.0, 17.0, 26.0, 42.0, 48.0, 67.0, 100.0, 165.0, 243.0, 353.0, 453.0, 574.0, 570.0, 434.0, 318.0, 217.0, 125.0, 92.0, 61.0, 41.0, 32.0, 17.0, 8.0, 10.0, 9.0, 6.0, 3.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.171875, -2.109588623046875, -2.04730224609375, -1.985015869140625, -1.9227294921875, -1.860443115234375, -1.79815673828125, -1.735870361328125, -1.673583984375, -1.611297607421875, -1.54901123046875, -1.486724853515625, -1.4244384765625, -1.362152099609375, -1.29986572265625, -1.237579345703125, -1.17529296875, -1.113006591796875, -1.05072021484375, -0.988433837890625, -0.9261474609375, -0.863861083984375, -0.80157470703125, -0.739288330078125, -0.677001953125, -0.614715576171875, -0.55242919921875, -0.490142822265625, -0.4278564453125, -0.365570068359375, -0.30328369140625, -0.240997314453125, -0.1787109375, -0.116424560546875, -0.05413818359375, 0.008148193359375, 0.0704345703125, 0.132720947265625, 0.19500732421875, 0.257293701171875, 0.319580078125, 0.381866455078125, 0.44415283203125, 0.506439208984375, 0.5687255859375, 0.631011962890625, 0.69329833984375, 0.755584716796875, 0.81787109375, 0.880157470703125, 0.94244384765625, 1.004730224609375, 1.0670166015625, 1.129302978515625, 1.19158935546875, 1.253875732421875, 1.316162109375, 1.378448486328125, 1.44073486328125, 1.503021240234375, 1.5653076171875, 1.627593994140625, 1.68988037109375, 1.752166748046875, 1.814453125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 7.0, 11.0, 18.0, 34.0, 137.0, 300.0, 331.0, 119.0, 37.0, 9.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.78962326049805, -55.70196533203125, -54.61430358886719, -53.52664566040039, -52.438987731933594, -51.35132598876953, -50.263668060302734, -49.17600631713867, -48.088348388671875, -47.00069046020508, -45.913028717041016, -44.82537078857422, -43.737709045410156, -42.65005111694336, -41.56239318847656, -40.4747314453125, -39.3870735168457, -38.299415588378906, -37.211753845214844, -36.12409591674805, -35.03643798828125, -33.94877624511719, -32.86111831665039, -31.77345848083496, -30.68579864501953, -29.5981388092041, -28.510478973388672, -27.422821044921875, -26.335161209106445, -25.247501373291016, -24.15984344482422, -23.07218360900879, -21.984525680541992, -20.896865844726562, -19.809207916259766, -18.721548080444336, -17.633888244628906, -16.546228408813477, -15.458569526672363, -14.37091064453125, -13.28325080871582, -12.19559097290039, -11.107932090759277, -10.020273208618164, -8.932613372802734, -7.844954013824463, -6.757294654846191, -5.66963529586792, -4.581975936889648, -3.494316577911377, -2.4066572189331055, -1.318997859954834, -0.2313385009765625, 0.856320858001709, 1.9439802169799805, 3.031639575958252, 4.119298934936523, 5.206958293914795, 6.294617652893066, 7.382277011871338, 8.46993637084961, 9.557596206665039, 10.645255088806152, 11.732913970947266, 12.820573806762695]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 2.0, 10.0, 4.0, 12.0, 11.0, 10.0, 12.0, 20.0, 27.0, 29.0, 29.0, 43.0, 36.0, 55.0, 48.0, 52.0, 54.0, 47.0, 60.0, 54.0, 49.0, 70.0, 32.0, 42.0, 28.0, 32.0, 23.0, 17.0, 20.0, 13.0, 15.0, 16.0, 11.0, 7.0, 3.0, 0.0, 7.0, 3.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.378660202026367, -10.024774551391602, -9.670888900756836, -9.31700325012207, -8.963116645812988, -8.609230995178223, -8.255345344543457, -7.901459693908691, -7.547573566436768, -7.193687915802002, -6.839801788330078, -6.4859161376953125, -6.132030487060547, -5.778144359588623, -5.424258708953857, -5.070372581481934, -4.716486930847168, -4.362601280212402, -4.0087151527404785, -3.654829502105713, -3.300943613052368, -2.9470577239990234, -2.593172073364258, -2.239286184310913, -1.8854002952575684, -1.5315144062042236, -1.1776286363601685, -0.8237428665161133, -0.46985697746276855, -0.11597108840942383, 0.2379145622253418, 0.5918004512786865, 0.9456863403320312, 1.299572229385376, 1.6534579992294312, 2.0073437690734863, 2.361229658126831, 2.715115547180176, 3.0690011978149414, 3.422887086868286, 3.776772975921631, 4.1306586265563965, 4.48454475402832, 4.838430404663086, 5.192316055297852, 5.546202182769775, 5.900087833404541, 6.253973960876465, 6.6078596115112305, 6.961745262145996, 7.31563138961792, 7.6695170402526855, 8.02340316772461, 8.377288818359375, 8.73117446899414, 9.085060119628906, 9.438945770263672, 9.792831420898438, 10.146717071533203, 10.500602722167969, 10.85448932647705, 11.208374977111816, 11.562260627746582, 11.916146278381348, 12.27003288269043]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 4.0, 1.0, 5.0, 10.0, 6.0, 12.0, 17.0, 25.0, 35.0, 48.0, 76.0, 96.0, 151.0, 209.0, 339.0, 429.0, 710.0, 1102.0, 1688.0, 2668.0, 4409.0, 7014.0, 12074.0, 21315.0, 39490.0, 76186.0, 148980.0, 251264.0, 223334.0, 120259.0, 60737.0, 32016.0, 17479.0, 10014.0, 5943.0, 3692.0, 2356.0, 1477.0, 950.0, 663.0, 391.0, 301.0, 165.0, 133.0, 81.0, 67.0, 43.0, 28.0, 19.0, 20.0, 9.0, 6.0, 9.0, 5.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.0732421875, -1.0384368896484375, -1.003631591796875, -0.9688262939453125, -0.93402099609375, -0.8992156982421875, -0.864410400390625, -0.8296051025390625, -0.7947998046875, -0.7599945068359375, -0.725189208984375, -0.6903839111328125, -0.65557861328125, -0.6207733154296875, -0.585968017578125, -0.5511627197265625, -0.516357421875, -0.4815521240234375, -0.446746826171875, -0.4119415283203125, -0.37713623046875, -0.3423309326171875, -0.307525634765625, -0.2727203369140625, -0.2379150390625, -0.2031097412109375, -0.168304443359375, -0.1334991455078125, -0.09869384765625, -0.0638885498046875, -0.029083251953125, 0.0057220458984375, 0.04052734375, 0.0753326416015625, 0.110137939453125, 0.1449432373046875, 0.17974853515625, 0.2145538330078125, 0.249359130859375, 0.2841644287109375, 0.3189697265625, 0.3537750244140625, 0.388580322265625, 0.4233856201171875, 0.45819091796875, 0.4929962158203125, 0.527801513671875, 0.5626068115234375, 0.597412109375, 0.6322174072265625, 0.667022705078125, 0.7018280029296875, 0.73663330078125, 0.7714385986328125, 0.806243896484375, 0.8410491943359375, 0.8758544921875, 0.9106597900390625, 0.945465087890625, 0.9802703857421875, 1.01507568359375, 1.0498809814453125, 1.084686279296875, 1.1194915771484375, 1.154296875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 4.0, 7.0, 5.0, 9.0, 9.0, 8.0, 12.0, 19.0, 29.0, 25.0, 29.0, 29.0, 33.0, 33.0, 32.0, 32.0, 50.0, 54.0, 55.0, 41.0, 45.0, 44.0, 38.0, 43.0, 26.0, 35.0, 42.0, 31.0, 32.0, 22.0, 24.0, 16.0, 22.0, 15.0, 8.0, 9.0, 6.0, 11.0, 8.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.93798828125, -0.9094009399414062, -0.8808135986328125, -0.8522262573242188, -0.823638916015625, -0.7950515747070312, -0.7664642333984375, -0.7378768920898438, -0.70928955078125, -0.6807022094726562, -0.6521148681640625, -0.6235275268554688, -0.594940185546875, -0.5663528442382812, -0.5377655029296875, -0.5091781616210938, -0.4805908203125, -0.45200347900390625, -0.4234161376953125, -0.39482879638671875, -0.366241455078125, -0.33765411376953125, -0.3090667724609375, -0.28047943115234375, -0.25189208984375, -0.22330474853515625, -0.1947174072265625, -0.16613006591796875, -0.137542724609375, -0.10895538330078125, -0.0803680419921875, -0.05178070068359375, -0.023193359375, 0.00539398193359375, 0.0339813232421875, 0.06256866455078125, 0.091156005859375, 0.11974334716796875, 0.1483306884765625, 0.17691802978515625, 0.20550537109375, 0.23409271240234375, 0.2626800537109375, 0.29126739501953125, 0.319854736328125, 0.34844207763671875, 0.3770294189453125, 0.40561676025390625, 0.4342041015625, 0.46279144287109375, 0.4913787841796875, 0.5199661254882812, 0.548553466796875, 0.5771408081054688, 0.6057281494140625, 0.6343154907226562, 0.66290283203125, 0.6914901733398438, 0.7200775146484375, 0.7486648559570312, 0.777252197265625, 0.8058395385742188, 0.8344268798828125, 0.8630142211914062, 0.8916015625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 7.0, 10.0, 9.0, 11.0, 12.0, 26.0, 24.0, 39.0, 48.0, 63.0, 64.0, 128.0, 196.0, 253.0, 405.0, 630.0, 1016.0, 2240.0, 6583.0, 31354.0, 249152.0, 685188.0, 54852.0, 9734.0, 3021.0, 1337.0, 739.0, 442.0, 309.0, 191.0, 132.0, 88.0, 85.0, 51.0, 29.0, 29.0, 19.0, 10.0, 11.0, 9.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.021484375, -2.930328369140625, -2.83917236328125, -2.748016357421875, -2.6568603515625, -2.565704345703125, -2.47454833984375, -2.383392333984375, -2.292236328125, -2.201080322265625, -2.10992431640625, -2.018768310546875, -1.9276123046875, -1.836456298828125, -1.74530029296875, -1.654144287109375, -1.56298828125, -1.471832275390625, -1.38067626953125, -1.289520263671875, -1.1983642578125, -1.107208251953125, -1.01605224609375, -0.924896240234375, -0.833740234375, -0.742584228515625, -0.65142822265625, -0.560272216796875, -0.4691162109375, -0.377960205078125, -0.28680419921875, -0.195648193359375, -0.1044921875, -0.013336181640625, 0.07781982421875, 0.168975830078125, 0.2601318359375, 0.351287841796875, 0.44244384765625, 0.533599853515625, 0.624755859375, 0.715911865234375, 0.80706787109375, 0.898223876953125, 0.9893798828125, 1.080535888671875, 1.17169189453125, 1.262847900390625, 1.35400390625, 1.445159912109375, 1.53631591796875, 1.627471923828125, 1.7186279296875, 1.809783935546875, 1.90093994140625, 1.992095947265625, 2.083251953125, 2.174407958984375, 2.26556396484375, 2.356719970703125, 2.4478759765625, 2.539031982421875, 2.63018798828125, 2.721343994140625, 2.8125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 3.0, 4.0, 10.0, 7.0, 7.0, 11.0, 13.0, 14.0, 15.0, 28.0, 27.0, 29.0, 36.0, 37.0, 67.0, 45.0, 68.0, 63.0, 49.0, 70.0, 53.0, 59.0, 61.0, 42.0, 27.0, 31.0, 20.0, 22.0, 16.0, 15.0, 8.0, 5.0, 7.0, 6.0, 8.0, 2.0, 3.0, 6.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.451171875, -3.333099365234375, -3.21502685546875, -3.096954345703125, -2.9788818359375, -2.860809326171875, -2.74273681640625, -2.624664306640625, -2.506591796875, -2.388519287109375, -2.27044677734375, -2.152374267578125, -2.0343017578125, -1.916229248046875, -1.79815673828125, -1.680084228515625, -1.56201171875, -1.443939208984375, -1.32586669921875, -1.207794189453125, -1.0897216796875, -0.971649169921875, -0.85357666015625, -0.735504150390625, -0.617431640625, -0.499359130859375, -0.38128662109375, -0.263214111328125, -0.1451416015625, -0.027069091796875, 0.09100341796875, 0.209075927734375, 0.3271484375, 0.445220947265625, 0.56329345703125, 0.681365966796875, 0.7994384765625, 0.917510986328125, 1.03558349609375, 1.153656005859375, 1.271728515625, 1.389801025390625, 1.50787353515625, 1.625946044921875, 1.7440185546875, 1.862091064453125, 1.98016357421875, 2.098236083984375, 2.21630859375, 2.334381103515625, 2.45245361328125, 2.570526123046875, 2.6885986328125, 2.806671142578125, 2.92474365234375, 3.042816162109375, 3.160888671875, 3.278961181640625, 3.39703369140625, 3.515106201171875, 3.6331787109375, 3.751251220703125, 3.86932373046875, 3.987396240234375, 4.10546875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 1.0, 9.0, 5.0, 12.0, 16.0, 19.0, 33.0, 48.0, 80.0, 135.0, 174.0, 327.0, 675.0, 1383.0, 3707.0, 12704.0, 58030.0, 630887.0, 278823.0, 45206.0, 10461.0, 3186.0, 1213.0, 584.0, 312.0, 175.0, 121.0, 77.0, 41.0, 41.0, 18.0, 18.0, 11.0, 6.0, 5.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.62939453125, -0.60968017578125, -0.5899658203125, -0.57025146484375, -0.550537109375, -0.53082275390625, -0.5111083984375, -0.49139404296875, -0.4716796875, -0.45196533203125, -0.4322509765625, -0.41253662109375, -0.392822265625, -0.37310791015625, -0.3533935546875, -0.33367919921875, -0.31396484375, -0.29425048828125, -0.2745361328125, -0.25482177734375, -0.235107421875, -0.21539306640625, -0.1956787109375, -0.17596435546875, -0.15625, -0.13653564453125, -0.1168212890625, -0.09710693359375, -0.077392578125, -0.05767822265625, -0.0379638671875, -0.01824951171875, 0.00146484375, 0.02117919921875, 0.0408935546875, 0.06060791015625, 0.080322265625, 0.10003662109375, 0.1197509765625, 0.13946533203125, 0.1591796875, 0.17889404296875, 0.1986083984375, 0.21832275390625, 0.238037109375, 0.25775146484375, 0.2774658203125, 0.29718017578125, 0.31689453125, 0.33660888671875, 0.3563232421875, 0.37603759765625, 0.395751953125, 0.41546630859375, 0.4351806640625, 0.45489501953125, 0.474609375, 0.49432373046875, 0.5140380859375, 0.53375244140625, 0.553466796875, 0.57318115234375, 0.5928955078125, 0.61260986328125, 0.63232421875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 5.0, 5.0, 8.0, 13.0, 20.0, 17.0, 16.0, 34.0, 27.0, 56.0, 73.0, 120.0, 149.0, 110.0, 100.0, 67.0, 43.0, 38.0, 23.0, 17.0, 11.0, 13.0, 12.0, 8.0, 3.0, 3.0, 6.0, 5.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002951622009277344, -0.00028666481375694275, -0.0002781674265861511, -0.0002696700394153595, -0.00026117265224456787, -0.00025267526507377625, -0.0002441778779029846, -0.000235680490732193, -0.00022718310356140137, -0.00021868571639060974, -0.00021018832921981812, -0.0002016909420490265, -0.00019319355487823486, -0.00018469616770744324, -0.0001761987805366516, -0.00016770139336585999, -0.00015920400619506836, -0.00015070661902427673, -0.0001422092318534851, -0.00013371184468269348, -0.00012521445751190186, -0.00011671707034111023, -0.0001082196831703186, -9.972229599952698e-05, -9.122490882873535e-05, -8.272752165794373e-05, -7.42301344871521e-05, -6.573274731636047e-05, -5.723536014556885e-05, -4.873797297477722e-05, -4.0240585803985596e-05, -3.174319863319397e-05, -2.3245811462402344e-05, -1.4748424291610718e-05, -6.251037120819092e-06, 2.246350049972534e-06, 1.074373722076416e-05, 1.9241124391555786e-05, 2.7738511562347412e-05, 3.623589873313904e-05, 4.4733285903930664e-05, 5.323067307472229e-05, 6.172806024551392e-05, 7.022544741630554e-05, 7.872283458709717e-05, 8.72202217578888e-05, 9.571760892868042e-05, 0.00010421499609947205, 0.00011271238327026367, 0.0001212097704410553, 0.00012970715761184692, 0.00013820454478263855, 0.00014670193195343018, 0.0001551993191242218, 0.00016369670629501343, 0.00017219409346580505, 0.00018069148063659668, 0.0001891888678073883, 0.00019768625497817993, 0.00020618364214897156, 0.00021468102931976318, 0.0002231784164905548, 0.00023167580366134644, 0.00024017319083213806, 0.0002486705780029297]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 6.0, 4.0, 6.0, 12.0, 31.0, 37.0, 78.0, 142.0, 321.0, 743.0, 2207.0, 11218.0, 162717.0, 824099.0, 40001.0, 4629.0, 1319.0, 505.0, 214.0, 115.0, 64.0, 31.0, 22.0, 11.0, 9.0, 5.0, 4.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0380859375, -1.0068740844726562, -0.9756622314453125, -0.9444503784179688, -0.913238525390625, -0.8820266723632812, -0.8508148193359375, -0.8196029663085938, -0.78839111328125, -0.7571792602539062, -0.7259674072265625, -0.6947555541992188, -0.663543701171875, -0.6323318481445312, -0.6011199951171875, -0.5699081420898438, -0.5386962890625, -0.5074844360351562, -0.4762725830078125, -0.44506072998046875, -0.413848876953125, -0.38263702392578125, -0.3514251708984375, -0.32021331787109375, -0.28900146484375, -0.25778961181640625, -0.2265777587890625, -0.19536590576171875, -0.164154052734375, -0.13294219970703125, -0.1017303466796875, -0.07051849365234375, -0.039306640625, -0.00809478759765625, 0.0231170654296875, 0.05432891845703125, 0.085540771484375, 0.11675262451171875, 0.1479644775390625, 0.17917633056640625, 0.21038818359375, 0.24160003662109375, 0.2728118896484375, 0.30402374267578125, 0.335235595703125, 0.36644744873046875, 0.3976593017578125, 0.42887115478515625, 0.4600830078125, 0.49129486083984375, 0.5225067138671875, 0.5537185668945312, 0.584930419921875, 0.6161422729492188, 0.6473541259765625, 0.6785659790039062, 0.70977783203125, 0.7409896850585938, 0.7722015380859375, 0.8034133911132812, 0.834625244140625, 0.8658370971679688, 0.8970489501953125, 0.9282608032226562, 0.95947265625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 6.0, 5.0, 3.0, 14.0, 11.0, 13.0, 16.0, 20.0, 22.0, 26.0, 55.0, 76.0, 66.0, 117.0, 121.0, 114.0, 93.0, 58.0, 37.0, 30.0, 33.0, 22.0, 11.0, 14.0, 7.0, 6.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.724609375, -0.7015380859375, -0.678466796875, -0.6553955078125, -0.63232421875, -0.6092529296875, -0.586181640625, -0.5631103515625, -0.5400390625, -0.5169677734375, -0.493896484375, -0.4708251953125, -0.44775390625, -0.4246826171875, -0.401611328125, -0.3785400390625, -0.35546875, -0.3323974609375, -0.309326171875, -0.2862548828125, -0.26318359375, -0.2401123046875, -0.217041015625, -0.1939697265625, -0.1708984375, -0.1478271484375, -0.124755859375, -0.1016845703125, -0.07861328125, -0.0555419921875, -0.032470703125, -0.0093994140625, 0.013671875, 0.0367431640625, 0.059814453125, 0.0828857421875, 0.10595703125, 0.1290283203125, 0.152099609375, 0.1751708984375, 0.1982421875, 0.2213134765625, 0.244384765625, 0.2674560546875, 0.29052734375, 0.3135986328125, 0.336669921875, 0.3597412109375, 0.3828125, 0.4058837890625, 0.428955078125, 0.4520263671875, 0.47509765625, 0.4981689453125, 0.521240234375, 0.5443115234375, 0.5673828125, 0.5904541015625, 0.613525390625, 0.6365966796875, 0.65966796875, 0.6827392578125, 0.705810546875, 0.7288818359375, 0.751953125]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 7.0, 16.0, 13.0, 36.0, 90.0, 145.0, 390.0, 145.0, 82.0, 35.0, 20.0, 14.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-25.571950912475586, -24.851276397705078, -24.13060188293457, -23.409927368164062, -22.689252853393555, -21.968578338623047, -21.24790382385254, -20.52722930908203, -19.806554794311523, -19.085880279541016, -18.365205764770508, -17.64453125, -16.923856735229492, -16.203182220458984, -15.482507705688477, -14.761833190917969, -14.041158676147461, -13.320484161376953, -12.599809646606445, -11.879135131835938, -11.15846061706543, -10.437786102294922, -9.717111587524414, -8.996437072753906, -8.275762557983398, -7.555088043212891, -6.834413528442383, -6.113739013671875, -5.393064498901367, -4.672389984130859, -3.9517154693603516, -3.2310409545898438, -2.510364532470703, -1.7896900177001953, -1.0690155029296875, -0.3483409881591797, 0.3723335266113281, 1.093008041381836, 1.8136825561523438, 2.5343570709228516, 3.2550315856933594, 3.975706100463867, 4.696380615234375, 5.417055130004883, 6.137729644775391, 6.858404159545898, 7.579078674316406, 8.299753189086914, 9.020427703857422, 9.74110221862793, 10.461776733398438, 11.182451248168945, 11.903125762939453, 12.623800277709961, 13.344474792480469, 14.065149307250977, 14.785823822021484, 15.506498336791992, 16.2271728515625, 16.947847366333008, 17.668521881103516, 18.389196395874023, 19.10987091064453, 19.83054542541504, 20.551219940185547]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 6.0, 3.0, 7.0, 11.0, 7.0, 8.0, 4.0, 8.0, 13.0, 18.0, 20.0, 29.0, 33.0, 24.0, 22.0, 28.0, 31.0, 41.0, 97.0, 159.0, 85.0, 48.0, 37.0, 33.0, 33.0, 38.0, 21.0, 21.0, 18.0, 7.0, 20.0, 10.0, 13.0, 11.0, 5.0, 11.0, 3.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-14.804824829101562, -14.386870384216309, -13.968915939331055, -13.5509614944458, -13.133007049560547, -12.715051651000977, -12.297097206115723, -11.879142761230469, -11.461188316345215, -11.043233871459961, -10.625279426574707, -10.207324981689453, -9.789369583129883, -9.371416091918945, -8.953460693359375, -8.535506248474121, -8.117551803588867, -7.699597358703613, -7.281642913818359, -6.863687992095947, -6.445733547210693, -6.0277791023254395, -5.609824180603027, -5.191869735717773, -4.7739152908325195, -4.355960845947266, -3.9380061626434326, -3.5200514793395996, -3.1020970344543457, -2.684142589569092, -2.266187906265259, -1.8482332229614258, -1.4302787780761719, -1.0123242139816284, -0.594369649887085, -0.1764150857925415, 0.24153947830200195, 0.6594939231872559, 1.0774486064910889, 1.4954032897949219, 1.9133577346801758, 2.3313121795654297, 2.7492668628692627, 3.1672215461730957, 3.5851759910583496, 4.0031304359436035, 4.421085357666016, 4.8390398025512695, 5.256994247436523, 5.674948692321777, 6.092903137207031, 6.510858058929443, 6.928812503814697, 7.346766948699951, 7.764721870422363, 8.182676315307617, 8.600630760192871, 9.018585205078125, 9.436539649963379, 9.854494094848633, 10.272449493408203, 10.69040298461914, 11.108358383178711, 11.526312828063965, 11.944267272949219]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 4.0, 3.0, 7.0, 11.0, 15.0, 25.0, 37.0, 46.0, 57.0, 119.0, 169.0, 216.0, 294.0, 485.0, 744.0, 1196.0, 1882.0, 3250.0, 6333.0, 13605.0, 34103.0, 100166.0, 312023.0, 813019.0, 1400626.0, 928624.0, 376205.0, 125352.0, 42614.0, 16124.0, 7309.0, 3723.0, 2126.0, 1245.0, 824.0, 522.0, 364.0, 256.0, 181.0, 121.0, 77.0, 69.0, 43.0, 19.0, 23.0, 8.0, 12.0, 1.0, 4.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.927734375, -0.8992691040039062, -0.8708038330078125, -0.8423385620117188, -0.813873291015625, -0.7854080200195312, -0.7569427490234375, -0.7284774780273438, -0.70001220703125, -0.6715469360351562, -0.6430816650390625, -0.6146163940429688, -0.586151123046875, -0.5576858520507812, -0.5292205810546875, -0.5007553100585938, -0.4722900390625, -0.44382476806640625, -0.4153594970703125, -0.38689422607421875, -0.358428955078125, -0.32996368408203125, -0.3014984130859375, -0.27303314208984375, -0.24456787109375, -0.21610260009765625, -0.1876373291015625, -0.15917205810546875, -0.130706787109375, -0.10224151611328125, -0.0737762451171875, -0.04531097412109375, -0.016845703125, 0.01161956787109375, 0.0400848388671875, 0.06855010986328125, 0.097015380859375, 0.12548065185546875, 0.1539459228515625, 0.18241119384765625, 0.21087646484375, 0.23934173583984375, 0.2678070068359375, 0.29627227783203125, 0.324737548828125, 0.35320281982421875, 0.3816680908203125, 0.41013336181640625, 0.4385986328125, 0.46706390380859375, 0.4955291748046875, 0.5239944458007812, 0.552459716796875, 0.5809249877929688, 0.6093902587890625, 0.6378555297851562, 0.66632080078125, 0.6947860717773438, 0.7232513427734375, 0.7517166137695312, 0.780181884765625, 0.8086471557617188, 0.8371124267578125, 0.8655776977539062, 0.89404296875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 1.0, 3.0, 1.0, 2.0, 4.0, 11.0, 10.0, 7.0, 7.0, 12.0, 16.0, 21.0, 21.0, 27.0, 26.0, 30.0, 20.0, 33.0, 26.0, 42.0, 51.0, 38.0, 43.0, 48.0, 38.0, 53.0, 43.0, 41.0, 43.0, 36.0, 32.0, 28.0, 29.0, 17.0, 28.0, 22.0, 17.0, 21.0, 12.0, 13.0, 6.0, 10.0, 6.0, 5.0, 3.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.9287109375, -0.9028244018554688, -0.8769378662109375, -0.8510513305664062, -0.825164794921875, -0.7992782592773438, -0.7733917236328125, -0.7475051879882812, -0.72161865234375, -0.6957321166992188, -0.6698455810546875, -0.6439590454101562, -0.618072509765625, -0.5921859741210938, -0.5662994384765625, -0.5404129028320312, -0.5145263671875, -0.48863983154296875, -0.4627532958984375, -0.43686676025390625, -0.410980224609375, -0.38509368896484375, -0.3592071533203125, -0.33332061767578125, -0.30743408203125, -0.28154754638671875, -0.2556610107421875, -0.22977447509765625, -0.203887939453125, -0.17800140380859375, -0.1521148681640625, -0.12622833251953125, -0.100341796875, -0.07445526123046875, -0.0485687255859375, -0.02268218994140625, 0.003204345703125, 0.02909088134765625, 0.0549774169921875, 0.08086395263671875, 0.10675048828125, 0.13263702392578125, 0.1585235595703125, 0.18441009521484375, 0.210296630859375, 0.23618316650390625, 0.2620697021484375, 0.28795623779296875, 0.3138427734375, 0.33972930908203125, 0.3656158447265625, 0.39150238037109375, 0.417388916015625, 0.44327545166015625, 0.4691619873046875, 0.49504852294921875, 0.52093505859375, 0.5468215942382812, 0.5727081298828125, 0.5985946655273438, 0.624481201171875, 0.6503677368164062, 0.6762542724609375, 0.7021408081054688, 0.72802734375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 4.0, 5.0, 5.0, 5.0, 8.0, 18.0, 20.0, 39.0, 78.0, 154.0, 255.0, 531.0, 1283.0, 3634.0, 34863.0, 3941238.0, 202220.0, 6925.0, 1626.0, 717.0, 296.0, 151.0, 83.0, 57.0, 31.0, 12.0, 10.0, 6.0, 7.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.04296875, -5.86358642578125, -5.6842041015625, -5.50482177734375, -5.325439453125, -5.14605712890625, -4.9666748046875, -4.78729248046875, -4.60791015625, -4.42852783203125, -4.2491455078125, -4.06976318359375, -3.890380859375, -3.71099853515625, -3.5316162109375, -3.35223388671875, -3.1728515625, -2.99346923828125, -2.8140869140625, -2.63470458984375, -2.455322265625, -2.27593994140625, -2.0965576171875, -1.91717529296875, -1.73779296875, -1.55841064453125, -1.3790283203125, -1.19964599609375, -1.020263671875, -0.84088134765625, -0.6614990234375, -0.48211669921875, -0.302734375, -0.12335205078125, 0.0560302734375, 0.23541259765625, 0.414794921875, 0.59417724609375, 0.7735595703125, 0.95294189453125, 1.13232421875, 1.31170654296875, 1.4910888671875, 1.67047119140625, 1.849853515625, 2.02923583984375, 2.2086181640625, 2.38800048828125, 2.5673828125, 2.74676513671875, 2.9261474609375, 3.10552978515625, 3.284912109375, 3.46429443359375, 3.6436767578125, 3.82305908203125, 4.00244140625, 4.18182373046875, 4.3612060546875, 4.54058837890625, 4.719970703125, 4.89935302734375, 5.0787353515625, 5.25811767578125, 5.4375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 11.0, 21.0, 33.0, 57.0, 75.0, 155.0, 197.0, 373.0, 627.0, 787.0, 638.0, 380.0, 312.0, 149.0, 103.0, 61.0, 37.0, 20.0, 14.0, 8.0, 7.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.736328125, -3.613983154296875, -3.49163818359375, -3.369293212890625, -3.2469482421875, -3.124603271484375, -3.00225830078125, -2.879913330078125, -2.757568359375, -2.635223388671875, -2.51287841796875, -2.390533447265625, -2.2681884765625, -2.145843505859375, -2.02349853515625, -1.901153564453125, -1.77880859375, -1.656463623046875, -1.53411865234375, -1.411773681640625, -1.2894287109375, -1.167083740234375, -1.04473876953125, -0.922393798828125, -0.800048828125, -0.677703857421875, -0.55535888671875, -0.433013916015625, -0.3106689453125, -0.188323974609375, -0.06597900390625, 0.056365966796875, 0.1787109375, 0.301055908203125, 0.42340087890625, 0.545745849609375, 0.6680908203125, 0.790435791015625, 0.91278076171875, 1.035125732421875, 1.157470703125, 1.279815673828125, 1.40216064453125, 1.524505615234375, 1.6468505859375, 1.769195556640625, 1.89154052734375, 2.013885498046875, 2.13623046875, 2.258575439453125, 2.38092041015625, 2.503265380859375, 2.6256103515625, 2.747955322265625, 2.87030029296875, 2.992645263671875, 3.114990234375, 3.237335205078125, 3.35968017578125, 3.482025146484375, 3.6043701171875, 3.726715087890625, 3.84906005859375, 3.971405029296875, 4.09375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 3.0, 8.0, 8.0, 15.0, 18.0, 20.0, 44.0, 68.0, 92.0, 124.0, 162.0, 127.0, 108.0, 66.0, 45.0, 28.0, 17.0, 15.0, 15.0, 5.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.93829345703125, -32.163124084472656, -31.387950897216797, -30.612781524658203, -29.837610244750977, -29.06243896484375, -28.287269592285156, -27.51209831237793, -26.736927032470703, -25.961755752563477, -25.18658447265625, -24.411415100097656, -23.63624382019043, -22.861072540283203, -22.08590316772461, -21.310731887817383, -20.535560607910156, -19.76038932800293, -18.985218048095703, -18.21004867553711, -17.434877395629883, -16.659706115722656, -15.884535789489746, -15.109365463256836, -14.33419418334961, -13.559022903442383, -12.783852577209473, -12.008682250976562, -11.233510971069336, -10.45833969116211, -9.6831693649292, -8.907999038696289, -8.13282585144043, -7.357655048370361, -6.582484245300293, -5.807313442230225, -5.032142639160156, -4.256971836090088, -3.4818010330200195, -2.706630229949951, -1.9314594268798828, -1.1562886238098145, -0.3811178207397461, 0.39405298233032227, 1.1692237854003906, 1.944394588470459, 2.7195653915405273, 3.4947361946105957, 4.269906997680664, 5.045077800750732, 5.820248603820801, 6.595419406890869, 7.3705902099609375, 8.145761489868164, 8.920931816101074, 9.696102142333984, 10.471273422241211, 11.246444702148438, 12.021615028381348, 12.796785354614258, 13.571956634521484, 14.347127914428711, 15.122298240661621, 15.897468566894531, 16.672639846801758]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 5.0, 2.0, 1.0, 5.0, 3.0, 5.0, 5.0, 3.0, 8.0, 11.0, 12.0, 15.0, 17.0, 17.0, 24.0, 27.0, 24.0, 26.0, 23.0, 29.0, 35.0, 31.0, 35.0, 45.0, 52.0, 45.0, 40.0, 45.0, 45.0, 29.0, 35.0, 39.0, 35.0, 34.0, 21.0, 27.0, 25.0, 27.0, 19.0, 16.0, 12.0, 11.0, 8.0, 8.0, 7.0, 6.0, 6.0, 5.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.81635570526123, -12.397385597229004, -11.978415489196777, -11.559446334838867, -11.14047622680664, -10.721506118774414, -10.302536010742188, -9.883565902709961, -9.464595794677734, -9.045625686645508, -8.626655578613281, -8.207685470581055, -7.7887163162231445, -7.369746208190918, -6.950776100158691, -6.531805992126465, -6.112836837768555, -5.693866729736328, -5.27489709854126, -4.855926990509033, -4.436957359313965, -4.017987251281738, -3.5990171432495117, -3.1800472736358643, -2.761077404022217, -2.3421075344085693, -1.9231375455856323, -1.5041675567626953, -1.0851976871490479, -0.6662278175354004, -0.24725770950317383, 0.17171216011047363, 0.5906810760498047, 1.0096509456634521, 1.4286209344863892, 1.8475909233093262, 2.2665607929229736, 2.685530662536621, 3.1045007705688477, 3.523470640182495, 3.9424405097961426, 4.361410617828369, 4.7803802490234375, 5.199350357055664, 5.618320465087891, 6.037290096282959, 6.4562602043151855, 6.875229835510254, 7.2941999435424805, 7.713170051574707, 8.132140159606934, 8.551109313964844, 8.97007942199707, 9.389049530029297, 9.808019638061523, 10.22698974609375, 10.645959854125977, 11.064929962158203, 11.48390007019043, 11.902870178222656, 12.321839332580566, 12.740809440612793, 13.15977954864502, 13.578749656677246, 13.997718811035156]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 2.0, 9.0, 8.0, 11.0, 14.0, 22.0, 28.0, 41.0, 61.0, 105.0, 173.0, 216.0, 382.0, 620.0, 960.0, 1721.0, 3190.0, 6105.0, 13030.0, 32265.0, 93003.0, 387015.0, 363862.0, 88887.0, 30809.0, 12703.0, 5809.0, 3121.0, 1683.0, 1013.0, 601.0, 381.0, 265.0, 141.0, 86.0, 70.0, 46.0, 34.0, 19.0, 13.0, 8.0, 5.0, 5.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.5908203125, -1.54107666015625, -1.4913330078125, -1.44158935546875, -1.391845703125, -1.34210205078125, -1.2923583984375, -1.24261474609375, -1.19287109375, -1.14312744140625, -1.0933837890625, -1.04364013671875, -0.993896484375, -0.94415283203125, -0.8944091796875, -0.84466552734375, -0.794921875, -0.74517822265625, -0.6954345703125, -0.64569091796875, -0.595947265625, -0.54620361328125, -0.4964599609375, -0.44671630859375, -0.39697265625, -0.34722900390625, -0.2974853515625, -0.24774169921875, -0.197998046875, -0.14825439453125, -0.0985107421875, -0.04876708984375, 0.0009765625, 0.05072021484375, 0.1004638671875, 0.15020751953125, 0.199951171875, 0.24969482421875, 0.2994384765625, 0.34918212890625, 0.39892578125, 0.44866943359375, 0.4984130859375, 0.54815673828125, 0.597900390625, 0.64764404296875, 0.6973876953125, 0.74713134765625, 0.796875, 0.84661865234375, 0.8963623046875, 0.94610595703125, 0.995849609375, 1.04559326171875, 1.0953369140625, 1.14508056640625, 1.19482421875, 1.24456787109375, 1.2943115234375, 1.34405517578125, 1.393798828125, 1.44354248046875, 1.4932861328125, 1.54302978515625, 1.5927734375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 4.0, 1.0, 10.0, 8.0, 12.0, 12.0, 13.0, 16.0, 24.0, 26.0, 32.0, 43.0, 35.0, 42.0, 51.0, 50.0, 44.0, 50.0, 35.0, 54.0, 44.0, 47.0, 51.0, 45.0, 34.0, 37.0, 32.0, 23.0, 29.0, 19.0, 17.0, 14.0, 11.0, 9.0, 8.0, 8.0, 3.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.23046875, -1.1959075927734375, -1.161346435546875, -1.1267852783203125, -1.09222412109375, -1.0576629638671875, -1.023101806640625, -0.9885406494140625, -0.9539794921875, -0.9194183349609375, -0.884857177734375, -0.8502960205078125, -0.81573486328125, -0.7811737060546875, -0.746612548828125, -0.7120513916015625, -0.677490234375, -0.6429290771484375, -0.608367919921875, -0.5738067626953125, -0.53924560546875, -0.5046844482421875, -0.470123291015625, -0.4355621337890625, -0.4010009765625, -0.3664398193359375, -0.331878662109375, -0.2973175048828125, -0.26275634765625, -0.2281951904296875, -0.193634033203125, -0.1590728759765625, -0.12451171875, -0.0899505615234375, -0.055389404296875, -0.0208282470703125, 0.01373291015625, 0.0482940673828125, 0.082855224609375, 0.1174163818359375, 0.1519775390625, 0.1865386962890625, 0.221099853515625, 0.2556610107421875, 0.29022216796875, 0.3247833251953125, 0.359344482421875, 0.3939056396484375, 0.428466796875, 0.4630279541015625, 0.497589111328125, 0.5321502685546875, 0.56671142578125, 0.6012725830078125, 0.635833740234375, 0.6703948974609375, 0.7049560546875, 0.7395172119140625, 0.774078369140625, 0.8086395263671875, 0.84320068359375, 0.8777618408203125, 0.912322998046875, 0.9468841552734375, 0.9814453125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 12.0, 12.0, 11.0, 24.0, 31.0, 42.0, 68.0, 115.0, 174.0, 329.0, 690.0, 1853.0, 7295.0, 60937.0, 909814.0, 56762.0, 7040.0, 1857.0, 682.0, 321.0, 172.0, 118.0, 61.0, 49.0, 23.0, 15.0, 14.0, 9.0, 5.0, 4.0, 3.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.70703125, -3.602569580078125, -3.49810791015625, -3.393646240234375, -3.2891845703125, -3.184722900390625, -3.08026123046875, -2.975799560546875, -2.871337890625, -2.766876220703125, -2.66241455078125, -2.557952880859375, -2.4534912109375, -2.349029541015625, -2.24456787109375, -2.140106201171875, -2.03564453125, -1.931182861328125, -1.82672119140625, -1.722259521484375, -1.6177978515625, -1.513336181640625, -1.40887451171875, -1.304412841796875, -1.199951171875, -1.095489501953125, -0.99102783203125, -0.886566162109375, -0.7821044921875, -0.677642822265625, -0.57318115234375, -0.468719482421875, -0.3642578125, -0.259796142578125, -0.15533447265625, -0.050872802734375, 0.0535888671875, 0.158050537109375, 0.26251220703125, 0.366973876953125, 0.471435546875, 0.575897216796875, 0.68035888671875, 0.784820556640625, 0.8892822265625, 0.993743896484375, 1.09820556640625, 1.202667236328125, 1.30712890625, 1.411590576171875, 1.51605224609375, 1.620513916015625, 1.7249755859375, 1.829437255859375, 1.93389892578125, 2.038360595703125, 2.142822265625, 2.247283935546875, 2.35174560546875, 2.456207275390625, 2.5606689453125, 2.665130615234375, 2.76959228515625, 2.874053955078125, 2.978515625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 5.0, 3.0, 3.0, 4.0, 7.0, 6.0, 6.0, 7.0, 12.0, 19.0, 19.0, 15.0, 20.0, 16.0, 19.0, 20.0, 35.0, 34.0, 52.0, 53.0, 77.0, 73.0, 75.0, 78.0, 52.0, 47.0, 38.0, 25.0, 31.0, 15.0, 25.0, 16.0, 15.0, 21.0, 3.0, 12.0, 12.0, 6.0, 10.0, 5.0, 7.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-4.2734375, -4.142822265625, -4.01220703125, -3.881591796875, -3.7509765625, -3.620361328125, -3.48974609375, -3.359130859375, -3.228515625, -3.097900390625, -2.96728515625, -2.836669921875, -2.7060546875, -2.575439453125, -2.44482421875, -2.314208984375, -2.18359375, -2.052978515625, -1.92236328125, -1.791748046875, -1.6611328125, -1.530517578125, -1.39990234375, -1.269287109375, -1.138671875, -1.008056640625, -0.87744140625, -0.746826171875, -0.6162109375, -0.485595703125, -0.35498046875, -0.224365234375, -0.09375, 0.036865234375, 0.16748046875, 0.298095703125, 0.4287109375, 0.559326171875, 0.68994140625, 0.820556640625, 0.951171875, 1.081787109375, 1.21240234375, 1.343017578125, 1.4736328125, 1.604248046875, 1.73486328125, 1.865478515625, 1.99609375, 2.126708984375, 2.25732421875, 2.387939453125, 2.5185546875, 2.649169921875, 2.77978515625, 2.910400390625, 3.041015625, 3.171630859375, 3.30224609375, 3.432861328125, 3.5634765625, 3.694091796875, 3.82470703125, 3.955322265625, 4.0859375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 2.0, 6.0, 13.0, 12.0, 17.0, 28.0, 37.0, 49.0, 49.0, 107.0, 196.0, 343.0, 919.0, 2852.0, 13383.0, 157082.0, 843301.0, 23542.0, 4312.0, 1263.0, 474.0, 212.0, 119.0, 78.0, 36.0, 33.0, 26.0, 12.0, 8.0, 10.0, 11.0, 11.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.822265625, -0.7966842651367188, -0.7711029052734375, -0.7455215454101562, -0.719940185546875, -0.6943588256835938, -0.6687774658203125, -0.6431961059570312, -0.61761474609375, -0.5920333862304688, -0.5664520263671875, -0.5408706665039062, -0.515289306640625, -0.48970794677734375, -0.4641265869140625, -0.43854522705078125, -0.4129638671875, -0.38738250732421875, -0.3618011474609375, -0.33621978759765625, -0.310638427734375, -0.28505706787109375, -0.2594757080078125, -0.23389434814453125, -0.20831298828125, -0.18273162841796875, -0.1571502685546875, -0.13156890869140625, -0.105987548828125, -0.08040618896484375, -0.0548248291015625, -0.02924346923828125, -0.003662109375, 0.02191925048828125, 0.0475006103515625, 0.07308197021484375, 0.098663330078125, 0.12424468994140625, 0.1498260498046875, 0.17540740966796875, 0.20098876953125, 0.22657012939453125, 0.2521514892578125, 0.27773284912109375, 0.303314208984375, 0.32889556884765625, 0.3544769287109375, 0.38005828857421875, 0.4056396484375, 0.43122100830078125, 0.4568023681640625, 0.48238372802734375, 0.507965087890625, 0.5335464477539062, 0.5591278076171875, 0.5847091674804688, 0.61029052734375, 0.6358718872070312, 0.6614532470703125, 0.6870346069335938, 0.712615966796875, 0.7381973266601562, 0.7637786865234375, 0.7893600463867188, 0.81494140625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 4.0, 3.0, 5.0, 7.0, 10.0, 7.0, 5.0, 13.0, 15.0, 22.0, 18.0, 23.0, 28.0, 54.0, 63.0, 95.0, 105.0, 103.0, 93.0, 65.0, 57.0, 48.0, 23.0, 35.0, 13.0, 14.0, 21.0, 7.0, 5.0, 7.0, 4.0, 3.0, 8.0, 5.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.00016760826110839844, -0.00016271322965621948, -0.00015781819820404053, -0.00015292316675186157, -0.00014802813529968262, -0.00014313310384750366, -0.0001382380723953247, -0.00013334304094314575, -0.0001284480094909668, -0.00012355297803878784, -0.00011865794658660889, -0.00011376291513442993, -0.00010886788368225098, -0.00010397285223007202, -9.907782077789307e-05, -9.418278932571411e-05, -8.928775787353516e-05, -8.43927264213562e-05, -7.949769496917725e-05, -7.460266351699829e-05, -6.970763206481934e-05, -6.481260061264038e-05, -5.9917569160461426e-05, -5.502253770828247e-05, -5.0127506256103516e-05, -4.523247480392456e-05, -4.0337443351745605e-05, -3.544241189956665e-05, -3.0547380447387695e-05, -2.565234899520874e-05, -2.0757317543029785e-05, -1.586228609085083e-05, -1.0967254638671875e-05, -6.07222318649292e-06, -1.1771917343139648e-06, 3.7178397178649902e-06, 8.612871170043945e-06, 1.35079026222229e-05, 1.8402934074401855e-05, 2.329796552658081e-05, 2.8192996978759766e-05, 3.308802843093872e-05, 3.7983059883117676e-05, 4.287809133529663e-05, 4.7773122787475586e-05, 5.266815423965454e-05, 5.7563185691833496e-05, 6.245821714401245e-05, 6.73532485961914e-05, 7.224828004837036e-05, 7.714331150054932e-05, 8.203834295272827e-05, 8.693337440490723e-05, 9.182840585708618e-05, 9.672343730926514e-05, 0.00010161846876144409, 0.00010651350021362305, 0.000111408531665802, 0.00011630356311798096, 0.00012119859457015991, 0.00012609362602233887, 0.00013098865747451782, 0.00013588368892669678, 0.00014077872037887573, 0.0001456737518310547]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 7.0, 7.0, 6.0, 11.0, 19.0, 25.0, 35.0, 61.0, 92.0, 136.0, 216.0, 408.0, 755.0, 1852.0, 4892.0, 16288.0, 79402.0, 830221.0, 87473.0, 17547.0, 5232.0, 1915.0, 920.0, 384.0, 240.0, 154.0, 77.0, 56.0, 37.0, 20.0, 24.0, 12.0, 12.0, 5.0, 2.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.431640625, -0.4187660217285156, -0.40589141845703125, -0.3930168151855469, -0.3801422119140625, -0.3672676086425781, -0.35439300537109375, -0.3415184020996094, -0.328643798828125, -0.3157691955566406, -0.30289459228515625, -0.2900199890136719, -0.2771453857421875, -0.2642707824707031, -0.25139617919921875, -0.23852157592773438, -0.22564697265625, -0.21277236938476562, -0.19989776611328125, -0.18702316284179688, -0.1741485595703125, -0.16127395629882812, -0.14839935302734375, -0.13552474975585938, -0.122650146484375, -0.10977554321289062, -0.09690093994140625, -0.08402633666992188, -0.0711517333984375, -0.058277130126953125, -0.04540252685546875, -0.032527923583984375, -0.0196533203125, -0.006778717041015625, 0.00609588623046875, 0.018970489501953125, 0.0318450927734375, 0.044719696044921875, 0.05759429931640625, 0.07046890258789062, 0.083343505859375, 0.09621810913085938, 0.10909271240234375, 0.12196731567382812, 0.1348419189453125, 0.14771652221679688, 0.16059112548828125, 0.17346572875976562, 0.18634033203125, 0.19921493530273438, 0.21208953857421875, 0.22496414184570312, 0.2378387451171875, 0.2507133483886719, 0.26358795166015625, 0.2764625549316406, 0.289337158203125, 0.3022117614746094, 0.31508636474609375, 0.3279609680175781, 0.3408355712890625, 0.3537101745605469, 0.36658477783203125, 0.3794593811035156, 0.392333984375]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 0.0, 4.0, 0.0, 1.0, 5.0, 3.0, 4.0, 4.0, 8.0, 4.0, 9.0, 12.0, 14.0, 11.0, 20.0, 7.0, 15.0, 11.0, 37.0, 36.0, 44.0, 65.0, 71.0, 108.0, 113.0, 75.0, 51.0, 55.0, 29.0, 26.0, 20.0, 32.0, 18.0, 10.0, 7.0, 7.0, 13.0, 13.0, 9.0, 3.0, 5.0, 4.0, 3.0, 7.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0], "bins": [-0.4091796875, -0.3961830139160156, -0.38318634033203125, -0.3701896667480469, -0.3571929931640625, -0.3441963195800781, -0.33119964599609375, -0.3182029724121094, -0.305206298828125, -0.2922096252441406, -0.27921295166015625, -0.2662162780761719, -0.2532196044921875, -0.24022293090820312, -0.22722625732421875, -0.21422958374023438, -0.20123291015625, -0.18823623657226562, -0.17523956298828125, -0.16224288940429688, -0.1492462158203125, -0.13624954223632812, -0.12325286865234375, -0.11025619506835938, -0.097259521484375, -0.08426284790039062, -0.07126617431640625, -0.058269500732421875, -0.0452728271484375, -0.032276153564453125, -0.01927947998046875, -0.006282806396484375, 0.0067138671875, 0.019710540771484375, 0.03270721435546875, 0.045703887939453125, 0.0587005615234375, 0.07169723510742188, 0.08469390869140625, 0.09769058227539062, 0.110687255859375, 0.12368392944335938, 0.13668060302734375, 0.14967727661132812, 0.1626739501953125, 0.17567062377929688, 0.18866729736328125, 0.20166397094726562, 0.21466064453125, 0.22765731811523438, 0.24065399169921875, 0.2536506652832031, 0.2666473388671875, 0.2796440124511719, 0.29264068603515625, 0.3056373596191406, 0.318634033203125, 0.3316307067871094, 0.34462738037109375, 0.3576240539550781, 0.3706207275390625, 0.3836174011230469, 0.39661407470703125, 0.4096107482910156, 0.422607421875]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 12.0, 27.0, 92.0, 632.0, 155.0, 60.0, 17.0, 6.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.067142486572266, -43.76972579956055, -42.47230911254883, -41.17489242553711, -39.877479553222656, -38.58006286621094, -37.28264617919922, -35.9852294921875, -34.68781280517578, -33.39039611816406, -32.092979431152344, -30.795564651489258, -29.49814796447754, -28.20073127746582, -26.903316497802734, -25.605899810791016, -24.308483123779297, -23.011066436767578, -21.71364974975586, -20.416234970092773, -19.118818283081055, -17.821401596069336, -16.52398681640625, -15.226570129394531, -13.929153442382812, -12.631736755371094, -11.334321022033691, -10.036905288696289, -8.73948860168457, -7.44207239151001, -6.144656181335449, -4.847240447998047, -3.5498275756835938, -2.252411365509033, -0.9549951553344727, 0.3424210548400879, 1.6398372650146484, 2.937253475189209, 4.2346696853637695, 5.532085418701172, 6.829502105712891, 8.12691879272461, 9.424334526062012, 10.721750259399414, 12.019166946411133, 13.316583633422852, 14.613999366760254, 15.911415100097656, 17.208831787109375, 18.506248474121094, 19.803665161132812, 21.1010799407959, 22.398496627807617, 23.695913314819336, 24.993328094482422, 26.29074478149414, 27.58816146850586, 28.885578155517578, 30.182994842529297, 31.480409622192383, 32.77782440185547, 34.07524108886719, 35.372657775878906, 36.670074462890625, 37.967491149902344]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 3.0, 5.0, 2.0, 11.0, 11.0, 7.0, 15.0, 16.0, 23.0, 21.0, 27.0, 32.0, 48.0, 133.0, 382.0, 62.0, 37.0, 29.0, 35.0, 23.0, 21.0, 17.0, 19.0, 9.0, 12.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-26.31124496459961, -25.717653274536133, -25.124059677124023, -24.530467987060547, -23.93687629699707, -23.343284606933594, -22.749691009521484, -22.156099319458008, -21.56250762939453, -20.968915939331055, -20.375322341918945, -19.78173065185547, -19.188138961791992, -18.594547271728516, -18.000953674316406, -17.40736198425293, -16.813770294189453, -16.220178604125977, -15.626585960388184, -15.03299331665039, -14.439401626586914, -13.845808982849121, -13.252216339111328, -12.658624649047852, -12.065031051635742, -11.47143840789795, -10.877846717834473, -10.28425407409668, -9.690662384033203, -9.09706974029541, -8.503477096557617, -7.909885406494141, -7.3162946701049805, -6.722702503204346, -6.129110336303711, -5.535517692565918, -4.941926002502441, -4.348333358764648, -3.7547411918640137, -3.161149024963379, -2.567556858062744, -1.9739646911621094, -1.380372405052185, -0.7867801189422607, -0.19318795204162598, 0.4004042148590088, 0.9939966201782227, 1.5875887870788574, 2.181180953979492, 2.774773120880127, 3.3683652877807617, 3.9619576930999756, 4.555549621582031, 5.149142265319824, 5.742734432220459, 6.336326599121094, 6.9299187660217285, 7.523510932922363, 8.117103576660156, 8.710695266723633, 9.304287910461426, 9.897879600524902, 10.491472244262695, 11.085063934326172, 11.678656578063965]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 4.0, 4.0, 8.0, 8.0, 9.0, 16.0, 17.0, 9.0, 20.0, 19.0, 28.0, 25.0, 24.0, 28.0, 45.0, 85.0, 201.0, 116.0, 53.0, 27.0, 27.0, 30.0, 27.0, 28.0, 17.0, 16.0, 19.0, 16.0, 22.0, 7.0, 11.0, 7.0, 6.0, 9.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.015625, -0.9863510131835938, -0.9570770263671875, -0.9278030395507812, -0.898529052734375, -0.8692550659179688, -0.8399810791015625, -0.8107070922851562, -0.78143310546875, -0.7521591186523438, -0.7228851318359375, -0.6936111450195312, -0.664337158203125, -0.6350631713867188, -0.6057891845703125, -0.5765151977539062, -0.5472412109375, -0.5179672241210938, -0.4886932373046875, -0.45941925048828125, -0.430145263671875, -0.40087127685546875, -0.3715972900390625, -0.34232330322265625, -0.31304931640625, -0.28377532958984375, -0.2545013427734375, -0.22522735595703125, -0.195953369140625, -0.16667938232421875, -0.1374053955078125, -0.10813140869140625, -0.078857421875, -0.04958343505859375, -0.0203094482421875, 0.00896453857421875, 0.038238525390625, 0.06751251220703125, 0.0967864990234375, 0.12606048583984375, 0.15533447265625, 0.18460845947265625, 0.2138824462890625, 0.24315643310546875, 0.272430419921875, 0.30170440673828125, 0.3309783935546875, 0.36025238037109375, 0.3895263671875, 0.41880035400390625, 0.4480743408203125, 0.47734832763671875, 0.506622314453125, 0.5358963012695312, 0.5651702880859375, 0.5944442749023438, 0.62371826171875, 0.6529922485351562, 0.6822662353515625, 0.7115402221679688, 0.740814208984375, 0.7700881958007812, 0.7993621826171875, 0.8286361694335938, 0.85791015625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 5.0, 3.0, 15.0, 6.0, 21.0, 24.0, 57.0, 160.0, 483.0, 2502.0, 42343.0, 8336921.0, 4849.0, 800.0, 202.0, 75.0, 35.0, 31.0, 9.0, 6.0, 7.0, 6.0, 9.0, 5.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0], "bins": [-14.636923789978027, -14.151557922363281, -13.666192054748535, -13.180826187133789, -12.695460319519043, -12.210094451904297, -11.724727630615234, -11.239362716674805, -10.753995895385742, -10.268630027770996, -9.78326416015625, -9.297898292541504, -8.812532424926758, -8.327166557312012, -7.841800212860107, -7.356434345245361, -6.871068954467773, -6.385703086853027, -5.900337219238281, -5.414971351623535, -4.929605484008789, -4.444239616394043, -3.9588732719421387, -3.4735074043273926, -2.9881415367126465, -2.5027756690979004, -2.0174098014831543, -1.532043695449829, -1.046677827835083, -0.5613119602203369, -0.07594585418701172, 0.4094200134277344, 0.8947849273681641, 1.3801507949829102, 1.8655167818069458, 2.3508827686309814, 2.8362486362457275, 3.3216145038604736, 3.806980609893799, 4.292346477508545, 4.777712345123291, 5.263078212738037, 5.748444080352783, 6.2338104248046875, 6.719176292419434, 7.20454216003418, 7.689908027648926, 8.175273895263672, 8.660639762878418, 9.146005630493164, 9.63137149810791, 10.116737365722656, 10.602103233337402, 11.087469100952148, 11.572835922241211, 12.05820083618164, 12.543567657470703, 13.02893352508545, 13.514299392700195, 13.999665260314941, 14.485031127929688, 14.970396995544434, 15.45576286315918, 15.941129684448242, 16.426494598388672]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 8.0, 7.0, 1.0, 5.0, 4.0, 11.0, 4.0, 7.0, 4.0, 8.0, 5.0, 3.0, 6.0, 2.0, 3.0, 6.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-11.512982368469238, -11.189505577087402, -10.866028785705566, -10.54255199432373, -10.219076156616211, -9.895599365234375, -9.572122573852539, -9.248645782470703, -8.925168991088867, -8.601692199707031, -8.278215408325195, -7.954739093780518, -7.631262302398682, -7.307785511016846, -6.984309196472168, -6.660832405090332, -6.337355613708496, -6.01387882232666, -5.690402030944824, -5.3669257164001465, -5.0434489250183105, -4.719972133636475, -4.396495819091797, -4.073019027709961, -3.749542236328125, -3.426065444946289, -3.1025888919830322, -2.7791123390197754, -2.4556355476379395, -2.1321587562561035, -1.8086822032928467, -1.4852056503295898, -1.1617279052734375, -0.8382512331008911, -0.5147745609283447, -0.19129788875579834, 0.13217878341674805, 0.45565545558929443, 0.7791321277618408, 1.1026086807250977, 1.4260854721069336, 1.74956214427948, 2.0730388164520264, 2.396515369415283, 2.719992160797119, 3.043468952178955, 3.366945505142212, 3.6904220581054688, 4.013898849487305, 4.337375640869141, 4.660852432250977, 4.984328746795654, 5.30780553817749, 5.631282329559326, 5.954758644104004, 6.27823543548584, 6.601712226867676, 6.925189018249512, 7.248665809631348, 7.572142124176025, 7.895618915557861, 8.219095230102539, 8.542572021484375, 8.866048812866211, 9.189525604248047]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 4.0, 4.0, 7.0, 5.0, 15.0, 10.0, 14.0, 19.0, 16.0, 24.0, 38.0, 41.0, 53.0, 95.0, 117.0, 185.0, 312.0, 623.0, 1303.0, 3017.0, 7527.0, 20047.0, 55782.0, 149823.0, 175897.0, 69207.0, 24273.0, 9190.0, 3497.0, 1459.0, 683.0, 360.0, 189.0, 114.0, 91.0, 58.0, 48.0, 33.0, 23.0, 19.0, 15.0, 9.0, 7.0, 2.0, 6.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-7.8671875, -7.629638671875, -7.39208984375, -7.154541015625, -6.9169921875, -6.679443359375, -6.44189453125, -6.204345703125, -5.966796875, -5.729248046875, -5.49169921875, -5.254150390625, -5.0166015625, -4.779052734375, -4.54150390625, -4.303955078125, -4.06640625, -3.828857421875, -3.59130859375, -3.353759765625, -3.1162109375, -2.878662109375, -2.64111328125, -2.403564453125, -2.166015625, -1.928466796875, -1.69091796875, -1.453369140625, -1.2158203125, -0.978271484375, -0.74072265625, -0.503173828125, -0.265625, -0.028076171875, 0.20947265625, 0.447021484375, 0.6845703125, 0.922119140625, 1.15966796875, 1.397216796875, 1.634765625, 1.872314453125, 2.10986328125, 2.347412109375, 2.5849609375, 2.822509765625, 3.06005859375, 3.297607421875, 3.53515625, 3.772705078125, 4.01025390625, 4.247802734375, 4.4853515625, 4.722900390625, 4.96044921875, 5.197998046875, 5.435546875, 5.673095703125, 5.91064453125, 6.148193359375, 6.3857421875, 6.623291015625, 6.86083984375, 7.098388671875, 7.3359375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 5.0, 7.0, 9.0, 4.0, 4.0, 20.0, 12.0, 20.0, 25.0, 28.0, 30.0, 51.0, 56.0, 56.0, 70.0, 69.0, 64.0, 84.0, 69.0, 57.0, 37.0, 54.0, 36.0, 26.0, 17.0, 17.0, 14.0, 18.0, 11.0, 9.0, 6.0, 4.0, 2.0, 3.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.3701171875, -1.33001708984375, -1.2899169921875, -1.24981689453125, -1.209716796875, -1.16961669921875, -1.1295166015625, -1.08941650390625, -1.04931640625, -1.00921630859375, -0.9691162109375, -0.92901611328125, -0.888916015625, -0.84881591796875, -0.8087158203125, -0.76861572265625, -0.728515625, -0.68841552734375, -0.6483154296875, -0.60821533203125, -0.568115234375, -0.52801513671875, -0.4879150390625, -0.44781494140625, -0.40771484375, -0.36761474609375, -0.3275146484375, -0.28741455078125, -0.247314453125, -0.20721435546875, -0.1671142578125, -0.12701416015625, -0.0869140625, -0.04681396484375, -0.0067138671875, 0.03338623046875, 0.073486328125, 0.11358642578125, 0.1536865234375, 0.19378662109375, 0.23388671875, 0.27398681640625, 0.3140869140625, 0.35418701171875, 0.394287109375, 0.43438720703125, 0.4744873046875, 0.51458740234375, 0.5546875, 0.59478759765625, 0.6348876953125, 0.67498779296875, 0.715087890625, 0.75518798828125, 0.7952880859375, 0.83538818359375, 0.87548828125, 0.91558837890625, 0.9556884765625, 0.99578857421875, 1.035888671875, 1.07598876953125, 1.1160888671875, 1.15618896484375, 1.1962890625]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 3.0, 6.0, 7.0, 19.0, 16.0, 65.0, 133.0, 125.0, 70.0, 18.0, 10.0, 10.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.671615600585938, -8.208333015441895, -7.74505090713501, -7.281768321990967, -6.818486213684082, -6.355203628540039, -5.891921043395996, -5.428638935089111, -4.965356826782227, -4.502074241638184, -4.038792133331299, -3.575509548187256, -3.112227439880371, -2.648944854736328, -2.1856625080108643, -1.7223801612854004, -1.2590975761413574, -0.7958152294158936, -0.3325328230857849, 0.13074958324432373, 0.5940319299697876, 1.057314395904541, 1.5205967426300049, 1.9838790893554688, 2.4471614360809326, 2.9104437828063965, 3.3737261295318604, 3.837008476257324, 4.300291061401367, 4.76357364654541, 5.226855754852295, 5.69013786315918, 6.153420448303223, 6.616703033447266, 7.07998514175415, 7.543267726898193, 8.006549835205078, 8.469832420349121, 8.933115005493164, 9.39639663696289, 9.859679222106934, 10.322961807250977, 10.78624439239502, 11.249526023864746, 11.712808609008789, 12.176091194152832, 12.639373779296875, 13.102655410766602, 13.565938949584961, 14.029221534729004, 14.492504119873047, 14.955785751342773, 15.419068336486816, 15.88235092163086, 16.345632553100586, 16.808916091918945, 17.272197723388672, 17.7354793548584, 18.198762893676758, 18.662044525146484, 19.125328063964844, 19.58860969543457, 20.051891326904297, 20.515174865722656, 20.978456497192383]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 1.0, 2.0, 4.0, 2.0, 2.0, 3.0, 0.0, 7.0, 5.0, 9.0, 8.0, 21.0, 42.0, 127.0, 121.0, 60.0, 18.0, 13.0, 7.0, 6.0, 6.0, 7.0, 2.0, 6.0, 1.0, 3.0, 4.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.394720077514648, -9.122709274291992, -8.850698471069336, -8.578688621520996, -8.30667781829834, -8.034667015075684, -7.762656211853027, -7.490645408630371, -7.218635082244873, -6.946624279022217, -6.674613952636719, -6.4026031494140625, -6.130592346191406, -5.858582019805908, -5.586571216583252, -5.314560890197754, -5.042550086975098, -4.770539283752441, -4.498528957366943, -4.226518154144287, -3.95450758934021, -3.682497024536133, -3.4104862213134766, -3.1384756565093994, -2.8664650917053223, -2.594454526901245, -2.322443962097168, -2.0504331588745117, -1.7784225940704346, -1.5064120292663574, -1.2344013452529907, -0.962390661239624, -0.6903800964355469, -0.41836947202682495, -0.14635884761810303, 0.1256517767906189, 0.3976624011993408, 0.669672966003418, 0.9416836500167847, 1.2136943340301514, 1.4857048988342285, 1.7577154636383057, 2.029726028442383, 2.301736831665039, 2.573747396469116, 2.8457579612731934, 3.1177687644958496, 3.3897793292999268, 3.661789894104004, 3.933800458908081, 4.205811023712158, 4.4778218269348145, 4.7498321533203125, 5.021842956542969, 5.293853759765625, 5.565864562988281, 5.837874889373779, 6.1098856925964355, 6.381896018981934, 6.65390682220459, 6.925917625427246, 7.197927951812744, 7.4699387550354, 7.741949081420898, 8.013959884643555]}, "eval/loss": 4.192998886108398, "eval/wer": 1.903669178897263, "eval/runtime": 786.9912, "eval/samples_per_second": 3.357, "eval/steps_per_second": 0.281} \ No newline at end of file